Skip to content

Commit

Permalink
Add support for partial clones
Browse files Browse the repository at this point in the history
  • Loading branch information
mathomp4 committed Jan 9, 2024
1 parent bf85281 commit ac43f26
Show file tree
Hide file tree
Showing 5 changed files with 91 additions and 7 deletions.
9 changes: 9 additions & 0 deletions CHANGELOG.md
Original file line number Diff line number Diff line change
Expand Up @@ -15,6 +15,15 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0

### Removed

## [1.52.0] - 2024-01-10

### Added

- Added new `--partial` option to `mepo clone` with two settings: `blobless` and `treeless`. If you set, `--partial=blobless` then
the clone will not download blobs by using `--filter=blob:none`. If you set `--partial=treeless` then the clone will not download
trees by using `--filter=tree:0`. The `blobless` option is useful for large repos that have a lot of binary files that you don't
need. The `treeless` option is even more aggressive and *SHOULD NOT* be used unless you know what you are doing.

## [1.51.1] - 2023-08-25

### Fixed
Expand Down
43 changes: 42 additions & 1 deletion etc/mepoconfig-example
Original file line number Diff line number Diff line change
Expand Up @@ -2,7 +2,7 @@
#
# .mepoconfig is a config file a la gitconfig with sections and options.
#
# Currently, .mepoconfig files recognize two sections: [init] and [alias]
# Currently, .mepoconfig files recognize three sections: [init], [alias], and [clone].
#
# =======================================================================
#
Expand All @@ -24,6 +24,10 @@
#
# mepo clone --style postfix
#
# You set these options by running:
#
# mepo config set init.style <value>
#
# =======================================================================
#
# [alias] Section
Expand All @@ -40,3 +44,40 @@
# you can only alias mepo primary commands and not "subcommands" or
# "options". So you can have an alias for "commit" and for "branch",
# but you can't do an option for "commit -m" or "branch create".
#
# You can set an alias by running:
#
# mepo config set alias.<alias> <command>
#
# =======================================================================
#
# [clone] Section
#
# The clone section currently recognizes one option, partial.
# This has two allowed values: blobless and treeless
#
# So if you have:
#
# [clone]
# partial = blobless
#
# This is equivalent to doing:
#
# mepo clone --partial=blobless
#
# which corresponds to the git clone option --filter=blob:none
#
# and similarly for treeless:
#
# [clone]
# partial = treeless
#
# is equivalent to doing:
#
# mepo clone --partial=treeless
#
# which corresponds to the git clone option --filter=tree:0
#
# You set these options by running:
#
# mepo config set clone.partial <value>
7 changes: 7 additions & 0 deletions mepo.d/cmdline/parser.py
Original file line number Diff line number Diff line change
Expand Up @@ -104,6 +104,13 @@ def __clone(self):
'--allrepos',
action = 'store_true',
help = 'Must be passed with -b/--branch. When set, it not only checkouts out the branch/tag for the fixture, but for all the subrepositories as well.')
clone.add_argument(
'--partial',
metavar = 'partial-type',
nargs = '?',
default = None,
choices = ['blobless','treeless'],
help = 'Style of partial clone, default: None, allowed options: %(choices)s. Note that blobless means cloning with --filter=blob:none and treeless means cloning with --filter=tree:0. NOTE: We do *not* recommend using "treeless" as it is very aggressive and will cause problems with many git commands.')

def __list(self):
listcomps = self.subparsers.add_parser(
Expand Down
30 changes: 25 additions & 5 deletions mepo.d/command/clone/clone.py
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
from state.state import MepoState, StateDoesNotExistError
from repository.git import GitRepository
from command.init import init as mepo_init
from utilities import shellcmd, colors
from utilities import shellcmd, colors, mepoconfig
from urllib.parse import urlparse

import os
Expand All @@ -18,6 +18,22 @@ def run(args):
if args.allrepos and not args.branch:
raise RuntimeError("The allrepos option must be used with a branch/tag.")

# We can get the blobless and treeless options from the config or the args
if args.partial:
partial = args.partial
elif mepoconfig.has_option('clone','partial'):
allowed = ['blobless','treeless']
partial = mepoconfig.get('clone','partial')
if partial not in allowed:
raise Exception(f'Detected partial clone type [{partial}] from .mepoconfig is not an allowed partial clone type: {allowed}')
else:
print(f'Found partial clone type [{partial}] in .mepoconfig')
else:
partial = None

blobless = partial == 'blobless'
treeless = partial == 'treeless'

# If you pass in a config, with clone, it could be outside the repo.
# So use the full path
passed_in_config = False
Expand All @@ -34,15 +50,15 @@ def run(args):
last_url_node = p.path.rsplit('/')[-1]
url_suffix = pathlib.Path(last_url_node).suffix
if args.directory:
local_clone(args.repo_url,args.branch,args.directory)
local_clone(args.repo_url,args.branch,args.directory,blobless,treeless)
os.chdir(args.directory)
else:
if url_suffix == '.git':
git_url_directory = pathlib.Path(last_url_node).stem
else:
git_url_directory = last_url_node

local_clone(args.repo_url,args.branch,git_url_directory)
local_clone(args.repo_url,args.branch,git_url_directory,blobless,treeless)
os.chdir(git_url_directory)

# Copy the new file into the repo only if we pass it in
Expand Down Expand Up @@ -71,7 +87,7 @@ def run(args):
recurse = comp.recurse_submodules
# We need the type to handle hashes in components.yaml
type = comp.version.type
git.clone(version,recurse,type,comp.name)
git.clone(version,recurse,type,comp.name,blobless,treeless)
if comp.sparse:
git.sparsify(comp.sparse)
print_clone_info(comp, max_namelen)
Expand All @@ -89,8 +105,12 @@ def print_clone_info(comp, name_width):
ver_name_type = '({}) {}'.format(comp.version.type, comp.version.name)
print('{:<{width}} | {:<s}'.format(comp.name, ver_name_type, width = name_width))

def local_clone(url,branch=None,directory=None):
def local_clone(url,branch=None,directory=None,blobless=False,treeless=False):
cmd1 = 'git clone '
if blobless:
cmd1 += '--filter=blob:none '
if treeless:
cmd1 += '--filter=tree:0 '
if branch:
cmd1 += '--branch {} '.format(branch)
cmd1 += '--quiet {}'.format(url)
Expand Down
9 changes: 8 additions & 1 deletion mepo.d/repository/git.py
Original file line number Diff line number Diff line change
Expand Up @@ -39,8 +39,15 @@ def get_full_local_path(self):
def get_remote_url(self):
return self.__remote

def clone(self, version, recurse, type, comp_name):
def clone(self, version, recurse, type, comp_name, blobless=False, treeless=False):
cmd1 = 'git clone '

if blobless:
cmd1 += '--filter=blob:none '

if treeless:
cmd1 += '--filter=tree:0 '

if recurse:
cmd1 += '--recurse-submodules '

Expand Down

0 comments on commit ac43f26

Please sign in to comment.