123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452 |
- # Copyright 2013 The Chromium Authors. All rights reserved.
- # Use of this source code is governed by a BSD-style license that can be
- # found in the LICENSE file.
- import itertools
- import re
- from recipe_engine import recipe_api
- from recipe_engine import util as recipe_util
class GitApi(recipe_api.RecipeApi):
  """Recipe API for running git commands as recipe steps.

  Calling an instance directly runs a single git command (see `__call__`); the
  remaining methods are conveniences layered on top of that.
  """

  # 40 hexadecimal characters, i.e. the shape of a full SHA-1 commit hash.
  # It is used with `match`, so only the start of the string is examined.
  _GIT_HASH_RE = re.compile('[0-9a-f]{40}', re.IGNORECASE)

  def __call__(self, *args, **kwargs):
    """Returns a git command step.

    Args:
      * args: the git subcommand followed by its arguments.
      * name (str): step name. Defaults to 'git <subcommand>'.
      * infra_step (bool): forwarded to the step. Defaults to True.
      * git_config_options (dict): config values handed to git as
        `-c key=value`, emitted in sorted key order.
      * kwargs: everything else is forwarded to `self.m.step`.

    The command runs in the cwd of the current context when one is set, and in
    `self.m.path['checkout']` otherwise.
    """
    # Only derive the default name when the caller did not provide one, so
    # that an explicit name works regardless of what args[0] is.
    if 'name' in kwargs:
      name = kwargs.pop('name')
    else:
      name = 'git ' + args[0]
    infra_step = kwargs.pop('infra_step', True)

    git_cmd = ['git']
    options = kwargs.pop('git_config_options', {})
    for key, value in sorted(options.items()):
      git_cmd.extend(['-c', '%s=%s' % (key, value)])
    git_cmd.extend(args)

    cwd = self.m.context.cwd or self.m.path['checkout']
    with self.m.context(cwd=cwd):
      return self.m.step(name, git_cmd, infra_step=infra_step, **kwargs)

  def fetch_tags(self, remote_name=None, **kwargs):
    """Fetches all tags from the remote.

    Args:
      * remote_name (str): remote to fetch from. Defaults to 'origin'.
      * kwargs: Forwarded to '__call__'. The step name defaults to
        'git fetch tags'.
    """
    kwargs.setdefault('name', 'git fetch tags')
    remote_name = remote_name or 'origin'
    return self('fetch', remote_name, '--tags', **kwargs)

  def cat_file_at_commit(self, file_path, commit_hash, remote_name=None,
                         **kwargs):
    """Outputs the contents of a file at a given revision.

    Tags are fetched from the remote first, then `git cat-file blob` is run.

    Args:
      * file_path (str): path of the file inside the repository.
      * commit_hash (str): revision to read the file at.
      * remote_name (str): remote to fetch tags from. Defaults to 'origin'.
      * kwargs: Forwarded to both the tag fetch and the cat-file step.
    """
    self.fetch_tags(remote_name=remote_name, **kwargs)
    blob = '%s:%s' % (commit_hash, file_path)
    kwargs.setdefault('name', 'git cat-file %s' % blob)
    return self('cat-file', 'blob', blob, **kwargs)

  def count_objects(self, previous_result=None, raise_on_failure=False,
                    **kwargs):
    """Returns `git count-objects` result as a dict.

    Args:
      * previous_result (dict): the result of previous count_objects call.
        If passed, delta is reported in the log and step text.
      * raise_on_failure (bool): if True, an exception will be raised if the
        operation fails. Defaults to False.
      * kwargs: Forwarded to '__call__'.

    Returns:
      A dict of count-object values, or None if count-object run failed.

    Raises:
      recipe_api.InfraFailure: if anything goes wrong and raise_on_failure is
        True.
    """
    if previous_result:
      assert isinstance(previous_result, dict)
      assert all(isinstance(v, int) for v in previous_result.values())
      assert 'size' in previous_result
      assert 'size-pack' in previous_result

    def results_to_text(results):
      return [' %s: %s' % (k, v) for k, v in sorted(results.items())]

    step_result = None
    try:
      step_result = self(
          'count-objects', '-v', stdout=self.m.raw_io.output(),
          raise_on_failure=raise_on_failure, **kwargs)

      if not step_result.stdout:
        return None

      # Each output line has the form b'<name>: <integer>'.
      result = {}
      for raw_line in step_result.stdout.splitlines():
        name, value = raw_line.decode('utf-8').split(':', 1)
        result[name] = int(value.strip())

      step_result.presentation.logs['result'] = results_to_text(result)

      if previous_result:
        delta = {
            key: value - previous_result[key]
            for key, value in result.items()
            if key in previous_result
        }
        step_result.presentation.logs['delta'] = (
            ['before:'] + results_to_text(previous_result) +
            ['', 'after:'] + results_to_text(result) +
            ['', 'delta:'] + results_to_text(delta)
        )

        size_delta = (
            result['size'] + result['size-pack']
            - previous_result['size'] - previous_result['size-pack'])
        # size_delta is in KiB.
        step_result.presentation.step_text = (
            'size delta: %+.2f MiB' % (size_delta / 1024.0))

      return result
    except Exception as ex:
      # Counting objects is best effort: record the problem on the step (when
      # there is one) and only propagate it if the caller asked for that.
      if step_result:
        step_result.presentation.logs['exception'] = recipe_util.format_ex(ex)
        step_result.presentation.status = self.m.step.WARNING
      if raise_on_failure:
        raise recipe_api.InfraFailure('count-objects failed: %s' % ex)
      return None

  @staticmethod
  def _dir_name_from_url(url):
    """Returns the directory name a checkout of `url` defaults to."""
    name = url.rsplit('/', 1)[-1]
    if name.endswith('.git'):  # ex: https://host/foobar.git
      name = name[:-len('.git')]
    if not name:
      # ex: ssh://host:repo/foobar/.git -- the last component was only '.git'
      # (or empty), so use the path component in front of it instead.
      parts = url.rsplit('/', 2)
      if len(parts) > 1:
        name = parts[-2]
    return name

  def checkout(self, url, ref=None, dir_path=None, recursive=False,
               submodules=True, submodule_update_force=False,
               keep_paths=None, step_suffix=None,
               curl_trace_file=None, raise_on_failure=True,
               set_got_revision=False, remote_name=None,
               display_fetch_size=None, file_name=None,
               submodule_update_recursive=True,
               use_git_cache=False, progress=True, tags=False):
    """Performs a full git checkout and returns sha1 of checked out revision.

    Args:
      * url (str): url of remote repo to use as upstream
      * ref (str): ref to fetch and check out
      * dir_path (Path): optional directory to clone into. Defaults to a
        directory under `start_dir` named after the last component of `url`.
      * recursive (bool): whether to recursively fetch submodules or not
      * submodules (bool): whether to sync and update submodules or not
      * submodule_update_force (bool): whether to update submodules with --force
      * keep_paths (iterable of strings): paths to ignore during git-clean;
        paths are gitignore-style patterns relative to checkout_path.
      * step_suffix (str): suffix to add to each step name
      * curl_trace_file (Path): if not None, dump GIT_CURL_VERBOSE=1 trace to
        that file. Useful for debugging git issue reproducible only on bots. It
        has a side effect of all stderr output of 'git fetch' going to that
        file.
      * raise_on_failure (bool): if False, ignore errors during fetch or
        checkout.
      * set_got_revision (bool): if True, resolves HEAD and sets got_revision
        property.
      * remote_name (str): name of the git remote to use
      * display_fetch_size (bool): if True, run `git count-objects` before and
        after fetch and display delta. Adds two more steps. Defaults to False.
      * file_name (str): optional path to a single file to checkout.
      * submodule_update_recursive (bool): if True, updates submodules
        recursively.
      * use_git_cache (bool): if True, git cache will be used for this checkout.
        WARNING, this is EXPERIMENTAL!!! This wasn't tested with:
         * submodules
         * since the remote url is modified to a local path, may cause problem
           with scripts that do "git fetch origin" or "git push origin".
         * arbitrary refs such refs/whatever/not-fetched-by-default-to-cache
      * progress (bool): whether to show progress for fetch or not
      * tags (bool): Also fetch tags.

    Returns: If the checkout was successful, this returns the commit hash of
      the checked-out-repo. Otherwise this returns None.
    """
    revision = None
    # TODO(robertocn): Break this function and refactor calls to it.
    #     The problem is that there are way too many unrelated use cases for
    #     it, and the function's signature is getting unwieldy and its body
    #     unreadable.
    display_fetch_size = display_fetch_size or False

    if not dir_path:
      dir_path = self.m.path['start_dir'].join(self._dir_name_from_url(url))

    if 'checkout' not in self.m.path:
      self.m.path['checkout'] = dir_path

    git_setup_args = ['--path', dir_path, '--url', url]
    if remote_name:
      git_setup_args += ['--remote', remote_name]
    else:
      remote_name = 'origin'

    step_suffix = '' if step_suffix is None else ' (%s)' % step_suffix
    self.m.step(
        'git setup%s' % step_suffix,
        ['python3', '-u', self.resource('git_setup.py')] + git_setup_args)

    # Some of the commands below require depot_tools to be in PATH.
    path = self.m.path.pathsep.join([
        str(self.repo_resource()), '%(PATH)s'])

    with self.m.context(cwd=dir_path):
      if use_git_cache:
        cache_dir = self.m.path['cache'].join('git')
        with self.m.context(env={'PATH': path}):
          self('cache', 'populate', '-c', cache_dir, url,
               name='populate cache',
               raise_on_failure=raise_on_failure)
          dir_cmd = self(
              'cache', 'exists', '--quiet',
              '--cache-dir', cache_dir, url,
              raise_on_failure=raise_on_failure,
              stdout=self.m.raw_io.output(),
              step_test_data=lambda:
                  self.m.raw_io.test_api.stream_output('mirror_dir'))
          mirror_dir = dir_cmd.stdout.strip().decode('utf-8')
          # Point the remote that is fetched from below at the local mirror.
          # This has to be the remote configured by the setup step, which is
          # not necessarily called 'origin'.
          self('remote', 'set-url', remote_name, mirror_dir,
               raise_on_failure=raise_on_failure)

      # There are five kinds of refs we can be handed:
      # 0) None. In this case, we default to api.buildbucket.gitiles_commit.ref.
      # 1) A fully qualified branch name, e.g. 'refs/heads/main'.
      #    Chop off 'refs/heads/' and now it matches case (4).
      # 2) A 40-character SHA1 hash.
      # 3) A fully-qualified arbitrary ref, e.g. 'refs/foo/bar/baz'.
      # 4) A branch name, e.g. 'main'.
      # Note that 'FETCH_HEAD' can be many things (and therefore not a valid
      # checkout target) if many refs are fetched, but we only explicitly fetch
      # one ref here, so this is safe.
      if not ref:  # Case 0.
        ref = self.m.buildbucket.gitiles_commit.ref or 'main'

      # If it's a fully-qualified branch name, trim the 'refs/heads/' prefix.
      if ref.startswith('refs/heads/'):  # Case 1.
        ref = ref[len('refs/heads/'):]

      if self._GIT_HASH_RE.match(ref):  # Case 2.
        # No explicit ref is fetched; the hash itself is checked out.
        fetch_ref = ''
        checkout_ref = ref
      else:  # Cases 3 and 4.
        fetch_ref = ref
        checkout_ref = 'FETCH_HEAD'

      fetch_args = [x for x in (remote_name, fetch_ref) if x]
      if recursive:
        fetch_args.append('--recurse-submodules')
      if progress:
        fetch_args.append('--progress')

      fetch_env = {'PATH': path}
      fetch_stderr = None
      if curl_trace_file:
        fetch_env['GIT_CURL_VERBOSE'] = '1'
        fetch_stderr = self.m.raw_io.output(leak_to=curl_trace_file)
      if tags:
        fetch_args.append('--tags')

      fetch_step_name = 'git fetch%s' % step_suffix
      if display_fetch_size:
        count_objects_before_fetch = self.count_objects(
            name='count-objects before %s' % fetch_step_name,
            step_test_data=lambda: self.m.raw_io.test_api.stream_output(
                self.test_api.count_objects_output(1000)))
      with self.m.context(env=fetch_env):
        self('fetch', *fetch_args,
             name=fetch_step_name,
             stderr=fetch_stderr,
             raise_on_failure=raise_on_failure)
      if display_fetch_size:
        self.count_objects(
            name='count-objects after %s' % fetch_step_name,
            previous_result=count_objects_before_fetch,
            step_test_data=lambda: self.m.raw_io.test_api.stream_output(
                self.test_api.count_objects_output(2000)))

      checkout_args = ['checkout', '-f', checkout_ref]
      if file_name:
        checkout_args += ['--', file_name]
      self(*checkout_args,
           name='git checkout%s' % step_suffix,
           raise_on_failure=raise_on_failure)

      rev_parse_step = self('rev-parse', 'HEAD',
                            name='read revision',
                            stdout=self.m.raw_io.output_text(),
                            raise_on_failure=False,
                            step_test_data=lambda:
                                self.m.raw_io.test_api.stream_output_text(
                                    'deadbeef'))

      if rev_parse_step.presentation.status == 'SUCCESS':
        sha = rev_parse_step.stdout.strip()
        revision = sha
        rev_parse_step.presentation.step_text = "<br/>checked out %r<br/>" % sha
        if set_got_revision:
          rev_parse_step.presentation.properties['got_revision'] = sha

      # Every kept path becomes its own '-e <pattern>' pair for git-clean.
      clean_args = list(itertools.chain.from_iterable(
          ('-e', keep_path) for keep_path in keep_paths or []))
      self('clean', '-f', '-d', '-x', *clean_args,
           name='git clean%s' % step_suffix,
           raise_on_failure=raise_on_failure)

      if submodules:
        self('submodule', 'sync',
             name='submodule sync%s' % step_suffix,
             raise_on_failure=raise_on_failure)
        submodule_update = ['submodule', 'update', '--init']
        if submodule_update_recursive:
          submodule_update.append('--recursive')
        if submodule_update_force:
          submodule_update.append('--force')
        self(*submodule_update,
             name='submodule update%s' % step_suffix,
             raise_on_failure=raise_on_failure)

    return revision

  def get_timestamp(self, commit='HEAD', test_data=None, **kwargs):
    """Find and return the timestamp of the given commit.

    Args:
      * commit (str): the commit to inspect. Defaults to 'HEAD'.
      * test_data: if not None, used as the stdout of the step in tests.
      * kwargs: Forwarded to '__call__'. `stdout` is always overridden because
        the result is parsed from it.

    Returns: (str) the output of `git show --format=%at -s`, with trailing
      whitespace removed.
    """
    if test_data is not None:
      kwargs['step_test_data'] = (
          lambda: self.m.raw_io.test_api.stream_output(test_data))
    kwargs['stdout'] = self.m.raw_io.output()
    step_result = self('show', commit, '--format=%at', '-s', **kwargs)
    return step_result.stdout.rstrip().decode('utf-8')

  def rebase(self, name_prefix, branch, dir_path, remote_name=None,
             **kwargs):
    """Runs rebase HEAD onto the remote's main branch.

    If the rebase step fails, `git rebase --abort` is run and the failure is
    re-raised.

    NOTE(review): `branch` is accepted but never used; the rebase target is
    always '<remote_name>/main'. Confirm with callers before changing this.

    Args:
      * name_prefix (str): a prefix used for the step names
      * branch (str): a branch name or a hash to rebase onto (currently unused)
      * dir_path (Path): directory the rebase is run in
      * remote_name (str): the remote name to rebase from if not origin
      * kwargs: Forwarded to '__call__' for both the rebase and the abort step.
    """
    remote_name = remote_name or 'origin'
    with self.m.context(cwd=dir_path):
      try:
        self('rebase', '%s/main' % remote_name,
             name="%s rebase" % name_prefix, **kwargs)
      except self.m.step.StepFailure:
        self('rebase', '--abort', name='%s rebase abort' % name_prefix,
             **kwargs)
        raise

  def config_get(self, prop_name, **kwargs):
    """Returns git config output.

    Args:
      * prop_name: (str) The name of the config property to query.
      * kwargs: Forwarded to '__call__'. The step name defaults to
        'git config <prop_name>'.

    Returns: (bytes) The raw, whitespace-stripped Git config output, or the
      empty/None stdout value if no output was generated. The value is decoded
      as UTF-8 only for the step text, not for the return value.
    """
    kwargs.setdefault('name', 'git config %s' % (prop_name,))
    result = self('config', '--get', prop_name, stdout=self.m.raw_io.output(),
                  **kwargs)

    value = result.stdout
    if value:
      value = value.strip()
      result.presentation.step_text = value.decode('utf-8')
    return value

  def get_remote_url(self, remote_name=None, **kwargs):
    """Returns the remote Git repository URL, or None.

    Args:
      * remote_name: (str) The name of the remote to query, defaults to
        'origin'.
      * kwargs: Forwarded to '__call__'.

    Returns: The value of `config_get('remote.<remote_name>.url')`, i.e. the
      URL as stripped bytes, or an empty/None value if nothing was printed.
    """
    remote_name = remote_name or 'origin'
    return self.config_get('remote.%s.url' % (remote_name,), **kwargs)

  def bundle_create(self, bundle_path, rev_list_args=None, **kwargs):
    """Runs 'git bundle create' on a Git repository.

    Args:
      * bundle_path (Path): The path of the output bundle.
      * rev_list_args (list): The arguments appended after the bundle path to
        select what goes into the bundle. If None or empty, `--all` is used.
      * kwargs: Forwarded to '__call__'.
    """
    if not rev_list_args:
      rev_list_args = ['--all']
    self('bundle', 'create', bundle_path, *rev_list_args, **kwargs)

  def new_branch(self,
                 branch,
                 name=None,
                 upstream=None,
                 upstream_current=False,
                 **kwargs):
    """Runs git new-branch on a Git repository, to be used before git cl
    upload.

    Args:
      * branch (str): new branch name, which must not yet exist.
      * name (str): step name. Defaults to 'git new-branch <branch>'.
      * upstream (str): if set, passed to the command as '--upstream'.
      * upstream_current (bool): whether to use '--upstream_current'.
      * kwargs: Forwarded to '__call__'.

    Raises:
      ValueError: if both upstream and upstream_current are given.
    """
    if upstream and upstream_current:
      raise ValueError('Can not define both upstream and upstream_current')

    # Run with this module's repo resource directory prepended to PATH, on
    # top of the environment of the current context.
    env = self.m.context.env
    env['PATH'] = self.m.path.pathsep.join([
        str(self.repo_resource()), '%(PATH)s'])

    args = ['new-branch', branch]
    if upstream:
      args.extend(['--upstream', upstream])
    if upstream_current:
      args.append('--upstream_current')
    if not name:
      name = 'git new-branch %s' % branch

    with self.m.context(env=env):
      return self(*args, name=name, **kwargs)

  def number(self, commitrefs=None, test_values=None):
    """Computes the generation number of some commits.

    Args:
      * commitrefs (list[str]): A list of commit references. If none are
        provided, the generation number for HEAD will be retrieved.
      * test_values (list[str]): A list of numbers to use as the return
        value during tests. It is an error if the length of the list
        does not match the number of commitrefs (1 if commitrefs is not
        provided).

    Returns:
      A list of strings containing the generation numbers of the commits.
      If non-empty commitrefs was provided, the order of the returned
      numbers will correspond to the order of the provided commitrefs.
    """

    def step_test_data():
      refs = commitrefs or ['HEAD']
      if test_values:
        assert len(test_values) == len(refs)
      values = test_values or range(3000, 3000 + len(refs))
      output = '\n'.join(str(v) for v in values)
      return self.m.raw_io.test_api.stream_output_text(output)

    args = ['number']
    args.extend(commitrefs or [])
    # Put depot_tools on the path so that git-number can be found
    with self.m.depot_tools.on_path():
      # git-number is only meant for use on bots, so it prints an error message
      # if CHROME_HEADLESS is not set
      with self.m.context(env={'CHROME_HEADLESS': '1'}):
        step_result = self(*args,
                           stdout=self.m.raw_io.output_text(add_output_log=True),
                           step_test_data=step_test_data)
    return [l.strip() for l in step_result.stdout.strip().splitlines()]
|