depot_tools/gerrit_util.py
# Copyright (c) 2013 The Chromium OS Authors. All rights reserved.
# Use of this source code is governed by a BSD-style license that can be
# found in the LICENSE file.
"""
Utilities for requesting information for a Gerrit server via HTTPS.
https://gerrit-review.googlesource.com/Documentation/rest-api.html
"""
from __future__ import annotations
import base64
import contextlib
import functools
import http.cookiejar
import json
import logging
import os
import random
import re
import shutil
import socket
import subprocess
import sys
import tempfile
import threading
import time
import urllib.parse
from dataclasses import dataclass
from io import StringIO
from multiprocessing.pool import ThreadPool
from typing import Any, Container, Dict, List, Optional
from typing import Tuple, TypedDict, cast
import httplib2
import httplib2.socks
import auth
import gclient_utils
import metrics
import metrics_utils
import newauth
import scm
import subprocess2
# HACK: httplib2 has significant bugs with its proxy support in
# python3. All httplib2 code should be rewritten to just use python
# stdlib which does not have these bugs.
#
# Prior to that, however, we directly patch the buggy implementation of
# httplib2.socks.socksocket.__rewriteproxy, which is written to expect
# str but actually receives bytes.
#
# Note that __rewriteproxy is inherently buggy, as it relies on the
# python stdlib client to send the entire request header in a single
# call to socket.sendall, which is not explicitly guaranteed.
#
# Changes:
# * all string literals changed to bytes literals.
# * added more http methods to recognize.
# * all __symbols changed to _socksocket__symbols (Python __ munging).
# * Type annotations added to function signature.
def __fixed_rewrite_proxy(self: httplib2.socks.socksocket, header: bytes):
""" rewrite HTTP request headers to support non-tunneling proxies
(i.e. those which do not support the CONNECT method).
This only works for HTTP (not HTTPS) since HTTPS requires tunneling.
"""
host, endpt = None, None
hdrs = header.split(b"\r\n")
for hdr in hdrs:
if hdr.lower().startswith(b"host:"):
host = hdr
elif hdr.lower().split(b" ")[0] in (b"get", b"head", b"post", b"put",
b"patch"):
endpt = hdr
if host and endpt:
hdrs.remove(host)
hdrs.remove(endpt)
host = host.split(b" ")[1]
endpt = endpt.split(b" ")
        if self._socksocket__proxy[4] is not None \
                and self._socksocket__proxy[5] is not None:
hdrs.insert(0, self._socksocket__getauthheader())
hdrs.insert(0, b"Host: %s" % host)
hdrs.insert(0,
b"%s http://%s%s %s" % (endpt[0], host, endpt[1], endpt[2]))
return b"\r\n".join(hdrs)
httplib2.socks.socksocket._socksocket__rewriteproxy = __fixed_rewrite_proxy
# TODO: Should fix these warnings.
# pylint: disable=line-too-long
LOGGER = logging.getLogger()
# With a starting sleep time of 12.0 seconds, a per-retry backoff
# multiplier drawn uniformly from [1.8, 2.2], and six total tries, the
# sleep time between the first and last tries will be ~6 min (excluding
# time for each try).
TRY_LIMIT = 6
SLEEP_TIME = 12.0
MAX_BACKOFF = 2.2
MIN_BACKOFF = 1.8
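# Illustrative arithmetic for the ~6 min figure above, assuming the midpoint
# 2.0x multiplier: the five sleeps between six tries total
#   sum(12.0 * 2.0**i for i in range(5)) == 372.0 seconds (~6.2 min).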
# Controls the transport protocol used to communicate with Gerrit.
# This is parameterized primarily to enable GerritTestCase.
GERRIT_PROTOCOL = 'https'
# Controls how many concurrent Gerrit connections there can be.
MAX_CONCURRENT_CONNECTION = 20
def time_sleep(seconds):
# Use this so that it can be mocked in tests without interfering with python
# system machinery.
return time.sleep(seconds)
def time_time():
# Use this so that it can be mocked in tests without interfering with python
# system machinery.
return time.time()
def log_retry_and_sleep(seconds, attempt, try_limit):
LOGGER.info('Will retry in %d seconds (%d more times)...', seconds,
try_limit - attempt - 1)
time_sleep(seconds)
return seconds * random.uniform(MIN_BACKOFF, MAX_BACKOFF)
class GerritError(Exception):
"""Exception class for errors commuicating with the gerrit-on-borg service."""
def __init__(self, http_status, message, *args, **kwargs):
super(GerritError, self).__init__(*args, **kwargs)
self.http_status = http_status
self.message = '(%d) %s' % (self.http_status, message)
def __str__(self):
return self.message
def _QueryString(params, first_param=None):
"""Encodes query parameters in the key:val[+key:val...] format specified here:
https://gerrit-review.googlesource.com/Documentation/rest-api-changes.html#list-changes
"""
q = [urllib.parse.quote(first_param)] if first_param else []
q.extend(['%s:%s' % (key, val.replace(" ", "+")) for key, val in params])
return '+'.join(q)
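# Illustrative example (hypothetical values):
#   _QueryString([('status', 'open'), ('message', 'fix bug')],
#                first_param='my change')
# returns 'my%20change+status:open+message:fix+bug' -- first_param is
# percent-quoted, while spaces inside parameter values become '+'.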
class SSOHelper(object):
"""SSOHelper finds a Google-internal SSO helper."""
_sso_cmd: Optional[str] = None
def find_cmd(self) -> str:
"""Returns the cached command-line to invoke git-remote-sso.
        If git-remote-sso is not in $PATH, returns the empty string.
"""
if self._sso_cmd is not None:
return self._sso_cmd
cmd = shutil.which('git-remote-sso')
if cmd is None:
cmd = ''
self._sso_cmd = cmd
return cmd
# Global instance
ssoHelper = SSOHelper()
@functools.lru_cache(maxsize=None)
def ShouldUseSSO(host: str, email: str) -> bool:
"""Return True if we should use SSO for the given Gerrit host and user."""
LOGGER.debug("Determining whether we should use SSO...")
if not newauth.Enabled():
LOGGER.debug("SSO=False: not opted in")
return False
if not host.endswith('.googlesource.com'):
LOGGER.debug("SSO=False: non-googlesource host %r", host)
return False
if newauth.SkipSSO():
LOGGER.debug("SSO=False: set skip SSO config")
return False
if not ssoHelper.find_cmd():
LOGGER.debug("SSO=False: no SSO command")
return False
if gclient_utils.IsEnvCog():
LOGGER.debug("SSO=True: in Cog")
return True
if not email:
LOGGER.debug(
"SSO=True: email is empty or missing (and SSO command available)")
return True
if email.endswith('@google.com'):
LOGGER.debug("SSO=True: email is google.com")
return True
if not email.endswith('@chromium.org'):
LOGGER.debug("SSO=False: not chromium.org")
return False
authenticator = SSOAuthenticator()
try:
records = GetAccountEmails(host, 'self', authenticator=authenticator)
except GerritError as e:
if e.http_status == 400:
# This is likely because the user doesn't have an account on the Gerrit host.
LOGGER.debug("SSO=False: get account emails returned 400")
return False
raise
if any(email == r['email'] for r in records):
LOGGER.debug("SSO=True: email is linked to google.com")
return True
LOGGER.debug("SSO=False: unlinked chromium.org")
return False
class _Authenticator(object):
"""Base authenticator class for authenticator implementations to subclass."""
# Cached _Authenticator subclass instance, resolved via get().
_resolved: Optional[_Authenticator] = None
_resolved_lock = threading.Lock()
def authenticate(self, conn: HttpConn):
"""Adds authentication information to the HttpConn."""
raise NotImplementedError()
def debug_summary_state(self) -> str:
"""If this _Authenticator has any debugging information about its state,
_WriteGitPushTraces will call this to include in the git push traces.
Return value is any relevant debugging information with all PII/secrets
redacted.
"""
raise NotImplementedError()
@classmethod
def is_applicable(cls, *, conn: Optional[HttpConn] = None) -> bool:
"""Must return True if this Authenticator is available in the current
environment.
If conn is not None, return True if this Authenticator is
applicable to the given conn in the current environment.
"""
raise NotImplementedError()
def ensure_authenticated(self, gerrit_host: str, git_host: str) -> Tuple[bool, str]:
"""Returns (bypassable, error message).
If the error message is empty, there is no error to report.
If bypassable is true, the caller will allow the user to continue past the
error.
"""
return (True, '')
@classmethod
def get(cls):
"""Returns: (_Authenticator) The identified _Authenticator to use.
Probes the local system and its environment and identifies the
_Authenticator instance to use.
The resolved _Authenticator instance is cached as a class variable.
"""
with cls._resolved_lock:
if ret := cls._resolved:
return ret
use_new_auth = newauth.Enabled()
# Allow skipping SSOAuthenticator for local testing purposes.
skip_sso = newauth.SkipSSO()
if use_new_auth:
LOGGER.debug('_Authenticator.get: using new auth stack')
if LuciContextAuthenticator.is_applicable():
LOGGER.debug(
'_Authenticator.get: using LUCI context authenticator')
ret = LuciContextAuthenticator()
else:
LOGGER.debug(
'_Authenticator.get: using chained authenticator')
a = [
SSOAuthenticator(),
# GCE detection can't distinguish cloud workstations.
GceAuthenticator(),
GitCredsAuthenticator(),
NoAuthenticator(),
]
if skip_sso:
LOGGER.debug(
                            '_Authenticator.get: skipping SSOAuthenticator.')
a = a[1:]
ret = ChainedAuthenticator(a)
cls._resolved = ret
return ret
authenticators = [
LuciContextAuthenticator,
GceAuthenticator,
CookiesAuthenticator,
]
for candidate in authenticators:
if candidate.is_applicable():
LOGGER.debug('_Authenticator.get: Selected %s.',
candidate.__name__)
ret = candidate()
cls._resolved = ret
return ret
auth_names = ', '.join(a.__name__ for a in authenticators)
raise ValueError(
f"Could not find suitable authenticator, tried: [{auth_names}]."
)
def debug_auth() -> Tuple[str, str]:
"""Returns the name of the chosen auth scheme and any additional debugging
information for that authentication scheme. """
authn = _Authenticator.get()
return authn.__class__.__name__, authn.debug_summary_state()
def ensure_authenticated(gerrit_host: str, git_host: str) -> Tuple[bool, str]:
"""Returns (bypassable, error message).
If the error message is empty, there is no error to report. If bypassable is
true, the caller will allow the user to continue past the error.
"""
return _Authenticator.get().ensure_authenticated(gerrit_host, git_host)
class SSOAuthenticator(_Authenticator):
"""SSOAuthenticator implements a Google-internal authentication scheme."""
# This is set to true in tests, allows _parse_config to consume expired
# cookies.
_testing_load_expired_cookies = False
# How long we should wait for the sso helper to write and close stdout.
# Overridden in tests.
_timeout_secs = 5
# The required fields for the sso config, expected from the sso helper's
# output.
_required_fields = frozenset(
['http.cookiefile', 'http.proxy', 'include.path'])
@dataclass
class SSOInfo:
proxy: httplib2.ProxyInfo
cookies: http.cookiejar.CookieJar
headers: Dict[str, str]
# SSOInfo is a cached blob of information used by the `authenticate` method.
_sso_info: Optional[SSOInfo] = None
_sso_info_lock = threading.Lock()
@classmethod
def _resolve_sso_cmd(cls) -> Tuple[str, ...]:
"""Returns the cached command-line to invoke git-remote-sso.
If git-remote-sso is not in $PATH, returns ().
"""
cmd = ssoHelper.find_cmd()
if not cmd:
return ()
return (
cmd,
'-print_config',
'sso://*.git.corp.google.com',
)
@classmethod
def is_applicable(cls, *, conn: Optional[HttpConn] = None) -> bool:
if not cls._resolve_sso_cmd():
return False
email: str = scm.GIT.GetConfig(os.getcwd(), 'user.email', default='')
if conn is not None:
return ShouldUseSSO(conn.host, email)
return email.endswith('@google.com')
@classmethod
def _parse_config(cls, config: Dict[str, str]) -> SSOInfo:
"""Parses the sso info from the given config.
Note: update cls._required_fields appropriately when making
changes to this method, to ensure the field values are captured
from the sso helper.
"""
fullAuthHeader = cast(
str,
scm.GIT.Capture([
'config',
'-f',
config['include.path'],
'http.extraHeader',
]))
headerKey, headerValue = fullAuthHeader.split(':', 1)
headers = {headerKey.strip(): headerValue.strip()}
proxy_host, proxy_port = config['http.proxy'].split(':', 1)
cfpath = config['http.cookiefile']
cj = http.cookiejar.MozillaCookieJar(cfpath)
# NOTE: python3.8 doesn't support httponly cookie lines, so we parse
# this manually. Once we move to python3.10+, this hack can be removed.
with open(cfpath) as cf:
cookiedata = cf.read().replace('#HttpOnly_', '')
# _really_load is the way that MozillaCookieJar subclasses
# FileCookieJar. Calling this directly is better than reimplementing the
# entire _really_load function manually.
cj._really_load(
StringIO(cookiedata),
cfpath,
ignore_discard=False,
ignore_expires=cls._testing_load_expired_cookies,
)
return cls.SSOInfo(proxy=httplib2.ProxyInfo(
httplib2.socks.PROXY_TYPE_HTTP_NO_TUNNEL, proxy_host.encode(),
int(proxy_port)),
cookies=cj,
headers=headers)
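    # Illustrative input for _parse_config (all values are made up): a config
    # dict such as
    #     {'http.cookiefile': '/tmp/sso/cookies.txt',
    #      'http.proxy': 'localhost:8123',
    #      'include.path': '/tmp/sso/gitconfig'}
    # yields an SSOInfo whose proxy is an HTTP (no-tunnel) proxy on
    # localhost:8123, whose cookies come from the cookiefile, and whose
    # headers carry the http.extraHeader value from the included gitconfig.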
@classmethod
def _launch_sso_helper(cls) -> SSOInfo:
"""Launches the git-remote-sso process and extracts the parsed SSOInfo.
Raises an exception if something goes wrong.
"""
cmd = cls._resolve_sso_cmd()
with tempdir() as tdir:
tf = os.path.join(tdir, 'git-remote-sso.stderr')
with open(tf, mode='w') as stderr_file:
# NOTE: The git-remote-sso helper does the following:
#
# 1. writes files to disk.
# 2. writes config to stdout, referencing those files.
# 3. closes stdout (sending EOF to us, ending the stdout data).
# - Note: on Windows, stdout.read() times out anyway, so
# instead we process stdout line by line.
# 4. waits for stdin to close.
# 5. deletes files on disk (which is why we make sys.stdin a PIPE
# instead of closing it outright).
#
# NOTE: the http.proxy value in the emitted config points to
# a socket which is owned by a system service, not `proc` itself.
with subprocess2.Popen(cmd,
stdout=subprocess2.PIPE,
stderr=stderr_file,
stdin=subprocess2.PIPE,
encoding='utf-8') as proc:
stderr_file.close() # we can close after process starts.
timedout = False
def _fire_timeout():
nonlocal timedout
timedout = True
proc.kill()
timer = threading.Timer(cls._timeout_secs, _fire_timeout)
timer.start()
try:
config = {}
for line in proc.stdout:
if not line:
break
field, value = line.strip().split('=', 1)
config[field] = value
# Stop reading if we have all the required fields.
if cls._required_fields.issubset(config.keys()):
break
finally:
timer.cancel()
missing_fields = cls._required_fields - config.keys()
if timedout:
# Within the time limit, at least one required field was
# still missing. Killing the process has been triggered,
# even if we now have all fields.
details = ''
if missing_fields:
details = ': missing fields [{names}]'.format(
names=', '.join(missing_fields))
LOGGER.error(
'SSOAuthenticator: Timeout: %r: reading config%s.',
cmd, details)
raise subprocess.TimeoutExpired(
cmd=cmd, timeout=cls._timeout_secs)
# if the process already ended, then something is wrong.
retcode = proc.poll()
# if stdout was closed without all required data, we need to
# wait for end-of-process here and hope for an error message
# - the poll above is racy in this case (we could see stdout
# EOF but the process may not have quit yet).
if not retcode and missing_fields:
retcode = proc.wait(timeout=cls._timeout_secs)
# We timed out while doing `wait` - we can't safely open
# stderr on windows, so just emit a generic timeout
# exception.
if retcode is None:
LOGGER.error(
'SSOAuthenticator: Timeout: %r: waiting error output.',
cmd)
raise subprocess.TimeoutExpired(
cmd=cmd, timeout=cls._timeout_secs)
# Finally, if the poll or wait ended up getting the retcode,
# it means the process failed, so we can read the stderr
# file and reflect it back to the user.
if retcode is not None:
# process failed - we should be able to read the tempfile.
with open(tf, encoding='utf-8') as stderr:
sys.exit(
f'SSOAuthenticator: exit {retcode}: {stderr.read().strip()}'
)
return cls._parse_config(config)
@classmethod
def _get_sso_info(cls) -> SSOInfo:
with cls._sso_info_lock:
info = cls._sso_info
if not info:
info = cls._launch_sso_helper()
# HACK: `git-remote-sso` doesn't always properly warm up the
# cookies - in this case, run a canned git operation against
# a public repo to cause `git-remote-sso` to warm the cookies
# up, and then try pulling config again.
#
# BUG: b/342644760
if not any(c.domain == '.google.com' for c in info.cookies):
LOGGER.debug('SSO: Refreshing .google.com cookies.')
scm.GIT.Capture(['ls-remote', 'sso://chromium/All-Projects'])
info = cls._launch_sso_helper()
if not any(c.domain == '.google.com' for c in info.cookies):
raise ValueError('Unable to extract .google.com cookie.')
cls._sso_info = info
return info
def authenticate(self, conn: HttpConn):
sso_info = self._get_sso_info()
conn.proxy_info = sso_info.proxy
conn.req_headers.update(sso_info.headers)
# Now we must rewrite:
# https://xxx.googlesource.com ->
# http://xxx.git.corp.google.com
parsed = urllib.parse.urlparse(conn.req_uri)
parsed = parsed._replace(scheme='http')
if (hostname :=
parsed.hostname) and hostname.endswith('.googlesource.com'):
assert not parsed.port, "SSOAuthenticator: netloc: port not supported"
assert not parsed.username, "SSOAuthenticator: netloc: username not supported"
assert not parsed.password, "SSOAuthenticator: netloc: password not supported"
hostname_parts = hostname.rsplit('.', 2) # X, googlesource, com
conn.req_host = hostname_parts[0] + '.git.corp.google.com'
parsed = parsed._replace(netloc=conn.req_host)
conn.req_uri = parsed.geturl()
# Finally, add cookies
sso_info.cookies.add_cookie_header(conn)
assert 'Cookie' in conn.req_headers, (
'sso_info.cookies.add_cookie_header failed to add Cookie.')
def debug_summary_state(self) -> str:
return ''
class CookiesAuthenticator(_Authenticator):
"""_Authenticator implementation that uses ".gitcookies" for token.
Expected case for developer workstations.
"""
_EMPTY = object()
def __init__(self):
# Credentials will be loaded lazily on first use. This ensures
# _Authenticator get() can always construct an authenticator, even if
# something is broken. This allows 'creds-check' to proceed to actually
# checking creds later, rigorously (instead of blowing up with a cryptic
# error if they are wrong).
self._gitcookies = self._EMPTY
@classmethod
def is_applicable(cls, *, conn: Optional[HttpConn] = None) -> bool:
# We consider CookiesAuthenticator always applicable for now.
return True
@property
def gitcookies(self):
if self._gitcookies is self._EMPTY:
self._gitcookies = self._get_gitcookies()
return self._gitcookies
@classmethod
def get_new_password_url(cls, host):
assert not host.startswith('http')
# Assume *.googlesource.com pattern.
parts = host.split('.')
# remove -review suffix if present.
if parts[0].endswith('-review'):
parts[0] = parts[0][:-len('-review')]
return 'https://%s/new-password' % ('.'.join(parts))
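    # Illustrative mapping:
    #   get_new_password_url('chromium-review.googlesource.com')
    # returns 'https://chromium.googlesource.com/new-password' (the '-review'
    # suffix is dropped from the first host component).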
@classmethod
def _get_new_password_message(cls, host):
if host is None:
return ('Git host for Gerrit upload is unknown. Check your remote '
'and the branch your branch is tracking. This tool assumes '
'that you are using a git server at *.googlesource.com.')
url = cls.get_new_password_url(host)
return 'You can (re)generate your credentials by visiting %s' % url
@classmethod
def get_gitcookies_path(cls) -> str:
if envVal := os.getenv('GIT_COOKIES_PATH'):
return envVal
return os.path.expanduser(
scm.GIT.GetConfig(os.getcwd(), 'http.cookiefile',
os.path.join('~', '.gitcookies')))
@classmethod
def _get_gitcookies(cls):
gitcookies = {}
path = cls.get_gitcookies_path()
if not os.path.exists(path):
return gitcookies
try:
f = gclient_utils.FileRead(path, 'rb').splitlines()
except IOError:
return gitcookies
for line in f:
try:
fields = line.strip().split('\t')
if line.strip().startswith('#') or len(fields) != 7:
continue
domain, xpath, key, value = fields[0], fields[2], fields[
5], fields[6]
if xpath == '/' and key == 'o':
if value.startswith('git-'):
login, secret_token = value.split('=', 1)
gitcookies[domain] = (login, secret_token)
else:
gitcookies[domain] = ('', value)
except (IndexError, ValueError, TypeError) as exc:
LOGGER.warning(exc)
return gitcookies
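    # Illustrative .gitcookies entry (fields are tab-separated; the token is
    # made up): a line like
    #   chromium.googlesource.com FALSE / TRUE 2147483647 o git-user.example.com=1//REDACTED
    # parses to gitcookies['chromium.googlesource.com'] ==
    # ('git-user.example.com', '1//REDACTED').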
def _get_auth_for_host(self, host):
for domain, creds in self.gitcookies.items():
if http.cookiejar.domain_match(host, domain):
return (creds[0], creds[1])
return None
def authenticate(self, conn: HttpConn):
a = self._get_auth_for_host(conn.req_host)
if a:
login, cred = a
if login:
secret = base64.b64encode(f'{login}:{cred}'.encode('utf-8'))
conn.req_headers[
'Authorization'] = f'Basic {secret.decode("utf-8")}'
else:
conn.req_headers['Authorization'] = f'Bearer {cred}'
def ensure_authenticated(self, gerrit_host: str, git_host: str) -> Tuple[bool, str]:
"""Returns (bypassable, error message).
If the error message is empty, there is no error to report.
If bypassable is true, the caller will allow the user to continue past the
error.
"""
# Lazy-loader to identify Gerrit and Git hosts.
gerrit_auth = self._get_auth_for_host(gerrit_host)
git_auth = self._get_auth_for_host(git_host)
if gerrit_auth and git_auth:
if gerrit_auth == git_auth:
return True, ''
all_gsrc = self._get_auth_for_host('d0esN0tEx1st.googlesource.com')
print(
'WARNING: You have different credentials for Gerrit and git hosts:\n'
' %s\n'
' %s\n'
' Consider running the following command:\n'
' git cl creds-check\n'
' %s\n'
' %s' %
(git_host, gerrit_host,
('Hint: delete creds for .googlesource.com' if all_gsrc else
''), self._get_new_password_message(git_host)))
return True, 'If you know what you are doing'
missing = (([] if gerrit_auth else [gerrit_host]) +
([] if git_auth else [git_host]))
return False, ('Credentials for the following hosts are required:\n'
' %s\n'
'These are read from %s\n'
'%s' % ('\n '.join(missing), self.get_gitcookies_path(),
self._get_new_password_message(git_host)))
# Used to redact the cookies from the gitcookies file.
GITCOOKIES_REDACT_RE = re.compile(r'1/.*')
def debug_summary_state(self) -> str:
gitcookies_path = self.get_gitcookies_path()
if os.path.isfile(gitcookies_path):
gitcookies = gclient_utils.FileRead(gitcookies_path)
return self.GITCOOKIES_REDACT_RE.sub('REDACTED', gitcookies)
return ''
def get_auth_email(self, host):
"""Best effort parsing of email to be used for auth for the given host."""
a = self._get_auth_for_host(host)
if not a:
return None
login = a[0]
# login typically looks like 'git-xxx.example.com'
if not login.startswith('git-') or '.' not in login:
return None
username, domain = login[len('git-'):].split('.', 1)
return '%s@%s' % (username, domain)
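    # Illustrative parse (hypothetical login): a gitcookies login of
    # 'git-alice.chromium.org' yields 'alice@chromium.org'; logins without
    # the 'git-' prefix or a '.' return None.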
class GceAuthenticator(_Authenticator):
"""_Authenticator implementation that uses GCE metadata service for token.
"""
_INFO_URL = 'http://metadata.google.internal'
_ACQUIRE_URL = ('%s/computeMetadata/v1/instance/'
'service-accounts/default/token' % _INFO_URL)
_ACQUIRE_HEADERS = {"Metadata-Flavor": "Google"}
_cache_is_gce = None
_token_cache = None
_token_expiration = None
@classmethod
def is_applicable(cls, *, conn: Optional[HttpConn] = None):
if os.getenv('SKIP_GCE_AUTH_FOR_GIT'):
return False
if cls._cache_is_gce is None:
cls._cache_is_gce = cls._test_is_gce()
return cls._cache_is_gce
@classmethod
def _test_is_gce(cls):
# Based on https://cloud.google.com/compute/docs/metadata#runninggce
resp, _ = cls._get(cls._INFO_URL)
if resp is None:
return False
return resp.get('metadata-flavor') == 'Google'
@staticmethod
def _get(url, **kwargs):
next_delay_sec = 1.0
for i in range(TRY_LIMIT):
p = urllib.parse.urlparse(url)
if p.scheme not in ('http', 'https'):
raise RuntimeError("Don't know how to work with protocol '%s'" %
p.scheme)
try:
resp, contents = httplib2.Http().request(url, 'GET', **kwargs)
except (socket.error, httplib2.HttpLib2Error,
httplib2.socks.ProxyError) as e:
LOGGER.debug('GET [%s] raised %s', url, e)
return None, None
LOGGER.debug('GET [%s] #%d/%d (%d)', url, i + 1, TRY_LIMIT,
resp.status)
if resp.status < 500:
return (resp, contents)
# Retry server error status codes.
LOGGER.warning('Encountered server error')
if TRY_LIMIT - i > 1:
next_delay_sec = log_retry_and_sleep(next_delay_sec, i,
TRY_LIMIT)
return None, None
@classmethod
def _get_token_dict(cls):
# If cached token is valid for at least 25 seconds, return it.
if cls._token_cache and time_time() + 25 < cls._token_expiration:
return cls._token_cache
resp, contents = cls._get(cls._ACQUIRE_URL,
headers=cls._ACQUIRE_HEADERS)
if resp is None or resp.status != 200:
return None
cls._token_cache = json.loads(contents)
cls._token_expiration = cls._token_cache['expires_in'] + time_time()
return cls._token_cache
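    # Illustrative token payload from the metadata server (values made up):
    #   {'access_token': 'ya29....', 'expires_in': 3599, 'token_type': 'Bearer'}
    # authenticate() below renders this as 'Authorization: Bearer ya29....'.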
def authenticate(self, conn: HttpConn):
token_dict = self._get_token_dict()
if not token_dict:
return
conn.req_headers[
'Authorization'] = '%(token_type)s %(access_token)s' % token_dict
def debug_summary_state(self) -> str:
# TODO(b/343230702) - report ambient account name.
return ''
class LuciContextAuthenticator(_Authenticator):
"""_Authenticator implementation that uses LUCI_CONTEXT ambient local auth.
"""
@staticmethod
def is_applicable(*, conn: Optional[HttpConn] = None):
return auth.has_luci_context_local_auth()
def __init__(self):
self._authenticator = auth.Authenticator(' '.join(
[auth.OAUTH_SCOPE_EMAIL, auth.OAUTH_SCOPE_GERRIT]))
@property
def luci_auth(self) -> auth.Authenticator:
return self._authenticator
def authenticate(self, conn: HttpConn):
conn.req_headers[
'Authorization'] = f'Bearer {self._authenticator.get_access_token().token}'
def debug_summary_state(self) -> str:
# TODO(b/343230702) - report ambient account name.
return ''
class GitCredsAuthenticator(_Authenticator):
"""_Authenticator implementation that uses `git-credential-luci` with OAuth.
This is similar to LuciContextAuthenticator, except that it is for
local non-google.com developer credentials.
"""
def __init__(self):
self._authenticator = auth.GerritAuthenticator()
@property
def luci_auth(self) -> auth.Authenticator:
return self._authenticator
def authenticate(self, conn: HttpConn):
conn.req_headers[
'Authorization'] = f'Bearer {self._authenticator.get_access_token()}'
def debug_summary_state(self) -> str:
# TODO(b/343230702) - report ambient account name.
return ''
@classmethod
def gerrit_account_exists(cls, host: str) -> bool:
"""Return True if the Gerrit account exists.
This checks the user currently logged in with git-credential-luci.
If the user is not logged in with git-credential-luci, returns False.
This method caches positive results in the user's Git config.
"""
cwd = os.getcwd()
LOGGER.debug("Checking Gerrit account existence for %r", host)
hosts = scm.GIT.GetConfigList(cwd, 'depot-tools.hosthasaccount')
if host in hosts:
# If a user deletes their Gerrit account, then this cache
# might be stale. This should be a rare case and a user can
# just delete this from their Git config.
LOGGER.debug("Using cached account existence for Gerrit host %r",
host)
return True
try:
info = GetAccountDetails(host, authenticator=cls())
except auth.GitLoginRequiredError:
LOGGER.debug(
"Cannot check Gerrit account existence; missing git-credential-luci login"
)
return False
except GerritError as e:
if e.http_status == 400:
# This is likely because the user doesn't have an
# account on the Gerrit host.
LOGGER.debug(
"Gerrit account check returned 400; likely account missing")
return False
raise
if 'email' not in info:
LOGGER.debug("Gerrit account does not exist on %r", host)
return False
LOGGER.debug("Gerrit account exists on %r", host)
try:
scm.GIT.SetConfig(cwd,
'depot-tools.hostHasAccount',
host,
append=True)
except subprocess2.CalledProcessError as e:
# This may be called outside of a Git repository (e.g., when
# fetching from scratch), in which case we don't have a Git
# repository to cache the results of our check, so skip the
# caching.
LOGGER.debug(
"Got error trying to cache 'depot-tools.hostHasAccount': %s", e)
return True
def is_applicable(self, *, conn: Optional[HttpConn] = None):
return self.gerrit_account_exists(conn.host)
class NoAuthenticator(_Authenticator):
"""_Authenticator implementation that does no auth.
"""
@staticmethod
def is_applicable(*, conn: Optional[HttpConn] = None):
return True
def authenticate(self, conn: HttpConn):
pass
def debug_summary_state(self) -> str:
return ''
class ChainedAuthenticator(_Authenticator):
"""_Authenticator that delegates to others in sequence.
    Authenticators in the chain should implement the method `is_applicable`.
"""
def __init__(self, authenticators: List[_Authenticator]):
self.authenticators = list(authenticators)
def is_applicable(self, *, conn: Optional[HttpConn] = None) -> bool:
return bool(any(
a.is_applicable(conn=conn) for a in self.authenticators))
def authenticate(self, conn: HttpConn):
for a in self.authenticators:
if a.is_applicable(conn=conn):
a.authenticate(conn)
break
else:
raise ValueError(
f'{self!r} has no applicable authenticator for {conn!r}')
def debug_summary_state(self) -> str:
return ''
class ReqParams(TypedDict):
uri: str
method: str
headers: Dict[str, str]
body: Optional[str]
class HttpConn(httplib2.Http):
"""HttpConn is an httplib2.Http with additional request-specific fields."""
def __init__(self, *args, req_host: str, req_uri: str, req_method: str,
req_headers: Dict[str, str], req_body: Optional[str],
**kwargs) -> None:
self.req_host = req_host
self.req_uri = req_uri
self.req_method = req_method
self.req_headers = req_headers
self.req_body = req_body
super().__init__(*args, **kwargs)
@property
def req_params(self) -> ReqParams:
return {
'uri': self.req_uri,
'method': self.req_method,
'headers': self.req_headers,
'body': self.req_body,
}
# NOTE: We want to use HttpConn with CookieJar.add_cookie_header, so have
# compatible interface for that here.
#
# NOTE: Someone should really normalize this 'HttpConn' and httplib2
# implementation to just be plain python3 stdlib instead. All of this was
# written during the bad old days of python2.6/2.7, pre-vpython.
def has_header(self, header: str) -> bool:
return header in self.req_headers
def get_full_url(self) -> str:
return self.req_uri
def get_header(self,
header: str,
default: Optional[str] = None) -> Optional[str]:
return self.req_headers.get(header, default)
def add_unredirected_header(self, header: str, value: str):
# NOTE: httplib2 does not support unredirected headers.
self.req_headers[header] = value
@property
def unverifiable(self) -> bool:
return False
@property
def origin_req_host(self) -> str:
return self.req_host
@property
def type(self) -> str:
return urllib.parse.urlparse(self.req_uri).scheme
@property
def host(self) -> str:
return self.req_host
def CreateHttpConn(host: str,
path: str,
reqtype='GET',
headers: Optional[Dict[str, str]] = None,
body: Optional[Dict] = None,
timeout=300,
*,
authenticator: Optional[_Authenticator] = None) -> HttpConn:
"""Opens an HTTPS connection to a Gerrit service, and sends a request."""
headers = headers or {}
bare_host = host.partition(':')[0]
url = path
if not url.startswith('/'):
url = '/' + url
if not url.startswith('/a/'):
url = '/a%s' % url
rendered_body: Optional[str] = None
if body:
rendered_body = json.dumps(body, sort_keys=True)
headers.setdefault('Content-Type', 'application/json')
uri = urllib.parse.urljoin(f'{GERRIT_PROTOCOL}://{host}', url)
conn = HttpConn(timeout=timeout,
req_host=host,
req_uri=uri,
req_method=reqtype,
req_headers=headers,
req_body=rendered_body)
if authenticator is None:
authenticator = _Authenticator.get()
# TODO(crbug.com/1059384): Automatically detect when running on cloudtop.
if isinstance(authenticator, GceAuthenticator):
print('If you\'re on a cloudtop instance, export '
'SKIP_GCE_AUTH_FOR_GIT=1 in your env.')
authenticator.authenticate(conn)
if 'Authorization' not in conn.req_headers:
LOGGER.debug('No authorization found for %s.' % bare_host)
if LOGGER.isEnabledFor(logging.DEBUG):
LOGGER.debug('%s %s', conn.req_method, conn.req_uri)
LOGGER.debug('conn.proxy_info=%r', conn.proxy_info)
for key, val in conn.req_headers.items():
if key in ('Authorization', 'Cookie'):
val = 'HIDDEN'
LOGGER.debug('%s: %s', key, val)
if conn.req_body:
LOGGER.debug(conn.req_body)
return conn
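# Illustrative call (hypothetical host):
#   CreateHttpConn('chromium-review.googlesource.com', 'changes/?q=status:open')
# targets https://chromium-review.googlesource.com/a/changes/?q=status:open --
# note the '/a/' prefix, which requests Gerrit's authenticated endpoints.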
def ReadHttpResponse(conn: HttpConn,
accept_statuses: Container[int] = frozenset([200]),
max_tries=TRY_LIMIT):
"""Reads an HTTP response from a connection into a string buffer.
Args:
conn: An Http object created by CreateHttpConn above.
accept_statuses: Treat any of these statuses as success. Default: [200]
Common additions include 204, 400, and 404.
max_tries: The maximum number of times the request should be attempted.
Returns:
A string buffer containing the connection's reply.
"""
response = contents = None
sleep_time = SLEEP_TIME
for idx in range(max_tries):
before_response = time.time()
try:
response, contents = conn.request(**conn.req_params)
except socket.timeout:
if idx < max_tries - 1:
sleep_time = log_retry_and_sleep(sleep_time, idx, max_tries)
continue
raise
contents = contents.decode('utf-8', 'replace')
response_time = time.time() - before_response
metrics.collector.add_repeated(
'http_requests',
metrics_utils.extract_http_metrics(conn.req_params['uri'],
conn.req_params['method'],
response.status, response_time))
# If response.status is an accepted status,
# or response.status < 500 then the result is final; break retry loop.
# If the response is 404/409 it might be because of replication lag,
# so keep trying anyway. If it is 429, it is generally ok to retry after
# a backoff.
if (response.status in accept_statuses or response.status < 500
and response.status not in [404, 409, 429]):
LOGGER.debug('got response %d for %s %s', response.status,
conn.req_params['method'], conn.req_params['uri'])
# If 404 was in accept_statuses, then it's expected that the file
# might not exist, so don't return the gitiles error page because
# that's not the "content" that was actually requested.
if response.status == 404:
contents = ''
break
# A status >=500 is assumed to be a possible transient error; retry.
http_version = 'HTTP/%s' % ('1.1' if response.version == 11 else '1.0')
LOGGER.warning(
'A transient error occurred while querying %s:\n'
'%s %s %s\n'
'%s %d %s\n'
'%s', conn.req_host, conn.req_params['method'],
conn.req_params['uri'], http_version, http_version, response.status,
response.reason, contents)
if idx < max_tries - 1:
sleep_time = log_retry_and_sleep(sleep_time, idx, max_tries)
# end of retries loop
# Help the type checker a bit here - it can't figure out the `except` logic
# in the loop above.
assert response, (
'Impossible: End of retry loop without response or exception.')
if response.status in accept_statuses:
return StringIO(contents)
if response.status in (302, 401, 403):
www_authenticate = response.get('www-authenticate')
if not www_authenticate:
print('Your Gerrit credentials might be misconfigured.')
elif not newauth.Enabled():
auth_match = re.search('realm="([^"]+)"', www_authenticate, re.I)
host = auth_match.group(1) if auth_match else conn.req_host
new_password_url = CookiesAuthenticator.get_new_password_url(host)
print('Authentication failed. Please make sure your .gitcookies '
f'file has credentials for {host}.')
print(f'(Re)generate credentials here: {new_password_url}')
print('Try:\n git cl creds-check')
reason = '%s: %s' % (response.reason, contents)
raise GerritError(response.status, reason)
def ReadHttpJsonResponse(conn,
accept_statuses: Container[int] = frozenset([200]),
max_tries=TRY_LIMIT) -> dict:
"""Parses an https response as json."""
fh = ReadHttpResponse(conn, accept_statuses, max_tries)
# The first line of the response should always be: )]}'
s = fh.readline()
if s and s.rstrip() != ")]}'":
raise GerritError(200, 'Unexpected json output: %s' % s[:100])
s = fh.read()
if not s:
return {}
return json.loads(s)
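# Illustrative raw Gerrit response body, showing the XSSI-protection prefix
# stripped above (payload is made up):
#   )]}'
#   {"_number": 12345, "status": "NEW"}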
def CallGerritApi(host, path, **kwargs):
"""Helper for calling a Gerrit API that returns a JSON response."""
conn_kwargs = {}
conn_kwargs.update(
(k, kwargs[k]) for k in ['reqtype', 'headers', 'body'] if k in kwargs)
conn = CreateHttpConn(host, path, **conn_kwargs)
read_kwargs = {}
read_kwargs.update(
(k, kwargs[k]) for k in ['accept_statuses'] if k in kwargs)
return ReadHttpJsonResponse(conn, **read_kwargs)
def QueryChanges(host,
params,
first_param=None,
limit=None,
o_params=None,
start=None):
"""
Queries a gerrit-on-borg server for changes matching query terms.
Args:
params: A list of key:value pairs for search parameters, as documented
here (e.g. ('is', 'owner') for a parameter 'is:owner'):
https://gerrit-review.googlesource.com/Documentation/user-search.html#search-operators
first_param: A change identifier
limit: Maximum number of results to return.
start: how many changes to skip (starting with the most recent)
o_params: A list of additional output specifiers, as documented here:
https://gerrit-review.googlesource.com/Documentation/rest-api-changes.html#list-changes
Returns:
A list of json-decoded query results.
"""
# Note that no attempt is made to escape special characters; YMMV.
if not params and not first_param:
raise RuntimeError('QueryChanges requires search parameters')
path = 'changes/?q=%s' % _QueryString(params, first_param)
if start:
path = '%s&start=%s' % (path, start)
if limit:
path = '%s&n=%d' % (path, limit)
if o_params:
path = '%s&%s' % (path, '&'.join(['o=%s' % p for p in o_params]))
return ReadHttpJsonResponse(CreateHttpConn(host, path, timeout=30))
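# Illustrative request path (hypothetical values):
#   QueryChanges(host, [('is', 'owner'), ('status', 'open')], limit=10,
#                o_params=['CURRENT_REVISION'])
# issues GET changes/?q=is:owner+status:open&n=10&o=CURRENT_REVISION.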
def GenerateAllChanges(host,
params,
first_param=None,
limit=500,
o_params=None,
start=None):
"""Queries a gerrit-on-borg server for all the changes matching the query
terms.
WARNING: this is unreliable if a change matching the query is modified while
this function is being called.
A single query to gerrit-on-borg is limited on the number of results by the
limit parameter on the request (see QueryChanges) and the server maximum
limit.
Args:
params, first_param: Refer to QueryChanges().
limit: Maximum number of requested changes per query.
o_params: Refer to QueryChanges().
start: Refer to QueryChanges().
Returns:
A generator object to the list of returned changes.
"""
already_returned = set()
def at_most_once(cls):
for cl in cls:
if cl['_number'] not in already_returned:
already_returned.add(cl['_number'])
yield cl
start = start or 0
cur_start = start
more_changes = True
while more_changes:
        # This will fetch changes[start..start+limit] sorted by most recently
        # updated. Since the rank of any change in this list can be changed
        # any time (say a user posts a comment), subsequent calls may overlap
        # like this:
        #   > initial order ABCDEFGH
        #   query[0..3] => ABC
        #   > E gets updated. New order: EABCDFGH
        #   query[3..6] => CDF  # C is a dup
        #   query[6..9] => GH   # E is missed
page = QueryChanges(host, params, first_param, limit, o_params,
cur_start)
for cl in at_most_once(page):
yield cl
more_changes = [cl for cl in page if '_more_changes' in cl]
if len(more_changes) > 1:
raise GerritError(
200,
'Received %d changes with a _more_changes attribute set but should '
'receive at most one.' % len(more_changes))
if more_changes:
cur_start += len(page)
# If we paged through, query again the first page which in most
# circumstances will fetch all changes that were modified while this
# function was run.
if start != cur_start:
page = QueryChanges(host, params, first_param, limit, o_params, start)
for cl in at_most_once(page):
yield cl
def MultiQueryChanges(host,
params,
change_list,
limit=None,
o_params=None,
start=None):
"""Initiate a query composed of multiple sets of query parameters."""
if not change_list:
raise RuntimeError(
"MultiQueryChanges requires a list of change numbers/id's")
q = [
'q=%s' % '+OR+'.join([urllib.parse.quote(str(x)) for x in change_list])
]
if params:
q.append(_QueryString(params))
if limit:
q.append('n=%d' % limit)
if start:
q.append('S=%s' % start)
if o_params:
q.extend(['o=%s' % p for p in o_params])
path = 'changes/?%s' % '&'.join(q)
try:
result = ReadHttpJsonResponse(CreateHttpConn(host, path))
except GerritError as e:
msg = '%s:\n%s' % (e.message, path)
raise GerritError(e.http_status, msg)
return result
def GetGerritFetchUrl(host):
"""Given a Gerrit host name returns URL of a Gerrit instance to fetch from."""
return '%s://%s/' % (GERRIT_PROTOCOL, host)
def GetCodeReviewTbrScore(host, project):
"""Given a Gerrit host name and project, return the Code-Review score for TBR.
"""
conn = CreateHttpConn(host,
'/projects/%s' % urllib.parse.quote(project, ''))
project = ReadHttpJsonResponse(conn)
if ('labels' not in project or 'Code-Review' not in project['labels']
or 'values' not in project['labels']['Code-Review']):
return 1
return max([int(x) for x in project['labels']['Code-Review']['values']])
def GetChangePageUrl(host, change_number):
"""Given a Gerrit host name and change number, returns change page URL."""
return '%s://%s/#/c/%d/' % (GERRIT_PROTOCOL, host, change_number)
def GetChangeUrl(host, change):
"""Given a Gerrit host name and change ID, returns a URL for the change."""
return '%s://%s/a/changes/%s' % (GERRIT_PROTOCOL, host, change)
def GetChange(host, change, accept_statuses: Container[int] = frozenset([200])):
"""Queries a Gerrit server for information about a single change."""
path = 'changes/%s' % change
return ReadHttpJsonResponse(CreateHttpConn(host, path),
accept_statuses=accept_statuses)
def GetChangeDetail(host, change, o_params=None):
"""Queries a Gerrit server for extended information about a single change."""
path = 'changes/%s/detail' % change
if o_params:
path += '?%s' % '&'.join(['o=%s' % p for p in o_params])
return ReadHttpJsonResponse(CreateHttpConn(host, path))
def GetChangeCommit(host: str, change: str, revision: str = 'current') -> dict:
"""Query a Gerrit server for a revision associated with a change."""
path = 'changes/%s/revisions/%s/commit?links' % (change, revision)
return ReadHttpJsonResponse(CreateHttpConn(host, path))
def GetChangeCurrentRevision(host, change):
"""Get information about the latest revision for a given change."""
return QueryChanges(host, [], change, o_params=('CURRENT_REVISION', ))
def GetChangeRevisions(host, change):
"""Gets information about all revisions associated with a change."""
return QueryChanges(host, [], change, o_params=('ALL_REVISIONS', ))
def GetChangeReview(host, change, revision=None):
"""Gets the current review information for a change."""
if not revision:
jmsg = GetChangeRevisions(host, change)
if not jmsg:
return None
if len(jmsg) > 1:
raise GerritError(
200, 'Multiple changes found for ChangeId %s.' % change)
revision = jmsg[0]['current_revision']
    path = 'changes/%s/revisions/%s/review' % (change, revision)
    return ReadHttpJsonResponse(CreateHttpConn(host, path))
def GetChangeComments(host, change):
"""Get the line- and file-level comments on a change."""
path = 'changes/%s/comments' % change
return ReadHttpJsonResponse(CreateHttpConn(host, path))
def GetChangeRobotComments(host, change):
"""Gets the line- and file-level robot comments on a change."""
path = 'changes/%s/robotcomments' % change
return ReadHttpJsonResponse(CreateHttpConn(host, path))
def GetRelatedChanges(host, change, revision='current'):
"""Gets the related changes for a given change and revision."""
path = 'changes/%s/revisions/%s/related' % (change, revision)
return ReadHttpJsonResponse(CreateHttpConn(host, path))
def AbandonChange(host, change, msg=''):
"""Abandons a Gerrit change."""
path = 'changes/%s/abandon' % change
body = {'message': msg} if msg else {}
conn = CreateHttpConn(host, path, reqtype='POST', body=body)
return ReadHttpJsonResponse(conn)
def MoveChange(host, change, destination_branch):
"""Move a Gerrit change to different destination branch."""
path = 'changes/%s/move' % change
body = {'destination_branch': destination_branch, 'keep_all_votes': True}
conn = CreateHttpConn(host, path, reqtype='POST', body=body)
return ReadHttpJsonResponse(conn)
def RestoreChange(host, change, msg=''):
"""Restores a previously abandoned change."""
path = 'changes/%s/restore' % change
body = {'message': msg} if msg else {}
conn = CreateHttpConn(host, path, reqtype='POST', body=body)
return ReadHttpJsonResponse(conn)
def RebaseChange(host, change, base=None):
"""Rebases a change."""
path = f'changes/{change}/rebase'
body = {'base': base} if base else {}
conn = CreateHttpConn(host, path, reqtype='POST', body=body)
# If a rebase fails due to a merge conflict, Gerrit returns 409. Retrying
# more than once probably won't help since the merge conflict will still
# exist.
return ReadHttpJsonResponse(conn, max_tries=2)
def SubmitChange(host, change):
"""Submits a Gerrit change via Gerrit."""
path = 'changes/%s/submit' % change
conn = CreateHttpConn(host, path, reqtype='POST')
# If a submit fails due to a merge conflict, Gerrit returns 409. Retrying
# more than once probably won't help since the merge conflict will still
# exist.
return ReadHttpJsonResponse(conn, max_tries=2)
def GetChangesSubmittedTogether(host, change):
"""Get all changes submitted with the given one."""
path = 'changes/%s/submitted_together?o=NON_VISIBLE_CHANGES' % change
conn = CreateHttpConn(host, path, reqtype='GET')
return ReadHttpJsonResponse(conn)
def PublishChangeEdit(host, change, notify=True):
"""Publish a Gerrit change edit."""
path = 'changes/%s/edit:publish' % change
body = {'notify': 'ALL' if notify else 'NONE'}
conn = CreateHttpConn(host, path, reqtype='POST', body=body)
return ReadHttpJsonResponse(conn, accept_statuses=(204, ))
def ChangeEdit(host, change, path, data):
"""Puts content of a file into a change edit."""
path = 'changes/%s/edit/%s' % (change, urllib.parse.quote(path, ''))
body = {
'binary_content':
'data:text/plain;base64,%s' %
base64.b64encode(data.encode('utf-8')).decode('utf-8')
}
conn = CreateHttpConn(host, path, reqtype='PUT', body=body)
return ReadHttpJsonResponse(conn, accept_statuses=(204, 409))
def SetChangeEditMessage(host, change, message):
"""Sets the commit message of a change edit."""
path = 'changes/%s/edit:message' % change
body = {'message': message}
conn = CreateHttpConn(host, path, reqtype='PUT', body=body)
return ReadHttpJsonResponse(conn, accept_statuses=(204, 409))
def HasPendingChangeEdit(host, change):
conn = CreateHttpConn(host, 'changes/%s/edit' % change)
try:
ReadHttpResponse(conn)
except GerritError as e:
# 204 No Content means no pending change.
if e.http_status == 204:
return False
raise
return True
def DeletePendingChangeEdit(host, change):
conn = CreateHttpConn(host, 'changes/%s/edit' % change, reqtype='DELETE')
# On success, Gerrit returns status 204; if the edit was already deleted it
# returns 404. Anything else is an error.
ReadHttpResponse(conn, accept_statuses=[204, 404])
def CherryPick(host, change, destination, revision='current', message=None):
"""Create a cherry-pick commit from the given change, onto the given
destination.
"""
path = 'changes/%s/revisions/%s/cherrypick' % (change, revision)
body = {'destination': destination}
if message:
body['message'] = message
conn = CreateHttpConn(host, path, reqtype='POST', body=body)
# If a cherry pick fails due to a merge conflict, Gerrit returns 409.
# Retrying more than once probably won't help since the merge conflict will
# still exist.
return ReadHttpJsonResponse(conn, max_tries=2)
def CherryPickCommit(host, project, commit, destination):
"""Cherry-pick a commit from a project to a destination branch."""
project = urllib.parse.quote(project, '')
path = f'projects/{project}/commits/{commit}/cherrypick'
body = {'destination': destination}
conn = CreateHttpConn(host, path, reqtype='POST', body=body)
return ReadHttpJsonResponse(conn)
def GetFileContents(host, change, path):
"""Get the contents of a file with the given path in the given revision.
Returns:
A bytes object with the file's contents.
"""
path = 'changes/%s/revisions/current/files/%s/content' % (
change, urllib.parse.quote(path, ''))
conn = CreateHttpConn(host, path, reqtype='GET')
return base64.b64decode(ReadHttpResponse(conn).read())
def SetCommitMessage(host, change, description, notify='ALL'):
"""Updates a commit message."""
assert notify in ('ALL', 'NONE')
path = 'changes/%s/message' % change
body = {'message': description, 'notify': notify}
conn = CreateHttpConn(host, path, reqtype='PUT', body=body)
try:
ReadHttpResponse(conn, accept_statuses=[200, 204])
except GerritError as e:
raise GerritError(
e.http_status,
'Received unexpected http status while editing message '
'in change %s' % change)
def GetCommitIncludedIn(host, project, commit):
"""Retrieves the branches and tags for a given commit.
https://gerrit-review.googlesource.com/Documentation/rest-api-projects.html#get-included-in
Returns:
A JSON object with keys of 'branches' and 'tags'.
"""
path = 'projects/%s/commits/%s/in' % (urllib.parse.quote(project,
''), commit)
conn = CreateHttpConn(host, path, reqtype='GET')
return ReadHttpJsonResponse(conn, accept_statuses=[200])
def IsCodeOwnersEnabledOnHost(host):
"""Check if the code-owners plugin is enabled for the host."""
path = 'config/server/capabilities'
capabilities = ReadHttpJsonResponse(CreateHttpConn(host, path))
return 'code-owners-checkCodeOwner' in capabilities
def IsCodeOwnersEnabledOnRepo(host, repo):
"""Check if the code-owners plugin is enabled for the repo."""
repo = PercentEncodeForGitRef(repo)
path = '/projects/%s/code_owners.project_config' % repo
config = ReadHttpJsonResponse(CreateHttpConn(host, path))
return not config['status'].get('disabled', False)
def GetOwnersForFile(host,
project,
branch,
path,
limit=100,
resolve_all_users=True,
highest_score_only=False,
seed=None,
o_params=('DETAILS', )):
"""Gets information about owners attached to a file."""
path = 'projects/%s/branches/%s/code_owners/%s' % (urllib.parse.quote(
project, ''), urllib.parse.quote(branch,
''), urllib.parse.quote(path, ''))
q = ['resolve-all-users=%s' % json.dumps(resolve_all_users)]
if highest_score_only:
q.append('highest-score-only=%s' % json.dumps(highest_score_only))
if seed:
q.append('seed=%d' % seed)
if limit:
q.append('n=%d' % limit)
if o_params:
q.extend(['o=%s' % p for p in o_params])
if q:
path = '%s?%s' % (path, '&'.join(q))
return ReadHttpJsonResponse(CreateHttpConn(host, path))
def GetReviewers(host, change):
"""Gets information about all reviewers attached to a change."""
path = 'changes/%s/reviewers' % change
return ReadHttpJsonResponse(CreateHttpConn(host, path))
def GetReview(host, change, revision):
"""Gets review information about a specific revision of a change."""
path = 'changes/%s/revisions/%s/review' % (change, revision)
return ReadHttpJsonResponse(CreateHttpConn(host, path))
def AddReviewers(host,
change,
reviewers=None,
ccs=None,
notify=True,
accept_statuses: Container[int] = frozenset([200, 400, 422])):
"""Add reviewers to a change."""
if not reviewers and not ccs:
return None
if not change:
return None
reviewers = frozenset(reviewers or [])
ccs = frozenset(ccs or [])
path = 'changes/%s/revisions/current/review' % change
body = {
'drafts': 'KEEP',
'reviewers': [],
'notify': 'ALL' if notify else 'NONE',
}
for r in sorted(reviewers | ccs):
state = 'REVIEWER' if r in reviewers else 'CC'
body['reviewers'].append({
'reviewer': r,
'state': state,
'notify': 'NONE', # We handled `notify` argument above.
})
conn = CreateHttpConn(host, path, reqtype='POST', body=body)
# Gerrit will return 400 if one or more of the requested reviewers are
# unprocessable. We read the response object to see which were rejected,
# warn about them, and retry with the remainder.
resp = ReadHttpJsonResponse(conn, accept_statuses=accept_statuses)
errored = set()
for result in resp.get('reviewers', {}).values():
r = result.get('input')
state = 'REVIEWER' if r in reviewers else 'CC'
if result.get('error'):
errored.add(r)
LOGGER.warning('Note: "%s" not added as a %s' % (r, state.lower()))
if errored:
# Try again, adding only those that didn't fail, and only accepting 200.
AddReviewers(host,
change,
reviewers=(reviewers - errored),
ccs=(ccs - errored),
notify=notify,
accept_statuses=[200])
def SetReview(host,
change,
revision='current',
msg=None,
labels=None,
notify=None,
ready=None,
automatic_attention_set_update: Optional[bool] = None):
"""Sets labels and/or adds a message to a code review.
https://gerrit-review.googlesource.com/Documentation/rest-api-changes.html#set-review
"""
if not msg and not labels:
return
path = f'changes/{change}/revisions/{revision}/review'
body: Dict[str, Any] = {'drafts': 'KEEP'}
if msg:
body['message'] = msg
if labels:
body['labels'] = labels
if notify is not None:
body['notify'] = 'ALL' if notify else 'NONE'
if ready:
body['ready'] = True
if automatic_attention_set_update is not None:
body[
'ignore_automatic_attention_set_rules'] = not automatic_attention_set_update
conn = CreateHttpConn(host, path, reqtype='POST', body=body)
response = ReadHttpJsonResponse(conn)
if labels:
for key, val in labels.items():
            if ('labels' not in response or key not in response['labels']
                    or int(response['labels'][key]) != int(val)):
raise GerritError(
200,
'Unable to set "%s" label on change %s.' % (key, change))
return response
def ResetReviewLabels(host,
change,
label,
value='0',
message=None,
notify=None):
"""Resets the value of a given label for all reviewers on a change."""
# This is tricky, because we want to work on the "current revision", but
# there's always the risk that "current revision" will change in between
# API calls. So, we check "current revision" at the beginning and end; if
# it has changed, raise an exception.
jmsg = GetChangeCurrentRevision(host, change)
if not jmsg:
raise GerritError(
200, 'Could not get review information for change "%s"' % change)
value = str(value)
revision = jmsg[0]['current_revision']
path = 'changes/%s/revisions/%s/review' % (change, revision)
message = message or ('%s label set to %s programmatically.' %
(label, value))
jmsg = GetReview(host, change, revision)
if not jmsg:
raise GerritError(
200, 'Could not get review information for revision %s '
'of change %s' % (revision, change))
for review in jmsg.get('labels', {}).get(label, {}).get('all', []):
if str(review.get('value', value)) != value:
body = {
'drafts': 'KEEP',
'message': message,
'labels': {
label: value
},
'on_behalf_of': review['_account_id'],
}
if notify:
body['notify'] = notify
conn = CreateHttpConn(host, path, reqtype='POST', body=body)
response = ReadHttpJsonResponse(conn)
if str(response['labels'][label]) != value:
username = review.get('email', jmsg.get('name', ''))
raise GerritError(
200, 'Unable to set %s label for user "%s"'
' on change %s.' % (label, username, change))
jmsg = GetChangeCurrentRevision(host, change)
if not jmsg:
raise GerritError(
200, 'Could not get review information for change "%s"' % change)
if jmsg[0]['current_revision'] != revision:
raise GerritError(
200, 'While resetting labels on change "%s", '
'a new patchset was uploaded.' % change)
def CreateChange(host, project, branch='main', subject='', params=()):
"""
Creates a new change.
Args:
        params: A list of additional ChangeInput specifiers, as documented here
            (e.g. ('is_private', 'true') to mark the change private):
https://gerrit-review.googlesource.com/Documentation/rest-api-changes.html#change-input
Returns:
ChangeInfo for the new change.
"""
path = 'changes/'
body = {'project': project, 'branch': branch, 'subject': subject}
body.update(dict(params))
for key in 'project', 'branch', 'subject':
if not body[key]:
raise GerritError(200, '%s is required' % key.title())
conn = CreateHttpConn(host, path, reqtype='POST', body=body)
return ReadHttpJsonResponse(conn, accept_statuses=[201])
def CreateGerritBranch(host, project, branch, commit):
"""Creates a new branch from given project and commit
https://gerrit-review.googlesource.com/Documentation/rest-api-projects.html#create-branch
Returns:
A JSON object with 'ref' key.
"""
path = 'projects/%s/branches/%s' % (project, branch)
body = {'revision': commit}
conn = CreateHttpConn(host, path, reqtype='PUT', body=body)
response = ReadHttpJsonResponse(conn, accept_statuses=[201, 409])
if response:
return response
raise GerritError(200, 'Unable to create gerrit branch')
def CreateGerritTag(host, project, tag, commit):
"""Creates a new tag at the given commit.
https://gerrit-review.googlesource.com/Documentation/rest-api-projects.html#create-tag
Returns:
A JSON object with 'ref' key.
"""
path = 'projects/%s/tags/%s' % (project, tag)
body = {'revision': commit}
conn = CreateHttpConn(host, path, reqtype='PUT', body=body)
response = ReadHttpJsonResponse(conn, accept_statuses=[201])
if response:
return response
raise GerritError(200, 'Unable to create gerrit tag')
def GetHead(host, project):
"""Retrieves current HEAD of Gerrit project
https://gerrit-review.googlesource.com/Documentation/rest-api-projects.html#get-head
Returns:
A JSON object with 'ref' key.
"""
path = 'projects/%s/HEAD' % (project)
conn = CreateHttpConn(host, path, reqtype='GET')
response = ReadHttpJsonResponse(conn, accept_statuses=[200])
if response:
return response
    raise GerritError(200, 'Unable to get gerrit HEAD')
def UpdateHead(host, project, branch):
"""Updates Gerrit HEAD to point to branch
https://gerrit-review.googlesource.com/Documentation/rest-api-projects.html#set-head
Returns:
A JSON object with 'ref' key.
"""
path = 'projects/%s/HEAD' % (project)
body = {'ref': branch}
conn = CreateHttpConn(host, path, reqtype='PUT', body=body)
response = ReadHttpJsonResponse(conn, accept_statuses=[200])
if response:
return response
raise GerritError(200, 'Unable to update gerrit HEAD')
def GetGerritBranch(host, project, branch):
"""Gets a branch info from given project and branch name.
See:
https://gerrit-review.googlesource.com/Documentation/rest-api-projects.html#get-branch
Returns:
A JSON object with 'revision' key if the branch exists, otherwise None.
"""
path = 'projects/%s/branches/%s' % (project, branch)
conn = CreateHttpConn(host, path, reqtype='GET')
return ReadHttpJsonResponse(conn, accept_statuses=[200, 404])
def GetProjectHead(host, project):
conn = CreateHttpConn(host,
'/projects/%s/HEAD' % urllib.parse.quote(project, ''))
return ReadHttpJsonResponse(conn, accept_statuses=[200])
def GetAccountDetails(host,
account_id='self',
*,
authenticator: Optional[_Authenticator] = None):
"""Returns details of the account.
If account_id is not given, uses magic value 'self' which corresponds to
whichever account user is authenticating as.
Documentation:
https://gerrit-review.googlesource.com/Documentation/rest-api-accounts.html#get-account
Returns None if account is not found (i.e., Gerrit returned 404).
"""
conn = CreateHttpConn(host,
'/accounts/%s' % account_id,
authenticator=authenticator)
return ReadHttpJsonResponse(conn, accept_statuses=[200, 404])
class EmailRecord(TypedDict):
email: str
preferred: bool # This should be NotRequired[bool] in 3.11+
def GetAccountEmails(host,
account_id='self',
*,
authenticator: Optional[_Authenticator] = None
) -> Optional[List[EmailRecord]]:
"""Returns all emails for this account, and an indication of which of these
is preferred.
If account_id is not given, uses magic value 'self' which corresponds to
whichever account user is authenticating as.
Requires Modify Account permission to view emails other than 'self'.
Documentation:
https://gerrit-review.googlesource.com/Documentation/rest-api-accounts.html#list-account-emails
Returns None if account is not found (i.e. Gerrit returned 404).
"""
conn = CreateHttpConn(host,
'/accounts/%s/emails' % account_id,
authenticator=authenticator)
resp = ReadHttpJsonResponse(conn, accept_statuses=[200, 404])
if resp is None:
return None
return cast(List[EmailRecord], resp)
def ValidAccounts(host, accounts, max_threads=10):
"""Returns a mapping from valid account to its details.
Invalid accounts, either not existing or without unique match,
are not present as returned dictionary keys.
"""
assert not isinstance(accounts, str), type(accounts)
accounts = list(set(accounts))
if not accounts:
return {}
def get_one(account):
try:
return account, GetAccountDetails(host, account)
except GerritError:
return None, None
valid = {}
with contextlib.closing(ThreadPool(min(max_threads,
len(accounts)))) as pool:
for account, details in pool.map(get_one, accounts):
if account and details:
valid[account] = details
return valid
def PercentEncodeForGitRef(original):
"""Applies percent-encoding for strings sent to Gerrit via git ref metadata.
The encoding used is based on but stricter than URL encoding (Section 2.1 of
RFC 3986). The only non-escaped characters are alphanumerics, and 'SPACE'
(U+0020) can be represented as 'LOW LINE' (U+005F) or 'PLUS SIGN' (U+002B).
For more information, see the Gerrit docs here:
https://gerrit-review.googlesource.com/Documentation/user-upload.html#message
"""
safe = 'abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ0123456789 '
encoded = ''.join(c if c in safe else '%%%02X' % ord(c) for c in original)
# Spaces are not allowed in git refs; gerrit will interpret either '_' or
# '+' (or '%20') as space. Use '_' since that has been supported the
# longest.
return encoded.replace(' ', '_')
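# Illustrative encoding: PercentEncodeForGitRef('fix: 50% done') returns
# 'fix%3A_50%25_done' -- ':' and '%' are percent-escaped, then spaces become
# '_' so the result is a valid git ref component.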
@contextlib.contextmanager
def tempdir():
tdir = None
try:
tdir = tempfile.mkdtemp(suffix='gerrit_util')
yield tdir
finally:
if tdir:
gclient_utils.rmtree(tdir)
def ChangeIdentifier(project, change_number):
"""Returns change identifier "project~number" suitable for |change| arg of
this module API.
    This format allows for more efficient Gerrit routing of HTTP requests,
    compared to specifying just change_number.
"""
assert int(change_number)
return '%s~%s' % (urllib.parse.quote(project, ''), change_number)
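# Illustrative identifier: ChangeIdentifier('chromium/src', 12345) returns
# 'chromium%2Fsrc~12345', which Gerrit can route without a change-number
# lookup.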