rhodecode-vcsserver Commit - r1152:a0c49580

lint: auto-fixes

super-admin -

r1152:a0c49580 default

parent child

vcsserver/base.py

0 +3 -3

              # RhodeCode VCSServer provides access to different vcs backends via network.
              # Copyright (C) 2014-2023 RhodeCode GmbH
              #
              # This program is free software; you can redistribute it and/or modify
              # it under the terms of the GNU General Public License as published by
              # the Free Software Foundation; either version 3 of the License, or
              # (at your option) any later version.
              #
              # This program is distributed in the hope that it will be useful,
              # but WITHOUT ANY WARRANTY; without even the implied warranty of
              # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
              # GNU General Public License for more details.
              #
              # You should have received a copy of the GNU General Public License
              # along with this program; if not, write to the Free Software Foundation,
              # Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301  USA
              import os
              import sys
              import tempfile
              import logging
              import urllib.parse
              from vcsserver.lib.rc_cache.archive_cache import get_archival_cache_store
              from vcsserver import exceptions
              from vcsserver.exceptions import NoContentException
              from vcsserver.hgcompat import archival
              from vcsserver.str_utils import safe_bytes
              from vcsserver.lib.exc_tracking import format_exc
              log = logging.getLogger(__name__)
-             class RepoFactory(object):
+             class RepoFactory:
                  """
                  Utility to create instances of repository
                  It provides internal caching of the `repo` object based on
                  the :term:`call context`.
                  """
                  repo_type = None
                  def __init__(self):
                      """Create the factory; the base class stores no instance state."""
                      pass
                  def _create_config(self, path, config):
                      config = {}
                      return config
                  def _create_repo(self, wire, create):
                      """
                      Build the backend repository object.

                      Not implemented in the base class; always raises
                      :class:`NotImplementedError`.
                      """
                      raise NotImplementedError()
                  def repo(self, wire, create=False):
                      """
                      Return a repository instance for the given `wire`.

                      Not implemented in the base class; always raises
                      :class:`NotImplementedError`.
                      """
                      raise NotImplementedError()
              def obfuscate_qs(query_string):
                  """
                  Return `query_string` with the values of sensitive keys masked.

                  The values of `auth_token` and `api_key` are replaced with `*****`.
                  Parameters whose value is empty are emitted as a bare key without `=`.
                  `None` is passed through unchanged.
                  """
                  if query_string is None:
                      return None

                  secret_keys = ['auth_token', 'api_key']
                  chunks = []
                  for name, value in urllib.parse.parse_qsl(query_string, keep_blank_values=True):
                      if name in secret_keys:
                          value = "*****"
                      # blank values collapse to just the key name
                      chunks.append(f'{name}={value}' if value else name)
                  return '&'.join(chunks)
              def raise_from_original(new_type, org_exc: Exception):
                  """
                  Re-raise the exception currently being handled as `new_type`.

                  The new exception is built from the args of the active exception
                  (taken from `sys.exc_info()`, not from `org_exc`) and is raised with
                  the original traceback attached. The formatted original traceback is
                  also stored on the new exception as `_org_exc_tb`.
                  """
                  active_exc_info = sys.exc_info()
                  _, active_exc, active_tb = active_exc_info

                  replacement = new_type(*active_exc.args)
                  # store the original traceback into the new exc
                  replacement._org_exc_tb = format_exc(active_exc_info)

                  try:
                      raise replacement.with_traceback(active_tb)
                  finally:
                      # drop the local reference to the traceback object
                      del active_tb
-             class ArchiveNode(object):
+             class ArchiveNode:
                  def __init__(self, path, mode, is_link, raw_bytes):
                      self.path = path
                      self.mode = mode
                      self.is_link = is_link
                      self.raw_bytes = raw_bytes
              def store_archive_in_cache(node_walker, archive_key, kind, mtime, archive_at_path, archive_dir_name,
                                         commit_id, write_metadata=True, extra_metadata=None, cache_config=None):
                  """
                  Generate an archive and store it in the dedicated archive cache store
                  (diskcache). Returns the file name of the cached archive.

                  If `archive_key` is already present in the cache, the cached file name is
                  returned without generating anything.

                  :param node_walker: callable invoked as `node_walker(commit_id, archive_at_path)`,
                      yielding the nodes to add to the archive
                  :param archive_key: key used to store the path
                  :param kind: archive kind, one of `tgz`, `tbz2`, `zip`
                  :param mtime: time of creation
                  :param archive_at_path: default '/' the path at archive was started.
                      If this is not '/' it means it's a partial archive
                  :param archive_dir_name: inside dir name when creating an archive
                  :param commit_id: commit sha of revision archive was created at
                  :param write_metadata: when true, add an `.archival.txt` file with metadata
                  :param extra_metadata: optional dict of extra entries for `.archival.txt`
                  :param cache_config: config passed to `get_archival_cache_store`

                  walker should be a file walker, for example,

                      def node_walker(commit_id, archive_at_path):
                          for file_info in files:
                              yield ArchiveNode(fn, mode, is_link, ctx[fn].data)
                  """
                  extra_metadata = extra_metadata or {}

                  d_cache = get_archival_cache_store(config=cache_config)

                  if archive_key in d_cache:
                      with d_cache as d_cache_reader:
                          reader, tag = d_cache_reader.get(archive_key, read=True, tag=True, retry=True)
                          return reader.name

                  # Resolve the archiver before touching the filesystem, so an unsupported
                  # kind does not leave a stray temp file behind.
                  archiver_factories = {
                      'tgz': lambda path: archival.tarit(path, mtime, b"gz"),
                      'tbz2': lambda path: archival.tarit(path, mtime, b"bz2"),
                      'zip': lambda path: archival.zipit(path, mtime),
                  }
                  make_archiver = archiver_factories.get(kind)
                  if make_archiver is None:
                      raise exceptions.ArchiveException()(
                          f'Remote does not support: "{kind}" archive type.')

                  # mkstemp returns an already-open descriptor; only the path is needed
                  # here, so close it right away instead of leaking it.
                  tmp_fd, tmp_name = tempfile.mkstemp()
                  os.close(tmp_fd)
                  archive_tmp_path = safe_bytes(tmp_name)
                  log.debug('Creating new temp archive in %s', archive_tmp_path)

                  archiver = make_archiver(archive_tmp_path)

                  for f in node_walker(commit_id, archive_at_path):
                      f_path = os.path.join(safe_bytes(archive_dir_name), safe_bytes(f.path).lstrip(b'/'))
                      try:
                          archiver.addfile(f_path, f.mode, f.is_link, f.raw_bytes())
                      except NoContentException:
                          # NOTE(marcink): this is a special case for SVN so we can create "empty"
                          # directories which are not supported by archiver
                          archiver.addfile(os.path.join(f_path, b'.dir'), f.mode, f.is_link, b'')

                  if write_metadata:
                      metadata = {
                          'commit_id': commit_id,
                          'mtime': mtime,
                      }
                      metadata.update(extra_metadata)

                      meta = [safe_bytes(f"{f_name}:{value}") for f_name, value in metadata.items()]
                      f_path = os.path.join(safe_bytes(archive_dir_name), b'.archival.txt')
                      archiver.addfile(f_path, 0o644, False, b'\n'.join(meta))

                  archiver.done()

                  # ensure set & get are atomic
                  with d_cache.transact():

                      with open(archive_tmp_path, 'rb') as archive_file:
                          add_result = d_cache.set(archive_key, archive_file, read=True, tag='db-name', retry=True)
                          if not add_result:
                              log.error('Failed to store cache for key=%s', archive_key)

                      os.remove(archive_tmp_path)

                      reader, tag = d_cache.get(archive_key, read=True, tag=True, retry=True)
                      if not reader:
                          raise AssertionError(f'empty reader on key={archive_key} added={add_result}')

                      return reader.name
-             class BinaryEnvelope(object):
+             class BinaryEnvelope:
                  def __init__(self, val):
                      """Wrap `val`; the wrapped value is exposed as the `val` attribute."""
                      self.val = val
              class BytesEnvelope(bytes):
                  """
                  A `bytes` subclass that can only be created from a `bytes` instance.

                  Any other content type is rejected with :class:`TypeError`.
                  """

                  def __new__(cls, content):
                      # guard clause: refuse anything that is not already bytes
                      if not isinstance(content, bytes):
                          raise TypeError('BytesEnvelope content= param must be bytes. Use BinaryEnvelope to wrap other types')
                      return super().__new__(cls, content)
              class BinaryBytesEnvelope(BytesEnvelope):
                  """A distinct type derived from `BytesEnvelope`; adds no behaviour of its own."""
                  pass

vcsserver/config/settings_maker.py

0 +1 -1

              # Copyright (C) 2010-2023 RhodeCode GmbH
              #
              # This program is free software: you can redistribute it and/or modify
              # it under the terms of the GNU Affero General Public License, version 3
              # (only), as published by the Free Software Foundation.
              #
              # This program is distributed in the hope that it will be useful,
              # but WITHOUT ANY WARRANTY; without even the implied warranty of
              # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
              # GNU General Public License for more details.
              #
              # You should have received a copy of the GNU Affero General Public License
              # along with this program.  If not, see <http://www.gnu.org/licenses/>.
              #
              # This program is dual-licensed. If you wish to learn more about the
              # RhodeCode Enterprise Edition, including its added features, Support services,
              # and proprietary license terms, please see https://rhodecode.com/licenses/
              import os
              import textwrap
              import string
              import functools
              import logging
              import tempfile
              import logging.config
              from vcsserver.type_utils import str2bool, aslist
              log = logging.getLogger(__name__)
              # skip keys, that are set here, so we don't double process those
              set_keys = {
                  '__file__': ''
              }
-             class SettingsMaker(object):
+             class SettingsMaker:
                  def __init__(self, app_settings):
                      """
                      :param app_settings: settings mapping; it is kept by reference and
                          updated in place by `env_expand` and `make_setting`
                      """
                      self.settings = app_settings
                  @classmethod
                  def _bool_func(cls, input_val):
                      """Parse `input_val` as a boolean via `str2bool`; bytes are utf8-decoded first."""
                      # decode to str
                      text_val = input_val.decode('utf8') if isinstance(input_val, bytes) else input_val
                      return str2bool(text_val)
                  @classmethod
                  def _int_func(cls, input_val):
                      """Parse `input_val` with the builtin `int()`."""
                      return int(input_val)
                  @classmethod
                  def _list_func(cls, input_val, sep=','):
                      """Convert `input_val` to a list via `aslist`, using `sep` as the separator."""
                      return aslist(input_val, sep=sep)
                  @classmethod
                  def _string_func(cls, input_val, lower=True):
                      if lower:
                          input_val = input_val.lower()
                      return input_val
                  @classmethod
                  def _float_func(cls, input_val):
                      """Parse `input_val` with the builtin `float()`."""
                      return float(input_val)
                  @classmethod
                  def _dir_func(cls, input_val, ensure_dir=False, mode=0o755):
                      # ensure we have our dir created
                      if not os.path.isdir(input_val) and ensure_dir:
                          os.makedirs(input_val, mode=mode, exist_ok=True)
                      if not os.path.isdir(input_val):
                          raise Exception(f'Dir at {input_val} does not exist')
                      return input_val
                  @classmethod
                  def _file_path_func(cls, input_val, ensure_dir=False, mode=0o755):
                      dirname = os.path.dirname(input_val)
                      cls._dir_func(dirname, ensure_dir=ensure_dir)
                      return input_val
                  @classmethod
                  def _key_transformator(cls, key):
                      return "{}_{}".format('RC'.upper(), key.upper().replace('.', '_').replace('-', '_'))
                  def maybe_env_key(self, key):
                      # now maybe we have this KEY in env, search and use the value with higher priority.
                      transformed_key = self._key_transformator(key)
                      envvar_value = os.environ.get(transformed_key)
                      if envvar_value:
                          log.debug('using `%s` key instead of `%s` key for config', transformed_key, key)
                      return envvar_value
                  def env_expand(self):
                      """
                      Override settings with values found in matching environment variables.

                      Keys already recorded in the module-level `set_keys` are skipped;
                      every key that gets overridden is recorded there as well.
                      """
                      overrides = {}
                      for name in self.settings:
                          if name in set_keys:
                              continue
                          env_override = self.maybe_env_key(name)
                          if not env_override:
                              continue
                          overrides[name] = env_override
                          set_keys[name] = env_override

                      # replace ALL keys updated
                      self.settings.update(overrides)
                  def enable_logging(self, logging_conf=None, level='INFO', formatter='generic'):
                      """
                      Configure logging from a templated logging .ini file.

                      Does nothing unless the `logging.autoconfigure` setting is enabled.
                      The template is read from `logging_conf` (or from the
                      `logging.logging_conf_file` setting), `RC_LOGGING_LEVEL` and
                      `RC_LOGGING_FORMATTER` are substituted from the environment (falling
                      back to `level` / `formatter`), and the result is fed to
                      `logging.config.fileConfig` through a temporary file.

                      :param logging_conf: path to the logging .ini template
                      :param level: level used when `RC_LOGGING_LEVEL` is not set
                      :param formatter: formatter used when `RC_LOGGING_FORMATTER` is not set
                      :return: None
                      """

                      if not str2bool(self.settings.get('logging.autoconfigure')):
                          log.info('logging configuration based on main .ini file')
                          return

                      if logging_conf is None:
                          logging_conf = self.settings.get('logging.logging_conf_file') or ''

                      if not os.path.isfile(logging_conf):
                          log.error('Unable to setup logging based on %s, '
                                    'file does not exist.... specify path using logging.logging_conf_file= config setting. ', logging_conf)
                          return

                      with open(logging_conf, 'rt') as f:
                          ini_template = textwrap.dedent(f.read())
                          ini_template = string.Template(ini_template).safe_substitute(
                              RC_LOGGING_LEVEL=os.environ.get('RC_LOGGING_LEVEL', '') or level,
                              RC_LOGGING_FORMATTER=os.environ.get('RC_LOGGING_FORMATTER', '') or formatter
                          )

                      # The template is `str`; NamedTemporaryFile defaults to binary mode
                      # ('w+b'), which would reject it with a TypeError, so open in text mode.
                      with tempfile.NamedTemporaryFile(mode='w', prefix='rc_logging_', suffix='.ini', delete=False) as f:
                          log.info('Saved Temporary LOGGING config at %s', f.name)
                          f.write(ini_template)

                      try:
                          logging.config.fileConfig(f.name)
                      finally:
                          # remove the temp file even when the config could not be applied
                          os.remove(f.name)
                  def make_setting(self, key, default, lower=False, default_when_empty=False, parser=None):
                      input_val = self.settings.get(key, default)
                      if default_when_empty and not input_val:
                          # use default value when value is set in the config but it is empty
                          input_val = default
                      parser_func = {
                          'bool': self._bool_func,
                          'int': self._int_func,
                          'list': self._list_func,
                          'list:newline': functools.partial(self._list_func, sep='/n'),
                          'list:spacesep': functools.partial(self._list_func, sep=' '),
                          'string': functools.partial(self._string_func, lower=lower),
                          'dir': self._dir_func,
                          'dir:ensured': functools.partial(self._dir_func, ensure_dir=True),
                          'file': self._file_path_func,
                          'file:ensured': functools.partial(self._file_path_func, ensure_dir=True),
                          None: lambda i: i
                      }[parser]
                      envvar_value = self.maybe_env_key(key)
                      if envvar_value:
                          input_val = envvar_value
                          set_keys[key] = input_val
                      self.settings[key] = parser_func(input_val)
                      return self.settings[key]

vcsserver/echo_stub/echo_app.py

0 +2 -2

              # Copyright (C) 2014-2023 RhodeCode GmbH
              """
              Implementation of :class:`EchoApp`.
              This WSGI application will just echo back the data which it receives.
              """
              import logging
              log = logging.getLogger(__name__)
-             class EchoApp(object):
+             class EchoApp:
                  def __init__(self, repo_path, repo_name, config):
                      """
                      Remember `repo_path` and log the initialization.

                      `repo_name` and `config` are accepted but not used here.
                      """
                      self._repo_path = repo_path
                      log.info("EchoApp initialized for %s", repo_path)
                  def __call__(self, environ, start_response):
                      """
                      WSGI entry point: read the whole request body, discard it, and
                      answer `200 OK` with the plain-text body `ECHO`.
                      """
                      log.debug("EchoApp called for %s", self._repo_path)
                      log.debug("Content-Length: %s", environ.get('CONTENT_LENGTH'))

                      # consume the request body; its content is not used
                      environ['wsgi.input'].read()

                      start_response('200 OK', [('Content-Type', 'text/plain')])
                      return [b"ECHO"]
-             class EchoAppStream(object):
+             class EchoAppStream:
                  def __init__(self, repo_path, repo_name, config):
                      """
                      Remember `repo_path` and log the initialization.

                      `repo_name` and `config` are accepted but not used here.
                      """
                      self._repo_path = repo_path
                      # NOTE(review): the message says "EchoApp" although this is EchoAppStream
                      log.info("EchoApp initialized for %s", repo_path)
                  def __call__(self, environ, start_response):
                      """
                      WSGI entry point: read the whole request body, discard it, and
                      answer `200 OK` with a generator yielding `ECHO_STREAM` one
                      million times.
                      """
                      log.debug("EchoApp called for %s", self._repo_path)
                      log.debug("Content-Length: %s", environ.get('CONTENT_LENGTH'))

                      # consume the request body; its content is not used
                      environ['wsgi.input'].read()

                      start_response('200 OK', [('Content-Type', 'text/plain')])

                      # lazily produced response body
                      return (b"ECHO_STREAM" for _ in range(1000000))
              def create_app():
                  """
                  Build an `EchoApp` with stub arguments, so that this module can be
                  served directly by a WSGI server.
                  """
                  return EchoApp('stub_path', 'stub_name', {})

vcsserver/echo_stub/remote_wsgi.py

0 +2 -2

              # Copyright (C) 2014-2023 RhodeCode GmbH
              """
              Provides the same API as :mod:`remote_wsgi`.
              Uses the `EchoApp` instead of real implementations.
              """
              import logging
              from .echo_app import EchoApp
              from vcsserver import wsgi_app_caller
              log = logging.getLogger(__name__)
-             class GitRemoteWsgi(object):
+             class GitRemoteWsgi:
                  def handle(self, environ, input_data, *args, **kwargs):
                      """
                      Create an echo WSGI app from `*args` / `**kwargs` and run the
                      request (`environ`, `input_data`) through it via `WSGIAppCaller`.
                      """
                      echo_app = create_echo_wsgi_app(*args, **kwargs)
                      caller = wsgi_app_caller.WSGIAppCaller(echo_app)
                      return caller.handle(environ, input_data)
-             class HgRemoteWsgi(object):
+             class HgRemoteWsgi:
                  def handle(self, environ, input_data, *args, **kwargs):
                      """
                      Create an echo WSGI app from `*args` / `**kwargs` and run the
                      request (`environ`, `input_data`) through it via `WSGIAppCaller`.
                      """
                      echo_app = create_echo_wsgi_app(*args, **kwargs)
                      caller = wsgi_app_caller.WSGIAppCaller(echo_app)
                      return caller.handle(environ, input_data)
              def create_echo_wsgi_app(repo_path, repo_name, config):
                  """
                  Validate `config` and return an `EchoApp` built from the arguments.

                  :raises KeyError: when `config` fails `_assert_valid_config`
                  """
                  log.debug("Creating EchoApp WSGI application")

                  _assert_valid_config(config)

                  # Remaining items are forwarded to have the extras available
                  return EchoApp(repo_path, repo_name, config=config)
              def _assert_valid_config(config):
                  """
                  Check that `config` contains the `b'git_update_server_info'` key.

                  The check pops the key from a copy, so the passed-in mapping is left
                  untouched. A missing key surfaces as :class:`KeyError`.
                  """
                  # This is what git needs from config at this stage
                  config.copy().pop(b'git_update_server_info')

vcsserver/git_lfs/app.py

0 +4 -4

              # RhodeCode VCSServer provides access to different vcs backends via network.
              # Copyright (C) 2014-2023 RhodeCode GmbH
              #
              # This program is free software; you can redistribute it and/or modify
              # it under the terms of the GNU General Public License as published by
              # the Free Software Foundation; either version 3 of the License, or
              # (at your option) any later version.
              #
              # This program is distributed in the hope that it will be useful,
              # but WITHOUT ANY WARRANTY; without even the implied warranty of
              # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
              # GNU General Public License for more details.
              #
              # You should have received a copy of the GNU General Public License
              # along with this program; if not, write to the Free Software Foundation,
              # Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301  USA
              import re
              import logging
              from pyramid.config import Configurator
              from pyramid.response import Response, FileIter
              from pyramid.httpexceptions import (
                  HTTPBadRequest, HTTPNotImplemented, HTTPNotFound, HTTPForbidden,
                  HTTPUnprocessableEntity)
              from vcsserver.lib.rc_json import json
              from vcsserver.git_lfs.lib import OidHandler, LFSOidStore
              from vcsserver.git_lfs.utils import safe_result, get_cython_compat_decorator
              from vcsserver.str_utils import safe_int
              log = logging.getLogger(__name__)
              GIT_LFS_CONTENT_TYPE = 'application/vnd.git-lfs'  # +json ?
              GIT_LFS_PROTO_PAT = re.compile(r'^/(.+)/(info/lfs/(.+))')
              def write_response_error(http_exception, text=None):
                  """
                  Build an error response of type `http_exception` using the git-lfs
                  JSON content type.

                  :param http_exception: HTTP exception class to instantiate
                  :param text: optional message; when given it becomes the body as
                      `{'message': text}` serialized with `json.dumps`
                  :return: the instantiated exception (it is returned, not raised)
                  """
                  json_content_type = GIT_LFS_CONTENT_TYPE + '+json'

                  error_response = http_exception(content_type=json_content_type)
                  error_response.content_type = json_content_type

                  if text:
                      error_response.body = json.dumps({'message': text})

                  log.debug('LFS: writing response of type %s to client with text:%s',
                            http_exception, text)
                  return error_response
-             class AuthHeaderRequired(object):
+             class AuthHeaderRequired:
                  """
                  Decorator to check if request has proper auth-header
                  """
                  def __call__(self, func):
                      """Decorate `func`: combine it with `__wrapper` via `get_cython_compat_decorator`."""
                      return get_cython_compat_decorator(self.__wrapper, func)
                  def __wrapper(self, func, *fargs, **fkwargs):
                      """
                      Call `func` only when the request carries authorization data.

                      The request is read from `fargs[1]`, and `func` receives `fargs[1:]`.
                      Without authorization an `HTTPForbidden` error response is returned.
                      """
                      # presumably fargs[0] is supplied by get_cython_compat_decorator — TODO confirm
                      request = fargs[1]
                      if request.authorization:
                          return func(*fargs[1:], **fkwargs)
                      return write_response_error(HTTPForbidden)
              # views
              def lfs_objects(request):
                  """View for the LFS v1 objects endpoint: always answers `HTTPNotImplemented`."""
                  # indicate not supported, V1 API
                  log.warning('LFS: v1 api not supported, reporting it back to client')
                  return write_response_error(HTTPNotImplemented, 'LFS: v1 api not supported')
              @AuthHeaderRequired()
              def lfs_objects_batch(request):
                  """
                  The client sends the following information to the Batch endpoint to transfer some objects:
                      operation - Should be download or upload.
                      transfers - An optional Array of String identifiers for transfer
                          adapters that the client has configured. If omitted, the basic
                          transfer adapter MUST be assumed by the server.
                      objects - An Array of objects to download.
                      oid - String OID of the LFS object.
                      size - Integer byte size of the LFS object. Must be at least zero.

                  Returns a dict with one entry per requested object under `objects` and
                  `transfer` set to `basic`, or an `HTTPBadRequest` error response when the
                  operation is unsupported or the objects data is missing/malformed.
                  """
                  request.response.content_type = GIT_LFS_CONTENT_TYPE + '+json'
                  auth = request.authorization
                  repo = request.matchdict.get('repo')
                  data = request.json
                  operation = data.get('operation')
                  http_scheme = request.registry.git_lfs_http_scheme
                  # only the two batch operations below are handled
                  if operation not in ('download', 'upload'):
                      log.debug('LFS: unsupported operation:%s', operation)
                      return write_response_error(
-                         HTTPBadRequest, 'unsupported operation mode: `%s`' % operation)
+                         HTTPBadRequest, f'unsupported operation mode: `{operation}`')
                  if 'objects' not in data:
                      log.debug('LFS: missing objects data')
                      return write_response_error(
                          HTTPBadRequest, 'missing objects data')
                  log.debug('LFS: handling operation of type: %s', operation)
                  # build one response entry per requested object
                  objects = []
                  for o in data['objects']:
                      try:
                          oid = o['oid']
                          obj_size = o['size']
                      except KeyError:
                          log.exception('LFS, failed to extract data')
                          return write_response_error(
                              HTTPBadRequest, 'unsupported data in objects')
                      obj_data = {'oid': oid}
                      # URLs the handler gets for the object itself and for verification
                      obj_href = request.route_url('lfs_objects_oid', repo=repo, oid=oid,
                                                   _scheme=http_scheme)
                      obj_verify_href = request.route_url('lfs_objects_verify', repo=repo,
                                                          _scheme=http_scheme)
                      store = LFSOidStore(
                          oid, repo, store_location=request.registry.git_lfs_store_path)
                      handler = OidHandler(
                          store, repo, auth, oid, obj_size, obj_data,
                          obj_href, obj_verify_href)
                      # this verifies also OIDs
                      actions, errors = handler.exec_operation(operation)
                      if errors:
                          log.warning('LFS: got following errors: %s', errors)
                          obj_data['errors'] = errors
                      if actions:
                          obj_data['actions'] = actions
                      obj_data['size'] = obj_size
                      obj_data['authenticated'] = True
                      objects.append(obj_data)
                  result = {'objects': objects, 'transfer': 'basic'}
                  log.debug('LFS Response %s', safe_result(result))
                  return result
              def lfs_objects_oid_upload(request):
                  """
                  Store the request body as the LFS object identified by the `oid`
                  route parameter, copying it in 64kb chunks.

                  :return: `{'upload': 'ok'}` once the whole body has been written
                  """
                  request.response.content_type = GIT_LFS_CONTENT_TYPE + '+json'
                  matchdict = request.matchdict
                  repo = matchdict.get('repo')
                  oid = matchdict.get('oid')
                  store = LFSOidStore(
                      oid, repo, store_location=request.registry.git_lfs_store_path)
                  engine = store.get_engine(mode='wb')
                  log.debug('LFS: starting chunked write of LFS oid: %s to storage', oid)

                  body = request.environ['wsgi.input']

                  with engine as f:
                      blksize = 64 * 1024  # 64kb
                      # read in chunks as stream comes in from Gunicorn
                      # this is a specific Gunicorn support function.
                      # might work differently on waitress
                      chunk = body.read(blksize)
                      while chunk:
                          f.write(chunk)
                          chunk = body.read(blksize)

                  return {'upload': 'ok'}
              def lfs_objects_oid_download(request):
                  """
                  Serve the stored LFS object identified by the `oid` route parameter as
                  an `application/octet-stream` response.

                  Answers with an `HTTPNotFound` error response when the oid is not in
                  the store.
                  """
                  repo = request.matchdict.get('repo')
                  oid = request.matchdict.get('oid')
                  store = LFSOidStore(
                      oid, repo, store_location=request.registry.git_lfs_store_path)
                  if not store.has_oid():
                      log.debug('LFS: oid %s does not exists in store', oid)
                      return write_response_error(
-                         HTTPNotFound, 'requested file with oid `%s` not found in store' % oid)
+                         HTTPNotFound, f'requested file with oid `{oid}` not found in store')
                  # TODO(marcink): support range header ?
                  # Range: bytes=0-, `bytes=(\d+)\-.*`
                  # the file is not closed here; the open handle is handed to FileIter
                  f = open(store.oid_path, 'rb')
                  response = Response(
                      content_type='application/octet-stream', app_iter=FileIter(f))
                  response.headers.add('X-RC-LFS-Response-Oid', str(oid))
                  return response
              def lfs_objects_verify(request):
                  """
                  Verify that the object described by the JSON body (`oid`, `size`) is
                  in the store and that the stored size equals the requested size.

                  Error responses: `HTTPBadRequest` when oid/size are missing,
                  `HTTPNotFound` when the oid is not stored, `HTTPUnprocessableEntity`
                  on a size mismatch.
                  """
                  request.response.content_type = GIT_LFS_CONTENT_TYPE + '+json'
                  repo = request.matchdict.get('repo')
                  data = request.json
                  oid = data.get('oid')
                  size = safe_int(data.get('size'))
                  # NOTE(review): a size of 0 is falsy, so it is rejected here as well — confirm intended
                  if not (oid and size):
                      return write_response_error(
                          HTTPBadRequest, 'missing oid and size in request data')
                  store = LFSOidStore(
                      oid, repo, store_location=request.registry.git_lfs_store_path)
                  if not store.has_oid():
                      log.debug('LFS: oid %s does not exists in store', oid)
                      return write_response_error(
-                         HTTPNotFound, 'oid `%s` does not exists in store' % oid)
+                         HTTPNotFound, f'oid `{oid}` does not exists in store')
                  store_size = store.size_oid()
                  if store_size != size:
                      msg = 'requested file size mismatch store size:{} requested:{}'.format(
                          store_size, size)
                      return write_response_error(
                          HTTPUnprocessableEntity, msg)
                  return {'message': {'size': 'ok', 'in_store': 'ok'}}
              def lfs_objects_lock(request):
                  """View for the LFS locking endpoints: always answers `HTTPNotImplemented`."""
                  return write_response_error(
                      HTTPNotImplemented, 'GIT LFS locking api not supported')
              def not_found(request):
                  """Not-found view: answers `HTTPNotFound` in the git-lfs JSON error format."""
                  return write_response_error(
                      HTTPNotFound, 'request path not found')
              def lfs_disabled(request):
                  """View reporting that LFS is disabled: always answers `HTTPNotImplemented`."""
                  return write_response_error(
                      HTTPNotImplemented, 'GIT LFS disabled for this repo')
              def git_lfs_app(config):
                  """
                  Register the git-lfs routes and their JSON views on `config`,
                  followed by the JSON not-found view.

                  Routes and views are added in the order listed in the table below.
                  """
                  repo_prefix = '/{repo:.*?[^/]}/info/lfs'

                  # (route name, route pattern, ((view, request_method), ...))
                  route_table = (
                      # v1 API deprecation endpoint
                      ('lfs_objects', repo_prefix + '/objects',
                       ((lfs_objects, 'POST'),)),
                      # locking API
                      ('lfs_objects_lock', repo_prefix + '/locks',
                       ((lfs_objects_lock, ('POST', 'GET')),)),
                      ('lfs_objects_lock_verify', repo_prefix + '/locks/verify',
                       ((lfs_objects_lock, ('POST', 'GET')),)),
                      # batch API
                      ('lfs_objects_batch', repo_prefix + '/objects/batch',
                       ((lfs_objects_batch, 'POST'),)),
                      # oid upload/download API
                      ('lfs_objects_oid', repo_prefix + '/objects/{oid}',
                       ((lfs_objects_oid_upload, 'PUT'),
                        (lfs_objects_oid_download, 'GET'))),
                      # verification API
                      ('lfs_objects_verify', repo_prefix + '/verify',
                       ((lfs_objects_verify, 'POST'),)),
                  )

                  for route_name, pattern, views in route_table:
                      config.add_route(route_name, pattern)
                      for view, methods in views:
                          config.add_view(view, route_name=route_name,
                                          request_method=methods, renderer='json')

                  # not found handler for API
                  config.add_notfound_view(not_found, renderer='json')
              def create_app(git_lfs_enabled, git_lfs_store_path, git_lfs_http_scheme):
                  """
                  Build the WSGI application serving the Git LFS API.

                  :param git_lfs_enabled: when true the LFS routes are included, otherwise
                      only a not-found view reporting that LFS is disabled is installed
                  :param git_lfs_store_path: stored on the registry as ``git_lfs_store_path``
                  :param git_lfs_http_scheme: stored on the registry as ``git_lfs_http_scheme``
                  :return: the WSGI app produced by the configurator
                  """
                  config = Configurator()
                  if not git_lfs_enabled:
                      # not found handler for API, reporting disabled LFS support
                      config.add_notfound_view(lfs_disabled, renderer='json')
                      return config.make_wsgi_app()
                  config.include(git_lfs_app)
                  registry = config.registry
                  registry.git_lfs_store_path = git_lfs_store_path
                  registry.git_lfs_http_scheme = git_lfs_http_scheme
                  return config.make_wsgi_app()

vcsserver/git_lfs/lib.py

0 +2 -2

              # RhodeCode VCSServer provides access to different vcs backends via network.
              # Copyright (C) 2014-2023 RhodeCode GmbH
              #
              # This program is free software; you can redistribute it and/or modify
              # it under the terms of the GNU General Public License as published by
              # the Free Software Foundation; either version 3 of the License, or
              # (at your option) any later version.
              #
              # This program is distributed in the hope that it will be useful,
              # but WITHOUT ANY WARRANTY; without even the implied warranty of
              # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
              # GNU General Public License for more details.
              #
              # You should have received a copy of the GNU General Public License
              # along with this program; if not, write to the Free Software Foundation,
              # Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301  USA
              import os
              import shutil
              import logging
              from collections import OrderedDict
              log = logging.getLogger(__name__)
-             class OidHandler(object):
+             class OidHandler:
                  def __init__(self, store, repo_name, auth, oid, obj_size, obj_data, obj_href,
                               obj_verify_href=None):
                      self.current_store = store
                      self.repo_name = repo_name
                      self.auth = auth
                      self.oid = oid
                      self.obj_size = obj_size
                      self.obj_data = obj_data
                      self.obj_href = obj_href
                      self.obj_verify_href = obj_verify_href
                  def get_store(self, mode=None):
                      return self.current_store
                  def get_auth(self):
                      """returns auth header for re-use in upload/download"""
                      return " ".join(self.auth)
                  def download(self):
                      store = self.get_store()
                      response = None
                      has_errors = None
                      if not store.has_oid():
                          # error reply back to client that something is wrong with dl
                          err_msg = f'object: {store.oid} does not exist in store'
                          has_errors = OrderedDict(
                              error=OrderedDict(
                                  code=404,
                                  message=err_msg
                              )
                          )
                      download_action = OrderedDict(
                          href=self.obj_href,
                          header=OrderedDict([("Authorization", self.get_auth())])
                      )
                      if not has_errors:
                          response = OrderedDict(download=download_action)
                      return response, has_errors
                  def upload(self, skip_existing=True):
                      """
                      Write upload action for git-lfs server
                      """
                      store = self.get_store()
                      response = None
                      has_errors = None
                      # verify if we have the OID before, if we do, reply with empty
                      if store.has_oid():
                          log.debug('LFS: store already has oid %s', store.oid)
                          # validate size
                          store_size = store.size_oid()
                          size_match = store_size == self.obj_size
                          if not size_match:
                              log.warning(
                                  'LFS: size mismatch for oid:%s, in store:%s expected: %s',
                                  self.oid, store_size, self.obj_size)
                          elif skip_existing:
                              log.debug('LFS: skipping further action as oid is existing')
                              return response, has_errors
                      chunked = ("Transfer-Encoding", "chunked")
                      upload_action = OrderedDict(
                          href=self.obj_href,
                          header=OrderedDict([("Authorization", self.get_auth()), chunked])
                      )
                      if not has_errors:
                          response = OrderedDict(upload=upload_action)
                          # if specified in handler, return the verification endpoint
                          if self.obj_verify_href:
                              verify_action = OrderedDict(
                                  href=self.obj_verify_href,
                                  header=OrderedDict([("Authorization", self.get_auth())])
                              )
                              response['verify'] = verify_action
                      return response, has_errors
                  def exec_operation(self, operation, *args, **kwargs):
                      """
                      Call the handler method named ``operation`` and return its result.

                      Extra positional and keyword arguments are passed through. An unknown
                      operation name raises ``AttributeError`` from the attribute lookup.
                      """
                      bound_handler = getattr(self, operation)
                      log.debug('LFS: handling request using %s handler', bound_handler)
                      result = bound_handler(*args, **kwargs)
                      return result
-             class LFSOidStore(object):
+             class LFSOidStore:
                  def __init__(self, oid, repo, store_location=None):
                      self.oid = oid
                      self.repo = repo
                      self.store_path = store_location or self.get_default_store()
                      self.tmp_oid_path = os.path.join(self.store_path, oid + '.tmp')
                      self.oid_path = os.path.join(self.store_path, oid)
                      self.fd = None
                  def get_engine(self, mode):
                      """
                      engine = .get_engine(mode='wb')
                      with engine as f:
                          f.write('...')
                      """
                      class StoreEngine(object):
                          def __init__(self, mode, store_path, oid_path, tmp_oid_path):
                              self.mode = mode
                              self.store_path = store_path
                              self.oid_path = oid_path
                              self.tmp_oid_path = tmp_oid_path
                          def __enter__(self):
                              if not os.path.isdir(self.store_path):
                                  os.makedirs(self.store_path)
                              # TODO(marcink): maybe write metadata here with size/oid ?
                              fd = open(self.tmp_oid_path, self.mode)
                              self.fd = fd
                              return fd
                          def __exit__(self, exc_type, exc_value, traceback):
                              # close tmp file, and rename to final destination
                              self.fd.close()
                              shutil.move(self.tmp_oid_path, self.oid_path)
                      return StoreEngine(
                          mode, self.store_path, self.oid_path, self.tmp_oid_path)
                  def get_default_store(self):
                      """
                      Return the fallback store directory, ``.cache/lfs-store`` under the
                      user's home, in line with Mercurial's largefiles default of
                      /home/username/.cache/largefiles
                      """
                      home_dir = os.path.expanduser("~")
                      default_parts = (home_dir, '.cache', 'lfs-store')
                      return os.path.join(*default_parts)
                  def has_oid(self):
                      return os.path.exists(os.path.join(self.store_path, self.oid))
                  def size_oid(self):
                      size = -1
                      if self.has_oid():
                          oid = os.path.join(self.store_path, self.oid)
                          size = os.stat(oid).st_size
                      return size

vcsserver/git_lfs/tests/test_lfs_app.py

0 +1 -1

              # RhodeCode VCSServer provides access to different vcs backends via network.
              # Copyright (C) 2014-2023 RhodeCode GmbH
              #
              # This program is free software; you can redistribute it and/or modify
              # it under the terms of the GNU General Public License as published by
              # the Free Software Foundation; either version 3 of the License, or
              # (at your option) any later version.
              #
              # This program is distributed in the hope that it will be useful,
              # but WITHOUT ANY WARRANTY; without even the implied warranty of
              # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
              # GNU General Public License for more details.
              #
              # You should have received a copy of the GNU General Public License
              # along with this program; if not, write to the Free Software Foundation,
              # Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301  USA
              import os
              import pytest
              from webtest.app import TestApp as WebObTestApp
              from vcsserver.lib.rc_json import json
              from vcsserver.str_utils import safe_bytes
              from vcsserver.git_lfs.app import create_app
              @pytest.fixture(scope='function')
              def git_lfs_app(tmpdir):
                  """
                  Test client around an LFS-enabled app using ``tmpdir`` as store and the http scheme.
                  """
                  store_dir = str(tmpdir)
                  wsgi_app = create_app(
                      git_lfs_enabled=True,
                      git_lfs_store_path=store_dir,
                      git_lfs_http_scheme='http')
                  custom_app = WebObTestApp(wsgi_app)
                  # tests read the store location back from the client
                  custom_app._store = store_dir
                  return custom_app
              @pytest.fixture(scope='function')
              def git_lfs_https_app(tmpdir):
                  """
                  Test client around an LFS-enabled app using ``tmpdir`` as store and the https scheme.
                  """
                  store_dir = str(tmpdir)
                  wsgi_app = create_app(
                      git_lfs_enabled=True,
                      git_lfs_store_path=store_dir,
                      git_lfs_http_scheme='https')
                  custom_app = WebObTestApp(wsgi_app)
                  # tests read the store location back from the client
                  custom_app._store = store_dir
                  return custom_app
              @pytest.fixture()
              def http_auth():
                  """WSGI environ entries carrying a Basic authorization header."""
                  auth_environ = {'HTTP_AUTHORIZATION': "Basic XXXXX"}
                  return auth_environ
-             class TestLFSApplication(object):
+             class TestLFSApplication:
                  def test_app_wrong_path(self, git_lfs_app):
                      """A path outside the registered LFS routes answers 404."""
                      unknown_url = '/repo/info/lfs/xxx'
                      git_lfs_app.get(unknown_url, status=404)
                  def test_app_deprecated_endpoint(self, git_lfs_app):
                      """The v1 objects endpoint answers 501 with an explanatory message."""
                      v1_url = '/repo/info/lfs/objects'
                      response = git_lfs_app.post(v1_url, status=501)
                      assert response.status_code == 501
                      expected_reply = {'message': 'LFS: v1 api not supported'}
                      assert json.loads(response.text) == expected_reply
                  def test_app_lock_verify_api_not_available(self, git_lfs_app):
                      """The locks/verify endpoint answers 501, locking is not supported."""
                      verify_url = '/repo/info/lfs/locks/verify'
                      response = git_lfs_app.post(verify_url, status=501)
                      assert response.status_code == 501
                      expected_reply = {'message': 'GIT LFS locking api not supported'}
                      assert json.loads(response.text) == expected_reply
                  def test_app_lock_api_not_available(self, git_lfs_app):
                      """The locks endpoint answers 501, locking is not supported."""
                      locks_url = '/repo/info/lfs/locks'
                      response = git_lfs_app.post(locks_url, status=501)
                      assert response.status_code == 501
                      expected_reply = {'message': 'GIT LFS locking api not supported'}
                      assert json.loads(response.text) == expected_reply
                  def test_app_batch_api_missing_auth(self, git_lfs_app):
                      """A batch request without authorization is answered with 403."""
                      batch_url = '/repo/info/lfs/objects/batch'
                      git_lfs_app.post_json(batch_url, params={}, status=403)
                  def test_app_batch_api_unsupported_operation(self, git_lfs_app, http_auth):
                      """A batch request without an operation is rejected with 400."""
                      batch_url = '/repo/info/lfs/objects/batch'
                      response = git_lfs_app.post_json(
                          batch_url, params={}, status=400, extra_environ=http_auth)
                      expected_reply = {'message': 'unsupported operation mode: `None`'}
                      assert json.loads(response.text) == expected_reply
                  def test_app_batch_api_missing_objects(self, git_lfs_app, http_auth):
                      """A batch request without an objects list is rejected with 400."""
                      request_body = {'operation': 'download'}
                      response = git_lfs_app.post_json(
                          '/repo/info/lfs/objects/batch', params=request_body,
                          status=400, extra_environ=http_auth)
                      expected_reply = {'message': 'missing objects data'}
                      assert json.loads(response.text) == expected_reply
                  def test_app_batch_api_unsupported_data_in_objects(
                          self, git_lfs_app, http_auth):
                      """An object entry without oid/size is rejected with 400."""
                      request_body = {
                          'operation': 'download',
                          'objects': [{}],
                      }
                      response = git_lfs_app.post_json(
                          '/repo/info/lfs/objects/batch', params=request_body, status=400,
                          extra_environ=http_auth)
                      expected_reply = {'message': 'unsupported data in objects'}
                      assert json.loads(response.text) == expected_reply
                  def test_app_batch_api_download_missing_object(
                          self, git_lfs_app, http_auth):
                      """Downloading an oid absent from the store reports a per-object 404 error."""
                      request_body = {
                          'operation': 'download',
                          'objects': [{'oid': '123', 'size': '1024'}],
                      }
                      response = git_lfs_app.post_json(
                          '/repo/info/lfs/objects/batch', params=request_body,
                          extra_environ=http_auth)
                      missing_error = {
                          'error': {
                              'code': 404,
                              'message': 'object: 123 does not exist in store'}}
                      expected_reply = {
                          'objects': [
                              {'authenticated': True,
                               'errors': missing_error,
                               'oid': '123',
                               'size': '1024'}
                          ],
                          'transfer': 'basic',
                      }
                      assert json.loads(response.text) == expected_reply
                  def test_app_batch_api_download(self, git_lfs_app, http_auth):
                      """Downloading a stored oid returns a download action with href and auth header."""
                      oid = '456'
                      # put the object into the store first
                      oid_path = os.path.join(git_lfs_app._store, oid)
                      os.makedirs(os.path.dirname(oid_path), exist_ok=True)
                      with open(oid_path, 'wb') as oid_file:
                          oid_file.write(safe_bytes('OID_CONTENT'))
                      request_body = {
                          'operation': 'download',
                          'objects': [{'oid': oid, 'size': '1024'}],
                      }
                      response = git_lfs_app.post_json(
                          '/repo/info/lfs/objects/batch', params=request_body,
                          extra_environ=http_auth)
                      download_action = {
                          'header': {'Authorization': 'Basic XXXXX'},
                          'href': 'http://localhost/repo/info/lfs/objects/456'}
                      expected_reply = {
                          'objects': [
                              {'authenticated': True,
                               'actions': {'download': download_action},
                               'oid': '456',
                               'size': '1024'}
                          ],
                          'transfer': 'basic',
                      }
                      assert json.loads(response.text) == expected_reply
                  def test_app_batch_api_upload(self, git_lfs_app, http_auth):
                      """Uploading a new oid returns upload and verify actions with http hrefs."""
                      request_body = {
                          'operation': 'upload',
                          'objects': [{'oid': '123', 'size': '1024'}],
                      }
                      response = git_lfs_app.post_json(
                          '/repo/info/lfs/objects/batch', params=request_body,
                          extra_environ=http_auth)
                      upload_action = {
                          'header': {'Authorization': 'Basic XXXXX',
                                     'Transfer-Encoding': 'chunked'},
                          'href': 'http://localhost/repo/info/lfs/objects/123'}
                      verify_action = {
                          'header': {'Authorization': 'Basic XXXXX'},
                          'href': 'http://localhost/repo/info/lfs/verify'}
                      expected_reply = {
                          'objects': [
                              {'authenticated': True,
                               'actions': {'upload': upload_action,
                                           'verify': verify_action},
                               'oid': '123',
                               'size': '1024'}
                          ],
                          'transfer': 'basic',
                      }
                      assert json.loads(response.text) == expected_reply
                  def test_app_batch_api_upload_for_https(self, git_lfs_https_app, http_auth):
                      """With the https scheme configured, upload and verify hrefs use https."""
                      request_body = {
                          'operation': 'upload',
                          'objects': [{'oid': '123', 'size': '1024'}],
                      }
                      response = git_lfs_https_app.post_json(
                          '/repo/info/lfs/objects/batch', params=request_body,
                          extra_environ=http_auth)
                      upload_action = {
                          'header': {'Authorization': 'Basic XXXXX',
                                     'Transfer-Encoding': 'chunked'},
                          'href': 'https://localhost/repo/info/lfs/objects/123'}
                      verify_action = {
                          'header': {'Authorization': 'Basic XXXXX'},
                          'href': 'https://localhost/repo/info/lfs/verify'}
                      expected_reply = {
                          'objects': [
                              {'authenticated': True,
                               'actions': {'upload': upload_action,
                                           'verify': verify_action},
                               'oid': '123',
                               'size': '1024'}
                          ],
                          'transfer': 'basic',
                      }
                      assert json.loads(response.text) == expected_reply
                  def test_app_verify_api_missing_data(self, git_lfs_app):
                      """A verify request lacking the size is rejected with 400."""
                      request_body = {'oid': 'missing'}
                      response = git_lfs_app.post_json(
                          '/repo/info/lfs/verify', params=request_body, status=400)
                      expected_reply = {'message': 'missing oid and size in request data'}
                      assert json.loads(response.text) == expected_reply
                  def test_app_verify_api_missing_obj(self, git_lfs_app):
                      """Verifying an oid that is not in the store answers 404."""
                      request_body = {'oid': 'missing', 'size': '1024'}
                      response = git_lfs_app.post_json(
                          '/repo/info/lfs/verify', params=request_body, status=404)
                      expected_reply = {'message': 'oid `missing` does not exists in store'}
                      assert json.loads(response.text) == expected_reply
                  def test_app_verify_api_size_mismatch(self, git_lfs_app):
                      """Verifying a stored oid with a different size answers 422."""
                      oid = 'existing'
                      # store an 11 byte object, then claim it is 1024 bytes
                      oid_path = os.path.join(git_lfs_app._store, oid)
                      os.makedirs(os.path.dirname(oid_path), exist_ok=True)
                      with open(oid_path, 'wb') as oid_file:
                          oid_file.write(safe_bytes('OID_CONTENT'))
                      request_body = {'oid': oid, 'size': '1024'}
                      response = git_lfs_app.post_json(
                          '/repo/info/lfs/verify', params=request_body, status=422)
                      expected_reply = {
                          'message': 'requested file size mismatch store size:11 requested:1024'}
                      assert json.loads(response.text) == expected_reply
                  def test_app_verify_api(self, git_lfs_app):
                      """Verifying a stored oid with the matching size reports ok."""
                      oid = 'existing'
                      oid_path = os.path.join(git_lfs_app._store, oid)
                      os.makedirs(os.path.dirname(oid_path), exist_ok=True)
                      with open(oid_path, 'wb') as oid_file:
                          oid_file.write(safe_bytes('OID_CONTENT'))
                      # 11 is the length of the content written above
                      request_body = {'oid': oid, 'size': 11}
                      response = git_lfs_app.post_json(
                          '/repo/info/lfs/verify', params=request_body)
                      expected_reply = {'message': {'size': 'ok', 'in_store': 'ok'}}
                      assert json.loads(response.text) == expected_reply
                  def test_app_download_api_oid_not_existing(self, git_lfs_app):
                      """Downloading an oid that is not in the store answers 404."""
                      oid = 'missing'
                      download_url = f'/repo/info/lfs/objects/{oid}'
                      response = git_lfs_app.get(download_url, status=404)
                      expected_reply = {
                          'message': 'requested file with oid `missing` not found in store'}
                      assert json.loads(response.text) == expected_reply
                  def test_app_download_api(self, git_lfs_app):
                      """Downloading a stored oid succeeds and yields a response."""
                      oid = 'existing'
                      oid_path = os.path.join(git_lfs_app._store, oid)
                      os.makedirs(os.path.dirname(oid_path), exist_ok=True)
                      with open(oid_path, 'wb') as oid_file:
                          oid_file.write(safe_bytes('OID_CONTENT'))
                      download_url = f'/repo/info/lfs/objects/{oid}'
                      response = git_lfs_app.get(download_url)
                      assert response
                  def test_app_upload(self, git_lfs_app):
                      """Uploading content via PUT reports ok and writes the oid file to the store."""
                      oid = 'uploaded'
                      response = git_lfs_app.put(
                          f'/repo/info/lfs/objects/{oid}', params='CONTENT')
                      assert json.loads(response.text) == {'upload': 'ok'}
                      # verify that we actually wrote that OID
                      oid_path = os.path.join(git_lfs_app._store, oid)
                      assert os.path.isfile(oid_path)
                      # read through a context manager so the file handle is always closed
                      with open(oid_path) as stored:
                          assert 'CONTENT' == stored.read()

vcsserver/git_lfs/tests/test_lib.py

0 +2 -2

              # RhodeCode VCSServer provides access to different vcs backends via network.
              # Copyright (C) 2014-2023 RhodeCode GmbH
              #
              # This program is free software; you can redistribute it and/or modify
              # it under the terms of the GNU General Public License as published by
              # the Free Software Foundation; either version 3 of the License, or
              # (at your option) any later version.
              #
              # This program is distributed in the hope that it will be useful,
              # but WITHOUT ANY WARRANTY; without even the implied warranty of
              # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
              # GNU General Public License for more details.
              #
              # You should have received a copy of the GNU General Public License
              # along with this program; if not, write to the Free Software Foundation,
              # Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301  USA
              import os
              import pytest
              from vcsserver.str_utils import safe_bytes
              from vcsserver.git_lfs.lib import OidHandler, LFSOidStore
              @pytest.fixture()
              def lfs_store(tmpdir):
                  """An ``LFSOidStore`` for oid ``123456789`` of repo ``test``, located in ``tmpdir``."""
                  return LFSOidStore(
                      oid='123456789', repo='test', store_location=str(tmpdir))
              @pytest.fixture()
              def oid_handler(lfs_store):
                  """An ``OidHandler`` wired to ``lfs_store``, with basic auth and local hrefs."""
                  handler = OidHandler(
                      store=lfs_store,
                      repo_name=lfs_store.repo,
                      auth=('basic', 'xxxx'),
                      oid=lfs_store.oid,
                      obj_size='1024',
                      obj_data={},
                      obj_href='http://localhost/handle_oid',
                      obj_verify_href='http://localhost/verify')
                  return handler
-             class TestOidHandler(object):
+             class TestOidHandler:
                  @pytest.mark.parametrize('exec_action', [
                      'download',
                      'upload',
                  ])
                  def test_exec_action(self, exec_action, oid_handler):
                      """
                      Both supported operations dispatch and return a ``(response, errors)`` pair.

                      With the empty store from the fixture, download reports only errors
                      and upload reports only a response.
                      """
                      response, has_errors = oid_handler.exec_operation(exec_action)
                      # a non-empty tuple is always truthy, so inspect the pair itself:
                      # exactly one of response / errors must be set
                      assert (response is None) != (has_errors is None)
                  def test_exec_action_undefined(self, oid_handler):
                      """An operation name with no matching handler method raises AttributeError."""
                      unknown_operation = 'wrong'
                      with pytest.raises(AttributeError):
                          oid_handler.exec_operation(unknown_operation)
                  def test_download_oid_not_existing(self, oid_handler):
                      """Download of an oid missing from the store yields no response and a 404 error."""
                      response, has_errors = oid_handler.exec_operation('download')
                      expected_error = {
                          'code': 404,
                          'message': 'object: 123456789 does not exist in store'}
                      assert response is None
                      assert has_errors['error'] == expected_error
                  def test_download_oid(self, oid_handler):
                      """Download of a stored oid yields the download action and no errors."""
                      store = oid_handler.get_store()
                      os.makedirs(os.path.dirname(store.oid_path), exist_ok=True)
                      with open(store.oid_path, 'wb') as oid_file:
                          oid_file.write(safe_bytes('CONTENT'))
                      response, has_errors = oid_handler.exec_operation('download')
                      expected_action = {
                          'header': {'Authorization': 'basic xxxx'},
                          'href': 'http://localhost/handle_oid'
                      }
                      assert has_errors is None
                      assert response['download'] == expected_action
                  def test_upload_oid_that_exists(self, oid_handler):
                      """Upload of an oid already stored with the expected size yields nothing to do."""
                      store = oid_handler.get_store()
                      os.makedirs(os.path.dirname(store.oid_path), exist_ok=True)
                      with open(store.oid_path, 'wb') as oid_file:
                          oid_file.write(safe_bytes('CONTENT'))
                      # 7 is the length of the content written above
                      oid_handler.obj_size = 7
                      response, has_errors = oid_handler.exec_operation('upload')
                      assert has_errors is None
                      assert response is None
                  def test_upload_oid_that_exists_but_has_wrong_size(self, oid_handler):
                      """Upload of a stored oid whose size differs still yields the upload action."""
                      store = oid_handler.get_store()
                      os.makedirs(os.path.dirname(store.oid_path), exist_ok=True)
                      with open(store.oid_path, 'wb') as oid_file:
                          oid_file.write(safe_bytes('CONTENT'))
                      # stored content is 7 bytes, so this expected size does not match
                      oid_handler.obj_size = 10240
                      response, has_errors = oid_handler.exec_operation('upload')
                      expected_action = {
                          'header': {'Authorization': 'basic xxxx',
                                     'Transfer-Encoding': 'chunked'},
                          'href': 'http://localhost/handle_oid',
                      }
                      assert has_errors is None
                      assert response['upload'] == expected_action
                  def test_upload_oid(self, oid_handler):
                      """Upload of an oid not yet in the store yields the upload action and no errors."""
                      response, has_errors = oid_handler.exec_operation('upload')
                      expected_action = {
                          'header': {'Authorization': 'basic xxxx',
                                     'Transfer-Encoding': 'chunked'},
                          'href': 'http://localhost/handle_oid'
                      }
                      assert has_errors is None
                      assert response['upload'] == expected_action
-             class TestLFSStore(object):
+             class TestLFSStore:
                  def test_write_oid(self, lfs_store):
                      """Writing through the store engine creates the oid file at its final path."""
                      final_path = lfs_store.oid_path
                      assert not os.path.isfile(final_path)
                      with lfs_store.get_engine(mode='wb') as oid_file:
                          oid_file.write(safe_bytes('CONTENT'))
                      assert os.path.isfile(final_path)
                  def test_detect_has_oid(self, lfs_store):
                      """``has_oid()`` is False before the object is written and True afterwards."""
                      assert lfs_store.has_oid() is False
                      with lfs_store.get_engine(mode='wb') as oid_file:
                          oid_file.write(safe_bytes('CONTENT'))
                      assert lfs_store.has_oid() is True

vcsserver/hook_utils/__init__.py

0 +2 -2

              # RhodeCode VCSServer provides access to different vcs backends via network.
              # Copyright (C) 2014-2023 RhodeCode GmbH
              #
              # This program is free software; you can redistribute it and/or modify
              # it under the terms of the GNU General Public License as published by
              # the Free Software Foundation; either version 3 of the License, or
              # (at your option) any later version.
              #
              # This program is distributed in the hope that it will be useful,
              # but WITHOUT ANY WARRANTY; without even the implied warranty of
              # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
              # GNU General Public License for more details.
              #
              # You should have received a copy of the GNU General Public License
              # along with this program; if not, write to the Free Software Foundation,
              # Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301  USA
              import re
              import os
              import sys
              import datetime
              import logging
              import pkg_resources
              import vcsserver
              from vcsserver.str_utils import safe_bytes
              log = logging.getLogger(__name__)
              def get_git_hooks_path(repo_path, bare):
                  """
                  Return the hooks directory of a git repository.
                  :param repo_path: path to repository
                  :param bare: truthy -> ``<repo_path>/hooks``, otherwise ``<repo_path>/.git/hooks``
                  """
                  sub_dirs = ('hooks',) if bare else ('.git', 'hooks')
                  return os.path.join(repo_path, *sub_dirs)
              def install_git_hooks(repo_path, bare, executable=None, force_create=False):
                  """
                  Creates a RhodeCode hook inside a git repository
                  :param repo_path: path to repository
                  :param bare: selects the hooks directory, see ``get_git_hooks_path``
                  :param executable: binary executable to put in the hooks
                      (falls back to ``sys.executable``)
                  :param force_create: Create even if same name hook exists
                  :return: always ``True``; an ``OSError`` while writing is only logged
                  """
                  executable = executable or sys.executable
                  hooks_path = get_git_hooks_path(repo_path, bare)
                  if not os.path.isdir(hooks_path):
                      os.makedirs(hooks_path, mode=0o777, exist_ok=True)
                  # hook templates are shipped as package data and loaded as bytes
                  tmpl_post = pkg_resources.resource_string(
                      'vcsserver', '/'.join(
                          ('hook_utils', 'hook_templates', 'git_post_receive.py.tmpl')))
                  tmpl_pre = pkg_resources.resource_string(
                      'vcsserver', '/'.join(
                          ('hook_utils', 'hook_templates', 'git_pre_receive.py.tmpl')))
                  path = ''  # not used for now
                  timestamp = datetime.datetime.utcnow().isoformat()
                  for h_type, template in [('pre', tmpl_pre), ('post', tmpl_post)]:
                      log.debug('Installing git hook in repo %s', repo_path)
-                     _hook_file = os.path.join(hooks_path, '%s-receive' % h_type)
+                     _hook_file = os.path.join(hooks_path, f'{h_type}-receive')
                      # True when the file is missing or carries an RC_HOOK_VER marker
                      _rhodecode_hook = check_rhodecode_hook(_hook_file)
                      if _rhodecode_hook or force_create:
                          log.debug('writing git %s hook file at %s !', h_type, _hook_file)
                          try:
                              with open(_hook_file, 'wb') as f:
                                  # fill in the template placeholders before writing
                                  template = template.replace(b'_TMPL_', safe_bytes(vcsserver.__version__))
                                  template = template.replace(b'_DATE_', safe_bytes(timestamp))
                                  template = template.replace(b'_ENV_', safe_bytes(executable))
                                  template = template.replace(b'_PATH_', safe_bytes(path))
                                  f.write(template)
                              os.chmod(_hook_file, 0o755)
                          except OSError:
                              # best effort: continue with the next hook type
                              log.exception('error writing hook file %s', _hook_file)
                      else:
                          log.debug('skipping writing hook file')
                  return True
              def get_svn_hooks_path(repo_path):
                  """Return ``<repo_path>/hooks``, the hooks directory of a svn repository."""
                  return os.path.join(repo_path, 'hooks')
              def install_svn_hooks(repo_path, executable=None, force_create=False):
                  """
                  Creates RhodeCode hooks inside a svn repository
                  :param repo_path: path to repository
                  :param executable: binary executable to put in the hooks
                      (falls back to ``sys.executable``)
                  :param force_create: Create even if same name hook exists
                  :return: always ``True``; an ``OSError`` while writing is only logged
                  """
                  executable = executable or sys.executable
                  hooks_path = get_svn_hooks_path(repo_path)
                  if not os.path.isdir(hooks_path):
                      os.makedirs(hooks_path, mode=0o777, exist_ok=True)
                  # hook templates are shipped as package data and loaded as bytes
                  tmpl_post = pkg_resources.resource_string(
                      'vcsserver', '/'.join(
                          ('hook_utils', 'hook_templates', 'svn_post_commit_hook.py.tmpl')))
                  tmpl_pre = pkg_resources.resource_string(
                      'vcsserver', '/'.join(
                          ('hook_utils', 'hook_templates', 'svn_pre_commit_hook.py.tmpl')))
                  path = ''  # not used for now
                  timestamp = datetime.datetime.utcnow().isoformat()
                  for h_type, template in [('pre', tmpl_pre), ('post', tmpl_post)]:
                      log.debug('Installing svn hook in repo %s', repo_path)
-                     _hook_file = os.path.join(hooks_path, '%s-commit' % h_type)
+                     _hook_file = os.path.join(hooks_path, f'{h_type}-commit')
                      # True when the file is missing or carries an RC_HOOK_VER marker
                      _rhodecode_hook = check_rhodecode_hook(_hook_file)
                      if _rhodecode_hook or force_create:
                          log.debug('writing svn %s hook file at %s !', h_type, _hook_file)
                          try:
                              with open(_hook_file, 'wb') as f:
                                  # fill in the template placeholders before writing
                                  template = template.replace(b'_TMPL_', safe_bytes(vcsserver.__version__))
                                  template = template.replace(b'_DATE_', safe_bytes(timestamp))
                                  template = template.replace(b'_ENV_', safe_bytes(executable))
                                  template = template.replace(b'_PATH_', safe_bytes(path))
                                  f.write(template)
                              os.chmod(_hook_file, 0o755)
                          except OSError:
                              # best effort: continue with the next hook type
                              log.exception('error writing hook file %s', _hook_file)
                      else:
                          log.debug('skipping writing hook file')
                  return True
              def get_version_from_hook(hook_path):
                  """
                  Extract the ``RC_HOOK_VER`` value from a hook file.
                  :param hook_path: path to the hook file
                  :return: version as bytes with single quotes removed, ``b''`` when
                      no ``RC_HOOK_VER`` assignment is found
                  """
                  found = re.search(rb'RC_HOOK_VER\s*=\s*(.*)', read_hook_content(hook_path))
                  raw_version = b''
                  if found is not None:
                      try:
                          raw_version = found.group(1)
                          log.debug('got version %s from hooks.', raw_version)
                      except Exception:
                          log.exception("Exception while reading the hook version.")
                  return raw_version.replace(b"'", b"")
              def check_rhodecode_hook(hook_path):
                  """
                  Tell whether the hook file may be (over)written by RhodeCode.
                  A missing file counts as ours; an existing file counts only when a
                  version marker can be read from it.
                  """
                  if os.path.exists(hook_path):
                      log.debug('hook exists, checking if it is from RhodeCode')
                      return bool(get_version_from_hook(hook_path))
                  return True
              def read_hook_content(hook_path) -> bytes:
                  """Return the raw bytes of the hook file, or ``b''`` if it is not a regular file."""
                  if not os.path.isfile(hook_path):
                      return b''
                  with open(hook_path, 'rb') as hook_file:
                      return hook_file.read()
              def get_git_pre_hook_version(repo_path, bare):
                  """Return the version recorded in the git ``pre-receive`` hook of the repository."""
                  hook_file = os.path.join(get_git_hooks_path(repo_path, bare), 'pre-receive')
                  return get_version_from_hook(hook_file)
              def get_git_post_hook_version(repo_path, bare):
                  """Return the version recorded in the git ``post-receive`` hook of the repository."""
                  hook_file = os.path.join(get_git_hooks_path(repo_path, bare), 'post-receive')
                  return get_version_from_hook(hook_file)
              def get_svn_pre_hook_version(repo_path):
                  """Return the version recorded in the svn ``pre-commit`` hook of the repository."""
                  hook_file = os.path.join(get_svn_hooks_path(repo_path), 'pre-commit')
                  return get_version_from_hook(hook_file)
              def get_svn_post_hook_version(repo_path):
                  """Return the version recorded in the svn ``post-commit`` hook of the repository."""
                  hook_file = os.path.join(get_svn_hooks_path(repo_path), 'post-commit')
                  return get_version_from_hook(hook_file)

vcsserver/hooks.py

0 +6 -6

              # RhodeCode VCSServer provides access to different vcs backends via network.
              # Copyright (C) 2014-2023 RhodeCode GmbH
              #
              # This program is free software; you can redistribute it and/or modify
              # it under the terms of the GNU General Public License as published by
              # the Free Software Foundation; either version 3 of the License, or
              # (at your option) any later version.
              #
              # This program is distributed in the hope that it will be useful,
              # but WITHOUT ANY WARRANTY; without even the implied warranty of
              # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
              # GNU General Public License for more details.
              #
              # You should have received a copy of the GNU General Public License
              # along with this program; if not, write to the Free Software Foundation,
              # Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301  USA
              import io
              import os
              import sys
              import logging
              import collections
              import importlib
              import base64
              import msgpack
              import dataclasses
              import pygit2
              import http.client
              import mercurial.scmutil
              import mercurial.node
              from vcsserver.lib.rc_json import json
              from vcsserver import exceptions, subprocessio, settings
              from vcsserver.str_utils import ascii_str, safe_str
              from vcsserver.remote.git_remote import Repository
              log = logging.getLogger(__name__)
-             class HooksHttpClient(object):
+             class HooksHttpClient:
                  # protocol identifier, sent as the "rc-hooks-protocol" request header
                  proto = 'msgpack.v1'
                  # NOTE(review): not referenced by the methods visible in this class
                  connection = None
                  def __init__(self, hooks_uri):
                      """
                      :param hooks_uri: address handed to ``http.client.HTTPConnection``
                          on every hook call
                      """
                      self.hooks_uri = hooks_uri
                  def __repr__(self):
                      return f'{self.__class__}(hook_uri={self.hooks_uri}, proto={self.proto})'
                  def __call__(self, method, extras):
                      """
                      POST a single hook call to ``self.hooks_uri`` and return the
                      msgpack-decoded response.
                      :param method: name of the hook to call
                      :param extras: data sent along with the call
                      :raises Exception: connection and decoding errors are logged and re-raised
                      """
                      # a fresh connection per call; it is always closed in the `finally` below
                      connection = http.client.HTTPConnection(self.hooks_uri)
                      # binary msgpack body
                      headers, body = self._serialize(method, extras)
                      log.debug('Doing a new hooks call using HTTPConnection to %s', self.hooks_uri)
                      try:
                          try:
                              connection.request('POST', '/', body, headers)
                          except Exception as error:
                              log.error('Hooks calling Connection failed on %s, org error: %s', connection.__dict__, error)
                              raise
                          response = connection.getresponse()
                          try:
                              return msgpack.load(response)
                          except Exception:
                              # read whatever is left of the body so it can be logged
                              response_data = response.read()
                              log.exception('Failed to decode hook response json data. '
                                            'response_code:%s, raw_data:%s',
                                            response.status, response_data)
                              raise
                      finally:
                          connection.close()
                  @classmethod
                  def _serialize(cls, hook_name, extras):
                      """
                      Build the request for one hook call.
                      :return: ``(headers, body)`` where body is the msgpack-packed
                          ``{'method': ..., 'extras': ...}`` mapping
                      """
                      payload = msgpack.packb({'method': hook_name, 'extras': extras})
                      request_headers = {"rc-hooks-protocol": cls.proto, "Connection": "keep-alive"}
                      return request_headers, payload
-             class HooksDummyClient(object):
+             class HooksDummyClient:
                  def __init__(self, hooks_module):
                      """
                      :param hooks_module: dotted name of the module to import; ``__call__``
                          uses its ``Hooks`` attribute as a context manager
                      """
                      self._hooks_module = importlib.import_module(hooks_module)
                  def __call__(self, hook_name, extras):
                      with self._hooks_module.Hooks() as hooks:
                          return getattr(hooks, hook_name)(extras)
-             class HooksShadowRepoClient(object):
+             class HooksShadowRepoClient:
                  def __call__(self, hook_name, extras):
                      return {'output': '', 'status': 0}
-             class RemoteMessageWriter(object):
+             class RemoteMessageWriter:
                  """Writer base class."""
                  def write(self, message):
                      """Send ``message`` to the client; subclasses must override this."""
                      raise NotImplementedError()
              class HgMessageWriter(RemoteMessageWriter):
                  """Writer that knows how to send messages to mercurial clients."""
                  def __init__(self, ui):
                      """
                      :param ui: mercurial ui object used to emit status messages
                      """
                      self.ui = ui
                  def write(self, message: str):
                      """
                      Send ``message`` (utf-8 encoded) through ``ui.status``.
                      The ``quiet`` flag is switched off only for the duration of the call.
                      """
                      # TODO: Check why the quiet flag is set by default.
                      old = self.ui.quiet
                      self.ui.quiet = False
                      try:
                          self.ui.status(message.encode('utf-8'))
                      finally:
                          # restore the flag even when status() raises
                          self.ui.quiet = old
              class GitMessageWriter(RemoteMessageWriter):
                  """Writer that knows how to send messages to git clients."""
                  def __init__(self, stdout=None):
                      """
                      :param stdout: stream receiving the messages, ``sys.stdout`` when falsy
                      """
                      self.stdout = stdout if stdout else sys.stdout
                  def write(self, message: str):
                      """Write ``message`` unchanged to the configured stream."""
                      target = self.stdout
                      target.write(message)
              class SvnMessageWriter(RemoteMessageWriter):
                  """Writer that knows how to send messages to svn clients."""
                  def __init__(self, stderr=None):
                      """
                      :param stderr: stream receiving the messages, ``sys.stderr`` when falsy
                      """
                      # SVN needs data sent to stderr for back-to-client messaging
                      self.stderr = stderr or sys.stderr
                  def write(self, message):
                      """
                      Write ``message`` to the configured stream.
                      Text streams (such as the default ``sys.stderr``) receive the
                      str as-is, because they reject bytes with a ``TypeError``; any
                      other stream receives the utf-8 encoded bytes as before.
                      """
                      if isinstance(self.stderr, io.TextIOBase):
                          self.stderr.write(message)
                      else:
                          self.stderr.write(message.encode('utf-8'))
              def _handle_exception(result):
                  """
                  Re-raise an exception reported in a hook call result.
                  :param result: mapping returned by the hooks client; the keys
                      ``exception``, ``exception_traceback`` and ``exception_args`` are read
                  :raises Exception: a vcsserver exception for known exception names,
                      a plain ``Exception`` for any other non-empty name
                  """
                  remote_exc = result.get('exception')
                  remote_tb = result.get('exception_traceback')
                  log.debug('Handling hook-call exception: %s', remote_exc)
                  if remote_tb:
                      log.error('Got traceback from remote call:%s', remote_tb)
                  if not remote_exc:
                      # nothing was reported by the remote side
                      return
                  if remote_exc == 'HTTPLockedRC':
                      raise exceptions.RepositoryLockedException()(*result['exception_args'])
                  if remote_exc == 'HTTPBranchProtected':
                      raise exceptions.RepositoryBranchProtectedException()(*result['exception_args'])
                  if remote_exc == 'RepositoryError':
                      raise exceptions.VcsException()(*result['exception_args'])
                  raise Exception(
                      f"""Got remote exception "{remote_exc}" with args "{result['exception_args']}" """
                  )
              def _get_hooks_client(extras):
                  """
                  Pick the hooks client for a call: HTTP when ``hooks_uri`` is set,
                  the no-op shadow-repo client when ``is_shadow_repo`` is set,
                  otherwise the in-process client built from ``hooks_module``.
                  """
                  uri = extras.get('hooks_uri')
                  shadow_repo = extras.get('is_shadow_repo')
                  if uri:
                      return HooksHttpClient(uri)
                  if shadow_repo:
                      return HooksShadowRepoClient()
                  return HooksDummyClient(extras['hooks_module'])
              def _call_hook(hook_name, extras, writer):
                  """
                  Run one hook through the matching client.
                  The result's ``output`` is passed to ``writer.write``.
                  :return: the ``status`` entry of the hook result
                  """
                  client = _get_hooks_client(extras)
                  log.debug('Hooks, using client:%s', client)
                  hook_result = client(hook_name, extras)
                  log.debug('Hooks got result: %s', hook_result)
                  # raises when the remote side reported an exception
                  _handle_exception(hook_result)
                  writer.write(hook_result['output'])
                  return hook_result['status']
              def _extras_from_ui(ui):
                  """
                  Load the ``RC_SCM_DATA`` json payload, taken from the ui config
                  section ``rhodecode`` or, when empty there, from the environment.
                  :return: decoded extras, ``{}`` when no payload is available
                  """
                  # maybe it's inside environ ?
                  payload = ui.config(b'rhodecode', b'RC_SCM_DATA') or os.environ.get('RC_SCM_DATA')
                  return json.loads(payload) if payload else {}
              def _rev_range_hash(repo, node, check_heads=False):
                  """
                  Collect ``(commit_id, branch)`` for every revision from ``node``
                  up to the end of the repository.
                  :param check_heads: when truthy also run ``_check_heads`` on that range
                  :return: ``(commits, parent_heads)``; ``parent_heads`` is ``[]``
                      unless ``check_heads`` is set
                  """
                  from vcsserver.hgcompat import get_ctx
                  first_rev = get_ctx(repo, node).rev()
                  repo_len = len(repo)
                  rev_numbers = list(range(first_rev, repo_len))

                  def _describe(rev):
                      ctx = get_ctx(repo, rev)
                      return ascii_str(mercurial.node.hex(ctx.node())), safe_str(ctx.branch())

                  commit_pairs = [_describe(rev) for rev in rev_numbers]
                  heads = _check_heads(repo, first_rev, repo_len, rev_numbers) if check_heads else []
                  return commit_pairs, heads
              def _check_heads(repo, start, end, commits):
                  """
                  Look for a pre-existing parent of the new revisions that ends up
                  with more than one head on its own branch.
                  :param repo: mercurial repository
                  :param start: first new revision number
                  :param end: upper bound (exclusive) of revision numbers to scan
                  :param commits: revision numbers of the new changesets
                      (``_rev_range_hash`` passes its ``revs`` list here)
                  :return: list of head revision numbers for the first such parent,
                      ``[]`` when none is found
                  """
                  from vcsserver.hgcompat import get_ctx
                  changelog = repo.changelog
                  # parents of the new revisions that existed before `start`
                  parents = set()
                  for new_rev in commits:
                      for p in changelog.parentrevs(new_rev):
                          if p == mercurial.node.nullrev:
                              continue
                          if p < start:
                              parents.add(p)
                  for p in parents:
                      branch = get_ctx(repo, p).branch()
                      # The heads descending from that parent, on the same branch
                      parent_heads = {p}
                      reachable = {p}
                      for x in range(p + 1, end):
                          if get_ctx(repo, x).branch() != branch:
                              continue
                          for pp in changelog.parentrevs(x):
                              if pp in reachable:
                                  # x descends from p: it replaces its parent as a head
                                  reachable.add(x)
                                  parent_heads.discard(pp)
                                  parent_heads.add(x)
                      # More than one head? Suggest merging
                      if len(parent_heads) > 1:
                          return list(parent_heads)
                  return []
              def _get_git_env():
                  """
                  Return the process environment variables whose name starts with
                  ``GIT`` as a list of ``(name, value)`` pairs (serialized version).
                  """
                  return [
                      (name, value)
                      for name, value in os.environ.items()
                      if name.startswith('GIT')
                  ]
              def _get_hg_env(old_rev, new_rev, txnid, repo_path):
                  """
                  Return the ``HG*`` environment variables of the process, with
                  ``HG_NODE``, ``HG_NODE_LAST``, ``HG_TXNID`` and ``HG_PENDING`` set from
                  the arguments, as a list of ``(name, value)`` pairs.
                  """
                  hg_env = {
                      name: value
                      for name, value in os.environ.items()
                      if name.startswith('HG')
                  }
                  hg_env.update(
                      HG_NODE=old_rev,
                      HG_NODE_LAST=new_rev,
                      HG_TXNID=txnid,
                      HG_PENDING=repo_path,
                  )
                  return list(hg_env.items())
              def repo_size(ui, repo, **kwargs):
                  """Mercurial hook: forward a ``repo_size`` call and return its status."""
                  return _call_hook('repo_size', _extras_from_ui(ui), HgMessageWriter(ui))
              def pre_pull(ui, repo, **kwargs):
                  """Mercurial hook: forward a ``pre_pull`` call and return its status."""
                  return _call_hook('pre_pull', _extras_from_ui(ui), HgMessageWriter(ui))
              def pre_pull_ssh(ui, repo, **kwargs):
                  """Run ``pre_pull`` only when the extras carry a truthy ``SSH`` entry; else return 0."""
                  extras = _extras_from_ui(ui)
                  if not (extras and extras.get('SSH')):
                      return 0
                  return pre_pull(ui, repo, **kwargs)
              def post_pull(ui, repo, **kwargs):
                  """Mercurial hook: forward a ``post_pull`` call and return its status."""
                  return _call_hook('post_pull', _extras_from_ui(ui), HgMessageWriter(ui))
              def post_pull_ssh(ui, repo, **kwargs):
                  """Run ``post_pull`` only when the extras carry a truthy ``SSH`` entry; else return 0."""
                  extras = _extras_from_ui(ui)
                  if not (extras and extras.get('SSH')):
                      return 0
                  return post_pull(ui, repo, **kwargs)
              def pre_push(ui, repo, node=None, **kwargs):
                  """
                  Mercurial pre_push hook
                  :param ui: mercurial ui object, also the source of the RC_SCM_DATA extras
                  :param repo: mercurial repository
                  :param node: first incoming changeset; per-branch data is only
                      collected when it is set and the hook type is ``pretxnchangegroup``
                  :param kwargs: hook arguments; ``hooktype``, ``node_last`` and ``txnid`` are read
                  :return: status returned by the ``pre_push`` hook call
                  """
                  extras = _extras_from_ui(ui)
                  detect_force_push = extras.get('detect_force_push')
                  rev_data = []
                  hook_type: str = safe_str(kwargs.get('hooktype'))
                  if node and hook_type == 'pretxnchangegroup':
                      # group the incoming commit ids by branch
                      branches = collections.defaultdict(list)
                      commits, _heads = _rev_range_hash(repo, node, check_heads=detect_force_push)
                      for commit_id, branch in commits:
                          branches[branch].append(commit_id)
                      # NOTE: `commits` is rebound here to the per-branch commit id list
                      for branch, commits in branches.items():
                          old_rev = ascii_str(kwargs.get('node_last')) or commits[0]
                          rev_data.append({
                              'total_commits': len(commits),
                              'old_rev': old_rev,
                              'new_rev': commits[-1],
                              'ref': '',
                              'type': 'branch',
                              'name': branch,
                          })
                      for push_ref in rev_data:
                          # the same heads list is attached to every pushed branch
                          push_ref['multiple_heads'] = _heads
                          repo_path = os.path.join(
                              extras.get('repo_store', ''), extras.get('repository', ''))
                          push_ref['hg_env'] = _get_hg_env(
                              old_rev=push_ref['old_rev'],
                              new_rev=push_ref['new_rev'], txnid=ascii_str(kwargs.get('txnid')),
                              repo_path=repo_path)
                  extras['hook_type'] = hook_type or 'pre_push'
                  extras['commit_ids'] = rev_data
                  return _call_hook('pre_push', extras, HgMessageWriter(ui))
              def pre_push_ssh(ui, repo, node=None, **kwargs):
                  """Run ``pre_push`` only when the extras carry a truthy ``SSH`` entry; else return 0."""
                  if not _extras_from_ui(ui).get('SSH'):
                      return 0
                  return pre_push(ui, repo, node, **kwargs)
              def pre_push_ssh_auth(ui, repo, node=None, **kwargs):
                  """
                  Mercurial pre_push hook for SSH
                  :return: 0 for non-SSH calls and for SSH calls whose ``SSH_PERMISSIONS``
                      is ``repository.write`` or ``repository.admin``, otherwise 1
                  """
                  extras = _extras_from_ui(ui)
                  if not extras.get('SSH'):
                      return 0
                  push_allowed = extras['SSH_PERMISSIONS'] in ('repository.write', 'repository.admin')
                  # non-zero ret code rejects the push
                  return 0 if push_allowed else 1
              def post_push(ui, repo, node, **kwargs):
                  """
                  Mercurial post_push hook
                  Sends the pushed commit ids plus the branches and bookmarks they
                  touch (tags are always sent empty) to the ``post_push`` hook.
                  :return: status returned by the hook call
                  """
                  extras = _extras_from_ui(ui)
                  hook_type: str = safe_str(kwargs.get('hooktype'))
                  pushed, _heads = _rev_range_hash(repo, node)
                  commit_ids = []
                  branch_names = []
                  for commit_id, branch in pushed:
                      commit_ids.append(commit_id)
                      if branch not in branch_names:
                          branch_names.append(branch)
                  # set by key_push when bookmarks were pushed
                  pushed_bookmarks = getattr(ui, '_rc_pushkey_bookmarks', [])
                  extras['hook_type'] = hook_type or 'post_push'
                  extras['commit_ids'] = commit_ids
                  extras['new_refs'] = {
                      'branches': branch_names,
                      'bookmarks': pushed_bookmarks,
                      'tags': [],
                  }
                  return _call_hook('post_push', extras, HgMessageWriter(ui))
              def post_push_ssh(ui, repo, node, **kwargs):
                  """
                  Mercurial post_push hook for SSH
                  Runs ``post_push`` only when the extras carry a truthy ``SSH`` entry.
                  """
                  over_ssh = _extras_from_ui(ui).get('SSH')
                  if not over_ssh:
                      return 0
                  return post_push(ui, repo, node, **kwargs)
              def key_push(ui, repo, **kwargs):
                  """
                  Remember pushed bookmarks on the ui object so that ``post_push``
                  can report them. Only acts on the ``bookmarks`` namespace when
                  ``new`` is not ``b'0'``.
                  """
                  from vcsserver.hgcompat import get_ctx
                  if kwargs['new'] == b'0' or kwargs['namespace'] != b'bookmarks':
                      return None
                  # store new bookmarks in our UI object propagated later to post_push
                  ui._rc_pushkey_bookmarks = get_ctx(repo, kwargs['key']).bookmarks()
                  return None
              # backward compat: former hook name, now an alias of post_pull
              log_pull_action = post_pull
              # backward compat: former hook name, now an alias of post_push
              log_push_action = post_push
              def handle_git_pre_receive(unused_repo_path, unused_revs, unused_env):
                  """
                  Old hook name: keep here for backward compatibility.
                  This is only required when the installed git hooks are not upgraded.
                  Intentionally does nothing.
                  """
                  return None
              def handle_git_post_receive(unused_repo_path, unused_revs, unused_env):
                  """
                  Old hook name: keep here for backward compatibility.
                  This is only required when the installed git hooks are not upgraded.
                  Intentionally does nothing.
                  """
                  return None
              @dataclasses.dataclass
              class HookResponse:
                  """Result of a git pull hook: exit status plus the text captured for the client."""
                  # 0 for success; the pull hooks use 128 when the hook call raised
                  status: int
                  # output collected while the hook ran
                  output: str
              def git_pre_pull(extras) -> HookResponse:
                  """
                  Pre pull hook.
                  :param extras: dictionary containing the keys defined in simplevcs
                  :type extras: dict
                  :return: hook status (0 for success, 128 when the call failed)
                      together with the captured output
                  :rtype: HookResponse
                  """
                  if 'pull' not in extras['hooks']:
                      return HookResponse(0, '')
                  captured = io.StringIO()
                  try:
                      status = _call_hook('pre_pull', extras, GitMessageWriter(captured))
                  except Exception as error:
                      log.exception('Failed to call pre_pull hook')
                      status = 128
                      captured.write(f'ERROR: {error}\n')
                  return HookResponse(status=status, output=captured.getvalue())
              def git_post_pull(extras) -> HookResponse:
                  """
                  Post pull hook.
                  :param extras: dictionary containing the keys defined in simplevcs
                  :type extras: dict
                  :return: hook status (0 for success, 128 when the call failed)
                      together with the captured output
                  :rtype: HookResponse
                  """
                  if 'pull' not in extras['hooks']:
                      return HookResponse(0, '')
                  stdout = io.StringIO()
                  try:
                      status = _call_hook('post_pull', extras, GitMessageWriter(stdout))
                  except Exception as error:
                      # keep the traceback in the server log, same as git_pre_pull
                      log.exception('Failed to call post_pull hook')
                      status = 128
                      stdout.write(f'ERROR: {error}\n')
                  return HookResponse(status, stdout.getvalue())
              def _parse_git_ref_lines(revision_lines):
                  """
                  Parse ``<old_rev> <new_rev> <ref>`` lines into push-ref dictionaries.
                  Only refs whose second path component is ``tags`` or ``heads`` are kept.
                  :param revision_lines: iterable of lines, may be ``None``
                  :return: list of dicts with keys ``total_commits``, ``old_rev``,
                      ``new_rev``, ``ref``, ``type`` and ``name``
                  """
                  parsed = []
                  for line in revision_lines or []:
                      old_rev, new_rev, ref = line.strip().split(' ')
                      ref_parts = ref.split('/', 2)
                      ref_kind = ref_parts[1]
                      if ref_kind not in ('tags', 'heads'):
                          continue
                      # NOTE(marcink):
                      # total_commits cannot be determined for git at this point; the
                      # key is still set so every entry carries the same set of keys
                      parsed.append(dict(
                          total_commits=-1,
                          old_rev=old_rev,
                          new_rev=new_rev,
                          ref=ref,
                          type=ref_kind,
                          name=ref_parts[2],
                      ))
                  return parsed
              def git_pre_receive(unused_repo_path, revision_lines, env) -> int:
                  """
                  Pre push hook.
                  :param unused_repo_path: not used
                  :param revision_lines: ``<old_rev> <new_rev> <ref>`` lines of the push
                  :param env: mapping holding the json encoded ``RC_SCM_DATA`` extras
                  :return: status code of the hook. 0 for success.
                  """
                  extras = json.loads(env['RC_SCM_DATA'])
                  # NOTE: the lines are parsed even when the push hook turns out to be disabled
                  rev_data = _parse_git_ref_lines(revision_lines)
                  if 'push' not in extras['hooks']:
                      return 0
                  # all-zero id: marks a created ref (as old_rev) or a deleted ref (as new_rev)
                  empty_commit_id = '0' * 40
                  detect_force_push = extras.get('detect_force_push')
                  for push_ref in rev_data:
                      # store our git-env which holds the temp store
                      push_ref['git_env'] = _get_git_env()
                      push_ref['pruned_sha'] = ''
                      if not detect_force_push:
                          # don't check for forced-push when we don't need to
                          continue
                      type_ = push_ref['type']
                      new_branch = push_ref['old_rev'] == empty_commit_id
                      delete_branch = push_ref['new_rev'] == empty_commit_id
                      if type_ == 'heads' and not (new_branch or delete_branch):
                          old_rev = push_ref['old_rev']
                          new_rev = push_ref['new_rev']
                          # commits reachable from old_rev but not from new_rev
                          cmd = [settings.GIT_EXECUTABLE, 'rev-list', old_rev, f'^{new_rev}']
                          stdout, stderr = subprocessio.run_command(
                              cmd, env=os.environ.copy())
                          # means we're having some non-reachable objects, this forced push was used
                          if stdout:
                              push_ref['pruned_sha'] = stdout.splitlines()
                  extras['hook_type'] = 'pre_receive'
                  extras['commit_ids'] = rev_data
                  stdout = sys.stdout
                  status_code = _call_hook('pre_push', extras, GitMessageWriter(stdout))
                  return status_code
              def git_post_receive(unused_repo_path, revision_lines, env) -> int:
                  """
                  Post push hook.

                  Walks the pushed refs described by ``revision_lines``, collects the
                  affected commit ids plus the names of new/updated branches and pushed
                  tags, and hands them to the ``post_push`` hook. The ``repo_size`` hook
                  is called first when it is listed in ``extras['hooks']``.

                  :param unused_repo_path: not used by this hook.
                  :param revision_lines: ref update lines, parsed by ``_parse_git_ref_lines``.
                  :param env: mapping holding the JSON encoded extras under ``RC_SCM_DATA``.
                  :return: status code of the hook. 0 for success.
                  """
                  extras = json.loads(env['RC_SCM_DATA'])
                  if 'push' not in extras['hooks']:
                      return 0

                  rev_data = _parse_git_ref_lines(revision_lines)
                  git_revs = []
                  # N.B.(skreft): it is ok to just call git, as git before calling a
                  # subcommand sets the PATH environment variable so that it points to the
                  # correct version of the git executable.
                  empty_commit_id = '0' * 40
                  branches = []
                  tags = []
                  for push_ref in rev_data:
                      type_ = push_ref['type']
                      if type_ == 'heads':
                          # starting new branch case
                          if push_ref['old_rev'] == empty_commit_id:
                              push_ref_name = push_ref['name']
                              if push_ref_name not in branches:
                                  branches.append(push_ref_name)

                              # when HEAD cannot be resolved, point it at the branch being pushed
                              need_head_set = ''
                              with Repository(os.getcwd()) as repo:
                                  try:
                                      repo.head
                                  except pygit2.GitError:
                                      need_head_set = f'refs/heads/{push_ref_name}'
                                  if need_head_set:
                                      repo.set_head(need_head_set)
                                      print(f"Setting default branch to {push_ref_name}")

                              cmd = [settings.GIT_EXECUTABLE, 'for-each-ref', '--format=%(refname)', 'refs/heads/*']
                              stdout, _stderr = subprocessio.run_command(
                                  cmd, env=os.environ.copy())
                              heads = safe_str(stdout)
                              # drop the ref being pushed from the listing; fall back to '.'
                              # when no other head is left
                              heads = heads.replace(push_ref['ref'], '')
                              heads = ' '.join(head for head
                                               in heads.splitlines() if head) or '.'
                              cmd = [settings.GIT_EXECUTABLE, 'log', '--reverse',
                                     '--pretty=format:%H', '--', push_ref['new_rev'],
                                     '--not', heads]
                              stdout, _stderr = subprocessio.run_command(
                                  cmd, env=os.environ.copy())
                              git_revs.extend(list(map(ascii_str, stdout.splitlines())))
                          # delete branch case
                          elif push_ref['new_rev'] == empty_commit_id:
                              git_revs.append(f'delete_branch=>{push_ref["name"]}')
                          else:
                              if push_ref['name'] not in branches:
                                  branches.append(push_ref['name'])
                              cmd = [settings.GIT_EXECUTABLE, 'log',
                                     f'{push_ref["old_rev"]}..{push_ref["new_rev"]}',
                                     '--reverse', '--pretty=format:%H']
                              stdout, _stderr = subprocessio.run_command(
                                  cmd, env=os.environ.copy())
                              # we get bytes from stdout, we need str to be consistent
                              log_revs = list(map(ascii_str, stdout.splitlines()))
                              git_revs.extend(log_revs)
                              # NOTE: a pure pygit2 walk from new_rev back to old_rev was tried
                              # here, but it was still 2-3x slower than calling `git log`.
                      elif type_ == 'tags':
                          if push_ref['name'] not in tags:
                              tags.append(push_ref['name'])
                          git_revs.append(f'tag=>{push_ref["name"]}')

                  extras['hook_type'] = 'post_receive'
                  extras['commit_ids'] = git_revs
                  extras['new_refs'] = {
                      'branches': branches,
                      'bookmarks': [],
                      'tags': tags,
                  }

                  hook_stream = sys.stdout
                  if 'repo_size' in extras['hooks']:
                      try:
                          _call_hook('repo_size', extras, GitMessageWriter(hook_stream))
                      except Exception:
                          # best effort: a failing repo_size hook must not fail the push,
                          # but the failure should still be visible in the logs
                          log.exception('Failed to call repo_size hook')
                  status_code = _call_hook('post_push', extras, GitMessageWriter(hook_stream))
                  return status_code
              def _get_extras_from_txn_id(path, txn_id):
                  """
                  Read the hook extras stored on a pending Subversion transaction.

                  Runs ``svnlook pget -t <txn_id> --revprop <path> rc-scm-extras`` and
                  decodes its output as url-safe base64 wrapped JSON.

                  :param path: repository path handed to ``svnlook``.
                  :param txn_id: transaction id handed to ``svnlook -t``.
                  :return: the decoded extras, or an empty dict when any step fails
                      (the failure is logged, never raised).
                  """
                  try:
                      svnlook_cmd = [
                          settings.SVNLOOK_EXECUTABLE, 'pget',
                          '-t', txn_id,
                          '--revprop', path, 'rc-scm-extras',
                      ]
                      raw_extras, _stderr = subprocessio.run_command(
                          svnlook_cmd, env=os.environ.copy())
                      return json.loads(base64.urlsafe_b64decode(raw_extras))
                  except Exception:
                      log.exception('Failed to extract extras info from txn_id')
                  return {}
              def _get_extras_from_commit_id(commit_id, path):
                  """
                  Read the hook extras stored on an already committed Subversion revision.

                  Runs ``svnlook pget -r <commit_id> --revprop <path> rc-scm-extras`` and
                  decodes its output as url-safe base64 wrapped JSON. Note the argument
                  order: the revision comes first, the repository path second.

                  :param commit_id: revision handed to ``svnlook -r``.
                  :param path: repository path handed to ``svnlook``.
                  :return: the decoded extras, or an empty dict when any step fails
                      (the failure is logged, never raised).
                  """
                  try:
                      svnlook_cmd = [
                          settings.SVNLOOK_EXECUTABLE, 'pget',
                          '-r', commit_id,
                          '--revprop', path, 'rc-scm-extras',
                      ]
                      raw_extras, _stderr = subprocessio.run_command(
                          svnlook_cmd, env=os.environ.copy())
                      return json.loads(base64.urlsafe_b64decode(raw_extras))
                  except Exception:
                      log.exception('Failed to extract extras info from commit_id')
                  return {}
              def svn_pre_commit(repo_path, commit_data, env):
                  """
                  Subversion pre-commit hook entry point.

                  :param repo_path: not used by this hook.
                  :param commit_data: ``(path, txn_id)`` pair.
                  :param env: mapping that may carry the JSON encoded extras under
                      ``RC_SCM_DATA``; when it does not, the extras are read from the
                      transaction itself.
                  :return: 0 when no extras could be found, otherwise the result of the
                      ``pre_push`` hook call.
                  """
                  path, txn_id = commit_data

                  scm_data = env.get('RC_SCM_DATA')
                  if scm_data:
                      extras = json.loads(scm_data)
                  else:
                      # fallback method to read from TXN-ID stored data
                      extras = _get_extras_from_txn_id(path, txn_id)
                      if not extras:
                          return 0

                  extras.update({
                      'hook_type': 'pre_commit',
                      'commit_ids': [txn_id],
                      'txn_id': txn_id,
                      'new_refs': {
                          'total_commits': 1,
                          'branches': [],
                          'bookmarks': [],
                          'tags': [],
                      },
                  })
                  return _call_hook('pre_push', extras, SvnMessageWriter())
              def svn_post_commit(repo_path, commit_data, env):
                  """
                  Subversion post-commit hook entry point.

                  :param repo_path: not used by this hook.
                  :param commit_data: ``(path, rev, txn_id)``, or the legacy
                      ``(path, rev)`` form in which case ``txn_id`` is treated as ``None``.
                  :param env: mapping that may carry the JSON encoded extras under
                      ``RC_SCM_DATA``; when it does not, the extras are read from the
                      committed revision.
                  :return: 0 when no extras could be found, otherwise the result of the
                      ``post_push`` hook call.
                  :raises ValueError: when ``commit_data`` has neither 2 nor 3 items.
                  """
                  if len(commit_data) == 3:
                      path, commit_id, txn_id = commit_data
                  elif len(commit_data) == 2:
                      log.error('Failed to extract txn_id from commit_data using legacy method. '
                                'Some functionality might be limited')
                      path, commit_id = commit_data
                      txn_id = None
                  else:
                      # previously this fell through and failed later with an unbound local
                      raise ValueError(
                          'commit_data must be (path, rev) or (path, rev, txn_id), '
                          f'got {len(commit_data)} items')

                  branches = []
                  tags = []
                  if env.get('RC_SCM_DATA'):
                      extras = json.loads(env['RC_SCM_DATA'])
                  else:
                      # fallback method to read from the committed revision's stored data
                      extras = _get_extras_from_commit_id(commit_id, path)
                      if not extras:
                          return 0

                  extras['hook_type'] = 'post_commit'
                  extras['commit_ids'] = [commit_id]
                  extras['txn_id'] = txn_id
                  extras['new_refs'] = {
                      'branches': branches,
                      'bookmarks': [],
                      'tags': tags,
                      'total_commits': 1,
                  }

                  if 'repo_size' in extras['hooks']:
                      try:
                          _call_hook('repo_size', extras, SvnMessageWriter())
                      except Exception:
                          # best effort: a failing repo_size hook must not fail the commit,
                          # but the failure should still be visible in the logs
                          log.exception('Failed to call repo_size hook')
                  return _call_hook('post_push', extras, SvnMessageWriter())

vcsserver/http_main.py

0 +5 -5

              # RhodeCode VCSServer provides access to different vcs backends via network.
              # Copyright (C) 2014-2023 RhodeCode GmbH
              #
              # This program is free software; you can redistribute it and/or modify
              # it under the terms of the GNU General Public License as published by
              # the Free Software Foundation; either version 3 of the License, or
              # (at your option) any later version.
              #
              # This program is distributed in the hope that it will be useful,
              # but WITHOUT ANY WARRANTY; without even the implied warranty of
              # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
              # GNU General Public License for more details.
              #
              # You should have received a copy of the GNU General Public License
              # along with this program; if not, write to the Free Software Foundation,
              # Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301  USA
              import io
              import os
              import platform
              import sys
              import locale
              import logging
              import uuid
              import time
              import wsgiref.util
              import tempfile
              import psutil
              from itertools import chain
              import msgpack
              import configparser
              from pyramid.config import Configurator
              from pyramid.wsgi import wsgiapp
              from pyramid.response import Response
              from vcsserver.base import BytesEnvelope, BinaryEnvelope
              from vcsserver.lib.rc_json import json
              from vcsserver.config.settings_maker import SettingsMaker
              from vcsserver.str_utils import safe_int
              from vcsserver.lib.statsd_client import StatsdClient
              from vcsserver.tweens.request_wrapper import get_headers_call_context
              import vcsserver
              from vcsserver import remote_wsgi, scm_app, settings, hgpatches
              from vcsserver.git_lfs.app import GIT_LFS_CONTENT_TYPE, GIT_LFS_PROTO_PAT
              from vcsserver.echo_stub import remote_wsgi as remote_wsgi_stub
              from vcsserver.echo_stub.echo_app import EchoApp
              from vcsserver.exceptions import HTTPRepoLocked, HTTPRepoBranchProtected
              from vcsserver.lib.exc_tracking import store_exception, format_exc
              from vcsserver.server import VcsServer
              # When True, an ImportError from any backend import below is re-raised
              # instead of being tolerated.
              strict_vcs = True
              # Each guarded import records its ImportError (if any) and sets the
              # factory/remote names to None, so later code can test them for truthiness.
              git_import_err = None
              try:
                  from vcsserver.remote.git_remote import GitFactory, GitRemote
              except ImportError as e:
                  GitFactory = None
                  GitRemote = None
                  git_import_err = e
                  if strict_vcs:
                      raise
              hg_import_err = None
              try:
                  from vcsserver.remote.hg_remote import MercurialFactory, HgRemote
              except ImportError as e:
                  MercurialFactory = None
                  HgRemote = None
                  hg_import_err = e
                  if strict_vcs:
                      raise
              svn_import_err = None
              try:
                  from vcsserver.remote.svn_remote import SubversionFactory, SvnRemote
              except ImportError as e:
                  SubversionFactory = None
                  SvnRemote = None
                  svn_import_err = e
                  if strict_vcs:
                      raise
              log = logging.getLogger(__name__)
              # Due to Mercurial/glibc 2.27 problems we need to detect whether the locale
              # settings cause problems; when they do, log the error and fall back to
              # LC_ALL=C via the process environment.
              try:
                  locale.setlocale(locale.LC_ALL, '')
              except locale.Error as e:
                  log.error(
                      'LOCALE ERROR: failed to set LC_ALL, fallback to LC_ALL=C, org error: %s', e)
                  os.environ['LC_ALL'] = 'C'
              def _is_request_chunked(environ):
                  """
                  Tell whether the WSGI ``environ`` declares a chunked request body.

                  :return: True only when ``HTTP_TRANSFER_ENCODING`` is exactly ``'chunked'``.
                  """
                  return environ.get('HTTP_TRANSFER_ENCODING', '') == 'chunked'
              def log_max_fd():
                  """
                  Log the second element of this process' ``RLIMIT_NOFILE`` limits as
                  reported by psutil (presumably the hard limit — confirm against the
                  psutil documentation).

                  Purely informational: any failure is ignored on purpose.
                  """
                  try:
                      nofile_limits = psutil.Process().rlimit(psutil.RLIMIT_NOFILE)
                      log.info('Max file descriptors value: %s', nofile_limits[1])
                  except Exception:
                      # best effort only, never fail because the limit cannot be read
                      pass
-             class VCS(object):
+             class VCS:
                  def __init__(self, locale_conf=None, cache_config=None):
                      """
                      Configure the locale and create one remote object per available backend.

                      A backend whose factory/remote import failed is only logged; its
                      ``_<backend>_remote`` attribute is then not set at all.

                      :param locale_conf: locale name passed on to ``_configure_locale``.
                      :param cache_config: stored on the instance as ``cache_config``.
                      """
                      self.locale = locale_conf
                      self.cache_config = cache_config
                      self._configure_locale()
                      log_max_fd()

                      if not (GitFactory and GitRemote):
                          log.error("Git client import failed: %s", git_import_err)
                      else:
                          self._git_remote = GitRemote(GitFactory())

                      if not (MercurialFactory and HgRemote):
                          log.error("Mercurial client import failed: %s", hg_import_err)
                      else:
                          self._hg_remote = HgRemote(MercurialFactory())

                      if not (SubversionFactory and SvnRemote):
                          log.error("Subversion client import failed: %s", svn_import_err)
                      else:
                          # a separate hg factory instance is used for svn url validation
                          self._svn_remote = SvnRemote(
                              SubversionFactory(), hg_factory=MercurialFactory())

                      self._vcsserver = VcsServer()
                  def _configure_locale(self):
                      """
                      Apply ``self.locale`` to ``LC_ALL`` and log the resulting locale.

                      A ``locale.Error`` is logged and otherwise ignored, leaving the locale
                      system unconfigured.
                      """
                      if not self.locale:
                          log.info('Configuring locale subsystem based on environment variables')
                      else:
                          log.info('Settings locale: `LC_ALL` to %s', self.locale)

                      try:
                          # If self.locale is the empty string, then the locale
                          # module will use the environment variables. See the
                          # documentation of the package `locale`.
                          locale.setlocale(locale.LC_ALL, self.locale)
                          active_language, active_encoding = locale.getlocale()
                          log.info(
                              'Locale set to language code "%s" with encoding "%s".',
                              active_language, active_encoding)
                      except locale.Error:
                          log.exception('Cannot set locale, not configuring the locale system')
-             class WsgiProxy(object):
+             class WsgiProxy:
                  def __init__(self, wsgi):
                      """
                      :param wsgi: object whose ``handle(...)`` method is invoked by
                          ``__call__`` for every proxied request.
                      """
                      self.wsgi = wsgi
                  def __call__(self, environ, start_response):
                      """
                      WSGI entry point: unpack the msgpack request body, delegate to
                      ``self.wsgi.handle`` and stream the outcome back msgpack encoded.

                      The HTTP status is always 200; a failure inside ``handle`` is reported
                      in-band as the first item of the response stream (see ``_iterator``).

                      :param environ: WSGI environ; ``wsgi.input`` must hold a msgpack map
                          with the keys ``environment``, ``input_data``, ``args`` and ``kwargs``.
                      :param start_response: WSGI ``start_response`` callable.
                      :return: iterator of msgpack encoded chunks.
                      """
                      input_data = environ['wsgi.input'].read()
                      input_data = msgpack.unpackb(input_data)

                      error = None
                      try:
                          data, status, headers = self.wsgi.handle(
                              input_data['environment'], input_data['input_data'],
                              *input_data['args'], **input_data['kwargs'])
                      except Exception as e:
                          data, status, headers = [], None, None
                          error = {
                              'message': str(e),
                              '_vcs_kind': getattr(e, '_vcs_kind', None)
                          }

                      # WSGI (PEP 3333) requires a status *string* and a *list* of
                      # (name, value) header tuples, not an int and a dict
                      start_response('200 OK', [])
                      return self._iterator(error, status, headers, data)
                  def _iterator(self, error, status, headers, data):
                      """
                      Lazily yield the msgpack encoding of ``error``, ``status`` and
                      ``headers`` (in that order), followed by every item of ``data``.
                      """
                      preamble = [error, status, headers]
                      yield from (msgpack.packb(part) for part in chain(preamble, data))
              def not_found(request):
                  """Not-found view: return the fixed 404 status payload; ``request`` is unused."""
                  return dict(status='404 NOT FOUND')
-             class VCSViewPredicate(object):
+             class VCSViewPredicate:
                  def __init__(self, val, config):
                      """
                      :param val: mapping of backend name to remote; stored as ``remotes``.
                      :param config: accepted but not used by this predicate.
                      """
                      self.remotes = val
                  def text(self):
                      """Describe this predicate by listing the backend names it accepts."""
                      backend_names = list(self.remotes.keys())
                      return f'vcs view method = {backend_names}'
                  # the predicate hash is the same string as the description
                  phash = text
                  def __call__(self, context, request):
                      """
                      View predicate that returns true if given backend is supported by
                      defined remotes.
                      """
                      backend = request.matchdict.get('backend')
                      return backend in self.remotes
-             class HTTPApplication(object):
+             class HTTPApplication:
                  ALLOWED_EXCEPTIONS = ('KeyError', 'URLError')
                  remote_wsgi = remote_wsgi
                  _use_echo_app = False
                  def __init__(self, settings=None, global_config=None):
                      """
                      Build the Pyramid configurator, the per-backend remotes and all routes.

                      NOTE(review): despite the ``None`` defaults, ``settings`` must be a
                      mapping (``settings.get(...)`` is called below) and ``global_config``
                      must support ``.copy()`` (see ``_configure_settings``).

                      :param settings: application settings.
                      :param global_config: global configuration; also kept on the instance.
                      """
                      self.config = Configurator(settings=settings)
                      # Init our statsd at very start
                      self.config.registry.statsd = StatsdClient.statsd
                      self.config.registry.vcs_call_context = {}
                      self.global_config = global_config
                      self.config.include('vcsserver.lib.rc_cache')
                      self.config.include('vcsserver.lib.rc_cache.archive_cache')
                      # a missing or empty `locale` setting falls back to en_US.UTF-8
                      settings_locale = settings.get('locale', '') or 'en_US.UTF-8'
                      vcs = VCS(locale_conf=settings_locale, cache_config=settings)
                      # backend name (as used in the `/{backend}` routes) -> remote object
                      self._remotes = {
                          'hg': vcs._hg_remote,
                          'git': vcs._git_remote,
                          'svn': vcs._svn_remote,
                          'server': vcs._vcsserver,
                      }
                      # developer switch: replace the real remote wsgi module with the echo stub
                      if settings.get('dev.use_echo_app', 'false').lower() == 'true':
                          self._use_echo_app = True
                          log.warning("Using EchoApp for VCS operations.")
                          self.remote_wsgi = remote_wsgi_stub
                      self._configure_settings(global_config, settings)
                      self._configure()
                  def _configure_settings(self, global_config, app_settings):
                      """
                      Configure the settings module.

                      Copies ``git_path`` and ``core.binary_dir`` (when set to a truthy value)
                      onto the ``settings`` module, and publishes ``global_config`` updated
                      with ``app_settings`` on the ``vcsserver`` package.
                      """
                      merged = global_config.copy()
                      merged.update(app_settings)

                      # optional overrides: (settings key, attribute on the settings module)
                      overrides = (
                          ('git_path', 'GIT_EXECUTABLE'),
                          ('core.binary_dir', 'BINARY_DIR'),
                      )
                      for settings_key, attr_name in overrides:
                          configured = app_settings.get(settings_key, None)
                          if configured:
                              setattr(settings, attr_name, configured)

                      # Store the settings to make them available to other modules.
                      vcsserver.PYRAMID_SETTINGS = vcsserver.CONFIG = merged
                  def _configure(self):
                      """
                      Register the msgpack renderer, all routes, their views, the
                      ``vcs_view`` predicate, the exception view, the request wrapper tween
                      and the ``request_count`` request method on ``self.config``.
                      """
                      self.config.add_renderer(name='msgpack', factory=self._msgpack_renderer_factory)
                      self.config.add_route('service', '/_service')
                      self.config.add_route('status', '/status')
                      self.config.add_route('hg_proxy', '/proxy/hg')
                      self.config.add_route('git_proxy', '/proxy/git')
                      # rpc methods
                      self.config.add_route('vcs', '/{backend}')
                      # streaming rpc remote methods
                      self.config.add_route('vcs_stream', '/{backend}/stream')
                      # vcs operations clone/push as streaming
                      self.config.add_route('stream_git', '/stream/git/*repo_name')
                      self.config.add_route('stream_hg', '/stream/hg/*repo_name')
                      self.config.add_view(self.status_view, route_name='status', renderer='json')
                      self.config.add_view(self.service_view, route_name='service', renderer='msgpack')
                      self.config.add_view(self.hg_proxy(), route_name='hg_proxy')
                      self.config.add_view(self.git_proxy(), route_name='git_proxy')
                      # the `vcs_view` keyword is the custom predicate registered further below
                      self.config.add_view(self.vcs_view, route_name='vcs', renderer='msgpack',
                                           vcs_view=self._remotes)
                      self.config.add_view(self.vcs_stream_view, route_name='vcs_stream',
                                           vcs_view=self._remotes)
                      self.config.add_view(self.hg_stream(), route_name='stream_hg')
                      self.config.add_view(self.git_stream(), route_name='stream_git')
                      self.config.add_view_predicate('vcs_view', VCSViewPredicate)
                      self.config.add_notfound_view(not_found, renderer='json')
                      self.config.add_view(self.handle_vcs_exception, context=Exception)
                      self.config.add_tween(
                          'vcsserver.tweens.request_wrapper.RequestWrapperTween',
                      )
                      self.config.add_request_method(
                          'vcsserver.lib.request_counter.get_request_counter',
                          'request_count')
                  def wsgi_app(self):
                      """Return the WSGI application built by ``self.config.make_wsgi_app()``."""
                      application = self.config.make_wsgi_app()
                      return application
                  def _vcs_view_params(self, request):
                      """
                      Decode the msgpack request body into the pieces needed for a remote call.

                      Side effects: stores ``method`` and the payload's ``_repo_name`` on
                      ``request.registry.vcs_call_context``; when a ``wire`` is given, converts
                      ``wire['context']`` to a ``uuid.UUID`` and inserts the wire as first
                      positional argument; increments the ``vcsserver_method_total`` statsd
                      counter when a statsd client is configured.

                      :return: tuple ``(payload, remote, method, args, kwargs)``.
                      """
                      remote = self._remotes[request.matchdict['backend']]
                      payload = msgpack.unpackb(request.body, use_list=True)
                      method = payload.get('method')
                      params = payload['params']
                      wire = params.get('wire')
                      args = params.get('args')
                      kwargs = params.get('kwargs')
                      context_uid = None
                      request.registry.vcs_call_context = {
                          'method': method,
                          'repo_name': payload.get('_repo_name'),
                      }
                      if wire:
                          try:
                              wire['context'] = context_uid = uuid.UUID(wire['context'])
                          except KeyError:
                              # a wire without a `context` key is passed on unchanged
                              pass
                          args.insert(0, wire)
                      repo_state_uid = wire.get('repo_state_uid') if wire else None
                      # NOTE(marcink): trading complexity for slight performance
                      if log.isEnabledFor(logging.DEBUG):
                          # also we SKIP printing out any of those methods args since they maybe excessive
                          just_args_methods = {
                              'commitctx': ('content', 'removed', 'updated'),
                              'commit': ('content', 'removed', 'updated')
                          }
                          if method in just_args_methods:
                              skip_args = just_args_methods[method]
                              # positional args are not logged at all for these methods
                              call_args = ''
                              call_kwargs = {}
                              for k in kwargs:
                                  if k in skip_args:
                                      # replace our skip key with dummy
                                      call_kwargs[k] = f'RemovedParam({k})'
                                  else:
                                      call_kwargs[k] = kwargs[k]
                          else:
                              # args[1:] leaves out the first positional argument
                              call_args = args[1:]
                              call_kwargs = kwargs
                          log.debug('Method requested:`%s` with args:%s kwargs:%s context_uid: %s, repo_state_uid:%s',
                                    method, call_args, call_kwargs, context_uid, repo_state_uid)
                      statsd = request.registry.statsd
                      if statsd:
                          statsd.incr(
                              'vcsserver_method_total', tags=[
                                  f"method:{method}",
                              ])
                      return payload, remote, method, args, kwargs
                  def vcs_view(self, request):
                      """
                      Run the RPC method named in the request payload on the selected remote.

                      :return: ``{'id': ..., 'result': ...}`` on success. When the call
                          raises, ``{'id': ..., 'error': {...}}`` carrying the message,
                          formatted traceback, original exception name/traceback, the
                          exception type (only when listed in ``ALLOWED_EXCEPTIONS``) and
                          the ``_vcs_kind`` marker of the exception.
                      """
                      payload, remote, method, args, kwargs = self._vcs_view_params(request)
                      payload_id = payload.get('id')

                      try:
                          resp = getattr(remote, method)(*args, **kwargs)
                      except Exception as e:
                          exc_info = list(sys.exc_info())

                          org_exc = getattr(e, '_org_exc', None)
                          org_exc_name = None
                          org_exc_tb = ''
                          should_store_exc = True
                          if org_exc:
                              org_exc_name = org_exc.__class__.__name__
                              org_exc_tb = getattr(e, '_org_exc_tb', '')
                              # replace our "faked" exception with our org
                              exc_info[0] = org_exc.__class__
                              exc_info[1] = org_exc

                              # these lookup failures are not stored in the exception store
                              module_name = getattr(org_exc.__class__, '__module__', 'UNKNOWN')
                              exc_fqn = module_name + '.' + org_exc_name
                              if exc_fqn in ['mercurial.error.RepoLookupError',
                                             'vcsserver.exceptions.RefNotFoundException']:
                                  should_store_exc = False

                          if should_store_exc:
                              store_exception(id(exc_info), exc_info, request_path=request.path)

                          tb_info = format_exc(exc_info)

                          # only allow-listed exception type names are exposed to the caller
                          type_ = e.__class__.__name__
                          if type_ not in self.ALLOWED_EXCEPTIONS:
                              type_ = None

                          resp = {
                              'id': payload_id,
                              'error': {
                                  'message': str(e),
                                  'traceback': tb_info,
                                  'org_exc': org_exc_name,
                                  'org_exc_tb': org_exc_tb,
                                  'type': type_,
                                  # getattr with a default never raises AttributeError,
                                  # so no guard is needed here
                                  '_vcs_kind': getattr(e, '_vcs_kind', None),
                              }
                          }
                      else:
                          resp = {
                              'id': payload_id,
                              'result': resp
                          }

                      log.debug('Serving data for method %s', method)
                      return resp
                  def vcs_stream_view(self, request):
                      """
                      Run a remote method and return its bytes result as a chunked
                      ``application/octet-stream`` response.

                      The chunk size comes from the payload's ``chunk_size`` (4096 when
                      missing or zero).
                      """
                      payload, remote, method, args, kwargs = self._vcs_view_params(request)
                      # this method has a stream: marker we remove it here
                      method = method.rpartition('stream:')[2]
                      chunk_size = safe_int(payload.get('chunk_size')) or 4096

                      method_result = getattr(remote, method)(*args, **kwargs)

                      def get_chunked_data(method_resp):
                          stream = io.BytesIO(method_resp)
                          # read() returns b'' once the buffer is exhausted
                          yield from iter(lambda: stream.read(chunk_size), b'')

                      response = Response(app_iter=get_chunked_data(method_result))
                      response.content_type = 'application/octet-stream'
                      return response
                  def status_view(self, request):
                      """
                      Report that the server is alive, together with its version, the
                      platform id (``platform.uname()[1]``, or ``'instance'`` when that is
                      empty) and the process id.
                      """
                      import vcsserver

                      node_name = platform.uname()[1]
                      status = {
                          "status": "OK",
                          "vcsserver_version": vcsserver.__version__,
                      }
                      status["platform"] = node_name or 'instance'
                      status["pid"] = os.getpid()
                      return status
                  def service_view(self, request):
                      """
                      Return diagnostic data: server version, the ``server:main`` and
                      ``app:main`` sections of the .ini file named by
                      ``global_config['__file__']``, the process environment and the
                      request payload itself.

                      A failure to read the .ini file is logged; the affected sections are
                      then reported as empty dicts.
                      """
                      import vcsserver

                      payload = msgpack.unpackb(request.body, use_list=True)

                      ini_sections = {'server:main': {}, 'app:main': {}}
                      try:
                          ini_path = self.global_config['__file__']
                          parser = configparser.RawConfigParser()
                          parser.read(ini_path)
                          for section_name in ini_sections:
                              if parser.has_section(section_name):
                                  ini_sections[section_name] = dict(parser.items(section_name))
                      except Exception:
                          log.exception('Failed to read .ini file for display')

                      environ = list(os.environ.items())

                      return {
                          'id': payload.get('id'),
                          'result': {
                              'version': vcsserver.__version__,
                              'config': ini_sections['server:main'],
                              'app_config': ini_sections['app:main'],
                              'environ': environ,
                              'payload': payload,
                          },
                      }
                  def _msgpack_renderer_factory(self, info):
                      """
                      Renderer factory producing a msgpack renderer; ``info`` is not used.

                      The renderer packs with ``use_bin_type=True`` when the ``result`` is a
                      ``BytesEnvelope`` or ``BinaryEnvelope`` (the latter is replaced by its
                      ``val``), and sets a msgpack content type on the response unless one
                      other than the default was already chosen.
                      """
                      def _render(value, system):
                          result = value.get('result')
                          is_bytes_envelope = isinstance(result, BytesEnvelope)
                          is_binary_envelope = (
                              not is_bytes_envelope and isinstance(result, BinaryEnvelope))

                          if is_bytes_envelope:
                              log.debug('Result is wrapped in BytesEnvelope type')
                          if is_binary_envelope:
                              log.debug('Result is wrapped in BinaryEnvelope type')
                              value['result'] = result.val
                          bin_type = is_bytes_envelope or is_binary_envelope

                          request = system.get('request')
                          if request is None:
                              return msgpack.packb(value, use_bin_type=bin_type)

                          response = request.response
                          if response.content_type == response.default_content_type:
                              response.content_type = 'application/x-msgpack'
                              if bin_type:
                                  response.content_type = 'application/x-msgpack-bin'
                          return msgpack.packb(value, use_bin_type=bin_type)

                      return _render
                  def set_env_from_config(self, environ, config):
                      """
                      Copy user details from the ``rhodecode`` config entry into the WSGI environ.

                      :param environ: WSGI environ, updated in place.
                      :param config: iterable of entries; the first one whose item 0 equals
                          ``'rhodecode'`` carries a JSON document in item 2.
                      """
                      scm_conf = {}
                      try:
                          for entry in config:
                              if entry[0] != 'rhodecode':
                                  continue
                              scm_conf = json.loads(entry[2])
                              break
                      except Exception:
                          log.exception('Failed to fetch SCM CONFIG')
                          return

                      username = scm_conf.get('username')
                      if username:
                          # HGUSER is mercurial specific, some extension api rely on this
                          environ['REMOTE_USER'] = environ['HGUSER'] = username

                      remote_ip = scm_conf.get('ip')
                      if remote_ip:
                          environ['REMOTE_HOST'] = remote_ip

                      if _is_request_chunked(environ):
                          # set the compatibility flag for webob
                          environ['wsgi.input_terminated'] = True
                  def hg_proxy(self):
                      """Return the WSGI view that hands requests to a ``WsgiProxy`` around ``HgRemoteWsgi``."""
                      @wsgiapp
                      def _hg_proxy(environ, start_response):
                          remote = self.remote_wsgi.HgRemoteWsgi()
                          proxy = WsgiProxy(remote)
                          return proxy(environ, start_response)

                      return _hg_proxy
                  def git_proxy(self):
                      """Return the WSGI view that hands requests to a ``WsgiProxy`` around ``GitRemoteWsgi``."""
                      @wsgiapp
                      def _git_proxy(environ, start_response):
                          remote = self.remote_wsgi.GitRemoteWsgi()
                          proxy = WsgiProxy(remote)
                          return proxy(environ, start_response)

                      return _git_proxy
                  def hg_stream(self):
                      """
                      Return the WSGI view serving Mercurial stream requests.

                      With ``self._use_echo_app`` set an ``EchoApp`` answers every request;
                      otherwise the hg WSGI app is built from the call context taken from
                      the request environ.
                      """
                      if self._use_echo_app:
                          @wsgiapp
                          def _hg_stream(environ, start_response):
                              echo = EchoApp('fake_path', 'fake_name', None)
                              return echo(environ, start_response)

                          return _hg_stream

                      @wsgiapp
                      def _hg_stream(environ, start_response):
                          log.debug('http-app: handling hg stream')
                          ctx = get_headers_call_context(environ)
                          repo_path, repo_name, config = (
                              ctx['repo_path'], ctx['repo_name'], ctx['repo_config'])
                          app = scm_app.create_hg_wsgi_app(repo_path, repo_name, config)

                          # Consistent path information for hgweb
                          environ['PATH_INFO'] = ctx['path_info']
                          environ['REPO_NAME'] = repo_name
                          self.set_env_from_config(environ, config)

                          log.debug('http-app: starting app handler '
                                    'with %s and process request', app)
                          # hop-by-hop headers are filtered out of the response
                          filtered_start_response = ResponseFilter(start_response)
                          return app(environ, filtered_start_response)

                      return _hg_stream
                  def git_stream(self):
                      """
                      Return the WSGI view serving Git stream requests.

                      With ``self._use_echo_app`` set an ``EchoApp`` answers every request.
                      Otherwise the request is routed to the Git LFS app when it is detected
                      as LFS (by content type first, by path pattern as fallback) and to
                      the plain Git app in all other cases.
                      """
                      if self._use_echo_app:
                          @wsgiapp
                          def _git_stream(environ, start_response):
                              echo = EchoApp('fake_path', 'fake_name', None)
                              return echo(environ, start_response)

                          return _git_stream

                      @wsgiapp
                      def _git_stream(environ, start_response):
                          log.debug('http-app: handling git stream')
                          ctx = get_headers_call_context(environ)
                          repo_path, repo_name, config = (
                              ctx['repo_path'], ctx['repo_name'], ctx['repo_config'])

                          environ['PATH_INFO'] = ctx['path_info']
                          self.set_env_from_config(environ, config)

                          content_type = environ.get('CONTENT_TYPE', '')
                          path = environ['PATH_INFO']

                          is_lfs_request = GIT_LFS_CONTENT_TYPE in content_type
                          log.debug(
                              'LFS: Detecting if request `%s` is LFS server path based '
                              'on content type:`%s`, is_lfs:%s',
                              path, content_type, is_lfs_request)

                          if not is_lfs_request:
                              # fallback detection by path
                              is_lfs_request = bool(GIT_LFS_PROTO_PAT.match(path))
                              log.debug(
                                  'LFS: fallback detection by path of: `%s`, is_lfs:%s',
                                  path, is_lfs_request)

                          if is_lfs_request:
                              app_factory = scm_app.create_git_lfs_wsgi_app
                          else:
                              app_factory = scm_app.create_git_wsgi_app
                          app = app_factory(repo_path, repo_name, config)

                          log.debug('http-app: starting app handler '
                                    'with %s and process request', app)
                          return app(environ, start_response)

                      return _git_stream
                  def handle_vcs_exception(self, exception, request):
                      """
                      Turn known VCS errors into HTTP responses and re-raise everything else.

                      The kind is read from the exception's ``_vcs_kind`` attribute.
                      ``repo_locked`` and ``repo_branch_protected`` get dedicated responses;
                      any other exception is stored, logged, counted in statsd when a
                      client is configured, and raised again.
                      """
                      vcs_kind = getattr(exception, '_vcs_kind', '')

                      if vcs_kind == 'repo_locked':
                          call_context = get_headers_call_context(request.environ)
                          locked_code = safe_int(call_context['locked_status_code'])
                          return HTTPRepoLocked(
                              title=str(exception), status_code=locked_code, headers=[('X-Rc-Locked', '1')])

                      if vcs_kind == 'repo_branch_protected':
                          # no custom status code is passed for this response
                          return HTTPRepoBranchProtected(
                              title=str(exception), headers=[('X-Rc-Branch-Protection', '1')])

                      captured = request.exc_info
                      store_exception(id(captured), captured)

                      traceback_info = format_exc(request.exc_info) if request.exc_info else 'unavailable'
                      log.error(
                          'error occurred handling this request for path: %s, \n%s',
                          request.path, traceback_info)

                      statsd = request.registry.statsd
                      if statsd:
                          exc_cls = exception.__class__
                          type_tag = f"type:{exc_cls.__module__}.{exc_cls.__name__}"
                          statsd.incr('vcsserver_exception_total', tags=[type_tag])

                      raise exception
-             class ResponseFilter(object):
+             class ResponseFilter:
                  def __init__(self, start_response):
                      """Remember the ``start_response`` callable that ``__call__`` forwards to."""
                      self._start_response = start_response
                  def __call__(self, status, response_headers, exc_info=None):
                      headers = tuple(
                          (h, v) for h, v in response_headers
                          if not wsgiref.util.is_hop_by_hop(h))
                      return self._start_response(status, headers, exc_info)
              def sanitize_settings_and_apply_defaults(global_config, settings):
                  """
                  Register default values for the application settings, then expand ENV variables.

                  All defaults go through ``SettingsMaker(settings)``; nothing is returned
                  (presumably ``settings`` is updated in place - verify against SettingsMaker).

                  :param global_config: global ini configuration; its ``__file__`` entry is
                      used to locate ``logging.ini`` in the same directory.
                  :param settings: application settings handed to ``SettingsMaker``.
                  """
                  # NOTE(review): created but not used anywhere else in this function
                  _global_settings_maker = SettingsMaker(global_config)
                  settings_maker = SettingsMaker(settings)
                  settings_maker.make_setting('logging.autoconfigure', False, parser='bool')
                  # logging.ini is looked up next to the ini file named by `__file__`
                  logging_conf = os.path.join(os.path.dirname(global_config.get('__file__')), 'logging.ini')
                  settings_maker.enable_logging(logging_conf)
                  # Default includes, possible to change as a user
                  pyramid_includes = settings_maker.make_setting('pyramid.includes', [], parser='list:newline')
                  log.debug("Using the following pyramid.includes: %s", pyramid_includes)
                  settings_maker.make_setting('__file__', global_config.get('__file__'))
                  settings_maker.make_setting('pyramid.default_locale_name', 'en')
                  settings_maker.make_setting('locale', 'en_US.UTF-8')
                  settings_maker.make_setting('core.binary_dir', '')
                  temp_store = tempfile.gettempdir()
                  default_cache_dir = os.path.join(temp_store, 'rc_cache')
                  # save default, cache dir, and use it for all backends later.
                  default_cache_dir = settings_maker.make_setting(
                      'cache_dir',
                      default=default_cache_dir, default_when_empty=True,
                      parser='dir:ensured')
                  # exception store cache
                  settings_maker.make_setting(
                      'exception_tracker.store_path',
                      default=os.path.join(default_cache_dir, 'exc_store'), default_when_empty=True,
                      parser='dir:ensured'
                  )
                  # repo_object cache defaults
                  settings_maker.make_setting(
                      'rc_cache.repo_object.backend',
                      default='dogpile.cache.rc.file_namespace',
                      parser='string')
                  settings_maker.make_setting(
                      'rc_cache.repo_object.expiration_time',
                      default=30 * 24 * 60 * 60,  # 30days
                      parser='int')
                  settings_maker.make_setting(
                      'rc_cache.repo_object.arguments.filename',
                      default=os.path.join(default_cache_dir, 'vcsserver_cache_repo_object.db'),
                      parser='string')
                  # statsd
                  settings_maker.make_setting('statsd.enabled', False, parser='bool')
                  settings_maker.make_setting('statsd.statsd_host', 'statsd-exporter', parser='string')
                  settings_maker.make_setting('statsd.statsd_port', 9125, parser='int')
                  settings_maker.make_setting('statsd.statsd_prefix', '')
                  settings_maker.make_setting('statsd.statsd_ipv6', False, parser='bool')
                  # runs last, after all defaults above have been registered
                  settings_maker.env_expand()
              def main(global_config, **settings):
                  """
                  Create and return the Pyramid WSGI application.

                  :param global_config: global ini configuration.
                  :param settings: application settings; defaults are filled in before use.
                  :return: the WSGI app produced by ``HTTPApplication.wsgi_app()``.
                  """
                  started_at = time.time()
                  log.info('Pyramid app config starting')

                  if MercurialFactory:
                      hgpatches.patch_largefiles_capabilities()
                      hgpatches.patch_subrepo_type_mapping()

                  # Fill in and sanitize the defaults & do ENV expansion
                  sanitize_settings_and_apply_defaults(global_config, settings)

                  # init and bootstrap StatsdClient
                  StatsdClient.setup(settings)

                  application = HTTPApplication(settings=settings, global_config=global_config)
                  pyramid_app = application.wsgi_app()

                  elapsed = time.time() - started_at
                  log.info('Pyramid app created and configured in %.2fs', elapsed)
                  return pyramid_app

vcsserver/lib/_vendor/redis_lock/__init__.py

0 +1 -1

              import threading
              import weakref
              from base64 import b64encode
              from logging import getLogger
              from os import urandom
              from typing import Union
              from redis import StrictRedis
              __version__ = '4.0.0'
              # One logger per lock life-cycle event, named "vcsserver.<module name>.<event>".
              loggers = {
                  k: getLogger("vcsserver." + ".".join((__name__, k)))
                  for k in [
                      "acquire",
                      "refresh.thread.start",
                      "refresh.thread.stop",
                      "refresh.thread.exit",
                      "refresh.start",
                      "refresh.shutdown",
                      "refresh.exit",
                      "release",
                  ]
              }
              # Aliases for the text and binary string types used in the isinstance checks of Lock.
              text_type = str
              binary_type = bytes
              # Check if the id matches. If not, return an error code (1).
              # Otherwise re-create the signal list KEYS[2] with a single item that expires
              # after ARGV[2] milliseconds, delete the lock key KEYS[1] and return 0.
              UNLOCK_SCRIPT = b"""
                  if redis.call("get", KEYS[1]) ~= ARGV[1] then
                      return 1
                  else
                      redis.call("del", KEYS[2])
                      redis.call("lpush", KEYS[2], 1)
                      redis.call("pexpire", KEYS[2], ARGV[2])
                      redis.call("del", KEYS[1])
                      return 0
                  end
              """
              # Returns 1 both when the key does not exist and when it does not equal the lock's id,
              # 2 when the key has no expiration (ttl < 0), otherwise sets the new expiry and returns 0.
              EXTEND_SCRIPT = b"""
                  if redis.call("get", KEYS[1]) ~= ARGV[1] then
                      return 1
                  elseif redis.call("ttl", KEYS[1]) < 0 then
                      return 2
                  else
                      redis.call("expire", KEYS[1], ARGV[2])
                      return 0
                  end
              """
              # Same signalling as UNLOCK_SCRIPT but without the id check: the lock key is always deleted.
              RESET_SCRIPT = b"""
                  redis.call('del', KEYS[2])
                  redis.call('lpush', KEYS[2], 1)
                  redis.call('pexpire', KEYS[2], ARGV[2])
                  return redis.call('del', KEYS[1])
              """
              # For every key matching 'lock:*': re-create its 'lock-signal:<name>' list with a
              # one second expiry and delete the lock key. Returns the number of locks found.
              RESET_ALL_SCRIPT = b"""
                  local locks = redis.call('keys', 'lock:*')
                  local signal
                  for _, lock in pairs(locks) do
                      signal = 'lock-signal:' .. string.sub(lock, 6)
                      redis.call('del', signal)
                      redis.call('lpush', signal, 1)
                      redis.call('expire', signal, 1)
                      redis.call('del', lock)
                  end
                  return #locks
              """
              class AlreadyAcquired(RuntimeError):
                  """Raised by ``Lock.acquire`` when the lock is already held under this instance's id."""
              class NotAcquired(RuntimeError):
                  """Raised by ``Lock.extend`` and ``Lock.release`` when the lock key is not held under this id."""
              class AlreadyStarted(RuntimeError):
                  """Raised when a lock renewal thread is started while one is already registered."""
              class TimeoutNotUsable(RuntimeError):
                  """Raised by ``Lock.acquire`` when a timeout is combined with ``blocking=False``."""
              class InvalidTimeout(RuntimeError):
                  """Raised by ``Lock.acquire`` when the given timeout is negative."""
              class TimeoutTooLarge(RuntimeError):
                  """Raised by ``Lock.acquire`` when the timeout exceeds the expiry of a lock without auto renewal."""
              class NotExpirable(RuntimeError):
                  """Raised by ``Lock.extend`` when the lock key has no expiration time assigned."""
-             class Lock(object):
+             class Lock:
                  """
                  A Lock context manager implemented via redis SETNX/BLPOP.
                  """
                  unlock_script = None
                  extend_script = None
                  reset_script = None
                  reset_all_script = None
                  _lock_renewal_interval: float
                  _lock_renewal_thread: Union[threading.Thread, None]
                  def __init__(self, redis_client, name, expire=None, id=None, auto_renewal=False, strict=True, signal_expire=1000):
                      """
                      :param redis_client:
                          An instance of :class:`~StrictRedis`.
                      :param name:
                          The name (redis key) the lock should have.
                      :param expire:
                          The lock expiry time in seconds. If left at the default (None)
                          the lock will not expire.
                      :param id:
                          The ID (redis value) the lock should have. A random value is
                          generated when left at the default.
                          Note that if you specify this then the lock is marked as "held". Acquires
                          won't be possible.
                      :param auto_renewal:
                          If set to ``True``, Lock will automatically renew the lock so that it
                          doesn't expire for as long as the lock is held (acquire() called
                          or running in a context manager).
                          Implementation note: Renewal will happen using a daemon thread with
                          an interval of ``expire*2/3``. If wishing to use a different renewal
                          time, subclass Lock, call ``super().__init__()`` then set
                          ``self._lock_renewal_interval`` to your desired interval.
                      :param strict:
                          If set ``True`` then the ``redis_client`` needs to be an instance of ``redis.StrictRedis``.
                      :param signal_expire:
                          Advanced option to override signal list expiration in milliseconds. Increase it for very slow clients. Default: ``1000``.
                      """
                      if strict and not isinstance(redis_client, StrictRedis):
                          raise ValueError("redis_client must be instance of StrictRedis. "
                                           "Use strict=False if you know what you're doing.")
                      if auto_renewal and expire is None:
                          raise ValueError("Expire may not be None when auto_renewal is set")
                      self._client = redis_client
                      if expire:
                          expire = int(expire)
                          if expire < 0:
                              raise ValueError("A negative expire is not acceptable.")
                      else:
                          expire = None
                      self._expire = expire
                      self._signal_expire = signal_expire
                      if id is None:
                          self._id = b64encode(urandom(18)).decode('ascii')
                      elif isinstance(id, binary_type):
                          try:
                              self._id = id.decode('ascii')
                          except UnicodeDecodeError:
                              self._id = b64encode(id).decode('ascii')
                      elif isinstance(id, text_type):
                          self._id = id
                      else:
                          raise TypeError(f"Incorrect type for `id`. Must be bytes/str not {type(id)}.")
                      self._name = 'lock:' + name
                      self._signal = 'lock-signal:' + name
                      self._lock_renewal_interval = (float(expire) * 2 / 3
                                                     if auto_renewal
                                                     else None)
                      self._lock_renewal_thread = None
                      self.register_scripts(redis_client)
                  @classmethod
                  def register_scripts(cls, redis_client):
                      """
                      Register the Lua scripts with ``redis_client`` the first time it is called.

                      The module-level ``reset_all_script`` doubles as the "already registered"
                      marker: while it is ``None`` the four class-level script attributes and
                      the module-level one are (re)created; afterwards this is a no-op.
                      """
                      global reset_all_script
                      if reset_all_script is None:
                          cls.unlock_script = redis_client.register_script(UNLOCK_SCRIPT)
                          cls.extend_script = redis_client.register_script(EXTEND_SCRIPT)
                          cls.reset_script = redis_client.register_script(RESET_SCRIPT)
                          cls.reset_all_script = redis_client.register_script(RESET_ALL_SCRIPT)
                          # module-level copy, used by reset_all()
                          reset_all_script = redis_client.register_script(RESET_ALL_SCRIPT)
                  @property
                  def _held(self):
                      return self.id == self.get_owner_id()
                  def reset(self):
                      """
                      Forcibly deletes the lock. Use this with care.
                      """
                      self.reset_script(client=self._client, keys=(self._name, self._signal), args=(self.id, self._signal_expire))
                  @property
                  def id(self):
                      """The id of this lock instance (the value written to the lock key on acquire)."""
                      return self._id
                  def get_owner_id(self):
                      """
                      Return the value currently stored under the lock key.

                      Binary values are decoded as ascii (undecodable bytes are replaced);
                      anything else, including ``None``, is returned unchanged.
                      """
                      raw_owner = self._client.get(self._name)
                      if not isinstance(raw_owner, binary_type):
                          return raw_owner
                      return raw_owner.decode('ascii', 'replace')
                  def acquire(self, blocking=True, timeout=None):
                      """
                      Try to take the lock by setting the lock key to this instance's id.

                      :param blocking:
                          Boolean value specifying whether lock should be blocking or not.
                      :param timeout:
                          An integer value specifying the maximum number of seconds to block.
                      :return:
                          ``True`` once the lock was acquired; ``False`` when it is busy and
                          either ``blocking`` is false or the timeout elapsed.
                      :raises AlreadyAcquired: if the lock key already holds this instance's id.
                      :raises TimeoutNotUsable: if ``timeout`` is given together with ``blocking=False``.
                      :raises InvalidTimeout: if ``timeout`` is negative.
                      :raises TimeoutTooLarge: if ``timeout`` exceeds ``expire`` and auto renewal is off.
                      """
                      logger = loggers["acquire"]
                      logger.debug("Getting blocking: %s acquire on %r ...", blocking, self._name)
                      if self._held:
                          owner_id = self.get_owner_id()
                          raise AlreadyAcquired("Already acquired from this Lock instance. Lock id: {}".format(owner_id))
                      if not blocking and timeout is not None:
                          raise TimeoutNotUsable("Timeout cannot be used if blocking=False")
                      if timeout:
                          timeout = int(timeout)
                          if timeout < 0:
                              raise InvalidTimeout(f"Timeout ({timeout}) cannot be less than or equal to 0")
                          if self._expire and not self._lock_renewal_interval and timeout > self._expire:
                              raise TimeoutTooLarge(f"Timeout ({timeout}) cannot be greater than expire ({self._expire})")
                      busy = True
                      # how long a single blpop waits on the signal list; 0 when neither timeout nor expire is set
                      blpop_timeout = timeout or self._expire or 0
                      timed_out = False
                      while busy:
                          # nx=True: the key is only set when it does not exist yet
                          busy = not self._client.set(self._name, self._id, nx=True, ex=self._expire)
                          if busy:
                              if timed_out:
                                  return False
                              elif blocking:
                                  # an empty blpop result only counts as a time-out when a timeout was
                                  # requested; the loop then makes one more set attempt before giving up
                                  timed_out = not self._client.blpop(self._signal, blpop_timeout) and timeout
                              else:
                                  logger.warning("Failed to acquire Lock(%r).", self._name)
                                  return False
                      logger.debug("Acquired Lock(%r).", self._name)
                      if self._lock_renewal_interval is not None:
                          self._start_lock_renewer()
                      return True
                  def extend(self, expire=None):
                      """
                      Extends expiration time of the lock.
                      :param expire:
                          New expiration time. If ``None`` - `expire` provided during
                          lock initialization will be taken.
                      """
                      if expire:
                          expire = int(expire)
                          if expire < 0:
                              raise ValueError("A negative expire is not acceptable.")
                      elif self._expire is not None:
                          expire = self._expire
                      else:
                          raise TypeError(
                              "To extend a lock 'expire' must be provided as an "
                              "argument to extend() method or at initialization time."
                          )
                      error = self.extend_script(client=self._client, keys=(self._name, self._signal), args=(self._id, expire))
                      if error == 1:
                          raise NotAcquired(f"Lock {self._name} is not acquired or it already expired.")
                      elif error == 2:
                          raise NotExpirable(f"Lock {self._name} has no assigned expiration time")
                      elif error:
                          raise RuntimeError(f"Unsupported error code {error} from EXTEND script")
                  @staticmethod
                  def _lock_renewer(name, lockref, interval, stop):
                      """
                      Renew the lock key in redis every `interval` seconds until the
                      `stop` event is set or the referenced Lock has been garbage collected.

                      :param name: lock name, used for log messages only.
                      :param lockref: weak reference to the Lock being renewed.
                      :param interval: seconds to wait between two renewals.
                      :param stop: event whose ``wait`` is used as the sleep between renewals.
                      """
                      # wait() returns True as soon as `stop` is set, which ends the loop
                      while not stop.wait(timeout=interval):
                          loggers["refresh.thread.start"].debug("Refreshing Lock(%r).", name)
                          lock: "Lock" = lockref()
                          if lock is None:
                              loggers["refresh.thread.stop"].debug(
                                  "Stopping loop because Lock(%r) was garbage collected.", name
                              )
                              break
                          lock.extend(expire=lock._expire)
                          # drop the strong reference again before the next wait
                          del lock
                      loggers["refresh.thread.exit"].debug("Exiting renewal thread for Lock(%r).", name)
                  def _start_lock_renewer(self):
                      """
                      Spawn the daemon thread that keeps refreshing this lock.

                      :raises AlreadyStarted: if a renewal thread is already registered.
                      """
                      if self._lock_renewal_thread is not None:
                          raise AlreadyStarted("Lock refresh thread already started")

                      loggers["refresh.start"].debug(
                          "Starting renewal thread for Lock(%r). Refresh interval: %s seconds.",
                          self._name, self._lock_renewal_interval
                      )
                      stop_event = threading.Event()
                      self._lock_renewal_stop = stop_event
                      # the thread only gets a weak reference, so it does not keep the lock alive
                      renewer_kwargs = {
                          'name': self._name,
                          'lockref': weakref.ref(self),
                          'interval': self._lock_renewal_interval,
                          'stop': stop_event,
                      }
                      renewer = threading.Thread(
                          group=None,
                          target=self._lock_renewer,
                          kwargs=renewer_kwargs,
                          daemon=True,
                      )
                      self._lock_renewal_thread = renewer
                      renewer.start()
                  def _stop_lock_renewer(self):
                      """
                      Stop the lock renewer.
                      This signals the renewal thread and waits for its exit.
                      """
                      if self._lock_renewal_thread is None or not self._lock_renewal_thread.is_alive():
                          return
                      loggers["refresh.shutdown"].debug("Signaling renewal thread for Lock(%r) to exit.", self._name)
                      self._lock_renewal_stop.set()
                      self._lock_renewal_thread.join()
                      self._lock_renewal_thread = None
                      loggers["refresh.exit"].debug("Renewal thread for Lock(%r) exited.", self._name)
                  def __enter__(self):
                      acquired = self.acquire(blocking=True)
                      if not acquired:
                          raise AssertionError(f"Lock({self._name}) wasn't acquired, but blocking=True was used!")
                      return self
                  def __exit__(self, exc_type=None, exc_value=None, traceback=None):
                      """Release the lock when leaving the ``with`` block; the exception details are not used."""
                      self.release()
                  def release(self):
                      """Releases the lock, that was acquired with the same object.

                      Stops the renewal thread first (when one is registered), then runs the
                      unlock script with this instance's id.

                      .. note::
                          If you want to release a lock that you acquired in a different place you have two choices:
                          * Use ``Lock("name", id=id_from_other_place).release()``
                          * Use ``Lock("name").reset()``

                      :raises NotAcquired: if the script reports code 1.
                      :raises RuntimeError: for any other non-zero script result.
                      """
                      if self._lock_renewal_thread is not None:
                          self._stop_lock_renewer()
                      loggers["release"].debug("Releasing Lock(%r).", self._name)
                      error = self.unlock_script(client=self._client, keys=(self._name, self._signal), args=(self._id, self._signal_expire))
                      if error == 1:
                          raise NotAcquired(f"Lock({self._name}) is not acquired or it already expired.")
                      elif error:
                          # the code comes from the UNLOCK script, not from EXTEND
                          raise RuntimeError(f"Unsupported error code {error} from UNLOCK script.")
                  def locked(self):
                      """
                      Return true if the lock is acquired.
                      Checks that lock with same name already exists. This method returns true, even if
                      lock have another id.
                      """
                      return self._client.exists(self._name) == 1
              reset_all_script = None
              def reset_all(redis_client):
                  """
                  Forcibly delete all locks that are still around (e.g. left behind by a crash). Use this with care.
                  :param redis_client:
                      An instance of :class:`~StrictRedis`.
                  """
                  # makes sure the module-level ``reset_all_script`` is registered before it is called
                  Lock.register_scripts(redis_client)
                  reset_all_script(client=redis_client)  # noqa

vcsserver/lib/_vendor/statsd/base.py

0 +1 -1

              import re
              import random
              from collections import deque
              from datetime import timedelta
              from repoze.lru import lru_cache
              from .timer import Timer
              # Matches every character that is not a word character, digit, "_", "-", ":", "/" or ".".
              TAG_INVALID_CHARS_RE = re.compile(
                  r"[^\w\d_\-:/\.]",
                  #re.UNICODE
              )
              # Replacement for each character matched by TAG_INVALID_CHARS_RE.
              TAG_INVALID_CHARS_SUBS = "_"
              # we save and expose methods called by statsd for discovery
              buckets_dict = {
              }
              @lru_cache(maxsize=500)
              def _normalize_tags_with_cache(tag_list):
                  """Return a list with every invalid character in each tag replaced; results are cached."""
                  normalized = []
                  for tag in tag_list:
                      normalized.append(TAG_INVALID_CHARS_RE.sub(TAG_INVALID_CHARS_SUBS, tag))
                  return normalized
              def normalize_tags(tag_list):
                  """Normalize all tags in ``tag_list`` via the cached ``_normalize_tags_with_cache``."""
                  # We have to turn our input tag list into a non-mutable tuple for it to
                  # be hashable (and thus usable) by the @lru_cache decorator.
                  return _normalize_tags_with_cache(tuple(tag_list))
-             class StatsClientBase(object):
+             class StatsClientBase:
                  """A Base class for various statsd clients."""
                  def close(self):
                      """Used to close and clean up any underlying resources.

                      Not implemented in the base class; always raises NotImplementedError here.
                      """
                      raise NotImplementedError()
                  def _send(self):
                      """Not implemented in the base class; always raises NotImplementedError here."""
                      raise NotImplementedError()
                  def pipeline(self):
                      """Not implemented in the base class; always raises NotImplementedError here.

                      ``gauge`` uses the return value as a context manager that yields an
                      object offering ``_send_stat``.
                      """
                      raise NotImplementedError()
                  def timer(self, stat, rate=1, tags=None, auto_send=True):
                      """
                      Return a :class:`Timer` bound to this client for ``stat``.

                      Example::

                          statsd = StatsdClient.statsd
                          with statsd.timer('bucket_name', auto_send=True) as tmr:
                              # This block will be timed.
                              for i in range(0, 100000):
                                  i ** 2
                          # you can access time here...
                          elapsed_ms = tmr.ms
                      """
                      return Timer(self, stat, rate, tags, auto_send=auto_send)
                  def timing(self, stat, delta, rate=1, tags=None, use_decimals=True):
                      """
                      Send new timing information.
                      `delta` can be either a number of milliseconds or a timedelta.
                      """
                      if isinstance(delta, timedelta):
                          # Convert timedelta to number of milliseconds.
                          delta = delta.total_seconds() * 1000.
                      if use_decimals:
                          fmt = '%0.6f|ms'
                      else:
                          fmt = '%s|ms'
                      self._send_stat(stat, fmt % delta, rate, tags)
                  def incr(self, stat, count=1, rate=1, tags=None):
                      """Increment a stat by `count`."""
                      self._send_stat(stat, '%s|c' % count, rate, tags)
                  def decr(self, stat, count=1, rate=1, tags=None):
                      """Decrement a stat by `count`."""
                      self.incr(stat, -count, rate, tags)
                  def gauge(self, stat, value, rate=1, delta=False, tags=None):
                      """Set a gauge value."""
                      if value < 0 and not delta:
                          if rate < 1:
                              if random.random() > rate:
                                  return
                          with self.pipeline() as pipe:
                              pipe._send_stat(stat, '0|g', 1)
                              pipe._send_stat(stat, '%s|g' % value, 1)
                      else:
                          prefix = '+' if delta and value >= 0 else ''
                          self._send_stat(stat, '%s%s|g' % (prefix, value), rate, tags)
                  def set(self, stat, value, rate=1):
                      """Set a set value."""
                      self._send_stat(stat, '%s|s' % value, rate)
                  def histogram(self, stat, value, rate=1, tags=None):
                      """Set a histogram"""
                      self._send_stat(stat, '%s|h' % value, rate, tags)
                  def _send_stat(self, stat, value, rate, tags=None):
                      self._after(self._prepare(stat, value, rate, tags))
                  def _prepare(self, stat, value, rate, tags=None):
                      """
                      Build the wire string for one stat, or return ``None`` when sampled out.

                      The stat name is recorded in ``buckets_dict`` before sampling is applied.
                      For ``rate < 1`` the value gets a ``|@rate`` suffix; a configured prefix
                      is prepended to the stat name and normalized tags are appended
                      after ``|#``.
                      """
                      buckets_dict[stat] = 1
                      if rate < 1:
                          if random.random() > rate:
                              return None
                          value = '%s|@%s' % (value, rate)
                      full_name = '%s.%s' % (self._prefix, stat) if self._prefix else stat
                      tag_suffix = ("|#" + ",".join(normalize_tags(tags))) if tags else ""
                      return '%s:%s%s' % (full_name, value, tag_suffix)
                  def _after(self, data):
                      if data:
                          self._send(data)
              class PipelineBase(StatsClientBase):
                  """Stats client that queues prepared stats instead of sending each one."""
                  def __init__(self, client):
                      self._stats = deque()
                      self._client = client
                      self._prefix = client._prefix
                  def _send(self):
                      """Transport hook for the queued stats; this implementation always raises."""
                      raise NotImplementedError
                  def _after(self, data):
                      """Queue ``data`` unless it is ``None`` (i.e. the stat was sampled out)."""
                      if data is None:
                          return
                      self._stats.append(data)
                  def __enter__(self):
                      return self
                  def __exit__(self, typ, value, tb):
                      # leaving the `with` block flushes whatever was queued
                      self.send()
                  def send(self):
                      """Call ``_send`` when at least one stat is queued; otherwise do nothing."""
                      if self._stats:
                          self._send()
                  def pipeline(self):
                      """Return a new pipeline of the same class that wraps this one."""
                      pipeline_cls = self.__class__
                      return pipeline_cls(self)

vcsserver/lib/_vendor/statsd/timer.py

0 +1 -1

              import functools
              from time import perf_counter as time_now
              def safe_wraps(wrapper, *args, **kwargs):
                  """Apply ``functools.wraps`` using the function underneath any partials."""
                  target = wrapper
                  # unwrap nested functools.partial objects down to the real callable
                  while isinstance(target, functools.partial):
                      target = target.func
                  return functools.wraps(target, *args, **kwargs)
-             class Timer(object):
+             class Timer:
                  """A context manager/decorator for statsd.timing()."""
                  def __init__(self, client, stat, rate=1, tags=None, use_decimals=True, auto_send=True):
                      self.client = client
                      self.stat = stat
                      self.rate = rate
                      self.tags = tags
                      self.ms = None
                      self._sent = False
                      self._start_time = None
                      self.use_decimals = use_decimals
                      self.auto_send = auto_send
                  def __call__(self, f):
                      """Decorate ``f`` so that every call is timed and reported.

                      The start time lives in a local variable of the wrapper, and the
                      elapsed milliseconds are passed to ``client.timing`` even when ``f`` raises.
                      """
                      @safe_wraps(f)
                      def _wrapped(*args, **kwargs):
                          began = time_now()
                          try:
                              return f(*args, **kwargs)
                          finally:
                              elapsed_ms = (time_now() - began) * 1000.0
                              self.client.timing(self.stat, elapsed_ms, self.rate, self.tags, self.use_decimals)
                              self._sent = True
                      return _wrapped
                  def __enter__(self):
                      return self.start()
                  def __exit__(self, typ, value, tb):
                      self.stop(send=self.auto_send)
                  def start(self):
                      self.ms = None
                      self._sent = False
                      self._start_time = time_now()
                      return self
                  def stop(self, send=True):
                      if self._start_time is None:
                          raise RuntimeError('Timer has not started.')
                      dt = time_now() - self._start_time
                      self.ms = 1000.0 * dt  # Convert to milliseconds.
                      if send:
                          self.send()
                      return self
                  def send(self):
                      if self.ms is None:
                          raise RuntimeError('No data recorded.')
                      if self._sent:
                          raise RuntimeError('Already sent data.')
                      self._sent = True
                      self.client.timing(self.stat, self.ms, self.rate, self.tags, self.use_decimals)

vcsserver/lib/rc_cache/backends.py

0 +2 -2

              # RhodeCode VCSServer provides access to different vcs backends via network.
              # Copyright (C) 2014-2023 RhodeCode GmbH
              #
              # This program is free software; you can redistribute it and/or modify
              # it under the terms of the GNU General Public License as published by
              # the Free Software Foundation; either version 3 of the License, or
              # (at your option) any later version.
              #
              # This program is distributed in the hope that it will be useful,
              # but WITHOUT ANY WARRANTY; without even the implied warranty of
              # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
              # GNU General Public License for more details.
              #
              # You should have received a copy of the GNU General Public License
              # along with this program; if not, write to the Free Software Foundation,
              # Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301  USA
              #import errno
              import fcntl
              import functools
              import logging
              import os
              import pickle
              #import time
              #import gevent
              import msgpack
              import redis
              flock_org = fcntl.flock
              from typing import Union
              from dogpile.cache.api import Deserializer, Serializer
              from dogpile.cache.backends import file as file_backend
              from dogpile.cache.backends import memory as memory_backend
              from dogpile.cache.backends import redis as redis_backend
              from dogpile.cache.backends.file import FileLock
              from dogpile.cache.util import memoized_property
              from vcsserver.lib.memory_lru_dict import LRUDict, LRUDictDebug
              from vcsserver.str_utils import safe_bytes, safe_str
              from vcsserver.type_utils import str2bool
              # Capacity handed to the LRU dict when LRUMemoryBackend gets no `max_size` argument.
              _default_max_size = 1024
              log = logging.getLogger(__name__)
              class LRUMemoryBackend(memory_backend.MemoryBackend):
                  """Memory backend whose cache dict is an ``LRUDict`` limited to ``max_size``."""
                  key_prefix = 'lru_mem_backend'
                  pickle_values = False
                  def __init__(self, arguments):
                      self.max_size = arguments.pop('max_size', _default_max_size)
                      # `log_key_count` switches to the debug variant of the LRU dict
                      use_debug_dict = arguments.pop('log_key_count', None)
                      dict_factory = LRUDictDebug if use_debug_dict else LRUDict
                      arguments['cache_dict'] = dict_factory(self.max_size)
                      super().__init__(arguments)
                  def __repr__(self):
                      return f'{self.__class__}(maxsize=`{self.max_size}`)'
                  def __str__(self):
                      return repr(self)
                  def delete(self, key):
                      """Remove ``key`` from the cache; a missing key is not an error."""
                      try:
                          del self._cache[key]
                      except KeyError:
                          # deleting an absent key is deliberately a no-op
                          pass
                  def delete_multi(self, keys):
                      """Remove every key in ``keys``, ignoring the ones that are absent."""
                      for cache_key in keys:
                          self.delete(cache_key)
              class PickleSerializer:
                  """Mixin that supplies a pickle based ``serializer`` / ``deserializer`` pair."""
                  # values are dumped with the highest pickle protocol available
                  serializer: None | Serializer = staticmethod(  # type: ignore
                      functools.partial(pickle.dumps, protocol=pickle.HIGHEST_PROTOCOL)
                  )
                  # NOTE(review): pickle.loads can execute arbitrary code on crafted input,
                  # so the backing store must only ever contain trusted data.
                  deserializer: None | Deserializer = staticmethod(  # type: ignore
                      functools.partial(pickle.loads)
                  )
-             class MsgPackSerializer(object):
+             class MsgPackSerializer:
                  # msgpack based `serializer` / `deserializer` pair, same attribute
                  # names as PickleSerializer
                  serializer: None | Serializer = staticmethod(  # type: ignore
                      msgpack.packb
                  )
                  # use_list=False: msgpack arrays are unpacked as tuples instead of lists
                  deserializer: None | Deserializer = staticmethod(  # type: ignore
                      functools.partial(msgpack.unpackb, use_list=False)
                  )
              class CustomLockFactory(FileLock):
                  """Plain ``FileLock`` subclass; installed as ``lock_factory`` by ``FileNamespaceBackend``."""
              class FileNamespaceBackend(PickleSerializer, file_backend.DBMBackend):
                  """DBM file backend using pickle serialization, with support for listing keys."""
                  key_prefix = 'file_backend'
                  def __init__(self, arguments):
                      """
                      Make sure the directory of ``arguments['filename']`` exists, then
                      initialize the DBM backend. Initialization errors are logged and re-raised.
                      """
                      arguments['lock_factory'] = CustomLockFactory
                      db_file = arguments.get('filename')
                      log.debug('initialing cache-backend=%s db in %s', self.__class__.__name__, db_file)
                      db_file_dir = os.path.dirname(db_file)
                      # dirname is '' for a bare filename (file lives in the cwd) and
                      # os.makedirs('') would raise; exist_ok=True keeps this safe when
                      # another process creates the directory at the same time.
                      if db_file_dir:
                          os.makedirs(db_file_dir, exist_ok=True)
                      try:
                          super().__init__(arguments)
                      except Exception:
                          log.exception('Failed to initialize db at: %s', db_file)
                          raise
                  def __repr__(self):
                      return f'{self.__class__}(file=`{self.filename}`)'
                  def __str__(self):
                      return self.__repr__()
                  def _get_keys_pattern(self, prefix: bytes = b''):
                      """Return ``<key_prefix>:<prefix>`` as bytes."""
                      return b'%b:%b' % (safe_bytes(self.key_prefix), safe_bytes(prefix))
                  def list_keys(self, prefix: bytes = b''):
                      """
                      Return the DBM keys that start with ``<key_prefix>:<prefix>``.

                      Failures while reading the keys are logged and re-raised.
                      """
                      pattern = self._get_keys_pattern(prefix)
                      with self._dbm_file(True) as dbm:
                          try:
                              # startswith() is also True for an empty pattern, so no
                              # separate "no prefix" case is needed
                              return [dbm_key for dbm_key in dbm.keys() if dbm_key.startswith(pattern)]
                          except Exception:
                              log.error('Failed to fetch DBM keys from DB: %s', self.get_store())
                              raise
                  def get_store(self):
                      """Return the path of the DBM file backing this cache."""
                      return self.filename
              class BaseRedisBackend(redis_backend.RedisBackend):
                  """Redis backend base with key listing and an optional distributed mutex."""
                  key_prefix = ''
                  def __init__(self, arguments):
                      # human readable connection target, only used by __repr__
                      self.db_conn = arguments.get('host', '') or arguments.get('url', '') or 'redis-host'
                      super().__init__(arguments)
                      self._lock_timeout = self.lock_timeout
                      self._lock_auto_renewal = str2bool(arguments.pop("lock_auto_renewal", True))
                      if self._lock_auto_renewal and not self._lock_timeout:
                          # set default timeout for auto_renewal
                          self._lock_timeout = 30
                  def __repr__(self):
                      return f'{self.__class__}(conn=`{self.db_conn}`)'
                  def __str__(self):
                      return self.__repr__()
                  def _create_client(self):
                      """
                      Create the redis client from a shared connection pool.

                      The same client object is used for reads and for writes.
                      """
                      if self.url is not None:
                          # A URL has to be parsed into connection settings by from_url();
                          # ConnectionPool(url=...) would hand the raw `url` keyword to
                          # the connection class instead.
                          connection_pool = redis.ConnectionPool.from_url(self.url)
                      else:
                          connection_pool = redis.ConnectionPool(
                              host=self.host, password=self.password,
                              port=self.port, db=self.db
                          )
                      self.writer_client = redis.StrictRedis(
                          connection_pool=connection_pool
                      )
                      self.reader_client = self.writer_client
                  def _get_keys_pattern(self, prefix: bytes = b''):
                      """Return the glob pattern ``<key_prefix>:<prefix>*`` as bytes."""
                      return b'%b:%b*' % (safe_bytes(self.key_prefix), safe_bytes(prefix))
                  def list_keys(self, prefix: bytes = b''):
                      """Return the keys matching the pattern built from ``prefix``."""
                      prefix = self._get_keys_pattern(prefix)
                      return self.reader_client.keys(prefix)
                  def get_store(self):
                      """Return the connection pool of the reader client."""
                      return self.reader_client.connection_pool
                  def get_mutex(self, key):
                      """Return a redis lock wrapper for ``key``, or ``None`` without ``distributed_lock``."""
                      if self.distributed_lock:
                          lock_key = f'_lock_{safe_str(key)}'
                          return get_mutex_lock(
                              self.writer_client, lock_key,
                              self._lock_timeout,
                              auto_renewal=self._lock_auto_renewal
                          )
                      else:
                          return None
              class RedisPickleBackend(PickleSerializer, BaseRedisBackend):
                  """Redis backend that serializes values with pickle."""
                  key_prefix = 'redis_pickle_backend'
              class RedisMsgPackBackend(MsgPackSerializer, BaseRedisBackend):
                  """Redis backend that serializes values with msgpack."""
                  key_prefix = 'redis_msgpack_backend'
              def get_mutex_lock(client, lock_key, lock_timeout, auto_renewal=False):
                  from vcsserver.lib._vendor import redis_lock
-                 class _RedisLockWrapper(object):
+                 class _RedisLockWrapper:
                      """LockWrapper for redis_lock"""
                      @classmethod
                      def get_lock(cls):
                          """Build a strict ``redis_lock.Lock`` from the arguments of the enclosing call."""
                          lock_options = {
                              'redis_client': client,
                              'name': lock_key,
                              'expire': lock_timeout,
                              'auto_renewal': auto_renewal,
                              'strict': True,
                          }
                          return redis_lock.Lock(**lock_options)
                      def __repr__(self):
                          # "<class name>:<lock key>"
                          return '{}:{}'.format(self.__class__.__name__, lock_key)
                      def __str__(self):
                          # same "<class name>:<lock key>" text as __repr__
                          return '{}:{}'.format(self.__class__.__name__, lock_key)
                      def __init__(self):
                          """Create the underlying lock and remember its key for log messages."""
                          self.lock_key = lock_key
                          self.lock = self.get_lock()
                      def acquire(self, wait=True):
                          """
                          Try to take the lock and return whether it is held.

                          ``AlreadyAcquired`` is reported as ``False`` and ``AlreadyStarted``
                          as ``True``.
                          """
                          log.debug('Trying to acquire Redis lock for key %s', self.lock_key)
                          try:
                              acquired = self.lock.acquire(wait)
                          except redis_lock.AlreadyAcquired:
                              return False
                          except redis_lock.AlreadyStarted:
                              # refresh thread exists, but it also means we acquired the lock
                              return True
                          log.debug('Got lock for key %s, %s', self.lock_key, acquired)
                          return acquired
                      def release(self):
                          """Release the lock; releasing a lock that is not held is a no-op."""
                          try:
                              self.lock.release()
                          except redis_lock.NotAcquired:
                              # deliberately ignored: there is nothing to release
                              pass
                  return _RedisLockWrapper()

vcsserver/lib/svnremoterepo.py

0 +2 -2

              # RhodeCode VCSServer provides access to different vcs backends via network.
              # Copyright (C) 2014-2023 RhodeCode GmbH
              #
              # This program is free software; you can redistribute it and/or modify
              # it under the terms of the GNU General Public License as published by
              # the Free Software Foundation; either version 3 of the License, or
              # (at your option) any later version.
              #
              # This program is distributed in the hope that it will be useful,
              # but WITHOUT ANY WARRANTY; without even the implied warranty of
              # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
              # GNU General Public License for more details.
              #
              # You should have received a copy of the GNU General Public License
              # along with this program; if not, write to the Free Software Foundation,
              # Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301  USA
              import os
              import tempfile
              from svn import client
              from svn import core
              from svn import ra
              from mercurial import error
              from vcsserver.str_utils import safe_bytes
              # Runs at import time. The config object loaded here is later passed to
              # ra.open2() in SubversionRepo.init_ra_and_client.
              # NOTE(review): `None` presumably selects the default configuration
              # directory — confirm against the Subversion bindings.
              core.svn_config_ensure(None)
              svn_config = core.svn_config_get_config(None)
              class RaCallbacks(ra.Callbacks):
                  """RA callbacks that provide temp files and the client identification string."""
                  @staticmethod
                  def open_tmp_file(pool):  # pragma: no cover
                      # only the path is needed, so the descriptor is closed right away
                      handle, tmp_path = tempfile.mkstemp()
                      os.close(handle)
                      return tmp_path
                  @staticmethod
                  def get_client_string(pool):
                      return b'RhodeCode-subversion-url-checker'
              class SubversionException(Exception):
                  """Base class of the Subversion related exceptions defined in this module."""
              class SubversionConnectionException(SubversionException):
                  """Raised when a generic error occurs while connecting to a repository."""
              def normalize_url(url):
                  """Drop a leading ``svn+`` from http(s) URLs and strip trailing slashes.

                  Falsy input is returned unchanged; a non-empty ``url`` is handled as ``bytes``.
                  """
                  if not url:
                      return url
                  if url.startswith((b'svn+http://', b'svn+https://')):
                      url = url[len(b'svn+'):]
                  return url.rstrip(b'/')
              def _create_auth_baton(pool):
                  """Create a Subversion authentication baton.

                  Platform specific providers are added when the bindings expose them and
                  they can be instantiated; the generic client providers are always added.
                  """
                  optional_provider_names = (
                      'svn_auth_get_gnome_keyring_simple_provider',
                      'svn_auth_get_gnome_keyring_ssl_client_cert_pw_provider',
                      'svn_auth_get_keychain_simple_provider',
                      'svn_auth_get_keychain_ssl_client_cert_pw_provider',
                      'svn_auth_get_kwallet_simple_provider',
                      'svn_auth_get_kwallet_ssl_client_cert_pw_provider',
                      'svn_auth_get_ssl_client_cert_file_provider',
                      'svn_auth_get_windows_simple_provider',
                      'svn_auth_get_windows_ssl_server_trust_provider',
                  )
                  providers = []
                  for provider_name in optional_provider_names:
                      factory = getattr(core, provider_name, None)
                      if factory is None:
                          # not available in these bindings
                          continue
                      try:
                          providers.append(factory())
                      except RuntimeError:
                          pass
                  providers.extend([
                      client.get_simple_provider(),
                      client.get_username_provider(),
                      client.get_ssl_client_cert_file_provider(),
                      client.get_ssl_client_cert_pw_file_provider(),
                      client.get_ssl_server_trust_file_provider(),
                  ])
                  return core.svn_auth_open(providers, pool)
-             class SubversionRepo(object):
+             class SubversionRepo:
                  """Wrapper for a Subversion repository.
                  It uses the SWIG Python bindings, see above for requirements.
                  """
                  def __init__(self, svn_url: bytes = b'', username: bytes = b'', password: bytes = b''):
                      """
                      Open an RA session for ``svn_url`` and read the repository UUID.

                      The session is opened by ``init_ra_and_client``; errors raised there
                      propagate out of the constructor.
                      """
                      self.username = username
                      self.password = password
                      self.svn_url = core.svn_path_canonicalize(svn_url)
                      # the auth baton gets a pool of its own, separate from the session pool
                      self.auth_baton_pool = core.Pool()
                      self.auth_baton = _create_auth_baton(self.auth_baton_pool)
                      # self.init_ra_and_client() assumes that a pool already exists
                      self.pool = core.Pool()
                      self.ra = self.init_ra_and_client()
                      self.uuid = ra.get_uuid(self.ra, self.pool)
                  def init_ra_and_client(self):
                      """Initializes the RA and client layers, because sometimes getting
                      unified diffs runs the remote server out of open files.

                      Returns the RA session opened for ``self.svn_url``.

                      Raises ``SubversionConnectionException`` carrying the messages of the
                      whole Subversion error chain when the session cannot be opened.
                      """
                      if self.username:
                          core.svn_auth_set_parameter(self.auth_baton,
                                                      core.SVN_AUTH_PARAM_DEFAULT_USERNAME,
                                                      self.username)
                      if self.password:
                          core.svn_auth_set_parameter(self.auth_baton,
                                                      core.SVN_AUTH_PARAM_DEFAULT_PASSWORD,
                                                      self.password)
                      callbacks = RaCallbacks()
                      callbacks.auth_baton = self.auth_baton
                      try:
                          return ra.open2(self.svn_url, callbacks, svn_config, self.pool)
                      # The bindings raise core.SubversionException, which is unrelated to
                      # the SubversionException class defined in this module; the local
                      # class is still caught to keep the previous behaviour.
                      except (core.SubversionException, SubversionException) as e:
                          # e.child contains a detailed error messages
                          msglist = []
                          svn_exc = e
                          while svn_exc:
                              if svn_exc.args and svn_exc.args[0]:
                                  msglist.append(svn_exc.args[0])
                              # exceptions without a `child` attribute end the chain
                              svn_exc = getattr(svn_exc, 'child', None)
                          msg = '\n'.join(msglist)
                          raise SubversionConnectionException(msg) from e
-             class svnremoterepo(object):
+             class svnremoterepo:
                  """ the dumb wrapper for actual Subversion repositories """
                  def __init__(self, username: bytes = b'', password: bytes = b'', svn_url: bytes = b''):
                      """Store the credentials (falsy values become ``b''``) and the normalized URL."""
                      self.path = normalize_url(svn_url)
                      self.username = username if username else b''
                      self.password = password if password else b''
                  def svn(self):
                      """
                      Open and return a ``SubversionRepo`` for the stored URL and credentials.

                      Connection failures are re-raised as mercurial ``error.Abort`` with the
                      failure message as bytes.
                      """
                      try:
                          return SubversionRepo(self.path, self.username, self.password)
                      except SubversionConnectionException as e:
                          # convert the exception to text first; safe_bytes is meant for
                          # strings, not for exception objects
                          raise error.Abort(safe_bytes(str(e))) from e

vcsserver/pygrack.py

0 +2 -2

              # RhodeCode VCSServer provides access to different vcs backends via network.
              # Copyright (C) 2014-2023 RhodeCode GmbH
              #
              # This program is free software; you can redistribute it and/or modify
              # it under the terms of the GNU General Public License as published by
              # the Free Software Foundation; either version 3 of the License, or
              # (at your option) any later version.
              #
              # This program is distributed in the hope that it will be useful,
              # but WITHOUT ANY WARRANTY; without even the implied warranty of
              # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
              # GNU General Public License for more details.
              #
              # You should have received a copy of the GNU General Public License
              # along with this program; if not, write to the Free Software Foundation,
              # Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301  USA
              """Handles the Git smart protocol."""
              import os
              import socket
              import logging
              import dulwich.protocol
              from dulwich.protocol import CAPABILITY_SIDE_BAND, CAPABILITY_SIDE_BAND_64K
              from webob import Request, Response, exc
              from vcsserver.lib.rc_json import json
              from vcsserver import hooks, subprocessio
              from vcsserver.str_utils import ascii_bytes
              log = logging.getLogger(__name__)
-             class FileWrapper(object):
+             class FileWrapper:
                  """File wrapper that ensures how much data is read from it."""
                  def __init__(self, fd, content_length):
                      self.fd = fd
                      self.content_length = content_length
                      self.remain = content_length
                  def read(self, size):
                      if size <= self.remain:
                          try:
                              data = self.fd.read(size)
                          except socket.error:
                              raise IOError(self)
                          self.remain -= size
                      elif self.remain:
                          data = self.fd.read(self.remain)
                          self.remain = 0
                      else:
                          data = None
                      return data
                  def __repr__(self):
                      return '<FileWrapper {} len: {}, read: {}>'.format(
                          self.fd, self.content_length, self.content_length - self.remain
                      )
-             class GitRepository(object):
+             class GitRepository:
                  """WSGI app for handling Git smart protocol endpoints."""
                  # lower-cased directory entries that must all be present in `content_path`
                  git_folder_signature = frozenset(('config', 'head', 'info', 'objects', 'refs'))
                  # the only git services accepted by inforefs()
                  commands = frozenset(('git-upload-pack', 'git-receive-pack'))
                  # result content types, one per allowed command
                  valid_accepts = frozenset(f'application/x-{c}-result' for c in commands)
                  # The last bytes are the SHA1 of the first 12 bytes.
                  EMPTY_PACK = (
                      b'PACK\x00\x00\x00\x02\x00\x00\x00\x00\x02\x9d\x08' +
                      b'\x82;\xd8\xa8\xea\xb5\x10\xadj\xc7\\\x82<\xfd>\xd3\x1e'
                  )
                  # pkt-line flush packet, appended after the service advertisement
                  FLUSH_PACKET = b"0000"
                  # capabilities checked before side-band messages are written to a client
                  SIDE_BAND_CAPS = frozenset((CAPABILITY_SIDE_BAND, CAPABILITY_SIDE_BAND_64K))
                  def __init__(self, repo_name, content_path, git_path, update_server_info, extras):
                      """
                      Bind the app to the repository stored at ``content_path``.

                      Raises ``OSError`` when the directory lacks one of the entries listed
                      in ``git_folder_signature`` (entry names are compared lower-cased).
                      """
                      entries = frozenset(entry.lower() for entry in os.listdir(content_path))
                      if not self.git_folder_signature.issubset(entries):
                          raise OSError(f'{content_path} missing git signature')
                      self.repo_name = repo_name
                      self.content_path = content_path
                      self.git_path = git_path
                      self.update_server_info = update_server_info
                      self.extras = extras
                  def _get_fixedpath(self, path):
                      """
                      Small fix for repo_path
                      :param path:
                      """
                      path = path.split(self.repo_name, 1)[-1]
                      if path.startswith('.git'):
                          # for bare repos we still get the .git prefix inside, we skip it
                          # here, and remove from the service command
                          path = path[4:]
                      return path.strip('/')
                  def inforefs(self, request, unused_environ):
                      """
                      WSGI Response producer for HTTP GET Git Smart
                      HTTP /info/refs request.

                      Returns ``HTTPForbidden`` for a service that is not in ``commands``
                      and raises ``HTTPExpectationFailed`` when the git process cannot
                      be started.
                      """
                      git_command = request.GET.get('service')
                      if git_command not in self.commands:
                          log.debug('command %s not allowed', git_command)
                          return exc.HTTPForbidden()
                      # please, resist the urge to add '\n' to git capture and increment
                      # line count by 1.
                      # by git docs: Documentation/technical/http-protocol.txt#L214 \n is
                      # a part of protocol.
                      # The code in Git client not only does NOT need '\n', but actually
                      # blows up if you sprinkle "flush" (0000) as "0001\n".
                      # It reads binary, per number of bytes specified.
                      # if you do add '\n' as part of data, count it.
                      server_advert = '# service=%s\n' % git_command
                      # four lower-case hex digits: payload length plus the 4 length digits
                      packet_len = f'{len(server_advert) + 4:04x}'
                      try:
                          gitenv = dict(os.environ)
                          # forget all configs
                          gitenv['RC_SCM_DATA'] = json.dumps(self.extras)
                          # git_command[4:] drops the leading "git-"
                          command = [
                              self.git_path, git_command[4:], '--stateless-rpc',
                              '--advertise-refs', self.content_path,
                          ]
                          advertisement = ascii_bytes(packet_len + server_advert) + self.FLUSH_PACKET
                          out = subprocessio.SubprocessIOChunker(
                              command,
                              env=gitenv,
                              starting_values=[advertisement],
                              shell=False
                          )
                      except OSError:
                          log.exception('Error processing command')
                          raise exc.HTTPExpectationFailed()
                      resp = Response()
                      resp.content_type = f'application/x-{git_command}-advertisement'
                      resp.charset = None
                      resp.app_iter = out
                      return resp
                  def _get_want_capabilities(self, request):
                      """Read the capabilities found in the first want line of the request."""
                      body = request.body_file_seekable
                      # peek at the first line, then restore the stream position
                      saved_position = body.tell()
                      first_line = body.readline()
                      body.seek(saved_position)
                      capabilities = dulwich.protocol.extract_want_line_capabilities(first_line)[1]
                      return frozenset(capabilities)
                  def _build_failed_pre_pull_response(self, capabilities, pre_pull_messages):
                      """
                      Build the response sent when the pre-pull hook rejected the request.

                      The response carries an empty PACK file, as that triggers the failure
                      of the pull or clone command on the client. Clients that negotiated a
                      side-band capability additionally receive the output of the pre-pull
                      hook and a message explaining why the command was aborted. Clients
                      without side-band support only get the empty PACK file.

                      :param capabilities: capabilities announced by the client
                      :param pre_pull_messages: output of the pre-pull hook
                      :return: list of ``bytes`` chunks forming the response body
                      """
                      if not self.SIDE_BAND_CAPS.intersection(capabilities):
                          return [ascii_bytes(self.EMPTY_PACK, allow_bytes=True)]

                      packets = []
                      proto = dulwich.protocol.Protocol(None, packets.append)
                      proto.write_pkt_line(dulwich.protocol.NAK_LINE)
                      hook_output = ascii_bytes(pre_pull_messages, allow_bytes=True)
                      self._write_sideband_to_proto(proto, hook_output, capabilities)
                      # N.B.(skreft): Do not change the sideband channel to 3, as that
                      # produces a fatal error in the client:
                      #   fatal: error in sideband demultiplexer
                      abort_notice = ascii_bytes('Pre pull hook failed: aborting\n', allow_bytes=True)
                      proto.write_sideband(dulwich.protocol.SIDE_BAND_CHANNEL_PROGRESS, abort_notice)
                      empty_pack = ascii_bytes(self.EMPTY_PACK, allow_bytes=True)
                      proto.write_sideband(dulwich.protocol.SIDE_BAND_CHANNEL_DATA, empty_pack)
                      # writes b"0000" as default
                      proto.write_pkt_line(None)
                      return packets
                  def _build_post_pull_response(self, response, capabilities, start_message, end_message):
                      """
                      Given a list response we inject the post-pull messages.
                      We only inject the messages if the client supports sideband, and the
                      response has the format:
 NAK\n...0000
                      Note that we do not check the no-progress capability as by default, git
                      sends it, which effectively would block all messages.
                      """
                      if not self.SIDE_BAND_CAPS.intersection(capabilities):
                          return response
                      if not start_message and not end_message:
                          return response
                      try:
                          iter(response)
                          # iterator probably will work, we continue
                      except TypeError:
                          raise TypeError(f'response must be an iterator: got {type(response)}')
                      if isinstance(response, (list, tuple)):
                          raise TypeError(f'response must be an iterator: got {type(response)}')
                      def injected_response():
                          do_loop = 1
                          header_injected = 0
                          next_item = None
                          has_item = False
                          item = b''
                          while do_loop:
                              try:
                                  next_item = next(response)
                              except StopIteration:
                                  do_loop = 0
                              if has_item:
                                  # last item ! alter it now
                                  if do_loop == 0 and item.endswith(self.FLUSH_PACKET):
                                      new_response = [item[:-4]]
                                      new_response.extend(self._get_messages(end_message, capabilities))
                                      new_response.append(self.FLUSH_PACKET)
                                      item = b''.join(new_response)
                                  yield item
                              has_item = True
                              item = next_item
                              # alter item if it's the initial chunk
                              if not header_injected and item.startswith(b'0008NAK\n'):
                                  new_response = [b'0008NAK\n']
                                  new_response.extend(self._get_messages(start_message, capabilities))
                                  new_response.append(item[8:])
                                  item = b''.join(new_response)
                                  header_injected = 1
                      return injected_response()
                  def _write_sideband_to_proto(self, proto, data, capabilities):
                      """
                      Write the data to the proto's sideband number 2 == SIDE_BAND_CHANNEL_PROGRESS
                      We do not use dulwich's write_sideband directly as it only supports
                      side-band-64k.
                      """
                      if not data:
                          return
                      # N.B.(skreft): The values below are explained in the pack protocol
                      # documentation, section Packfile Data.
                      # https://github.com/git/git/blob/master/Documentation/technical/pack-protocol.txt
                      if CAPABILITY_SIDE_BAND_64K in capabilities:
                          chunk_size = 65515
                      elif CAPABILITY_SIDE_BAND in capabilities:
                          chunk_size = 995
                      else:
                          return
                      chunker = (data[i:i + chunk_size] for i in range(0, len(data), chunk_size))
                      for chunk in chunker:
                          proto.write_sideband(dulwich.protocol.SIDE_BAND_CHANNEL_PROGRESS, ascii_bytes(chunk, allow_bytes=True))
                  def _get_messages(self, data, capabilities):
                      """
                      Encode ``data`` as packets for side-band number 2.

                      :param data: payload to send to the client
                      :param capabilities: capabilities announced by the client
                      :return: list with the packets written by ``_write_sideband_to_proto``
                      """
                      packets = []
                      # the protocol object only collects what gets written to it
                      collector = dulwich.protocol.Protocol(None, packets.append)
                      self._write_sideband_to_proto(collector, data, capabilities)
                      return packets
                  def backend(self, request, environ):
                      """
                      WSGI Response producer for HTTP POST Git Smart HTTP requests.

                      Reads commands and data from HTTP POST's body and runs the matching
                      git command with ``--stateless-rpc`` against ``self.content_path``.
                      For ``git-upload-pack`` the pre-pull hook is called before and the
                      post-pull hook after the command has been started.

                      :param request: request object for the current call
                      :param environ: WSGI environment of the current call
                      :return: ``exc.HTTPForbidden`` when the command is not in
                          ``self.commands``, otherwise a ``Response`` whose ``app_iter``
                          carries the contents of the git command's response to stdout
                      """
                      # TODO(skreft): think how we could detect an HTTPLockedException, as
                      # we probably want to have the same mechanism used by mercurial and
                      # simplevcs.
                      # For that we would need to parse the output of the command looking for
                      # some signs of the HTTPLockedError, parse the data and reraise it in
                      # pygrack. However, that would interfere with the streaming.
                      #
                      # Now the output of a blocked push is:
                      # Pushing to http://test_regular:test12@127.0.0.1:5001/vcs_test_git
                      # POST git-receive-pack (1047 bytes)
                      # remote: ERROR: Repository `vcs_test_git` locked by user `test_admin`. Reason:`lock_auto`
                      # To http://test_regular:test12@127.0.0.1:5001/vcs_test_git
                      # ! [remote rejected] master -> master (pre-receive hook declined)
                      # error: failed to push some refs to 'http://test_regular:test12@127.0.0.1:5001/vcs_test_git'
                      git_command = self._get_fixedpath(request.path_info)
                      if git_command not in self.commands:
                          log.debug('command %s not allowed', git_command)
                          return exc.HTTPForbidden()
                      # capabilities are only read for pulls; they decide below whether
                      # hook messages can be sent to the client over the side-band
                      capabilities = None
                      if git_command == 'git-upload-pack':
                          capabilities = self._get_want_capabilities(request)
                      # NOTE(review): FileWrapper presumably limits reads to content_length
                      # bytes -- confirm against its definition
                      if 'CONTENT_LENGTH' in environ:
                          inputstream = FileWrapper(request.body_file_seekable,
                                                    request.content_length)
                      else:
                          inputstream = request.body_file_seekable
                      resp = Response()
                      resp.content_type = f'application/x-{git_command}-result'
                      resp.charset = None
                      # NOTE: pre_pull_messages is only filled on the failure path below, which
                      # returns early; the post-pull response therefore always receives an
                      # empty start message.
                      pre_pull_messages = ''
                      # Upload-pack == clone
                      if git_command == 'git-upload-pack':
                          hook_response = hooks.git_pre_pull(self.extras)
                          # a non-zero status aborts the pull before git is even started
                          if hook_response.status != 0:
                              pre_pull_messages = hook_response.output
                              resp.app_iter = self._build_failed_pre_pull_response(
                                  capabilities, pre_pull_messages)
                              return resp
                      gitenv = dict(os.environ)
                      # forget all configs
                      gitenv['GIT_CONFIG_NOGLOBAL'] = '1'
                      # hand the call extras over to the git process (and its hooks) as JSON
                      gitenv['RC_SCM_DATA'] = json.dumps(self.extras)
                      # git_command[4:] strips the leading 'git-' to get the sub-command name
                      cmd = [self.git_path, git_command[4:], '--stateless-rpc',
                             self.content_path]
                      log.debug('handling cmd %s', cmd)
                      out = subprocessio.SubprocessIOChunker(
                          cmd,
                          input_stream=inputstream,
                          env=gitenv,
                          cwd=self.content_path,
                          shell=False,
                          fail_on_stderr=False,
                          fail_on_return_code=False
                      )
                      if self.update_server_info and git_command == 'git-receive-pack':
                          # We need to fully consume the iterator here, as the
                          # update-server-info command needs to be run after the push.
                          out = list(out)
                          # Updating refs manually after each push.
                          # This is required as some clients are exposing Git repos internally
                          # with the dumb protocol.
                          cmd = [self.git_path, 'update-server-info']
                          log.debug('handling cmd %s', cmd)
                          # NOTE(review): inputstream was already handed to the receive-pack
                          # command above -- confirm update-server-info does not need it
                          output = subprocessio.SubprocessIOChunker(
                              cmd,
                              input_stream=inputstream,
                              env=gitenv,
                              cwd=self.content_path,
                              shell=False,
                              fail_on_stderr=False,
                              fail_on_return_code=False
                          )
                          # Consume all the output so the subprocess finishes
                          for _ in output:
                              pass
                      # Upload-pack == clone
                      if git_command == 'git-upload-pack':
                          # the post-pull hook is called here, before the response is streamed
                          hook_response = hooks.git_post_pull(self.extras)
                          post_pull_messages = hook_response.output
                          resp.app_iter = self._build_post_pull_response(out, capabilities, pre_pull_messages, post_pull_messages)
                      else:
                          resp.app_iter = out
                      return resp
                  def __call__(self, environ, start_response):
                      """
                      WSGI entry point dispatching the request to the matching handler.

                      Paths starting with ``info/refs`` are handled by ``inforefs``, all
                      others by ``backend``. An HTTP exception raised by the handler is used
                      as the response itself; any other exception is logged and answered
                      with an internal server error.
                      """
                      request = Request(environ)
                      fixed_path = self._get_fixedpath(request.path_info)
                      handler = self.inforefs if fixed_path.startswith('info/refs') else self.backend
                      try:
                          resp = handler(request, environ)
                      except exc.HTTPException as http_error:
                          log.exception('HTTP Error')
                          # webob HTTP exceptions are WSGI applications themselves -- TODO confirm
                          resp = http_error
                      except Exception:
                          log.exception('Unknown error')
                          resp = exc.HTTPInternalServerError()
                      return resp(environ, start_response)

vcsserver/remote/git_remote.py

0 +3 -4

              # RhodeCode VCSServer provides access to different vcs backends via network.
              # Copyright (C) 2014-2023 RhodeCode GmbH
              #
              # This program is free software; you can redistribute it and/or modify
              # it under the terms of the GNU General Public License as published by
              # the Free Software Foundation; either version 3 of the License, or
              # (at your option) any later version.
              #
              # This program is distributed in the hope that it will be useful,
              # but WITHOUT ANY WARRANTY; without even the implied warranty of
              # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
              # GNU General Public License for more details.
              #
              # You should have received a copy of the GNU General Public License
              # along with this program; if not, write to the Free Software Foundation,
              # Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301  USA
              import collections
              import logging
              import os
              import re
              import stat
              import traceback
              import urllib.request
              import urllib.parse
              import urllib.error
              from functools import wraps
              import more_itertools
              import pygit2
              from pygit2 import Repository as LibGit2Repo
              from pygit2 import index as LibGit2Index
              from dulwich import index, objects
              from dulwich.client import HttpGitClient, LocalGitClient, FetchPackResult
              from dulwich.errors import (
                  NotGitRepository, ChecksumMismatch, WrongObjectException,
                  MissingCommitError, ObjectMissing, HangupException,
                  UnexpectedCommandError)
              from dulwich.repo import Repo as DulwichRepo
              from dulwich.server import update_server_info
              from vcsserver import exceptions, settings, subprocessio
              from vcsserver.str_utils import safe_str, safe_int, safe_bytes, ascii_bytes
              from vcsserver.base import RepoFactory, obfuscate_qs, ArchiveNode, store_archive_in_cache, BytesEnvelope, BinaryEnvelope
              from vcsserver.hgcompat import (
                  hg_url as url_parser, httpbasicauthhandler, httpdigestauthhandler)
              from vcsserver.git_lfs.lib import LFSOidStore
              from vcsserver.vcs_base import RemoteBase
              DIR_STAT = stat.S_IFDIR
              FILE_MODE = stat.S_IFMT
              GIT_LINK = objects.S_IFGITLINK
              PEELED_REF_MARKER = b'^{}'
              HEAD_MARKER = b'HEAD'
              log = logging.getLogger(__name__)
              def reraise_safe_exceptions(func):
                  """
                  Decorator converting Dulwich exceptions to something neutral.

                  Lookup related Dulwich errors are re-raised as ``LookupException`` and
                  protocol errors as ``VcsException``; the original exception is handed
                  over as ``org_exc``. Every other exception propagates unchanged.
                  """
                  @wraps(func)
                  def wrapper(*args, **kwargs):
                      try:
                          return func(*args, **kwargs)
                      except (ChecksumMismatch, WrongObjectException, MissingCommitError, ObjectMissing) as lookup_error:
                          raise exceptions.LookupException(org_exc=lookup_error)(safe_str(lookup_error))
                      except (HangupException, UnexpectedCommandError) as protocol_error:
                          raise exceptions.VcsException(org_exc=protocol_error)(safe_str(protocol_error))
                      # NOTE(marcink): there is deliberately no catch-all conversion here.
                      # Because of how dulwich handles some exceptions (KeyError on empty
                      # repos), we cannot track this and catch all exceptions, so anything
                      # else is left to propagate as it is.
                  return wrapper
              class Repo(DulwichRepo):
                  """
                  Dulwich Repo that closes itself once the object is destroyed.

                  Dulwich sometimes keeps .idx file descriptors open, which leads to the
                  "Too many open files" error. All opened file descriptors therefore get
                  closed when the repo object goes away.
                  """
                  def __del__(self):
                      # presumably ``object_store`` is missing when the instance was never
                      # fully initialised; there is nothing to close in that case
                      if not hasattr(self, 'object_store'):
                          return
                      self.close()
              class Repository(LibGit2Repo):
                  """libgit2 repository usable as a context manager that frees itself on exit."""
                  def __enter__(self):
                      # the repository object itself is what the ``with`` block works on
                      return self
                  def __exit__(self, exc_type, exc_val, exc_tb):
                      # nothing is returned, so an exception raised inside the ``with``
                      # block keeps propagating after the repository has been freed
                      self.free()
              class GitFactory(RepoFactory):
                  """Factory handing out Git repository objects, backed by dulwich or libgit2."""
                  repo_type = 'git'

                  def _create_repo(self, wire, create, use_libgit2=False):
                      """
                      Open the repository stored under ``wire['path']``.

                      :param wire: mapping holding at least the repository ``path``
                      :param create: part of the factory interface, not used by this method
                      :param use_libgit2: open the repository with libgit2 instead of dulwich
                      :return: ``Repository`` (libgit2) or ``Repo`` (dulwich) instance
                      """
                      if not use_libgit2:
                          # dulwich mode
                          repo = Repo(safe_str(wire['path'], to_encoding=settings.WIRE_ENCODING))
                      else:
                          repo = Repository(safe_bytes(wire['path']))
                      log.debug('repository created: got GIT object: %s', repo)
                      return repo

                  def repo(self, wire, create=False, use_libgit2=False):
                      """
                      Get a repository instance for the given path.

                      A new object is created on every call.
                      """
                      return self._create_repo(wire, create, use_libgit2)

                  def repo_libgit2(self, wire):
                      """Get a libgit2 backed repository instance for the given path."""
                      return self.repo(wire, use_libgit2=True)
              def create_signature_from_string(author_str, **kwargs):
                  """
                  Build a pygit2.Signature from an author string.

                  :param author_str: String of the format 'Name <email>'
                  :param kwargs: extra keyword arguments passed on to pygit2.Signature
                  :return: pygit2.Signature object
                  :raises ValueError: if ``author_str`` does not have the expected format
                  """
                  parsed = re.match(r'^(.+) <(.+)>$', author_str)
                  if not parsed:
                      raise ValueError(f"Invalid format: {author_str}")
                  # the two groups are the name and the email, in that order
                  return pygit2.Signature(*parsed.groups(), **kwargs)
              def get_obfuscated_url(url_obj):
                  """
                  Return the string form of ``url_obj`` with its secrets hidden.

                  The password, when set, is replaced by ``*****`` and the query string
                  is passed through ``obfuscate_qs``. Note that ``url_obj`` itself is
                  modified in place.
                  """
                  current_passwd = url_obj.passwd
                  url_obj.passwd = b'*****' if current_passwd else current_passwd
                  url_obj.query = obfuscate_qs(url_obj.query)
                  return str(url_obj)
              class GitRemote(RemoteBase):
                  def __init__(self, factory):
                      self._factory = factory
                      self._bulk_methods = {
                          "date": self.date,
                          "author": self.author,
                          "branch": self.branch,
                          "message": self.message,
                          "parents": self.parents,
                          "_commit": self.revision,
                      }
                      self._bulk_file_methods = {
                          "size": self.get_node_size,
                          "data": self.get_node_data,
                          "flags": self.get_node_flags,
                          "is_binary": self.get_node_is_binary,
                          "md5": self.md5_hash
                      }
                  def _wire_to_config(self, wire):
                      if 'config' in wire:
                          return {x[0] + '_' + x[1]: x[2] for x in wire['config']}
                      return {}
                  def _remote_conf(self, config):
                      params = [
                          '-c', 'core.askpass=""',
                      ]
                      ssl_cert_dir = config.get('vcs_ssl_dir')
                      if ssl_cert_dir:
                          params.extend(['-c', f'http.sslCAinfo={ssl_cert_dir}'])
                      return params
                  @reraise_safe_exceptions
                  def discover_git_version(self):
                      """
                      Return the version reported by ``git --version`` as a string.

                      The leading ``git version`` marker is dropped when present and the
                      remainder is stripped of surrounding whitespace.
                      """
                      marker = b'git version'
                      output, _ = self.run_git_command(
                          {}, ['--version'], _bare=True, _safe=True)
                      version = output[len(marker):] if output.startswith(marker) else output
                      return safe_str(version.strip())
                  @reraise_safe_exceptions
                  def is_empty(self, wire):
                      """
                      Tell whether the repository is empty.

                      A repository whose HEAD has a name counts as non-empty right away;
                      otherwise the repository's own ``is_empty`` check decides. Any error
                      raised while inspecting the repository is treated as "empty".
                      """
                      with self._factory.repo_libgit2(wire) as repo:
                          try:
                              if repo.head.name:
                                  return False
                              # NOTE(marcink): check again using more expensive method
                              return repo.is_empty
                          except Exception:
                              # best effort on purpose; presumably HEAD cannot be resolved
                              # on a repository without commits -- TODO confirm
                              return True
                  @reraise_safe_exceptions
                  def assert_correct_path(self, wire):
                      """
                      Check that ``wire['path']`` points to a Git repository.

                      The check is always run in its fast form, which asks
                      ``pygit2.discover_repository`` about the path. The result goes through
                      the conditional cache of the region.

                      :return: True when a repository was found, False otherwise
                      """
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)

                      # NOTE(review): name and signature of the cached function are kept as
                      # they are, since they may be part of the generated cache key -- confirm
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _assert_correct_path(_context_uid, _repo_id, fast_check):
                          if fast_check:
                              return bool(pygit2.discover_repository(safe_str(wire['path'])))

                          # slow check: actually open the repository
                          try:
                              with self._factory.repo_libgit2(wire):
                                  pass
                          except pygit2.GitError:
                              log.debug(
                                  "Invalid Git path `%s`, tb: %s",
                                  wire.get('path'), traceback.format_exc())
                              return False
                          return True

                      return _assert_correct_path(context_uid, repo_id, True)
                  @reraise_safe_exceptions
                  def bare(self, wire):
                      """Return the ``is_bare`` flag of the repository behind ``wire``."""
                      with self._factory.repo_libgit2(wire) as repo:
                          return repo.is_bare
                  @reraise_safe_exceptions
                  def get_node_data(self, wire, commit_id, path):
                      """
                      Return the content of the blob found at ``path`` in ``commit_id``.

                      :return: the blob data wrapped in a ``BytesEnvelope``
                      :raises LookupException: if the object at ``path`` is not a blob
                      """
                      with self._factory.repo_libgit2(wire) as repo:
                          node = repo[commit_id].tree[path]
                          if node.type == pygit2.GIT_OBJ_BLOB:
                              return BytesEnvelope(node.data)
                          raise exceptions.LookupException()(
                              f'Tree for commit_id:{commit_id} is not a blob: {node.type_str}')
                  @reraise_safe_exceptions
                  def get_node_size(self, wire, commit_id, path):
                      """
                      Return the size of the blob found at ``path`` in ``commit_id``.

                      :raises LookupException: if the object at ``path`` is not a blob
                      """
                      with self._factory.repo_libgit2(wire) as repo:
                          node = repo[commit_id].tree[path]
                          if node.type == pygit2.GIT_OBJ_BLOB:
                              return node.size
                          raise exceptions.LookupException()(
                              f'Tree for commit_id:{commit_id} is not a blob: {node.type_str}')
                  @reraise_safe_exceptions
                  def get_node_flags(self, wire, commit_id, path):
                      """
                      Return the file mode of the blob found at ``path`` in ``commit_id``.

                      :raises LookupException: if the object at ``path`` is not a blob
                      """
                      with self._factory.repo_libgit2(wire) as repo:
                          node = repo[commit_id].tree[path]
                          if node.type == pygit2.GIT_OBJ_BLOB:
                              return node.filemode
                          raise exceptions.LookupException()(
                              f'Tree for commit_id:{commit_id} is not a blob: {node.type_str}')
                  @reraise_safe_exceptions
                  def get_node_is_binary(self, wire, commit_id, path):
                      """
                      Return the ``is_binary`` flag of the blob found at ``path`` in ``commit_id``.

                      :raises LookupException: if the object at ``path`` is not a blob
                      """
                      with self._factory.repo_libgit2(wire) as repo:
                          node = repo[commit_id].tree[path]
                          if node.type == pygit2.GIT_OBJ_BLOB:
                              return node.is_binary
                          raise exceptions.LookupException()(
                              f'Tree for commit_id:{commit_id} is not a blob: {node.type_str}')
                  @reraise_safe_exceptions
                  def blob_as_pretty_string(self, wire, sha):
                      """Return the data of the object stored under ``sha``, wrapped in a ``BytesEnvelope``."""
                      with self._factory.repo_libgit2(wire) as repo:
                          return BytesEnvelope(repo[sha].data)
                  @reraise_safe_exceptions
                  def blob_raw_length(self, wire, sha):
                      """
                      Return the size of the object stored under ``sha``.

                      The lookup goes through the conditional cache of the region.
                      """
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)

                      # NOTE(review): name and signature of the cached function are kept as
                      # they are, since they may be part of the generated cache key -- confirm
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _blob_raw_length(_repo_id, _sha):
                          with self._factory.repo_libgit2(wire) as repo:
                              return repo[sha].size

                      return _blob_raw_length(repo_id, sha)
                  def _parse_lfs_pointer(self, raw_content):
                      spec_string = b'version https://git-lfs.github.com/spec'
                      if raw_content and raw_content.startswith(spec_string):
                          pattern = re.compile(rb"""
                          (?:\n)?
                          ^version[ ]https://git-lfs\.github\.com/spec/(?P<spec_ver>v\d+)\n
                          ^oid[ ] sha256:(?P<oid_hash>[0-9a-f]{64})\n
                          ^size[ ](?P<oid_size>[0-9]+)\n
                          (?:\n)?
                          """, re.VERBOSE | re.MULTILINE)
                          match = pattern.match(raw_content)
                          if match:
                              return match.groupdict()
                      return {}
                  @reraise_safe_exceptions
                  def is_large_file(self, wire, commit_id):
                      """
                      Return the LFS pointer data of the object stored under ``commit_id``.

                      :return: parsed pointer data, or an empty dictionary when the object is
                          binary or is not an LFS pointer
                      """
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)

                      # NOTE(review): name and signature of the cached function are kept as
                      # they are, since they may be part of the generated cache key -- confirm
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _is_large_file(_repo_id, _sha):
                          with self._factory.repo_libgit2(wire) as repo:
                              blob = repo[commit_id]
                              return {} if blob.is_binary else self._parse_lfs_pointer(blob.data)

                      return _is_large_file(repo_id, commit_id)
                  @reraise_safe_exceptions
                  def is_binary(self, wire, tree_id):
                      """
                      Return the ``is_binary`` flag of the object stored under ``tree_id``.

                      The lookup goes through the conditional cache of the region.
                      """
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)

                      # NOTE(review): name and signature of the cached function are kept as
                      # they are, since they may be part of the generated cache key -- confirm
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _is_binary(_repo_id, _tree_id):
                          with self._factory.repo_libgit2(wire) as repo:
                              return repo[tree_id].is_binary

                      return _is_binary(repo_id, tree_id)
                  @reraise_safe_exceptions
                  def md5_hash(self, wire, commit_id, path):
                      """
                      Return the md5 value for the blob found at ``path`` in ``commit_id``.

                      NOTE(review): no hash is computed, an empty string is returned for
                      every blob -- looks like a placeholder, confirm with the callers.

                      :raises LookupException: if the object at ``path`` is not a blob
                      """
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)

                      # NOTE(review): name and signature of the cached function are kept as
                      # they are, since they may be part of the generated cache key -- confirm
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _md5_hash(_repo_id, _commit_id, _path):
                          with self._factory.repo_libgit2(wire) as repo:
                              node = repo[_commit_id].tree[_path]
                              if node.type == pygit2.GIT_OBJ_BLOB:
                                  return ''
                              raise exceptions.LookupException()(
                                  f'Tree for commit_id:{_commit_id} is not a blob: {node.type_str}')

                      return _md5_hash(repo_id, commit_id, path)
                  @reraise_safe_exceptions
                  def in_largefiles_store(self, wire, oid):
                      """
                      Tell whether ``oid`` is present in the LFS store of the repository.

                      :return: result of ``LFSOidStore.has_oid()``, or False when no
                          ``vcs_git_lfs_store_location`` is configured
                      """
                      conf = self._wire_to_config(wire)
                      with self._factory.repo_libgit2(wire) as repo:
                          repo_name = repo.path

                      store_location = conf.get('vcs_git_lfs_store_location')
                      if not store_location:
                          return False
                      return LFSOidStore(
                          oid=oid, repo=repo_name, store_location=store_location).has_oid()
                  @reraise_safe_exceptions
                  def store_path(self, wire, oid):
                      """
                      Return the path under which ``oid`` is kept in the LFS store.

                      :return: ``oid_path`` of the ``LFSOidStore`` built for ``oid``
                      :raises ValueError: when no ``vcs_git_lfs_store_location`` is configured
                      """
                      conf = self._wire_to_config(wire)
                      with self._factory.repo_libgit2(wire) as repo:
                          repo_name = repo.path

                      store_location = conf.get('vcs_git_lfs_store_location')
                      if not store_location:
                          raise ValueError(f'Unable to fetch oid with path {oid}')
                      return LFSOidStore(
                          oid=oid, repo=repo_name, store_location=store_location).oid_path
                  @reraise_safe_exceptions
                  def bulk_request(self, wire, rev, pre_load):
                      """
                      Collect several commit attributes of ``rev`` in one call.

                      :param wire: call context; its ``cache`` entry is set to False
                      :param rev: commit to read the attributes from
                      :param pre_load: names of the attributes, keys of ``self._bulk_methods``
                      :return: dictionary mapping each requested attribute to its value
                      :raises VcsException: on a KeyError, reported as unknown bulk attribute
                      """
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)

                      # NOTE(review): name and signature of the cached function are kept as
                      # they are, since they may be part of the generated cache key -- confirm
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _bulk_request(_repo_id, _rev, _pre_load):
                          collected = {}
                          for attr in pre_load:
                              # NOTE(review): a KeyError raised inside the attribute method is
                              # reported as an unknown attribute as well
                              try:
                                  getter = self._bulk_methods[attr]
                                  # disable cache for bulk calls so we don't double cache
                                  wire['cache'] = False
                                  collected[attr] = getter(wire, rev)
                              except KeyError as missing:
                                  raise exceptions.VcsException(missing)(f"Unknown bulk attribute: {attr}")
                          return collected

                      return _bulk_request(repo_id, rev, sorted(pre_load))
                  @reraise_safe_exceptions
                  def bulk_file_request(self, wire, commit_id, path, pre_load):
                      """
                      Collect several attributes of the file `path` at `commit_id` in one call.

                      Every name in `pre_load` is looked up in `self._bulk_file_methods` and
                      called with `(wire, commit_id, path)`. The resulting dict is returned
                      wrapped in a `BinaryEnvelope`. A `KeyError` raised by the lookup or by
                      the called method is re-raised as a `VcsException`.
                      """
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _bulk_file_request(_repo_id, _commit_id, _path, _pre_load):
                          collected = {}
                          for attr in pre_load:
                              try:
                                  handler = self._bulk_file_methods[attr]
                                  # disable cache for bulk calls so we don't double cache
                                  wire.update({'cache': False})
                                  collected[attr] = handler(wire, _commit_id, _path)
                              except KeyError as e:
                                  raise exceptions.VcsException(e)(f'Unknown bulk attribute: "{attr}"')
                          return collected
                      payload = _bulk_file_request(repo_id, commit_id, path, sorted(pre_load))
                      return BinaryEnvelope(payload)
                  def _build_opener(self, url: str):
                      """
                      Build a urllib opener for `url`.

                      When the parsed url carries auth info, basic and digest auth handlers
                      sharing one password manager are installed; otherwise a plain opener
                      without extra handlers is returned.
                      """
                      parsed_url = url_parser(safe_bytes(url))
                      credentials = parsed_url.authinfo()[1]
                      if not credentials:
                          return urllib.request.build_opener()
                      # create a password manager
                      password_manager = urllib.request.HTTPPasswordMgrWithDefaultRealm()
                      password_manager.add_password(*credentials)
                      auth_handlers = [
                          httpbasicauthhandler(password_manager),
                          httpdigestauthhandler(password_manager),
                      ]
                      return urllib.request.build_opener(*auth_handlers)
                  @reraise_safe_exceptions
                  def check_url(self, url, config):
                      """
                      Verify that `url` answers like a Git repository over HTTP.

                      Requests `<url>/info/refs?service=git-upload-pack` and inspects the body:
                      either the smart-protocol service announcement or an old-style listing of
                      `<40 hex chars> refs...` is accepted.

                      :param url: remote url, may carry credentials
                      :param config: not used by this method
                      :return: ``True`` when the remote looks like a Git repository
                      :raises: `exceptions.URLError` when the url cannot be opened, does not
                          answer with code 200, or the response does not look like Git data
                      """
                      url_obj = url_parser(safe_bytes(url))
                      test_uri = safe_str(url_obj.authinfo()[0])
                      # only the obfuscated form is ever logged or put into error messages
                      obfuscated_uri = get_obfuscated_url(url_obj)
                      log.info("Checking URL for remote cloning/import: %s", obfuscated_uri)
                      if not test_uri.endswith('info/refs'):
                          test_uri = test_uri.rstrip('/') + '/info/refs'
                      o = self._build_opener(test_uri)
                      o.addheaders = [('User-Agent', 'git/1.7.8.0')]  # fake some git
                      q = {"service": 'git-upload-pack'}
                      qs = f'?{urllib.parse.urlencode(q)}'
                      cu = f"{test_uri}{qs}"
                      req = urllib.request.Request(cu, None, {})
                      try:
                          log.debug("Trying to open URL %s", obfuscated_uri)
                          resp = o.open(req)
                          if resp.code != 200:
                              # caught by the handler below and re-wrapped with the obfuscated url
                              raise exceptions.URLError()('Return Code is not 200')
                      except Exception as e:
                          log.warning("URL cannot be opened: %s", obfuscated_uri, exc_info=True)
                          # means it cannot be cloned
                          raise exceptions.URLError(e)(f"[{obfuscated_uri}] org_exc: {e}")
                      # now detect if it's proper git repo
                      gitdata: bytes = resp.read()
                      if b'service=git-upload-pack' in gitdata:
                          pass
                      elif re.findall(br'[0-9a-fA-F]{40}\s+refs', gitdata):
                          # old style git can return some other format !
                          pass
                      else:
                          e = None
                          # this is the Git backend, so report a git (not hg) mismatch
                          raise exceptions.URLError(e)(
                              f"url [{obfuscated_uri}] does not look like a git repo org_exc: {e}")
                      return True
                  @reraise_safe_exceptions
                  def clone(self, wire, url, deferred, valid_refs, update_after_clone):
                      """
                      Pull from `url` without applying refs, then copy selected refs into the repo.

                      Only refs starting with one of `valid_refs` and not ending with `deferred`
                      are copied. With `update_after_clone` HEAD is set to the remote HEAD and
                      the index is rebuilt from its tree.
                      """
                      # TODO(marcink): deprecate this method. Last i checked we don't use it anymore
                      remote_refs = self.pull(wire, url, apply_refs=False)
                      repo = self._factory.repo(wire)
                      # startswith() takes a tuple of prefixes, not a list
                      ref_prefixes = tuple(valid_refs) if isinstance(valid_refs, list) else valid_refs
                      for ref_name in remote_refs:
                          # only parse heads/tags and skip so called deferred tags
                          if not ref_name.startswith(ref_prefixes):
                              continue
                          if ref_name.endswith(deferred):
                              continue
                          repo[ref_name] = remote_refs[ref_name]
                      if not update_after_clone:
                          return
                      # we want to checkout HEAD
                      repo["HEAD"] = remote_refs["HEAD"]
                      index.build_index_from_tree(
                          repo.path, repo.index_path(), repo.object_store, repo["HEAD"].tree)
                  @reraise_safe_exceptions
                  def branch(self, wire, commit_id):
                      """
                      Return the short names of all `refs/heads` refs that point at `commit_id`.
                      """
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _branch(_context_uid, _repo_id, _commit_id):
                          heads_re = re.compile('^refs/heads')
                          return [
                              ref_name.split('refs/heads/')[-1]
                              for ref_name, ref_sha in self.get_refs(wire).items()
                              if heads_re.match(ref_name) and ref_sha == _commit_id
                          ]
                      return _branch(context_uid, repo_id, commit_id)
                  @reraise_safe_exceptions
                  def commit_branches(self, wire, commit_id):
                      """
                      Return a list of the branches yielded by `repo.branches.with_commit(commit_id)`.
                      """
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _commit_branches(_context_uid, _repo_id, _commit_id):
                          with self._factory.repo_libgit2(wire) as repo:
                              return list(repo.branches.with_commit(_commit_id))
                      return _commit_branches(context_uid, repo_id, commit_id)
                  @reraise_safe_exceptions
                  def add_object(self, wire, content):
                      """
                      Store `content` as a new blob in the repository object store and return its id.
                      """
                      with self._factory.repo_libgit2(wire) as repo:
                          new_blob = objects.Blob()
                          new_blob.set_raw_string(content)
                          # NOTE(review): relies on the repo object exposing `object_store` - confirm
                          repo.object_store.add_object(new_blob)
                          return new_blob.id
                  @reraise_safe_exceptions
                  def create_commit(self, wire, author, committer, message, branch, new_tree_id, date_args: list[int, int] = None):
                      """
                      Create a commit for `new_tree_id` and update `refs/heads/<branch>` to it.

                      :param author: author string handed to `create_signature_from_string`
                      :param committer: committer string handed to `create_signature_from_string`
                      :param message: the commit message
                      :param branch: short branch name; the updated reference is `refs/heads/<branch>`
                      :param new_tree_id: tree for the commit; a bytes/str value is resolved
                          through the repo first, which also validates that it exists
                      :param date_args: optional `[time, offset]` pair forwarded to both signatures
                      :return: id of the created commit as a string
                      """
                      repo_init = self._factory.repo_libgit2(wire)
                      with repo_init as repo:
                          # start with empty kwargs: without `date_args` (the default) `kw` would
                          # otherwise be unbound when the signatures are created below
                          kw = {}
                          if date_args:
                              current_time, offset = date_args
                              kw = {
                                  'time': current_time,
                                  'offset': offset
                              }
                          author = create_signature_from_string(author, **kw)
                          committer = create_signature_from_string(committer, **kw)
                          tree = new_tree_id
                          if isinstance(tree, (bytes, str)):
                              # validate this tree is in the repo...
                              tree = repo[safe_str(tree)].id
                          parents = []
                          # ensure we COMMIT on top of given branch head
                          # check if this repo has ANY branches, otherwise it's a new branch case we need to make
                          if branch in repo.branches.local:
                              parents += [repo.branches[branch].target]
                          elif list(repo.branches.local):
                              # branch is new but the repo is not empty: commit on top of HEAD
                              parents += [repo.head.target]
                          # no local branches at all: the commit is created without parents
                          commit_oid = repo.create_commit(
                              f'refs/heads/{branch}',  # the name of the reference to update
                              author,  # the author of the commit
                              committer,  # the committer of the commit
                              message,  # the commit message
                              tree,  # the tree produced by the index
                              parents  # list of parents for the new commit, usually just one,
                          )
                          new_commit_id = safe_str(commit_oid)
                          return new_commit_id
                  @reraise_safe_exceptions
                  def commit(self, wire, commit_data, branch, commit_tree, updated, removed):
                      """
                      Apply file changes to the index, write a tree and commit it on `branch`.

                      :param commit_data: dict with 'author', 'committer', 'message',
                          'commit_time' and 'commit_timezone'
                      :param branch: short branch name to commit on
                      :param commit_tree: overwritten with the tree written from the index
                      :param updated: iterable of dicts with 'path', 'content' and 'mode'
                      :param removed: iterable of paths to drop from the index
                      :return: id of the new commit
                      """
                      def mode2pygit(mode):
                          """
                          git only supports two filemode 644 and 755
                          0o100755 -> 33261
                          0o100644 -> 33188
                          """
                          # unknown or missing modes fall back to a regular blob
                          return {
                              0o100644: pygit2.GIT_FILEMODE_BLOB,
                              0o100755: pygit2.GIT_FILEMODE_BLOB_EXECUTABLE,
                              0o120000: pygit2.GIT_FILEMODE_LINK
                          }.get(mode) or pygit2.GIT_FILEMODE_BLOB
                      repo_init = self._factory.repo_libgit2(wire)
                      with repo_init as repo:
                          repo_index = repo.index
                          for pathspec in updated:
                              blob_id = repo.create_blob(pathspec['content'])
                              ie = pygit2.IndexEntry(pathspec['path'], blob_id, mode2pygit(pathspec['mode']))
                              repo_index.add(ie)
                          for pathspec in removed:
                              repo_index.remove(pathspec)
                          # Write changes to the index
                          repo_index.write()
                          # Create a tree from the updated index
                          commit_tree = repo_index.write_tree()
                      new_tree_id = commit_tree
                      author = commit_data['author']
                      committer = commit_data['committer']
                      message = commit_data['message']
                      date_args = [int(commit_data['commit_time']), int(commit_data['commit_timezone'])]
                      new_commit_id = self.create_commit(wire, author, committer, message, branch,
                                                         new_tree_id, date_args=date_args)
                      # libgit2, ensure the branch is there and exists
                      self.create_branch(wire, branch, new_commit_id)
                      # libgit2, set new ref to this created commit
                      self.set_refs(wire, f'refs/heads/{branch}', new_commit_id)
                      return new_commit_id
                  @reraise_safe_exceptions
                  def pull(self, wire, url, apply_refs=True, refs=None, update_after=False):
                      """
                      Fetch from `url` into the repository described by `wire`.

                      A `url` other than 'default' that contains no '://' is fetched with
                      `LocalGitClient`; anything else goes through `HttpGitClient` using the
                      opener from `_build_opener`.

                      :param apply_refs: when true, every returned ref except peeled ones is
                          written into the local repo
                      :param refs: optional list of ref names; limits what is fetched and returned
                      :param update_after: when true, HEAD is set to the remote HEAD and the
                          index is rebuilt from its tree
                      :return: the remote refs (`.refs` when the result is a `FetchPackResult`)
                      :raises: `exceptions.AbortException` when the remote is not a Git repository
                      """
                      if url != 'default' and '://' not in url:
                          client = LocalGitClient(url)
                      else:
                          url_obj = url_parser(safe_bytes(url))
                          o = self._build_opener(url)
                          # from here on `url` is the first element of authinfo()
                          url = url_obj.authinfo()[0]
                          client = HttpGitClient(base_url=url, opener=o)
                      repo = self._factory.repo(wire)
                      # default: want everything the remote offers
                      determine_wants = repo.object_store.determine_wants_all
                      if refs:
                          refs = [ascii_bytes(x) for x in refs]
                          def determine_wants_requested(remote_refs):
                              # collect the hashes of only those remote refs that were requested
                              determined = []
                              for ref_name, ref_hash in remote_refs.items():
                                  bytes_ref_name = safe_bytes(ref_name)
                                  if bytes_ref_name in refs:
                                      bytes_ref_hash = safe_bytes(ref_hash)
                                      determined.append(bytes_ref_hash)
                              return determined
                          # swap with our custom requested wants
                          determine_wants = determine_wants_requested
                      try:
                          remote_refs = client.fetch(
                              path=url, target=repo, determine_wants=determine_wants)
                      except NotGitRepository as e:
                          log.warning(
                              'Trying to fetch from "%s" failed, not a Git repository.', url)
                          # Exception can contain unicode which we convert
                          raise exceptions.AbortException(e)(repr(e))
                      # mikhail: client.fetch() returns all the remote refs, but fetches only
                      # refs filtered by `determine_wants` function. We need to filter result
                      # as well
                      if refs:
                          remote_refs = {k: remote_refs[k] for k in remote_refs if k in refs}
                      if apply_refs:
                          # TODO: johbo: Needs proper test coverage with a git repository
                          # that contains a tag object, so that we would end up with
                          # a peeled ref at this point.
                          for k in remote_refs:
                              if k.endswith(PEELED_REF_MARKER):
                                  log.debug("Skipping peeled reference %s", k)
                                  continue
                              repo[k] = remote_refs[k]
                          if refs and not update_after:
                              # mikhail: explicitly set the head to the last ref.
                              repo[HEAD_MARKER] = remote_refs[refs[-1]]
                      if update_after:
                          # we want to check out HEAD
                          repo[HEAD_MARKER] = remote_refs[HEAD_MARKER]
                          index.build_index_from_tree(repo.path, repo.index_path(),
                                                      repo.object_store, repo[HEAD_MARKER].tree)
                      # unwrap the result object unless it was already replaced by the filtered dict
                      if isinstance(remote_refs, FetchPackResult):
                          return remote_refs.refs
                      return remote_refs
                  @reraise_safe_exceptions
                  def sync_fetch(self, wire, url, refs=None, all_refs=False):
                      """
                      List the refs of `url` with `git ls-remote` and fetch them in chunks.

                      :param refs: optional value or list; when given only refs whose sha is in
                          `refs` are fetched
                      :param all_refs: when false, `ls-remote` is limited to heads and tags
                      :return: ordered mapping of remote ref name to sha, with peeled refs
                          and HEAD left out
                      """
                      self._factory.repo(wire)
                      if refs and not isinstance(refs, (list, tuple)):
                          refs = [refs]
                      config = self._wire_to_config(wire)
                      # get all remote refs we'll use to fetch later
                      ls_remote_cmd = ['ls-remote']
                      if not all_refs:
                          ls_remote_cmd.extend(['--heads', '--tags'])
                      ls_remote_cmd.append(url)
                      output, __ = self.run_git_command(
                          wire, ls_remote_cmd, fail_on_stderr=False,
                          _copts=self._remote_conf(config),
                          extra_env={'GIT_TERMINAL_PROMPT': '0'})
                      remote_refs = collections.OrderedDict()
                      fetch_refs = []
                      for ref_line in output.splitlines():
                          sha, ref = ref_line.split(b'\t')
                          sha = sha.strip()
                          if ref in remote_refs:
                              # duplicate, skip
                              continue
                          if ref.endswith(PEELED_REF_MARKER):
                              log.debug("Skipping peeled reference %s", ref)
                              continue
                          # don't sync HEAD
                          if ref in [HEAD_MARKER]:
                              continue
                          remote_refs[ref] = sha
                          # without a filter every ref is fetched, otherwise only matching shas
                          if not refs or sha in refs:
                              ref_name = safe_str(ref)
                              fetch_refs.append(f'{ref_name}:{ref_name}')
                      log.debug('Finished obtaining fetch refs, total: %s', len(fetch_refs))
                      if fetch_refs:
                          for chunk in more_itertools.chunked(fetch_refs, 1024 * 4):
                              batch = list(chunk)
                              log.debug('Fetching %s refs from import url', len(batch))
                              fetch_cmd = ['fetch', url, '--force', '--prune', '--', *batch]
                              self.run_git_command(
                                  wire, fetch_cmd,
                                  fail_on_stderr=False,
                                  _copts=self._remote_conf(config),
                                  extra_env={'GIT_TERMINAL_PROMPT': '0'})
                      return remote_refs
                  @reraise_safe_exceptions
                  def sync_push(self, wire, url, refs=None):
                      """
                      Mirror-push the repository to `url` after `check_url` accepted it.

                      `refs` is not used by this method.
                      """
                      if not self.check_url(url, wire):
                          return
                      config = self._wire_to_config(wire)
                      self._factory.repo(wire)
                      push_cmd = ['push', url, '--mirror']
                      self.run_git_command(
                          wire, push_cmd, fail_on_stderr=False,
                          _copts=self._remote_conf(config),
                          extra_env={'GIT_TERMINAL_PROMPT': '0'})
                  @reraise_safe_exceptions
                  def get_remote_refs(self, wire, url):
                      """
                      Open `url` with `Repo` and return its refs; `wire` is not used.
                      """
                      return Repo(url).get_refs()
                  @reraise_safe_exceptions
                  def get_description(self, wire):
                      """
                      Return the description of the repository referenced by `wire`.
                      """
                      return self._factory.repo(wire).get_description()
                  @reraise_safe_exceptions
                  def get_missing_revs(self, wire, rev1, rev2, path2):
                      """
                      Return commit ids reachable from `rev2` but not from `rev1` in the repo at `path2`.

                      The repository at `path2` is first fetched into the repo of `wire`.
                      """
                      repo = self._factory.repo(wire)
                      LocalGitClient(thin_packs=False).fetch(path2, repo)
                      # same wire, but pointing at the second repository
                      wire_remote = wire.copy()
                      wire_remote['path'] = path2
                      repo_remote = self._factory.repo(wire_remote)
                      LocalGitClient(thin_packs=False).fetch(path2, repo_remote)
                      walker = repo_remote.get_walker(
                          include=[safe_bytes(rev2)], exclude=[safe_bytes(rev1)])
                      missing = []
                      for entry in walker:
                          missing.append(entry.commit.id)
                      return missing
                  @reraise_safe_exceptions
                  def get_object(self, wire, sha, maybe_unreachable=False):
                      """
                      Resolve `sha` through `revparse_single` and describe the resulting object.

                      Tags are dereferenced to their target. The object must be contained in at
                      least one branch, otherwise it is reported as missing. That check is
                      skipped for tags, when `maybe_unreachable` is set, or when `sha` differs
                      from the object's own hex id (i.e. a reference was given).

                      :return: dict with 'id', 'type', 'commit_id' and 'idx' (always 0)
                      :raises: `exceptions.LookupException` when `sha` cannot be resolved or the
                          commit is dangling
                      """
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      # NOTE(review): `maybe_unreachable` is read from the closure and is not one of
                      # the cached function's arguments
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _get_object(_context_uid, _repo_id, _sha):
                          repo_init = self._factory.repo_libgit2(wire)
                          with repo_init as repo:
                              missing_commit_err = 'Commit {} does not exist for `{}`'.format(sha, wire['path'])
                              try:
                                  commit = repo.revparse_single(sha)
                              except KeyError:
                                  # NOTE(marcink): KeyError doesn't give us any meaningful information
                                  # here, we instead give something more explicit
                                  e = exceptions.RefNotFoundException('SHA: %s not found', sha)
                                  raise exceptions.LookupException(e)(missing_commit_err)
                              except ValueError as e:
                                  raise exceptions.LookupException(e)(missing_commit_err)
                              is_tag = False
                              if isinstance(commit, pygit2.Tag):
                                  # work on the object the tag points to
                                  commit = repo.get(commit.target)
                                  is_tag = True
                              check_dangling = True
                              if is_tag:
                                  check_dangling = False
                              if check_dangling and maybe_unreachable:
                                  check_dangling = False
                              # we used a reference and it parsed means we're not having a dangling commit
                              if sha != commit.hex:
                                  check_dangling = False
                              if check_dangling:
                                  # check for dangling commit
                                  for branch in repo.branches.with_commit(commit.hex):
                                      if branch:
                                          break
                                  else:
                                      # loop ended without finding any branch containing the commit
                                      # NOTE(marcink): Empty error doesn't give us any meaningful information
                                      # here, we instead give something more explicit
                                      e = exceptions.RefNotFoundException('SHA: %s not found in branches', sha)
                                      raise exceptions.LookupException(e)(missing_commit_err)
                              commit_id = commit.hex
                              type_str = commit.type_str
                              return {
                                  'id': commit_id,
                                  'type': type_str,
                                  'commit_id': commit_id,
                                  'idx': 0
                              }
                      return _get_object(context_uid, repo_id, sha)
                  @reraise_safe_exceptions
                  def get_refs(self, wire):
                      """
                      Return a dict of ref name to target hex for all refs under
                      `refs/heads/` and `refs/tags/`.
                      """
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _get_refs(_context_uid, _repo_id):
                          with self._factory.repo_libgit2(wire) as repo:
                              wanted = re.compile('^refs/(heads|tags)/')
                              matching = [
                                  ref for ref in repo.listall_reference_objects()
                                  if wanted.match(ref.name)
                              ]
                              refs_map = {}
                              for ref in matching:
                                  refs_map[ref.name] = ref.target.hex
                              return refs_map
                      return _get_refs(context_uid, repo_id)
                  @reraise_safe_exceptions
                  def get_branch_pointers(self, wire):
                      """
                      Return a dict of target hex to branch shorthand for all refs matching `^refs/heads`.
                      """
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _get_branch_pointers(_context_uid, _repo_id):
                          repo_init = self._factory.repo_libgit2(wire)
                          heads_re = re.compile('^refs/heads')
                          with repo_init as repo:
                              head_refs = [
                                  ref for ref in repo.listall_reference_objects()
                                  if heads_re.match(ref.name)
                              ]
                              pointers = {}
                              for ref in head_refs:
                                  pointers[ref.target.hex] = ref.shorthand
                              return pointers
                      return _get_branch_pointers(context_uid, repo_id)
                  @reraise_safe_exceptions
                  def head(self, wire, show_exc=True):
                      """
                      Return the hex id of the object HEAD peels to.

                      Any error is re-raised when `show_exc` is true; otherwise ``None`` is returned.
                      """
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _head(_context_uid, _repo_id, _show_exc):
                          with self._factory.repo_libgit2(wire) as repo:
                              try:
                                  head_id = repo.head.peel().hex
                              except Exception:
                                  if show_exc:
                                      raise
                                  # errors are silenced on request, report "no head"
                                  head_id = None
                              return head_id
                      return _head(context_uid, repo_id, show_exc)
                  @reraise_safe_exceptions
                  def init(self, wire):
                      """
                      Initialise a non-bare repository at `wire['path']`.
                      """
                      pygit2.init_repository(safe_str(wire['path']), bare=False)
                  @reraise_safe_exceptions
                  def init_bare(self, wire):
                      """
                      Initialise a bare repository at `wire['path']`.
                      """
                      pygit2.init_repository(safe_str(wire['path']), bare=True)
                  @reraise_safe_exceptions
                  def revision(self, wire, rev):
                      """
                      Return a dict with the hex 'id' of `rev` and, when the object has a
                      `tree_id`, its hex under 'tree'.
                      """
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _revision(_context_uid, _repo_id, _rev):
                          with self._factory.repo_libgit2(wire) as repo:
                              git_obj = repo[rev]
                              obj_data = {'id': git_obj.id.hex}
                              # tree objects itself don't have tree_id attribute
                              if hasattr(git_obj, 'tree_id'):
                                  obj_data['tree'] = git_obj.tree_id.hex
                              return obj_data
                      return _revision(context_uid, repo_id, rev)
                  @reraise_safe_exceptions
                  def date(self, wire, commit_id):
                      """
                      Return `[commit_time, commit_time_offset]` for `commit_id`.

                      Objects without a `commit_time` attribute are resolved with `get_object()` first.
                      """
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _date(_repo_id, _commit_id):
                          with self._factory.repo_libgit2(wire) as repo:
                              commit = repo[commit_id]
                              if not hasattr(commit, 'commit_time'):
                                  commit = commit.get_object()
                              # TODO(marcink): check dulwich difference of offset vs timezone
                              return [commit.commit_time, commit.commit_time_offset]
                      return _date(repo_id, commit_id)
                  @reraise_safe_exceptions
                  def author(self, wire, commit_id):
                      """
                      Return the author of `commit_id` as `Name <email>`, or only the name
                      when no email is set.

                      Objects without an `author` attribute are resolved with `get_object()` first.
                      """
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _author(_repo_id, _commit_id):
                          with self._factory.repo_libgit2(wire) as repo:
                              commit = repo[commit_id]
                              if not hasattr(commit, 'author'):
                                  commit = commit.get_object()
                              author = commit.author
                              if author.email:
                                  return f"{author.name} <{author.email}>"
                              try:
                                  return f"{author.name}"
                              except Exception:
                                  # fall back to the raw name when `name` cannot be read
                                  return f"{safe_str(author.raw_name)}"
                      return _author(repo_id, commit_id)
                  @reraise_safe_exceptions
                  def message(self, wire, commit_id):
                      """
                      Return the `message` attribute of the object stored under `commit_id`.
                      """
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _message(_repo_id, _commit_id):
                          with self._factory.repo_libgit2(wire) as repo:
                              return repo[commit_id].message
                      return _message(repo_id, commit_id)
                  @reraise_safe_exceptions
                  def parents(self, wire, commit_id):
                      """
                      Return the hex ids of the parents of `commit_id`.

                      Objects without a `parent_ids` attribute are resolved with `get_object()` first.
                      """
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _parents(_repo_id, _commit_id):
                          with self._factory.repo_libgit2(wire) as repo:
                              commit = repo[commit_id]
                              if not hasattr(commit, 'parent_ids'):
                                  commit = commit.get_object()
                              return [parent_id.hex for parent_id in commit.parent_ids]
                      return _parents(repo_id, commit_id)
                  @reraise_safe_exceptions
                  def children(self, wire, commit_id):
                      """
                      Return the child commit ids of `commit_id`.

                      Runs `git rev-list --all --children <commit_id>^..<head>` and takes the
                      ids listed after `commit_id` on the first output line starting with it.
                      An empty list is returned when no such line exists.
                      """
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      head = self.head(wire)
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _children(_repo_id, _commit_id):
                          output, __ = self.run_git_command(
                              wire, ['rev-list', '--all', '--children', f'{commit_id}^..{head}'])
                          pat = re.compile(fr'^{commit_id}')
                          for raw_line in output.splitlines():
                              text = safe_str(raw_line)
                              if pat.match(text):
                                  # first token is the commit itself, everything after it is a child
                                  return text.split(' ')[1:]
                          return []
                      return _children(repo_id, commit_id)
                  @reraise_safe_exceptions
                  def set_refs(self, wire, key, value):
                      """Create reference ``key`` pointing at ``value``, overwriting it (force=True)."""
                      with self._factory.repo_libgit2(wire) as repo:
                          repo.references.create(key, value, force=True)
                  @reraise_safe_exceptions
                  def create_branch(self, wire, branch_name, commit_id, force=False):
                      """
                      Create local branch ``branch_name`` at ``commit_id``.
                      When ``commit_id`` is falsy the branch is created at the current HEAD.
                      Without ``force`` nothing happens if the branch already exists.
                      """
                      with self._factory.repo_libgit2(wire) as repo:
                          if commit_id:
                              commit = repo[commit_id]
                          else:
                              # if commit is not given just use the HEAD; `head` is an attribute
                              # (used as `repo.head.target` elsewhere in this class), not a callable
                              commit = repo[repo.head.target]
                          # create only if forced, or if that branch isn't existing
                          if force or not repo.branches.get(branch_name):
                              repo.branches.local.create(branch_name, commit, force=force)
                  @reraise_safe_exceptions
                  def remove_ref(self, wire, key):
                      """Delete the reference named ``key`` from the repository."""
                      with self._factory.repo_libgit2(wire) as repo:
                          repo.references.delete(key)
                  @reraise_safe_exceptions
                  def tag_remove(self, wire, tag_name):
                      """Delete the ``refs/tags/<tag_name>`` reference."""
                      with self._factory.repo_libgit2(wire) as repo:
                          repo.references.delete(f'refs/tags/{tag_name}')
                  @reraise_safe_exceptions
                  def tree_changes(self, wire, source_id, target_id):
                      """
                      Compare the trees of two commits.
                      Returns three lists: added, modified and deleted paths.
                      An empty ``source_id`` compares against no tree at all.
                      """
                      repo = self._factory.repo(wire)
                      # source can be empty
                      source_id = safe_bytes(source_id or b'')
                      target_id = safe_bytes(target_id)
                      source = repo[source_id].tree if source_id else None
                      target = repo[target_id].tree
                      added, modified, deleted = set(), set(), set()
                      changes = repo.object_store.tree_changes(source, target)
                      for (old_path, new_path), (_, _), (_, _) in changes:
                          if new_path and old_path:
                              modified.add(new_path)
                          elif new_path:
                              added.add(new_path)
                          elif old_path:
                              deleted.add(old_path)
                      return list(added), list(modified), list(deleted)
                  @reraise_safe_exceptions
                  def tree_and_type_for_path(self, wire, commit_id, path):
                      """
                      Look up ``path`` in the tree of ``commit_id``.
                      Returns ``(hex id, type string, filemode)`` or ``(None, None, None)``
                      when the path is not present.
                      """
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _tree_and_type_for_path(_context_uid, _repo_id, _commit_id, _path):
                          with self._factory.repo_libgit2(wire) as repo:
                              commit = repo[commit_id]
                              try:
                                  entry = commit.tree[path]
                              except KeyError:
                                  return None, None, None
                              return entry.id.hex, entry.type_str, entry.filemode
                      return _tree_and_type_for_path(context_uid, repo_id, commit_id, path)
                  @reraise_safe_exceptions
                  def tree_items(self, wire, tree_id):
                      """
                      List the entries of tree ``tree_id`` as ``(name, filemode, hex, type)`` tuples.
                      Raises ``ObjectMissing`` when the repository has no object with that id.
                      """
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _tree_items(_repo_id, _tree_id):
                          def _as_row(entry):
                              kind = entry.type_str
                              if kind == 'commit':
                                  # NOTE(marcink): submodules we translate to 'link' for backward compat
                                  kind = 'link'
                              return entry.name, entry.filemode, entry.hex, kind
                          with self._factory.repo_libgit2(wire) as repo:
                              try:
                                  tree = repo[tree_id]
                              except KeyError:
                                  raise ObjectMissing(f'No tree with id: {tree_id}')
                              return [_as_row(entry) for entry in tree]
                      return _tree_items(repo_id, tree_id)
                  @reraise_safe_exceptions
                  def diff_2(self, wire, commit_id_1, commit_id_2, file_filter, opt_ignorews, context):
                      """
                      Old version that uses subprocess to call diff
                      Runs ``git diff`` between the two commits, or ``git show`` on
                      ``commit_id_2`` when ``commit_id_1`` is ``self.EMPTY_COMMIT``, and returns
                      the raw (bytes) output of the command.
                      """
                      flags = [
                          f'-U{context}', '--patch',
                          '--binary',
                          '--find-renames',
                          '--no-indent-heuristic',
                          # '--indent-heuristic',
                          #'--full-index',
                          #'--abbrev=40'
                      ]
                      if opt_ignorews:
                          flags.append('--ignore-all-space')
                      from_empty = commit_id_1 == self.EMPTY_COMMIT
                      if from_empty:
                          cmd = ['show'] + flags + [commit_id_2]
                      else:
                          cmd = ['diff'] + flags + [commit_id_1, commit_id_2]
                      if file_filter:
                          cmd.extend(['--', file_filter])
                      diff, __ = self.run_git_command(wire, cmd)
                      # If we used 'show' command, strip first few lines (until actual diff
                      # starts)
                      if from_empty:
                          lines = diff.splitlines()
                          start = next(
                              (idx for idx, line in enumerate(lines) if line.startswith(b'diff')),
                              len(lines))
                          # Append new line just like 'diff' command does; the output is bytes,
                          # so the separator has to be bytes as well
                          diff = b'\n'.join(lines[start:]) + b'\n'
                      return diff
                  @reraise_safe_exceptions
                  def diff(self, wire, commit_id_1, commit_id_2, file_filter, opt_ignorews, context):
                      """
                      Build a diff with libgit2 and return it wrapped in a ``BytesEnvelope``.
                      With ``self.EMPTY_COMMIT`` as ``commit_id_1`` the tree of ``commit_id_2`` is
                      diffed against an empty tree. With ``file_filter`` only the patch whose
                      old file path equals the filter is returned.
                      """
                      with self._factory.repo_libgit2(wire) as repo:
                          flags = 0 | pygit2.GIT_DIFF_SHOW_BINARY
                          if opt_ignorews:
                              flags |= pygit2.GIT_DIFF_IGNORE_WHITESPACE
                          diff_kwargs = dict(flags=flags, context_lines=context, swap=True)
                          if commit_id_1 == self.EMPTY_COMMIT:
                              new_commit = repo[commit_id_2]
                              diff_obj = new_commit.tree.diff_to_tree(**diff_kwargs)
                          else:
                              new_commit = repo[commit_id_2]
                              old_commit = repo[commit_id_1]
                              diff_obj = new_commit.tree.diff_to_tree(old_commit.tree, **diff_kwargs)
                          diff_obj.find_similar(flags=0 | pygit2.GIT_DIFF_FIND_RENAMES)
                          if not file_filter:
                              return BytesEnvelope(safe_bytes(diff_obj.patch)) or BytesEnvelope(b'')
                          for patch_item in diff_obj:
                              if patch_item.delta.old_file.path == file_filter:
                                  return BytesEnvelope(patch_item.data) or BytesEnvelope(b'')
                          # no matching path == no diff
                          return BytesEnvelope(b'')
                  @reraise_safe_exceptions
                  def node_history(self, wire, commit_id, path, limit):
                      """
                      Return the 40-character commit ids (as bytes) found in the git output
                      for the history of ``path`` starting at ``commit_id``.
                      """
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _node_history(_context_uid, _repo_id, _commit_id, _path, _limit):
                          if limit == 1:
                              # optimize for n==1, rev-list is much faster for that use-case
                              cmd = ['rev-list', '-1', commit_id, '--', path]
                          else:
                              count_args = ['-n', str(safe_int(limit, 0))] if limit else []
                              cmd = ['log', *count_args, '--pretty=format: %H', '-s', commit_id, '--', path]
                          output, __ = self.run_git_command(wire, cmd)
                          return list(re.findall(rb'[0-9a-fA-F]{40}', output))
                      return _node_history(context_uid, repo_id, commit_id, path, limit)
                  @reraise_safe_exceptions
                  def node_annotate_legacy(self, wire, commit_id, path):
                      """
                      Annotate ``path`` at ``commit_id`` by parsing ``git blame`` output.
                      Returns a list of ``(line_no, blame_commit_id, line)`` tuples.
                      note: replaced by pygit2 implementation
                      """
                      # -l     ==> outputs long shas (and we need all 40 characters)
                      # --root ==> doesn't put '^' character for boundaries
                      # -r commit_id ==> blames for the given commit
                      cmd = ['blame', '-l', '--root', '-r', commit_id, '--', path]
                      output, __ = self.run_git_command(wire, cmd)
                      # NOTE(review): the last output line is always dropped here - confirm intent
                      blame_lines = output.splitlines()[:-1]
                      annotated = []
                      for line_no, blame_line in enumerate(blame_lines, start=1):
                          blame_commit_id, line = blame_line.split(b' ', 1)
                          annotated.append((line_no, blame_commit_id, line))
                      return annotated
                  @reraise_safe_exceptions
                  def node_annotate(self, wire, commit_id, path):
                      """
                      Annotate ``path`` at ``commit_id`` using the libgit2 blame.
                      Returns a ``BinaryEnvelope`` holding ``(line_no, commit hex, line)`` tuples.
                      """
                      with self._factory.repo_libgit2(wire) as repo:
                          commit = repo[commit_id]
                          blame = repo.blame(path, newest_commit=commit_id)
                          content_lines = commit.tree[path].data.splitlines()
                          # blame hunks are looked up by 1-based line number
                          annotated = [
                              (line_no, blame.for_line(line_no).final_commit_id.hex, line)
                              for line_no, line in enumerate(content_lines, start=1)
                          ]
                      return BinaryEnvelope(annotated)
                  @reraise_safe_exceptions
                  def update_server_info(self, wire):
                      """Call the module-level ``update_server_info`` helper on the repository of ``wire``."""
                      update_server_info(self._factory.repo(wire))
                  @reraise_safe_exceptions
                  def get_all_commit_ids(self, wire):
                      """
                      Return the output lines of ``git rev-list --reverse --date-order
                      --branches --tags``, one commit id per line.
                      Any failure of the command yields an empty list.
                      """
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _get_all_commit_ids(_context_uid, _repo_id):
                          cmd = ['rev-list', '--reverse', '--date-order', '--branches', '--tags']
                          try:
                              output, __ = self.run_git_command(wire, cmd)
                              return output.splitlines()
                          except Exception:
                              # Can be raised for empty repositories
                              return []
                      return _get_all_commit_ids(context_uid, repo_id)
                  @reraise_safe_exceptions
                  def run_git_command(self, wire, cmd, **opts):
                      """
                      Run the git executable with ``cmd`` and return ``(stdout, stderr)`` as bytes.
                      Special keys consumed from ``opts``: ``_bare`` (skip the default ``-c``
                      switches), ``_safe`` (return ``('', err)`` instead of raising on OSError),
                      ``_copts`` (extra switches placed before ``cmd``) and ``extra_env``.
                      Remaining options are passed to ``SubprocessIOChunker``.
                      """
                      path = wire.get('path')
                      if path and os.path.isdir(path):
                          opts['cwd'] = path
                      # presence of the key matters here, not its value
                      if '_bare' in opts:
                          opts.pop('_bare')
                          _copts = []
                      else:
                          _copts = ['-c', 'core.quotepath=false']
                      # `_safe` means: no exc on failure
                      safe_call = '_safe' in opts
                      opts.pop('_safe', None)
                      if '_copts' in opts:
                          _copts.extend(opts.pop('_copts') or [])
                      gitenv = os.environ.copy()
                      gitenv.update(opts.pop('extra_env', {}))
                      # need to clean fix GIT_DIR !
                      gitenv.pop('GIT_DIR', None)
                      gitenv['GIT_CONFIG_NOGLOBAL'] = '1'
                      gitenv['GIT_DISCOVERY_ACROSS_FILESYSTEM'] = '1'
                      cmd = [settings.GIT_EXECUTABLE] + _copts + cmd
                      _opts = {'env': gitenv, 'shell': False}
                      proc = None
                      try:
                          _opts.update(opts)
                          proc = subprocessio.SubprocessIOChunker(cmd, **_opts)
                          stdout = b''.join(proc)
                          stderr = b''.join(proc.stderr)
                          return stdout, stderr
                      except OSError as err:
                          cmd = ' '.join(map(safe_str, cmd))  # human friendly CMD
                          tb_err = ("Couldn't run git command (%s).\n"
                                    "Original error was:%s\n"
                                    "Call options:%s\n"
                                    % (cmd, err, _opts))
                          log.exception(tb_err)
                          if not safe_call:
                              raise exceptions.VcsException()(tb_err)
                          return '', err
                      finally:
                          if proc:
                              proc.close()
                  @reraise_safe_exceptions
                  def install_hooks(self, wire, force=False):
                      """
                      Install the git hooks into the repository at ``wire['path']``.
                      ``force`` is forwarded as ``force_create`` to ``install_git_hooks``.
                      """
                      from vcsserver.hook_utils import install_git_hooks
                      bare = self.bare(wire)
                      path = wire['path']
                      # the former python3 path computed from settings.BINARY_DIR was never
                      # used (its result was discarded), so it is no longer computed
                      return install_git_hooks(path, bare, force_create=force)
                  @reraise_safe_exceptions
                  def get_hooks_info(self, wire):
                      """Return a dict with the ``pre_version`` and ``post_version`` of the installed git hooks."""
                      from vcsserver.hook_utils import (
                          get_git_pre_hook_version, get_git_post_hook_version)
                      bare = self.bare(wire)
                      path = wire['path']
                      pre_version = get_git_pre_hook_version(path, bare)
                      post_version = get_git_post_hook_version(path, bare)
                      return dict(pre_version=pre_version, post_version=post_version)
                  @reraise_safe_exceptions
                  def set_head_ref(self, wire, head_name):
                      """
                      Point HEAD at ``refs/heads/<head_name>``.
                      Returns a two item list: the head name and a short status message.
                      """
                      log.debug('Setting refs/head to `%s`', head_name)
                      target_ref = f'refs/heads/{head_name}'
                      with self._factory.repo_libgit2(wire) as repo:
                          repo.set_head(target_ref)
                      return [head_name, f'set HEAD to {target_ref}']
                  @reraise_safe_exceptions
                  def archive_repo(self, wire, archive_name_key, kind, mtime, archive_at_path,
                                   archive_dir_name, commit_id, cache_config):
                      """
                      Build an archive of ``commit_id`` through ``store_archive_in_cache``.
                      The nested walker yields one ``ArchiveNode`` per index entry of the
                      selected tree; entries with the commit filemode are skipped.
                      """
                      def file_walker(_commit_id, path):
                          with self._factory.repo_libgit2(wire) as repo:
                              commit = repo[commit_id]
                              if path in ('', '/'):
                                  tree = commit.tree
                              else:
                                  tree_id = commit.tree[path.rstrip('/')].id.hex
                                  try:
                                      tree = repo[tree_id]
                                  except KeyError:
                                      raise ObjectMissing(f'No tree with id: {tree_id}')
                              index = LibGit2Index.Index()
                              index.read_tree(tree)
                              for file_node in index:
                                  file_path = file_node.path
                                  mode = file_node.mode
                                  if mode == pygit2.GIT_FILEMODE_COMMIT:
                                      log.debug('Skipping path %s as a commit node', file_path)
                                      continue
                                  yield ArchiveNode(
                                      file_path, mode, stat.S_ISLNK(mode), repo[file_node.hex].read_raw)
                      return store_archive_in_cache(
                          file_walker, archive_name_key, kind, mtime, archive_at_path,
                          archive_dir_name, commit_id, cache_config=cache_config)

vcsserver/remote/hg_remote.py

0 +3 -4

              # RhodeCode VCSServer provides access to different vcs backends via network.
              # Copyright (C) 2014-2023 RhodeCode GmbH
              #
              # This program is free software; you can redistribute it and/or modify
              # it under the terms of the GNU General Public License as published by
              # the Free Software Foundation; either version 3 of the License, or
              # (at your option) any later version.
              #
              # This program is distributed in the hope that it will be useful,
              # but WITHOUT ANY WARRANTY; without even the implied warranty of
              # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
              # GNU General Public License for more details.
              #
              # You should have received a copy of the GNU General Public License
              # along with this program; if not, write to the Free Software Foundation,
              # Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301  USA
              import binascii
              import io
              import logging
              import stat
              import sys
              import urllib.request
              import urllib.parse
              import hashlib
              from hgext import largefiles, rebase, purge
              from mercurial import commands
              from mercurial import unionrepo
              from mercurial import verify
              from mercurial import repair
              from mercurial.error import AmbiguousPrefixLookupError
              import vcsserver
              from vcsserver import exceptions
              from vcsserver.base import (
                  RepoFactory,
                  obfuscate_qs,
                  raise_from_original,
                  store_archive_in_cache,
                  ArchiveNode,
                  BytesEnvelope,
                  BinaryEnvelope,
              )
              from vcsserver.hgcompat import (
                  archival,
                  bin,
                  clone,
                  config as hgconfig,
                  diffopts,
                  hex,
                  get_ctx,
                  hg_url as url_parser,
                  httpbasicauthhandler,
                  httpdigestauthhandler,
                  makepeer,
                  instance,
                  match,
                  memctx,
                  exchange,
                  memfilectx,
                  nullrev,
                  hg_merge,
                  patch,
                  peer,
                  revrange,
                  ui,
                  hg_tag,
                  Abort,
                  LookupError,
                  RepoError,
                  RepoLookupError,
                  InterventionRequired,
                  RequirementError,
                  alwaysmatcher,
                  patternmatcher,
                  hgutil,
                  hgext_strip,
              )
              from vcsserver.str_utils import ascii_bytes, ascii_str, safe_str, safe_bytes
              from vcsserver.vcs_base import RemoteBase
              from vcsserver.config import hooks as hooks_config
              from vcsserver.lib.exc_tracking import format_exc
              log = logging.getLogger(__name__)
              def make_ui_from_config(repo_config):
                  """
                  Build a mercurial ui object whose output methods write to the module logger,
                  reset its config stores and load the ``(section, option, value)`` triples
                  from ``repo_config`` into it.
                  """
                  def _as_text(parts):
                      # join all message parts and drop trailing newlines
                      return ' '.join(map(safe_str, parts)).rstrip('\n')
                  class LoggingUI(ui.ui):
                      def status(self, *msg, **opts):
                          log.info(_as_text(msg))
                      def warn(self, *msg, **opts):
                          log.warning('ui_logger:' + _as_text(msg))
                      def error(self, *msg, **opts):
                          log.error('ui_logger:' + _as_text(msg))
                      def note(self, *msg, **opts):
                          log.info('ui_logger:' + _as_text(msg))
                      def debug(self, *msg, **opts):
                          log.debug('ui_logger:' + _as_text(msg))
                  baseui = LoggingUI()
                  # clean the baseui object, each store gets its own fresh config
                  for store_name in ('_ocfg', '_ucfg', '_tcfg'):
                      setattr(baseui, store_name, hgconfig.config())
                  for section, option, value in repo_config:
                      baseui.setconfig(ascii_bytes(section), ascii_bytes(option), ascii_bytes(value))
                  fixed_settings = (
                      # make our hgweb quiet so it doesn't print output
                      (b'ui', b'quiet', b'true'),
                      (b'ui', b'paginate', b'never'),
                      # for better Error reporting of Mercurial
                      (b'ui', b'message-output', b'stderr'),
                      # force mercurial to only use 1 thread, otherwise it may try to set a
                      # signal in a non-main thread, thus generating a ValueError.
                      (b'worker', b'numcpus', 1),
                  )
                  for section, option, value in fixed_settings:
                      baseui.setconfig(section, option, value)
                  # If there is no config for the largefiles extension, we explicitly disable
                  # it here. This overrides settings from repositories hgrc file. Recent
                  # mercurial versions enable largefiles in hgrc on clone from largefile
                  # repo.
                  largefiles_configured = baseui.hasconfig(b'extensions', b'largefiles')
                  if not largefiles_configured:
                      log.debug('Explicitly disable largefiles extension for repo.')
                      baseui.setconfig(b'extensions', b'largefiles', b'!')
                  return baseui
              def reraise_safe_exceptions(func):
                  """
                  Decorator for converting mercurial exceptions to something neutral.
                  Known mercurial errors are re-raised through ``raise_from_original`` with
                  the matching ``vcsserver.exceptions`` kind. Any other exception that
                  does not carry a ``_vcs_kind`` attribute is logged and re-raised as an
                  unhandled one; exceptions that already carry it propagate unchanged.
                  """
                  import functools
                  # keep name and docstring of the wrapped method visible on the wrapper
                  @functools.wraps(func)
                  def wrapper(*args, **kwargs):
                      try:
                          return func(*args, **kwargs)
                      except (Abort, InterventionRequired) as e:
                          raise_from_original(exceptions.AbortException(e), e)
                      except RepoLookupError as e:
                          raise_from_original(exceptions.LookupException(e), e)
                      except RequirementError as e:
                          raise_from_original(exceptions.RequirementException(e), e)
                      except RepoError as e:
                          raise_from_original(exceptions.VcsException(e), e)
                      except LookupError as e:
                          raise_from_original(exceptions.LookupException(e), e)
                      except Exception as e:
                          if not hasattr(e, '_vcs_kind'):
                              log.exception("Unhandled exception in hg remote call")
                              raise_from_original(exceptions.UnhandledException(e), e)
                          raise
                  return wrapper
              class MercurialFactory(RepoFactory):
                  """Factory producing mercurial repository objects from a ``wire`` dict."""
                  repo_type = 'hg'
                  def _create_config(self, config, hooks=True):
                      """
                      Build the ui object for ``config``; with ``hooks=False`` the listed
                      hook entries of the ``hooks`` section are left out.
                      """
                      if not hooks:
                          hooks_to_clean = {
                              hooks_config.HOOK_REPO_SIZE,
                              hooks_config.HOOK_PRE_PULL,
                              hooks_config.HOOK_PULL,
                              hooks_config.HOOK_PRE_PUSH,
                              # TODO: what about PRETXT, this was disabled in pre 5.0.0
                              hooks_config.HOOK_PRETX_PUSH,
                          }
                          config = [
                              (section, option, value)
                              for section, option, value in config
                              if not (section == 'hooks' and option in hooks_to_clean)
                          ]
                      return make_ui_from_config(config)
                  def _create_repo(self, wire, create):
                      """Instantiate the repository found at ``wire["path"]``."""
                      baseui = self._create_config(wire["config"])
                      repo_path = safe_bytes(wire["path"])
                      repo = instance(baseui, repo_path, create)
                      log.debug('repository created: got HG object: %s', repo)
                      return repo
                  def repo(self, wire, create=False):
                      """
                      Get a repository instance for the given path.
                      """
                      return self._create_repo(wire, create)
              def patch_ui_message_output(baseui):
                  """
                  Turn off quiet mode on ``baseui`` and redirect its ``status``, ``write``,
                  ``warn`` and ``debug`` callables into one in-memory bytes buffer.
                  Returns the patched ui together with that buffer.
                  """
                  baseui.setconfig(b'ui', b'quiet', b'false')
                  output = io.BytesIO()
                  def write(data, **unused_kwargs):
                      output.write(data)
                  for channel in ('status', 'write', 'warn', 'debug'):
                      setattr(baseui, channel, write)
                  return baseui, output
              def get_obfuscated_url(url_obj):
                  """
                  Mask the password of ``url_obj`` (when set), obfuscate its query string
                  and return the string form. The passed object is modified in place.
                  """
                  current_passwd = url_obj.passwd
                  url_obj.passwd = b'*****' if current_passwd else current_passwd
                  url_obj.query = obfuscate_qs(url_obj.query)
                  return str(url_obj)
              def normalize_url_for_hg(url: str):
                  """
                  Split a ``<proto>+<scheme>://...`` url into ``(url, proto)``.
                  ``svn+http://host/p`` gives ``('http://host/p', 'svn')``. Urls without a
                  ``+`` in their scheme, and strings without ``://`` at all, are returned
                  unchanged together with ``None``.
                  """
                  _proto = None
                  scheme, separator, _rest = url.partition('://')
                  # only look for the prefix inside a real scheme; a '+' inside a plain
                  # path must not be treated as a protocol prefix
                  if separator and '+' in scheme:
                      _proto, _plus, url = url.partition('+')
                  return url, _proto
              class HgRemote(RemoteBase):
                  def __init__(self, factory):
                      """Store the repo factory and register the handlers used by the bulk calls."""
                      self._factory = factory
                      # commit level attributes, keyed by the attribute name used in bulk requests
                      self._bulk_methods = dict(
                          affected_files=self.ctx_files,
                          author=self.ctx_user,
                          branch=self.ctx_branch,
                          children=self.ctx_children,
                          date=self.ctx_date,
                          message=self.ctx_description,
                          parents=self.ctx_parents,
                          status=self.ctx_status,
                          obsolete=self.ctx_obsolete,
                          phase=self.ctx_phase,
                          hidden=self.ctx_hidden,
                          _file_paths=self.ctx_list,
                      )
                      # file level attributes
                      self._bulk_file_methods = dict(
                          size=self.fctx_size,
                          data=self.fctx_node_data,
                          flags=self.fctx_flags,
                          is_binary=self.is_binary,
                          md5=self.md5_hash,
                      )
                  def _get_ctx(self, repo, ref):
                      """Return what the ``get_ctx`` compat helper gives for ``ref`` in ``repo``."""
                      ctx = get_ctx(repo, ref)
                      return ctx
                  @reraise_safe_exceptions
                  def discover_hg_version(self):
                      """Return the version reported by ``mercurial.util.version()`` as a str."""
                      from mercurial import util
                      raw_version = util.version()
                      return safe_str(raw_version)
                  @reraise_safe_exceptions
                  def is_empty(self, wire):
                      """
                      Tell whether the repository has length zero.
                      If reading the length fails, the error is logged and ``False`` is returned.
                      """
                      repo = self._factory.repo(wire)
                      try:
                          item_count = len(repo)
                      except Exception:
                          log.exception("failed to read object_store")
                          return False
                      return item_count == 0
                  @reraise_safe_exceptions
                  def bookmarks(self, wire):
                      """Return a dict mapping bookmark names to the hex id they point at."""
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _bookmarks(_context_uid, _repo_id):
                          repo = self._factory.repo(wire)
                          marks = {}
                          for name, sha in repo._bookmarks.items():
                              marks[safe_str(name)] = ascii_str(hex(sha))
                          return marks
                      return _bookmarks(context_uid, repo_id)
                  @reraise_safe_exceptions
                  def branches(self, wire, normal, closed):
                      """
                      Return a dict of branch name -> hex tip node.

                      :param normal: when truthy, include branches that are not closed
                      :param closed: when truthy, include branches that are closed

                      The result goes through the region's conditional cache.
                      """
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _branches(_context_uid, _repo_id, _normal, _closed):
                          hg_repo = self._factory.repo(wire)
                          tips = {}
                          for branch_name, _heads, tip_node, is_closed in hg_repo.branchmap().iterbranches():
                              # a branch is either open or closed, so at most one side matches
                              wanted = (normal and not is_closed) or (closed and is_closed)
                              if wanted:
                                  tips[safe_str(branch_name)] = ascii_str(hex(tip_node))
                          return tips
                      return _branches(context_uid, repo_id, normal, closed)
                  @reraise_safe_exceptions
                  def bulk_request(self, wire, commit_id, pre_load):
                      """
                      Collect several commit attributes in one call.

                      Each name in ``pre_load`` is looked up in ``self._bulk_methods`` and the
                      resulting method is called with ``(wire, commit_id)``.

                      :return: dict mapping each requested attribute name to its value
                      :raises: the ``exceptions.VcsException`` wrapper when a ``KeyError``
                          occurs inside the per-attribute ``try`` block
                      """
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      # the cached function receives the sorted attribute list, while the loop
                      # below iterates the caller's original ``pre_load``
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _bulk_request(_repo_id, _commit_id, _pre_load):
                          result = {}
                          for attr in pre_load:
                              try:
                                  method = self._bulk_methods[attr]
                                  wire.update({'cache': False})  # disable cache for bulk calls so we don't double cache
                                  result[attr] = method(wire, commit_id)
                              except KeyError as e:
                                  # NOTE(review): the try also covers the method call, so a KeyError
                                  # raised inside ``method`` is reported as an unknown attribute too
                                  raise exceptions.VcsException(e)(
-                                     'Unknown bulk attribute: "%s"' % attr)
+                                     f'Unknown bulk attribute: "{attr}"')
                          return result
                      return _bulk_request(repo_id, commit_id, sorted(pre_load))
                  @reraise_safe_exceptions
                  def ctx_branch(self, wire, commit_id):
                      """Return ``branch()`` of the context resolved for ``commit_id`` (conditionally cached)."""
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _ctx_branch(_repo_id, _commit_id):
                          hg_repo = self._factory.repo(wire)
                          return self._get_ctx(hg_repo, commit_id).branch()
                      return _ctx_branch(repo_id, commit_id)
                  @reraise_safe_exceptions
                  def ctx_date(self, wire, commit_id):
                      """Return ``date()`` of the context resolved for ``commit_id`` (conditionally cached)."""
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _ctx_date(_repo_id, _commit_id):
                          hg_repo = self._factory.repo(wire)
                          return self._get_ctx(hg_repo, commit_id).date()
                      return _ctx_date(repo_id, commit_id)
                  @reraise_safe_exceptions
                  def ctx_description(self, wire, revision):
                      """Return ``description()`` of the context resolved for ``revision``; not cached."""
                      hg_repo = self._factory.repo(wire)
                      return self._get_ctx(hg_repo, revision).description()
                  @reraise_safe_exceptions
                  def ctx_files(self, wire, commit_id):
                      """Return ``files()`` of the context resolved for ``commit_id`` (conditionally cached)."""
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _ctx_files(_repo_id, _commit_id):
                          hg_repo = self._factory.repo(wire)
                          return self._get_ctx(hg_repo, commit_id).files()
                      return _ctx_files(repo_id, commit_id)
                  @reraise_safe_exceptions
                  def ctx_list(self, path, revision):
                      """
                      Return the context resolved for ``revision`` materialised as a list.

                      ``path`` is handed to ``self._factory.repo`` in the same position where
                      the sibling methods pass ``wire``.
                      """
                      hg_repo = self._factory.repo(path)
                      return list(self._get_ctx(hg_repo, revision))
                  @reraise_safe_exceptions
                  def ctx_parents(self, wire, commit_id):
                      """
                      Return ``hex()`` of every parent of ``commit_id`` that is neither
                      hidden nor obsolete (conditionally cached).
                      """
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _ctx_parents(_repo_id, _commit_id):
                          hg_repo = self._factory.repo(wire)
                          ctx = self._get_ctx(hg_repo, commit_id)
                          visible = []
                          for parent in ctx.parents():
                              if parent.hidden() or parent.obsolete():
                                  continue
                              visible.append(parent.hex())
                          return visible
                      return _ctx_parents(repo_id, commit_id)
                  @reraise_safe_exceptions
                  def ctx_children(self, wire, commit_id):
                      """
                      Return ``hex()`` of every child of ``commit_id`` that is neither
                      hidden nor obsolete (conditionally cached).
                      """
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _ctx_children(_repo_id, _commit_id):
                          hg_repo = self._factory.repo(wire)
                          ctx = self._get_ctx(hg_repo, commit_id)
                          visible = []
                          for child in ctx.children():
                              if child.hidden() or child.obsolete():
                                  continue
                              visible.append(child.hex())
                          return visible
                      return _ctx_children(repo_id, commit_id)
                  @reraise_safe_exceptions
                  def ctx_phase(self, wire, commit_id):
                      """Return ``phase()`` of the context resolved for ``commit_id`` (conditionally cached)."""
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _ctx_phase(_context_uid, _repo_id, _commit_id):
                          hg_repo = self._factory.repo(wire)
                          # public=0, draft=1, secret=3
                          return self._get_ctx(hg_repo, commit_id).phase()
                      return _ctx_phase(context_uid, repo_id, commit_id)
                  @reraise_safe_exceptions
                  def ctx_obsolete(self, wire, commit_id):
                      """Return ``obsolete()`` of the context resolved for ``commit_id`` (conditionally cached)."""
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _ctx_obsolete(_context_uid, _repo_id, _commit_id):
                          hg_repo = self._factory.repo(wire)
                          return self._get_ctx(hg_repo, commit_id).obsolete()
                      return _ctx_obsolete(context_uid, repo_id, commit_id)
                  @reraise_safe_exceptions
                  def ctx_hidden(self, wire, commit_id):
                      """Return ``hidden()`` of the context resolved for ``commit_id`` (conditionally cached)."""
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _ctx_hidden(_context_uid, _repo_id, _commit_id):
                          hg_repo = self._factory.repo(wire)
                          return self._get_ctx(hg_repo, commit_id).hidden()
                      return _ctx_hidden(context_uid, repo_id, commit_id)
                  @reraise_safe_exceptions
                  def ctx_substate(self, wire, revision):
                      """Return the ``substate`` attribute of the context resolved for ``revision``."""
                      hg_repo = self._factory.repo(wire)
                      return self._get_ctx(hg_repo, revision).substate
                  @reraise_safe_exceptions
                  def ctx_status(self, wire, revision):
                      """
                      Return the status between the first parent of ``revision`` and
                      ``revision`` itself, converted to a plain list.
                      """
                      hg_repo = self._factory.repo(wire)
                      ctx = self._get_ctx(hg_repo, revision)
                      first_parent = hg_repo[ctx.p1().node()]
                      # the status object (an odd, custom named tuple in mercurial) is not
                      # correctly serializable; we turn it into a list, as the underlying
                      # API expects a list
                      return list(first_parent.status(other=ctx.node()))
                  @reraise_safe_exceptions
                  def ctx_user(self, wire, revision):
                      """Return ``user()`` of the context resolved for ``revision``; not cached."""
                      hg_repo = self._factory.repo(wire)
                      return self._get_ctx(hg_repo, revision).user()
                  @reraise_safe_exceptions
                  def check_url(self, url, config):
                      """
                      Check that ``url`` can be opened and, unless its protocol is ``svn``,
                      that a Mercurial peer can look up ``tip`` on it.

                      :param url: remote location; normalised with ``normalize_url_for_hg``
                      :param config: passed to ``make_ui_from_config`` for the peer check
                      :return: ``True`` when every check passed
                      :raises: the ``exceptions.URLError`` wrapper when the URL cannot be
                          opened, answers with a non-200 code, or the peer check fails
                      """
                      url, _proto = normalize_url_for_hg(url)
                      url_obj = url_parser(safe_bytes(url))
                      test_uri = safe_str(url_obj.authinfo()[0])
                      authinfo = url_obj.authinfo()[1]
                      # only the obfuscated form of the URL is written to the logs
                      obfuscated_uri = get_obfuscated_url(url_obj)
                      log.info("Checking URL for remote cloning/import: %s", obfuscated_uri)
                      handlers = []
                      if authinfo:
                          # create a password manager
                          passmgr = urllib.request.HTTPPasswordMgrWithDefaultRealm()
                          passmgr.add_password(*authinfo)
                          handlers.extend((httpbasicauthhandler(passmgr),
                                           httpdigestauthhandler(passmgr)))
                      o = urllib.request.build_opener(*handlers)
                      o.addheaders = [('Content-Type', 'application/mercurial-0.1'),
                                      ('Accept', 'application/mercurial-0.1')]
                      # probe request: the ``between`` command with an all-zero pair
                      q = {"cmd": 'between'}
                      q.update({'pairs': "{}-{}".format('0' * 40, '0' * 40)})
-                     qs = '?%s' % urllib.parse.urlencode(q)
+                     qs = f'?{urllib.parse.urlencode(q)}'
                      cu = f"{test_uri}{qs}"
                      req = urllib.request.Request(cu, None, {})
                      try:
                          log.debug("Trying to open URL %s", obfuscated_uri)
                          resp = o.open(req)
                          if resp.code != 200:
                              raise exceptions.URLError()('Return Code is not 200')
                      except Exception as e:
                          # this handler also catches the non-200 error raised just above
                          # and wraps it again
                          log.warning("URL cannot be opened: %s", obfuscated_uri, exc_info=True)
                          # means it cannot be cloned
                          raise exceptions.URLError(e)(f"[{obfuscated_uri}] org_exc: {e}")
                      # now check if it's a proper hg repo, but don't do it for svn
                      try:
                          if _proto == 'svn':
                              pass
                          else:
                              # check for pure hg repos
                              log.debug(
                                  "Verifying if URL is a Mercurial repository: %s", obfuscated_uri)
                              ui = make_ui_from_config(config)
                              peer_checker = makepeer(ui, safe_bytes(url))
                              peer_checker.lookup(b'tip')
                      except Exception as e:
                          log.warning("URL is not a valid Mercurial repository: %s",
                                      obfuscated_uri)
                          raise exceptions.URLError(e)(
-                             "url [%s] does not look like an hg repo org_exc: %s"
-                             % (obfuscated_uri, e))
+                             f"url [{obfuscated_uri}] does not look like an hg repo org_exc: {e}")
                      log.info("URL is a valid Mercurial repository: %s", obfuscated_uri)
                      return True
                  @reraise_safe_exceptions
                  def diff(self, wire, commit_id_1, commit_id_2, file_filter, opt_git, opt_ignorews, context):
                      """
                      Produce the diff between ``commit_id_1`` and ``commit_id_2``.

                      :param file_filter: falsy for no restriction, otherwise a
                          ``(repo_path, node_path)`` pair used to build a matcher
                      :param opt_git: forwarded to ``diffopts`` as ``git``
                      :param opt_ignorews: forwarded to ``diffopts`` as ``ignorews``
                      :param context: forwarded to ``diffopts`` as ``context``
                      :return: ``BytesEnvelope`` holding the joined diff chunks
                      :raises: the ``exceptions.LookupException`` wrapper on ``RepoLookupError``
                      """
                      hg_repo = self._factory.repo(wire)
                      # a falsy filter is forwarded to the diff call untouched
                      matcher = file_filter
                      if file_filter:
                          # unpack the file-filter
                          repo_path, node_path = file_filter
                          matcher = match(safe_bytes(repo_path), b'', [safe_bytes(node_path)])
                      diff_options = diffopts(git=opt_git, ignorews=opt_ignorews, context=context, showfunc=1)
                      try:
                          chunks = patch.diff(
                              hg_repo, node1=commit_id_1, node2=commit_id_2, match=matcher, opts=diff_options)
                          # joining stays inside the try, next to the diff call
                          return BytesEnvelope(b"".join(chunks))
                      except RepoLookupError as e:
                          raise exceptions.LookupException(e)()
                  @reraise_safe_exceptions
                  def node_history(self, wire, revision, path, limit):
                      """
                      Return hex node ids of the file contexts in the history of ``path``.

                      The file log of ``path`` at ``revision`` is walked in reverse order.
                      Entries whose changeset is hidden or obsolete are skipped, as are
                      entries whose ``rev()`` is greater than that of the starting file
                      context.

                      :param revision: reference resolved through ``self._get_ctx``
                      :param path: file path, converted with ``safe_bytes``
                      :param limit: maximum number of entries; a falsy value means no limit
                      :return: list of ``hex(node)`` values
                      """
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _node_history(_context_uid, _repo_id, _revision, _path, _limit):
                          repo = self._factory.repo(wire)
                          ctx = self._get_ctx(repo, revision)
                          fctx = ctx.filectx(safe_bytes(path))
                          def history_iter():
                              limit_rev = fctx.rev()
                              for fctx_candidate in reversed(list(fctx.filelog())):
                                  f_obj = fctx.filectx(fctx_candidate)
                                  # NOTE: This can be problematic...we can hide ONLY history node resulting in empty history
                                  # the check must use the candidate itself; the previous code read
                                  # the enclosing loop variable, which is unbound on the first pass
                                  _ctx = f_obj.changectx()
                                  if _ctx.hidden() or _ctx.obsolete():
                                      continue
                                  if limit_rev >= f_obj.rev():
                                      yield f_obj
                          history = []
                          for cnt, entry in enumerate(history_iter()):
                              if limit and cnt >= limit:
                                  break
                              history.append(hex(entry.node()))
                          return history
                      return _node_history(context_uid, repo_id, revision, path, limit)
                  @reraise_safe_exceptions
                  def node_history_until(self, wire, revision, path, limit):
                      """
                      Return hex node ids for the file log of ``path``, newest entry first.

                      :param revision: reference resolved through ``self._get_ctx``
                      :param path: file path, converted with ``safe_bytes``
                      :param limit: when truthy, only the last ``limit`` file-log entries
                          are considered
                      :return: list of ``hex(node)`` values in reversed file-log order
                      """
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      # the cached function must accept every argument it is called with;
                      # it used to declare two parameters while being called with five
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _node_history_until(_context_uid, _repo_id, _revision, _path, _limit):
                          repo = self._factory.repo(wire)
                          ctx = self._get_ctx(repo, revision)
                          fctx = ctx.filectx(safe_bytes(path))
                          file_log = list(fctx.filelog())
                          if limit:
                              # Limit to the last n items
                              file_log = file_log[-limit:]
                          return [hex(fctx.filectx(cs).node()) for cs in reversed(file_log)]
                      return _node_history_until(context_uid, repo_id, revision, path, limit)
                  @reraise_safe_exceptions
                  def bulk_file_request(self, wire, commit_id, path, pre_load):
                      """
                      Collect several file attributes in one call.

                      Each name in ``pre_load`` is looked up in ``self._bulk_file_methods`` and
                      the resulting method is called with ``(wire, commit_id, path)``.

                      :return: ``BinaryEnvelope`` wrapping a dict of attribute name -> value
                      :raises: the ``exceptions.VcsException`` wrapper when a ``KeyError``
                          occurs inside the per-attribute ``try`` block
                      """
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _bulk_file_request(_repo_id, _commit_id, _path, _pre_load):
                          collected = {}
                          # iterates the caller's ``pre_load``; the sorted copy is only an argument
                          for attr in pre_load:
                              try:
                                  handler = self._bulk_file_methods[attr]
                                  wire.update({'cache': False})  # disable cache for bulk calls so we don't double cache
                                  collected[attr] = handler(wire, _commit_id, _path)
                              except KeyError as e:
                                  raise exceptions.VcsException(e)(f'Unknown bulk attribute: "{attr}"')
                          return collected
                      payload = _bulk_file_request(repo_id, commit_id, path, sorted(pre_load))
                      return BinaryEnvelope(payload)
                  @reraise_safe_exceptions
                  def fctx_annotate(self, wire, revision, path):
                      """
                      Annotate ``path`` at ``revision``.

                      :return: ``BinaryEnvelope`` wrapping a list of
                          ``(line_number, sha, text)`` tuples, line numbers starting at 1
                      """
                      hg_repo = self._factory.repo(wire)
                      fctx = self._get_ctx(hg_repo, revision).filectx(safe_bytes(path))
                      annotated = [
                          (line_no, ascii_str(hex(line.fctx.node())), line.text)
                          for line_no, line in enumerate(fctx.annotate(), start=1)
                      ]
                      return BinaryEnvelope(annotated)
                  @reraise_safe_exceptions
                  def fctx_node_data(self, wire, revision, path):
                      """Return ``data()`` of ``path`` at ``revision`` wrapped in a ``BytesEnvelope``."""
                      hg_repo = self._factory.repo(wire)
                      file_ctx = self._get_ctx(hg_repo, revision).filectx(safe_bytes(path))
                      return BytesEnvelope(file_ctx.data())
                  @reraise_safe_exceptions
                  def fctx_flags(self, wire, commit_id, path):
                      """Return ``flags()`` of the file context for ``path`` at ``commit_id`` (conditionally cached)."""
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _fctx_flags(_repo_id, _commit_id, _path):
                          hg_repo = self._factory.repo(wire)
                          file_ctx = self._get_ctx(hg_repo, commit_id).filectx(safe_bytes(path))
                          return file_ctx.flags()
                      return _fctx_flags(repo_id, commit_id, path)
                  @reraise_safe_exceptions
                  def fctx_size(self, wire, commit_id, path):
                      """Return ``size()`` of the file context for ``path`` at ``commit_id`` (conditionally cached)."""
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _fctx_size(_repo_id, _revision, _path):
                          hg_repo = self._factory.repo(wire)
                          file_ctx = self._get_ctx(hg_repo, commit_id).filectx(safe_bytes(path))
                          return file_ctx.size()
                      return _fctx_size(repo_id, commit_id, path)
                  @reraise_safe_exceptions
                  def get_all_commit_ids(self, wire, name):
                      """
                      Return the hex ids of all revisions in the ``visible`` filtered view
                      of the repository (conditionally cached).

                      ``name`` is only passed to the cached function as an argument.
                      """
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _get_all_commit_ids(_context_uid, _repo_id, _name):
                          hg_repo = self._factory.repo(wire)
                          visible_revs = hg_repo.filtered(b'visible').changelog.revs()
                          return [ascii_str(hg_repo[rev].hex()) for rev in visible_revs]
                      return _get_all_commit_ids(context_uid, repo_id, name)
                  @reraise_safe_exceptions
                  def get_config_value(self, wire, section, name, untrusted=False):
                      """
                      Read ``section.name`` from the repository's ui configuration.

                      ``section`` and ``name`` are converted with ``ascii_bytes``;
                      ``untrusted`` is forwarded unchanged.
                      """
                      hg_ui = self._factory.repo(wire).ui
                      return hg_ui.config(ascii_bytes(section), ascii_bytes(name), untrusted=untrusted)
                  @reraise_safe_exceptions
                  def is_large_file(self, wire, commit_id, path):
                      """
                      Return the result of ``largefiles.lfutil.isstandin`` for ``path``
                      (conditionally cached). ``commit_id`` is only a cache argument.
                      """
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _is_large_file(_context_uid, _repo_id, _commit_id, _path):
                          path_bytes = safe_bytes(path)
                          return largefiles.lfutil.isstandin(path_bytes)
                      return _is_large_file(context_uid, repo_id, commit_id, path)
                  @reraise_safe_exceptions
                  def is_binary(self, wire, revision, path):
                      """Return ``isbinary()`` of the file context for ``path`` at ``revision`` (conditionally cached)."""
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _is_binary(_repo_id, _sha, _path):
                          hg_repo = self._factory.repo(wire)
                          file_ctx = self._get_ctx(hg_repo, revision).filectx(safe_bytes(path))
                          return file_ctx.isbinary()
                      return _is_binary(repo_id, revision, path)
                  @reraise_safe_exceptions
                  def md5_hash(self, wire, revision, path):
                      """Return the MD5 hex digest of the content of ``path`` at ``revision`` (conditionally cached)."""
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _md5_hash(_repo_id, _sha, _path):
                          hg_repo = self._factory.repo(wire)
                          file_ctx = self._get_ctx(hg_repo, revision).filectx(safe_bytes(path))
                          content = file_ctx.data()
                          return hashlib.md5(content).hexdigest()
                      return _md5_hash(repo_id, revision, path)
                  @reraise_safe_exceptions
                  def in_largefiles_store(self, wire, sha):
                      """Return the result of ``largefiles.lfutil.instore`` for ``sha`` in this repository."""
                      hg_repo = self._factory.repo(wire)
                      found = largefiles.lfutil.instore(hg_repo, sha)
                      return found
                  @reraise_safe_exceptions
                  def in_user_cache(self, wire, sha):
                      """Return the result of ``largefiles.lfutil.inusercache`` for ``sha`` using the repository's ui."""
                      hg_ui = self._factory.repo(wire).ui
                      return largefiles.lfutil.inusercache(hg_ui, sha)
                  @reraise_safe_exceptions
                  def store_path(self, wire, sha):
                      """Return the result of ``largefiles.lfutil.storepath`` for ``sha`` in this repository."""
                      hg_repo = self._factory.repo(wire)
                      location = largefiles.lfutil.storepath(hg_repo, sha)
                      return location
                  @reraise_safe_exceptions
                  def link(self, wire, sha, path):
                      """
                      Call ``largefiles.lfutil.link`` with the user-cache path of ``sha``
                      and ``path``. Returns nothing.
                      """
                      hg_repo = self._factory.repo(wire)
                      cached_file = largefiles.lfutil.usercachepath(hg_repo.ui, sha)
                      largefiles.lfutil.link(cached_file, path)
                  @reraise_safe_exceptions
                  def localrepository(self, wire, create=False):
                      """
                      Ask the factory for the repository behind ``wire``, forwarding
                      ``create``. The repository object is not returned to the caller.
                      """
                      self._factory.repo(wire, create=create)
                      return None
                  @reraise_safe_exceptions
                  def lookup(self, wire, revision, both):
                      """
                      Resolve ``revision`` to a commit (conditionally cached).

                      :param revision: reference handed to ``self._get_ctx``; integers that
                          are zero or negative are shifted down by one first
                      :param both: when falsy only the hex id is returned
                      :return: ``ctx.hex()``, or the tuple ``(ctx.hex(), ctx.rev())`` when
                          ``both`` is truthy
                      :raises: the ``exceptions.LookupException`` wrapper for any of the
                          lookup errors handled below
                      """
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _lookup(_context_uid, _repo_id, _revision, _both):
                          repo = self._factory.repo(wire)
                          rev = _revision
                          if isinstance(rev, int):
                              # NOTE(marcink):
                              # since Mercurial doesn't support negative indexes properly
                              # we need to shift accordingly by one to get proper index, e.g
                              # repo[-1] => repo[-2]
                              # repo[0]  => repo[-1]
                              if rev <= 0:
                                  rev = rev + -1
                          # every handler stores the formatted original traceback on the
                          # exception object before wrapping it
                          try:
                              ctx = self._get_ctx(repo, rev)
                          except AmbiguousPrefixLookupError:
                              # the ambiguous-prefix error is replaced by a fresh RepoLookupError
                              e = RepoLookupError(rev)
                              e._org_exc_tb = format_exc(sys.exc_info())
                              raise exceptions.LookupException(e)(rev)
                          except (TypeError, RepoLookupError, binascii.Error) as e:
                              e._org_exc_tb = format_exc(sys.exc_info())
                              raise exceptions.LookupException(e)(rev)
                          except LookupError as e:
                              # NOTE(review): reads ``e.name``, so this is presumably Mercurial's
                              # LookupError rather than the builtin -- confirm against the imports
                              e._org_exc_tb = format_exc(sys.exc_info())
                              raise exceptions.LookupException(e)(e.name)
                          if not both:
                              return ctx.hex()
                          # the context is fetched again from the repo by its hex id
                          ctx = repo[ctx.hex()]
                          return ctx.hex(), ctx.rev()
                      return _lookup(context_uid, repo_id, revision, both)
                  @reraise_safe_exceptions
                  def sync_push(self, wire, url):
                      """
                      Push this repository, including all of its bookmarks, to ``url``.

                      The URL is first validated with ``self.check_url``; a falsy result
                      ends the call with ``None``. Interactive prompts are switched off
                      on both the local repository and the remote peer.

                      :return: the ``cgresult`` attribute of the ``exchange.push`` result
                      """
                      if not self.check_url(url, wire['config']):
                          return None
                      hg_repo = self._factory.repo(wire)
                      # Disable any prompts for this repo
                      hg_repo.ui.setconfig(b'ui', b'interactive', b'off', b'-y')
                      bookmark_names = list(dict(hg_repo._bookmarks))
                      remote = peer(hg_repo, {}, safe_bytes(url))
                      # Disable any prompts for this remote
                      remote.ui.setconfig(b'ui', b'interactive', b'off', b'-y')
                      push_result = exchange.push(
                          hg_repo, remote, newbranch=True, bookmarks=bookmark_names)
                      return push_result.cgresult
                  @reraise_safe_exceptions
                  def revision(self, wire, rev):
                      """Return ``rev()`` of the context resolved for ``rev``; not cached."""
                      hg_repo = self._factory.repo(wire)
                      return self._get_ctx(hg_repo, rev).rev()
                  @reraise_safe_exceptions
                  def rev_range(self, wire, commit_filter):
                      """
                      Return hex ids of the revisions selected by ``commit_filter``.

                      Each entry of ``commit_filter`` is converted with ``ascii_bytes`` and
                      the list is handed to ``revrange``. The cached function receives a
                      sorted copy of the filter as its argument.
                      """
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _rev_range(_context_uid, _repo_id, _filter):
                          hg_repo = self._factory.repo(wire)
                          specs = [ascii_bytes(spec) for spec in commit_filter]
                          return [ascii_str(hg_repo[rev].hex()) for rev in revrange(hg_repo, specs)]
                      return _rev_range(context_uid, repo_id, sorted(commit_filter))
                  @reraise_safe_exceptions
                  def rev_range_hash(self, wire, node):
                      """
                      Return hex ids for every revision number between the smallest and the
                      largest revision matched by the spec ``node + ':'`` (both inclusive).
                      """
                      hg_repo = self._factory.repo(wire)
                      def get_revs(repo, rev_opt):
                          # returns a (highest, lowest) pair of revision numbers
                          if not rev_opt:
                              return len(repo) - 1, 0
                          revs = revrange(repo, rev_opt)
                          if len(revs) == 0:
                              return (nullrev, nullrev)
                          return max(revs), min(revs)
                      stop, start = get_revs(hg_repo, [node + ':'])
                      return [ascii_str(hg_repo[r].hex()) for r in range(start, stop + 1)]
                  @reraise_safe_exceptions
                  def revs_from_revspec(self, wire, rev_spec, *args, **kwargs):
                      """
                      Evaluate ``rev_spec`` and return the matching revisions as a list.

                      :param rev_spec: revset expression passed to ``repo.revs``
                      :param args: positional arguments forwarded to ``repo.revs``
                      :param kwargs: only ``other_path`` is read. When it is given and
                          differs from the path in ``wire``, the spec is evaluated on a
                          union repository built from both paths.
                      """
                      org_path = safe_bytes(wire["path"])
                      other_path = safe_bytes(kwargs.pop('other_path', ''))
                      # case when we want to compare two independent repositories
                      # compare the converted values; comparing against the raw wire["path"]
                      # mixes converted and unconverted values and never detects the same repo
                      if other_path and other_path != org_path:
                          baseui = self._factory._create_config(wire["config"])
                          repo = unionrepo.makeunionrepository(baseui, other_path, org_path)
                      else:
                          repo = self._factory.repo(wire)
                      return list(repo.revs(rev_spec, *args))
                  @reraise_safe_exceptions
                  def verify(self, wire,):
                      """
                      Run ``verify.verify`` on the repository and return the text captured
                      by the ui patched through ``patch_ui_message_output``.
                      """
                      hg_repo = self._factory.repo(wire)
                      fresh_ui = self._factory._create_config(wire['config'])
                      capture_ui, output = patch_ui_message_output(fresh_ui)
                      hg_repo.ui = capture_ui
                      verify.verify(hg_repo)
                      return output.getvalue()
                  @reraise_safe_exceptions
                  def hg_update_cache(self, wire,):
                      """
                      Call ``repo.updatecaches(full=True)`` while holding the repository's
                      wlock and lock, and return the captured ui output.
                      """
                      hg_repo = self._factory.repo(wire)
                      fresh_ui = self._factory._create_config(wire['config'])
                      capture_ui, output = patch_ui_message_output(fresh_ui)
                      hg_repo.ui = capture_ui
                      with hg_repo.wlock(), hg_repo.lock():
                          hg_repo.updatecaches(full=True)
                      return output.getvalue()
                  @reraise_safe_exceptions
                  def hg_rebuild_fn_cache(self, wire,):
                      """
                      Run ``repair.rebuildfncache`` for the repository and return the
                      captured ui output.
                      """
                      hg_repo = self._factory.repo(wire)
                      fresh_ui = self._factory._create_config(wire['config'])
                      capture_ui, output = patch_ui_message_output(fresh_ui)
                      hg_repo.ui = capture_ui
                      repair.rebuildfncache(capture_ui, hg_repo)
                      return output.getvalue()
                  @reraise_safe_exceptions
                  def tags(self, wire):
                      """
                      Return a dict of tag name -> hex node id taken from ``repo.tags()``
                      (conditionally cached).
                      """
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _tags(_context_uid, _repo_id):
                          hg_repo = self._factory.repo(wire)
                          tag_map = {}
                          for tag_name, node in hg_repo.tags().items():
                              tag_map[safe_str(tag_name)] = ascii_str(hex(node))
                          return tag_map
                      return _tags(context_uid, repo_id)
                  @reraise_safe_exceptions
                  def update(self, wire, node='', clean=False):
                      """
                      Run ``commands.update`` on the repository.

                      :param node: target, converted with ``safe_bytes`` before the call
                      :param clean: forwarded unchanged as ``clean``
                      """
                      hg_repo = self._factory.repo(wire)
                      update_ui = self._factory._create_config(wire['config'])
                      commands.update(update_ui, hg_repo, node=safe_bytes(node), clean=clean)
                  @reraise_safe_exceptions
                  def identify(self, wire):
                      """
                      Run ``commands.identify(..., id=True)`` and return the bytes it wrote
                      to the ui.
                      """
                      hg_repo = self._factory.repo(wire)
                      capture_ui = self._factory._create_config(wire['config'])
                      buffer = io.BytesIO()
                      # everything the command writes lands in the in-memory buffer
                      capture_ui.write = buffer.write
                      # This is required to get a full node id
                      capture_ui.debugflag = True
                      commands.identify(capture_ui, hg_repo, id=True)
                      return buffer.getvalue()
                  @reraise_safe_exceptions
                  def heads(self, wire, branch=None):
                      """
                      Run ``commands.heads`` with the template ``{node} `` and return the
                      bytes it wrote.

                      :param branch: when truthy, passed (as bytes) as the only positional
                          argument to the command
                      """
                      hg_repo = self._factory.repo(wire)
                      capture_ui = self._factory._create_config(wire['config'])
                      buffer = io.BytesIO()
                      def write(data, **unused_kwargs):
                          # keyword arguments given by the caller are dropped
                          buffer.write(data)
                      capture_ui.write = write
                      args = [safe_bytes(branch)] if branch else []
                      commands.heads(capture_ui, hg_repo, *args, template=b'{node} ')
                      return buffer.getvalue()
                  @reraise_safe_exceptions
                  def ancestor(self, wire, revision1, revision2):
                      """
                      Return ``hex()`` of the changelog ancestor of the two given revisions.
                      Both revisions are converted with ``safe_bytes`` and resolved through
                      ``repo.lookup`` before being handed to ``changelog.ancestor``.
                      """
                      hg_repo = self._factory.repo(wire)
                      cl = hg_repo.changelog
                      resolve = hg_repo.lookup
                      first_node = resolve(safe_bytes(revision1))
                      second_node = resolve(safe_bytes(revision2))
                      return hex(cl.ancestor(first_node, second_node))
                  @reraise_safe_exceptions
                  def clone(self, wire, source, dest, update_after_clone=False, hooks=True):
                      """
                      Clone `source` into `dest` using the module level ``clone`` helper.
                      :param update_after_clone: when false the clone is made with ``noupdate=True``.
                      :param hooks: forwarded to ``_create_config`` when building the ui.
                      """
                      hg_ui = self._factory._create_config(wire["config"], hooks=hooks)
                      src = safe_bytes(source)
                      dst = safe_bytes(dest)
                      skip_update = not update_after_clone
                      clone(hg_ui, src, dst, noupdate=skip_update)
                  @reraise_safe_exceptions
                  def commitctx(self, wire, message, parents, commit_time, commit_timezone, user, files, extra, removed, updated):
                      """
                      Build a ``memctx`` from the given data and commit it via ``repo.commitctx``.
                      :param files: paths touched by the commit; each one is resolved through
                          the local file-context callback.
                      :param removed: collection of (str) paths to mark as removed.
                      :param updated: iterable of dicts with ``path``, ``content`` and ``mode`` keys.
                      :param extra: mapping whose keys and values are converted with ``safe_bytes``.
                      :return: ``hex()`` of the node returned by ``repo.commitctx``.
                      """
                      repo = self._factory.repo(wire)
                      baseui = self._factory._create_config(wire['config'])
                      publishing = baseui.configbool(b'phases', b'publish')
                      def _filectxfn(_repo, ctx, path: bytes):
                          """
                          Callback for mercurial's commit machinery: describes `path` as
                          removed (``None``) or added/changed (a ``memfilectx``).
                          """
                          # a removed path is signalled by returning None
                          if safe_str(path) in removed:
                              return None
                          # otherwise the path has to be one of the added/changed nodes
                          for node in updated:
                              node_path = safe_bytes(node['path'])
                              if node_path != path:
                                  continue
                              return memfilectx(
                                  _repo,
                                  changectx=ctx,
                                  path=node_path,
                                  data=safe_bytes(node['content']),
                                  islink=False,
                                  isexec=bool(node['mode'] & stat.S_IXUSR),
                                  copysource=False)
                          abort_exc = exceptions.AbortException()
                          raise abort_exc(f"Given path haven't been marked as added, changed or removed ({path})")
                      # new commits get the phase matching the `phases.publish` setting
                      new_commit_phase = b'public' if publishing else b'draft'
                      phase_override = {(b'phases', b'new-commit'): new_commit_phase}
                      with repo.ui.configoverride(phase_override):
                          extra_bytes = {safe_bytes(k): safe_bytes(v) for k, v in extra.items()}
                          commit_ctx = memctx(
                              repo=repo,
                              parents=parents,
                              text=safe_bytes(message),
                              files=[safe_bytes(x) for x in files],
                              filectxfn=_filectxfn,
                              user=safe_bytes(user),
                              date=(commit_time, commit_timezone),
                              extra=extra_bytes)
                          return hex(repo.commitctx(commit_ctx))
                  @reraise_safe_exceptions
                  def pull(self, wire, url, commit_ids=None):
                      """
                      Pull from `url` into the repository using ``exchange.pull``.
                      :param commit_ids: optional list of commit ids; when truthy each one is
                          converted with ``bin`` (presumably mercurial's hex-to-binary helper,
                          not the builtin - confirm against the module imports) and used as
                          ``heads``.
                      :return: the ``cgresult`` attribute of the pull operation.
                      """
                      repo = self._factory.repo(wire)
                      # no interactive prompts on the local repo ...
                      repo.ui.setconfig(b'ui', b'interactive', b'off', b'-y')
                      remote = peer(repo, {}, safe_bytes(url))
                      # ... nor on the remote peer
                      remote.ui.setconfig(b'ui', b'interactive', b'off', b'-y')
                      heads = [bin(commit_id) for commit_id in commit_ids] if commit_ids else commit_ids
                      pull_op = exchange.pull(repo, remote, heads=heads, force=None)
                      return pull_op.cgresult
                  @reraise_safe_exceptions
                  def pull_cmd(self, wire, source, bookmark='', branch='', revision='', hooks=True):
                      """
                      Run mercurial's ``pull`` command from `source`.
                      `bookmark`, `branch` and `revision` may each be a single value or a list;
                      only the truthy ones are passed on (as ``bookmark``, ``branch`` and ``rev``).
                      """
                      repo = self._factory.repo(wire)
                      baseui = self._factory._create_config(wire['config'], hooks=hooks)
                      source = safe_bytes(source)
                      def _as_bytes(value):
                          # lists are converted element-wise, anything else as a whole
                          if isinstance(value, list):
                              return [safe_bytes(item) for item in value]
                          return safe_bytes(value)
                      # Mercurial internally has a lot of logic that checks ONLY if an
                      # option is defined, so undefined options must not be passed at all
                      candidates = (('bookmark', bookmark), ('branch', branch), ('rev', revision))
                      opts = {
                          opt_name: _as_bytes(opt_value)
                          for opt_name, opt_value in candidates
                          if opt_value
                      }
                      commands.pull(baseui, repo, source, **opts)
                  @reraise_safe_exceptions
                  def push(self, wire, revisions, dest_path, hooks: bool = True, push_branches: bool = False):
                      """
                      Run mercurial's ``push`` command towards `dest_path`.
                      :param revisions: a single revision or a list of revisions; converted to bytes.
                      :param hooks: forwarded to ``_create_config`` when building the ui.
                      :param push_branches: passed as the ``new_branch`` option.
                      """
                      repo = self._factory.repo(wire)
                      baseui = self._factory._create_config(wire['config'], hooks=hooks)
                      if isinstance(revisions, list):
                          rev = [safe_bytes(item) for item in revisions]
                      else:
                          rev = safe_bytes(revisions)
                      destination = safe_bytes(dest_path)
                      commands.push(baseui, repo, destination, rev=rev, new_branch=push_branches)
                  @reraise_safe_exceptions
                  def strip(self, wire, revision, update, backup):
                      """
                      Strip `revision` from the repository via ``hgext_strip.strip``.
                      `update` and `backup` are forwarded unchanged as keyword options.
                      """
                      repo = self._factory.repo(wire)
                      target_ctx = self._get_ctx(repo, revision)
                      strip_opts = {'update': update, 'backup': backup}
                      hgext_strip.strip(repo.baseui, repo, target_ctx.node(), **strip_opts)
                  @reraise_safe_exceptions
                  def get_unresolved_files(self, wire):
                      """
                      Run mercurial's ``resolve`` command with ``list=True`` and return its
                      output split into lines (bytes, without line endings).
                      """
                      repo = self._factory.repo(wire)
                      log.debug('Calculating unresolved files for repo: %s', repo)
                      captured = io.BytesIO()
                      def _capture(data, **unused_kwargs):
                          captured.write(data)
                      baseui = self._factory._create_config(wire['config'])
                      baseui.write = _capture
                      commands.resolve(baseui, repo, list=True)
                      return captured.getvalue().splitlines()
                  @reraise_safe_exceptions
                  def merge(self, wire, revision):
                      """
                      Merge `revision` into the working directory with mercurial's ``merge`` command.
                      """
                      repo = self._factory.repo(wire)
                      baseui = self._factory._create_config(wire['config'])
                      # `internal:dump` is used as merge tool. Interactive mode is switched
                      # off because, with sub repositories, mercurial would otherwise prompt
                      # the user on conflicts or differing sub repository sources; without
                      # prompting it falls back to a default value.
                      ui_settings = (
                          (b'merge', b'internal:dump'),
                          (b'interactive', False),
                      )
                      for key, value in ui_settings:
                          repo.ui.setconfig(b'ui', key, value)
                      commands.merge(baseui, repo, rev=safe_bytes(revision))
                  @reraise_safe_exceptions
                  def merge_state(self, wire):
                      """
                      Return the list of unresolved entries reported by ``hg_merge.mergestate``.
                      """
                      repo = self._factory.repo(wire)
                      hg_ui = repo.ui
                      hg_ui.setconfig(b'ui', b'merge', b'internal:dump')
                      # With sub repositories mercurial prompts the user on merge conflicts
                      # or differing sub repository sources. With the interactive flag set
                      # to `False` it does not prompt and uses a default value instead.
                      hg_ui.setconfig(b'ui', b'interactive', False)
                      state = hg_merge.mergestate(repo)
                      return list(state.unresolved())
                  @reraise_safe_exceptions
                  def commit(self, wire, message, username, close_branch=False):
                      """
                      Run mercurial's ``commit`` command with the given message.
                      :param username: stored as ``ui.username`` on the repository ui first.
                      :param close_branch: forwarded unchanged to ``commands.commit``.
                      """
                      repo = self._factory.repo(wire)
                      baseui = self._factory._create_config(wire['config'])
                      committer = safe_bytes(username)
                      repo.ui.setconfig(b'ui', b'username', committer)
                      commit_message = safe_bytes(message)
                      commands.commit(baseui, repo, message=commit_message, close_branch=close_branch)
                  @reraise_safe_exceptions
                  def rebase(self, wire, source='', dest='', abort=False):
                      """
                      Run the rebase extension on the repository.
                      :param source: passed as ``base``; falsy values become an empty bytes string.
                      :param dest: passed as ``dest``; falsy values become an empty bytes string.
                      :param abort: forwarded as ``abort``; ``keep`` is set to its negation.
                      """
                      repo = self._factory.repo(wire)
                      baseui = self._factory._create_config(wire['config'])
                      repo.ui.setconfig(b'ui', b'merge', b'internal:dump')
                      # With sub repositories mercurial prompts the user on merge conflicts
                      # or differing sub repository sources. With the interactive flag set
                      # to `False` it does not prompt and uses a default value instead.
                      repo.ui.setconfig(b'ui', b'interactive', False)
                      base_rev = safe_bytes(source or '')
                      dest_rev = safe_bytes(dest or '')
                      rebase.rebase(baseui, repo, base=base_rev, dest=dest_rev,
                                    abort=abort, keep=not abort)
                  @reraise_safe_exceptions
                  def tag(self, wire, name, revision, message, local, user, tag_time, tag_timezone):
                      """
                      Tag `revision` with `name` through ``hg_tag.tag``.
                      :raises: the exception built by ``exceptions.AbortException`` when
                          mercurial raises ``Abort``.
                      """
                      repo = self._factory.repo(wire)
                      target_node = self._get_ctx(repo, revision).node()
                      tag_date = (tag_time, tag_timezone)
                      try:
                          hg_tag.tag(
                              repo, safe_bytes(name), target_node, safe_bytes(message),
                              local, safe_bytes(user), tag_date)
                      except Abort as exc:
                          log.exception("Tag operation aborted")
                          # the exception can contain unicode, hence repr() for the message
                          raise exceptions.AbortException(exc)(repr(exc))
                  @reraise_safe_exceptions
                  def bookmark(self, wire, bookmark, revision=''):
                      """
                      Create or move `bookmark` with mercurial's ``bookmark`` command (``force=True``).
                      :param revision: passed as ``rev``; falsy values become an empty bytes string.
                      """
                      repo = self._factory.repo(wire)
                      baseui = self._factory._create_config(wire['config'])
                      bookmark_name = safe_bytes(bookmark)
                      rev = safe_bytes(revision or '')
                      commands.bookmark(baseui, repo, bookmark_name, rev=rev, force=True)
                  @reraise_safe_exceptions
                  def install_hooks(self, wire, force=False):
                      """
                      No-op: we don't need any special hooks for Mercurial.
                      Both arguments are accepted and ignored; always returns ``None``.
                      """
                      return None
                  @reraise_safe_exceptions
                  def get_hooks_info(self, wire):
                      """
                      Report ``vcsserver.__version__`` as both the ``pre_version`` and the
                      ``post_version`` of the hooks.
                      """
                      version = vcsserver.__version__
                      return dict(pre_version=version, post_version=version)
                  @reraise_safe_exceptions
                  def set_head_ref(self, wire, head_name):
                      """
                      No-op for this backend; the arguments are ignored and ``None`` is returned.
                      NOTE(review): presumably kept for API parity with other backends - confirm.
                      """
                      return None
                  @reraise_safe_exceptions
                  def archive_repo(self, wire, archive_name_key, kind, mtime, archive_at_path,
                                   archive_dir_name, commit_id, cache_config):
                      """
                      Delegate archive creation to ``store_archive_in_cache``, supplying a
                      walker that enumerates the files of a commit.
                      The walker yields one ``ArchiveNode`` per manifest entry, built from the
                      file path, a mode (0o755 when the ``x`` flag is set, otherwise 0o644),
                      whether the ``l`` flag is set, and the bound ``data`` method of the
                      file context.
                      """
                      def file_walker(_commit_id, path):
                          repo = self._factory.repo(wire)
                          ctx = repo[_commit_id]
                          # an empty path or '/' means the whole tree, anything else a sub-tree glob
                          if path in ('', '/'):
                              matcher = alwaysmatcher(badfn=None)
                          else:
                              matcher = patternmatcher('', [(b'glob', safe_bytes(path)+b'/**', b'')], badfn=None)
                          for fn in ctx.manifest().walk(matcher):
                              flags = ctx.flags(fn)
                              mode = 0o755 if b'x' in flags else 0o644
                              is_link = b'l' in flags
                              yield ArchiveNode(fn, mode, is_link, ctx[fn].data)
                      return store_archive_in_cache(
                          file_walker, archive_name_key, kind, mtime, archive_at_path, archive_dir_name, commit_id,
                          cache_config=cache_config)

vcsserver/remote/svn_remote.py

0 +5 -6

              # RhodeCode VCSServer provides access to different vcs backends via network.
              # Copyright (C) 2014-2023 RhodeCode GmbH
              #
              # This program is free software; you can redistribute it and/or modify
              # it under the terms of the GNU General Public License as published by
              # the Free Software Foundation; either version 3 of the License, or
              # (at your option) any later version.
              #
              # This program is distributed in the hope that it will be useful,
              # but WITHOUT ANY WARRANTY; without even the implied warranty of
              # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
              # GNU General Public License for more details.
              #
              # You should have received a copy of the GNU General Public License
              # along with this program; if not, write to the Free Software Foundation,
              # Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301  USA
              import os
              import subprocess
              from urllib.error import URLError
              import urllib.parse
              import logging
              import posixpath as vcspath
              import io
              import urllib.request
              import urllib.parse
              import urllib.error
              import traceback
              import svn.client  # noqa
              import svn.core  # noqa
              import svn.delta  # noqa
              import svn.diff  # noqa
              import svn.fs  # noqa
              import svn.repos  # noqa
              from vcsserver import svn_diff, exceptions, subprocessio, settings
              from vcsserver.base import (
                  RepoFactory,
                  raise_from_original,
                  ArchiveNode,
                  store_archive_in_cache,
                  BytesEnvelope,
                  BinaryEnvelope,
              )
              from vcsserver.exceptions import NoContentException
              from vcsserver.str_utils import safe_str, safe_bytes
              from vcsserver.type_utils import assert_bytes
              from vcsserver.vcs_base import RemoteBase
              from vcsserver.lib.svnremoterepo import svnremoterepo
              log = logging.getLogger(__name__)
              # Maps the symbolic compatibility names accepted as `compatible_version`
              # to the version string stored under 'compatible-version' when a
              # repository is created (see SubversionFactory._create_repo). Values not
              # found here are used there as given.
              svn_compatible_versions_map = {
                  'pre-1.4-compatible': '1.3',
                  'pre-1.5-compatible': '1.4',
                  'pre-1.6-compatible': '1.5',
                  'pre-1.8-compatible': '1.7',
                  'pre-1.9-compatible': '1.8',
              }
              # Default 'compatible-version' for newly created repositories when the
              # caller does not request a specific one.
              current_compatible_version = '1.14'
              def reraise_safe_exceptions(func):
                  """
                  Decorator for converting svn exceptions to something neutral.
                  Exceptions that already carry a ``_vcs_kind`` attribute are re-raised
                  untouched; every other exception is logged and handed to
                  ``raise_from_original`` together with an ``exceptions.UnhandledException``.
                  The wrapper keeps the metadata (name, docstring, ...) of `func`.
                  """
                  # imported locally so the decorator does not depend on a module level import
                  import functools
                  @functools.wraps(func)
                  def wrapper(*args, **kwargs):
                      try:
                          return func(*args, **kwargs)
                      except Exception as e:
                          if not hasattr(e, '_vcs_kind'):
                              log.exception("Unhandled exception in svn remote call")
                              raise_from_original(exceptions.UnhandledException(e), e)
                          raise
                  return wrapper
              class SubversionFactory(RepoFactory):
                  """
                  Factory that opens or creates ``svn.repos`` objects for the path in a wire.
                  """
                  repo_type = 'svn'
                  def _create_repo(self, wire, create, compatible_version):
                      """
                      Open the repository at ``wire['path']``, or create it when `create` is set.
                      On creation the 'compatible-version' fs option defaults to
                      ``current_compatible_version``; a truthy `compatible_version` overrides
                      it, translated through ``svn_compatible_versions_map`` when listed there.
                      """
                      path = svn.core.svn_path_canonicalize(wire['path'])
                      if not create:
                          repo = svn.repos.open(path)
                      else:
                          version = current_compatible_version
                          if compatible_version:
                              mapped_version = svn_compatible_versions_map.get(compatible_version)
                              version = mapped_version or compatible_version
                          fs_config = {'compatible-version': version}
                          log.debug('Create SVN repo with config `%s`', fs_config)
                          repo = svn.repos.create(path, "", "", None, fs_config)
                      log.debug('repository created: got SVN object: %s', repo)
                      return repo
                  def repo(self, wire, create=False, compatible_version=None):
                      """
                      Get a repository instance for the given path.
                      Every call goes straight to ``_create_repo``.
                      """
                      svn_repo = self._create_repo(wire, create, compatible_version)
                      return svn_repo
              # Translates svn node kind constants into the 'file' / 'dir' strings
              # returned by SvnRemote. Lookups are done with `.get(..., None)`, so
              # kinds not listed here yield None.
              NODE_TYPE_MAPPING = {
                  svn.core.svn_node_file: 'file',
                  svn.core.svn_node_dir: 'dir',
              }
              class SvnRemote(RemoteBase):
                  def __init__(self, factory, hg_factory=None):
                      """
                      Store the repository factory and register the bulk attribute handlers.
                      :param factory: object used as ``self._factory`` to obtain repositories.
                      :param hg_factory: accepted but not used here.
                      """
                      self._factory = factory
                      # NOT supported in SVN ATM...
                      self._bulk_methods = {}
                      # attribute name -> bound method used by `bulk_file_request`
                      bulk_file_methods = {}
                      bulk_file_methods["size"] = self.get_file_size
                      bulk_file_methods["data"] = self.get_file_content
                      bulk_file_methods["flags"] = self.get_node_type
                      bulk_file_methods["is_binary"] = self.is_binary
                      bulk_file_methods["md5"] = self.md5_hash
                      self._bulk_file_methods = bulk_file_methods
                  @reraise_safe_exceptions
                  def bulk_file_request(self, wire, commit_id, path, pre_load):
                      """
                      Fetch several attributes of one file in a single call.
                      Each name in `pre_load` is resolved through ``self._bulk_file_methods``
                      and invoked with ``(wire, commit_id, path)``; the collected mapping is
                      returned wrapped in a ``BinaryEnvelope``.
                      :param commit_id: converted with ``int()`` before use.
                      :raises: the exception built by ``exceptions.VcsException`` when a
                          ``KeyError`` occurs while handling an attribute.
                      """
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      # the unified API hands the commit id over as str, SVN needs an int
                      commit_id = int(commit_id)
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _bulk_file_request(_repo_id, _commit_id, _path, _pre_load):
                          collected = {}
                          for attr in pre_load:
                              try:
                                  handler = self._bulk_file_methods[attr]
                                  # disable cache for the nested call so we don't double cache
                                  wire.update({'cache': False})
                                  collected[attr] = handler(wire, _commit_id, _path)
                              except KeyError as err:
                                  raise exceptions.VcsException(err)(f'Unknown bulk attribute: "{attr}"')
                          return collected
                      attributes = _bulk_file_request(repo_id, commit_id, path, sorted(pre_load))
                      return BinaryEnvelope(attributes)
                  @reraise_safe_exceptions
                  def discover_svn_version(self):
                      """
                      Return ``safe_str`` of ``svn.core.SVN_VERSION``, or ``safe_str(None)``
                      when ``svn.core`` cannot be imported.
                      """
                      try:
                          import svn.core
                      except ImportError:
                          return safe_str(None)
                      return safe_str(svn.core.SVN_VERSION)
                  @reraise_safe_exceptions
                  def is_empty(self, wire):
                      """
                      Tell whether the repository has no revisions, i.e. ``lookup(wire, -1)``
                      equals 0. Any exception is logged and reported as ``False``.
                      """
                      try:
                          head_revision = self.lookup(wire, -1)
                          return head_revision == 0
                      except Exception:
                          log.exception("failed to read object_store")
                      return False
                  def check_url(self, url, config):
                      """
                      Validate that `url` points at a Subversion repository.
                      The check reads the ``uuid`` of the remote; per the original note this
                      only succeeds for a proper repository and raises otherwise.
                      :param config: accepted but not used here.
                      :return: ``True`` when the check passes.
                      :raises URLError: when reading the uuid raises any exception.
                      """
                      username, password, src_url = self.get_url_and_credentials(url)
                      try:
                          remote = svnremoterepo(safe_bytes(username), safe_bytes(password), safe_bytes(src_url))
                          remote.svn().uuid
                      except Exception:
                          log.debug("Invalid Subversion url: `%s`, tb: %s", url, traceback.format_exc())
                          raise URLError(f'"{url}" is not a valid Subversion source url.')
                      else:
                          return True
                  def is_path_valid_repository(self, wire, path):
                      """
                      Check whether `path` can be opened as a Subversion repository.
                      :return: ``False`` when `path` has no ``format`` file or when
                          ``svn.repos.open`` raises ``SubversionException``, else ``True``.
                      """
                      # NOTE(marcink): cheap pre-condition first - repos.open might be
                      # expensive, while a missing 'format' file already rules the path out
                      format_file = os.path.join(path, 'format')
                      if not os.path.isfile(format_file):
                          return False
                      try:
                          svn.repos.open(path)
                      except svn.core.SubversionException:
                          log.debug("Invalid Subversion path `%s`, tb: %s", path, traceback.format_exc())
                          return False
                      else:
                          return True
                  @reraise_safe_exceptions
                  def verify(self, wire):
                      """
                      Return the stdout of ``svnadmin info`` for the repository at ``wire['path']``.
                      :raises Exception: when ``is_path_valid_repository`` rejects the path.
                      """
                      repo_path = wire['path']
                      if not self.is_path_valid_repository(wire, repo_path):
                          raise Exception(
                              f"Path {repo_path} is not a valid Subversion repository.")
                      cmd = ['svnadmin', 'info', repo_path]
                      # stderr is returned by the helper as well but is not used here
                      stdout, _stderr = subprocessio.run_command(cmd)
                      return stdout
                  @reraise_safe_exceptions
                  def lookup(self, wire, revision):
                      """
                      Return the youngest revision number of the repository.
                      :param revision: only ``-1``, ``None`` and ``'HEAD'`` are supported.
                      :raises NotImplementedError: for any other `revision` value.
                      """
                      supported = (-1, None, 'HEAD')
                      if revision not in supported:
                          raise NotImplementedError
                      repo = self._factory.repo(wire)
                      return svn.fs.youngest_rev(svn.repos.fs(repo))
                  @reraise_safe_exceptions
                  def lookup_interval(self, wire, start_ts, end_ts):
                      """
                      Translate a timestamp interval into a ``(start_rev, end_rev)`` tuple.
                      A falsy `start_ts` yields start revision 1, otherwise the revision dated
                      at `start_ts` plus one. A falsy `end_ts` yields the youngest revision,
                      otherwise the revision dated at `end_ts`.
                      """
                      repo = self._factory.repo(wire)
                      fsobj = svn.repos.fs(repo)
                      if not start_ts:
                          start_rev = 1
                      else:
                          start_rev = svn.repos.dated_revision(repo, apr_time_t(start_ts)) + 1
                      if not end_ts:
                          end_rev = svn.fs.youngest_rev(fsobj)
                      else:
                          end_rev = svn.repos.dated_revision(repo, apr_time_t(end_ts))
                      return start_rev, end_rev
                  @reraise_safe_exceptions
                  def revision_properties(self, wire, revision):
                      """
                      Return ``svn.fs.revision_proplist`` for `revision`, optionally cached
                      per ``(repo_id, revision)`` through the wire's cache region.
                      """
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _revision_properties(_repo_id, _revision):
                          svn_repo = self._factory.repo(wire)
                          return svn.fs.revision_proplist(svn.repos.fs(svn_repo), _revision)
                      return _revision_properties(repo_id, revision)
                  def revision_changes(self, wire, revision):
                      """
                      Collect the paths added, changed and removed in `revision`.
                      The revision is replayed into a ``svn.repos.ChangeCollector``; directory
                      nodes are skipped, and REPLACE actions are counted as changed.
                      :return: dict with the keys ``added``, ``changed`` and ``removed``.
                      :raises NotImplementedError: for a change action that is none of
                          ADD, MODIFY, REPLACE or DELETE.
                      """
                      repo = self._factory.repo(wire)
                      fsobj = svn.repos.fs(repo)
                      rev_root = svn.fs.revision_root(fsobj, revision)
                      collector = svn.repos.ChangeCollector(fsobj, rev_root)
                      editor_ptr, editor_baton = svn.delta.make_editor(collector)
                      # replay from the empty base dir, without sending deltas
                      svn.repos.replay2(
                          rev_root, "", svn.core.SVN_INVALID_REVNUM, False,
                          editor_ptr, editor_baton, None)
                      changes = {
                          'added': [],
                          'changed': [],
                          'removed': [],
                      }
                      # TODO: CHANGE_ACTION_REPLACE: Figure out where it belongs
                      for path, change in collector.changes.items():
                          # TODO: Decide what to do with directory nodes. Subversion can add
                          # empty directories.
                          if change.item_kind == svn.core.svn_node_dir:
                              continue
                          action = change.action
                          if action == svn.repos.CHANGE_ACTION_ADD:
                              changes['added'].append(path)
                          elif action in (svn.repos.CHANGE_ACTION_MODIFY, svn.repos.CHANGE_ACTION_REPLACE):
                              changes['changed'].append(path)
                          elif action == svn.repos.CHANGE_ACTION_DELETE:
                              changes['removed'].append(path)
                          else:
                              raise NotImplementedError(
                                  f"Action {action} not supported on path {path}")
                      return changes
                  @reraise_safe_exceptions
                  def node_history(self, wire, path, revision, limit):
                      """
                      Return the revisions in which `path` changed, walking back from `revision`.
                      Copies are not crossed. A truthy `limit` stops the walk once that many
                      revisions were collected.
                      """
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      # NOTE(review): the inner function name is kept as-is; it presumably
                      # takes part in the cache key - confirm before renaming.
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _assert_correct_path(_context_uid, _repo_id, _path, _revision, _limit):
                          cross_copies = False
                          svn_repo = self._factory.repo(wire)
                          rev_root = svn.fs.revision_root(svn.repos.fs(svn_repo), _revision)
                          revisions = []
                          cursor = svn.fs.history_prev(svn.fs.node_history(rev_root, _path), cross_copies)
                          while cursor:
                              _node_path, node_revision = svn.fs.history_location(cursor)
                              revisions.append(node_revision)
                              if _limit and len(revisions) >= _limit:
                                  break
                              cursor = svn.fs.history_prev(cursor, cross_copies)
                          return revisions
                      return _assert_correct_path(context_uid, repo_id, path, revision, limit)
                  @reraise_safe_exceptions
                  def node_properties(self, wire, path, revision):
                      """
                      Return ``svn.fs.node_proplist`` of `path` at `revision`, optionally
                      cached per ``(repo_id, path, revision)`` through the wire's cache region.
                      """
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _node_properties(_repo_id, _path, _revision):
                          svn_repo = self._factory.repo(wire)
                          rev_root = svn.fs.revision_root(svn.repos.fs(svn_repo), _revision)
                          return svn.fs.node_proplist(rev_root, _path)
                      return _node_properties(repo_id, path, revision)
                  def file_annotate(self, wire, path, revision):
                      """
                      Produce blame information for `path` at `revision`.
                      The file is addressed through a ``file://`` URL built from
                      ``wire['path']`` and `path`; ``svn.client.blame2`` is called with a start
                      revision built from 0 and peg/end revisions built from `revision`.
                      :return: ``BinaryEnvelope`` wrapping a list of
                          ``(line_no, revision, line)`` tuples.
                      :raises Exception: when the blame call raises ``SubversionException``.
                      """
                      repo_file_path = vcspath.join(wire['path'], path)
                      file_uri = svn.core.svn_path_canonicalize(
                          'file://' + urllib.request.pathname2url(repo_file_path))
                      start_rev = svn_opt_revision_value_t(0)
                      peg_rev = end_rev = svn_opt_revision_value_t(revision)
                      annotations = []
                      def receiver(line_no, revision, author, date, line, pool):
                          # only line number, revision and line content are kept
                          annotations.append((line_no, revision, line))
                      # TODO: Cannot use blame5, missing typemap function in the swig code
                      try:
                          svn.client.blame2(
                              file_uri, peg_rev, start_rev, end_rev,
                              receiver, svn.client.create_context())
                      except svn.core.SubversionException as exc:
                          log.exception("Error during blame operation.")
                          raise Exception(
                              f"Blame not supported or file does not exist at path {path}. "
                              f"Error {exc}.")
                      return BinaryEnvelope(annotations)
                  @reraise_safe_exceptions
                  def get_node_type(self, wire, revision=None, path=''):
                      """
                      Return ``'file'`` or ``'dir'`` for `path` at `revision`, or ``None`` when
                      the node kind is not in ``NODE_TYPE_MAPPING``.
                      :param revision: ``None`` means the youngest revision.
                      """
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _get_node_type(_repo_id, _revision, _path):
                          svn_repo = self._factory.repo(wire)
                          fs_ptr = svn.repos.fs(svn_repo)
                          target_rev = svn.fs.youngest_rev(fs_ptr) if _revision is None else _revision
                          root = svn.fs.revision_root(fs_ptr, target_rev)
                          node_kind = svn.fs.check_path(root, _path)
                          return NODE_TYPE_MAPPING.get(node_kind, None)
                      return _get_node_type(repo_id, revision, path)
                  @reraise_safe_exceptions
                  def get_nodes(self, wire, revision=None, path=''):
                      """
                      List the directory entries of `path` at `revision`.
                      :param revision: ``None`` means the youngest revision.
                      :return: list of ``(entry_path, node_type)`` tuples where the type comes
                          from ``NODE_TYPE_MAPPING`` (``None`` for kinds not listed there).
                      """
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _get_nodes(_repo_id, _path, _revision):
                          svn_repo = self._factory.repo(wire)
                          fsobj = svn.repos.fs(svn_repo)
                          target_rev = svn.fs.youngest_rev(fsobj) if _revision is None else _revision
                          root = svn.fs.revision_root(fsobj, target_rev)
                          entries = svn.fs.dir_entries(root, _path)
                          return [
                              (entry_path, NODE_TYPE_MAPPING.get(entry_info.kind, None))
                              for entry_path, entry_info in entries.items()
                          ]
                      return _get_nodes(repo_id, path, revision)
                  @reraise_safe_exceptions
                  def get_file_content(self, wire, rev=None, path=''):
                      """
                      Read the whole content of `path` at `rev` and return it wrapped in a
                      ``BytesEnvelope``.
                      :param rev: ``None`` means the youngest revision.
                      """
                      svn_repo = self._factory.repo(wire)
                      fsobj = svn.repos.fs(svn_repo)
                      target_rev = svn.fs.youngest_rev(fsobj) if rev is None else rev
                      root = svn.fs.revision_root(fsobj, target_rev)
                      stream = svn.core.Stream(svn.fs.file_contents(root, path))
                      data = stream.read()
                      return BytesEnvelope(data)
                  @reraise_safe_exceptions
                  def get_file_size(self, wire, revision=None, path=''):
                      """
                      Return the length of the file `path` at `revision`, as reported
                      by ``svn.fs.file_length``.

                      When `revision` is ``None`` the youngest revision of the
                      repository is used. The lookup goes through the cache region of
                      `wire`, conditioned on the wire's cache flag.
                      """
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _get_file_size(_repo_id, _revision, _path):
                          repo = self._factory.repo(wire)
                          fsobj = svn.repos.fs(repo)
                          if _revision is None:
                              # Same binding the sibling methods use to resolve the
                              # youngest revision (svn_fs_youngest_rev).
                              _revision = svn.fs.youngest_rev(fsobj)
                          root = svn.fs.revision_root(fsobj, _revision)
                          return svn.fs.file_length(root, _path)
                      return _get_file_size(repo_id, revision, path)
                  def create_repository(self, wire, compatible_version=None):
                      """
                      Create a new Subversion repository at ``wire['path']``.

                      `compatible_version` is forwarded unchanged to the repo factory.
                      """
                      repo_path = wire['path']
                      log.info('Creating Subversion repository in path "%s"', repo_path)
                      self._factory.repo(
                          wire, create=True, compatible_version=compatible_version)
                  def get_url_and_credentials(self, src_url) -> tuple[str, str, str]:
                      """
                      Extract the credentials embedded in `src_url`.

                      Returns ``(username, password, src_url)``; a missing username or
                      password is reported as an empty string and the url itself is
                      returned unchanged.
                      """
                      parsed = urllib.parse.urlparse(src_url)
                      username = parsed.username if parsed.username else ''
                      password = parsed.password if parsed.password else ''
                      return username, password, src_url
                  def import_remote_repository(self, wire, src_url):
                      """
                      Import a remote repository into the repository at ``wire['path']``.

                      The output of ``svnrdump dump <src_url>`` is piped straight into
                      ``svnadmin load <repo_path>``. Credentials embedded in `src_url`
                      are passed to ``svnrdump`` when both username and password are set.

                      Raises ``Exception`` when the target path is not a valid Subversion
                      repository, when ``svnrdump`` exits with a non-zero status (the
                      message carries a reason derived from its stderr) or when
                      ``svnadmin load`` exits with a non-zero status.
                      """
                      repo_path = wire['path']
                      if not self.is_path_valid_repository(wire, repo_path):
                          raise Exception(
                              f"Path {repo_path} is not a valid Subversion repository.")
                      username, password, src_url = self.get_url_and_credentials(src_url)
                      rdump_cmd = ['svnrdump', 'dump', '--non-interactive',
                                   '--trust-server-cert-failures=unknown-ca']
                      if username and password:
                          # NOTE(review): the password ends up on the command line of
                          # the child process.
                          rdump_cmd += ['--username', username, '--password', password]
                      rdump_cmd += [src_url]
                      rdump = subprocess.Popen(
                          rdump_cmd,
                          stdout=subprocess.PIPE, stderr=subprocess.PIPE)
                      load = subprocess.Popen(
                          ['svnadmin', 'load', repo_path], stdin=rdump.stdout)
                      # Drop our copy of the pipe so that `svnrdump` is the only writer
                      # and gets SIGPIPE if `svnadmin load` exits early.
                      rdump.stdout.close()
                      # TODO: johbo: This can be a very long operation, might be better
                      # to track some kind of status and provide an api to check if the
                      # import is done.
                      # Drain stderr until EOF *before* waiting: waiting first can
                      # deadlock once the child fills the stderr pipe buffer.
                      errors = rdump.stderr.read()
                      rdump.stderr.close()
                      rdump.wait()
                      load.wait()
                      log.debug('Return process ended with code: %s', rdump.returncode)
                      if rdump.returncode != 0:
                          log.error('svnrdump dump failed: statuscode %s: message: %s', rdump.returncode, errors)
                          reason = 'UNKNOWN'
                          if b'svnrdump: E230001:' in errors:
                              reason = 'INVALID_CERTIFICATE'
                          if reason == 'UNKNOWN':
                              reason = f'UNKNOWN:{safe_str(errors)}'
                          raise Exception(
                              'Failed to dump the remote repository from {}. Reason:{}'.format(
                                  src_url, reason))
                      if load.returncode != 0:
                          raise Exception(
                              f'Failed to load the dump of remote repository from {src_url}.')
                  def commit(self, wire, message, author, timestamp, updated, removed):
                      """
                      Commit a set of node changes on top of the youngest revision.

                      Every node in `updated` is written and every node in `removed` is
                      deleted inside one transaction. When `timestamp` is truthy the
                      ``svn:date`` property of the new revision is overwritten with it.
                      Returns the id of the committed revision.
                      """
                      message = safe_bytes(message)
                      author = safe_bytes(author)
                      repo = self._factory.repo(wire)
                      fs_ptr = svn.repos.fs(repo)
                      base_rev = svn.fs.youngest_rev(fs_ptr)
                      txn = svn.repos.fs_begin_txn_for_commit(repo, base_rev, author, message)
                      txn_root = svn.fs.txn_root(txn)
                      for changed_node in updated:
                          TxnNodeProcessor(changed_node, txn_root).update()
                      for removed_node in removed:
                          TxnNodeProcessor(removed_node, txn_root).remove()
                      new_revision = svn.repos.fs_commit_txn(repo, txn)
                      if timestamp:
                          svn_date = svn.core.svn_time_to_cstring(apr_time_t(timestamp))
                          svn.fs.change_rev_prop(fs_ptr, new_revision, 'svn:date', svn_date)
                      log.debug('Committed revision "%s" to "%s".', new_revision, wire['path'])
                      return new_revision
                  @reraise_safe_exceptions
                  def diff(self, wire, rev1, rev2, path1=None, path2=None,
                           ignore_whitespace=False, context=3):
                      """
                      Generate the diff between `path1`@`rev1` and `path2`@`rev2`.

                      Caching is switched off on `wire` (the dict is updated in place)
                      before the repository is opened. The diff is returned wrapped in a
                      ``BytesEnvelope``; when Subversion raises during generation the
                      error is logged and an empty envelope is returned instead.
                      """
                      wire.update(cache=False)
                      repo = self._factory.repo(wire)
                      diff_creator = SvnDiffer(
                          repo, rev1, path1, rev2, path2, ignore_whitespace, context)
                      try:
                          return BytesEnvelope(diff_creator.generate_diff())
                      except svn.core.SubversionException:
                          # log.exception already records the active exception
                          log.exception(
                              "Error during diff operation. "
                              "Path might not exist %s, %s", path1, path2)
                          return BytesEnvelope(b'')
                  @reraise_safe_exceptions
                  def is_large_file(self, wire, path):
                      """Always report ``False``: this backend never flags a path as a large file."""
                      return False
                  @reraise_safe_exceptions
                  def is_binary(self, wire, rev, path):
                      """
                      Tell whether the file `path` at `rev` looks binary.

                      A file counts as binary when its content is non-empty and contains
                      a NUL byte. The lookup goes through the cache region of `wire`,
                      conditioned on the wire's cache flag.
                      """
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      region = self._region(wire)
                      @region.conditional_cache_on_arguments(condition=cache_on)
                      def _is_binary(_repo_id, _rev, _path):
                          content = self.get_file_content(wire, rev, path)
                          return bool(content) and b'\0' in content
                      return _is_binary(repo_id, rev, path)
                  @reraise_safe_exceptions
                  def md5_hash(self, wire, rev, path):
                      """
                      Return an empty string for every file.

                      No hash is computed here; the (constant) result still goes through
                      the cache region of `wire`, conditioned on the wire's cache flag.
                      """
                      cache_on, context_uid, repo_id = self._cache_on(wire)
                      cached = self._region(wire).conditional_cache_on_arguments(
                          condition=cache_on)
                      @cached
                      def _md5_hash(_repo_id, _rev, _path):
                          return ''
                      return _md5_hash(repo_id, rev, path)
                  @reraise_safe_exceptions
                  def run_svn_command(self, wire, cmd, **opts):
                      """
                      Run `cmd` through ``SubprocessIOChunker`` and collect its output.

                      The process runs in ``wire['path']`` when that is an existing
                      directory, with a copy of the current environment extended by the
                      ``extra_env`` option. Remaining `opts` are passed on to the chunker.

                      Returns ``(stdout, stderr)`` as bytes. On ``OSError`` the call
                      returns ``('', <error text>)`` when the ``_safe`` option is set,
                      otherwise it logs the failure and raises a ``VcsException``.
                      """
                      repo_dir = wire.get('path', None)
                      if repo_dir and os.path.isdir(repo_dir):
                          opts['cwd'] = repo_dir
                      safe_call = opts.pop('_safe', False)
                      environment = os.environ.copy()
                      environment.update(opts.pop('extra_env', {}))
                      _opts = {'env': environment, 'shell': False}
                      try:
                          _opts.update(opts)
                          chunker = subprocessio.SubprocessIOChunker(cmd, **_opts)
                          stdout = b''.join(chunker)
                          stderr = b''.join(chunker.stderr)
                          return stdout, stderr
                      except OSError as err:
                          if safe_call:
                              return '', safe_str(err).strip()
                          readable_cmd = ' '.join(map(safe_str, cmd))  # human friendly CMD
                          tb_err = ("Couldn't run svn command (%s).\n"
                                    "Original error was:%s\n"
                                    "Call options:%s\n"
                                    % (readable_cmd, err, _opts))
                          log.exception(tb_err)
                          raise exceptions.VcsException()(tb_err)
                  @reraise_safe_exceptions
                  def install_hooks(self, wire, force=False):
                      """
                      Install the Subversion hooks into the repository at ``wire['path']``.

                      `force` is forwarded as ``force_create`` to ``install_svn_hooks``,
                      whose result is returned.
                      """
                      from vcsserver.hook_utils import install_svn_hooks
                      # The previously computed python executable path was never passed
                      # on, so only the repository path and the force flag are needed.
                      return install_svn_hooks(wire['path'], force_create=force)
                  @reraise_safe_exceptions
                  def get_hooks_info(self, wire):
                      """
                      Report the versions of the hooks installed at ``wire['path']``.

                      Returns a dict with the keys ``pre_version`` and ``post_version``.
                      """
                      from vcsserver.hook_utils import (
                          get_svn_pre_hook_version, get_svn_post_hook_version)
                      repo_path = wire['path']
                      pre_version = get_svn_pre_hook_version(repo_path)
                      post_version = get_svn_post_hook_version(repo_path)
                      return {'pre_version': pre_version, 'post_version': post_version}
                  @reraise_safe_exceptions
                  def set_head_ref(self, wire, head_name):
                      """Do nothing: setting a head reference is a no-op in this backend."""
                      return None
                  @reraise_safe_exceptions
                  def archive_repo(self, wire, archive_name_key, kind, mtime, archive_at_path,
                                   archive_dir_name, commit_id, cache_config):
                      """
                      Build an archive of the repository tree at `commit_id`.

                      The tree is walked lazily by the nested generators below and every
                      node is handed to ``store_archive_in_cache`` as an ``ArchiveNode``.
                      All other arguments are forwarded unchanged to
                      ``store_archive_in_cache``, whose result is returned.
                      """
                      def walk_tree(root, root_dir, _commit_id):
                          """
                          Special recursive svn repo walker

                          Yields ``(path, data, node_type)`` for every entry below
                          `root_dir`: a directory is yielded first and then walked
                          recursively; any other entry is yielded with its mode,
                          link flag and a callable that reads its content.
                          """
                          root_dir = safe_bytes(root_dir)
                          filemode_default = 0o100644
                          filemode_executable = 0o100755
                          file_iter = svn.fs.dir_entries(root, root_dir)
                          for f_name in file_iter:
                              f_type = NODE_TYPE_MAPPING.get(file_iter[f_name].kind, None)
                              if f_type == 'dir':
                                  # return only DIR, and then all entries in that dir
                                  yield os.path.join(root_dir, f_name), {'mode': filemode_default}, f_type
                                  new_root = os.path.join(root_dir, f_name)
                                  yield from walk_tree(root, new_root, _commit_id)
                              else:
                                  f_path = os.path.join(root_dir, f_name).rstrip(b'/')
                                  prop_list = svn.fs.node_proplist(root, f_path)
                                  # NOTE(review): paths are handled as bytes here while the
                                  # property names below are str -- confirm the bindings
                                  # return str keys, otherwise these lookups never match.
                                  f_mode = filemode_default
                                  if prop_list.get('svn:executable'):
                                      f_mode = filemode_executable
                                  f_is_link = False
                                  if prop_list.get('svn:special'):
                                      f_is_link = True
                                  data = {
                                      'is_link': f_is_link,
                                      'mode': f_mode,
                                      # bound `read` method: the content is only read when called
                                      'content_stream': svn.core.Stream(svn.fs.file_contents(root, f_path)).read
                                  }
                                  yield f_path, data, f_type
                      def file_walker(_commit_id, path):
                          # Adapts walk_tree() output to ArchiveNode objects.
                          repo = self._factory.repo(wire)
                          # the revision root is opened from the outer `commit_id`,
                          # not from the `_commit_id` argument
                          root = svn.fs.revision_root(svn.repos.fs(repo), int(commit_id))
                          def no_content():
                              # content callable used for directories
                              raise NoContentException()
                          for f_name, f_data, f_type in walk_tree(root, path, _commit_id):
                              file_path = f_name
                              if f_type == 'dir':
                                  mode = f_data['mode']
                                  yield ArchiveNode(file_path, mode, False, no_content)
                              else:
                                  mode = f_data['mode']
                                  is_link = f_data['is_link']
                                  data_stream = f_data['content_stream']
                                  yield ArchiveNode(file_path, mode, is_link, data_stream)
                      return store_archive_in_cache(
                          file_walker, archive_name_key, kind, mtime, archive_at_path, archive_dir_name, commit_id, cache_config=cache_config)
-             class SvnDiffer(object):
+             class SvnDiffer:
                  """
                  Utility to create diffs based on difflib and the Subversion api
                  """
                  binary_content = False
                  def __init__(
                          self, repo, src_rev, src_path, tgt_rev, tgt_path,
                          ignore_whitespace, context):
                      self.repo = repo
                      self.ignore_whitespace = ignore_whitespace
                      self.context = context
                      fsobj = svn.repos.fs(repo)
                      self.tgt_rev = tgt_rev
                      self.tgt_path = tgt_path or ''
                      self.tgt_root = svn.fs.revision_root(fsobj, tgt_rev)
                      self.tgt_kind = svn.fs.check_path(self.tgt_root, self.tgt_path)
                      self.src_rev = src_rev
                      self.src_path = src_path or self.tgt_path
                      self.src_root = svn.fs.revision_root(fsobj, src_rev)
                      self.src_kind = svn.fs.check_path(self.src_root, self.src_path)
                      self._validate()
                  def _validate(self):
                      if (self.tgt_kind != svn.core.svn_node_none and
                              self.src_kind != svn.core.svn_node_none and
                              self.src_kind != self.tgt_kind):
                          # TODO: johbo: proper error handling
                          raise Exception(
                              "Source and target are not compatible for diff generation. "
                              "Source type: %s, target type: %s" %
                              (self.src_kind, self.tgt_kind))
                  def generate_diff(self) -> bytes:
                      buf = io.BytesIO()
                      if self.tgt_kind == svn.core.svn_node_dir:
                          self._generate_dir_diff(buf)
                      else:
                          self._generate_file_diff(buf)
                      return buf.getvalue()
                  def _generate_dir_diff(self, buf: io.BytesIO):
                      editor = DiffChangeEditor()
                      editor_ptr, editor_baton = svn.delta.make_editor(editor)
                      svn.repos.dir_delta2(
                          self.src_root,
                          self.src_path,
                          '',  # src_entry
                          self.tgt_root,
                          self.tgt_path,
                          editor_ptr, editor_baton,
                          authorization_callback_allow_all,
                          False,  # text_deltas
                          svn.core.svn_depth_infinity,  # depth
                          False,  # entry_props
                          False,  # ignore_ancestry
                      )
                      for path, __, change in sorted(editor.changes):
                          self._generate_node_diff(
                              buf, change, path, self.tgt_path, path, self.src_path)
                  def _generate_file_diff(self, buf: io.BytesIO):
                      change = None
                      if self.src_kind == svn.core.svn_node_none:
                          change = "add"
                      elif self.tgt_kind == svn.core.svn_node_none:
                          change = "delete"
                      tgt_base, tgt_path = vcspath.split(self.tgt_path)
                      src_base, src_path = vcspath.split(self.src_path)
                      self._generate_node_diff(
                          buf, change, tgt_path, tgt_base, src_path, src_base)
                  def _generate_node_diff(
                          self, buf: io.BytesIO, change, tgt_path, tgt_base, src_path, src_base):
                      tgt_path_bytes = safe_bytes(tgt_path)
                      tgt_path = safe_str(tgt_path)
                      src_path_bytes = safe_bytes(src_path)
                      src_path = safe_str(src_path)
                      if self.src_rev == self.tgt_rev and tgt_base == src_base:
                          # makes consistent behaviour with git/hg to return empty diff if
                          # we compare same revisions
                          return
                      tgt_full_path = vcspath.join(tgt_base, tgt_path)
                      src_full_path = vcspath.join(src_base, src_path)
                      self.binary_content = False
                      mime_type = self._get_mime_type(tgt_full_path)
                      if mime_type and not mime_type.startswith(b'text'):
                          self.binary_content = True
                          buf.write(b"=" * 67 + b'\n')
                          buf.write(b"Cannot display: file marked as a binary type.\n")
                          buf.write(b"svn:mime-type = %s\n" % mime_type)
                      buf.write(b"Index: %b\n" % tgt_path_bytes)
                      buf.write(b"=" * 67 + b'\n')
                      buf.write(b"diff --git a/%b b/%b\n" % (tgt_path_bytes, tgt_path_bytes))
                      if change == 'add':
                          # TODO: johbo: SVN is missing a zero here compared to git
                          buf.write(b"new file mode 10644\n")
                          # TODO(marcink): intro to binary detection of svn patches
                          # if self.binary_content:
                          #     buf.write(b'GIT binary patch\n')
                          buf.write(b"--- /dev/null\t(revision 0)\n")
                          src_lines = []
                      else:
                          if change == 'delete':
                              buf.write(b"deleted file mode 10644\n")
                          # TODO(marcink): intro to binary detection of svn patches
                          # if self.binary_content:
                          #     buf.write('GIT binary patch\n')
                          buf.write(b"--- a/%b\t(revision %d)\n" % (src_path_bytes, self.src_rev))
                          src_lines = self._svn_readlines(self.src_root, src_full_path)
                      if change == 'delete':
                          buf.write(b"+++ /dev/null\t(revision %d)\n" % self.tgt_rev)
                          tgt_lines = []
                      else:
                          buf.write(b"+++ b/%b\t(revision %d)\n" % (tgt_path_bytes, self.tgt_rev))
                          tgt_lines = self._svn_readlines(self.tgt_root, tgt_full_path)
                      # we made our diff header, time to generate the diff content into our buffer
                      if not self.binary_content:
                          udiff = svn_diff.unified_diff(
                              src_lines, tgt_lines, context=self.context,
                              ignore_blank_lines=self.ignore_whitespace,
                              ignore_case=False,
                              ignore_space_changes=self.ignore_whitespace)
                          buf.writelines(udiff)
                  def _get_mime_type(self, path) -> bytes:
                      try:
                          mime_type = svn.fs.node_prop(
                              self.tgt_root, path, svn.core.SVN_PROP_MIME_TYPE)
                      except svn.core.SubversionException:
                          mime_type = svn.fs.node_prop(
                              self.src_root, path, svn.core.SVN_PROP_MIME_TYPE)
                      return mime_type
                  def _svn_readlines(self, fs_root, node_path):
                      if self.binary_content:
                          return []
                      node_kind = svn.fs.check_path(fs_root, node_path)
                      if node_kind not in (
                              svn.core.svn_node_file, svn.core.svn_node_symlink):
                          return []
                      content = svn.core.Stream(
                          svn.fs.file_contents(fs_root, node_path)).read()
                      return content.splitlines(True)
              class DiffChangeEditor(svn.delta.Editor):
                  """
                  Delta editor that records which nodes differ between two revisions.

                  Every callback appends a ``(path, kind, change)`` tuple to
                  ``self.changes``; `kind` is ``None`` for deletions and ``'file'``
                  for added or opened files.
                  """
                  def __init__(self):
                      self.changes = []
                  def _record(self, path, kind, change):
                      """Append one change entry to the recorded list."""
                      self.changes.append((path, kind, change))
                  def delete_entry(self, path, revision, parent_baton, pool=None):
                      self._record(path, None, 'delete')
                  def add_file(
                          self, path, parent_baton, copyfrom_path, copyfrom_revision,
                          file_pool=None):
                      self._record(path, 'file', 'add')
                  def open_file(self, path, parent_baton, base_revision, file_pool=None):
                      self._record(path, 'file', 'change')
              def authorization_callback_allow_all(root, path, pool):
                  """Authorization callback that grants access to every path."""
                  return True
-             class TxnNodeProcessor(object):
+             class TxnNodeProcessor:
                  """
                  Utility to process the change of one node within a transaction root.
                  It encapsulates the knowledge of how to add, update or remove
                  a node for a given transaction root. The purpose is to support the method
                  `SvnRemote.commit`.
                  """
                  def __init__(self, node, txn_root):
                      assert_bytes(node['path'])
                      self.node = node
                      self.txn_root = txn_root
                  def update(self):
                      self._ensure_parent_dirs()
                      self._add_file_if_node_does_not_exist()
                      self._update_file_content()
                      self._update_file_properties()
                  def remove(self):
                      svn.fs.delete(self.txn_root, self.node['path'])
                      # TODO: Clean up directory if empty
                  def _ensure_parent_dirs(self):
                      curdir = vcspath.dirname(self.node['path'])
                      dirs_to_create = []
                      while not self._svn_path_exists(curdir):
                          dirs_to_create.append(curdir)
                          curdir = vcspath.dirname(curdir)
                      for curdir in reversed(dirs_to_create):
                          log.debug('Creating missing directory "%s"', curdir)
                          svn.fs.make_dir(self.txn_root, curdir)
                  def _svn_path_exists(self, path):
                      path_status = svn.fs.check_path(self.txn_root, path)
                      return path_status != svn.core.svn_node_none
                  def _add_file_if_node_does_not_exist(self):
                      kind = svn.fs.check_path(self.txn_root, self.node['path'])
                      if kind == svn.core.svn_node_none:
                          svn.fs.make_file(self.txn_root, self.node['path'])
                  def _update_file_content(self):
                      assert_bytes(self.node['content'])
                      handler, baton = svn.fs.apply_textdelta(
                          self.txn_root, self.node['path'], None, None)
                      svn.delta.svn_txdelta_send_string(self.node['content'], handler, baton)
                  def _update_file_properties(self):
                      properties = self.node.get('properties', {})
                      for key, value in properties.items():
                          svn.fs.change_node_prop(
                              self.txn_root, self.node['path'], safe_bytes(key), safe_bytes(value))
              def apr_time_t(timestamp):
                  """
                  Turn a Python timestamp into an APR ``apr_time_t`` value, i.e. the
                  timestamp multiplied by one million and truncated to an int.
                  """
                  scaled = timestamp * 1E6
                  return int(scaled)
              def svn_opt_revision_value_t(num):
                  """
                  Wrap `num` into a ``svn_opt_revision_t`` of kind
                  ``svn_opt_revision_number`` whose value carries the number.
                  """
                  number_value = svn.core.svn_opt_revision_value_t()
                  number_value.number = num
                  wrapped = svn.core.svn_opt_revision_t()
                  wrapped.kind = svn.core.svn_opt_revision_number
                  wrapped.value = number_value
                  return wrapped

vcsserver/remote_wsgi.py

0 +2 -2

              # RhodeCode VCSServer provides access to different vcs backends via network.
              # Copyright (C) 2014-2023 RhodeCode GmbH
              #
              # This program is free software; you can redistribute it and/or modify
              # it under the terms of the GNU General Public License as published by
              # the Free Software Foundation; either version 3 of the License, or
              # (at your option) any later version.
              #
              # This program is distributed in the hope that it will be useful,
              # but WITHOUT ANY WARRANTY; without even the implied warranty of
              # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
              # GNU General Public License for more details.
              #
              # You should have received a copy of the GNU General Public License
              # along with this program; if not, write to the Free Software Foundation,
              # Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301  USA
              from vcsserver import scm_app, wsgi_app_caller
-             class GitRemoteWsgi(object):
+             class GitRemoteWsgi:
                  def handle(self, environ, input_data, *args, **kwargs):
                      app = wsgi_app_caller.WSGIAppCaller(
                          scm_app.create_git_wsgi_app(*args, **kwargs))
                      return app.handle(environ, input_data)
-             class HgRemoteWsgi(object):
+             class HgRemoteWsgi:
                  def handle(self, environ, input_data, *args, **kwargs):
                      app = wsgi_app_caller.WSGIAppCaller(
                          scm_app.create_hg_wsgi_app(*args, **kwargs))
                      return app.handle(environ, input_data)

vcsserver/scm_app.py

0 +2 -2

              # RhodeCode VCSServer provides access to different vcs backends via network.
              # Copyright (C) 2014-2023 RhodeCode GmbH
              #
              # This program is free software; you can redistribute it and/or modify
              # it under the terms of the GNU General Public License as published by
              # the Free Software Foundation; either version 3 of the License, or
              # (at your option) any later version.
              #
              # This program is distributed in the hope that it will be useful,
              # but WITHOUT ANY WARRANTY; without even the implied warranty of
              # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
              # GNU General Public License for more details.
              #
              # You should have received a copy of the GNU General Public License
              # along with this program; if not, write to the Free Software Foundation,
              # Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301  USA
              import os
              import logging
              import itertools
              import mercurial
              import mercurial.error
              import mercurial.wireprotoserver
              import mercurial.hgweb.common
              import mercurial.hgweb.hgweb_mod
              import webob.exc
              from vcsserver import pygrack, exceptions, settings, git_lfs
              from vcsserver.str_utils import ascii_bytes, safe_bytes
              log = logging.getLogger(__name__)
              # Names of the hgrc sections that `update_hg_ui_from_hgrc` copies from a
              # repository's hgrc file into the ui object.
              # propagated from mercurial documentation
              HG_UI_SECTIONS = [
                  'alias', 'auth', 'decode/encode', 'defaults', 'diff', 'email', 'extensions',
                  'format', 'merge-patterns', 'merge-tools', 'hooks', 'http_proxy', 'smtp',
                  'patch', 'paths', 'profiling', 'server', 'trusted', 'ui', 'web',
              ]
              class HgWeb(mercurial.hgweb.hgweb_mod.hgweb):
                  """Trimmed-down hgweb: only wire protocol commands are served."""
                  def _get_view(self, repo):
                      """Views are not supported, the repo is returned as is."""
                      return repo
                  def loadsubweb(self):
                      """Return nothing; the result is only used by the unused templater."""
                      return None
                  def run(self):
                      """Not used; raises if it is called by accident."""
                      raise NotImplementedError
                  def templater(self, req):
                      """Not reachable in practice; raises if it is called.

                      The HTTP request is guaranteed to correspond to a Mercurial
                      command (see the is_hg method), so a user-visible url is never
                      rendered.
                      """
                      raise NotImplementedError
                  def archivelist(self, nodeid):
                      """Not used; raises if it is called by accident."""
                      raise NotImplementedError
                  def __call__(self, environ, start_response):
                      """WSGI entry point.

                      This may be called by multiple threads. The first chunk of the
                      response is pulled eagerly and then chained back in front of the
                      remaining response generator.
                      """
                      from mercurial.hgweb import request as requestmod
                      req = requestmod.parserequestfromenv(environ)
                      res = requestmod.wsgiresponse(req, start_response)
                      gen = self.run_wsgi(req, res)
                      try:
                          head = next(gen)
                      except StopIteration:
                          # nothing was produced, hand back the exhausted generator
                          return gen
                      return itertools.chain([head], gen)
                  def _runwsgi(self, req, res, repo):
                      """Serve wire protocol commands; answer anything else with a bad request."""
                      cmd = req.qsparams.get(b'cmd', '')
                      if mercurial.wireprotoserver.iscmd(cmd):
                          return super()._runwsgi(req, res, repo)
                      # NOTE(marcink): for unsupported commands, we return bad request
                      # internally from HG
                      log.warning('cmd: `%s` is not supported by the mercurial wireprotocol v1', cmd)
                      from mercurial.hgweb.common import statusmessage
                      res.status = statusmessage(mercurial.hgweb.common.HTTP_BAD_REQUEST)
                      res.setbodybytes(b'')
                      return res.sendresponse()
              def make_hg_ui_from_config(repo_config):
                  """
                  Create a Mercurial ui object configured from `repo_config`.

                  :param repo_config: iterable of (section, option, value) triples; every
                      item is converted with `ascii_bytes(..., allow_bytes=True)` before
                      being passed to `setconfig`.
                  :returns: the configured ui object, with `ui.quiet` forced to true.
                  """
                  hg_ui = mercurial.ui.ui()
                  # clean the baseui object
                  for cfg_attr in ('_ocfg', '_ucfg', '_tcfg'):
                      setattr(hg_ui, cfg_attr, mercurial.config.config())
                  for section, option, value in repo_config:
                      raw_section = ascii_bytes(section, allow_bytes=True)
                      raw_option = ascii_bytes(option, allow_bytes=True)
                      raw_value = ascii_bytes(value, allow_bytes=True)
                      hg_ui.setconfig(raw_section, raw_option, raw_value)
                  # make our hgweb quiet so it doesn't print output
                  hg_ui.setconfig(b'ui', b'quiet', b'true')
                  return hg_ui
              def update_hg_ui_from_hgrc(baseui, repo_path):
                  """
                  Copy settings from the repository's `.hg/hgrc` file into `baseui`.

                  Only the sections listed in `HG_UI_SECTIONS` are transferred. When the
                  hgrc file does not exist this is a no-op (apart from a debug log line).

                  :param baseui: ui object updated in place through `setconfig`.
                  :param repo_path: repository root; the file read is `<repo_path>/.hg/hgrc`.
                  """
                  hgrc_path = os.path.join(repo_path, '.hg', 'hgrc')
                  if not os.path.isfile(hgrc_path):
                      log.debug('hgrc file is not present at %s, skipping...', hgrc_path)
                      return
                  log.debug('reading hgrc from %s', hgrc_path)
                  hgrc = mercurial.config.config()
                  hgrc.read(ascii_bytes(hgrc_path))
                  for section in HG_UI_SECTIONS:
                      for option, value in hgrc.items(section):
                          log.debug('settings ui from file: [%s] %s=%s', section, option, value)
                          raw_section = ascii_bytes(section, allow_bytes=True)
                          raw_option = ascii_bytes(option, allow_bytes=True)
                          raw_value = ascii_bytes(value, allow_bytes=True)
                          baseui.setconfig(raw_section, raw_option, raw_value)
              def create_hg_wsgi_app(repo_path, repo_name, config):
                  """
                  Prepares a WSGI application to handle Mercurial requests.

                  The ui object is built from `config` first and then updated from the
                  repository's own hgrc file.

                  :param repo_path: path of the repository, converted with `safe_bytes`.
                  :param repo_name: name given to the application, converted with `safe_bytes`.
                  :param config: is a list of 3-item tuples representing a ConfigObject
                      (it is the serialized version of the config object).
                  :raises: the exception produced by `exceptions.RequirementException`
                      when Mercurial reports a `RequirementError`.
                  """
                  log.debug("Creating Mercurial WSGI application")
                  hg_ui = make_hg_ui_from_config(config)
                  update_hg_ui_from_hgrc(hg_ui, repo_path)
                  try:
                      app = HgWeb(safe_bytes(repo_path), name=safe_bytes(repo_name), baseui=hg_ui)
                  except mercurial.error.RequirementError as e:
                      # RequirementException(e) is called a second time with `e`: its
                      # first call returns the callable that builds the raised exception
                      make_exception = exceptions.RequirementException(e)
                      raise make_exception(e)
                  return app
-             class GitHandler(object):
+             class GitHandler:
                  """
                  Handler for Git operations like push/pull etc
                  """
                  def __init__(self, repo_location, repo_name, git_path, update_server_info,
                               extras):
                      if not os.path.isdir(repo_location):
                          raise OSError(repo_location)
                      self.content_path = repo_location
                      self.repo_name = repo_name
                      self.repo_location = repo_location
                      self.extras = extras
                      self.git_path = git_path
                      self.update_server_info = update_server_info
                  def __call__(self, environ, start_response):
                      """
                      Serve the request with the first usable repository location.

                      `content_path` is tried first, then its `.git` sub-directory. If
                      creating `pygrack.GitRepository` raises OSError for both, the
                      request is answered by `webob.exc.HTTPNotFound`.
                      """
                      app = webob.exc.HTTPNotFound()
                      dot_git_path = os.path.join(self.content_path, '.git')
                      for content_path in (self.content_path, dot_git_path):
                          try:
                              app = pygrack.GitRepository(
                                  self.repo_name, content_path, self.git_path,
                                  self.update_server_info, self.extras)
                          except OSError:
                              continue
                          break
                      return app(environ, start_response)
              def create_git_wsgi_app(repo_path, repo_name, config):
                  """
                  Creates a WSGI application to handle Git requests.

                  :param config: is a dictionary holding the extras. The
                      `git_update_server_info` entry is removed from it (the dictionary
                      is mutated); what remains is passed on as the handler's extras.
                  :raises KeyError: when `git_update_server_info` is missing.
                  """
                  git_path = settings.GIT_EXECUTABLE
                  update_server_info = config.pop('git_update_server_info')
                  return GitHandler(
                      repo_path, repo_name, git_path, update_server_info, config)
-             class GitLFSHandler(object):
+             class GitLFSHandler:
                  """
                  Handler for Git LFS operations
                  """
                  def __init__(self, repo_location, repo_name, git_path, update_server_info,
                               extras):
                      if not os.path.isdir(repo_location):
                          raise OSError(repo_location)
                      self.content_path = repo_location
                      self.repo_name = repo_name
                      self.repo_location = repo_location
                      self.extras = extras
                      self.git_path = git_path
                      self.update_server_info = update_server_info
                  def get_app(self, git_lfs_enabled, git_lfs_store_path, git_lfs_http_scheme):
                      """
                      Build the LFS WSGI application.

                      The three arguments are forwarded unchanged to
                      `git_lfs.create_app`; no instance state is used.
                      """
                      return git_lfs.create_app(
                          git_lfs_enabled, git_lfs_store_path, git_lfs_http_scheme)
              def create_git_lfs_wsgi_app(repo_path, repo_name, config):
                  """
                  Creates a WSGI application to handle Git LFS requests.

                  :param config: is a dictionary holding the extras. The LFS related
                      options are removed from it (the dictionary is mutated); what
                      remains is passed on as the handler's extras. Options are looked
                      up by their text key first, matching `create_git_wsgi_app`, and
                      by the legacy bytes key as a fallback.
                  :raises KeyError: when a required option is missing under both keys.
                  """
                  def pop_option(name, *default):
                      # text key first, then the bytes spelling used previously
                      for key in (name, name.encode('ascii')):
                          if key in config:
                              return config.pop(key)
                      if default:
                          return default[0]
                      raise KeyError(name)

                  git_path = settings.GIT_EXECUTABLE
                  update_server_info = pop_option('git_update_server_info')
                  git_lfs_enabled = pop_option('git_lfs_enabled')
                  git_lfs_store_path = pop_option('git_lfs_store_path')
                  git_lfs_http_scheme = pop_option('git_lfs_http_scheme', 'http')
                  app = GitLFSHandler(
                      repo_path, repo_name, git_path, update_server_info, config)
                  return app.get_app(git_lfs_enabled, git_lfs_store_path, git_lfs_http_scheme)

vcsserver/server.py

0 +1 -1

              # RhodeCode VCSServer provides access to different vcs backends via network.
              # Copyright (C) 2014-2023 RhodeCode GmbH
              #
              # This program is free software; you can redistribute it and/or modify
              # it under the terms of the GNU General Public License as published by
              # the Free Software Foundation; either version 3 of the License, or
              # (at your option) any later version.
              #
              # This program is distributed in the hope that it will be useful,
              # but WITHOUT ANY WARRANTY; without even the implied warranty of
              # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
              # GNU General Public License for more details.
              #
              # You should have received a copy of the GNU General Public License
              # along with this program; if not, write to the Free Software Foundation,
              # Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301  USA
              import gc
              import logging
              import os
              import time
              log = logging.getLogger(__name__)
-             class VcsServer(object):
+             class VcsServer:
                  """
                  Exposed remote interface of the vcsserver itself.
                  This object can be used to manage the server remotely. Right now the main
                  use case is to allow to shut down the server.
                  """
                  _shutdown = False
                  def shutdown(self):
                      self._shutdown = True
                  def ping(self):
                      """
                      Probe the server connection.

                      Logs a debug message and returns None.
                      """
                      log.debug("Received server ping.")
                  def echo(self, data):
                      """
                      Return `data` unchanged; meant for performance testing.

                      :param data: arbitrary payload.
                      :returns: the very same object that was passed in.
                      """
                      log.debug("Received server echo.")
                      return data
                  def sleep(self, seconds):
                      """
                      Block for `seconds` to simulate a long running server interaction.

                      :param seconds: duration handed to `time.sleep`.
                      """
                      log.debug("Sleeping %s seconds", seconds)
                      time.sleep(seconds)
                  def get_pid(self):
                      """
                      Report the PID of the process executing this method.

                      Lets a caller holding a proxy object discover the server's PID.
                      """
                      current_pid = os.getpid()
                      return current_pid
                  def run_gc(self):
                      """
                      Trigger a garbage collection run and report the outcome.

                      Main intention is to support statistics gathering during test runs.

                      :returns: dict with `freed_objects` (the value returned by
                          `gc.collect()`) and `garbage` (length of `gc.garbage`).
                      """
                      stats = {'freed_objects': gc.collect()}
                      stats['garbage'] = len(gc.garbage)
                      return stats

vcsserver/subprocessio.py

0 +2 -2

              """
              Module provides a class allowing to wrap communication over subprocess.Popen
              input, output, error streams into a meaningful, non-blocking, concurrent
              stream processor exposing the output data as an iterator fitting to be a
              return value passed by a WSGI application to a WSGI server per PEP 3333.
              Copyright (c) 2011  Daniel Dotsenko <dotsa[at]hotmail.com>
              This file is part of git_http_backend.py Project.
              git_http_backend.py Project is free software: you can redistribute it and/or
              modify it under the terms of the GNU Lesser General Public License as
              published by the Free Software Foundation, either version 2.1 of the License,
              or (at your option) any later version.
              git_http_backend.py Project is distributed in the hope that it will be useful,
              but WITHOUT ANY WARRANTY; without even the implied warranty of
              MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
              GNU Lesser General Public License for more details.
              You should have received a copy of the GNU Lesser General Public License
              along with git_http_backend.py Project.
              If not, see <http://www.gnu.org/licenses/>.
              """
              import os
              import collections
              import logging
              import subprocess
              import threading
              from vcsserver.str_utils import safe_str
              log = logging.getLogger(__name__)
              class StreamFeeder(threading.Thread):
                  """
                  Normal writing into pipe-like is blocking once the buffer is filled.
                  This thread allows a thread to seep data from a file-like into a pipe
                  without blocking the main thread.
                  We close inpipe once the end of the source stream is reached.
                  """
                  def __init__(self, source):
                      """
                      :param source: data to feed; one of
                          - `str` (encoded as UTF-8), `bytes` or `bytearray`,
                          - an integer file descriptor (wrapped with `os.fdopen`),
                          - an object exposing `.read()`.
                      :raises TypeError: when `source` is none of the above, or is an
                          empty string-like value.
                      """
                      super().__init__()
                      self.daemon = True
                      filelike = False
                      self.bytes = b''
                      if isinstance(source, str):
                          # bytes(str) needs an explicit encoding on Python 3 and would
                          # raise TypeError otherwise, so text is encoded here
                          self.bytes = source.encode('utf-8')
                      elif isinstance(source, (bytes, bytearray)):
                          self.bytes = bytes(source)
                      else:  # can be either file pointer or file-like
                          if isinstance(source, int):  # file pointer it is
                              # converting file descriptor (int) stdin into file-like
                              source = os.fdopen(source, 'rb', 16384)
                          # let's see if source is file-like by now
                          filelike = hasattr(source, 'read')
                      if not filelike and not self.bytes:
                          raise TypeError("StreamFeeder's source object must be a readable "
                                          "file-like, a file descriptor, or a string-like.")
                      self.source = source
                      # the thread writes into `writeiface`; consumers read `readiface`
                      self.readiface, self.writeiface = os.pipe()
                  def run(self):
                      """Write the whole source into the pipe, then close the write end."""
                      writer = self.writeiface
                      try:
                          if self.bytes:
                              os.write(writer, self.bytes)
                          else:
                              s = self.source
                              while True:
                                  _bytes = s.read(4096)
                                  if not _bytes:
                                      break
                                  os.write(writer, _bytes)
                      finally:
                          # closing the write end is what signals EOF to the reader
                          os.close(writer)
                  @property
                  def output(self):
                      """File descriptor of the pipe's read end."""
                      return self.readiface
              class InputStreamChunker(threading.Thread):
                  """
                  Daemon thread that reads chunks from `source` and appends them to
                  `target`, reporting progress through threading events:

                  - `data_added` is set after each appended chunk and once more when
                    reading ends,
                  - `keep_reading` is cleared by this thread when `target` holds more
                    than `chunk_count_max` chunks; the thread then waits for it to be
                    set again,
                  - `EOF` is set when reading has ended,
                  - `go` is cleared by `stop()` to end the read loop.
                  """
                  def __init__(self, source, target, buffer_size, chunk_size):
                      """
                      :param source: object read with `.read(chunk_size)`; `stop()` calls
                          its `.close()`.
                      :param target: container receiving the chunks; must support `len()`
                          and `.append()`.
                      :param buffer_size: used with `chunk_size` to derive the number of
                          buffered chunks above which reading pauses.
                      :param chunk_size: size passed to every `source.read()` call.
                      """
                      super().__init__()
                      self.daemon = True  # die die die.
                      self.source = source
                      self.target = target
                      self.chunk_count_max = int(buffer_size / chunk_size) + 1
                      self.chunk_size = chunk_size
                      self.data_added = threading.Event()
                      self.data_added.clear()
                      self.keep_reading = threading.Event()
                      self.keep_reading.set()
                      self.EOF = threading.Event()
                      self.EOF.clear()
                      self.go = threading.Event()
                      self.go.set()
                  def stop(self):
                      """
                      Ask the read loop to end: clear `go`, set `EOF`, and close the
                      source. Any exception raised by the close is ignored.
                      """
                      self.go.clear()
                      self.EOF.set()
                      try:
                          # this is not proper, but is done to force the reader thread let
                          # go of the input because, if successful, .close() will send EOF
                          # down the pipe.
                          self.source.close()
                      except Exception:
                          pass
                  def run(self):
                      """
                      Read chunks until the source returns an empty value or `go` is
                      cleared, then set `EOF` and `data_added`.
                      """
                      s = self.source
                      t = self.target
                      cs = self.chunk_size
                      chunk_count_max = self.chunk_count_max
                      keep_reading = self.keep_reading
                      da = self.data_added
                      go = self.go
                      try:
                          b = s.read(cs)
                      except ValueError:
                          # treated as end of input; the value is only tested for truthiness
                          b = ''
                      # seconds to wait for `keep_reading` to be set again once paused
                      timeout_input = 20
                      while b and go.is_set():
                          if len(t) > chunk_count_max:
                              # buffer is full: pause until `keep_reading` is set or
                              # the timeout expires
                              keep_reading.clear()
                              keep_reading.wait(timeout_input)
                              # NOTE(review): the limit adds the timeout in seconds to a
                              # chunk count - confirm this threshold is intended
                              if len(t) > chunk_count_max + timeout_input:
                                  log.error("Timed out while waiting for input from subprocess.")
                                  os._exit(-1)  # this will cause the worker to recycle itself
                          t.append(b)
                          da.set()
                          try:
                              b = s.read(cs)
                          except ValueError:  # probably "I/O operation on closed file"
                              b = ''
                      self.EOF.set()
                      da.set()  # for cases when done but there was no input.
-             class BufferedGenerator(object):
+             class BufferedGenerator:
                  """
                  Class behaves as a non-blocking, buffered pipe reader.
                  Reads chunks of data (through a thread)
                  from a blocking pipe, and attaches these to an array (Deque) of chunks.
                  Reading is halted in the thread when max chunks is internally buffered.
                  The .next() may operate in blocking or non-blocking fashion by yielding
                  '' if no data is ready
                  to be sent or by not returning until there is some data to send
                  When we get EOF from underlying source pipe we raise the marker to raise
                  StopIteration after the last chunk of data is yielded.
                  """
                  def __init__(self, name, source, buffer_size=65536, chunk_size=4096,
                               starting_values=None, bottomless=False):
                      """
                      Create the chunk queue and start the reader thread right away.

                      :param name: label used by `__str__`.
                      :param source: readable object handed to `InputStreamChunker`.
                      :param buffer_size: total buffer size, forwarded to the reader thread.
                      :param chunk_size: size of a single read, forwarded to the reader thread.
                      :param starting_values: optional chunks placed in the queue before
                          any data is read.
                      :param bottomless: when true the queue is created with a maximum
                          length of `int(buffer_size / chunk_size)`; otherwise it is
                          unbounded.
                      """
                      initial_chunks = starting_values or []
                      self.name = name
                      self.buffer_size = buffer_size
                      self.chunk_size = chunk_size
                      maxlen = int(buffer_size / chunk_size) if bottomless else None
                      self.data_queue = collections.deque(initial_chunks, maxlen)
                      self.worker = InputStreamChunker(source, self.data_queue, buffer_size, chunk_size)
                      if initial_chunks:
                          # pre-seeded chunks count as data that is already available
                          self.worker.data_added.set()
                      self.worker.start()
                  ####################
                  # Generator's methods
                  ####################
                  def __str__(self):
                      return f'BufferedGenerator(name={self.name} chunk: {self.chunk_size} on buffer: {self.buffer_size})'
                  def __iter__(self):
                      return self
                  def __next__(self):
                      while not self.length and not self.worker.EOF.is_set():
                          self.worker.data_added.clear()
                          self.worker.data_added.wait(0.2)
                      if self.length:
                          self.worker.keep_reading.set()
                          return bytes(self.data_queue.popleft())
                      elif self.worker.EOF.is_set():
                          raise StopIteration
                  def throw(self, exc_type, value=None, traceback=None):
                      if not self.worker.EOF.is_set():
                          raise exc_type(value)
                  def start(self):
                      self.worker.start()
                  def stop(self):
                      self.worker.stop()
                  def close(self):
                      try:
                          self.worker.stop()
                          self.throw(GeneratorExit)
                      except (GeneratorExit, StopIteration):
                          pass
                  ####################
                  # Threaded reader's infrastructure.
                  ####################
                  @property
                  def input(self):
                      # NOTE(review): returns the worker's `w` attribute, but the
                      # InputStreamChunker class in this module never sets `w`, so this
                      # presumably raises AttributeError - confirm the intended attribute.
                      return self.worker.w
                  @property
                  def data_added_event(self):
                      return self.worker.data_added
                  @property
                  def data_added(self):
                      return self.worker.data_added.is_set()
                  @property
                  def reading_paused(self):
                      return not self.worker.keep_reading.is_set()
                  @property
                  def done_reading_event(self):
                      """
                      Done_reding does not mean that the iterator's buffer is empty.
                      Iterator might have done reading from underlying source, but the read
                      chunks might still be available for serving through .next() method.
                      :returns: An Event class instance.
                      """
                      return self.worker.EOF
                  @property
                  def done_reading(self):
                      """
                      Done_reading does not mean that the iterator's buffer is empty.
                      Iterator might have done reading from underlying source, but the read
                      chunks might still be available for serving through .next() method.
                      :returns: An Bool value.
                      """
                      return self.worker.EOF.is_set()
                  @property
                  def length(self):
                      """
                      returns int.
                      This is the length of the queue of chunks, not the length of
                      the combined contents in those chunks.
                      __len__() cannot be meaningfully implemented because this
                      reader is just flying through a bottomless pit content and
                      can only know the length of what it already saw.
                      If __len__() on WSGI server per PEP 3333 returns a value,
                      the response's length will be set to that. In order not to
                      confuse WSGI PEP3333 servers, we will not implement __len__
                      at all.
                      """
                      return len(self.data_queue)
                  def prepend(self, x):
                      self.data_queue.appendleft(x)
                  def append(self, x):
                      self.data_queue.append(x)
                  def extend(self, o):
                      self.data_queue.extend(o)
                  def __getitem__(self, i):
                      return self.data_queue[i]
-             class SubprocessIOChunker(object):
+             class SubprocessIOChunker:
                  """
                  Processor class wrapping handling of subprocess IO.
                  .. important::
                     Watch out for the method `__del__` on this class. If this object
                     is deleted, it will kill the subprocess, so avoid to
                     return the `output` attribute or usage of it like in the following
                     example::
                        # `args` expected to run a program that produces a lot of output
                        output = ''.join(SubprocessIOChunker(
                           args, shell=False, inputstream=inputstream, env=environ).output)
                        # `output` will not contain all the data, because the __del__ method
                        # has already killed the subprocess in this case before all output
                        # has been consumed.
                  In a way, this is a "communicate()" replacement with a twist.
                  - We are multithreaded. Writing in and reading out, err are all sep threads.
                  - We support concurrent (in and out) stream processing.
                  - The output is not a stream. It's a queue of read string (bytes, not str)
                    chunks. The object behaves as an iterable. You can "for chunk in obj:" us.
                  - We are non-blocking in more respects than communicate()
                    (reading from subprocess out pauses when internal buffer is full, but
                     does not block the parent calling code. On the flip side, reading from
                     slow-yielding subprocess may block the iteration until data shows up. This
                     does not block the parallel inpipe reading occurring parallel thread.)
                  The purpose of the object is to allow us to wrap subprocess interactions into
                  an iterable that can be passed to a WSGI server as the application's return
                  value. Because of stream-processing-ability, WSGI does not have to read ALL
                  of the subprocess's output and buffer it, before handing it to WSGI server for
                  HTTP response. Instead, the class initializer reads just a bit of the stream
                  to figure out if error occurred or likely to occur and if not, just hands the
                  further iteration over subprocess output to the server for completion of HTTP
                  response.
                  The real or perceived subprocess error is trapped and raised as one of
                  OSError family of exceptions
                  Example usage:
                  #    try:
                  #        answer = SubprocessIOChunker(
                  #            cmd,
                  #            input,
                  #            buffer_size = 65536,
                  #            chunk_size = 4096
                  #            )
                  #    except (OSError) as e:
                  #        print str(e)
                  #        raise e
                  #
                  #    return answer
                  """
                  # TODO: johbo: This is used to make sure that the open end of the PIPE
                  # is closed in the end. It would be way better to wrap this into an
                  # object, so that it is closed automatically once it is consumed or
                  # something similar.
                  _close_input_fd = None
                  _closed = False
                  _stdout = None
                  _stderr = None
                  def __init__(self, cmd, input_stream=None, buffer_size=65536,
                               chunk_size=4096, starting_values=None, fail_on_stderr=True,
                               fail_on_return_code=True, **kwargs):
                      """
                      Initializes SubprocessIOChunker
                      :param cmd: A Subprocess.Popen style "cmd". Can be string or array of strings
                      :param input_stream: (Default: None) A file-like, string, or file pointer.
                      :param buffer_size: (Default: 65536) A size of total buffer per stream in bytes.
                      :param chunk_size: (Default: 4096) A max size of a chunk. Actual chunk may be smaller.
                      :param starting_values: (Default: []) An array of strings to put in front of output que.
                      :param fail_on_stderr: (Default: True) Whether to raise an exception in
                                             case something is written to stderr.
                      :param fail_on_return_code: (Default: True) Whether to raise an
                                                  exception if the return code is not 0.
                      :param kwargs: forwarded to `subprocess.Popen`; `shell` defaults to
                                     True when not given.
                      :raises OSError: when the early check described above detects
                                       stderr output or a non-zero return code.
                      """
                      # NOTE(review): shell=True is the default; with a string `cmd` built
                      # from external input this allows shell injection - callers should
                      # pass shell=False with an argument list where possible.
                      kwargs['shell'] = kwargs.get('shell', True)
                      starting_values = starting_values or []
                      if input_stream:
                          # feed the input from a separate thread through a pipe, so that
                          # writing never blocks this thread; the subprocess reads the
                          # pipe's read end as its stdin
                          input_streamer = StreamFeeder(input_stream)
                          input_streamer.start()
                          input_stream = input_streamer.output
                          self._close_input_fd = input_stream
                      self._fail_on_stderr = fail_on_stderr
                      self._fail_on_return_code = fail_on_return_code
                      self.cmd = cmd
                      _p = subprocess.Popen(cmd, bufsize=-1, stdin=input_stream, stdout=subprocess.PIPE, stderr=subprocess.PIPE,
                                            **kwargs)
                      self.process = _p
                      bg_out = BufferedGenerator('stdout', _p.stdout, buffer_size, chunk_size, starting_values)
                      # stderr is read one byte at a time into a bounded ("bottomless")
                      # queue of 10240 entries
                      bg_err = BufferedGenerator('stderr', _p.stderr, 10240, 1, bottomless=True)
                      # wait until stdout hit EOF, its buffer filled up (reading paused),
                      # or something showed up on stderr
                      while not bg_out.done_reading and not bg_out.reading_paused and not bg_err.length:
                          # doing this until we reach either end of file, or end of buffer.
                          bg_out.data_added_event.wait(0.2)
                          bg_out.data_added_event.clear()
                      # at this point it's still ambiguous if we are done reading or just full buffer.
                      # Either way, if error (returned by ended process, or implied based on
                      # presence of stuff in stderr output) we error out.
                      # Else, we are happy.
                      return_code = _p.poll()
                      # None means the process is still running
                      ret_code_ok = return_code in [None, 0]
                      ret_code_fail = return_code is not None and return_code != 0
                      if (
                          (ret_code_fail and fail_on_return_code) or
                          (ret_code_ok and fail_on_stderr and bg_err.length)
                      ):
                          try:
                              _p.terminate()
                          except Exception:
                              pass
                          # drain whatever both streams buffered so far; kept for
                          # get_stdout() / get_stderr()
                          bg_out.stop()
                          out = b''.join(bg_out)
                          self._stdout = out
                          bg_err.stop()
                          err = b''.join(bg_err)
                          self._stderr = err
                          # code from https://github.com/schacon/grack/pull/7
                          if err.strip() == b'fatal: The remote end hung up unexpectedly' and out.startswith(b'0034shallow '):
                              # not treated as a failure: serve the collected output as
                              # a single chunk
                              bg_out = iter([out])
                              _p = None
                          elif err and fail_on_stderr:
                              text_err = err.decode()
                              raise OSError(
                                  f"Subprocess exited due to an error:\n{text_err}")
                          if ret_code_fail and fail_on_return_code:
                              text_err = err.decode()
                              if not err:
                                  # maybe get empty stderr, try stdout instead
                                  # in many cases git reports the errors on stdout too
                                  text_err = out.decode()
                              raise OSError(
                                  f"Subprocess exited with non 0 ret code:{return_code}: stderr:{text_err}")
                      self.stdout = bg_out
                      self.stderr = bg_err
                      self.inputstream = input_stream
                  def __str__(self):
                      proc = getattr(self, 'process', 'NO_PROCESS')
                      return f'SubprocessIOChunker: {proc}'
                  def __iter__(self):
                      return self
                  def __next__(self):
                      # Note: mikhail: We need to be sure that we are checking the return
                      # code after the stdout stream is closed. Some processes, e.g. git
                      # are doing some magic in between closing stdout and terminating the
                      # process and, as a result,  we are not getting return code on "slow"
                      # systems.
                      result = None
                      stop_iteration = None
                      try:
                          result = next(self.stdout)
                      except StopIteration as e:
                          stop_iteration = e
                      if self.process:
                          return_code = self.process.poll()
                          ret_code_fail = return_code is not None and return_code != 0
                          if ret_code_fail and self._fail_on_return_code:
                              self.stop_streams()
                              err = self.get_stderr()
                              raise OSError(
                                  f"Subprocess exited (exit_code:{return_code}) due to an error during iteration:\n{err}")
                      if stop_iteration:
                          raise stop_iteration
                      return result
                  def throw(self, exc_type, value=None, traceback=None):
                      """
                      Raise ``exc_type(value)`` while ``stdout`` still holds data or has not
                      finished reading; otherwise do nothing. ``traceback`` is not used.
                      """
                      out = self.stdout
                      if not out.length and out.done_reading:
                          return
                      raise exc_type(value)
                  def close(self):
                      """
                      Release what the chunker holds: the process, both output streams and
                      the input descriptors.

                      Returns immediately when ``_closed`` is already set. Errors raised while
                      terminating the process or closing ``stdout``, ``stderr`` and
                      ``inputstream`` are deliberately swallowed so the remaining steps still run.
                      """
                      if self._closed:
                          return
                      try:
                          self.process.terminate()
                      except Exception:
                          pass
                      # NOTE(review): unlike the other steps this close is not guarded, so an
                      # OSError here propagates and leaves `_closed` unset -- confirm intended.
                      if self._close_input_fd:
                          os.close(self._close_input_fd)
                      try:
                          self.stdout.close()
                      except Exception:
                          pass
                      try:
                          self.stderr.close()
                      except Exception:
                          pass
                      try:
                          # fails (and is ignored) when inputstream is not a valid descriptor
                          os.close(self.inputstream)
                      except Exception:
                          pass
                      self._closed = True
                  def stop_streams(self):
                      """Call ``stop()`` on stdout and then stderr; a stream without ``stop`` is skipped."""
                      def _noop():
                          return None

                      for attr in ('stdout', 'stderr'):
                          stream = getattr(self, attr)
                          getattr(stream, 'stop', _noop)()
                  def get_stdout(self):
                      """Return ``_stdout`` when it is truthy, else the joined chunks of ``stdout``."""
                      stored = self._stdout
                      if not stored:
                          return b''.join(self.stdout)
                      return stored
                  def get_stderr(self):
                      """Return ``_stderr`` when it is truthy, else the joined chunks of ``stderr``."""
                      stored = self._stderr
                      if not stored:
                          return b''.join(self.stderr)
                      return stored
              def run_command(arguments, env=None):
                  """
                  Run the specified command and return its captured output.

                  :param arguments: sequence of program arguments (including the program name)
                  :type arguments: list[str]
                  :param env: optional environment passed to the subprocess; when falsy no
                      ``env`` option is passed at all
                  :returns: tuple ``(stdout, stderr)``, each joined into one bytes object
                  :raises Exception: when an ``OSError`` occurs while running the command;
                      the original error is attached as ``__cause__``
                  """
                  cmd = arguments
                  log.debug('Running subprocessio command %s', cmd)
                  proc = None
                  try:
                      _opts = {'shell': False, 'fail_on_stderr': False}
                      if env:
                          _opts['env'] = env
                      proc = SubprocessIOChunker(cmd, **_opts)
                      # stdout is drained first, then whatever was collected on stderr
                      return b''.join(proc), b''.join(proc.stderr)
                  except OSError as err:
                      cmd = ' '.join(map(safe_str, cmd)) # human friendly CMD
                      tb_err = ("Couldn't run subprocessio command (%s).\n"
                                "Original error was:%s\n" % (cmd, err))
                      log.exception(tb_err)
                      # chain explicitly so the OSError stays reachable from the wrapper
                      raise Exception(tb_err) from err
                  finally:
                      # identity check: cleanup must not depend on the chunker's truthiness
                      if proc is not None:
                          proc.close()

vcsserver/tests/fixture.py

0 +1 -1

              # RhodeCode VCSServer provides access to different vcs backends via network.
              # Copyright (C) 2014-2023 RhodeCode GmbH
              #
              # This program is free software; you can redistribute it and/or modify
              # it under the terms of the GNU General Public License as published by
              # the Free Software Foundation; either version 3 of the License, or
              # (at your option) any later version.
              #
              # This program is distributed in the hope that it will be useful,
              # but WITHOUT ANY WARRANTY; without even the implied warranty of
              # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
              # GNU General Public License for more details.
              #
              # You should have received a copy of the GNU General Public License
              # along with this program; if not, write to the Free Software Foundation,
              # Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301  USA
              import os
              import shutil
              import tempfile
              import configparser
-             class ContextINI(object):
+             class ContextINI:
                  """
                  Creates a new test.ini file as a copy of an existing one with edited
                  data. If the existing file is not present, it creates a new one. Example usage::
                      with ContextINI('test.ini', [{'section': {'key': 'val'}}]) as new_test_ini_path:
                          print('vcsserver --config=%s' % new_test_ini_path)
                  """
                  def __init__(self, ini_file_path, ini_params, new_file_prefix=None,
                               destroy=True):
                      self.ini_file_path = ini_file_path
                      self.ini_params = ini_params
                      self.new_path = None
                      self.new_path_prefix = new_file_prefix or 'test'
                      self.destroy = destroy
                  def __enter__(self):
                      _, pref = tempfile.mkstemp()
                      loc = tempfile.gettempdir()
                      self.new_path = os.path.join(loc, '{}_{}_{}'.format(
                          pref, self.new_path_prefix, self.ini_file_path))
                      # copy ini file and modify according to the params, if we re-use a file
                      if os.path.isfile(self.ini_file_path):
                          shutil.copy(self.ini_file_path, self.new_path)
                      else:
                          # create new dump file for configObj to write to.
                          with open(self.new_path, 'wb'):
                              pass
                      parser = configparser.ConfigParser()
                      parser.read(self.ini_file_path)
                      for data in self.ini_params:
                          section, ini_params = list(data.items())[0]
                          key, val = list(ini_params.items())[0]
                          if section not in parser:
                              parser[section] = {}
                          parser[section][key] = val
                      with open(self.ini_file_path, 'w') as f:
                          parser.write(f)
                      return self.new_path
                  def __exit__(self, exc_type, exc_val, exc_tb):
                      if self.destroy:
                          os.remove(self.new_path)
              def no_newline_id_generator(test_name):
                  """
                  Generates a test name without spaces or newlines characters. Used for
                  nicer output of progress of test

                  :param test_name: any object; it is converted with ``str()`` first
                  :returns: the name with newlines and carriage returns replaced by ``_N``,
                      tabs by ``_T`` and spaces by ``_S``; ``'test-with-empty-name'`` when
                      the converted name is empty
                  """
                  # one pass over the string instead of four chained replace() calls
                  markers = str.maketrans({'\n': '_N', '\r': '_N', '\t': '_T', ' ': '_S'})
                  return str(test_name).translate(markers) or 'test-with-empty-name'

vcsserver/tests/test_git.py

0 +4 -4

              # RhodeCode VCSServer provides access to different vcs backends via network.
              # Copyright (C) 2014-2023 RhodeCode GmbH
              #
              # This program is free software; you can redistribute it and/or modify
              # it under the terms of the GNU General Public License as published by
              # the Free Software Foundation; either version 3 of the License, or
              # (at your option) any later version.
              #
              # This program is distributed in the hope that it will be useful,
              # but WITHOUT ANY WARRANTY; without even the implied warranty of
              # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
              # GNU General Public License for more details.
              #
              # You should have received a copy of the GNU General Public License
              # along with this program; if not, write to the Free Software Foundation,
              # Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301  USA
              import inspect
              import pytest
              import dulwich.errors
              from mock import Mock, patch
              from vcsserver.remote import git_remote
              SAMPLE_REFS = {
                  'HEAD': 'fd627b9e0dd80b47be81af07c4a98518244ed2f7',
                  'refs/tags/v0.1.9': '341d28f0eec5ddf0b6b77871e13c2bbd6bec685c',
                  'refs/tags/v0.1.8': '74ebce002c088b8a5ecf40073db09375515ecd68',
                  'refs/tags/v0.1.1': 'e6ea6d16e2f26250124a1f4b4fe37a912f9d86a0',
                  'refs/tags/v0.1.3': '5a3a8fb005554692b16e21dee62bf02667d8dc3e',
              }
              @pytest.fixture
              def git_remote_fix():
                  """
                  Provide a GitRemote built on top of a mocked factory.
                  """
                  return git_remote.GitRemote(Mock())
              def test_discover_git_version(git_remote_fix):
                  """``discover_git_version`` must report a non-empty (truthy) value."""
                  assert git_remote_fix.discover_git_version()
-             class TestGitFetch(object):
+             class TestGitFetch:
                  def setup_method(self):
                      """Build a GitRemote whose factory hands out ``self.mock_repo`` from ``repo()``."""
                      repo_double = Mock()
                      repo_factory = Mock()
                      repo_factory.repo = Mock(return_value=repo_double)
                      self.mock_repo = repo_double
                      self.remote_git = git_remote.GitRemote(repo_factory)
                  def test_fetches_all_when_no_commit_ids_specified(self):
                      """Without explicit refs, ``pull`` must hand all refs to ``determine_wants_all``."""
                      def fake_fetch(determine_wants, *args, **kwargs):
                          # emulate the client calling back with the remote's refs
                          determine_wants(SAMPLE_REFS)

                      with patch('dulwich.client.LocalGitClient.fetch', side_effect=fake_fetch):
                          self.remote_git.pull(wire={}, url='/tmp/', apply_refs=False)
                          wants_all = self.mock_repo.object_store.determine_wants_all
                          wants_all.assert_called_once_with(SAMPLE_REFS)
                  def test_fetches_specified_commits(self):
                      """With explicit refs, only those commits are wanted and ``determine_wants_all`` is unused."""
                      selected_refs = {
                          'refs/tags/v0.1.8': b'74ebce002c088b8a5ecf40073db09375515ecd68',
                          'refs/tags/v0.1.3': b'5a3a8fb005554692b16e21dee62bf02667d8dc3e',
                      }

                      def fake_fetch(determine_wants, *args, **kwargs):
                          wanted = determine_wants(SAMPLE_REFS)
                          assert sorted(wanted) == sorted(selected_refs.values())
                          return wanted

                      with patch('dulwich.client.LocalGitClient.fetch', side_effect=fake_fetch):
                          self.remote_git.pull(
                              wire={}, url='/tmp/', apply_refs=False,
                              refs=list(selected_refs))
                          wants_all = self.mock_repo.object_store.determine_wants_all
                          assert wants_all.call_count == 0
                  def test_get_remote_refs(self):
                      """``get_remote_refs`` must return the refs reported by the patched ``Repo.get_refs``."""
                      factory = Mock()
                      remote_git = git_remote.GitRemote(factory)
                      url = 'https://example.com/test/test.git'
                      sample_refs = {
                          'refs/tags/v0.1.8': '74ebce002c088b8a5ecf40073db09375515ecd68',
                          'refs/tags/v0.1.3': '5a3a8fb005554692b16e21dee62bf02667d8dc3e',
                      }
                      with patch('vcsserver.remote.git_remote.Repo', create=False) as mock_repo:
                          # every mock_repo() call yields the same return_value mock, so this
                          # configures the object any Repo(...) call made during the test returns
                          mock_repo().get_refs.return_value = sample_refs
                          remote_refs = remote_git.get_remote_refs(wire={}, url=url)
                          mock_repo().get_refs.assert_called_once_with()
                          assert remote_refs == sample_refs
-             class TestReraiseSafeExceptions(object):
+             class TestReraiseSafeExceptions:
                  def test_method_decorated_with_reraise_safe_exceptions(self):
                      """Every public GitRemote method (bar the cache invalidator) shares the decorator's code object."""
                      remote = git_remote.GitRemote(Mock())

                      def fake_function():
                          return None

                      wrapped = git_remote.reraise_safe_exceptions(fake_function)
                      expected_code = wrapped.__code__
                      for method_name, method in inspect.getmembers(remote, predicate=inspect.ismethod):
                          if method_name.startswith('_') or method_name in ['vcsserver_invalidate_cache']:
                              continue
                          assert method.__func__.__code__ == expected_code
                  @pytest.mark.parametrize('side_effect, expected_type', [
                      (dulwich.errors.ChecksumMismatch('0000000', 'deadbeef'), 'lookup'),
                      (dulwich.errors.NotCommitError('deadbeef'), 'lookup'),
                      (dulwich.errors.MissingCommitError('deadbeef'), 'lookup'),
                      (dulwich.errors.ObjectMissing('deadbeef'), 'lookup'),
                      (dulwich.errors.HangupException(), 'error'),
                      (dulwich.errors.UnexpectedCommandError('test-cmd'), 'error'),
                  ])
                  def test_safe_exceptions_reraised(self, side_effect, expected_type):
                      """Dulwich errors must come out as plain ``Exception`` tagged with the expected ``_vcs_kind``."""
                      @git_remote.reraise_safe_exceptions
                      def fake_method():
                          raise side_effect

                      with pytest.raises(Exception) as exc_info:
                          fake_method()

                      raised = exc_info.value
                      # exactly Exception, not a subclass
                      assert type(raised) is Exception
                      assert raised._vcs_kind == expected_type
-             class TestDulwichRepoWrapper(object):
+             class TestDulwichRepoWrapper:
                  def test_calls_close_on_delete(self):
                      """``Repo.__del__`` must call ``close()`` exactly once."""
                      # pretend the repository path exists while the Repo is constructed
                      isdir_patcher = patch('dulwich.repo.os.path.isdir', return_value=True)
                      with patch.object(git_remote.Repo, 'close') as close_mock:
                          with isdir_patcher:
                              repo = git_remote.Repo('/tmp/abcde')
                              assert repo is not None
                              repo.__del__()
                              # can't use del repo as in python3 this isn't always calling .__del__()
                          # checked while `close` is still patched
                          close_mock.assert_called_once_with()
-             class TestGitFactory(object):
+             class TestGitFactory:
                  def test_create_repo_returns_dulwich_wrapper(self):
                      """``GitFactory._create_repo`` must return a ``git_remote.Repo`` instance."""
                      with patch('vcsserver.lib.rc_cache.region_meta.dogpile_cache_regions') as mock:
                          # NOTE(review): side_effect is given a dict here; presumably a stand-in
                          # for the real regions mapping -- confirm this is what was intended
                          mock.side_effect = {'repo_objects': ''}
                          factory = git_remote.GitFactory()
                          wire = {
                              'path': '/tmp/abcde'
                          }
                          # pretend the repository path exists on disk
                          isdir_patcher = patch('dulwich.repo.os.path.isdir', return_value=True)
                          with isdir_patcher:
                              result = factory._create_repo(wire, True)
                          assert isinstance(result, git_remote.Repo)

vcsserver/tests/test_hg.py

0 +2 -2

              # RhodeCode VCSServer provides access to different vcs backends via network.
              # Copyright (C) 2014-2023 RhodeCode GmbH
              #
              # This program is free software; you can redistribute it and/or modify
              # it under the terms of the GNU General Public License as published by
              # the Free Software Foundation; either version 3 of the License, or
              # (at your option) any later version.
              #
              # This program is distributed in the hope that it will be useful,
              # but WITHOUT ANY WARRANTY; without even the implied warranty of
              # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
              # GNU General Public License for more details.
              #
              # You should have received a copy of the GNU General Public License
              # along with this program; if not, write to the Free Software Foundation,
              # Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301  USA
              import inspect
              import sys
              import traceback
              import pytest
              from mercurial.error import LookupError
              from mock import Mock, patch
              from vcsserver import exceptions, hgcompat
              from vcsserver.remote import hg_remote
-             class TestDiff(object):
+             class TestDiff:
                  def test_raising_safe_exception_when_lookup_failed(self):
                      """A mercurial ``LookupError`` inside ``diff`` surfaces as a plain ``Exception`` of kind ``lookup``."""
                      remote = hg_remote.HgRemote(Mock())
                      lookup_failure = LookupError(b'deadbeef', b'index', b'message')
                      with patch('mercurial.patch.diff') as diff_mock:
                          diff_mock.side_effect = lookup_failure
                          with pytest.raises(Exception) as exc_info:
                              remote.diff(
                                  wire={}, commit_id_1='deadbeef', commit_id_2='deadbee1',
                                  file_filter=None, opt_git=True, opt_ignorews=True,
                                  context=3)
                          raised = exc_info.value
                          assert type(raised) is Exception
                          assert raised._vcs_kind == 'lookup'
-             class TestReraiseSafeExceptions(object):
+             class TestReraiseSafeExceptions:
                  original_traceback = None
                  def test_method_decorated_with_reraise_safe_exceptions(self):
                      """Every public HgRemote method (bar the cache invalidator) shares the decorator's code object."""
                      remote = hg_remote.HgRemote(Mock())
                      bound_methods = inspect.getmembers(remote, predicate=inspect.ismethod)
                      expected_code = hg_remote.reraise_safe_exceptions(None).__code__
                      for method_name, method in bound_methods:
                          if method_name.startswith('_') or method_name in ['vcsserver_invalidate_cache']:
                              continue
                          assert method.__func__.__code__ == expected_code
                  @pytest.mark.parametrize('side_effect, expected_type', [
                      (hgcompat.Abort(b'failed-abort'), 'abort'),
                      (hgcompat.InterventionRequired(b'intervention-required'), 'abort'),
                      (hgcompat.RepoLookupError(), 'lookup'),
                      (hgcompat.LookupError(b'deadbeef', b'index', b'message'), 'lookup'),
                      (hgcompat.RepoError(), 'error'),
                      (hgcompat.RequirementError(), 'requirement'),
                  ])
                  def test_safe_exceptions_reraised(self, side_effect, expected_type):
                      """Mercurial errors must come out as plain ``Exception`` tagged with the expected ``_vcs_kind``."""
                      @hg_remote.reraise_safe_exceptions
                      def fake_method():
                          raise side_effect

                      with pytest.raises(Exception) as exc_info:
                          fake_method()

                      raised = exc_info.value
                      # exactly Exception, not a subclass
                      assert type(raised) is Exception
                      assert raised._vcs_kind == expected_type
                  def test_keeps_original_traceback(self):
                      """The traceback of the re-raised exception must end with the original frames."""
                      @hg_remote.reraise_safe_exceptions
                      def fake_method():
                          try:
                              raise hgcompat.Abort(b'test-abort')
                          except Exception:
                              # record the traceback as seen at the original raise site
                              self.original_traceback = traceback.format_tb(sys.exc_info()[2])
                              raise
                      new_traceback = None
                      try:
                          fake_method()
                      except Exception:
                          new_traceback = traceback.format_tb(sys.exc_info()[2])
                      # fail with a clear message instead of a TypeError on the slice below
                      assert new_traceback is not None, 'fake_method() did not raise'
                      # the decorator adds outer frames, so only the tail is compared
                      new_traceback_tail = new_traceback[-len(self.original_traceback):]
                      assert new_traceback_tail == self.original_traceback
                  def test_maps_unknown_exceptions_to_unhandled(self):
                      """An exception the decorator does not know about is tagged ``unhandled``."""
                      @hg_remote.reraise_safe_exceptions
                      def stub_method():
                          raise ValueError('stub')

                      with pytest.raises(Exception) as exc_info:
                          stub_method()

                      raised = exc_info.value
                      assert raised._vcs_kind == 'unhandled'
                  def test_does_not_map_known_exceptions(self):
                      """An exception built by ``exceptions.LookupException`` keeps its ``lookup`` kind."""
                      @hg_remote.reraise_safe_exceptions
                      def stub_method():
                          lookup_error = exceptions.LookupException()
                          raise lookup_error('stub')

                      with pytest.raises(Exception) as exc_info:
                          stub_method()

                      raised = exc_info.value
                      assert raised._vcs_kind == 'lookup'

vcsserver/tests/test_hooks.py

0 +4 -4

              # RhodeCode VCSServer provides access to different vcs backends via network.
              # Copyright (C) 2014-2023 RhodeCode GmbH
              #
              # This program is free software; you can redistribute it and/or modify
              # it under the terms of the GNU General Public License as published by
              # the Free Software Foundation; either version 3 of the License, or
              # (at your option) any later version.
              #
              # This program is distributed in the hope that it will be useful,
              # but WITHOUT ANY WARRANTY; without even the implied warranty of
              # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
              # GNU General Public License for more details.
              #
              # You should have received a copy of the GNU General Public License
              # along with this program; if not, write to the Free Software Foundation,
              # Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301  USA
              import threading
              import msgpack
              from http.server import BaseHTTPRequestHandler
              from socketserver import TCPServer
              import mercurial.ui
              import mock
              import pytest
              from vcsserver.hooks import HooksHttpClient
              from vcsserver.lib.rc_json import json
              from vcsserver import hooks
              def get_hg_ui(extras=None):
                  """Create a Config object with a valid RC_SCM_DATA entry."""
                  # defaults first, then whatever the caller wants to override or add
                  scm_data = {
                      'username': '',
                      'repository': '',
                      'locked_by': '',
                      'scm': '',
                      'make_lock': '',
                      'action': '',
                      'ip': '',
                      'hooks_uri': 'fake_hooks_uri',
                  }
                  scm_data.update(extras or {})
                  ui_obj = mercurial.ui.ui()
                  serialized = json.dumps(scm_data)
                  ui_obj.setconfig(b'rhodecode', b'RC_SCM_DATA', serialized)
                  return ui_obj
              def test_git_pre_receive_is_disabled():
                  """With only the ``pull`` hook listed, ``git_pre_receive`` returns 0."""
                  env = {'RC_SCM_DATA': json.dumps({'hooks': ['pull']})}
                  assert hooks.git_pre_receive(None, None, env) == 0
              def test_git_post_receive_is_disabled():
                  """With only the ``pull`` hook listed, ``git_post_receive`` returns 0."""
                  env = {'RC_SCM_DATA': json.dumps({'hooks': ['pull']})}
                  assert hooks.git_post_receive(None, '', env) == 0
              def test_git_post_receive_calls_repo_size():
                  """With ``repo_size`` enabled, post-receive calls ``repo_size`` and then ``post_push``."""
                  extras = {'hooks': ['push', 'repo_size']}
                  env = {'RC_SCM_DATA': json.dumps(extras)}
                  with mock.patch.object(hooks, '_call_hook') as call_hook_mock:
                      hooks.git_post_receive(None, '', env)

                  # the extras the hooks are expected to receive
                  expected_extras = dict(
                      extras,
                      commit_ids=[],
                      hook_type='post_receive',
                      new_refs={'bookmarks': [], 'branches': [], 'tags': []})
                  assert call_hook_mock.call_args_list == [
                      mock.call('repo_size', expected_extras, mock.ANY),
                      mock.call('post_push', expected_extras, mock.ANY),
                  ]
              def test_git_post_receive_does_not_call_disabled_repo_size():
                  """Without ``repo_size`` in the hooks list, only ``post_push`` is called."""
                  extras = {'hooks': ['push']}
                  env = {'RC_SCM_DATA': json.dumps(extras)}
                  with mock.patch.object(hooks, '_call_hook') as call_hook_mock:
                      hooks.git_post_receive(None, '', env)

                  # the extras the hook is expected to receive
                  expected_extras = dict(
                      extras,
                      commit_ids=[],
                      hook_type='post_receive',
                      new_refs={'bookmarks': [], 'branches': [], 'tags': []})
                  assert call_hook_mock.call_args_list == [
                      mock.call('post_push', expected_extras, mock.ANY)
                  ]
              def test_repo_size_exception_does_not_affect_git_post_receive():
                  """A failing ``repo_size`` hook must not change the status returned by post-receive."""
                  status = 0
                  env = {'RC_SCM_DATA': json.dumps({'hooks': ['push', 'repo_size']})}

                  def fake_call_hook(name, *args, **kwargs):
                      # only the repo_size hook blows up; every other hook succeeds
                      if name != 'repo_size':
                          return status
                      raise Exception('Fake exception')

                  with mock.patch.object(hooks, '_call_hook', side_effect=fake_call_hook):
                      result = hooks.git_post_receive(None, '', env)
                  assert result == status
              def test_git_pre_pull_is_disabled():
                  """With only ``push`` listed, ``git_pre_pull`` answers ``HookResponse(0, '')``."""
                  response = hooks.git_pre_pull({'hooks': ['push']})
                  assert response == hooks.HookResponse(0, '')
              def test_git_post_pull_is_disabled():
                  """With only ``push`` listed, ``git_post_pull`` answers ``HookResponse(0, '')``."""
                  response = hooks.git_post_pull({'hooks': ['push']})
                  assert response == hooks.HookResponse(0, '')
-             class TestGetHooksClient(object):
+             class TestGetHooksClient:
                  def test_returns_http_client_when_protocol_matches(self):
                      """``hooks_protocol='http'`` yields a ``HooksHttpClient`` bound to the given uri."""
                      hooks_uri = 'localhost:8000'
                      extras = {'hooks_uri': hooks_uri, 'hooks_protocol': 'http'}
                      client = hooks._get_hooks_client(extras)
                      assert isinstance(client, hooks.HooksHttpClient)
                      assert client.hooks_uri == hooks_uri
                  def test_returns_dummy_client_when_hooks_uri_not_specified(self):
                      """Only a ``hooks_module`` given: a ``HooksDummyClient`` wrapping the imported module."""
                      fake_module_name = 'fake.module'
                      fake_module = mock.Mock()
                      with mock.patch.object(
                              hooks.importlib, 'import_module',
                              return_value=fake_module) as import_mock:
                          client = hooks._get_hooks_client(
                              {'hooks_module': fake_module_name})
                      import_mock.assert_called_once_with(fake_module_name)
                      assert isinstance(client, hooks.HooksDummyClient)
                      assert client._hooks_module == fake_module
-             class TestHooksHttpClient(object):
+             class TestHooksHttpClient:
                  def test_init_sets_hooks_uri(self):
                      """The constructor stores the uri unchanged on ``hooks_uri``."""
                      uri = 'localhost:3000'
                      assert hooks.HooksHttpClient(uri).hooks_uri == uri
                  def test_serialize_returns_serialized_string(self):
                      """``_serialize`` returns the protocol headers and the msgpack-packed call."""
                      hook_name = 'test'
                      extras = {
                          'first': 1,
                          'second': 'two'
                      }
                      client = hooks.HooksHttpClient('localhost:3000')
                      headers, body = client._serialize(hook_name, extras)
                      packed_call = msgpack.packb({
                          'method': hook_name,
                          'extras': extras,
                      })
                      assert headers == {'rc-hooks-protocol': 'msgpack.v1', 'Connection': 'keep-alive'}
                      assert body == packed_call
                  def test_call_queries_http_server(self, http_mirror):
                      """Calling the client against the mirror server returns the call that was sent."""
                      hook_name = 'test'
                      extras = {
                          'first': 1,
                          'second': 'two'
                      }
                      client = hooks.HooksHttpClient(http_mirror.uri)
                      result = client(hook_name, extras)
                      # round-trip through msgpack so the expectation has the decoded types
                      wire_payload = msgpack.packb({
                          'method': hook_name,
                          'extras': extras
                      })
                      assert result == msgpack.unpackb(wire_payload, raw=False)
-             class TestHooksDummyClient(object):
+             class TestHooksDummyClient:
                  def test_init_imports_hooks_module(self):
                      """The constructor imports the named module and keeps it on ``_hooks_module``."""
                      module_name = 'rhodecode.fake.module'
                      module_double = mock.MagicMock()
                      with mock.patch.object(
                              hooks.importlib, 'import_module',
                              return_value=module_double) as import_mock:
                          client = hooks.HooksDummyClient(module_name)
                          import_mock.assert_called_once_with(module_name)
                      assert client._hooks_module == module_double
                  def test_call_returns_hook_result(self):
                      """Calling the dummy client returns what ``Hooks().__enter__().post_push()`` returns."""
                      hooks_module_name = 'rhodecode.fake.module'
                      hooks_module = mock.MagicMock()
                      import_patcher = mock.patch.object(
                          hooks.importlib, 'import_module', return_value=hooks_module)
                      with import_patcher:
                          client = hooks.HooksDummyClient(hooks_module_name)
                      result = client('post_push', {})
                      # must run before the assert below, which itself calls Hooks() again
                      hooks_module.Hooks.assert_called_once_with()
                      assert result == hooks_module.Hooks().__enter__().post_push()
              @pytest.fixture
              def http_mirror(request):
                  """Start a ``MirrorHttpServer`` for the test and stop it on teardown."""
                  mirror = MirrorHttpServer()
                  request.addfinalizer(mirror.stop)
                  return mirror
              class MirrorHttpHandler(BaseHTTPRequestHandler):
                  """Request handler that answers a POST with the body it received."""

                  def do_POST(self):
                      """Reply with status 200 and echo ``Content-Length`` bytes of the request body."""
                      payload = self.rfile.read(int(self.headers['Content-Length']))
                      self.send_response(200)
                      self.end_headers()
                      self.wfile.write(payload)
-             class MirrorHttpServer(object):
+             class MirrorHttpServer:
                  ip_address = '127.0.0.1'
                  port = 0
                  def __init__(self):
                      """Bind a TCP server to a free port on ``ip_address`` and serve it from a daemon thread."""
                      # port 0 lets the OS choose; the chosen port is read back below
                      server = TCPServer((self.ip_address, 0), MirrorHttpHandler)
                      self._daemon = server
                      _, self.port = server.server_address
                      worker = threading.Thread(target=server.serve_forever)
                      worker.daemon = True
                      self._thread = worker
                      worker.start()
                  def stop(self):
                      """
                      Stop serving, wait for the server thread and release the listening socket.

                      Safe to call more than once: later calls do nothing.
                      """
                      if self._daemon is None:
                          # already stopped
                          return
                      self._daemon.shutdown()
                      self._thread.join()
                      # shutdown() only ends serve_forever(); the socket itself stays open
                      # until server_close() is called
                      self._daemon.server_close()
                      self._daemon = None
                      self._thread = None
                  @property
                  def uri(self):
                      return '{}:{}'.format(self.ip_address, self.port)
              def test_hooks_http_client_init():
                  """The client exposes the URI it was constructed with as ``hooks_uri``."""
                  expected_uri = 'http://localhost:8000'
                  assert HooksHttpClient(expected_uri).hooks_uri == expected_uri
              def test_hooks_http_client_call():
                  """Calling the client sends one request and returns what ``msgpack.load`` gives."""
                  hooks_uri = 'http://localhost:8000'
                  with mock.patch('http.client.HTTPConnection') as mock_connection:
                      with mock.patch('msgpack.load') as mock_load:
                          client = HooksHttpClient(hooks_uri)
                          mock_load.return_value = {'result': 'success'}
                          fake_response = mock.MagicMock()
                          fake_response.status = 200
                          # NOTE(review): these two attributes are configured on the patched
                          # class itself, not on ``mock_connection.return_value`` (the object
                          # obtained by calling it) -- confirm this is intended.
                          mock_connection.request.side_effect = None
                          mock_connection.getresponse.return_value = fake_response
                          result = client('test_method', {'key': 'value'})
                          mock_connection.assert_called_with(hooks_uri)
                          mock_connection.return_value.request.assert_called_once()
                          assert result == {'result': 'success'}
              def test_hooks_http_client_serialize():
                  """``_serialize`` returns the protocol headers and a msgpack-encoded body."""
                  method, extras = 'test_method', {'key': 'value'}
                  headers, body = HooksHttpClient._serialize(method, extras)
                  expected_headers = {
                      'rc-hooks-protocol': HooksHttpClient.proto,
                      'Connection': 'keep-alive',
                  }
                  assert headers == expected_headers
                  assert msgpack.unpackb(body) == {'method': method, 'extras': extras}

vcsserver/tests/test_install_hooks.py

0 +2 -2

              # RhodeCode VCSServer provides access to different vcs backends via network.
              # Copyright (C) 2014-2023 RhodeCode GmbH
              #
              # This program is free software; you can redistribute it and/or modify
              # it under the terms of the GNU General Public License as published by
              # the Free Software Foundation; either version 3 of the License, or
              # (at your option) any later version.
              #
              # This program is distributed in the hope that it will be useful,
              # but WITHOUT ANY WARRANTY; without even the implied warranty of
              # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
              # GNU General Public License for more details.
              #
              # You should have received a copy of the GNU General Public License
              # along with this program; if not, write to the Free Software Foundation,
              # Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301  USA
              import os
              import sys
              import stat
              import pytest
              import vcsserver
              import tempfile
              from vcsserver import hook_utils
              from vcsserver.tests.fixture import no_newline_id_generator
              from vcsserver.str_utils import safe_bytes, safe_str
              from vcsserver.utils import AttributeDict
-             class TestCheckRhodecodeHook(object):
+             class TestCheckRhodecodeHook:
                  def test_returns_false_when_hook_file_is_wrong_found(self, tmpdir):
                      """A hook file with unrelated content makes the check return ``False``."""
                      hook = os.path.join(str(tmpdir), 'fake_hook_file.py')
                      with open(hook, 'wb') as f:
                          f.write(b'dummy test')
                      # Run the check only after the file is closed, so the written bytes
                      # are flushed to disk before the hook file is inspected.
                      result = hook_utils.check_rhodecode_hook(hook)
                      assert result is False
                  def test_returns_true_when_no_hook_file_found(self, tmpdir):
                      """A path that does not exist yields a truthy check result."""
                      missing_hook = os.path.join(str(tmpdir), 'fake_hook_file_not_existing.py')
                      assert hook_utils.check_rhodecode_hook(missing_hook)
                  @pytest.mark.parametrize("file_content, expected_result", [
                      ("RC_HOOK_VER = '3.3.3'\n", True),
                      ("RC_HOOK = '3.3.3'\n", False),
                  ], ids=no_newline_id_generator)
                  def test_signatures(self, file_content, expected_result, tmpdir):
                      """The check result for a written hook file matches ``expected_result``."""
                      hook_path = os.path.join(str(tmpdir), 'fake_hook_file_1.py')
                      with open(hook_path, 'wb') as hook_file:
                          hook_file.write(safe_bytes(file_content))
                      assert hook_utils.check_rhodecode_hook(hook_path) is expected_result
-             class BaseInstallHooks(object):
+             class BaseInstallHooks:
                  HOOK_FILES = ()
                  def _check_hook_file_mode(self, file_path):
                      assert os.path.exists(file_path), 'path %s missing' % file_path
                      stat_info = os.stat(file_path)
                      file_mode = stat.S_IMODE(stat_info.st_mode)
                      expected_mode = int('755', 8)
                      assert expected_mode == file_mode
                  def _check_hook_file_content(self, file_path, executable):
                      """
                      Assert the hook file starts with the expected shebang and contains
                      the ``RC_HOOK_VER`` line for the current ``vcsserver`` version.

                      A falsy ``executable`` falls back to ``sys.executable``.
                      """
                      interpreter = executable or sys.executable
                      with open(file_path, 'rt') as hook_file:
                          content = hook_file.read()
                      shebang = f'#!{interpreter}'
                      version_line = f"\nRC_HOOK_VER = '{vcsserver.__version__}'\n"
                      assert content.strip().startswith(shebang)
                      assert version_line in content
                  def _create_fake_hook(self, file_path, content):
                      with open(file_path, 'w') as hook_file:
                          hook_file.write(content)
                  def create_dummy_repo(self, repo_type):
                      """
                      Build a repository skeleton inside a new temporary directory.

                      For ``'git'`` and ``'svn'`` the returned ``AttributeDict`` gets a
                      ``path`` to a created directory that contains a ``hooks`` folder;
                      git repos additionally get ``bare = True``. For any other type the
                      ``AttributeDict`` is returned without attributes set.
                      """
                      base_dir = tempfile.mkdtemp()
                      repo = AttributeDict()
                      if repo_type in ('git', 'svn'):
                          repo.path = os.path.join(
                              base_dir, f'test_{repo_type}_hooks_installation_repo')
                          # makedirs also creates repo.path on the way to the hooks folder
                          os.makedirs(os.path.join(repo.path, 'hooks'))
                      if repo_type == 'git':
                          repo.bare = True
                      return repo
                  def check_hooks(self, repo_path, repo_bare=True):
                      """
                      Check mode and content of every file named in ``HOOK_FILES``.

                      Hooks are looked up in ``<repo_path>/hooks`` when ``repo_bare`` is
                      truthy, otherwise in ``<repo_path>/.git/hooks``.
                      """
                      hooks_dir_parts = ('hooks',) if repo_bare else ('.git', 'hooks')
                      for hook_name in self.HOOK_FILES:
                          hook_path = os.path.join(repo_path, *hooks_dir_parts, hook_name)
                          self._check_hook_file_mode(hook_path)
                          self._check_hook_file_content(hook_path, sys.executable)
              class TestInstallGitHooks(BaseInstallHooks):
                  """Tests for ``hook_utils.install_git_hooks`` on a dummy bare git repo."""
                  HOOK_FILES = ('pre-receive', 'post-receive')

                  def test_hooks_are_installed(self):
                      """Installing into a repo without hooks succeeds and creates them."""
                      repo = self.create_dummy_repo('git')
                      assert hook_utils.install_git_hooks(repo.path, repo.bare)
                      self.check_hooks(repo.path, repo.bare)

                  def test_hooks_are_replaced(self):
                      """Hook files that carry an ``RC_HOOK_VER`` line are overwritten."""
                      repo = self.create_dummy_repo('git')
                      hooks_dir = os.path.join(repo.path, 'hooks')
                      for hook_name in self.HOOK_FILES:
                          self._create_fake_hook(
                              os.path.join(hooks_dir, hook_name),
                              content="RC_HOOK_VER = 'abcde'\n")
                      assert hook_utils.install_git_hooks(repo.path, repo.bare)
                      self.check_hooks(repo.path, repo.bare)

                  def test_non_rc_hooks_are_not_replaced(self):
                      """Hook files without the version line keep their content."""
                      repo = self.create_dummy_repo('git')
                      hooks_dir = os.path.join(repo.path, 'hooks')
                      foreign_content = 'echo "non rc hook"\n'
                      hook_paths = [os.path.join(hooks_dir, name) for name in self.HOOK_FILES]
                      for hook_path in hook_paths:
                          self._create_fake_hook(hook_path, content=foreign_content)
                      assert hook_utils.install_git_hooks(repo.path, repo.bare)
                      for hook_path in hook_paths:
                          with open(hook_path, 'rt') as hook_file:
                              found = hook_file.read()
                          assert found == foreign_content

                  def test_non_rc_hooks_are_replaced_with_force_flag(self):
                      """With ``force_create=True`` foreign hook files are overwritten too."""
                      repo = self.create_dummy_repo('git')
                      hooks_dir = os.path.join(repo.path, 'hooks')
                      for hook_name in self.HOOK_FILES:
                          self._create_fake_hook(
                              os.path.join(hooks_dir, hook_name),
                              content='echo "non rc hook"\n')
                      installed = hook_utils.install_git_hooks(
                          repo.path, repo.bare, force_create=True)
                      assert installed
                      self.check_hooks(repo.path, repo.bare)
              class TestInstallSvnHooks(BaseInstallHooks):
                  """Tests for ``hook_utils.install_svn_hooks`` on a dummy svn repo."""
                  HOOK_FILES = ('pre-commit', 'post-commit')

                  def test_hooks_are_installed(self):
                      """Installing into a repo without hooks succeeds and creates them."""
                      repo = self.create_dummy_repo('svn')
                      assert hook_utils.install_svn_hooks(repo.path)
                      self.check_hooks(repo.path)

                  def test_hooks_are_replaced(self):
                      """Hook files that carry an ``RC_HOOK_VER`` line are overwritten."""
                      repo = self.create_dummy_repo('svn')
                      hooks_dir = os.path.join(repo.path, 'hooks')
                      for hook_name in self.HOOK_FILES:
                          self._create_fake_hook(
                              os.path.join(hooks_dir, hook_name),
                              content="RC_HOOK_VER = 'abcde'\n")
                      assert hook_utils.install_svn_hooks(repo.path)
                      self.check_hooks(repo.path)

                  def test_non_rc_hooks_are_not_replaced(self):
                      """Hook files without the version line keep their content."""
                      repo = self.create_dummy_repo('svn')
                      hooks_dir = os.path.join(repo.path, 'hooks')
                      foreign_content = 'echo "non rc hook"\n'
                      hook_paths = [os.path.join(hooks_dir, name) for name in self.HOOK_FILES]
                      for hook_path in hook_paths:
                          self._create_fake_hook(hook_path, content=foreign_content)
                      assert hook_utils.install_svn_hooks(repo.path)
                      for hook_path in hook_paths:
                          with open(hook_path, 'rt') as hook_file:
                              found = hook_file.read()
                          assert found == foreign_content

                  def test_non_rc_hooks_are_replaced_with_force_flag(self):
                      """With ``force_create=True`` foreign hook files are overwritten too."""
                      repo = self.create_dummy_repo('svn')
                      hooks_dir = os.path.join(repo.path, 'hooks')
                      for hook_name in self.HOOK_FILES:
                          self._create_fake_hook(
                              os.path.join(hooks_dir, hook_name),
                              content='echo "non rc hook"\n')
                      installed = hook_utils.install_svn_hooks(
                          repo.path, force_create=True)
                      assert installed
                      self.check_hooks(repo.path)

vcsserver/tests/test_pygrack.py

0 +1 -1

              # RhodeCode VCSServer provides access to different vcs backends via network.
              # Copyright (C) 2014-2023 RhodeCode GmbH
              #
              # This program is free software; you can redistribute it and/or modify
              # it under the terms of the GNU General Public License as published by
              # the Free Software Foundation; either version 3 of the License, or
              # (at your option) any later version.
              #
              # This program is distributed in the hope that it will be useful,
              # but WITHOUT ANY WARRANTY; without even the implied warranty of
              # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
              # GNU General Public License for more details.
              #
              # You should have received a copy of the GNU General Public License
              # along with this program; if not, write to the Free Software Foundation,
              # Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301  USA
              import io
              import more_itertools
              import dulwich.protocol
              import mock
              import pytest
              import webob
              import webtest
              from vcsserver import hooks, pygrack
              from vcsserver.str_utils import ascii_bytes
              @pytest.fixture()
              def pygrack_instance(tmpdir):
                  """
                  Create a pygrack app instance rooted at ``tmpdir``.

                  The directory is not used for much yet: it only receives the folders
                  required to pass the signature test.
                  """
                  required_dirs = ('config', 'head', 'info', 'objects', 'refs')
                  for required in required_dirs:
                      tmpdir.mkdir(required)
                  return pygrack.GitRepository('repo_name', str(tmpdir), 'git', False, {})
              @pytest.fixture()
              def pygrack_app(pygrack_instance):
                  """Wrap the pygrack app instance in a ``webtest.TestApp``."""
                  wrapped_app = webtest.TestApp(pygrack_instance)
                  return wrapped_app
              def test_invalid_service_info_refs_returns_403(pygrack_app):
                  """``/info/refs`` with the service ``git-upload-packs`` answers 403."""
                  url = '/info/refs?service=git-upload-packs'
                  response = pygrack_app.get(url, expect_errors=True)
                  assert response.status_int == 403
              def test_invalid_endpoint_returns_403(pygrack_app):
                  """A POST to the endpoint ``/git-upload-packs`` answers 403."""
                  status = pygrack_app.post('/git-upload-packs', expect_errors=True).status_int
                  assert status == 403
              @pytest.mark.parametrize('sideband', [
                  'side-band-64k',
                  'side-band',
                  'side-band no-progress',
              ])
              def test_pre_pull_hook_fails_with_sideband(pygrack_app, sideband):
                  """
                  With a side-band capability requested, a failing pre-pull hook produces
                  NAK, the hook output, an abort message and the empty pack.
                  """
                  # upload-pack request whose capability list includes the side-band variant
                  request = ''.join([
                      '0054want 74730d410fcb6603ace96f1dc55ea6196122532d ',
-                     'multi_ack %s ofs-delta\n' % sideband,
+                     f'multi_ack {sideband} ofs-delta\n',
                      '0000',
                      '0009done\n',
                  ])
                  # the patched pre-pull hook returns HookResponse(1, 'foo')
                  with mock.patch('vcsserver.hooks.git_pre_pull', return_value=hooks.HookResponse(1, 'foo')):
                      response = pygrack_app.post(
                          '/git-upload-pack', params=request,
                          content_type='application/x-git-upload-pack')
                  # decode the response body into its pkt-line packets
                  data = io.BytesIO(response.body)
                  proto = dulwich.protocol.Protocol(data.read, None)
                  packets = list(proto.read_pkt_seq())
                  expected_packets = [
                      b'NAK\n', b'\x02foo', b'\x02Pre pull hook failed: aborting\n',
                      b'\x01' + pygrack.GitRepository.EMPTY_PACK,
                  ]
                  assert packets == expected_packets
              def test_pre_pull_hook_fails_no_sideband(pygrack_app):
                  """Without side-band, a failing pre-pull hook yields only the empty pack."""
                  request = (
                      '0054want 74730d410fcb6603ace96f1dc55ea6196122532d '
                      'multi_ack ofs-delta\n'
                      '0000'
                      '0009done\n'
                  )
                  failing_hook = hooks.HookResponse(1, 'foo')
                  with mock.patch('vcsserver.hooks.git_pre_pull', return_value=failing_hook):
                      response = pygrack_app.post(
                          '/git-upload-pack', params=request,
                          content_type='application/x-git-upload-pack')
                  assert response.body == pygrack.GitRepository.EMPTY_PACK
              def test_pull_has_hook_messages(pygrack_app):
                  """The pull response holds the subprocess data and the post-pull output."""
                  request = (
                      '0054want 74730d410fcb6603ace96f1dc55ea6196122532d '
                      'multi_ack side-band-64k ofs-delta\n'
                      '0000'
                      '0009done\n'
                  )
                  pre_pull_result = hooks.HookResponse(0, 'pre_pull_output')
                  post_pull_result = hooks.HookResponse(1, 'post_pull_output')
                  subprocess_output = more_itertools.always_iterable([b'0008NAK\n0009subp\n0000'])
                  with mock.patch('vcsserver.hooks.git_pre_pull', return_value=pre_pull_result), \
                          mock.patch('vcsserver.hooks.git_post_pull', return_value=post_pull_result), \
                          mock.patch('vcsserver.subprocessio.SubprocessIOChunker', return_value=subprocess_output):
                      response = pygrack_app.post(
                          '/git-upload-pack', params=request,
                          content_type='application/x-git-upload-pack')
                  body_stream = io.BytesIO(response.body)
                  packets = list(dulwich.protocol.Protocol(body_stream.read, None).read_pkt_seq())
                  # pre-pull only outputs if IT FAILS as in != 0 ret code, so
                  # b'\x02pre_pull_output' is not part of the expected packets
                  assert packets == [b'NAK\n', b'subp\n', b'\x02post_pull_output']
              def test_get_want_capabilities(pygrack_instance):
                  """Capabilities are read from the request and the body stays at offset 0."""
                  body = io.BytesIO(
                      b'0054want 74730d410fcb6603ace96f1dc55ea6196122532d '
                      b'multi_ack side-band-64k ofs-delta\n00000009done\n')
                  wsgi_environ = {
                      'wsgi.input': body,
                      'REQUEST_METHOD': 'POST',
                      'webob.is_body_seekable': True
                  }
                  request = webob.Request(wsgi_environ)
                  expected = frozenset((b'ofs-delta', b'multi_ack', b'side-band-64k'))
                  assert pygrack_instance._get_want_capabilities(request) == expected
                  assert body.tell() == 0
              @pytest.mark.parametrize('data,capabilities,expected', [
                  ('foo', [], []),
                  ('', [pygrack.CAPABILITY_SIDE_BAND_64K], []),
                  ('', [pygrack.CAPABILITY_SIDE_BAND], []),
                  ('foo', [pygrack.CAPABILITY_SIDE_BAND_64K], [b'0008\x02foo']),
                  ('foo', [pygrack.CAPABILITY_SIDE_BAND], [b'0008\x02foo']),
                  ('f'*1000, [pygrack.CAPABILITY_SIDE_BAND_64K], [b'03ed\x02' + b'f' * 1000]),
                  ('f'*1000, [pygrack.CAPABILITY_SIDE_BAND], [b'03e8\x02' + b'f' * 995, b'000a\x02fffff']),
                  ('f'*65520, [pygrack.CAPABILITY_SIDE_BAND_64K], [b'fff0\x02' + b'f' * 65515, b'000a\x02fffff']),
                  ('f'*65520, [pygrack.CAPABILITY_SIDE_BAND], [b'03e8\x02' + b'f' * 995] * 65 + [b'0352\x02' + b'f' * 845]),
              ], ids=[
                  'foo-empty',
                  'empty-64k', 'empty',
                  'foo-64k', 'foo',
                  'f-1000-64k', 'f-1000',
                  'f-65520-64k', 'f-65520'])
              def test_get_messages(pygrack_instance, data, capabilities, expected):
                  """``_get_messages`` returns the expected packet list for each case."""
                  assert pygrack_instance._get_messages(data, capabilities) == expected
              @pytest.mark.parametrize('response,capabilities,pre_pull_messages,post_pull_messages', [
                  # Unexpected response
                  ([b'unexpected_response[no_initial_header]'], [pygrack.CAPABILITY_SIDE_BAND_64K], 'foo', 'bar'),
                  # No sideband
                  ([b'no-sideband'], [], 'foo', 'bar'),
                  # No messages
                  ([b'no-messages'], [pygrack.CAPABILITY_SIDE_BAND_64K], '', ''),
              ])
              def test_inject_messages_to_response_nothing_to_do(
                      pygrack_instance, response, capabilities, pre_pull_messages, post_pull_messages):
                  """In these cases the built response equals the original response."""
                  source = more_itertools.always_iterable(response)
                  rebuilt = pygrack_instance._build_post_pull_response(
                      source, capabilities, pre_pull_messages, post_pull_messages)
                  assert list(rebuilt) == response
              @pytest.mark.parametrize('capabilities', [
                  [pygrack.CAPABILITY_SIDE_BAND],
                  [pygrack.CAPABILITY_SIDE_BAND_64K],
              ])
              def test_inject_messages_to_response_single_element(pygrack_instance, capabilities):
                  """Messages are injected into a response that arrives as one chunk."""
                  source = more_itertools.always_iterable([b'0008NAK\n0009subp\n0000'])
                  rebuilt = pygrack_instance._build_post_pull_response(
                      source, capabilities, 'foo', 'bar')
                  expected_response = (
                      b'0008NAK\n'
                      b'0008\x02foo'
                      b'0009subp\n'
                      b'0008\x02bar'
                      b'0000'
                  )
                  assert b''.join(rebuilt) == expected_response
              @pytest.mark.parametrize('capabilities', [
                  [pygrack.CAPABILITY_SIDE_BAND],
                  [pygrack.CAPABILITY_SIDE_BAND_64K],
              ])
              def test_inject_messages_to_response_multi_element(pygrack_instance, capabilities):
                  """Messages are injected into a response that arrives in several chunks."""
                  chunks = [
                      b'0008NAK\n000asubp1\n', b'000asubp2\n', b'000asubp3\n', b'000asubp4\n0000'
                  ]
                  rebuilt = pygrack_instance._build_post_pull_response(
                      more_itertools.always_iterable(chunks), capabilities, 'foo', 'bar')
                  expected_response = (
                      b'0008NAK\n'
                      b'0008\x02foo'
                      b'000asubp1\n' b'000asubp2\n' b'000asubp3\n' b'000asubp4\n'
                      b'0008\x02bar'
                      b'0000'
                  )
                  assert b''.join(rebuilt) == expected_response
              def test_build_failed_pre_pull_response_no_sideband(pygrack_instance):
                  """With no capabilities the failed pre-pull response is just the empty pack."""
                  built = pygrack_instance._build_failed_pre_pull_response([], 'foo')
                  assert built == [pygrack.GitRepository.EMPTY_PACK]
              @pytest.mark.parametrize('capabilities', [
                  [pygrack.CAPABILITY_SIDE_BAND],
                  [pygrack.CAPABILITY_SIDE_BAND_64K],
                  [pygrack.CAPABILITY_SIDE_BAND_64K, b'no-progress'],
              ])
              def test_build_failed_pre_pull_response(pygrack_instance, capabilities):
                  """With side-band the failed pre-pull response has messages, pack and flush."""
                  empty_pack = pygrack.GitRepository.EMPTY_PACK
                  # pack packet: 4-digit hex length, band byte \x01, then the empty pack
                  pack_packet = b'%04x\x01%s' % (len(empty_pack) + 5, empty_pack)
                  expected_response = [
                      b'0008NAK\n', b'0008\x02foo', b'0024\x02Pre pull hook failed: aborting\n',
                      pack_packet,
                      pygrack.GitRepository.FLUSH_PACKET,
                  ]
                  built = pygrack_instance._build_failed_pre_pull_response(capabilities, 'foo')
                  assert built == expected_response
              def test_inject_messages_to_response_generator(pygrack_instance):
                  """Messages are injected when the response is produced by a generator."""
                  body_packets = [ascii_bytes(f'000asubp{x}\n') for x in range(1000)]

                  def response_generator():
                      # protocol start
                      yield b'0008NAK\n'
                      yield from body_packets
                      # protocol end
                      yield pygrack.GitRepository.FLUSH_PACKET

                  new_response = pygrack_instance._build_post_pull_response(
                      response_generator(), [pygrack.CAPABILITY_SIDE_BAND_64K, b'no-progress'], 'PRE_PULL_MSG\n', 'POST_PULL_MSG\n')
                  assert iter(new_response)
                  start = [b'0008NAK\n0012\x02PRE_PULL_MSG\n']
                  final_message = [b'0013\x02POST_PULL_MSG\n0000']
                  expected_response = b''.join(start + body_packets + final_message)
                  assert b''.join(new_response) == expected_response

vcsserver/tests/test_subprocessio.py

0 +1 -1

              # RhodeCode VCSServer provides access to different vcs backends via network.
              # Copyright (C) 2014-2023 RhodeCode GmbH
              #
              # This program is free software; you can redistribute it and/or modify
              # it under the terms of the GNU General Public License as published by
              # the Free Software Foundation; either version 3 of the License, or
              # (at your option) any later version.
              #
              # This program is distributed in the hope that it will be useful,
              # but WITHOUT ANY WARRANTY; without even the implied warranty of
              # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
              # GNU General Public License for more details.
              #
              # You should have received a copy of the GNU General Public License
              # along with this program; if not, write to the Free Software Foundation,
              # Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301  USA
              import io
              import os
              import sys
              import pytest
              from vcsserver import subprocessio
              from vcsserver.str_utils import ascii_bytes
-             class FileLikeObj(object):  # pragma: no cover
+             class FileLikeObj:  # pragma: no cover
                  def __init__(self, data: bytes, size):
                      chunks = size // len(data)
                      self.stream = self._get_stream(data, chunks)
                  def _get_stream(self, data, chunks):
                      for x in range(chunks):
                          yield data
                  def read(self, n):
                      """
                      Return chunks from the stream, joined, until at least ``n`` bytes
                      are collected or the stream is exhausted.

                      Whole chunks are consumed, so the result can be longer than ``n``;
                      an exhausted stream gives ``b''``.
                      """
                      # Collect the chunks and join once instead of growing a bytes
                      # object with ``+=``, which copies the buffer on every step.
                      collected = []
                      collected_size = 0
                      for chunk in self.stream:
                          collected.append(chunk)
                          collected_size += len(chunk)
                          if collected_size >= n:
                              break
                      return b''.join(collected)
              @pytest.fixture(scope='module')
              def environ():
                  """Copy ``os.environ`` without coverage variables, as they make the tests fail."""
                  return {
                      key: value
                      for key, value in os.environ.items()
                      if not key.startswith('COV_CORE_')
                  }
              def _get_python_args(script):
                  """Build the argv that runs ``script`` via ``-c`` after importing sys, time and shutil."""
                  preamble = 'import sys; import time; import shutil; '
                  return [sys.executable, '-c', preamble + script]
              def test_raise_exception_on_non_zero_return_code(environ):
                  """Consuming the output of a failing child process raises ``OSError``."""
                  failing_cmd = _get_python_args('raise ValueError("fail")')
                  with pytest.raises(OSError):
                      chunker = subprocessio.SubprocessIOChunker(failing_cmd, shell=False, env=environ)
                      b''.join(chunker)
              def test_does_not_fail_on_non_zero_return_code(environ):
                  """With ``fail_on_return_code=False`` the output of an exit-1 child is returned."""
                  cmd = _get_python_args('sys.stdout.write("hello"); sys.exit(1)')
                  chunker = subprocessio.SubprocessIOChunker(
                      cmd, shell=False, fail_on_return_code=False, env=environ)
                  assert b''.join(chunker) == b'hello'
              def test_raise_exception_on_stderr(environ):
                  """A child writing to stderr raises ``OSError`` whose message holds that text."""
                  cmd = _get_python_args('sys.stderr.write("WRITE_TO_STDERR"); time.sleep(1);')
                  with pytest.raises(OSError) as excinfo:
                      chunker = subprocessio.SubprocessIOChunker(cmd, shell=False, env=environ)
                      b''.join(chunker)
                  error_text = str(excinfo.value)
                  assert 'exited due to an error:\nWRITE_TO_STDERR' in error_text
              def test_does_not_fail_on_stderr(environ):
                  """With ``fail_on_stderr=False`` stderr output is tolerated and stdout is empty."""
                  # flush() must actually be called: a bare ``sys.stderr.flush`` only
                  # evaluates the attribute and flushes nothing.
                  call_args = _get_python_args(
                      'sys.stderr.write("WRITE_TO_STDERR"); sys.stderr.flush(); time.sleep(2);')
                  proc = subprocessio.SubprocessIOChunker(call_args, shell=False, fail_on_stderr=False, env=environ)
                  output = b''.join(proc)
                  assert output == b''
              @pytest.mark.parametrize('size', [
                  1,
                  10 ** 5
              ])
              def test_output_with_no_input(size, environ):
                  """A child writing ``size`` characters to stdout yields exactly that output."""
                  call_args = _get_python_args(f'sys.stdout.write("X" * {size});')
                  proc = subprocessio.SubprocessIOChunker(call_args, shell=False, env=environ)
                  output = b''.join(proc)
                  assert output == ascii_bytes("X" * size)
              @pytest.mark.parametrize('size', [
                  1,
                  10 ** 5
              ])
              def test_output_with_no_input_does_not_fail(size, environ):
                  """The full stdout is returned for an exit-1 child when return codes are ignored."""
                  call_args = _get_python_args(f'sys.stdout.write("X" * {size}); sys.exit(1)')
                  proc = subprocessio.SubprocessIOChunker(call_args, shell=False, fail_on_return_code=False, env=environ)
                  output = b''.join(proc)
                  assert output == ascii_bytes("X" * size)
              @pytest.mark.parametrize('size', [
                  1,
                  10 ** 5
              ])
              def test_output_with_input(size, environ):
                  """Input streamed to a cat-like child comes back with the same length."""
                  inputstream = FileLikeObj(b'X', size)
                  # This acts like the cat command.
                  call_args = _get_python_args('shutil.copyfileobj(sys.stdin, sys.stdout)')
                  # note: in this test we explicitly don't assign the chunker to a variable
                  # and let it stream directly
                  output = b''.join(
                      subprocessio.SubprocessIOChunker(call_args, shell=False, input_stream=inputstream, env=environ)
                  )
                  assert len(output) == size
              @pytest.mark.parametrize('size', [
                  1,
                  10 ** 5
              ])
              def test_output_with_input_skipping_iterator(size, environ):
                  """Reading ``proc.stdout`` directly returns output of the same length as the input."""
                  inputstream = FileLikeObj(b'X', size)
                  # This acts like the cat command.
                  call_args = _get_python_args('shutil.copyfileobj(sys.stdin, sys.stdout)')
                  # Note: assigning the chunker makes sure that it is not deleted too early
                  proc = subprocessio.SubprocessIOChunker(call_args, shell=False, input_stream=inputstream, env=environ)
                  output = b''.join(proc.stdout)
                  assert len(output) == size

vcsserver/tests/test_svn.py

0 +1 -1

              # RhodeCode VCSServer provides access to different vcs backends via network.
              # Copyright (C) 2014-2023 RhodeCode GmbH
              #
              # This program is free software; you can redistribute it and/or modify
              # it under the terms of the GNU General Public License as published by
              # the Free Software Foundation; either version 3 of the License, or
              # (at your option) any later version.
              #
              # This program is distributed in the hope that it will be useful,
              # but WITHOUT ANY WARRANTY; without even the implied warranty of
              # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
              # GNU General Public License for more details.
              #
              # You should have received a copy of the GNU General Public License
              # along with this program; if not, write to the Free Software Foundation,
              # Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301  USA
              import io
              import mock
              import pytest
              import sys
              from vcsserver.str_utils import ascii_bytes
-             class MockPopen(object):
+             class MockPopen:
                  def __init__(self, stderr):
                      self.stdout = io.BytesIO(b'')
                      self.stderr = io.BytesIO(stderr)
                      self.returncode = 1
                  def wait(self):
                      """No-op stand-in for ``Popen.wait``; always returns ``None``."""
                      return None
              # Two-line svnrdump stderr sample (newline-joined); the parametrized import
              # test in this file pairs it with the 'INVALID_CERTIFICATE' reason.
              INVALID_CERTIFICATE_STDERR = '\n'.join([
                  'svnrdump: E230001: Unable to connect to a repository at URL url',
                  'svnrdump: E230001: Server SSL certificate verification failed: issuer is not trusted',
              ])
              @pytest.mark.parametrize(
                  'stderr,expected_reason',
                  [
                      (INVALID_CERTIFICATE_STDERR, 'INVALID_CERTIFICATE'),
                      ('svnrdump: E123456', 'UNKNOWN:svnrdump: E123456'),
                  ],
                  ids=['invalid-cert-stderr', 'svnrdump-err-123456'],
              )
              @pytest.mark.xfail(sys.platform == "cygwin", reason="SVN not packaged for Cygwin")
              def test_import_remote_repository_certificate_error(stderr, expected_reason):
                  """A failing dump must raise with the reason derived from the process stderr.

                  ``subprocess.Popen`` is patched to return a ``MockPopen`` carrying
                  ``stderr``; the first argument of the raised exception has to match the
                  expected message for ``expected_reason``.
                  """
                  from vcsserver.remote import svn_remote
                  repo_factory = mock.Mock()
                  repo_factory.repo = mock.Mock(return_value=mock.Mock())
                  svn_backend = svn_remote.SvnRemote(repo_factory)
                  svn_backend.is_path_valid_repository = lambda wire, path: True
                  fake_process = MockPopen(ascii_bytes(stderr))
                  popen_patch = mock.patch('subprocess.Popen', return_value=fake_process)
                  with popen_patch, pytest.raises(Exception) as excinfo:
                      svn_backend.import_remote_repository({'path': 'path'}, 'url')
                  expected_error_args = 'Failed to dump the remote repository from url. Reason:{}'.format(expected_reason)
                  raised_message = excinfo.value.args[0]
                  assert raised_message == expected_error_args
              def test_svn_libraries_can_be_imported():
                  """Smoke test: importing ``svn.client`` succeeds and yields a non-``None`` object."""
                  import svn.client as svn_client  # noqa
                  assert svn_client is not None
              @pytest.mark.parametrize(
                  'example_url, parts',
                  [
                      ('http://server.com', ('', '', 'http://server.com')),
                      ('http://user@server.com', ('user', '', 'http://user@server.com')),
                      ('http://user:pass@server.com', ('user', 'pass', 'http://user:pass@server.com')),
                      ('<script>', ('', '', '<script>')),
                      ('http://', ('', '', 'http://')),
                  ],
              )
              def test_username_password_extraction_from_url(example_url, parts):
                  """``get_url_and_credentials`` must return the expected 3-tuple for each sample URL."""
                  from vcsserver.remote import svn_remote
                  repo_factory = mock.Mock()
                  repo_factory.repo = mock.Mock(return_value=mock.Mock())
                  svn_backend = svn_remote.SvnRemote(repo_factory)
                  svn_backend.is_path_valid_repository = lambda wire, path: True
                  extracted = svn_backend.get_url_and_credentials(example_url)
                  assert extracted == parts
              @pytest.mark.parametrize(
                  'call_url',
                  [
                      b'https://svn.code.sf.net/p/svnbook/source/trunk/',
                      b'https://marcink@svn.code.sf.net/p/svnbook/source/trunk/',
                      b'https://marcink:qweqwe@svn.code.sf.net/p/svnbook/source/trunk/',
                  ],
              )
              def test_check_url(call_url):
                  """``check_url`` must return a truthy value for each sample URL (plain, user, user:password)."""
                  from vcsserver.remote import svn_remote
                  repo_factory = mock.Mock()
                  repo_factory.repo = mock.Mock(return_value=mock.Mock())
                  svn_backend = svn_remote.SvnRemote(repo_factory)
                  svn_backend.is_path_valid_repository = lambda wire, path: True
                  url_ok = svn_backend.check_url(call_url, {'dummy': 'config'})
                  assert url_ok

vcsserver/tweens/request_wrapper.py

0 +1 -1

              # RhodeCode VCSServer provides access to different vcs backends via network.
              # Copyright (C) 2014-2023 RhodeCode GmbH
              #
              # This program is free software; you can redistribute it and/or modify
              # it under the terms of the GNU General Public License as published by
              # the Free Software Foundation; either version 3 of the License, or
              # (at your option) any later version.
              #
              # This program is distributed in the hope that it will be useful,
              # but WITHOUT ANY WARRANTY; without even the implied warranty of
              # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
              # GNU General Public License for more details.
              #
              # You should have received a copy of the GNU General Public License
              # along with this program; if not, write to the Free Software Foundation,
              # Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301  USA
              import base64
              import logging
              import time
              import msgpack
              import vcsserver
              from vcsserver.str_utils import safe_str
              log = logging.getLogger(__name__)
              def get_access_path(environ):
                  """Return the ``PATH_INFO`` entry of ``environ``, or ``None`` when it is absent."""
                  return environ.get('PATH_INFO')
              def get_user_agent(environ):
                  """Return the ``HTTP_USER_AGENT`` entry of ``environ``, or ``None`` when it is absent."""
                  user_agent = environ.get('HTTP_USER_AGENT')
                  return user_agent
              def get_call_context(request) -> dict:
                  """Build the ``X-RC-*`` call-context mapping for ``request``.

                  :param request: object whose ``registry`` may carry a ``vcs_call_context`` mapping
                  :returns: an empty dict when the registry has no ``vcs_call_context``;
                      otherwise a dict with ``X-RC-Method`` and ``X-RC-Repo-Name`` taken from
                      its ``method`` and ``repo_name`` entries (``None`` for missing entries)
                  """
                  registry = request.registry
                  if not hasattr(registry, 'vcs_call_context'):
                      return {}
                  vcs_context = registry.vcs_call_context
                  return {
                      'X-RC-Method': vcs_context.get('method'),
                      'X-RC-Repo-Name': vcs_context.get('repo_name'),
                  }
              def get_headers_call_context(environ, strict=True):
                  """Decode the call context carried in ``HTTP_X_RC_VCS_STREAM_CALL_CONTEXT``.

                  The header value is base64-decoded and then unpacked with msgpack.

                  :param environ: mapping that may contain the header
                  :param strict: when true, a missing header raises instead of returning ``None``
                  :returns: the unpacked value, or ``None`` if the header is absent and ``strict`` is false
                  :raises ValueError: if the header is absent and ``strict`` is true
                  """
                  if 'HTTP_X_RC_VCS_STREAM_CALL_CONTEXT' not in environ:
                      if strict:
                          raise ValueError('Expected header HTTP_X_RC_VCS_STREAM_CALL_CONTEXT not found')
                      return None
                  encoded_cc = environ['HTTP_X_RC_VCS_STREAM_CALL_CONTEXT']
                  return msgpack.unpackb(base64.b64decode(encoded_cc))
-             class RequestWrapperTween(object):
+             class RequestWrapperTween:
                  def __init__(self, handler, registry):
                      self.handler = handler
                      self.registry = registry
                      # one-time configuration code goes here
                  def __call__(self, request):
                      """Run the wrapped handler, then log timing and emit statsd metrics.

                      The reporting lives in a ``finally`` block, so it also runs when the
                      handler raises; in that case ``response`` is still ``None`` and the
                      reported code is ``'UNDEFINED'``.

                      :param request: request passed through to the handler; its ``environ``,
                          ``registry``, ``matched_route`` and ``request_count()`` are read here
                      :returns: whatever the handler returned
                      """
                      start = time.time()
                      log.debug('Starting request time measurement')
                      response = None
                      try:
                          response = self.handler(request)
                      finally:
                          ua = get_user_agent(request.environ)
                          call_context = get_call_context(request)
                          # the defaults below apply when the call context carries no such key
                          vcs_method = call_context.get('X-RC-Method', '_NO_VCS_METHOD')
                          repo_name = call_context.get('X-RC-Repo-Name', '')
                          count = request.request_count()
                          _ver_ = vcsserver.__version__
                          _path = safe_str(get_access_path(request.environ))
                          # the logged IP is a fixed literal, not taken from the request
                          ip = '127.0.0.1'
                          match_route = request.matched_route.name if request.matched_route else "NOT_FOUND"
                          # 'UNDEFINED' when the response object has no status_code attribute
                          resp_code = getattr(response, 'status_code', 'UNDEFINED')
                          _view_path = f"{repo_name}@{_path}/{vcs_method}"
                          # elapsed wall-clock seconds, including the bookkeeping above
                          total = time.time() - start
                          log.info(
                              'Req[%4s] IP: %s %s Request to %s time: %.4fs [%s], VCSServer %s',
                              count, ip, request.environ.get('REQUEST_METHOD'),
                              _view_path, total, ua, _ver_,
                              extra={"time": total, "ver": _ver_, "code": resp_code,
                                     "path": _path, "view_name": match_route, "user_agent": ua,
                                     "vcs_method": vcs_method, "repo_name": repo_name}
                          )
                          statsd = request.registry.statsd
                          if statsd:
                              # for metrics an unmatched route is tagged with the raw path instead of "NOT_FOUND"
                              match_route = request.matched_route.name if request.matched_route else _path
                              elapsed_time_ms = round(1000.0 * total)  # use ms only
                              statsd.timing(
                                  "vcsserver_req_timing.histogram", elapsed_time_ms,
                                  tags=[
                                      f"view_name:{match_route}",
                                      f"code:{resp_code}"
                                  ],
                                  use_decimals=False
                              )
                              statsd.incr(
                                  "vcsserver_req_total", tags=[
                                      f"view_name:{match_route}",
                                      f"code:{resp_code}"
                                  ])
                      return response
              def includeme(config):
                  """Register ``RequestWrapperTween`` on ``config`` via its dotted path."""
                  tween_factory = 'vcsserver.tweens.request_wrapper.RequestWrapperTween'
                  config.add_tween(tween_factory)

vcsserver/vcs_base.py

0 +1 -1

              # RhodeCode VCSServer provides access to different vcs backends via network.
              # Copyright (C) 2014-2023 RhodeCode GmbH
              #
              # This program is free software; you can redistribute it and/or modify
              # it under the terms of the GNU General Public License as published by
              # the Free Software Foundation; either version 3 of the License, or
              # (at your option) any later version.
              #
              # This program is distributed in the hope that it will be useful,
              # but WITHOUT ANY WARRANTY; without even the implied warranty of
              # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
              # GNU General Public License for more details.
              #
              # You should have received a copy of the GNU General Public License
              # along with this program; if not, write to the Free Software Foundation,
              # Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301  USA
              from vcsserver.lib import rc_cache
-             class RemoteBase(object):
+             class RemoteBase:
                  # String of forty '0' characters; presumably the all-zero commit id meaning
                  # "no commit" -- confirm against the backends that use it.
                  EMPTY_COMMIT = '0' * 40
                  def _region(self, wire):
                      """Return the ``repo_object`` cache region for the repository described by ``wire``.

                      The region namespace is built from ``rc_cache.CACHE_OBJ_CACHE_VER`` and
                      the ``cache_repo_id`` entry of ``wire`` (empty string when missing).
                      """
                      repo_cache_id = wire.get('cache_repo_id', '')
                      namespace_uid = f'cache_repo.{rc_cache.CACHE_OBJ_CACHE_VER}.{repo_cache_id}'
                      region = rc_cache.get_or_create_region('repo_object', namespace_uid)
                      return region
                  def _cache_on(self, wire):
                      context = wire.get('context', '')
                      context_uid = f'{context}'
                      repo_id = wire.get('repo_id', '')
                      cache = wire.get('cache', True)
                      cache_on = context and cache
                      return cache_on, context_uid, repo_id
                  def vcsserver_invalidate_cache(self, wire, delete):
                      """Optionally clear the repository's ``repo_object`` cache namespace and report it.

                      :param wire: mapping read for ``cache_repo_id`` and ``repo_id``
                      :param delete: when truthy the namespace is cleared with
                          ``rc_cache.CLEAR_DELETE``; when falsy nothing is cleared
                      :returns: ``{'invalidated': {'repo_id': ..., 'delete': delete}}``
                      """
                      repo_cache_id = wire.get('cache_repo_id', '')
                      namespace_uid = f'cache_repo.{rc_cache.CACHE_OBJ_CACHE_VER}.{repo_cache_id}'
                      if delete:
                          rc_cache.clear_cache_namespace('repo_object', namespace_uid, method=rc_cache.CLEAR_DELETE)
                      report = {'repo_id': wire.get('repo_id', ''), 'delete': delete}
                      return {'invalidated': report}

vcsserver/wsgi_app_caller.py

0 +2 -2

              # RhodeCode VCSServer provides access to different vcs backends via network.
              # Copyright (C) 2014-2023 RhodeCode GmbH
              #
              # This program is free software; you can redistribute it and/or modify
              # it under the terms of the GNU General Public License as published by
              # the Free Software Foundation; either version 3 of the License, or
              # (at your option) any later version.
              #
              # This program is distributed in the hope that it will be useful,
              # but WITHOUT ANY WARRANTY; without even the implied warranty of
              # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
              # GNU General Public License for more details.
              #
              # You should have received a copy of the GNU General Public License
              # along with this program; if not, write to the Free Software Foundation,
              # Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301  USA
              """Extract the responses of a WSGI app."""
              __all__ = ('WSGIAppCaller',)
              import io
              import logging
              import os
              from vcsserver.str_utils import ascii_bytes
              log = logging.getLogger(__name__)
              # Shared sink handed to wrapped apps as ``wsgi.errors``. PEP 3333 defines that
              # stream as a text-mode output stream, so the null device is opened for
              # writing (a read-only handle would raise on the first write). It is opened
              # once at import time and stays open for the lifetime of the process.
              DEV_NULL = open(os.devnull, 'w')
              def _complete_environ(environ, input_data: bytes):
                  """Fill in the ``wsgi.*`` entries of a WSGI environment, in place.

                  Every key listed below is set unconditionally, so values already stored
                  under those keys are replaced. Nothing is returned.

                  :param environ: WSGI environment to update
                  :type environ: dict
                  :param input_data: data to be read by the app
                  :type input_data: bytes
                  """
                  wsgi_entries = {
                      'wsgi.version': (1, 0),
                      'wsgi.url_scheme': 'http',
                      'wsgi.multithread': True,
                      'wsgi.multiprocess': True,
                      'wsgi.run_once': False,
                      # the request body is served from an in-memory buffer
                      'wsgi.input': io.BytesIO(input_data),
                      'wsgi.errors': DEV_NULL,
                  }
                  environ.update(wsgi_entries)
              # pylint: disable=too-few-public-methods
-             class _StartResponse(object):
+             class _StartResponse:
                  """Save the arguments of a start_response call."""
                  __slots__ = ['status', 'headers', 'content']
                  def __init__(self):
                      self.status = None
                      self.headers = None
                      self.content = []
                  def __call__(self, status, headers, exc_info=None):
                      # TODO(skreft): do something meaningful with the exc_info
                      exc_info = None  # avoid dangling circular reference
                      self.status = status
                      self.headers = headers
                      return self.write
                  def write(self, content):
                      """Write method returning when calling this object.
                      All the data written is then available in content.
                      """
                      self.content.append(content)
-             class WSGIAppCaller(object):
+             class WSGIAppCaller:
                  """Calls a WSGI app."""
                  def __init__(self, app):
                      """
                      Store the application that ``handle`` will invoke.

                      :param app: WSGI app to call
                      """
                      self.app = app
                  def handle(self, environ, input_data):
                      """Process a request with the WSGI app.

                      The returned data of the app is fully consumed into a list. Chunks the
                      app pushed through the ``write()`` callable come first, followed by the
                      chunks produced by the returned iterable.

                      If the iterable has a ``close()`` method it is always called, even when
                      consuming it raises (as PEP 3333 requires); the exception still
                      propagates to the caller.

                      :param environ: WSGI environment to update
                      :type environ: dict
                      :param input_data: data to be read by the app
                      :type input_data: str/bytes
                      :returns: a tuple with the contents, status and headers
                      :rtype: (list<str>, str, list<(str, str)>)
                      """
                      _complete_environ(environ, ascii_bytes(input_data, allow_bytes=True))
                      start_response = _StartResponse()
                      log.debug("Calling wrapped WSGI application")
                      responses = self.app(environ, start_response)
                      try:
                          responses_list = list(responses)
                          existing_responses = start_response.content
                          if existing_responses:
                              log.debug("Adding returned response to response written via write()")
                              existing_responses.extend(responses_list)
                              responses_list = existing_responses
                      finally:
                          # release the app's resources even if iteration failed part-way
                          if hasattr(responses, 'close'):
                              log.debug("Closing iterator from WSGI application")
                              responses.close()
                      log.debug("Handling of WSGI request done, returning response")
                      return responses_list, start_response.status, start_response.headers

General Comments 0

Write
Preview

You need to be logged in to leave comments. Login now

No TODOs yet

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages