@@ -1,1131 +1,1131 b''
|
1 | 1 | # absorb.py |
|
2 | 2 | # |
|
3 | 3 | # Copyright 2016 Facebook, Inc. |
|
4 | 4 | # |
|
5 | 5 | # This software may be used and distributed according to the terms of the |
|
6 | 6 | # GNU General Public License version 2 or any later version. |
|
7 | 7 | |
|
8 | 8 | """apply working directory changes to changesets (EXPERIMENTAL) |
|
9 | 9 | |
|
10 | 10 | The absorb extension provides a command to use annotate information to |
|
11 | 11 | amend modified chunks into the corresponding non-public changesets. |
|
12 | 12 | |
|
13 | 13 | :: |
|
14 | 14 | |
|
15 | 15 | [absorb] |
|
16 | 16 | # only check 50 recent non-public changesets at most |
|
17 | 17 | max-stack-size = 50 |
|
18 | 18 | # whether to add noise to new commits to avoid obsolescence cycle |
|
19 | 19 | add-noise = 1 |
|
20 | 20 | # make `amend --correlated` a shortcut to the main command |
|
21 | 21 | amend-flag = correlated |
|
22 | 22 | |
|
23 | 23 | [color] |
|
24 | 24 | absorb.description = yellow |
|
25 | 25 | absorb.node = blue bold |
|
26 | 26 | absorb.path = bold |
|
27 | 27 | """ |
|
28 | 28 | |
|
29 | 29 | # TODO: |
|
30 | 30 | # * Rename config items to [commands] namespace |
|
31 | 31 | # * Converge getdraftstack() with other code in core |
|
32 | 32 | # * move many attributes on fixupstate to be private |
|
33 | 33 | |
|
34 | 34 | from __future__ import absolute_import |
|
35 | 35 | |
|
36 | 36 | import collections |
|
37 | 37 | |
|
38 | 38 | from mercurial.i18n import _ |
|
39 | 39 | from mercurial import ( |
|
40 | 40 | cmdutil, |
|
41 | 41 | commands, |
|
42 | 42 | context, |
|
43 | 43 | crecord, |
|
44 | 44 | error, |
|
45 | 45 | linelog, |
|
46 | 46 | mdiff, |
|
47 | 47 | node, |
|
48 | 48 | obsolete, |
|
49 | 49 | patch, |
|
50 | 50 | phases, |
|
51 | 51 | pycompat, |
|
52 | 52 | registrar, |
|
53 | 53 | scmutil, |
|
54 | 54 | util, |
|
55 | 55 | ) |
|
56 | 56 | from mercurial.utils import stringutil |
|
57 | 57 | |
|
58 | 58 | # Note for extension authors: ONLY specify testedwith = 'ships-with-hg-core' for |
|
59 | 59 | # extensions which SHIP WITH MERCURIAL. Non-mainline extensions should |
|
60 | 60 | # be specifying the version(s) of Mercurial they are tested with, or |
|
61 | 61 | # leave the attribute unspecified. |
|
62 | 62 | testedwith = b'ships-with-hg-core' |
|
63 | 63 | |
|
64 | 64 | cmdtable = {} |
|
65 | 65 | command = registrar.command(cmdtable) |
|
66 | 66 | |
|
67 | 67 | configtable = {} |
|
68 | 68 | configitem = registrar.configitem(configtable) |
|
69 | 69 | |
|
70 | 70 | configitem(b'absorb', b'add-noise', default=True) |
|
71 | 71 | configitem(b'absorb', b'amend-flag', default=None) |
|
72 | 72 | configitem(b'absorb', b'max-stack-size', default=50) |
|
73 | 73 | |
|
74 | 74 | colortable = { |
|
75 | 75 | b'absorb.description': b'yellow', |
|
76 | 76 | b'absorb.node': b'blue bold', |
|
77 | 77 | b'absorb.path': b'bold', |
|
78 | 78 | } |
|
79 | 79 | |
|
80 | 80 | defaultdict = collections.defaultdict |
|
81 | 81 | |
|
82 | 82 | |
|
83 | 83 | class nullui(object): |
|
84 | 84 | """blank ui object doing nothing""" |
|
85 | 85 | |
|
86 | 86 | debugflag = False |
|
87 | 87 | verbose = False |
|
88 | 88 | quiet = True |
|
89 | 89 | |
|
90 | 90 | def __getitem__(name): |
|
91 | 91 | def nullfunc(*args, **kwds): |
|
92 | 92 | return |
|
93 | 93 | |
|
94 | 94 | return nullfunc |
|
95 | 95 | |
|
96 | 96 | |
|
97 | 97 | class emptyfilecontext(object): |
|
98 | 98 | """minimal filecontext representing an empty file""" |
|
99 | 99 | |
|
100 | 100 | def data(self): |
|
101 | 101 | return b'' |
|
102 | 102 | |
|
103 | 103 | def node(self): |
|
104 | 104 | return node.nullid |
|
105 | 105 | |
|
106 | 106 | |
|
107 | 107 | def uniq(lst): |
|
108 | 108 | """list -> list. remove duplicated items without changing the order""" |
|
109 | 109 | seen = set() |
|
110 | 110 | result = [] |
|
111 | 111 | for x in lst: |
|
112 | 112 | if x not in seen: |
|
113 | 113 | seen.add(x) |
|
114 | 114 | result.append(x) |
|
115 | 115 | return result |
|
116 | 116 | |
|
117 | 117 | |
|
118 | 118 | def getdraftstack(headctx, limit=None): |
|
119 | 119 | """(ctx, int?) -> [ctx]. get a linear stack of non-public changesets. |
|
120 | 120 | |
|
121 | 121 | changesets are sorted in topo order, oldest first. |
|
122 | 122 | return at most limit items, if limit is a positive number. |
|
123 | 123 | |
|
124 | 124 | merges are considered non-draft as well, i.e. every commit |

125 | 125 | returned has exactly 1 parent. |
|
126 | 126 | """ |
|
127 | 127 | ctx = headctx |
|
128 | 128 | result = [] |
|
129 | 129 | while ctx.phase() != phases.public: |
|
130 | 130 | if limit and len(result) >= limit: |
|
131 | 131 | break |
|
132 | 132 | parents = ctx.parents() |
|
133 | 133 | if len(parents) != 1: |
|
134 | 134 | break |
|
135 | 135 | result.append(ctx) |
|
136 | 136 | ctx = parents[0] |
|
137 | 137 | result.reverse() |
|
138 | 138 | return result |
|
139 | 139 | |
|
140 | 140 | |
|
141 | 141 | def getfilestack(stack, path, seenfctxs=None): |
|
142 | 142 | """([ctx], str, set) -> [fctx], {ctx: fctx} |
|
143 | 143 | |
|
144 | 144 | stack is a list of contexts, from old to new. usually they are what |
|
145 | 145 | "getdraftstack" returns. |
|
146 | 146 | |
|
147 | 147 | follows renames, but not copies. |
|
148 | 148 | |
|
149 | 149 | seenfctxs is a set of filecontexts that will be considered "immutable". |
|
150 | 150 | they are usually what this function returned in earlier calls, useful |
|
151 | 151 | to avoid issues where a file was "moved" to multiple places and was then |
|
152 | 152 | modified differently, like: "a" was copied to "b", "a" was also copied to |
|
153 | 153 | "c" and then "a" was deleted, then both "b" and "c" were "moved" from "a" |
|
154 | 154 | and we enforce only one of them to be able to affect "a"'s content. |
|
155 | 155 | |
|
156 | 156 | return an empty list and an empty dict, if the specified path does not |
|
157 | 157 | exist in stack[-1] (the top of the stack). |
|
158 | 158 | |
|
159 | 159 | otherwise, return a list of de-duplicated filecontexts, and the map to |
|
160 | 160 | convert ctx in the stack to fctx, for possible mutable fctxs. the first item |
|
161 | 161 | of the list would be outside the stack and should be considered immutable. |
|
162 | 162 | the remaining items are within the stack. |
|
163 | 163 | |
|
164 | 164 | for example, given the following changelog and corresponding filelog |
|
165 | 165 | revisions: |
|
166 | 166 | |
|
167 | 167 | changelog: 3----4----5----6----7 |
|
168 | 168 | filelog: x 0----1----1----2 (x: no such file yet) |
|
169 | 169 | |
|
170 | 170 | - if stack = [5, 6, 7], returns ([0, 1, 2], {5: 1, 6: 1, 7: 2}) |
|
171 | 171 | - if stack = [3, 4, 5], returns ([e, 0, 1], {4: 0, 5: 1}), where "e" is a |
|
172 | 172 | dummy empty filecontext. |
|
173 | 173 | - if stack = [2], returns ([], {}) |
|
174 | 174 | - if stack = [7], returns ([1, 2], {7: 2}) |
|
175 | 175 | - if stack = [6, 7], returns ([1, 2], {6: 1, 7: 2}), although {6: 1} can be |
|
176 | 176 | removed, since 1 is immutable. |
|
177 | 177 | """ |
|
178 | 178 | if seenfctxs is None: |
|
179 | 179 | seenfctxs = set() |
|
180 | 180 | assert stack |
|
181 | 181 | |
|
182 | 182 | if path not in stack[-1]: |
|
183 | 183 | return [], {} |
|
184 | 184 | |
|
185 | 185 | fctxs = [] |
|
186 | 186 | fctxmap = {} |
|
187 | 187 | |
|
188 | 188 | pctx = stack[0].p1() # the public (immutable) ctx we stop at |
|
189 | 189 | for ctx in reversed(stack): |
|
190 | 190 | if path not in ctx: # the file is added in the next commit |
|
191 | 191 | pctx = ctx |
|
192 | 192 | break |
|
193 | 193 | fctx = ctx[path] |
|
194 | 194 | fctxs.append(fctx) |
|
195 | 195 | if fctx in seenfctxs: # treat fctx as the immutable one |
|
196 | 196 | pctx = None # do not add another immutable fctx |
|
197 | 197 | break |
|
198 | 198 | fctxmap[ctx] = fctx # only for mutable fctxs |
|
199 | 199 | copy = fctx.copysource() |
|
200 | 200 | if copy: |
|
201 | 201 | path = copy # follow rename |
|
202 | 202 | if path in ctx: # but do not follow copy |
|
203 | 203 | pctx = ctx.p1() |
|
204 | 204 | break |
|
205 | 205 | |
|
206 | 206 | if pctx is not None: # need an extra immutable fctx |
|
207 | 207 | if path in pctx: |
|
208 | 208 | fctxs.append(pctx[path]) |
|
209 | 209 | else: |
|
210 | 210 | fctxs.append(emptyfilecontext()) |
|
211 | 211 | |
|
212 | 212 | fctxs.reverse() |
|
213 | 213 | # note: we rely on a property of hg: filerev is not reused for linear |
|
214 | 214 | # history. i.e. it's impossible to have: |
|
215 | 215 | # changelog: 4----5----6 (linear, no merges) |
|
216 | 216 | # filelog: 1----2----1 |
|
217 | 217 | # ^ reuse filerev (impossible) |
|
218 | 218 | # because parents are part of the hash. if that's not true, we need to |
|
219 | 219 | # remove uniq and find a different way to identify fctxs. |
|
220 | 220 | return uniq(fctxs), fctxmap |
|
221 | 221 | |
|
222 | 222 | |
|
223 | 223 | class overlaystore(patch.filestore): |
|
224 | 224 | """read-only, hybrid store based on a dict and ctx. |
|
225 | 225 | memworkingcopy: {path: content}, overrides file contents. |
|
226 | 226 | """ |
|
227 | 227 | |
|
228 | 228 | def __init__(self, basectx, memworkingcopy): |
|
229 | 229 | self.basectx = basectx |
|
230 | 230 | self.memworkingcopy = memworkingcopy |
|
231 | 231 | |
|
232 | 232 | def getfile(self, path): |
|
233 | 233 | """comply with mercurial.patch.filestore.getfile""" |
|
234 | 234 | if path not in self.basectx: |
|
235 | 235 | return None, None, None |
|
236 | 236 | fctx = self.basectx[path] |
|
237 | 237 | if path in self.memworkingcopy: |
|
238 | 238 | content = self.memworkingcopy[path] |
|
239 | 239 | else: |
|
240 | 240 | content = fctx.data() |
|
241 | 241 | mode = (fctx.islink(), fctx.isexec()) |
|
242 | 242 | copy = fctx.copysource() |
|
243 | 243 | return content, mode, copy |
|
244 | 244 | |
|
245 | 245 | |
|
246 | 246 | def overlaycontext(memworkingcopy, ctx, parents=None, extra=None): |
|
247 | 247 | """({path: content}, ctx, (p1node, p2node)?, {}?) -> memctx |
|
248 | 248 | memworkingcopy overrides file contents. |
|
249 | 249 | """ |
|
250 | 250 | # parents must contain 2 items: (node1, node2) |
|
251 | 251 | if parents is None: |
|
252 | 252 | parents = ctx.repo().changelog.parents(ctx.node()) |
|
253 | 253 | if extra is None: |
|
254 | 254 | extra = ctx.extra() |
|
255 | 255 | date = ctx.date() |
|
256 | 256 | desc = ctx.description() |
|
257 | 257 | user = ctx.user() |
|
258 | 258 | files = set(ctx.files()).union(memworkingcopy) |
|
259 | 259 | store = overlaystore(ctx, memworkingcopy) |
|
260 | 260 | return context.memctx( |
|
261 | 261 | repo=ctx.repo(), |
|
262 | 262 | parents=parents, |
|
263 | 263 | text=desc, |
|
264 | 264 | files=files, |
|
265 | 265 | filectxfn=store, |
|
266 | 266 | user=user, |
|
267 | 267 | date=date, |
|
268 | 268 | branch=None, |
|
269 | 269 | extra=extra, |
|
270 | 270 | ) |
|
271 | 271 | |
|
272 | 272 | |
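overlaycontext() above is the in-memory commit mechanism the rest of the extension builds on; fixupstate._commitsingle() further down calls it with a {path: content} overlay. A minimal usage sketch follows, assuming the caller already holds the repository locks; the helper name is illustrative and not part of the extension.

    # Sketch: rewrite ctx so that one file gets new contents, entirely in
    # memory.  This mirrors what fixupstate._commitsingle() does below.
    def amend_file_in_memory(repo, ctx, path, newdata):
        memworkingcopy = {path: newdata}            # {path: content} overlay
        mctx = overlaycontext(memworkingcopy, ctx)  # memctx cloned from ctx
        newnode = mctx.commit()                     # writes the new changeset
        return repo[newnode]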
|
273 | 273 | class filefixupstate(object): |
|
274 | 274 | """state needed to apply fixups to a single file |
|
275 | 275 | |
|
276 | 276 | internally, it keeps file contents of several revisions and a linelog. |
|
277 | 277 | |
|
278 | 278 | the linelog uses odd revision numbers for original contents (fctxs passed |
|
279 | 279 | to __init__), and even revision numbers for fixups, like: |
|
280 | 280 | |
|
281 | 281 | linelog rev 1: self.fctxs[0] (from an immutable "public" changeset) |
|
282 | 282 | linelog rev 2: fixups made to self.fctxs[0] |
|
283 | 283 | linelog rev 3: self.fctxs[1] (a child of fctxs[0]) |
|
284 | 284 | linelog rev 4: fixups made to self.fctxs[1] |
|
285 | 285 | ... |
|
286 | 286 | |
|
287 | 287 | a typical use is like: |
|
288 | 288 | |
|
289 | 289 | 1. call diffwith, to calculate self.fixups |
|
290 | 290 | 2. (optionally), present self.fixups to the user, or change it |
|
291 | 291 | 3. call apply, to apply changes |
|
292 | 292 | 4. read results from "finalcontents", or call getfinalcontent |
|
293 | 293 | """ |
|
294 | 294 | |
|
295 | 295 | def __init__(self, fctxs, path, ui=None, opts=None): |
|
296 | 296 | """([fctx], ui or None) -> None |
|
297 | 297 | |
|
298 | 298 | fctxs should be linear, and sorted by topo order - oldest first. |
|
299 | 299 | fctxs[0] will be considered as "immutable" and will not be changed. |
|
300 | 300 | """ |
|
301 | 301 | self.fctxs = fctxs |
|
302 | 302 | self.path = path |
|
303 | 303 | self.ui = ui or nullui() |
|
304 | 304 | self.opts = opts or {} |
|
305 | 305 | |
|
306 | 306 | # following fields are built from fctxs. they exist for perf reason |
|
307 | 307 | self.contents = [f.data() for f in fctxs] |
|
308 | 308 | self.contentlines = pycompat.maplist(mdiff.splitnewlines, self.contents) |
|
309 | 309 | self.linelog = self._buildlinelog() |
|
310 | 310 | if self.ui.debugflag: |
|
311 | 311 | assert self._checkoutlinelog() == self.contents |
|
312 | 312 | |
|
313 | 313 | # following fields will be filled later |
|
314 | 314 | self.chunkstats = [0, 0] # [adopted, total : int] |
|
315 | 315 | self.targetlines = [] # [str] |
|
316 | 316 | self.fixups = [] # [(linelog rev, a1, a2, b1, b2)] |
|
317 | 317 | self.finalcontents = [] # [str] |
|
318 | 318 | self.ctxaffected = set() |
|
319 | 319 | |
|
320 | 320 | def diffwith(self, targetfctx, fm=None): |
|
321 | 321 | """calculate fixups needed by examining the differences between |
|
322 | 322 | self.fctxs[-1] and targetfctx, chunk by chunk. |
|
323 | 323 | |
|
324 | 324 | targetfctx is the target state we move towards. we may or may not be |
|
325 | 325 | able to get there because not all modified chunks can be amended into |
|
326 | 326 | a non-public fctx unambiguously. |
|
327 | 327 | |
|
328 | 328 | call this only once, before apply(). |
|
329 | 329 | |
|
330 | 330 | update self.fixups, self.chunkstats, and self.targetlines. |
|
331 | 331 | """ |
|
332 | 332 | a = self.contents[-1] |
|
333 | 333 | alines = self.contentlines[-1] |
|
334 | 334 | b = targetfctx.data() |
|
335 | 335 | blines = mdiff.splitnewlines(b) |
|
336 | 336 | self.targetlines = blines |
|
337 | 337 | |
|
338 | 338 | self.linelog.annotate(self.linelog.maxrev) |
|
339 | 339 | annotated = self.linelog.annotateresult # [(linelog rev, linenum)] |
|
340 | 340 | assert len(annotated) == len(alines) |
|
341 | 341 | # add a dummy end line to make insertion at the end easier |
|
342 | 342 | if annotated: |
|
343 | 343 | dummyendline = (annotated[-1][0], annotated[-1][1] + 1) |
|
344 | 344 | annotated.append(dummyendline) |
|
345 | 345 | |
|
346 | 346 | # analyse diff blocks |
|
347 | 347 | for chunk in self._alldiffchunks(a, b, alines, blines): |
|
348 | 348 | newfixups = self._analysediffchunk(chunk, annotated) |
|
349 | 349 | self.chunkstats[0] += bool(newfixups) # 1 or 0 |
|
350 | 350 | self.chunkstats[1] += 1 |
|
351 | 351 | self.fixups += newfixups |
|
352 | 352 | if fm is not None: |
|
353 | 353 | self._showchanges(fm, alines, blines, chunk, newfixups) |
|
354 | 354 | |
|
355 | 355 | def apply(self): |
|
356 | 356 | """apply self.fixups. update self.linelog, self.finalcontents. |
|
357 | 357 | |
|
358 | 358 | call this only once, before getfinalcontent(), after diffwith(). |
|
359 | 359 | """ |
|
360 | 360 | # the following is unnecessary, as it's done by "diffwith": |
|
361 | 361 | # self.linelog.annotate(self.linelog.maxrev) |
|
362 | 362 | for rev, a1, a2, b1, b2 in reversed(self.fixups): |
|
363 | 363 | blines = self.targetlines[b1:b2] |
|
364 | 364 | if self.ui.debugflag: |
|
365 | 365 | idx = (max(rev - 1, 0)) // 2 |
|
366 | 366 | self.ui.write( |
|
367 | 367 | _(b'%s: chunk %d:%d -> %d lines\n') |
|
368 | 368 | % (node.short(self.fctxs[idx].node()), a1, a2, len(blines)) |
|
369 | 369 | ) |
|
370 | 370 | self.linelog.replacelines(rev, a1, a2, b1, b2) |
|
371 | 371 | if self.opts.get(b'edit_lines', False): |
|
372 | 372 | self.finalcontents = self._checkoutlinelogwithedits() |
|
373 | 373 | else: |
|
374 | 374 | self.finalcontents = self._checkoutlinelog() |
|
375 | 375 | |
|
376 | 376 | def getfinalcontent(self, fctx): |
|
377 | 377 | """(fctx) -> str. get modified file content for a given filecontext""" |
|
378 | 378 | idx = self.fctxs.index(fctx) |
|
379 | 379 | return self.finalcontents[idx] |
|
380 | 380 | |
|
381 | 381 | def _analysediffchunk(self, chunk, annotated): |
|
382 | 382 | """analyse a different chunk and return new fixups found |
|
383 | 383 | |
|
384 | 384 | return [] if no lines from the chunk can be safely applied. |
|
385 | 385 | |
|
386 | 386 | the chunk (or lines) cannot be safely applied, if, for example: |
|
387 | 387 | - the modified (deleted) lines belong to a public changeset |
|
388 | 388 | (self.fctxs[0]) |
|
389 | 389 | - the chunk is a pure insertion and the adjacent lines (at most 2 |
|
390 | 390 | lines) belong to different non-public changesets, or do not belong |
|
391 | 391 | to any non-public changesets. |
|
392 | 392 | - the chunk is modifying lines from different changesets. |
|
393 | 393 | in this case, if the number of lines deleted equals the number |
|
394 | 394 | of lines added, assume it's a simple 1:1 map (could be wrong). |
|
395 | 395 | otherwise, give up. |
|
396 | 396 | - the chunk is modifying lines from a single non-public changeset, |
|
397 | 397 | but other revisions touch the area as well. i.e. the lines are |
|
398 | 398 | not continuous as seen from the linelog. |
|
399 | 399 | """ |
|
400 | 400 | a1, a2, b1, b2 = chunk |
|
401 | 401 | # find involved indexes from annotate result |
|
402 | 402 | involved = annotated[a1:a2] |
|
403 | 403 | if not involved and annotated: # a1 == a2 and a is not empty |
|
404 | 404 | # pure insertion, check nearby lines. ignore lines belonging |
|
405 | 405 | # to the public (first) changeset (i.e. annotated[i][0] == 1) |
|
406 | 406 | nearbylinenums = {a2, max(0, a1 - 1)} |
|
407 | 407 | involved = [ |
|
408 | 408 | annotated[i] for i in nearbylinenums if annotated[i][0] != 1 |
|
409 | 409 | ] |
|
410 | 410 | involvedrevs = list(set(r for r, l in involved)) |
|
411 | 411 | newfixups = [] |
|
412 | 412 | if len(involvedrevs) == 1 and self._iscontinuous(a1, a2 - 1, True): |
|
413 | 413 | # chunk belongs to a single revision |
|
414 | 414 | rev = involvedrevs[0] |
|
415 | 415 | if rev > 1: |
|
416 | 416 | fixuprev = rev + 1 |
|
417 | 417 | newfixups.append((fixuprev, a1, a2, b1, b2)) |
|
418 | 418 | elif a2 - a1 == b2 - b1 or b1 == b2: |
|
419 | 419 | # 1:1 line mapping, or chunk was deleted |
|
420 | 420 | for i in pycompat.xrange(a1, a2): |
|
421 | 421 | rev, linenum = annotated[i] |
|
422 | 422 | if rev > 1: |
|
423 | 423 | if b1 == b2: # deletion, simply remove that single line |
|
424 | 424 | nb1 = nb2 = 0 |
|
425 | 425 | else: # 1:1 line mapping, change the corresponding rev |
|
426 | 426 | nb1 = b1 + i - a1 |
|
427 | 427 | nb2 = nb1 + 1 |
|
428 | 428 | fixuprev = rev + 1 |
|
429 | 429 | newfixups.append((fixuprev, i, i + 1, nb1, nb2)) |
|
430 | 430 | return self._optimizefixups(newfixups) |
|
431 | 431 | |
|
432 | 432 | @staticmethod |
|
433 | 433 | def _alldiffchunks(a, b, alines, blines): |
|
434 | 434 | """like mdiff.allblocks, but only care about differences""" |
|
435 | 435 | blocks = mdiff.allblocks(a, b, lines1=alines, lines2=blines) |
|
436 | 436 | for chunk, btype in blocks: |
|
437 | 437 | if btype != b'!': |
|
438 | 438 | continue |
|
439 | 439 | yield chunk |
|
440 | 440 | |
|
441 | 441 | def _buildlinelog(self): |
|
442 | 442 | """calculate the initial linelog based on self.content{,line}s. |
|
443 | 443 | this is similar to running a partial "annotate". |
|
444 | 444 | """ |
|
445 | 445 | llog = linelog.linelog() |
|
446 | 446 | a, alines = b'', [] |
|
447 | 447 | for i in pycompat.xrange(len(self.contents)): |
|
448 | 448 | b, blines = self.contents[i], self.contentlines[i] |
|
449 | 449 | llrev = i * 2 + 1 |
|
450 | 450 | chunks = self._alldiffchunks(a, b, alines, blines) |
|
451 | 451 | for a1, a2, b1, b2 in reversed(list(chunks)): |
|
452 | 452 | llog.replacelines(llrev, a1, a2, b1, b2) |
|
453 | 453 | a, alines = b, blines |
|
454 | 454 | return llog |
|
455 | 455 | |
|
456 | 456 | def _checkoutlinelog(self): |
|
457 | 457 | """() -> [str]. check out file contents from linelog""" |
|
458 | 458 | contents = [] |
|
459 | 459 | for i in pycompat.xrange(len(self.contents)): |
|
460 | 460 | rev = (i + 1) * 2 |
|
461 | 461 | self.linelog.annotate(rev) |
|
462 | 462 | content = b''.join(map(self._getline, self.linelog.annotateresult)) |
|
463 | 463 | contents.append(content) |
|
464 | 464 | return contents |
|
465 | 465 | |
|
466 | 466 | def _checkoutlinelogwithedits(self): |
|
467 | 467 | """() -> [str]. prompt all lines for edit""" |
|
468 | 468 | alllines = self.linelog.getalllines() |
|
469 | 469 | # header |
|
470 | 470 | editortext = ( |
|
471 | 471 | _( |
|
472 | 472 | b'HG: editing %s\nHG: "y" means the line to the right ' |
|
473 | 473 | b'exists in the changeset to the top\nHG:\n' |
|
474 | 474 | ) |
|
475 | 475 | % self.fctxs[-1].path() |
|
476 | 476 | ) |
|
477 | 477 | # [(idx, fctx)]. hide the dummy emptyfilecontext |
|
478 | 478 | visiblefctxs = [ |
|
479 | 479 | (i, f) |
|
480 | 480 | for i, f in enumerate(self.fctxs) |
|
481 | 481 | if not isinstance(f, emptyfilecontext) |
|
482 | 482 | ] |
|
483 | 483 | for i, (j, f) in enumerate(visiblefctxs): |
|
484 | 484 | editortext += _(b'HG: %s/%s %s %s\n') % ( |
|
485 | 485 | b'|' * i, |
|
486 | 486 | b'-' * (len(visiblefctxs) - i + 1), |
|
487 | 487 | node.short(f.node()), |
|
488 | 488 | f.description().split(b'\n', 1)[0], |
|
489 | 489 | ) |
|
490 | 490 | editortext += _(b'HG: %s\n') % (b'|' * len(visiblefctxs)) |
|
491 | 491 | # figure out the lifetime of a line, this is relatively inefficient, |
|
492 | 492 | # but probably fine |
|
493 | 493 | lineset = defaultdict(lambda: set()) # {(llrev, linenum): {llrev}} |
|
494 | 494 | for i, f in visiblefctxs: |
|
495 | 495 | self.linelog.annotate((i + 1) * 2) |
|
496 | 496 | for l in self.linelog.annotateresult: |
|
497 | 497 | lineset[l].add(i) |
|
498 | 498 | # append lines |
|
499 | 499 | for l in alllines: |
|
500 | 500 | editortext += b' %s : %s' % ( |
|
501 | 501 | b''.join( |
|
502 | 502 | [ |
|
503 | 503 | (b'y' if i in lineset[l] else b' ') |
|
504 | 504 | for i, _f in visiblefctxs |
|
505 | 505 | ] |
|
506 | 506 | ), |
|
507 | 507 | self._getline(l), |
|
508 | 508 | ) |
|
509 | 509 | # run editor |
|
510 | 510 | editedtext = self.ui.edit(editortext, b'', action=b'absorb') |
|
511 | 511 | if not editedtext: |
|
512 | 512 | raise error.Abort(_(b'empty editor text')) |
|
513 | 513 | # parse edited result |
|
514 | 514 | contents = [b'' for i in self.fctxs] |
|
515 | 515 | leftpadpos = 4 |
|
516 | 516 | colonpos = leftpadpos + len(visiblefctxs) + 1 |
|
517 | 517 | for l in mdiff.splitnewlines(editedtext): |
|
518 | 518 | if l.startswith(b'HG:'): |
|
519 | 519 | continue |
|
520 | 520 | if l[colonpos - 1 : colonpos + 2] != b' : ': |
|
521 | 521 | raise error.Abort(_(b'malformed line: %s') % l) |
|
522 | 522 | linecontent = l[colonpos + 2 :] |
|
523 | 523 | for i, ch in enumerate( |
|
524 | 524 | pycompat.bytestr(l[leftpadpos : colonpos - 1]) |
|
525 | 525 | ): |
|
526 | 526 | if ch == b'y': |
|
527 | 527 | contents[visiblefctxs[i][0]] += linecontent |
|
528 | 528 | # chunkstats is hard to calculate if anything changes, therefore |
|
529 | 529 | # set them to just a simple value (1, 1). |
|
530 | 530 | if editedtext != editortext: |
|
531 | 531 | self.chunkstats = [1, 1] |
|
532 | 532 | return contents |
|
533 | 533 | |
|
534 | 534 | def _getline(self, lineinfo): |
|
535 | 535 | """((rev, linenum)) -> str. convert rev+line number to line content""" |
|
536 | 536 | rev, linenum = lineinfo |
|
537 | 537 | if rev & 1: # odd: original line taken from fctxs |
|
538 | 538 | return self.contentlines[rev // 2][linenum] |
|
539 | 539 | else: # even: fixup line from targetfctx |
|
540 | 540 | return self.targetlines[linenum] |
|
541 | 541 | |
|
542 | 542 | def _iscontinuous(self, a1, a2, closedinterval=False): |
|
543 | 543 | """(a1, a2 : int) -> bool |
|
544 | 544 | |
|
545 | 545 | check if these lines are continuous. i.e. no other insertions or |
|
546 | 546 | deletions (from other revisions) among these lines. |
|
547 | 547 | |
|
548 | 548 | closedinterval decides whether a2 should be included or not. i.e. is |
|
549 | 549 | it [a1, a2), or [a1, a2] ? |
|
550 | 550 | """ |
|
551 | 551 | if a1 >= a2: |
|
552 | 552 | return True |
|
553 | 553 | llog = self.linelog |
|
554 | 554 | offset1 = llog.getoffset(a1) |
|
555 | 555 | offset2 = llog.getoffset(a2) + int(closedinterval) |
|
556 | 556 | linesinbetween = llog.getalllines(offset1, offset2) |
|
557 | 557 | return len(linesinbetween) == a2 - a1 + int(closedinterval) |
|
558 | 558 | |
|
559 | 559 | def _optimizefixups(self, fixups): |
|
560 | 560 | """[(rev, a1, a2, b1, b2)] -> [(rev, a1, a2, b1, b2)]. |
|
561 | 561 | merge adjacent fixups to make them less fragmented. |
|
562 | 562 | """ |
|
563 | 563 | result = [] |
|
564 | 564 | pcurrentchunk = [[-1, -1, -1, -1, -1]] |
|
565 | 565 | |
|
566 | 566 | def pushchunk(): |
|
567 | 567 | if pcurrentchunk[0][0] != -1: |
|
568 | 568 | result.append(tuple(pcurrentchunk[0])) |
|
569 | 569 | |
|
570 | 570 | for i, chunk in enumerate(fixups): |
|
571 | 571 | rev, a1, a2, b1, b2 = chunk |
|
572 | 572 | lastrev = pcurrentchunk[0][0] |
|
573 | 573 | lasta2 = pcurrentchunk[0][2] |
|
574 | 574 | lastb2 = pcurrentchunk[0][4] |
|
575 | 575 | if ( |
|
576 | 576 | a1 == lasta2 |
|
577 | 577 | and b1 == lastb2 |
|
578 | 578 | and rev == lastrev |
|
579 | 579 | and self._iscontinuous(max(a1 - 1, 0), a1) |
|
580 | 580 | ): |
|
581 | 581 | # merge into currentchunk |
|
582 | 582 | pcurrentchunk[0][2] = a2 |
|
583 | 583 | pcurrentchunk[0][4] = b2 |
|
584 | 584 | else: |
|
585 | 585 | pushchunk() |
|
586 | 586 | pcurrentchunk[0] = list(chunk) |
|
587 | 587 | pushchunk() |
|
588 | 588 | return result |
|
589 | 589 | |
|
590 | 590 | def _showchanges(self, fm, alines, blines, chunk, fixups): |
|
591 | 591 | def trim(line): |
|
592 | 592 | if line.endswith(b'\n'): |
|
593 | 593 | line = line[:-1] |
|
594 | 594 | return line |
|
595 | 595 | |
|
596 | 596 | # this is not optimized for perf but _showchanges only gets executed |
|
597 | 597 | # with an extra command-line flag. |
|
598 | 598 | a1, a2, b1, b2 = chunk |
|
599 | 599 | aidxs, bidxs = [0] * (a2 - a1), [0] * (b2 - b1) |
|
600 | 600 | for idx, fa1, fa2, fb1, fb2 in fixups: |
|
601 | 601 | for i in pycompat.xrange(fa1, fa2): |
|
602 | 602 | aidxs[i - a1] = (max(idx, 1) - 1) // 2 |
|
603 | 603 | for i in pycompat.xrange(fb1, fb2): |
|
604 | 604 | bidxs[i - b1] = (max(idx, 1) - 1) // 2 |
|
605 | 605 | |
|
606 | 606 | fm.startitem() |
|
607 | 607 | fm.write( |
|
608 | 608 | b'hunk', |
|
609 | 609 | b' %s\n', |
|
610 | 610 | b'@@ -%d,%d +%d,%d @@' % (a1, a2 - a1, b1, b2 - b1), |
|
611 | 611 | label=b'diff.hunk', |
|
612 | 612 | ) |
|
613 | 613 | fm.data(path=self.path, linetype=b'hunk') |
|
614 | 614 | |
|
615 | 615 | def writeline(idx, diffchar, line, linetype, linelabel): |
|
616 | 616 | fm.startitem() |
|
617 | 617 | node = b'' |
|
618 | 618 | if idx: |
|
619 | 619 | ctx = self.fctxs[idx] |
|
620 | 620 | fm.context(fctx=ctx) |
|
621 | 621 | node = ctx.hex() |
|
622 | 622 | self.ctxaffected.add(ctx.changectx()) |
|
623 | 623 | fm.write(b'node', b'%-7.7s ', node, label=b'absorb.node') |
|
624 | 624 | fm.write( |
|
625 | 625 | b'diffchar ' + linetype, |
|
626 | 626 | b'%s%s\n', |
|
627 | 627 | diffchar, |
|
628 | 628 | line, |
|
629 | 629 | label=linelabel, |
|
630 | 630 | ) |
|
631 | 631 | fm.data(path=self.path, linetype=linetype) |
|
632 | 632 | |
|
633 | 633 | for i in pycompat.xrange(a1, a2): |
|
634 | 634 | writeline( |
|
635 | 635 | aidxs[i - a1], |
|
636 | 636 | b'-', |
|
637 | 637 | trim(alines[i]), |
|
638 | 638 | b'deleted', |
|
639 | 639 | b'diff.deleted', |
|
640 | 640 | ) |
|
641 | 641 | for i in pycompat.xrange(b1, b2): |
|
642 | 642 | writeline( |
|
643 | 643 | bidxs[i - b1], |
|
644 | 644 | b'+', |
|
645 | 645 | trim(blines[i]), |
|
646 | 646 | b'inserted', |
|
647 | 647 | b'diff.inserted', |
|
648 | 648 | ) |
|
649 | 649 | |
|
650 | 650 | |
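The odd/even linelog numbering described in filefixupstate's docstring drives several index calculations above: _buildlinelog assigns original contents to rev i * 2 + 1, _checkoutlinelog checks out rev (i + 1) * 2, and apply() recovers the fctx index with (max(rev - 1, 0)) // 2. A standalone sketch of that arithmetic (plain Python, not part of the extension) may help when reading those methods:

    # Standalone sketch of filefixupstate's linelog numbering scheme.
    def original_llrev(i):
        # linelog rev holding the content of fctxs[i] (see _buildlinelog)
        return i * 2 + 1

    def fixup_llrev(i):
        # linelog rev holding fixups applied on top of fctxs[i];
        # equals the (i + 1) * 2 used by _checkoutlinelog
        return original_llrev(i) + 1

    def fctx_index(llrev):
        # map a linelog rev (odd or even) back into fctxs (see apply())
        return max(llrev - 1, 0) // 2

    for i in range(3):
        assert fctx_index(original_llrev(i)) == fctx_index(fixup_llrev(i)) == i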
|
651 | 651 | class fixupstate(object): |
|
652 | 652 | """state needed to run absorb |
|
653 | 653 | |
|
654 | 654 | internally, it keeps paths and filefixupstates. |
|
655 | 655 | |
|
656 | 656 | a typical use is like filefixupstate's: |
|
657 | 657 | |
|
658 | 658 | 1. call diffwith, to calculate fixups |
|
659 | 659 | 2. (optionally), present fixups to the user, or edit fixups |
|
660 | 660 | 3. call apply, to apply changes to memory |
|
661 | 661 | 4. call commit, to commit changes to hg database |
|
662 | 662 | """ |
|
663 | 663 | |
|
664 | 664 | def __init__(self, stack, ui=None, opts=None): |
|
665 | 665 | """([ctx], ui or None) -> None |
|
666 | 666 | |
|
667 | 667 | stack: should be linear, and sorted by topo order - oldest first. |
|
668 | 668 | all commits in stack are considered mutable. |
|
669 | 669 | """ |
|
670 | 670 | assert stack |
|
671 | 671 | self.ui = ui or nullui() |
|
672 | 672 | self.opts = opts or {} |
|
673 | 673 | self.stack = stack |
|
674 | 674 | self.repo = stack[-1].repo().unfiltered() |
|
675 | 675 | |
|
676 | 676 | # following fields will be filled later |
|
677 | 677 | self.paths = [] # [str] |
|
678 | 678 | self.status = None # ctx.status output |
|
679 | 679 | self.fctxmap = {} # {path: {ctx: fctx}} |
|
680 | 680 | self.fixupmap = {} # {path: filefixupstate} |
|
681 | 681 | self.replacemap = {} # {oldnode: newnode or None} |
|
682 | 682 | self.finalnode = None # head after all fixups |
|
683 | 683 | self.ctxaffected = set() # ctx that will be absorbed into |
|
684 | 684 | |
|
685 | 685 | def diffwith(self, targetctx, match=None, fm=None): |
|
686 | 686 | """diff and prepare fixups. update self.fixupmap, self.paths""" |
|
687 | 687 | # only care about modified files |
|
688 | 688 | self.status = self.stack[-1].status(targetctx, match) |
|
689 | 689 | self.paths = [] |
|
690 | 690 | # but if --edit-lines is used, the user may want to edit files |
|
691 | 691 | # even if they are not modified |
|
692 | 692 | editopt = self.opts.get(b'edit_lines') |
|
693 | 693 | if not self.status.modified and editopt and match: |
|
694 | 694 | interestingpaths = match.files() |
|
695 | 695 | else: |
|
696 | 696 | interestingpaths = self.status.modified |
|
697 | 697 | # prepare the filefixupstate |
|
698 | 698 | seenfctxs = set() |
|
699 | 699 | # sorting is necessary to eliminate ambiguity for the "double move" |
|
700 | 700 | # case: "hg cp A B; hg cp A C; hg rm A", then only "B" can affect "A". |
|
701 | 701 | for path in sorted(interestingpaths): |
|
702 | 702 | self.ui.debug(b'calculating fixups for %s\n' % path) |
|
703 | 703 | targetfctx = targetctx[path] |
|
704 | 704 | fctxs, ctx2fctx = getfilestack(self.stack, path, seenfctxs) |
|
705 | 705 | # ignore symbolic links or binary, or unchanged files |
|
706 | 706 | if any( |
|
707 | 707 | f.islink() or stringutil.binary(f.data()) |
|
708 | 708 | for f in [targetfctx] + fctxs |
|
709 | 709 | if not isinstance(f, emptyfilecontext) |
|
710 | 710 | ): |
|
711 | 711 | continue |
|
712 | 712 | if targetfctx.data() == fctxs[-1].data() and not editopt: |
|
713 | 713 | continue |
|
714 | 714 | seenfctxs.update(fctxs[1:]) |
|
715 | 715 | self.fctxmap[path] = ctx2fctx |
|
716 | 716 | fstate = filefixupstate(fctxs, path, ui=self.ui, opts=self.opts) |
|
717 | 717 | if fm is not None: |
|
718 | 718 | fm.startitem() |
|
719 | 719 | fm.plain(b'showing changes for ') |
|
720 | 720 | fm.write(b'path', b'%s\n', path, label=b'absorb.path') |
|
721 | 721 | fm.data(linetype=b'path') |
|
722 | 722 | fstate.diffwith(targetfctx, fm) |
|
723 | 723 | self.fixupmap[path] = fstate |
|
724 | 724 | self.paths.append(path) |
|
725 | 725 | self.ctxaffected.update(fstate.ctxaffected) |
|
726 | 726 | |
|
727 | 727 | def apply(self): |
|
728 | 728 | """apply fixups to individual filefixupstates""" |
|
729 | 729 | for path, state in pycompat.iteritems(self.fixupmap): |
|
730 | 730 | if self.ui.debugflag: |
|
731 | 731 | self.ui.write(_(b'applying fixups to %s\n') % path) |
|
732 | 732 | state.apply() |
|
733 | 733 | |
|
734 | 734 | @property |
|
735 | 735 | def chunkstats(self): |
|
736 | 736 | """-> {path: chunkstats}. collect chunkstats from filefixupstates""" |
|
737 | 737 | return dict( |
|
738 | 738 | (path, state.chunkstats) |
|
739 | 739 | for path, state in pycompat.iteritems(self.fixupmap) |
|
740 | 740 | ) |
|
741 | 741 | |
|
742 | 742 | def commit(self): |
|
743 | 743 | """commit changes. update self.finalnode, self.replacemap""" |
|
744 | 744 | with self.repo.transaction(b'absorb') as tr: |
|
745 | 745 | self._commitstack() |
|
746 | 746 | self._movebookmarks(tr) |
|
747 | 747 | if self.repo[b'.'].node() in self.replacemap: |
|
748 | 748 | self._moveworkingdirectoryparent() |
|
749 | 749 | self._cleanupoldcommits() |
|
750 | 750 | return self.finalnode |
|
751 | 751 | |
|
752 | 752 | def printchunkstats(self): |
|
753 | 753 | """print things like '1 of 2 chunk(s) applied'""" |
|
754 | 754 | ui = self.ui |
|
755 | 755 | chunkstats = self.chunkstats |
|
756 | 756 | if ui.verbose: |
|
757 | 757 | # chunkstats for each file |
|
758 | 758 | for path, stat in pycompat.iteritems(chunkstats): |
|
759 | 759 | if stat[0]: |
|
760 | 760 | ui.write( |
|
761 | 761 | _(b'%s: %d of %d chunk(s) applied\n') |
|
762 | 762 | % (path, stat[0], stat[1]) |
|
763 | 763 | ) |
|
764 | 764 | elif not ui.quiet: |
|
765 | 765 | # a summary for all files |
|
766 | 766 | stats = chunkstats.values() |
|
767 | 767 | applied, total = (sum(s[i] for s in stats) for i in (0, 1)) |
|
768 | 768 | ui.write(_(b'%d of %d chunk(s) applied\n') % (applied, total)) |
|
769 | 769 | |
|
770 | 770 | def _commitstack(self): |
|
771 | 771 | """make new commits. update self.finalnode, self.replacemap. |
|
772 | 772 | it is split from "commit" to avoid too much indentation. |
|
773 | 773 | """ |
|
774 | 774 | # last node (20-char) committed by us |
|
775 | 775 | lastcommitted = None |
|
776 | 776 | # p1 which overrides the parent of the next commit, "None" means use |
|
777 | 777 | # the original parent unchanged |
|
778 | 778 | nextp1 = None |
|
779 | 779 | for ctx in self.stack: |
|
780 | 780 | memworkingcopy = self._getnewfilecontents(ctx) |
|
781 | 781 | if not memworkingcopy and not lastcommitted: |
|
782 | 782 | # nothing changed, nothing committed |
|
783 | 783 | nextp1 = ctx |
|
784 | 784 | continue |
|
785 | 785 | if self._willbecomenoop(memworkingcopy, ctx, nextp1): |
|
786 | 786 | # changeset is no longer necessary |
|
787 | 787 | self.replacemap[ctx.node()] = None |
|
788 | 788 | msg = _(b'became empty and was dropped') |
|
789 | 789 | else: |
|
790 | 790 | # changeset needs re-commit |
|
791 | 791 | nodestr = self._commitsingle(memworkingcopy, ctx, p1=nextp1) |
|
792 | 792 | lastcommitted = self.repo[nodestr] |
|
793 | 793 | nextp1 = lastcommitted |
|
794 | 794 | self.replacemap[ctx.node()] = lastcommitted.node() |
|
795 | 795 | if memworkingcopy: |
|
796 | 796 | msg = _(b'%d file(s) changed, became %s') % ( |
|
797 | 797 | len(memworkingcopy), |
|
798 | 798 | self._ctx2str(lastcommitted), |
|
799 | 799 | ) |
|
800 | 800 | else: |
|
801 | 801 | msg = _(b'became %s') % self._ctx2str(lastcommitted) |
|
802 | 802 | if self.ui.verbose and msg: |
|
803 | 803 | self.ui.write(_(b'%s: %s\n') % (self._ctx2str(ctx), msg)) |
|
804 | 804 | self.finalnode = lastcommitted and lastcommitted.node() |
|
805 | 805 | |
|
806 | 806 | def _ctx2str(self, ctx): |
|
807 | 807 | if self.ui.debugflag: |
|
808 | 808 | return b'%d:%s' % (ctx.rev(), ctx.hex()) |
|
809 | 809 | else: |
|
810 | 810 | return b'%d:%s' % (ctx.rev(), node.short(ctx.node())) |
|
811 | 811 | |
|
812 | 812 | def _getnewfilecontents(self, ctx): |
|
813 | 813 | """(ctx) -> {path: str} |
|
814 | 814 | |
|
815 | 815 | fetch file contents from filefixupstates. |
|
816 | 816 | return the working copy overrides - files different from ctx. |
|
817 | 817 | """ |
|
818 | 818 | result = {} |
|
819 | 819 | for path in self.paths: |
|
820 | 820 | ctx2fctx = self.fctxmap[path] # {ctx: fctx} |
|
821 | 821 | if ctx not in ctx2fctx: |
|
822 | 822 | continue |
|
823 | 823 | fctx = ctx2fctx[ctx] |
|
824 | 824 | content = fctx.data() |
|
825 | 825 | newcontent = self.fixupmap[path].getfinalcontent(fctx) |
|
826 | 826 | if content != newcontent: |
|
827 | 827 | result[fctx.path()] = newcontent |
|
828 | 828 | return result |
|
829 | 829 | |
|
830 | 830 | def _movebookmarks(self, tr): |
|
831 | 831 | repo = self.repo |
|
832 | 832 | needupdate = [ |
|
833 | 833 | (name, self.replacemap[hsh]) |
|
834 | 834 | for name, hsh in pycompat.iteritems(repo._bookmarks) |
|
835 | 835 | if hsh in self.replacemap |
|
836 | 836 | ] |
|
837 | 837 | changes = [] |
|
838 | 838 | for name, hsh in needupdate: |
|
839 | 839 | if hsh: |
|
840 | 840 | changes.append((name, hsh)) |
|
841 | 841 | if self.ui.verbose: |
|
842 | 842 | self.ui.write( |
|
843 | 843 | _(b'moving bookmark %s to %s\n') % (name, node.hex(hsh)) |
|
844 | 844 | ) |
|
845 | 845 | else: |
|
846 | 846 | changes.append((name, None)) |
|
847 | 847 | if self.ui.verbose: |
|
848 | 848 | self.ui.write(_(b'deleting bookmark %s\n') % name) |
|
849 | 849 | repo._bookmarks.applychanges(repo, tr, changes) |
|
850 | 850 | |
|
851 | 851 | def _moveworkingdirectoryparent(self): |
|
852 | 852 | if not self.finalnode: |
|
853 | 853 | # Find the latest not-{obsoleted,stripped} parent. |
|
854 | 854 | revs = self.repo.revs(b'max(::. - %ln)', self.replacemap.keys()) |
|
855 | 855 | ctx = self.repo[revs.first()] |
|
856 | 856 | self.finalnode = ctx.node() |
|
857 | 857 | else: |
|
858 | 858 | ctx = self.repo[self.finalnode] |
|
859 | 859 | |
|
860 | 860 | dirstate = self.repo.dirstate |
|
861 | 861 | # dirstate.rebuild invalidates fsmonitorstate, causing "hg status" to |
|
862 | 862 | # be slow. in absorb's case, no need to invalidate fsmonitorstate. |
|
863 | 863 | noop = lambda: 0 |
|
864 | 864 | restore = noop |
|
865 | | if util.safehasattr(dirstate, |

| 865 | if util.safehasattr(dirstate, '_fsmonitorstate'): |
|
866 | 866 | bak = dirstate._fsmonitorstate.invalidate |
|
867 | 867 | |
|
868 | 868 | def restore(): |
|
869 | 869 | dirstate._fsmonitorstate.invalidate = bak |
|
870 | 870 | |
|
871 | 871 | dirstate._fsmonitorstate.invalidate = noop |
|
872 | 872 | try: |
|
873 | 873 | with dirstate.parentchange(): |
|
874 | 874 | dirstate.rebuild(ctx.node(), ctx.manifest(), self.paths) |
|
875 | 875 | finally: |
|
876 | 876 | restore() |
|
877 | 877 | |
|
878 | 878 | @staticmethod |
|
879 | 879 | def _willbecomenoop(memworkingcopy, ctx, pctx=None): |
|
880 | 880 | """({path: content}, ctx, ctx) -> bool. test if a commit will be noop |
|
881 | 881 | |
|
882 | 882 | if it will become an empty commit (does not change anything, after the |
|
883 | 883 | memworkingcopy overrides), return True. otherwise return False. |
|
884 | 884 | """ |
|
885 | 885 | if not pctx: |
|
886 | 886 | parents = ctx.parents() |
|
887 | 887 | if len(parents) != 1: |
|
888 | 888 | return False |
|
889 | 889 | pctx = parents[0] |
|
890 | 890 | # ctx changes more files (not a subset of memworkingcopy) |
|
891 | 891 | if not set(ctx.files()).issubset(set(memworkingcopy)): |
|
892 | 892 | return False |
|
893 | 893 | for path, content in pycompat.iteritems(memworkingcopy): |
|
894 | 894 | if path not in pctx or path not in ctx: |
|
895 | 895 | return False |
|
896 | 896 | fctx = ctx[path] |
|
897 | 897 | pfctx = pctx[path] |
|
898 | 898 | if pfctx.flags() != fctx.flags(): |
|
899 | 899 | return False |
|
900 | 900 | if pfctx.data() != content: |
|
901 | 901 | return False |
|
902 | 902 | return True |
|
903 | 903 | |
|
904 | 904 | def _commitsingle(self, memworkingcopy, ctx, p1=None): |
|
905 | 905 | """(ctx, {path: content}, node) -> node. make a single commit |
|
906 | 906 | |
|
907 | 907 | the commit is a clone from ctx, with an (optionally) different p1, and |
|
908 | 908 | different file contents replaced by memworkingcopy. |
|
909 | 909 | """ |
|
910 | 910 | parents = p1 and (p1, node.nullid) |
|
911 | 911 | extra = ctx.extra() |
|
912 | 912 | if self._useobsolete and self.ui.configbool(b'absorb', b'add-noise'): |
|
913 | 913 | extra[b'absorb_source'] = ctx.hex() |
|
914 | 914 | mctx = overlaycontext(memworkingcopy, ctx, parents, extra=extra) |
|
915 | 915 | return mctx.commit() |
|
916 | 916 | |
|
917 | 917 | @util.propertycache |
|
918 | 918 | def _useobsolete(self): |
|
919 | 919 | """() -> bool""" |
|
920 | 920 | return obsolete.isenabled(self.repo, obsolete.createmarkersopt) |
|
921 | 921 | |
|
922 | 922 | def _cleanupoldcommits(self): |
|
923 | 923 | replacements = { |
|
924 | 924 | k: ([v] if v is not None else []) |
|
925 | 925 | for k, v in pycompat.iteritems(self.replacemap) |
|
926 | 926 | } |
|
927 | 927 | if replacements: |
|
928 | 928 | scmutil.cleanupnodes( |
|
929 | 929 | self.repo, replacements, operation=b'absorb', fixphase=True |
|
930 | 930 | ) |
|
931 | 931 | |
|
932 | 932 | |
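fixupstate's docstring lists the diffwith/apply/commit protocol; the complete driver is absorb() further down, which also handles matchers, --interactive and formatter output. The sketch below reduces it to the essential calls and assumes ui and repo objects obtained through Mercurial's normal APIs, with the caller taking the usual wlock/lock pair first; the function name is illustrative only.

    # Reduced sketch of driving fixupstate directly (see absorb() below for
    # the full version with matchers, prompts and formatter output).
    def absorb_working_copy(ui, repo):
        stack = getdraftstack(repo[b'.'], limit=50)  # oldest-first draft stack
        if not stack:
            raise error.Abort(_(b'no mutable changeset to change'))
        state = fixupstate(stack, ui=ui)
        state.diffwith(repo[None])  # 1. compute fixups against the working copy
        state.apply()               # 2. apply them to the in-memory linelogs
        state.commit()              # 3. rewrite the stack in the repository
        state.printchunkstats()
        return state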
|
933 | 933 | def _parsechunk(hunk): |
|
934 | 934 | """(crecord.uihunk or patch.recordhunk) -> (path, (a1, a2, [bline]))""" |
|
935 | 935 | if type(hunk) not in (crecord.uihunk, patch.recordhunk): |
|
936 | 936 | return None, None |
|
937 | 937 | path = hunk.header.filename() |
|
938 | 938 | a1 = hunk.fromline + len(hunk.before) - 1 |
|
939 | 939 | # remove before and after context |
|
940 | 940 | hunk.before = hunk.after = [] |
|
941 | 941 | buf = util.stringio() |
|
942 | 942 | hunk.write(buf) |
|
943 | 943 | patchlines = mdiff.splitnewlines(buf.getvalue()) |
|
944 | 944 | # hunk.prettystr() will update hunk.removed |
|
945 | 945 | a2 = a1 + hunk.removed |
|
946 | 946 | blines = [l[1:] for l in patchlines[1:] if not l.startswith(b'-')] |
|
947 | 947 | return path, (a1, a2, blines) |
|
948 | 948 | |
|
949 | 949 | |
|
950 | 950 | def overlaydiffcontext(ctx, chunks): |
|
951 | 951 | """(ctx, [crecord.uihunk]) -> memctx |
|
952 | 952 | |
|
953 | 953 | return a memctx with some [1] patches (chunks) applied to ctx. |
|
954 | 954 | [1]: modifications are handled. renames, mode changes, etc. are ignored. |
|
955 | 955 | """ |
|
956 | 956 | # sadly the applying-patch logic is hardly reusable, and messy: |
|
957 | 957 | # 1. the core logic "_applydiff" is too heavy - it writes .rej files, it |
|
958 | 958 | # needs a file stream of a patch and will re-parse it, while we have |
|
959 | 959 | # structured hunk objects at hand. |
|
960 | 960 | # 2. a lot of different implementations about "chunk" (patch.hunk, |
|
961 | 961 | # patch.recordhunk, crecord.uihunk) |
|
962 | 962 | # as we only care about applying changes to modified files, no mode |
|
963 | 963 | # change, no binary diff, and no renames, it's probably okay to |
|
964 | 964 | # re-invent the logic using much simpler code here. |
|
965 | 965 | memworkingcopy = {} # {path: content} |
|
966 | 966 | patchmap = defaultdict(lambda: []) # {path: [(a1, a2, [bline])]} |
|
967 | 967 | for path, info in map(_parsechunk, chunks): |
|
968 | 968 | if not path or not info: |
|
969 | 969 | continue |
|
970 | 970 | patchmap[path].append(info) |
|
971 | 971 | for path, patches in pycompat.iteritems(patchmap): |
|
972 | 972 | if path not in ctx or not patches: |
|
973 | 973 | continue |
|
974 | 974 | patches.sort(reverse=True) |
|
975 | 975 | lines = mdiff.splitnewlines(ctx[path].data()) |
|
976 | 976 | for a1, a2, blines in patches: |
|
977 | 977 | lines[a1:a2] = blines |
|
978 | 978 | memworkingcopy[path] = b''.join(lines) |
|
979 | 979 | return overlaycontext(memworkingcopy, ctx) |
|
980 | 980 | |
|
981 | 981 | |
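The comment block in overlaydiffcontext() above explains why patch application is re-implemented as a plain line splice; the patches.sort(reverse=True) call is what keeps earlier hunk offsets valid while splicing. A standalone illustration of that detail (not part of the extension):

    # Applying hunks bottom-up means the earlier (smaller) offsets are still
    # valid after each splice, exactly as overlaydiffcontext() does above.
    lines = [b'a\n', b'b\n', b'c\n', b'd\n']
    patches = [(1, 2, [b'B\n']), (3, 4, [b'D1\n', b'D2\n'])]  # (a1, a2, blines)
    for a1, a2, blines in sorted(patches, reverse=True):
        lines[a1:a2] = blines
    assert b''.join(lines) == b'a\nB\nc\nD1\nD2\n'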
|
982 | 982 | def absorb(ui, repo, stack=None, targetctx=None, pats=None, opts=None): |
|
983 | 983 | """pick fixup chunks from targetctx, apply them to stack. |
|
984 | 984 | |
|
985 | 985 | if targetctx is None, the working copy context will be used. |
|
986 | 986 | if stack is None, the current draft stack will be used. |
|
987 | 987 | return fixupstate. |
|
988 | 988 | """ |
|
989 | 989 | if stack is None: |
|
990 | 990 | limit = ui.configint(b'absorb', b'max-stack-size') |
|
991 | 991 | headctx = repo[b'.'] |
|
992 | 992 | if len(headctx.parents()) > 1: |
|
993 | 993 | raise error.Abort(_(b'cannot absorb into a merge')) |
|
994 | 994 | stack = getdraftstack(headctx, limit) |
|
995 | 995 | if limit and len(stack) >= limit: |
|
996 | 996 | ui.warn( |
|
997 | 997 | _( |
|
998 | 998 | b'absorb: only the recent %d changesets will ' |
|
999 | 999 | b'be analysed\n' |
|
1000 | 1000 | ) |
|
1001 | 1001 | % limit |
|
1002 | 1002 | ) |
|
1003 | 1003 | if not stack: |
|
1004 | 1004 | raise error.Abort(_(b'no mutable changeset to change')) |
|
1005 | 1005 | if targetctx is None: # default to working copy |
|
1006 | 1006 | targetctx = repo[None] |
|
1007 | 1007 | if pats is None: |
|
1008 | 1008 | pats = () |
|
1009 | 1009 | if opts is None: |
|
1010 | 1010 | opts = {} |
|
1011 | 1011 | state = fixupstate(stack, ui=ui, opts=opts) |
|
1012 | 1012 | matcher = scmutil.match(targetctx, pats, opts) |
|
1013 | 1013 | if opts.get(b'interactive'): |
|
1014 | 1014 | diff = patch.diff(repo, stack[-1].node(), targetctx.node(), matcher) |
|
1015 | 1015 | origchunks = patch.parsepatch(diff) |
|
1016 | 1016 | chunks = cmdutil.recordfilter(ui, origchunks, matcher)[0] |
|
1017 | 1017 | targetctx = overlaydiffcontext(stack[-1], chunks) |
|
1018 | 1018 | fm = None |
|
1019 | 1019 | if opts.get(b'print_changes') or not opts.get(b'apply_changes'): |
|
1020 | 1020 | fm = ui.formatter(b'absorb', opts) |
|
1021 | 1021 | state.diffwith(targetctx, matcher, fm) |
|
1022 | 1022 | if fm is not None: |
|
1023 | 1023 | fm.startitem() |
|
1024 | 1024 | fm.write( |
|
1025 | 1025 | b"count", b"\n%d changesets affected\n", len(state.ctxaffected) |
|
1026 | 1026 | ) |
|
1027 | 1027 | fm.data(linetype=b'summary') |
|
1028 | 1028 | for ctx in reversed(stack): |
|
1029 | 1029 | if ctx not in state.ctxaffected: |
|
1030 | 1030 | continue |
|
1031 | 1031 | fm.startitem() |
|
1032 | 1032 | fm.context(ctx=ctx) |
|
1033 | 1033 | fm.data(linetype=b'changeset') |
|
1034 | 1034 | fm.write(b'node', b'%-7.7s ', ctx.hex(), label=b'absorb.node') |
|
1035 | 1035 | descfirstline = ctx.description().splitlines()[0] |
|
1036 | 1036 | fm.write( |
|
1037 | 1037 | b'descfirstline', |
|
1038 | 1038 | b'%s\n', |
|
1039 | 1039 | descfirstline, |
|
1040 | 1040 | label=b'absorb.description', |
|
1041 | 1041 | ) |
|
1042 | 1042 | fm.end() |
|
1043 | 1043 | if not opts.get(b'dry_run'): |
|
1044 | 1044 | if ( |
|
1045 | 1045 | not opts.get(b'apply_changes') |
|
1046 | 1046 | and state.ctxaffected |
|
1047 | 1047 | and ui.promptchoice( |
|
1048 | 1048 | b"apply changes (yn)? $$ &Yes $$ &No", default=1 |
|
1049 | 1049 | ) |
|
1050 | 1050 | ): |
|
1051 | 1051 | raise error.Abort(_(b'absorb cancelled\n')) |
|
1052 | 1052 | |
|
1053 | 1053 | state.apply() |
|
1054 | 1054 | if state.commit(): |
|
1055 | 1055 | state.printchunkstats() |
|
1056 | 1056 | elif not ui.quiet: |
|
1057 | 1057 | ui.write(_(b'nothing applied\n')) |
|
1058 | 1058 | return state |
|
1059 | 1059 | |
|
1060 | 1060 | |
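absorb() above can also be invoked programmatically. A hedged sketch of a non-interactive call using the byte-string option keys the function consults (apply_changes, print_changes, dry_run); the wrapper name is illustrative, and the supported entry point remains the hg absorb command registered below.

    # Sketch: programmatic, non-interactive absorb run.  Mirrors absorbcmd()
    # below, which additionally calls cmdutil.checkunfinished().
    def run_absorb_quietly(ui, repo):
        opts = {b'apply_changes': True, b'print_changes': False,
                b'dry_run': False}
        with repo.wlock(), repo.lock():
            state = absorb(ui, repo, pats=(), opts=opts)
        # number of chunks actually absorbed, summed over all files
        return sum(s[0] for s in state.chunkstats.values())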
|
1061 | 1061 | @command( |
|
1062 | 1062 | b'absorb', |
|
1063 | 1063 | [ |
|
1064 | 1064 | ( |
|
1065 | 1065 | b'a', |
|
1066 | 1066 | b'apply-changes', |
|
1067 | 1067 | None, |
|
1068 | 1068 | _(b'apply changes without prompting for confirmation'), |
|
1069 | 1069 | ), |
|
1070 | 1070 | ( |
|
1071 | 1071 | b'p', |
|
1072 | 1072 | b'print-changes', |
|
1073 | 1073 | None, |
|
1074 | 1074 | _(b'always print which changesets are modified by which changes'), |
|
1075 | 1075 | ), |
|
1076 | 1076 | ( |
|
1077 | 1077 | b'i', |
|
1078 | 1078 | b'interactive', |
|
1079 | 1079 | None, |
|
1080 | 1080 | _(b'interactively select which chunks to apply (EXPERIMENTAL)'), |
|
1081 | 1081 | ), |
|
1082 | 1082 | ( |
|
1083 | 1083 | b'e', |
|
1084 | 1084 | b'edit-lines', |
|
1085 | 1085 | None, |
|
1086 | 1086 | _( |
|
1087 | 1087 | b'edit what lines belong to which changesets before commit ' |
|
1088 | 1088 | b'(EXPERIMENTAL)' |
|
1089 | 1089 | ), |
|
1090 | 1090 | ), |
|
1091 | 1091 | ] |
|
1092 | 1092 | + commands.dryrunopts |
|
1093 | 1093 | + commands.templateopts |
|
1094 | 1094 | + commands.walkopts, |
|
1095 | 1095 | _(b'hg absorb [OPTION] [FILE]...'), |
|
1096 | 1096 | helpcategory=command.CATEGORY_COMMITTING, |
|
1097 | 1097 | helpbasic=True, |
|
1098 | 1098 | ) |
|
1099 | 1099 | def absorbcmd(ui, repo, *pats, **opts): |
|
1100 | 1100 | """incorporate corrections into the stack of draft changesets |
|
1101 | 1101 | |
|
1102 | 1102 | absorb analyzes each change in your working directory and attempts to |
|
1103 | 1103 | amend the changed lines into the changesets in your stack that first |
|
1104 | 1104 | introduced those lines. |
|
1105 | 1105 | |
|
1106 | 1106 | If absorb cannot find an unambiguous changeset to amend for a change, |
|
1107 | 1107 | that change will be left in the working directory, untouched. It can be |
|
1108 | 1108 | observed by :hg:`status` or :hg:`diff` afterwards. In other words, |
|
1109 | 1109 | absorb does not write to the working directory. |
|
1110 | 1110 | |
|
1111 | 1111 | Changesets outside the revset `::. and not public() and not merge()` will |
|
1112 | 1112 | not be changed. |
|
1113 | 1113 | |
|
1114 | 1114 | Changesets that become empty after applying the changes will be deleted. |
|
1115 | 1115 | |
|
1116 | 1116 | By default, absorb will show what it plans to do and prompt for |
|
1117 | 1117 | confirmation. If you are confident that the changes will be absorbed |
|
1118 | 1118 | to the correct place, run :hg:`absorb -a` to apply the changes |
|
1119 | 1119 | immediately. |
|
1120 | 1120 | |
|
1121 | 1121 | Returns 0 on success, 1 if all chunks were ignored and nothing amended. |
|
1122 | 1122 | """ |
|
1123 | 1123 | opts = pycompat.byteskwargs(opts) |
|
1124 | 1124 | |
|
1125 | 1125 | with repo.wlock(), repo.lock(): |
|
1126 | 1126 | if not opts[b'dry_run']: |
|
1127 | 1127 | cmdutil.checkunfinished(repo) |
|
1128 | 1128 | |
|
1129 | 1129 | state = absorb(ui, repo, pats=pats, opts=opts) |
|
1130 | 1130 | if sum(s[0] for s in state.chunkstats.values()) == 0: |
|
1131 | 1131 | return 1 |
@@ -1,1215 +1,1215 b''
|
1 | 1 | # bugzilla.py - bugzilla integration for mercurial |
|
2 | 2 | # |
|
3 | 3 | # Copyright 2006 Vadim Gelfer <vadim.gelfer@gmail.com> |
|
4 | 4 | # Copyright 2011-4 Jim Hague <jim.hague@acm.org> |
|
5 | 5 | # |
|
6 | 6 | # This software may be used and distributed according to the terms of the |
|
7 | 7 | # GNU General Public License version 2 or any later version. |
|
8 | 8 | |
|
9 | 9 | '''hooks for integrating with the Bugzilla bug tracker |
|
10 | 10 | |
|
11 | 11 | This hook extension adds comments on bugs in Bugzilla when changesets |
|
12 | 12 | that refer to bugs by Bugzilla ID are seen. The comment is formatted using |
|
13 | 13 | the Mercurial template mechanism. |
|
14 | 14 | |
|
15 | 15 | The bug references can optionally include an update for Bugzilla of the |
|
16 | 16 | hours spent working on the bug. Bugs can also be marked fixed. |
|
17 | 17 | |
|
18 | 18 | Four basic modes of access to Bugzilla are provided: |
|
19 | 19 | |
|
20 | 20 | 1. Access via the Bugzilla REST-API. Requires bugzilla 5.0 or later. |
|
21 | 21 | |
|
22 | 22 | 2. Access via the Bugzilla XMLRPC interface. Requires Bugzilla 3.4 or later. |
|
23 | 23 | |
|
24 | 24 | 3. Check data via the Bugzilla XMLRPC interface and submit bug change |
|
25 | 25 | via email to Bugzilla email interface. Requires Bugzilla 3.4 or later. |
|
26 | 26 | |
|
27 | 27 | 4. Writing directly to the Bugzilla database. Only Bugzilla installations |
|
28 | 28 | using MySQL are supported. Requires Python MySQLdb. |
|
29 | 29 | |
|
30 | 30 | Writing directly to the database is susceptible to schema changes, and |
|
31 | 31 | relies on a Bugzilla contrib script to send out bug change |
|
32 | 32 | notification emails. This script runs as the user running Mercurial, |
|
33 | 33 | must be run on the host with the Bugzilla install, and requires |
|
34 | 34 | permission to read Bugzilla configuration details and the necessary |
|
35 | 35 | MySQL user and password to have full access rights to the Bugzilla |
|
36 | 36 | database. For these reasons this access mode is now considered |
|
37 | 37 | deprecated, and will not be updated for new Bugzilla versions going |
|
38 | 38 | forward. Only adding comments is supported in this access mode. |
|
39 | 39 | |
|
40 | 40 | Access via XMLRPC needs a Bugzilla username and password to be specified |
|
41 | 41 | in the configuration. Comments are added under that username. Since the |
|
42 | 42 | configuration must be readable by all Mercurial users, it is recommended |
|
43 | 43 | that the rights of that user are restricted in Bugzilla to the minimum |
|
44 | 44 | necessary to add comments. Marking bugs fixed requires Bugzilla 4.0 and later. |
|
45 | 45 | |
|
46 | 46 | Access via XMLRPC/email uses XMLRPC to query Bugzilla, but sends |
|
47 | 47 | email to the Bugzilla email interface to submit comments to bugs. |
|
48 | 48 | The From: address in the email is set to the email address of the Mercurial |
|
49 | 49 | user, so the comment appears to come from the Mercurial user. In the event |
|
50 | 50 | that the Mercurial user email is not recognized by Bugzilla as a Bugzilla |
|
51 | 51 | user, the email associated with the Bugzilla username used to log into |
|
52 | 52 | Bugzilla is used instead as the source of the comment. Marking bugs fixed |
|
53 | 53 | works on all supported Bugzilla versions. |
|
54 | 54 | |
|
55 | 55 | Access via the REST-API needs either a Bugzilla username and password |
|
56 | 56 | or an apikey specified in the configuration. Comments are made under |
|
57 | 57 | the given username or the user associated with the apikey in Bugzilla. |
|
58 | 58 | |
|
59 | 59 | Configuration items common to all access modes: |
|
60 | 60 | |
|
61 | 61 | bugzilla.version |
|
62 | 62 | The access type to use. Values recognized are: |
|
63 | 63 | |
|
64 | 64 | :``restapi``: Bugzilla REST-API, Bugzilla 5.0 and later. |
|
65 | 65 | :``xmlrpc``: Bugzilla XMLRPC interface. |
|
66 | 66 | :``xmlrpc+email``: Bugzilla XMLRPC and email interfaces. |
|
67 | 67 | :``3.0``: MySQL access, Bugzilla 3.0 and later. |
|
68 | 68 | :``2.18``: MySQL access, Bugzilla 2.18 and up to but not |
|
69 | 69 | including 3.0. |
|
70 | 70 | :``2.16``: MySQL access, Bugzilla 2.16 and up to but not |
|
71 | 71 | including 2.18. |
|
72 | 72 | |
|
73 | 73 | bugzilla.regexp |
|
74 | 74 | Regular expression to match bug IDs for update in changeset commit message. |
|
75 | 75 | It must contain one "()" named group ``<ids>`` containing the bug |
|
76 | 76 | IDs separated by non-digit characters. It may also contain |
|
77 | 77 | a named group ``<hours>`` with a floating-point number giving the |
|
78 | 78 | hours worked on the bug. If no named groups are present, the first |
|
79 | 79 | "()" group is assumed to contain the bug IDs, and work time is not |
|
80 | 80 | updated. The default expression matches ``Bug 1234``, ``Bug no. 1234``, |
|
81 | 81 | ``Bug number 1234``, ``Bugs 1234,5678``, ``Bug 1234 and 5678`` and |
|
82 | 82 | variations thereof, followed by an hours number prefixed by ``h`` or |
|
83 | 83 | ``hours``, e.g. ``hours 1.5``. Matching is case insensitive. |
|
84 | 84 | |
|
85 | 85 | bugzilla.fixregexp |
|
86 | 86 | Regular expression to match bug IDs for marking fixed in changeset |
|
87 | 87 | commit message. This must contain a "()" named group ``<ids>` containing |
|
88 | 88 | the bug IDs separated by non-digit characters. It may also contain |
|
89 | 89 | a named group ``<hours>`` with a floating-point number giving the |
|
90 | 90 | hours worked on the bug. If no named groups are present, the first |
|
91 | 91 | "()" group is assumed to contain the bug IDs, and work time is not |
|
92 | 92 | updated. The default expression matches ``Fixes 1234``, ``Fixes bug 1234``, |
|
93 | 93 | ``Fixes bugs 1234,5678``, ``Fixes 1234 and 5678`` and |
|
94 | 94 | variations thereof, followed by an hours number prefixed by ``h`` or |
|
95 | 95 | ``hours``, e.g. ``hours 1.5``. Matching is case insensitive. |
|
96 | 96 | |
|
97 | 97 | bugzilla.fixstatus |
|
98 | 98 | The status to set a bug to when marking fixed. Default ``RESOLVED``. |
|
99 | 99 | |
|
100 | 100 | bugzilla.fixresolution |
|
101 | 101 | The resolution to set a bug to when marking fixed. Default ``FIXED``. |
|
102 | 102 | |
|
103 | 103 | bugzilla.style |
|
104 | 104 | The style file to use when formatting comments. |
|
105 | 105 | |
|
106 | 106 | bugzilla.template |
|
107 | 107 | Template to use when formatting comments. Overrides style if |
|
108 | 108 | specified. In addition to the usual Mercurial keywords, the |
|
109 | 109 | extension specifies: |
|
110 | 110 | |
|
111 | 111 | :``{bug}``: The Bugzilla bug ID. |
|
112 | 112 | :``{root}``: The full pathname of the Mercurial repository. |
|
113 | 113 | :``{webroot}``: Stripped pathname of the Mercurial repository. |
|
114 | 114 | :``{hgweb}``: Base URL for browsing Mercurial repositories. |
|
115 | 115 | |
|
116 | 116 | Default ``changeset {node|short} in repo {root} refers to bug |
|
117 | 117 | {bug}.\\ndetails:\\n\\t{desc|tabindent}`` |
|
118 | 118 | |
|
119 | 119 | bugzilla.strip |
|
120 | 120 | The number of path separator characters to strip from the front of |
|
121 | 121 | the Mercurial repository path (``{root}`` in templates) to produce |
|
122 | 122 | ``{webroot}``. For example, a repository with ``{root}`` |
|
123 | 123 | ``/var/local/my-project`` with a strip of 2 gives a value for |
|
124 | 124 | ``{webroot}`` of ``my-project``. Default 0. |
|
125 | 125 | |
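  A minimal sketch of the stripping, mirroring the ``webroot()`` helper
  defined further down in this file; the path and strip count are taken
  from the example configurations below::

    def webroot(root, strip):
        # drop one leading path component per separator stripped
        for _ in range(strip):
            c = root.find('/')
            if c == -1:
                break
            root = root[c + 1:]
        return root

    print(webroot('/var/local/hg/repos/repository-name', 5))
    # repository-name
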
|
126 | 126 | web.baseurl |
|
127 | 127 | Base URL for browsing Mercurial repositories. Referenced from |
|
128 | 128 | templates as ``{hgweb}``. |
|
129 | 129 | |
|
130 | 130 | Configuration items common to XMLRPC+email and MySQL access modes: |
|
131 | 131 | |
|
132 | 132 | bugzilla.usermap |
|
133 | 133 | Path of file containing Mercurial committer email to Bugzilla user email |
|
134 | 134 | mappings. If specified, the file should contain one mapping per |
|
135 | 135 | line:: |
|
136 | 136 | |
|
137 | 137 | committer = Bugzilla user |
|
138 | 138 | |
|
139 | 139 | See also the ``[usermap]`` section. |
|
140 | 140 | |
|
141 | 141 | The ``[usermap]`` section is used to specify mappings of Mercurial |
|
142 | 142 | committer email to Bugzilla user email. See also ``bugzilla.usermap``. |
|
143 | 143 | Contains entries of the form ``committer = Bugzilla user``. |
|
144 | 144 | |
|
145 | 145 | XMLRPC and REST-API access mode configuration: |
|
146 | 146 | |
|
147 | 147 | bugzilla.bzurl |
|
148 | 148 | The base URL for the Bugzilla installation. |
|
149 | 149 | Default ``http://localhost/bugzilla``. |
|
150 | 150 | |
|
151 | 151 | bugzilla.user |
|
152 | 152 | The username to use to log into Bugzilla via XMLRPC. Default |
|
153 | 153 | ``bugs``. |
|
154 | 154 | |
|
155 | 155 | bugzilla.password |
|
156 | 156 | The password for Bugzilla login. |
|
157 | 157 | |
|
158 | 158 | REST-API access mode uses the options listed above as well as: |
|
159 | 159 | |
|
160 | 160 | bugzilla.apikey |
|
161 | 161 | An apikey generated on the Bugzilla instance for api access. |
|
162 | 162 | Using an apikey removes the need to store the user and password |
|
163 | 163 | options. |
|
164 | 164 | |
|
165 | 165 | XMLRPC+email access mode uses the XMLRPC access mode configuration items, |
|
166 | 166 | and also: |
|
167 | 167 | |
|
168 | 168 | bugzilla.bzemail |
|
169 | 169 | The Bugzilla email address. |
|
170 | 170 | |
|
171 | 171 | In addition, the Mercurial email settings must be configured. See the |
|
172 | 172 | documentation in hgrc(5), sections ``[email]`` and ``[smtp]``. |
|
173 | 173 | |
|
174 | 174 | MySQL access mode configuration: |
|
175 | 175 | |
|
176 | 176 | bugzilla.host |
|
177 | 177 | Hostname of the MySQL server holding the Bugzilla database. |
|
178 | 178 | Default ``localhost``. |
|
179 | 179 | |
|
180 | 180 | bugzilla.db |
|
181 | 181 | Name of the Bugzilla database in MySQL. Default ``bugs``. |
|
182 | 182 | |
|
183 | 183 | bugzilla.user |
|
184 | 184 | Username to use to access MySQL server. Default ``bugs``. |
|
185 | 185 | |
|
186 | 186 | bugzilla.password |
|
187 | 187 | Password to use to access MySQL server. |
|
188 | 188 | |
|
189 | 189 | bugzilla.timeout |
|
190 | 190 | Database connection timeout (seconds). Default 5. |
|
191 | 191 | |
|
192 | 192 | bugzilla.bzuser |
|
193 | 193 | Fallback Bugzilla user name to record comments with, if changeset |
|
194 | 194 | committer cannot be found as a Bugzilla user. |
|
195 | 195 | |
|
196 | 196 | bugzilla.bzdir |
|
197 | 197 | Bugzilla install directory. Used by default notify. Default |
|
198 | 198 | ``/var/www/html/bugzilla``. |
|
199 | 199 | |
|
200 | 200 | bugzilla.notify |
|
201 | 201 | The command to run to get Bugzilla to send bug change notification |
|
202 | 202 | emails. Substitutes from a map with 3 keys, ``bzdir``, ``id`` (bug |
|
203 | 203 | id) and ``user`` (committer bugzilla email). Default depends on |
|
204 | 204 | version; from 2.18 it is "cd %(bzdir)s && perl -T |
|
205 | 205 | contrib/sendbugmail.pl %(id)s %(user)s". |
|
206 | 206 | |
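  As an illustration of the substitution only (the values are invented),
  the configured command is expanded with ordinary ``%`` mapping
  formatting, just as the MySQL access class does further down::

    cmdfmt = 'cd %(bzdir)s && perl -T contrib/sendbugmail.pl %(id)s %(user)s'
    print(cmdfmt % {'bzdir': '/var/www/html/bugzilla',
                    'id': 1234,
                    'user': 'committer@example.com'})
    # cd /var/www/html/bugzilla && perl -T contrib/sendbugmail.pl 1234 committer@example.com
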
|
207 | 207 | Activating the extension:: |
|
208 | 208 | |
|
209 | 209 | [extensions] |
|
210 | 210 | bugzilla = |
|
211 | 211 | |
|
212 | 212 | [hooks] |
|
213 | 213 | # run bugzilla hook on every change pulled or pushed in here |
|
214 | 214 | incoming.bugzilla = python:hgext.bugzilla.hook |
|
215 | 215 | |
|
216 | 216 | Example configurations: |
|
217 | 217 | |
|
218 | 218 | XMLRPC example configuration. This uses the Bugzilla at |
|
219 | 219 | ``http://my-project.org/bugzilla``, logging in as user |
|
220 | 220 | ``bugmail@my-project.org`` with password ``plugh``. It is used with a |
|
221 | 221 | collection of Mercurial repositories in ``/var/local/hg/repos/``, |
|
222 | 222 | with a web interface at ``http://my-project.org/hg``. :: |
|
223 | 223 | |
|
224 | 224 | [bugzilla] |
|
225 | 225 | bzurl=http://my-project.org/bugzilla |
|
226 | 226 | user=bugmail@my-project.org |
|
227 | 227 | password=plugh |
|
228 | 228 | version=xmlrpc |
|
229 | 229 | template=Changeset {node|short} in {root|basename}. |
|
230 | 230 | {hgweb}/{webroot}/rev/{node|short}\\n |
|
231 | 231 | {desc}\\n |
|
232 | 232 | strip=5 |
|
233 | 233 | |
|
234 | 234 | [web] |
|
235 | 235 | baseurl=http://my-project.org/hg |
|
236 | 236 | |
|
237 | 237 | XMLRPC+email example configuration. This uses the Bugzilla at |
|
238 | 238 | ``http://my-project.org/bugzilla``, logging in as user |
|
239 | 239 | ``bugmail@my-project.org`` with password ``plugh``. It is used with a |
|
240 | 240 | collection of Mercurial repositories in ``/var/local/hg/repos/``, |
|
241 | 241 | with a web interface at ``http://my-project.org/hg``. Bug comments |
|
242 | 242 | are sent to the Bugzilla email address |
|
243 | 243 | ``bugzilla@my-project.org``. :: |
|
244 | 244 | |
|
245 | 245 | [bugzilla] |
|
246 | 246 | bzurl=http://my-project.org/bugzilla |
|
247 | 247 | user=bugmail@my-project.org |
|
248 | 248 | password=plugh |
|
249 | 249 | version=xmlrpc+email |
|
250 | 250 | bzemail=bugzilla@my-project.org |
|
251 | 251 | template=Changeset {node|short} in {root|basename}. |
|
252 | 252 | {hgweb}/{webroot}/rev/{node|short}\\n |
|
253 | 253 | {desc}\\n |
|
254 | 254 | strip=5 |
|
255 | 255 | |
|
256 | 256 | [web] |
|
257 | 257 | baseurl=http://my-project.org/hg |
|
258 | 258 | |
|
259 | 259 | [usermap] |
|
260 | 260 | user@emaildomain.com=user.name@bugzilladomain.com |
|
261 | 261 | |
|
262 | 262 | MySQL example configuration. This has a local Bugzilla 3.2 installation |
|
263 | 263 | in ``/opt/bugzilla-3.2``. The MySQL database is on ``localhost``, |
|
264 | 264 | the Bugzilla database name is ``bugs`` and MySQL is |
|
265 | 265 | accessed with MySQL username ``bugs`` password ``XYZZY``. It is used |
|
266 | 266 | with a collection of Mercurial repositories in ``/var/local/hg/repos/``, |
|
267 | 267 | with a web interface at ``http://my-project.org/hg``. :: |
|
268 | 268 | |
|
269 | 269 | [bugzilla] |
|
270 | 270 | host=localhost |
|
271 | 271 | password=XYZZY |
|
272 | 272 | version=3.0 |
|
273 | 273 | bzuser=unknown@domain.com |
|
274 | 274 | bzdir=/opt/bugzilla-3.2 |
|
275 | 275 | template=Changeset {node|short} in {root|basename}. |
|
276 | 276 | {hgweb}/{webroot}/rev/{node|short}\\n |
|
277 | 277 | {desc}\\n |
|
278 | 278 | strip=5 |
|
279 | 279 | |
|
280 | 280 | [web] |
|
281 | 281 | baseurl=http://my-project.org/hg |
|
282 | 282 | |
|
283 | 283 | [usermap] |
|
284 | 284 | user@emaildomain.com=user.name@bugzilladomain.com |
|
285 | 285 | |
|
286 | 286 | All the above add a comment to the Bugzilla bug record of the form:: |
|
287 | 287 | |
|
288 | 288 | Changeset 3b16791d6642 in repository-name. |
|
289 | 289 | http://my-project.org/hg/repository-name/rev/3b16791d6642 |
|
290 | 290 | |
|
291 | 291 | Changeset commit comment. Bug 1234. |
|
292 | 292 | ''' |
|
293 | 293 | |
|
294 | 294 | from __future__ import absolute_import |
|
295 | 295 | |
|
296 | 296 | import json |
|
297 | 297 | import re |
|
298 | 298 | import time |
|
299 | 299 | |
|
300 | 300 | from mercurial.i18n import _ |
|
301 | 301 | from mercurial.node import short |
|
302 | 302 | from mercurial import ( |
|
303 | 303 | error, |
|
304 | 304 | logcmdutil, |
|
305 | 305 | mail, |
|
306 | 306 | pycompat, |
|
307 | 307 | registrar, |
|
308 | 308 | url, |
|
309 | 309 | util, |
|
310 | 310 | ) |
|
311 | 311 | from mercurial.utils import ( |
|
312 | 312 | procutil, |
|
313 | 313 | stringutil, |
|
314 | 314 | ) |
|
315 | 315 | |
|
316 | 316 | xmlrpclib = util.xmlrpclib |
|
317 | 317 | |
|
318 | 318 | # Note for extension authors: ONLY specify testedwith = 'ships-with-hg-core' for |
|
319 | 319 | # extensions which SHIP WITH MERCURIAL. Non-mainline extensions should |
|
320 | 320 | # be specifying the version(s) of Mercurial they are tested with, or |
|
321 | 321 | # leave the attribute unspecified. |
|
322 | 322 | testedwith = b'ships-with-hg-core' |
|
323 | 323 | |
|
324 | 324 | configtable = {} |
|
325 | 325 | configitem = registrar.configitem(configtable) |
|
326 | 326 | |
|
327 | 327 | configitem( |
|
328 | 328 | b'bugzilla', b'apikey', default=b'', |
|
329 | 329 | ) |
|
330 | 330 | configitem( |
|
331 | 331 | b'bugzilla', b'bzdir', default=b'/var/www/html/bugzilla', |
|
332 | 332 | ) |
|
333 | 333 | configitem( |
|
334 | 334 | b'bugzilla', b'bzemail', default=None, |
|
335 | 335 | ) |
|
336 | 336 | configitem( |
|
337 | 337 | b'bugzilla', b'bzurl', default=b'http://localhost/bugzilla/', |
|
338 | 338 | ) |
|
339 | 339 | configitem( |
|
340 | 340 | b'bugzilla', b'bzuser', default=None, |
|
341 | 341 | ) |
|
342 | 342 | configitem( |
|
343 | 343 | b'bugzilla', b'db', default=b'bugs', |
|
344 | 344 | ) |
|
345 | 345 | configitem( |
|
346 | 346 | b'bugzilla', |
|
347 | 347 | b'fixregexp', |
|
348 | 348 | default=( |
|
349 | 349 | br'fix(?:es)?\s*(?:bugs?\s*)?,?\s*' |
|
350 | 350 | br'(?:nos?\.?|num(?:ber)?s?)?\s*' |
|
351 | 351 | br'(?P<ids>(?:#?\d+\s*(?:,?\s*(?:and)?)?\s*)+)' |
|
352 | 352 | br'\.?\s*(?:h(?:ours?)?\s*(?P<hours>\d*(?:\.\d+)?))?' |
|
353 | 353 | ), |
|
354 | 354 | ) |
|
355 | 355 | configitem( |
|
356 | 356 | b'bugzilla', b'fixresolution', default=b'FIXED', |
|
357 | 357 | ) |
|
358 | 358 | configitem( |
|
359 | 359 | b'bugzilla', b'fixstatus', default=b'RESOLVED', |
|
360 | 360 | ) |
|
361 | 361 | configitem( |
|
362 | 362 | b'bugzilla', b'host', default=b'localhost', |
|
363 | 363 | ) |
|
364 | 364 | configitem( |
|
365 | 365 | b'bugzilla', b'notify', default=configitem.dynamicdefault, |
|
366 | 366 | ) |
|
367 | 367 | configitem( |
|
368 | 368 | b'bugzilla', b'password', default=None, |
|
369 | 369 | ) |
|
370 | 370 | configitem( |
|
371 | 371 | b'bugzilla', |
|
372 | 372 | b'regexp', |
|
373 | 373 | default=( |
|
374 | 374 | br'bugs?\s*,?\s*(?:#|nos?\.?|num(?:ber)?s?)?\s*' |
|
375 | 375 | br'(?P<ids>(?:\d+\s*(?:,?\s*(?:and)?)?\s*)+)' |
|
376 | 376 | br'\.?\s*(?:h(?:ours?)?\s*(?P<hours>\d*(?:\.\d+)?))?' |
|
377 | 377 | ), |
|
378 | 378 | ) |
|
379 | 379 | configitem( |
|
380 | 380 | b'bugzilla', b'strip', default=0, |
|
381 | 381 | ) |
|
382 | 382 | configitem( |
|
383 | 383 | b'bugzilla', b'style', default=None, |
|
384 | 384 | ) |
|
385 | 385 | configitem( |
|
386 | 386 | b'bugzilla', b'template', default=None, |
|
387 | 387 | ) |
|
388 | 388 | configitem( |
|
389 | 389 | b'bugzilla', b'timeout', default=5, |
|
390 | 390 | ) |
|
391 | 391 | configitem( |
|
392 | 392 | b'bugzilla', b'user', default=b'bugs', |
|
393 | 393 | ) |
|
394 | 394 | configitem( |
|
395 | 395 | b'bugzilla', b'usermap', default=None, |
|
396 | 396 | ) |
|
397 | 397 | configitem( |
|
398 | 398 | b'bugzilla', b'version', default=None, |
|
399 | 399 | ) |
|
400 | 400 | |
|
401 | 401 | |
|
402 | 402 | class bzaccess(object): |
|
403 | 403 | '''Base class for access to Bugzilla.''' |
|
404 | 404 | |
|
405 | 405 | def __init__(self, ui): |
|
406 | 406 | self.ui = ui |
|
407 | 407 | usermap = self.ui.config(b'bugzilla', b'usermap') |
|
408 | 408 | if usermap: |
|
409 | 409 | self.ui.readconfig(usermap, sections=[b'usermap']) |
|
410 | 410 | |
|
411 | 411 | def map_committer(self, user): |
|
412 | 412 | '''map name of committer to Bugzilla user name.''' |
|
413 | 413 | for committer, bzuser in self.ui.configitems(b'usermap'): |
|
414 | 414 | if committer.lower() == user.lower(): |
|
415 | 415 | return bzuser |
|
416 | 416 | return user |
|
417 | 417 | |
|
418 | 418 | # Methods to be implemented by access classes. |
|
419 | 419 | # |
|
420 | 420 | # 'bugs' is a dict keyed on bug id, where values are a dict holding |
|
421 | 421 | # updates to bug state. Recognized dict keys are: |
|
422 | 422 | # |
|
423 | 423 | # 'hours': Value, float containing work hours to be updated. |
|
424 | 424 | # 'fix': If key present, bug is to be marked fixed. Value ignored. |
|
425 | 425 | |
|
426 | 426 | def filter_real_bug_ids(self, bugs): |
|
427 | 427 | '''remove bug IDs that do not exist in Bugzilla from bugs.''' |
|
428 | 428 | |
|
429 | 429 | def filter_cset_known_bug_ids(self, node, bugs): |
|
430 | 430 | '''remove bug IDs where node occurs in comment text from bugs.''' |
|
431 | 431 | |
|
432 | 432 | def updatebug(self, bugid, newstate, text, committer): |
|
433 | 433 | '''update the specified bug. Add comment text and set new states. |
|
434 | 434 | |
|
435 | 435 | If possible add the comment as being from the committer of |
|
436 | 436 | the changeset. Otherwise use the default Bugzilla user. |
|
437 | 437 | ''' |
|
438 | 438 | |
|
439 | 439 | def notify(self, bugs, committer): |
|
440 | 440 | '''Force sending of Bugzilla notification emails. |
|
441 | 441 | |
|
442 | 442 | Only required if the access method does not trigger notification |
|
443 | 443 | emails automatically. |
|
444 | 444 | ''' |
|
445 | 445 | |
|
446 | 446 | |
|
447 | 447 | # Bugzilla via direct access to MySQL database. |
|
448 | 448 | class bzmysql(bzaccess): |
|
449 | 449 | '''Support for direct MySQL access to Bugzilla. |
|
450 | 450 | |
|
451 | 451 | The earliest Bugzilla version this is tested with is version 2.16. |
|
452 | 452 | |
|
453 | 453 | If your Bugzilla is version 3.4 or above, you are strongly |
|
454 | 454 | recommended to use the XMLRPC access method instead. |
|
455 | 455 | ''' |
|
456 | 456 | |
|
457 | 457 | @staticmethod |
|
458 | 458 | def sql_buglist(ids): |
|
459 | 459 | '''return SQL-friendly list of bug ids''' |
|
460 | 460 | return b'(' + b','.join(map(str, ids)) + b')' |
|
461 | 461 | |
|
462 | 462 | _MySQLdb = None |
|
463 | 463 | |
|
464 | 464 | def __init__(self, ui): |
|
465 | 465 | try: |
|
466 | 466 | import MySQLdb as mysql |
|
467 | 467 | |
|
468 | 468 | bzmysql._MySQLdb = mysql |
|
469 | 469 | except ImportError as err: |
|
470 | 470 | raise error.Abort( |
|
471 | 471 | _(b'python mysql support not available: %s') % err |
|
472 | 472 | ) |
|
473 | 473 | |
|
474 | 474 | bzaccess.__init__(self, ui) |
|
475 | 475 | |
|
476 | 476 | host = self.ui.config(b'bugzilla', b'host') |
|
477 | 477 | user = self.ui.config(b'bugzilla', b'user') |
|
478 | 478 | passwd = self.ui.config(b'bugzilla', b'password') |
|
479 | 479 | db = self.ui.config(b'bugzilla', b'db') |
|
480 | 480 | timeout = int(self.ui.config(b'bugzilla', b'timeout')) |
|
481 | 481 | self.ui.note( |
|
482 | 482 | _(b'connecting to %s:%s as %s, password %s\n') |
|
483 | 483 | % (host, db, user, b'*' * len(passwd)) |
|
484 | 484 | ) |
|
485 | 485 | self.conn = bzmysql._MySQLdb.connect( |
|
486 | 486 | host=host, user=user, passwd=passwd, db=db, connect_timeout=timeout |
|
487 | 487 | ) |
|
488 | 488 | self.cursor = self.conn.cursor() |
|
489 | 489 | self.longdesc_id = self.get_longdesc_id() |
|
490 | 490 | self.user_ids = {} |
|
491 | 491 | self.default_notify = b"cd %(bzdir)s && ./processmail %(id)s %(user)s" |
|
492 | 492 | |
|
493 | 493 | def run(self, *args, **kwargs): |
|
494 | 494 | '''run a query.''' |
|
495 | 495 | self.ui.note(_(b'query: %s %s\n') % (args, kwargs)) |
|
496 | 496 | try: |
|
497 | 497 | self.cursor.execute(*args, **kwargs) |
|
498 | 498 | except bzmysql._MySQLdb.MySQLError: |
|
499 | 499 | self.ui.note(_(b'failed query: %s %s\n') % (args, kwargs)) |
|
500 | 500 | raise |
|
501 | 501 | |
|
502 | 502 | def get_longdesc_id(self): |
|
503 | 503 | '''get identity of longdesc field''' |
|
504 | 504 | self.run(b'select fieldid from fielddefs where name = "longdesc"') |
|
505 | 505 | ids = self.cursor.fetchall() |
|
506 | 506 | if len(ids) != 1: |
|
507 | 507 | raise error.Abort(_(b'unknown database schema')) |
|
508 | 508 | return ids[0][0] |
|
509 | 509 | |
|
510 | 510 | def filter_real_bug_ids(self, bugs): |
|
511 | 511 | '''filter not-existing bugs from set.''' |
|
512 | 512 | self.run( |
|
513 | 513 | b'select bug_id from bugs where bug_id in %s' |
|
514 | 514 | % bzmysql.sql_buglist(bugs.keys()) |
|
515 | 515 | ) |
|
516 | 516 | existing = [id for (id,) in self.cursor.fetchall()] |
|
517 | 517 | for id in bugs.keys(): |
|
518 | 518 | if id not in existing: |
|
519 | 519 | self.ui.status(_(b'bug %d does not exist\n') % id) |
|
520 | 520 | del bugs[id] |
|
521 | 521 | |
|
522 | 522 | def filter_cset_known_bug_ids(self, node, bugs): |
|
523 | 523 | '''filter bug ids that already refer to this changeset from set.''' |
|
524 | 524 | self.run( |
|
525 | 525 | '''select bug_id from longdescs where |
|
526 | 526 | bug_id in %s and thetext like "%%%s%%"''' |
|
527 | 527 | % (bzmysql.sql_buglist(bugs.keys()), short(node)) |
|
528 | 528 | ) |
|
529 | 529 | for (id,) in self.cursor.fetchall(): |
|
530 | 530 | self.ui.status( |
|
531 | 531 | _(b'bug %d already knows about changeset %s\n') |
|
532 | 532 | % (id, short(node)) |
|
533 | 533 | ) |
|
534 | 534 | del bugs[id] |
|
535 | 535 | |
|
536 | 536 | def notify(self, bugs, committer): |
|
537 | 537 | '''tell bugzilla to send mail.''' |
|
538 | 538 | self.ui.status(_(b'telling bugzilla to send mail:\n')) |
|
539 | 539 | (user, userid) = self.get_bugzilla_user(committer) |
|
540 | 540 | for id in bugs.keys(): |
|
541 | 541 | self.ui.status(_(b' bug %s\n') % id) |
|
542 | 542 | cmdfmt = self.ui.config(b'bugzilla', b'notify', self.default_notify) |
|
543 | 543 | bzdir = self.ui.config(b'bugzilla', b'bzdir') |
|
544 | 544 | try: |
|
545 | 545 | # Backwards-compatible with old notify string, which |
|
546 | 546 | # took one string. This will throw with a new format |
|
547 | 547 | # string. |
|
548 | 548 | cmd = cmdfmt % id |
|
549 | 549 | except TypeError: |
|
550 | 550 | cmd = cmdfmt % {b'bzdir': bzdir, b'id': id, b'user': user} |
|
551 | 551 | self.ui.note(_(b'running notify command %s\n') % cmd) |
|
552 | 552 | fp = procutil.popen(b'(%s) 2>&1' % cmd, b'rb') |
|
553 | 553 | out = util.fromnativeeol(fp.read()) |
|
554 | 554 | ret = fp.close() |
|
555 | 555 | if ret: |
|
556 | 556 | self.ui.warn(out) |
|
557 | 557 | raise error.Abort( |
|
558 | 558 | _(b'bugzilla notify command %s') % procutil.explainexit(ret) |
|
559 | 559 | ) |
|
560 | 560 | self.ui.status(_(b'done\n')) |
|
561 | 561 | |
|
562 | 562 | def get_user_id(self, user): |
|
563 | 563 | '''look up numeric bugzilla user id.''' |
|
564 | 564 | try: |
|
565 | 565 | return self.user_ids[user] |
|
566 | 566 | except KeyError: |
|
567 | 567 | try: |
|
568 | 568 | userid = int(user) |
|
569 | 569 | except ValueError: |
|
570 | 570 | self.ui.note(_(b'looking up user %s\n') % user) |
|
571 | 571 | self.run( |
|
572 | 572 | '''select userid from profiles |
|
573 | 573 | where login_name like %s''', |
|
574 | 574 | user, |
|
575 | 575 | ) |
|
576 | 576 | all = self.cursor.fetchall() |
|
577 | 577 | if len(all) != 1: |
|
578 | 578 | raise KeyError(user) |
|
579 | 579 | userid = int(all[0][0]) |
|
580 | 580 | self.user_ids[user] = userid |
|
581 | 581 | return userid |
|
582 | 582 | |
|
583 | 583 | def get_bugzilla_user(self, committer): |
|
584 | 584 | '''See if committer is a registered bugzilla user. Return |
|
585 | 585 | bugzilla username and userid if so. If not, return default |
|
586 | 586 | bugzilla username and userid.''' |
|
587 | 587 | user = self.map_committer(committer) |
|
588 | 588 | try: |
|
589 | 589 | userid = self.get_user_id(user) |
|
590 | 590 | except KeyError: |
|
591 | 591 | try: |
|
592 | 592 | defaultuser = self.ui.config(b'bugzilla', b'bzuser') |
|
593 | 593 | if not defaultuser: |
|
594 | 594 | raise error.Abort( |
|
595 | 595 | _(b'cannot find bugzilla user id for %s') % user |
|
596 | 596 | ) |
|
597 | 597 | userid = self.get_user_id(defaultuser) |
|
598 | 598 | user = defaultuser |
|
599 | 599 | except KeyError: |
|
600 | 600 | raise error.Abort( |
|
601 | 601 | _(b'cannot find bugzilla user id for %s or %s') |
|
602 | 602 | % (user, defaultuser) |
|
603 | 603 | ) |
|
604 | 604 | return (user, userid) |
|
605 | 605 | |
|
606 | 606 | def updatebug(self, bugid, newstate, text, committer): |
|
607 | 607 | '''update bug state with comment text. |
|
608 | 608 | |
|
609 | 609 | Try adding comment as committer of changeset, otherwise as |
|
610 | 610 | default bugzilla user.''' |
|
611 | 611 | if len(newstate) > 0: |
|
612 | 612 | self.ui.warn(_(b"Bugzilla/MySQL cannot update bug state\n")) |
|
613 | 613 | |
|
614 | 614 | (user, userid) = self.get_bugzilla_user(committer) |
|
615 | 615 | now = time.strftime(r'%Y-%m-%d %H:%M:%S') |
|
616 | 616 | self.run( |
|
617 | 617 | '''insert into longdescs |
|
618 | 618 | (bug_id, who, bug_when, thetext) |
|
619 | 619 | values (%s, %s, %s, %s)''', |
|
620 | 620 | (bugid, userid, now, text), |
|
621 | 621 | ) |
|
622 | 622 | self.run( |
|
623 | 623 | '''insert into bugs_activity (bug_id, who, bug_when, fieldid) |
|
624 | 624 | values (%s, %s, %s, %s)''', |
|
625 | 625 | (bugid, userid, now, self.longdesc_id), |
|
626 | 626 | ) |
|
627 | 627 | self.conn.commit() |
|
628 | 628 | |
|
629 | 629 | |
|
630 | 630 | class bzmysql_2_18(bzmysql): |
|
631 | 631 | '''support for bugzilla 2.18 series.''' |
|
632 | 632 | |
|
633 | 633 | def __init__(self, ui): |
|
634 | 634 | bzmysql.__init__(self, ui) |
|
635 | 635 | self.default_notify = ( |
|
636 | 636 | b"cd %(bzdir)s && perl -T contrib/sendbugmail.pl %(id)s %(user)s" |
|
637 | 637 | ) |
|
638 | 638 | |
|
639 | 639 | |
|
640 | 640 | class bzmysql_3_0(bzmysql_2_18): |
|
641 | 641 | '''support for bugzilla 3.0 series.''' |
|
642 | 642 | |
|
643 | 643 | def __init__(self, ui): |
|
644 | 644 | bzmysql_2_18.__init__(self, ui) |
|
645 | 645 | |
|
646 | 646 | def get_longdesc_id(self): |
|
647 | 647 | '''get identity of longdesc field''' |
|
648 | 648 | self.run(b'select id from fielddefs where name = "longdesc"') |
|
649 | 649 | ids = self.cursor.fetchall() |
|
650 | 650 | if len(ids) != 1: |
|
651 | 651 | raise error.Abort(_(b'unknown database schema')) |
|
652 | 652 | return ids[0][0] |
|
653 | 653 | |
|
654 | 654 | |
|
655 | 655 | # Bugzilla via XMLRPC interface. |
|
656 | 656 | |
|
657 | 657 | |
|
658 | 658 | class cookietransportrequest(object): |
|
659 | 659 | """A Transport request method that retains cookies over its lifetime. |
|
660 | 660 | |
|
661 | 661 | The regular xmlrpclib transports ignore cookies. Which causes |
|
662 | 662 | a bit of a problem when you need a cookie-based login, as with |
|
663 | 663 | the Bugzilla XMLRPC interface prior to 4.4.3. |
|
664 | 664 | |
|
665 | 665 | So this is a helper for defining a Transport which looks for |
|
666 | 666 | cookies being set in responses and saves them to add to all future |
|
667 | 667 | requests. |
|
668 | 668 | """ |
|
669 | 669 | |
|
670 | 670 | # Inspiration drawn from |
|
671 | 671 | # http://blog.godson.in/2010/09/how-to-make-python-xmlrpclib-client.html |
|
672 | 672 | # http://www.itkovian.net/base/transport-class-for-pythons-xml-rpc-lib/ |
|
673 | 673 | |
|
674 | 674 | cookies = [] |
|
675 | 675 | |
|
676 | 676 | def send_cookies(self, connection): |
|
677 | 677 | if self.cookies: |
|
678 | 678 | for cookie in self.cookies: |
|
679 | 679 | connection.putheader(b"Cookie", cookie) |
|
680 | 680 | |
|
681 | 681 | def request(self, host, handler, request_body, verbose=0): |
|
682 | 682 | self.verbose = verbose |
|
683 | 683 | self.accept_gzip_encoding = False |
|
684 | 684 | |
|
685 | 685 | # issue XML-RPC request |
|
686 | 686 | h = self.make_connection(host) |
|
687 | 687 | if verbose: |
|
688 | 688 | h.set_debuglevel(1) |
|
689 | 689 | |
|
690 | 690 | self.send_request(h, handler, request_body) |
|
691 | 691 | self.send_host(h, host) |
|
692 | 692 | self.send_cookies(h) |
|
693 | 693 | self.send_user_agent(h) |
|
694 | 694 | self.send_content(h, request_body) |
|
695 | 695 | |
|
696 | 696 | # Deal with differences between Python 2.6 and 2.7. |
|
697 | 697 | # In the former h is an HTTP(S). In the latter it's an
|
698 | 698 | # HTTP(S)Connection. Luckily, the 2.6 implementation of |
|
699 | 699 | # HTTP(S) has an underlying HTTP(S)Connection, so extract |
|
700 | 700 | # that and use it. |
|
701 | 701 | try: |
|
702 | 702 | response = h.getresponse() |
|
703 | 703 | except AttributeError: |
|
704 | 704 | response = h._conn.getresponse() |
|
705 | 705 | |
|
706 | 706 | # Add any cookie definitions to our list. |
|
707 | 707 | for header in response.msg.getallmatchingheaders(b"Set-Cookie"): |
|
708 | 708 | val = header.split(b": ", 1)[1] |
|
709 | 709 | cookie = val.split(b";", 1)[0] |
|
710 | 710 | self.cookies.append(cookie) |
|
711 | 711 | |
|
712 | 712 | if response.status != 200: |
|
713 | 713 | raise xmlrpclib.ProtocolError( |
|
714 | 714 | host + handler, |
|
715 | 715 | response.status, |
|
716 | 716 | response.reason, |
|
717 | 717 | response.msg.headers, |
|
718 | 718 | ) |
|
719 | 719 | |
|
720 | 720 | payload = response.read() |
|
721 | 721 | parser, unmarshaller = self.getparser() |
|
722 | 722 | parser.feed(payload) |
|
723 | 723 | parser.close() |
|
724 | 724 | |
|
725 | 725 | return unmarshaller.close() |
|
726 | 726 | |
|
727 | 727 | |
|
728 | 728 | # The explicit calls to the underlying xmlrpclib __init__() methods are |
|
729 | 729 | # necessary. The xmlrpclib.Transport classes are old-style classes, and |
|
730 | 730 | # it turns out their __init__() doesn't get called when doing multiple |
|
731 | 731 | # inheritance with a new-style class. |
|
732 | 732 | class cookietransport(cookietransportrequest, xmlrpclib.Transport): |
|
733 | 733 | def __init__(self, use_datetime=0): |
|
734 |     | if util.safehasattr(xmlrpclib.Transport,

    | 734 | if util.safehasattr(xmlrpclib.Transport, "__init__"):
|
735 | 735 | xmlrpclib.Transport.__init__(self, use_datetime) |
|
736 | 736 | |
|
737 | 737 | |
|
738 | 738 | class cookiesafetransport(cookietransportrequest, xmlrpclib.SafeTransport): |
|
739 | 739 | def __init__(self, use_datetime=0): |
|
740 |     | if util.safehasattr(xmlrpclib.Transport,

    | 740 | if util.safehasattr(xmlrpclib.Transport, "__init__"):
|
741 | 741 | xmlrpclib.SafeTransport.__init__(self, use_datetime) |
|
742 | 742 | |
|
743 | 743 | |
|
744 | 744 | class bzxmlrpc(bzaccess): |
|
745 | 745 | """Support for access to Bugzilla via the Bugzilla XMLRPC API. |
|
746 | 746 | |
|
747 | 747 | Requires a minimum Bugzilla version 3.4. |
|
748 | 748 | """ |
|
749 | 749 | |
|
750 | 750 | def __init__(self, ui): |
|
751 | 751 | bzaccess.__init__(self, ui) |
|
752 | 752 | |
|
753 | 753 | bzweb = self.ui.config(b'bugzilla', b'bzurl') |
|
754 | 754 | bzweb = bzweb.rstrip(b"/") + b"/xmlrpc.cgi" |
|
755 | 755 | |
|
756 | 756 | user = self.ui.config(b'bugzilla', b'user') |
|
757 | 757 | passwd = self.ui.config(b'bugzilla', b'password') |
|
758 | 758 | |
|
759 | 759 | self.fixstatus = self.ui.config(b'bugzilla', b'fixstatus') |
|
760 | 760 | self.fixresolution = self.ui.config(b'bugzilla', b'fixresolution') |
|
761 | 761 | |
|
762 | 762 | self.bzproxy = xmlrpclib.ServerProxy(bzweb, self.transport(bzweb)) |
|
763 | 763 | ver = self.bzproxy.Bugzilla.version()[b'version'].split(b'.') |
|
764 | 764 | self.bzvermajor = int(ver[0]) |
|
765 | 765 | self.bzverminor = int(ver[1]) |
|
766 | 766 | login = self.bzproxy.User.login( |
|
767 | 767 | {b'login': user, b'password': passwd, b'restrict_login': True} |
|
768 | 768 | ) |
|
769 | 769 | self.bztoken = login.get(b'token', b'') |
|
770 | 770 | |
|
771 | 771 | def transport(self, uri): |
|
772 | 772 | if util.urlreq.urlparse(uri, b"http")[0] == b"https": |
|
773 | 773 | return cookiesafetransport() |
|
774 | 774 | else: |
|
775 | 775 | return cookietransport() |
|
776 | 776 | |
|
777 | 777 | def get_bug_comments(self, id): |
|
778 | 778 | """Return a string with all comment text for a bug.""" |
|
779 | 779 | c = self.bzproxy.Bug.comments( |
|
780 | 780 | {b'ids': [id], b'include_fields': [b'text'], b'token': self.bztoken} |
|
781 | 781 | ) |
|
782 | 782 | return b''.join( |
|
783 | 783 | [t[b'text'] for t in c[b'bugs'][b'%d' % id][b'comments']] |
|
784 | 784 | ) |
|
785 | 785 | |
|
786 | 786 | def filter_real_bug_ids(self, bugs): |
|
787 | 787 | probe = self.bzproxy.Bug.get( |
|
788 | 788 | { |
|
789 | 789 | b'ids': sorted(bugs.keys()), |
|
790 | 790 | b'include_fields': [], |
|
791 | 791 | b'permissive': True, |
|
792 | 792 | b'token': self.bztoken, |
|
793 | 793 | } |
|
794 | 794 | ) |
|
795 | 795 | for badbug in probe[b'faults']: |
|
796 | 796 | id = badbug[b'id'] |
|
797 | 797 | self.ui.status(_(b'bug %d does not exist\n') % id) |
|
798 | 798 | del bugs[id] |
|
799 | 799 | |
|
800 | 800 | def filter_cset_known_bug_ids(self, node, bugs): |
|
801 | 801 | for id in sorted(bugs.keys()): |
|
802 | 802 | if self.get_bug_comments(id).find(short(node)) != -1: |
|
803 | 803 | self.ui.status( |
|
804 | 804 | _(b'bug %d already knows about changeset %s\n') |
|
805 | 805 | % (id, short(node)) |
|
806 | 806 | ) |
|
807 | 807 | del bugs[id] |
|
808 | 808 | |
|
809 | 809 | def updatebug(self, bugid, newstate, text, committer): |
|
810 | 810 | args = {} |
|
811 | 811 | if b'hours' in newstate: |
|
812 | 812 | args[b'work_time'] = newstate[b'hours'] |
|
813 | 813 | |
|
814 | 814 | if self.bzvermajor >= 4: |
|
815 | 815 | args[b'ids'] = [bugid] |
|
816 | 816 | args[b'comment'] = {b'body': text} |
|
817 | 817 | if b'fix' in newstate: |
|
818 | 818 | args[b'status'] = self.fixstatus |
|
819 | 819 | args[b'resolution'] = self.fixresolution |
|
820 | 820 | args[b'token'] = self.bztoken |
|
821 | 821 | self.bzproxy.Bug.update(args) |
|
822 | 822 | else: |
|
823 | 823 | if b'fix' in newstate: |
|
824 | 824 | self.ui.warn( |
|
825 | 825 | _( |
|
826 | 826 | b"Bugzilla/XMLRPC needs Bugzilla 4.0 or later " |
|
827 | 827 | b"to mark bugs fixed\n" |
|
828 | 828 | ) |
|
829 | 829 | ) |
|
830 | 830 | args[b'id'] = bugid |
|
831 | 831 | args[b'comment'] = text |
|
832 | 832 | self.bzproxy.Bug.add_comment(args) |
|
833 | 833 | |
|
834 | 834 | |
|
835 | 835 | class bzxmlrpcemail(bzxmlrpc): |
|
836 | 836 | """Read data from Bugzilla via XMLRPC, send updates via email. |
|
837 | 837 | |
|
838 | 838 | Advantages of sending updates via email: |
|
839 | 839 | 1. Comments can be added as any user, not just logged in user. |
|
840 | 840 | 2. Bug statuses or other fields not accessible via XMLRPC can |
|
841 | 841 | potentially be updated. |
|
842 | 842 | |
|
843 | 843 | There is no XMLRPC function to change bug status before Bugzilla |
|
844 | 844 | 4.0, so bugs cannot be marked fixed via XMLRPC before Bugzilla 4.0. |
|
845 | 845 | But bugs can be marked fixed via email from 3.4 onwards. |
|
846 | 846 | """ |
|
847 | 847 | |
|
848 | 848 | # The email interface changes subtly between 3.4 and 3.6. In 3.4, |
|
849 | 849 | # in-email fields are specified as '@<fieldname> = <value>'. In |
|
850 | 850 | # 3.6 this becomes '@<fieldname> <value>'. And fieldname @bug_id |
|
851 | 851 | # in 3.4 becomes @id in 3.6. 3.6 and 4.0 both maintain backwards |
|
852 | 852 | # compatibility, but rather than rely on this use the new format for |
|
853 | 853 | # 4.0 onwards. |
|
854 | 854 | |
|
855 | 855 | def __init__(self, ui): |
|
856 | 856 | bzxmlrpc.__init__(self, ui) |
|
857 | 857 | |
|
858 | 858 | self.bzemail = self.ui.config(b'bugzilla', b'bzemail') |
|
859 | 859 | if not self.bzemail: |
|
860 | 860 | raise error.Abort(_(b"configuration 'bzemail' missing")) |
|
861 | 861 | mail.validateconfig(self.ui) |
|
862 | 862 | |
|
863 | 863 | def makecommandline(self, fieldname, value): |
|
864 | 864 | if self.bzvermajor >= 4: |
|
865 | 865 | return b"@%s %s" % (fieldname, pycompat.bytestr(value)) |
|
866 | 866 | else: |
|
867 | 867 | if fieldname == b"id": |
|
868 | 868 | fieldname = b"bug_id" |
|
869 | 869 | return b"@%s = %s" % (fieldname, pycompat.bytestr(value)) |
|
870 | 870 | |
|
871 | 871 | def send_bug_modify_email(self, bugid, commands, comment, committer): |
|
872 | 872 | '''send modification message to Bugzilla bug via email. |
|
873 | 873 | |
|
874 | 874 | The message format is documented in the Bugzilla email_in.pl |
|
875 | 875 | specification. commands is a list of command lines, comment is the |
|
876 | 876 | comment text. |
|
877 | 877 | |
|
878 | 878 | To stop users from crafting commit comments with |
|
879 | 879 | Bugzilla commands, specify the bug ID via the message body, rather |
|
880 | 880 | than the subject line, and leave a blank line after it. |
|
881 | 881 | ''' |
|
882 | 882 | user = self.map_committer(committer) |
|
883 | 883 | matches = self.bzproxy.User.get( |
|
884 | 884 | {b'match': [user], b'token': self.bztoken} |
|
885 | 885 | ) |
|
886 | 886 | if not matches[b'users']: |
|
887 | 887 | user = self.ui.config(b'bugzilla', b'user') |
|
888 | 888 | matches = self.bzproxy.User.get( |
|
889 | 889 | {b'match': [user], b'token': self.bztoken} |
|
890 | 890 | ) |
|
891 | 891 | if not matches[b'users']: |
|
892 | 892 | raise error.Abort( |
|
893 | 893 | _(b"default bugzilla user %s email not found") % user |
|
894 | 894 | ) |
|
895 | 895 | user = matches[b'users'][0][b'email'] |
|
896 | 896 | commands.append(self.makecommandline(b"id", bugid)) |
|
897 | 897 | |
|
898 | 898 | text = b"\n".join(commands) + b"\n\n" + comment |
|
899 | 899 | |
|
900 | 900 | _charsets = mail._charsets(self.ui) |
|
901 | 901 | user = mail.addressencode(self.ui, user, _charsets) |
|
902 | 902 | bzemail = mail.addressencode(self.ui, self.bzemail, _charsets) |
|
903 | 903 | msg = mail.mimeencode(self.ui, text, _charsets) |
|
904 | 904 | msg[b'From'] = user |
|
905 | 905 | msg[b'To'] = bzemail |
|
906 | 906 | msg[b'Subject'] = mail.headencode( |
|
907 | 907 | self.ui, b"Bug modification", _charsets |
|
908 | 908 | ) |
|
909 | 909 | sendmail = mail.connect(self.ui) |
|
910 | 910 | sendmail(user, bzemail, msg.as_string()) |
|
911 | 911 | |
|
912 | 912 | def updatebug(self, bugid, newstate, text, committer): |
|
913 | 913 | cmds = [] |
|
914 | 914 | if b'hours' in newstate: |
|
915 | 915 | cmds.append(self.makecommandline(b"work_time", newstate[b'hours'])) |
|
916 | 916 | if b'fix' in newstate: |
|
917 | 917 | cmds.append(self.makecommandline(b"bug_status", self.fixstatus)) |
|
918 | 918 | cmds.append(self.makecommandline(b"resolution", self.fixresolution)) |
|
919 | 919 | self.send_bug_modify_email(bugid, cmds, text, committer) |
|
920 | 920 | |
|
921 | 921 | |
|
922 | 922 | class NotFound(LookupError): |
|
923 | 923 | pass |
|
924 | 924 | |
|
925 | 925 | |
|
926 | 926 | class bzrestapi(bzaccess): |
|
927 | 927 | """Read and write bugzilla data using the REST API available since |
|
928 | 928 | Bugzilla 5.0. |
|
929 | 929 | """ |
|
930 | 930 | |
|
931 | 931 | def __init__(self, ui): |
|
932 | 932 | bzaccess.__init__(self, ui) |
|
933 | 933 | bz = self.ui.config(b'bugzilla', b'bzurl') |
|
934 | 934 | self.bzroot = b'/'.join([bz, b'rest']) |
|
935 | 935 | self.apikey = self.ui.config(b'bugzilla', b'apikey') |
|
936 | 936 | self.user = self.ui.config(b'bugzilla', b'user') |
|
937 | 937 | self.passwd = self.ui.config(b'bugzilla', b'password') |
|
938 | 938 | self.fixstatus = self.ui.config(b'bugzilla', b'fixstatus') |
|
939 | 939 | self.fixresolution = self.ui.config(b'bugzilla', b'fixresolution') |
|
940 | 940 | |
|
941 | 941 | def apiurl(self, targets, include_fields=None): |
|
942 | 942 | url = b'/'.join([self.bzroot] + [pycompat.bytestr(t) for t in targets]) |
|
943 | 943 | qv = {} |
|
944 | 944 | if self.apikey: |
|
945 | 945 | qv[b'api_key'] = self.apikey |
|
946 | 946 | elif self.user and self.passwd: |
|
947 | 947 | qv[b'login'] = self.user |
|
948 | 948 | qv[b'password'] = self.passwd |
|
949 | 949 | if include_fields: |
|
950 | 950 | qv[b'include_fields'] = include_fields |
|
951 | 951 | if qv: |
|
952 | 952 | url = b'%s?%s' % (url, util.urlreq.urlencode(qv)) |
|
953 | 953 | return url |
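    # Illustration only: with bzurl set to http://my-project.org/bugzilla
    # (as in the module docstring examples) and an apikey configured (the
    # key below is invented), apiurl((b'bug', 1234)) yields roughly
    #
    #   http://my-project.org/bugzilla/rest/bug/1234?api_key=SECRET
    #
    # with login/password query parameters appended instead when no apikey
    # is set.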
|
954 | 954 | |
|
955 | 955 | def _fetch(self, burl): |
|
956 | 956 | try: |
|
957 | 957 | resp = url.open(self.ui, burl) |
|
958 | 958 | return json.loads(resp.read()) |
|
959 | 959 | except util.urlerr.httperror as inst: |
|
960 | 960 | if inst.code == 401: |
|
961 | 961 | raise error.Abort(_(b'authorization failed')) |
|
962 | 962 | if inst.code == 404: |
|
963 | 963 | raise NotFound() |
|
964 | 964 | else: |
|
965 | 965 | raise |
|
966 | 966 | |
|
967 | 967 | def _submit(self, burl, data, method=b'POST'): |
|
968 | 968 | data = json.dumps(data) |
|
969 | 969 | if method == b'PUT': |
|
970 | 970 | |
|
971 | 971 | class putrequest(util.urlreq.request): |
|
972 | 972 | def get_method(self): |
|
973 | 973 | return b'PUT' |
|
974 | 974 | |
|
975 | 975 | request_type = putrequest |
|
976 | 976 | else: |
|
977 | 977 | request_type = util.urlreq.request |
|
978 | 978 | req = request_type(burl, data, {b'Content-Type': b'application/json'}) |
|
979 | 979 | try: |
|
980 | 980 | resp = url.opener(self.ui).open(req) |
|
981 | 981 | return json.loads(resp.read()) |
|
982 | 982 | except util.urlerr.httperror as inst: |
|
983 | 983 | if inst.code == 401: |
|
984 | 984 | raise error.Abort(_(b'authorization failed')) |
|
985 | 985 | if inst.code == 404: |
|
986 | 986 | raise NotFound() |
|
987 | 987 | else: |
|
988 | 988 | raise |
|
989 | 989 | |
|
990 | 990 | def filter_real_bug_ids(self, bugs): |
|
991 | 991 | '''remove bug IDs that do not exist in Bugzilla from bugs.''' |
|
992 | 992 | badbugs = set() |
|
993 | 993 | for bugid in bugs: |
|
994 | 994 | burl = self.apiurl((b'bug', bugid), include_fields=b'status') |
|
995 | 995 | try: |
|
996 | 996 | self._fetch(burl) |
|
997 | 997 | except NotFound: |
|
998 | 998 | badbugs.add(bugid) |
|
999 | 999 | for bugid in badbugs: |
|
1000 | 1000 | del bugs[bugid] |
|
1001 | 1001 | |
|
1002 | 1002 | def filter_cset_known_bug_ids(self, node, bugs): |
|
1003 | 1003 | '''remove bug IDs where node occurs in comment text from bugs.''' |
|
1004 | 1004 | sn = short(node) |
|
1005 | 1005 | for bugid in bugs.keys(): |
|
1006 | 1006 | burl = self.apiurl( |
|
1007 | 1007 | (b'bug', bugid, b'comment'), include_fields=b'text' |
|
1008 | 1008 | ) |
|
1009 | 1009 | result = self._fetch(burl) |
|
1010 | 1010 | comments = result[b'bugs'][pycompat.bytestr(bugid)][b'comments'] |
|
1011 | 1011 | if any(sn in c[b'text'] for c in comments): |
|
1012 | 1012 | self.ui.status( |
|
1013 | 1013 | _(b'bug %d already knows about changeset %s\n') |
|
1014 | 1014 | % (bugid, sn) |
|
1015 | 1015 | ) |
|
1016 | 1016 | del bugs[bugid] |
|
1017 | 1017 | |
|
1018 | 1018 | def updatebug(self, bugid, newstate, text, committer): |
|
1019 | 1019 | '''update the specified bug. Add comment text and set new states. |
|
1020 | 1020 | |
|
1021 | 1021 | If possible add the comment as being from the committer of |
|
1022 | 1022 | the changeset. Otherwise use the default Bugzilla user. |
|
1023 | 1023 | ''' |
|
1024 | 1024 | bugmod = {} |
|
1025 | 1025 | if b'hours' in newstate: |
|
1026 | 1026 | bugmod[b'work_time'] = newstate[b'hours'] |
|
1027 | 1027 | if b'fix' in newstate: |
|
1028 | 1028 | bugmod[b'status'] = self.fixstatus |
|
1029 | 1029 | bugmod[b'resolution'] = self.fixresolution |
|
1030 | 1030 | if bugmod: |
|
1031 | 1031 | # if we have to change the bugs state do it here |
|
1032 | 1032 | bugmod[b'comment'] = { |
|
1033 | 1033 | b'comment': text, |
|
1034 | 1034 | b'is_private': False, |
|
1035 | 1035 | b'is_markdown': False, |
|
1036 | 1036 | } |
|
1037 | 1037 | burl = self.apiurl((b'bug', bugid)) |
|
1038 | 1038 | self._submit(burl, bugmod, method=b'PUT') |
|
1039 | 1039 | self.ui.debug(b'updated bug %s\n' % bugid) |
|
1040 | 1040 | else: |
|
1041 | 1041 | burl = self.apiurl((b'bug', bugid, b'comment')) |
|
1042 | 1042 | self._submit( |
|
1043 | 1043 | burl, |
|
1044 | 1044 | { |
|
1045 | 1045 | b'comment': text, |
|
1046 | 1046 | b'is_private': False, |
|
1047 | 1047 | b'is_markdown': False, |
|
1048 | 1048 | }, |
|
1049 | 1049 | ) |
|
1050 | 1050 | self.ui.debug(b'added comment to bug %s\n' % bugid) |
|
1051 | 1051 | |
|
1052 | 1052 | def notify(self, bugs, committer): |
|
1053 | 1053 | '''Force sending of Bugzilla notification emails. |
|
1054 | 1054 | |
|
1055 | 1055 | Only required if the access method does not trigger notification |
|
1056 | 1056 | emails automatically. |
|
1057 | 1057 | ''' |
|
1058 | 1058 | pass |
|
1059 | 1059 | |
|
1060 | 1060 | |
|
1061 | 1061 | class bugzilla(object): |
|
1062 | 1062 | # supported versions of bugzilla. different versions have |
|
1063 | 1063 | # different schemas. |
|
1064 | 1064 | _versions = { |
|
1065 | 1065 | b'2.16': bzmysql, |
|
1066 | 1066 | b'2.18': bzmysql_2_18, |
|
1067 | 1067 | b'3.0': bzmysql_3_0, |
|
1068 | 1068 | b'xmlrpc': bzxmlrpc, |
|
1069 | 1069 | b'xmlrpc+email': bzxmlrpcemail, |
|
1070 | 1070 | b'restapi': bzrestapi, |
|
1071 | 1071 | } |
|
1072 | 1072 | |
|
1073 | 1073 | def __init__(self, ui, repo): |
|
1074 | 1074 | self.ui = ui |
|
1075 | 1075 | self.repo = repo |
|
1076 | 1076 | |
|
1077 | 1077 | bzversion = self.ui.config(b'bugzilla', b'version') |
|
1078 | 1078 | try: |
|
1079 | 1079 | bzclass = bugzilla._versions[bzversion] |
|
1080 | 1080 | except KeyError: |
|
1081 | 1081 | raise error.Abort( |
|
1082 | 1082 | _(b'bugzilla version %s not supported') % bzversion |
|
1083 | 1083 | ) |
|
1084 | 1084 | self.bzdriver = bzclass(self.ui) |
|
1085 | 1085 | |
|
1086 | 1086 | self.bug_re = re.compile( |
|
1087 | 1087 | self.ui.config(b'bugzilla', b'regexp'), re.IGNORECASE |
|
1088 | 1088 | ) |
|
1089 | 1089 | self.fix_re = re.compile( |
|
1090 | 1090 | self.ui.config(b'bugzilla', b'fixregexp'), re.IGNORECASE |
|
1091 | 1091 | ) |
|
1092 | 1092 | self.split_re = re.compile(br'\D+') |
|
1093 | 1093 | |
|
1094 | 1094 | def find_bugs(self, ctx): |
|
1095 | 1095 | '''return bugs dictionary created from commit comment. |
|
1096 | 1096 | |
|
1097 | 1097 | Extract bug info from changeset comments. Filter out any that are |
|
1098 | 1098 | not known to Bugzilla, and any that already have a reference to |
|
1099 | 1099 | the given changeset in their comments. |
|
1100 | 1100 | ''' |
|
1101 | 1101 | start = 0 |
|
1102 | 1102 | hours = 0.0 |
|
1103 | 1103 | bugs = {} |
|
1104 | 1104 | bugmatch = self.bug_re.search(ctx.description(), start) |
|
1105 | 1105 | fixmatch = self.fix_re.search(ctx.description(), start) |
|
1106 | 1106 | while True: |
|
1107 | 1107 | bugattribs = {} |
|
1108 | 1108 | if not bugmatch and not fixmatch: |
|
1109 | 1109 | break |
|
1110 | 1110 | if not bugmatch: |
|
1111 | 1111 | m = fixmatch |
|
1112 | 1112 | elif not fixmatch: |
|
1113 | 1113 | m = bugmatch |
|
1114 | 1114 | else: |
|
1115 | 1115 | if bugmatch.start() < fixmatch.start(): |
|
1116 | 1116 | m = bugmatch |
|
1117 | 1117 | else: |
|
1118 | 1118 | m = fixmatch |
|
1119 | 1119 | start = m.end() |
|
1120 | 1120 | if m is bugmatch: |
|
1121 | 1121 | bugmatch = self.bug_re.search(ctx.description(), start) |
|
1122 | 1122 | if b'fix' in bugattribs: |
|
1123 | 1123 | del bugattribs[b'fix'] |
|
1124 | 1124 | else: |
|
1125 | 1125 | fixmatch = self.fix_re.search(ctx.description(), start) |
|
1126 | 1126 | bugattribs[b'fix'] = None |
|
1127 | 1127 | |
|
1128 | 1128 | try: |
|
1129 | 1129 | ids = m.group(b'ids') |
|
1130 | 1130 | except IndexError: |
|
1131 | 1131 | ids = m.group(1) |
|
1132 | 1132 | try: |
|
1133 | 1133 | hours = float(m.group(b'hours')) |
|
1134 | 1134 | bugattribs[b'hours'] = hours |
|
1135 | 1135 | except IndexError: |
|
1136 | 1136 | pass |
|
1137 | 1137 | except TypeError: |
|
1138 | 1138 | pass |
|
1139 | 1139 | except ValueError: |
|
1140 | 1140 | self.ui.status(_(b"%s: invalid hours\n") % m.group(b'hours')) |
|
1141 | 1141 | |
|
1142 | 1142 | for id in self.split_re.split(ids): |
|
1143 | 1143 | if not id: |
|
1144 | 1144 | continue |
|
1145 | 1145 | bugs[int(id)] = bugattribs |
|
1146 | 1146 | if bugs: |
|
1147 | 1147 | self.bzdriver.filter_real_bug_ids(bugs) |
|
1148 | 1148 | if bugs: |
|
1149 | 1149 | self.bzdriver.filter_cset_known_bug_ids(ctx.node(), bugs) |
|
1150 | 1150 | return bugs |
|
1151 | 1151 | |
|
1152 | 1152 | def update(self, bugid, newstate, ctx): |
|
1153 | 1153 | '''update bugzilla bug with reference to changeset.''' |
|
1154 | 1154 | |
|
1155 | 1155 | def webroot(root): |
|
1156 | 1156 | '''strip leading prefix of repo root and turn into |
|
1157 | 1157 | url-safe path.''' |
|
1158 | 1158 | count = int(self.ui.config(b'bugzilla', b'strip')) |
|
1159 | 1159 | root = util.pconvert(root) |
|
1160 | 1160 | while count > 0: |
|
1161 | 1161 | c = root.find(b'/') |
|
1162 | 1162 | if c == -1: |
|
1163 | 1163 | break |
|
1164 | 1164 | root = root[c + 1 :] |
|
1165 | 1165 | count -= 1 |
|
1166 | 1166 | return root |
|
1167 | 1167 | |
|
1168 | 1168 | mapfile = None |
|
1169 | 1169 | tmpl = self.ui.config(b'bugzilla', b'template') |
|
1170 | 1170 | if not tmpl: |
|
1171 | 1171 | mapfile = self.ui.config(b'bugzilla', b'style') |
|
1172 | 1172 | if not mapfile and not tmpl: |
|
1173 | 1173 | tmpl = _( |
|
1174 | 1174 | b'changeset {node|short} in repo {root} refers ' |
|
1175 | 1175 | b'to bug {bug}.\ndetails:\n\t{desc|tabindent}' |
|
1176 | 1176 | ) |
|
1177 | 1177 | spec = logcmdutil.templatespec(tmpl, mapfile) |
|
1178 | 1178 | t = logcmdutil.changesettemplater(self.ui, self.repo, spec) |
|
1179 | 1179 | self.ui.pushbuffer() |
|
1180 | 1180 | t.show( |
|
1181 | 1181 | ctx, |
|
1182 | 1182 | changes=ctx.changeset(), |
|
1183 | 1183 | bug=pycompat.bytestr(bugid), |
|
1184 | 1184 | hgweb=self.ui.config(b'web', b'baseurl'), |
|
1185 | 1185 | root=self.repo.root, |
|
1186 | 1186 | webroot=webroot(self.repo.root), |
|
1187 | 1187 | ) |
|
1188 | 1188 | data = self.ui.popbuffer() |
|
1189 | 1189 | self.bzdriver.updatebug( |
|
1190 | 1190 | bugid, newstate, data, stringutil.email(ctx.user()) |
|
1191 | 1191 | ) |
|
1192 | 1192 | |
|
1193 | 1193 | def notify(self, bugs, committer): |
|
1194 | 1194 | '''ensure Bugzilla users are notified of bug change.''' |
|
1195 | 1195 | self.bzdriver.notify(bugs, committer) |
|
1196 | 1196 | |
|
1197 | 1197 | |
|
1198 | 1198 | def hook(ui, repo, hooktype, node=None, **kwargs): |
|
1199 | 1199 | '''add comment to bugzilla for each changeset that refers to a |
|
1200 | 1200 | bugzilla bug id. only add a comment once per bug, so same change |
|
1201 | 1201 | seen multiple times does not fill bug with duplicate data.''' |
|
1202 | 1202 | if node is None: |
|
1203 | 1203 | raise error.Abort( |
|
1204 | 1204 | _(b'hook type %s does not pass a changeset id') % hooktype |
|
1205 | 1205 | ) |
|
1206 | 1206 | try: |
|
1207 | 1207 | bz = bugzilla(ui, repo) |
|
1208 | 1208 | ctx = repo[node] |
|
1209 | 1209 | bugs = bz.find_bugs(ctx) |
|
1210 | 1210 | if bugs: |
|
1211 | 1211 | for bug in bugs: |
|
1212 | 1212 | bz.update(bug, bugs[bug], ctx) |
|
1213 | 1213 | bz.notify(bugs, stringutil.email(ctx.user())) |
|
1214 | 1214 | except Exception as e: |
|
1215 | 1215 | raise error.Abort(_(b'Bugzilla error: %s') % e) |
@@ -1,89 +1,89 b'' | |||
|
1 | 1 | # commitextras.py |
|
2 | 2 | # |
|
3 | 3 | # Copyright 2013 Facebook, Inc. |
|
4 | 4 | # |
|
5 | 5 | # This software may be used and distributed according to the terms of the |
|
6 | 6 | # GNU General Public License version 2 or any later version. |
|
7 | 7 | |
|
8 | 8 | '''adds a new flag extras to commit (ADVANCED)''' |
|
9 | 9 | |
|
10 | 10 | from __future__ import absolute_import |
|
11 | 11 | |
|
12 | 12 | import re |
|
13 | 13 | |
|
14 | 14 | from mercurial.i18n import _ |
|
15 | 15 | from mercurial import ( |
|
16 | 16 | commands, |
|
17 | 17 | error, |
|
18 | 18 | extensions, |
|
19 | 19 | registrar, |
|
20 | 20 | util, |
|
21 | 21 | ) |
|
22 | 22 | |
|
23 | 23 | cmdtable = {} |
|
24 | 24 | command = registrar.command(cmdtable) |
|
25 | 25 | testedwith = b'ships-with-hg-core' |
|
26 | 26 | |
|
27 | 27 | usedinternally = { |
|
28 | 28 | b'amend_source', |
|
29 | 29 | b'branch', |
|
30 | 30 | b'close', |
|
31 | 31 | b'histedit_source', |
|
32 | 32 | b'topic', |
|
33 | 33 | b'rebase_source', |
|
34 | 34 | b'intermediate-source', |
|
35 | 35 | b'__touch-noise__', |
|
36 | 36 | b'source', |
|
37 | 37 | b'transplant_source', |
|
38 | 38 | } |
|
39 | 39 | |
|
40 | 40 | |
|
41 | 41 | def extsetup(ui): |
|
42 | 42 | entry = extensions.wrapcommand(commands.table, b'commit', _commit) |
|
43 | 43 | options = entry[1] |
|
44 | 44 | options.append( |
|
45 | 45 | ( |
|
46 | 46 | b'', |
|
47 | 47 | b'extra', |
|
48 | 48 | [], |
|
49 | 49 | _(b'set a changeset\'s extra values'), |
|
50 | 50 | _(b"KEY=VALUE"), |
|
51 | 51 | ) |
|
52 | 52 | ) |
|
53 | 53 | |
|
54 | 54 | |
|
55 | 55 | def _commit(orig, ui, repo, *pats, **opts): |
|
56 |    | if util.safehasattr(repo,

   | 56 | if util.safehasattr(repo, 'unfiltered'):
|
57 | 57 | repo = repo.unfiltered() |
|
58 | 58 | |
|
59 | 59 | class repoextra(repo.__class__): |
|
60 | 60 | def commit(self, *innerpats, **inneropts): |
|
61 | 61 | extras = opts.get(r'extra') |
|
62 | 62 | for raw in extras: |
|
63 | 63 | if b'=' not in raw: |
|
64 | 64 | msg = _( |
|
65 | 65 | b"unable to parse '%s', should follow " |
|
66 | 66 | b"KEY=VALUE format" |
|
67 | 67 | ) |
|
68 | 68 | raise error.Abort(msg % raw) |
|
69 | 69 | k, v = raw.split(b'=', 1) |
|
70 | 70 | if not k: |
|
71 | 71 | msg = _(b"unable to parse '%s', keys can't be empty") |
|
72 | 72 | raise error.Abort(msg % raw) |
|
73 | 73 | if re.search(br'[^\w-]', k): |
|
74 | 74 | msg = _( |
|
75 | 75 | b"keys can only contain ascii letters, digits," |
|
76 | 76 | b" '_' and '-'" |
|
77 | 77 | ) |
|
78 | 78 | raise error.Abort(msg) |
|
79 | 79 | if k in usedinternally: |
|
80 | 80 | msg = _( |
|
81 | 81 | b"key '%s' is used internally, can't be set " |
|
82 | 82 | b"manually" |
|
83 | 83 | ) |
|
84 | 84 | raise error.Abort(msg % k) |
|
85 | 85 | inneropts[r'extra'][k] = v |
|
86 | 86 | return super(repoextra, self).commit(*innerpats, **inneropts) |
|
87 | 87 | |
|
88 | 88 | repo.__class__ = repoextra |
|
89 | 89 | return orig(ui, repo, *pats, **opts) |
@@ -1,357 +1,357 b'' | |||
|
1 | 1 | # Copyright 2016-present Facebook. All Rights Reserved. |
|
2 | 2 | # |
|
3 | 3 | # commands: fastannotate commands |
|
4 | 4 | # |
|
5 | 5 | # This software may be used and distributed according to the terms of the |
|
6 | 6 | # GNU General Public License version 2 or any later version. |
|
7 | 7 | |
|
8 | 8 | from __future__ import absolute_import |
|
9 | 9 | |
|
10 | 10 | import os |
|
11 | 11 | |
|
12 | 12 | from mercurial.i18n import _ |
|
13 | 13 | from mercurial import ( |
|
14 | 14 | commands, |
|
15 | 15 | encoding, |
|
16 | 16 | error, |
|
17 | 17 | extensions, |
|
18 | 18 | patch, |
|
19 | 19 | pycompat, |
|
20 | 20 | registrar, |
|
21 | 21 | scmutil, |
|
22 | 22 | util, |
|
23 | 23 | ) |
|
24 | 24 | |
|
25 | 25 | from . import ( |
|
26 | 26 | context as facontext, |
|
27 | 27 | error as faerror, |
|
28 | 28 | formatter as faformatter, |
|
29 | 29 | ) |
|
30 | 30 | |
|
31 | 31 | cmdtable = {} |
|
32 | 32 | command = registrar.command(cmdtable) |
|
33 | 33 | |
|
34 | 34 | |
|
35 | 35 | def _matchpaths(repo, rev, pats, opts, aopts=facontext.defaultopts): |
|
36 | 36 | """generate paths matching given patterns""" |
|
37 | 37 | perfhack = repo.ui.configbool(b'fastannotate', b'perfhack') |
|
38 | 38 | |
|
39 | 39 | # disable perfhack if: |
|
40 | 40 | # a) any walkopt is used |
|
41 | 41 | # b) when pats are treated as plain file names, some of them do not have
|
42 | 42 | # corresponding linelog files |
|
43 | 43 | if perfhack: |
|
44 | 44 | # cwd relative to reporoot
|
45 | 45 | reporoot = os.path.dirname(repo.path) |
|
46 | 46 | reldir = os.path.relpath(encoding.getcwd(), reporoot) |
|
47 | 47 | if reldir == b'.': |
|
48 | 48 | reldir = b'' |
|
49 | 49 | if any(opts.get(o[1]) for o in commands.walkopts): # a) |
|
50 | 50 | perfhack = False |
|
51 | 51 | else: # b) |
|
52 | 52 | relpats = [ |
|
53 | 53 | os.path.relpath(p, reporoot) if os.path.isabs(p) else p |
|
54 | 54 | for p in pats |
|
55 | 55 | ] |
|
56 | 56 | # disable perfhack on '..' since it allows escaping from the repo |
|
57 | 57 | if any( |
|
58 | 58 | ( |
|
59 | 59 | b'..' in f |
|
60 | 60 | or not os.path.isfile( |
|
61 | 61 | facontext.pathhelper(repo, f, aopts).linelogpath |
|
62 | 62 | ) |
|
63 | 63 | ) |
|
64 | 64 | for f in relpats |
|
65 | 65 | ): |
|
66 | 66 | perfhack = False |
|
67 | 67 | |
|
68 | 68 | # perfhack: emit paths directly without checking the manifest

69 | 69 | # this can be incorrect if the rev does not have the file.
|
70 | 70 | if perfhack: |
|
71 | 71 | for p in relpats: |
|
72 | 72 | yield os.path.join(reldir, p) |
|
73 | 73 | else: |
|
74 | 74 | |
|
75 | 75 | def bad(x, y): |
|
76 | 76 | raise error.Abort(b"%s: %s" % (x, y)) |
|
77 | 77 | |
|
78 | 78 | ctx = scmutil.revsingle(repo, rev) |
|
79 | 79 | m = scmutil.match(ctx, pats, opts, badfn=bad) |
|
80 | 80 | for p in ctx.walk(m): |
|
81 | 81 | yield p |
|
82 | 82 | |
|
83 | 83 | |
|
84 | 84 | fastannotatecommandargs = { |
|
85 | 85 | r'options': [ |
|
86 | 86 | (b'r', b'rev', b'.', _(b'annotate the specified revision'), _(b'REV')), |
|
87 | 87 | (b'u', b'user', None, _(b'list the author (long with -v)')), |
|
88 | 88 | (b'f', b'file', None, _(b'list the filename')), |
|
89 | 89 | (b'd', b'date', None, _(b'list the date (short with -q)')), |
|
90 | 90 | (b'n', b'number', None, _(b'list the revision number (default)')), |
|
91 | 91 | (b'c', b'changeset', None, _(b'list the changeset')), |
|
92 | 92 | ( |
|
93 | 93 | b'l', |
|
94 | 94 | b'line-number', |
|
95 | 95 | None, |
|
96 | 96 | _(b'show line number at the first ' b'appearance'), |
|
97 | 97 | ), |
|
98 | 98 | ( |
|
99 | 99 | b'e', |
|
100 | 100 | b'deleted', |
|
101 | 101 | None, |
|
102 | 102 | _(b'show deleted lines (slow) (EXPERIMENTAL)'), |
|
103 | 103 | ), |
|
104 | 104 | ( |
|
105 | 105 | b'', |
|
106 | 106 | b'no-content', |
|
107 | 107 | None, |
|
108 | 108 | _(b'do not show file content (EXPERIMENTAL)'), |
|
109 | 109 | ), |
|
110 | 110 | (b'', b'no-follow', None, _(b"don't follow copies and renames")), |
|
111 | 111 | ( |
|
112 | 112 | b'', |
|
113 | 113 | b'linear', |
|
114 | 114 | None, |
|
115 | 115 | _( |
|
116 | 116 | b'enforce linear history, ignore second parent ' |
|
117 | 117 | b'of merges (EXPERIMENTAL)' |
|
118 | 118 | ), |
|
119 | 119 | ), |
|
120 | 120 | ( |
|
121 | 121 | b'', |
|
122 | 122 | b'long-hash', |
|
123 | 123 | None, |
|
124 | 124 | _(b'show long changeset hash (EXPERIMENTAL)'), |
|
125 | 125 | ), |
|
126 | 126 | ( |
|
127 | 127 | b'', |
|
128 | 128 | b'rebuild', |
|
129 | 129 | None, |
|
130 | 130 | _(b'rebuild cache even if it exists ' b'(EXPERIMENTAL)'), |
|
131 | 131 | ), |
|
132 | 132 | ] |
|
133 | 133 | + commands.diffwsopts |
|
134 | 134 | + commands.walkopts |
|
135 | 135 | + commands.formatteropts, |
|
136 | 136 | r'synopsis': _(b'[-r REV] [-f] [-a] [-u] [-d] [-n] [-c] [-l] FILE...'), |
|
137 | 137 | r'inferrepo': True, |
|
138 | 138 | } |
|
139 | 139 | |
|
140 | 140 | |
|
141 | 141 | def fastannotate(ui, repo, *pats, **opts): |
|
142 | 142 | """show changeset information by line for each file |
|
143 | 143 | |
|
144 | 144 | List changes in files, showing the revision id responsible for each line. |
|
145 | 145 | |
|
146 | 146 | This command is useful for discovering when a change was made and by whom. |
|
147 | 147 | |
|
148 | 148 | By default this command prints revision numbers. If you include --file, |
|
149 | 149 | --user, or --date, the revision number is suppressed unless you also |
|
150 | 150 | include --number. The default format can also be customized by setting |
|
151 | 151 | fastannotate.defaultformat. |
|
152 | 152 | |
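    For example (an illustrative configuration, not a shipped default)::

      [fastannotate]
      defaultformat = changeset, user
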
|
153 | 153 | Returns 0 on success. |
|
154 | 154 | |
|
155 | 155 | .. container:: verbose |
|
156 | 156 | |
|
157 | 157 | This command uses an implementation different from the vanilla annotate |
|
158 | 158 | command, which may produce slightly different (while still reasonable) |
|
159 | 159 | outputs for some cases. |
|
160 | 160 | |
|
161 | 161 | Unlike the vanilla annotate, fastannotate follows renames regardless of

162 | 162 | the existence of --file.
|
163 | 163 | |
|
164 | 164 | For the best performance when running on a full repo, use -c, -l, |
|
165 | 165 | avoid -u, -d, -n. Use --linear and --no-content to make it even faster. |
|
166 | 166 | |
|
167 | 167 | For the best performance when running on a shallow (remotefilelog) |
|
168 | 168 | repo, avoid --linear, --no-follow, or any diff options, as the server |

169 | 169 | won't be able to populate the annotate cache when non-default options |
|
170 | 170 | affecting results are used. |
|
171 | 171 | """ |
|
172 | 172 | if not pats: |
|
173 | 173 | raise error.Abort(_(b'at least one filename or pattern is required')) |
|
174 | 174 | |
|
175 | 175 | # performance hack: filtered repo can be slow. unfilter by default. |
|
176 | 176 | if ui.configbool(b'fastannotate', b'unfilteredrepo'): |
|
177 | 177 | repo = repo.unfiltered() |
|
178 | 178 | |
|
179 | 179 | opts = pycompat.byteskwargs(opts) |
|
180 | 180 | |
|
181 | 181 | rev = opts.get(b'rev', b'.') |
|
182 | 182 | rebuild = opts.get(b'rebuild', False) |
|
183 | 183 | |
|
184 | 184 | diffopts = patch.difffeatureopts( |
|
185 | 185 | ui, opts, section=b'annotate', whitespace=True |
|
186 | 186 | ) |
|
187 | 187 | aopts = facontext.annotateopts( |
|
188 | 188 | diffopts=diffopts, |
|
189 | 189 | followmerge=not opts.get(b'linear', False), |
|
190 | 190 | followrename=not opts.get(b'no_follow', False), |
|
191 | 191 | ) |
|
192 | 192 | |
|
193 | 193 | if not any( |
|
194 | 194 | opts.get(s) |
|
195 | 195 | for s in [b'user', b'date', b'file', b'number', b'changeset'] |
|
196 | 196 | ): |
|
197 | 197 | # default 'number' for compatibility. but fastannotate is more |
|
198 | 198 | # efficient with "changeset", "line-number" and "no-content". |
|
199 | 199 | for name in ui.configlist( |
|
200 | 200 | b'fastannotate', b'defaultformat', [b'number'] |
|
201 | 201 | ): |
|
202 | 202 | opts[name] = True |
|
203 | 203 | |
|
204 | 204 | ui.pager(b'fastannotate') |
|
205 | 205 | template = opts.get(b'template') |
|
206 | 206 | if template == b'json': |
|
207 | 207 | formatter = faformatter.jsonformatter(ui, repo, opts) |
|
208 | 208 | else: |
|
209 | 209 | formatter = faformatter.defaultformatter(ui, repo, opts) |
|
210 | 210 | showdeleted = opts.get(b'deleted', False) |
|
211 | 211 | showlines = not bool(opts.get(b'no_content')) |
|
212 | 212 | showpath = opts.get(b'file', False) |
|
213 | 213 | |
|
214 | 214 | # find the head of the main (master) branch |
|
215 | 215 | master = ui.config(b'fastannotate', b'mainbranch') or rev |
|
216 | 216 | |
|
217 | 217 | # paths will be used for prefetching and the real annotating |
|
218 | 218 | paths = list(_matchpaths(repo, rev, pats, opts, aopts)) |
|
219 | 219 | |
|
220 | 220 | # for client, prefetch from the server |
|
221 |     | if util.safehasattr(repo, b'prefetchfastannotate'): |

    | 221 | if util.safehasattr(repo, 'prefetchfastannotate'): |
|
222 | 222 | repo.prefetchfastannotate(paths) |
|
223 | 223 | |
|
224 | 224 | for path in paths: |
|
225 | 225 | result = lines = existinglines = None |
|
226 | 226 | while True: |
|
227 | 227 | try: |
|
228 | 228 | with facontext.annotatecontext(repo, path, aopts, rebuild) as a: |
|
229 | 229 | result = a.annotate( |
|
230 | 230 | rev, |
|
231 | 231 | master=master, |
|
232 | 232 | showpath=showpath, |
|
233 | 233 | showlines=(showlines and not showdeleted), |
|
234 | 234 | ) |
|
235 | 235 | if showdeleted: |
|
236 | 236 | existinglines = set((l[0], l[1]) for l in result) |
|
237 | 237 | result = a.annotatealllines( |
|
238 | 238 | rev, showpath=showpath, showlines=showlines |
|
239 | 239 | ) |
|
240 | 240 | break |
|
241 | 241 | except (faerror.CannotReuseError, faerror.CorruptedFileError): |
|
242 | 242 | # happens if master moves backwards, or the file was deleted |
|
243 | 243 | # and readded, or renamed to an existing name, or corrupted. |
|
244 | 244 | if rebuild: # give up since we have tried rebuild already |
|
245 | 245 | raise |
|
246 | 246 | else: # try a second time rebuilding the cache (slow) |
|
247 | 247 | rebuild = True |
|
248 | 248 | continue |
|
249 | 249 | |
|
250 | 250 | if showlines: |
|
251 | 251 | result, lines = result |
|
252 | 252 | |
|
253 | 253 | formatter.write(result, lines, existinglines=existinglines) |
|
254 | 254 | formatter.end() |
|
255 | 255 | |
|
256 | 256 | |
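The `while True` loop above retries the annotation exactly once after forcing a cache rebuild when the cached data cannot be reused. A minimal standalone sketch of that retry-once pattern, with hypothetical `compute`/`CacheError` names standing in for the fastannotate internals:

    class CacheError(Exception):
        """Stand-in for the CannotReuseError/CorruptedFileError pair above."""

    def annotate_with_cache(compute, rebuild=False):
        while True:
            try:
                # try the (possibly cached) computation first
                return compute(rebuild=rebuild)
            except CacheError:
                if rebuild:
                    # a rebuilt cache still failed: give up and propagate
                    raise
                # retry exactly once with a forced rebuild (slower)
                rebuild = True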
|
257 | 257 | _newopts = set() |
|
258 | 258 | _knownopts = { |
|
259 | 259 | opt[1].replace(b'-', b'_') |
|
260 | 260 | for opt in (fastannotatecommandargs[r'options'] + commands.globalopts) |
|
261 | 261 | } |
|
262 | 262 | |
|
263 | 263 | |
|
264 | 264 | def _annotatewrapper(orig, ui, repo, *pats, **opts): |
|
265 | 265 | """used by wrapdefault""" |
|
266 | 266 | # we need this hack until the obsstore has 0.0 seconds perf impact |
|
267 | 267 | if ui.configbool(b'fastannotate', b'unfilteredrepo'): |
|
268 | 268 | repo = repo.unfiltered() |
|
269 | 269 | |
|
270 | 270 | # treat the file as text (skip the isbinary check) |
|
271 | 271 | if ui.configbool(b'fastannotate', b'forcetext'): |
|
272 | 272 | opts[r'text'] = True |
|
273 | 273 | |
|
274 | 274 | # check if we need to do prefetch (client-side) |
|
275 | 275 | rev = opts.get(r'rev') |
|
276 |     | if util.safehasattr(repo, b'prefetchfastannotate') and rev is not None: |

    | 276 | if util.safehasattr(repo, 'prefetchfastannotate') and rev is not None: |
|
277 | 277 | paths = list(_matchpaths(repo, rev, pats, pycompat.byteskwargs(opts))) |
|
278 | 278 | repo.prefetchfastannotate(paths) |
|
279 | 279 | |
|
280 | 280 | return orig(ui, repo, *pats, **opts) |
|
281 | 281 | |
|
282 | 282 | |
|
283 | 283 | def registercommand(): |
|
284 | 284 | """register the fastannotate command""" |
|
285 | 285 | name = b'fastannotate|fastblame|fa' |
|
286 | 286 | command(name, helpbasic=True, **fastannotatecommandargs)(fastannotate) |
|
287 | 287 | |
|
288 | 288 | |
|
289 | 289 | def wrapdefault(): |
|
290 | 290 | """wrap the default annotate command, to be aware of the protocol""" |
|
291 | 291 | extensions.wrapcommand(commands.table, b'annotate', _annotatewrapper) |
|
292 | 292 | |
|
293 | 293 | |
|
294 | 294 | @command( |
|
295 | 295 | b'debugbuildannotatecache', |
|
296 | 296 | [(b'r', b'rev', b'', _(b'build up to the specific revision'), _(b'REV'))] |
|
297 | 297 | + commands.walkopts, |
|
298 | 298 | _(b'[-r REV] FILE...'), |
|
299 | 299 | ) |
|
300 | 300 | def debugbuildannotatecache(ui, repo, *pats, **opts): |
|
301 | 301 | """incrementally build fastannotate cache up to REV for specified files |
|
302 | 302 | |
|
303 | 303 | If REV is not specified, use the config 'fastannotate.mainbranch'. |
|
304 | 304 | |
|
305 | 305 | If fastannotate.client is True, download the annotate cache from the |
|
306 | 306 | server. Otherwise, build the annotate cache locally. |
|
307 | 307 | |
|
308 | 308 | The annotate cache will be built using the default diff and follow |
|
309 | 309 | options and lives in '.hg/fastannotate/default'. |
|
310 | 310 | """ |
|
311 | 311 | opts = pycompat.byteskwargs(opts) |
|
312 | 312 | rev = opts.get(b'REV') or ui.config(b'fastannotate', b'mainbranch') |
|
313 | 313 | if not rev: |
|
314 | 314 | raise error.Abort( |
|
315 | 315 | _(b'you need to provide a revision'), |
|
316 | 316 | hint=_(b'set fastannotate.mainbranch or use --rev'), |
|
317 | 317 | ) |
|
318 | 318 | if ui.configbool(b'fastannotate', b'unfilteredrepo'): |
|
319 | 319 | repo = repo.unfiltered() |
|
320 | 320 | ctx = scmutil.revsingle(repo, rev) |
|
321 | 321 | m = scmutil.match(ctx, pats, opts) |
|
322 | 322 | paths = list(ctx.walk(m)) |
|
323 |     | if util.safehasattr(repo, b'prefetchfastannotate'): |

    | 323 | if util.safehasattr(repo, 'prefetchfastannotate'): |
|
324 | 324 | # client |
|
325 | 325 | if opts.get(b'REV'): |
|
326 | 326 | raise error.Abort(_(b'--rev cannot be used for client')) |
|
327 | 327 | repo.prefetchfastannotate(paths) |
|
328 | 328 | else: |
|
329 | 329 | # server, or full repo |
|
330 | 330 | progress = ui.makeprogress(_(b'building'), total=len(paths)) |
|
331 | 331 | for i, path in enumerate(paths): |
|
332 | 332 | progress.update(i) |
|
333 | 333 | with facontext.annotatecontext(repo, path) as actx: |
|
334 | 334 | try: |
|
335 | 335 | if actx.isuptodate(rev): |
|
336 | 336 | continue |
|
337 | 337 | actx.annotate(rev, rev) |
|
338 | 338 | except (faerror.CannotReuseError, faerror.CorruptedFileError): |
|
339 | 339 | # the cache is broken (could happen with renaming so the |
|
340 | 340 | # file history gets invalidated). rebuild and try again. |
|
341 | 341 | ui.debug( |
|
342 | 342 | b'fastannotate: %s: rebuilding broken cache\n' % path |
|
343 | 343 | ) |
|
344 | 344 | actx.rebuild() |
|
345 | 345 | try: |
|
346 | 346 | actx.annotate(rev, rev) |
|
347 | 347 | except Exception as ex: |
|
348 | 348 | # possibly a bug, but should not stop us from building |
|
349 | 349 | # cache for other files. |
|
350 | 350 | ui.warn( |
|
351 | 351 | _( |
|
352 | 352 | b'fastannotate: %s: failed to ' |
|
353 | 353 | b'build cache: %r\n' |
|
354 | 354 | ) |
|
355 | 355 | % (path, ex) |
|
356 | 356 | ) |
|
357 | 357 | progress.complete() |
@@ -1,118 +1,118 b'' | |||
|
1 | 1 | # watchmanclient.py - Watchman client for the fsmonitor extension |
|
2 | 2 | # |
|
3 | 3 | # Copyright 2013-2016 Facebook, Inc. |
|
4 | 4 | # |
|
5 | 5 | # This software may be used and distributed according to the terms of the |
|
6 | 6 | # GNU General Public License version 2 or any later version. |
|
7 | 7 | |
|
8 | 8 | from __future__ import absolute_import |
|
9 | 9 | |
|
10 | 10 | import getpass |
|
11 | 11 | |
|
12 | 12 | from mercurial import util |
|
13 | 13 | |
|
14 | 14 | from . import pywatchman |
|
15 | 15 | |
|
16 | 16 | |
|
17 | 17 | class Unavailable(Exception): |
|
18 | 18 | def __init__(self, msg, warn=True, invalidate=False): |
|
19 | 19 | self.msg = msg |
|
20 | 20 | self.warn = warn |
|
21 | 21 | if self.msg == b'timed out waiting for response': |
|
22 | 22 | self.warn = False |
|
23 | 23 | self.invalidate = invalidate |
|
24 | 24 | |
|
25 | 25 | def __str__(self): |
|
26 | 26 | if self.warn: |
|
27 | 27 | return b'warning: Watchman unavailable: %s' % self.msg |
|
28 | 28 | else: |
|
29 | 29 | return b'Watchman unavailable: %s' % self.msg |
|
30 | 30 | |
|
31 | 31 | |
|
32 | 32 | class WatchmanNoRoot(Unavailable): |
|
33 | 33 | def __init__(self, root, msg): |
|
34 | 34 | self.root = root |
|
35 | 35 | super(WatchmanNoRoot, self).__init__(msg) |
|
36 | 36 | |
|
37 | 37 | |
|
38 | 38 | class client(object): |
|
39 | 39 | def __init__(self, ui, root, timeout=1.0): |
|
40 | 40 | err = None |
|
41 | 41 | if not self._user: |
|
42 | 42 | err = b"couldn't get user" |
|
43 | 43 | warn = True |
|
44 | 44 | if self._user in ui.configlist(b'fsmonitor', b'blacklistusers'): |
|
45 | 45 | err = b'user %s in blacklist' % self._user |
|
46 | 46 | warn = False |
|
47 | 47 | |
|
48 | 48 | if err: |
|
49 | 49 | raise Unavailable(err, warn) |
|
50 | 50 | |
|
51 | 51 | self._timeout = timeout |
|
52 | 52 | self._watchmanclient = None |
|
53 | 53 | self._root = root |
|
54 | 54 | self._ui = ui |
|
55 | 55 | self._firsttime = True |
|
56 | 56 | |
|
57 | 57 | def settimeout(self, timeout): |
|
58 | 58 | self._timeout = timeout |
|
59 | 59 | if self._watchmanclient is not None: |
|
60 | 60 | self._watchmanclient.setTimeout(timeout) |
|
61 | 61 | |
|
62 | 62 | def getcurrentclock(self): |
|
63 | 63 | result = self.command(b'clock') |
|
64 |     | if not util.safehasattr(result, b'clock'): |

    | 64 | if not util.safehasattr(result, 'clock'): |
|
65 | 65 | raise Unavailable( |
|
66 | 66 | b'clock result is missing clock value', invalidate=True |
|
67 | 67 | ) |
|
68 | 68 | return result.clock |
|
69 | 69 | |
|
70 | 70 | def clearconnection(self): |
|
71 | 71 | self._watchmanclient = None |
|
72 | 72 | |
|
73 | 73 | def available(self): |
|
74 | 74 | return self._watchmanclient is not None or self._firsttime |
|
75 | 75 | |
|
76 | 76 | @util.propertycache |
|
77 | 77 | def _user(self): |
|
78 | 78 | try: |
|
79 | 79 | return getpass.getuser() |
|
80 | 80 | except KeyError: |
|
81 | 81 | # couldn't figure out our user |
|
82 | 82 | return None |
|
83 | 83 | |
|
84 | 84 | def _command(self, *args): |
|
85 | 85 | watchmanargs = (args[0], self._root) + args[1:] |
|
86 | 86 | try: |
|
87 | 87 | if self._watchmanclient is None: |
|
88 | 88 | self._firsttime = False |
|
89 | 89 | watchman_exe = self._ui.configpath( |
|
90 | 90 | b'fsmonitor', b'watchman_exe' |
|
91 | 91 | ) |
|
92 | 92 | self._watchmanclient = pywatchman.client( |
|
93 | 93 | timeout=self._timeout, |
|
94 | 94 | useImmutableBser=True, |
|
95 | 95 | watchman_exe=watchman_exe, |
|
96 | 96 | ) |
|
97 | 97 | return self._watchmanclient.query(*watchmanargs) |
|
98 | 98 | except pywatchman.CommandError as ex: |
|
99 | 99 | if b'unable to resolve root' in ex.msg: |
|
100 | 100 | raise WatchmanNoRoot(self._root, ex.msg) |
|
101 | 101 | raise Unavailable(ex.msg) |
|
102 | 102 | except pywatchman.WatchmanError as ex: |
|
103 | 103 | raise Unavailable(str(ex)) |
|
104 | 104 | |
|
105 | 105 | def command(self, *args): |
|
106 | 106 | try: |
|
107 | 107 | try: |
|
108 | 108 | return self._command(*args) |
|
109 | 109 | except WatchmanNoRoot: |
|
110 | 110 | # this 'watch' command can also raise a WatchmanNoRoot if |
|
111 | 111 | # watchman refuses to accept this root |
|
112 | 112 | self._command(b'watch') |
|
113 | 113 | return self._command(*args) |
|
114 | 114 | except Unavailable: |
|
115 | 115 | # this is in an outer scope to catch Unavailable from any of the |
|
116 | 116 | # above _command calls |
|
117 | 117 | self._watchmanclient = None |
|
118 | 118 | raise |
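For orientation, a hedged sketch of how fsmonitor code might drive the wrapper above; the module path `hgext.fsmonitor.watchmanclient` and the `currentclock` helper are assumptions, only the `client`/`Unavailable` classes come from the file itself:

    from hgext.fsmonitor import watchmanclient  # assumed module location

    def currentclock(ui, repo):
        """Return the watchman clock for the working copy root, or None."""
        try:
            cli = watchmanclient.client(ui, repo.root, timeout=0.1)
            # command() issues 'watch' and retries once if the root is not
            # yet watched (see client.command() above)
            return cli.getcurrentclock()
        except watchmanclient.Unavailable:
            # watchman missing, timed out, or the user is blacklisted
            return None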
@@ -1,604 +1,604 b'' | |||
|
1 | 1 | # journal.py |
|
2 | 2 | # |
|
3 | 3 | # Copyright 2014-2016 Facebook, Inc. |
|
4 | 4 | # |
|
5 | 5 | # This software may be used and distributed according to the terms of the |
|
6 | 6 | # GNU General Public License version 2 or any later version. |
|
7 | 7 | """track previous positions of bookmarks (EXPERIMENTAL) |
|
8 | 8 | |
|
9 | 9 | This extension adds a new command: `hg journal`, which shows you where |
|
10 | 10 | bookmarks were previously located. |
|
11 | 11 | |
|
12 | 12 | """ |
|
13 | 13 | |
|
14 | 14 | from __future__ import absolute_import |
|
15 | 15 | |
|
16 | 16 | import collections |
|
17 | 17 | import errno |
|
18 | 18 | import os |
|
19 | 19 | import weakref |
|
20 | 20 | |
|
21 | 21 | from mercurial.i18n import _ |
|
22 | 22 | |
|
23 | 23 | from mercurial import ( |
|
24 | 24 | bookmarks, |
|
25 | 25 | cmdutil, |
|
26 | 26 | dispatch, |
|
27 | 27 | encoding, |
|
28 | 28 | error, |
|
29 | 29 | extensions, |
|
30 | 30 | hg, |
|
31 | 31 | localrepo, |
|
32 | 32 | lock, |
|
33 | 33 | logcmdutil, |
|
34 | 34 | node, |
|
35 | 35 | pycompat, |
|
36 | 36 | registrar, |
|
37 | 37 | util, |
|
38 | 38 | ) |
|
39 | 39 | from mercurial.utils import ( |
|
40 | 40 | dateutil, |
|
41 | 41 | procutil, |
|
42 | 42 | stringutil, |
|
43 | 43 | ) |
|
44 | 44 | |
|
45 | 45 | cmdtable = {} |
|
46 | 46 | command = registrar.command(cmdtable) |
|
47 | 47 | |
|
48 | 48 | # Note for extension authors: ONLY specify testedwith = 'ships-with-hg-core' for |
|
49 | 49 | # extensions which SHIP WITH MERCURIAL. Non-mainline extensions should |
|
50 | 50 | # be specifying the version(s) of Mercurial they are tested with, or |
|
51 | 51 | # leave the attribute unspecified. |
|
52 | 52 | testedwith = b'ships-with-hg-core' |
|
53 | 53 | |
|
54 | 54 | # storage format version; increment when the format changes |
|
55 | 55 | storageversion = 0 |
|
56 | 56 | |
|
57 | 57 | # namespaces |
|
58 | 58 | bookmarktype = b'bookmark' |
|
59 | 59 | wdirparenttype = b'wdirparent' |
|
60 | 60 | # In a shared repository, what shared feature name is used |
|
61 | 61 | # to indicate this namespace is shared with the source? |
|
62 | 62 | sharednamespaces = { |
|
63 | 63 | bookmarktype: hg.sharedbookmarks, |
|
64 | 64 | } |
|
65 | 65 | |
|
66 | 66 | # Journal recording, register hooks and storage object |
|
67 | 67 | def extsetup(ui): |
|
68 | 68 | extensions.wrapfunction(dispatch, b'runcommand', runcommand) |
|
69 | 69 | extensions.wrapfunction(bookmarks.bmstore, b'_write', recordbookmarks) |
|
70 | 70 | extensions.wrapfilecache( |
|
71 | 71 | localrepo.localrepository, b'dirstate', wrapdirstate |
|
72 | 72 | ) |
|
73 | 73 | extensions.wrapfunction(hg, b'postshare', wrappostshare) |
|
74 | 74 | extensions.wrapfunction(hg, b'copystore', unsharejournal) |
|
75 | 75 | |
|
76 | 76 | |
|
77 | 77 | def reposetup(ui, repo): |
|
78 | 78 | if repo.local(): |
|
79 | 79 | repo.journal = journalstorage(repo) |
|
80 | 80 | repo._wlockfreeprefix.add(b'namejournal') |
|
81 | 81 | |
|
82 | 82 | dirstate, cached = localrepo.isfilecached(repo, b'dirstate') |
|
83 | 83 | if cached: |
|
84 | 84 | # already instantiated dirstate isn't yet marked as |
|
85 | 85 | # "journal"-ing, even though repo.dirstate() was already |
|
86 | 86 | # wrapped by own wrapdirstate() |
|
87 | 87 | _setupdirstate(repo, dirstate) |
|
88 | 88 | |
|
89 | 89 | |
|
90 | 90 | def runcommand(orig, lui, repo, cmd, fullargs, *args): |
|
91 | 91 | """Track the command line options for recording in the journal""" |
|
92 | 92 | journalstorage.recordcommand(*fullargs) |
|
93 | 93 | return orig(lui, repo, cmd, fullargs, *args) |
|
94 | 94 | |
|
95 | 95 | |
|
96 | 96 | def _setupdirstate(repo, dirstate): |
|
97 | 97 | dirstate.journalstorage = repo.journal |
|
98 | 98 | dirstate.addparentchangecallback(b'journal', recorddirstateparents) |
|
99 | 99 | |
|
100 | 100 | |
|
101 | 101 | # hooks to record dirstate changes |
|
102 | 102 | def wrapdirstate(orig, repo): |
|
103 | 103 | """Make journal storage available to the dirstate object""" |
|
104 | 104 | dirstate = orig(repo) |
|
105 |     | if util.safehasattr(repo, b'journal'): |

    | 105 | if util.safehasattr(repo, 'journal'): |
|
106 | 106 | _setupdirstate(repo, dirstate) |
|
107 | 107 | return dirstate |
|
108 | 108 | |
|
109 | 109 | |
|
110 | 110 | def recorddirstateparents(dirstate, old, new): |
|
111 | 111 | """Records all dirstate parent changes in the journal.""" |
|
112 | 112 | old = list(old) |
|
113 | 113 | new = list(new) |
|
114 |     | if util.safehasattr(dirstate, b'journalstorage'): |

    | 114 | if util.safehasattr(dirstate, 'journalstorage'): |
|
115 | 115 | # only record two hashes if there was a merge |
|
116 | 116 | oldhashes = old[:1] if old[1] == node.nullid else old |
|
117 | 117 | newhashes = new[:1] if new[1] == node.nullid else new |
|
118 | 118 | dirstate.journalstorage.record( |
|
119 | 119 | wdirparenttype, b'.', oldhashes, newhashes |
|
120 | 120 | ) |
|
121 | 121 | |
|
122 | 122 | |
|
123 | 123 | # hooks to record bookmark changes (both local and remote) |
|
124 | 124 | def recordbookmarks(orig, store, fp): |
|
125 | 125 | """Records all bookmark changes in the journal.""" |
|
126 | 126 | repo = store._repo |
|
127 |     | if util.safehasattr(repo, b'journal'): |

    | 127 | if util.safehasattr(repo, 'journal'): |
|
128 | 128 | oldmarks = bookmarks.bmstore(repo) |
|
129 | 129 | for mark, value in pycompat.iteritems(store): |
|
130 | 130 | oldvalue = oldmarks.get(mark, node.nullid) |
|
131 | 131 | if value != oldvalue: |
|
132 | 132 | repo.journal.record(bookmarktype, mark, oldvalue, value) |
|
133 | 133 | return orig(store, fp) |
|
134 | 134 | |
|
135 | 135 | |
|
136 | 136 | # shared repository support |
|
137 | 137 | def _readsharedfeatures(repo): |
|
138 | 138 | """A set of shared features for this repository""" |
|
139 | 139 | try: |
|
140 | 140 | return set(repo.vfs.read(b'shared').splitlines()) |
|
141 | 141 | except IOError as inst: |
|
142 | 142 | if inst.errno != errno.ENOENT: |
|
143 | 143 | raise |
|
144 | 144 | return set() |
|
145 | 145 | |
|
146 | 146 | |
|
147 | 147 | def _mergeentriesiter(*iterables, **kwargs): |
|
148 | 148 | """Given a set of sorted iterables, yield the next entry in merged order |
|
149 | 149 | |
|
150 | 150 | Note that by default entries go from most recent to oldest. |
|
151 | 151 | """ |
|
152 | 152 | order = kwargs.pop(r'order', max) |
|
153 | 153 | iterables = [iter(it) for it in iterables] |
|
154 | 154 | # this tracks still active iterables; iterables are deleted as they are |
|
155 | 155 | # exhausted, which is why this is a dictionary and why each entry also |
|
156 | 156 | # stores the key. Entries are mutable so we can store the next value each |
|
157 | 157 | # time. |
|
158 | 158 | iterable_map = {} |
|
159 | 159 | for key, it in enumerate(iterables): |
|
160 | 160 | try: |
|
161 | 161 | iterable_map[key] = [next(it), key, it] |
|
162 | 162 | except StopIteration: |
|
163 | 163 | # empty entry, can be ignored |
|
164 | 164 | pass |
|
165 | 165 | |
|
166 | 166 | while iterable_map: |
|
167 | 167 | value, key, it = order(pycompat.itervalues(iterable_map)) |
|
168 | 168 | yield value |
|
169 | 169 | try: |
|
170 | 170 | iterable_map[key][0] = next(it) |
|
171 | 171 | except StopIteration: |
|
172 | 172 | # this iterable is empty, remove it from consideration |
|
173 | 173 | del iterable_map[key] |
|
174 | 174 | |
|
175 | 175 | |
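_mergeentriesiter() is, in spirit, a heap merge over streams that are already sorted newest first. The same effect on plain data can be had from the standard library; the tuples below are illustrative, not real journal entries:

    import heapq

    # each input is already sorted newest first (descending timestamps)
    local = [(30, 'local c'), (20, 'local b'), (5, 'local a')]
    shared = [(25, 'shared y'), (10, 'shared x')]

    # reverse=True makes heapq.merge take the largest head each time,
    # mirroring the default order=max used above
    merged = list(heapq.merge(local, shared, reverse=True))
    # -> [(30, ...), (25, ...), (20, ...), (10, ...), (5, ...)]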
|
176 | 176 | def wrappostshare(orig, sourcerepo, destrepo, **kwargs): |
|
177 | 177 | """Mark this shared working copy as sharing journal information""" |
|
178 | 178 | with destrepo.wlock(): |
|
179 | 179 | orig(sourcerepo, destrepo, **kwargs) |
|
180 | 180 | with destrepo.vfs(b'shared', b'a') as fp: |
|
181 | 181 | fp.write(b'journal\n') |
|
182 | 182 | |
|
183 | 183 | |
|
184 | 184 | def unsharejournal(orig, ui, repo, repopath): |
|
185 | 185 | """Copy shared journal entries into this repo when unsharing""" |
|
186 | 186 | if ( |
|
187 | 187 | repo.path == repopath |
|
188 | 188 | and repo.shared() |
|
189 |     | and util.safehasattr(repo, b'journal') |

    | 189 | and util.safehasattr(repo, 'journal') |
|
190 | 190 | ): |
|
191 | 191 | sharedrepo = hg.sharedreposource(repo) |
|
192 | 192 | sharedfeatures = _readsharedfeatures(repo) |
|
193 | 193 | if sharedrepo and sharedfeatures > {b'journal'}: |
|
194 | 194 | # there is a shared repository and there are shared journal entries |
|
195 | 195 | # to copy. move shared date over from source to destination but |
|
196 | 196 | # move the local file first |
|
197 | 197 | if repo.vfs.exists(b'namejournal'): |
|
198 | 198 | journalpath = repo.vfs.join(b'namejournal') |
|
199 | 199 | util.rename(journalpath, journalpath + b'.bak') |
|
200 | 200 | storage = repo.journal |
|
201 | 201 | local = storage._open( |
|
202 | 202 | repo.vfs, filename=b'namejournal.bak', _newestfirst=False |
|
203 | 203 | ) |
|
204 | 204 | shared = ( |
|
205 | 205 | e |
|
206 | 206 | for e in storage._open(sharedrepo.vfs, _newestfirst=False) |
|
207 | 207 | if sharednamespaces.get(e.namespace) in sharedfeatures |
|
208 | 208 | ) |
|
209 | 209 | for entry in _mergeentriesiter(local, shared, order=min): |
|
210 | 210 | storage._write(repo.vfs, entry) |
|
211 | 211 | |
|
212 | 212 | return orig(ui, repo, repopath) |
|
213 | 213 | |
|
214 | 214 | |
|
215 | 215 | class journalentry( |
|
216 | 216 | collections.namedtuple( |
|
217 | 217 | r'journalentry', |
|
218 | 218 | r'timestamp user command namespace name oldhashes newhashes', |
|
219 | 219 | ) |
|
220 | 220 | ): |
|
221 | 221 | """Individual journal entry |
|
222 | 222 | |
|
223 | 223 | * timestamp: a mercurial (time, timezone) tuple |
|
224 | 224 | * user: the username that ran the command |
|
225 | 225 | * namespace: the entry namespace, an opaque string |
|
226 | 226 | * name: the name of the changed item, opaque string with meaning in the |
|
227 | 227 | namespace |
|
228 | 228 | * command: the hg command that triggered this record |
|
229 | 229 | * oldhashes: a tuple of one or more binary hashes for the old location |
|
230 | 230 | * newhashes: a tuple of one or more binary hashes for the new location |
|
231 | 231 | |
|
232 | 232 | Handles serialisation from and to the storage format. Fields are |
|
233 | 233 | separated by newlines, hashes are written out in hex separated by commas, |
|
234 | 234 | timestamp and timezone are separated by a space. |
|
235 | 235 | |
|
236 | 236 | """ |
|
237 | 237 | |
|
238 | 238 | @classmethod |
|
239 | 239 | def fromstorage(cls, line): |
|
240 | 240 | ( |
|
241 | 241 | time, |
|
242 | 242 | user, |
|
243 | 243 | command, |
|
244 | 244 | namespace, |
|
245 | 245 | name, |
|
246 | 246 | oldhashes, |
|
247 | 247 | newhashes, |
|
248 | 248 | ) = line.split(b'\n') |
|
249 | 249 | timestamp, tz = time.split() |
|
250 | 250 | timestamp, tz = float(timestamp), int(tz) |
|
251 | 251 | oldhashes = tuple(node.bin(hash) for hash in oldhashes.split(b',')) |
|
252 | 252 | newhashes = tuple(node.bin(hash) for hash in newhashes.split(b',')) |
|
253 | 253 | return cls( |
|
254 | 254 | (timestamp, tz), |
|
255 | 255 | user, |
|
256 | 256 | command, |
|
257 | 257 | namespace, |
|
258 | 258 | name, |
|
259 | 259 | oldhashes, |
|
260 | 260 | newhashes, |
|
261 | 261 | ) |
|
262 | 262 | |
|
263 | 263 | def __bytes__(self): |
|
264 | 264 | """bytes representation for storage""" |
|
265 | 265 | time = b' '.join(map(pycompat.bytestr, self.timestamp)) |
|
266 | 266 | oldhashes = b','.join([node.hex(hash) for hash in self.oldhashes]) |
|
267 | 267 | newhashes = b','.join([node.hex(hash) for hash in self.newhashes]) |
|
268 | 268 | return b'\n'.join( |
|
269 | 269 | ( |
|
270 | 270 | time, |
|
271 | 271 | self.user, |
|
272 | 272 | self.command, |
|
273 | 273 | self.namespace, |
|
274 | 274 | self.name, |
|
275 | 275 | oldhashes, |
|
276 | 276 | newhashes, |
|
277 | 277 | ) |
|
278 | 278 | ) |
|
279 | 279 | |
|
280 | 280 | __str__ = encoding.strmethod(__bytes__) |
|
281 | 281 | |
|
282 | 282 | |
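The journalentry docstring pins down the record layout: seven newline-separated fields, hashes as comma-separated hex, and the timestamp stored as "seconds timezone". A small round-trip of that layout in plain Python (dummy values, no mercurial helpers):

    import binascii

    def parse_entry(record):
        """Split one journal record into its seven documented fields."""
        time, user, command, namespace, name, oldhashes, newhashes = (
            record.split(b'\n')
        )
        timestamp, tz = time.split()
        return {
            'timestamp': (float(timestamp), int(tz)),
            'user': user,
            'command': command,
            'namespace': namespace,
            'name': name,
            'oldhashes': tuple(binascii.unhexlify(h) for h in oldhashes.split(b',')),
            'newhashes': tuple(binascii.unhexlify(h) for h in newhashes.split(b',')),
        }

    record = b'\n'.join([
        b'1581000000.0 0',    # timestamp and timezone offset
        b'alice',             # user
        b'commit --amend',    # command
        b'bookmark',          # namespace
        b'feature',           # name
        b'00' * 20,           # old hash(es), hex, comma-separated
        b'ff' * 20,           # new hash(es)
    ])
    fields = parse_entry(record)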
|
283 | 283 | class journalstorage(object): |
|
284 | 284 | """Storage for journal entries |
|
285 | 285 | |
|
286 | 286 | Entries are divided over two files; one with entries that pertain to the |
|
287 | 287 | local working copy *only*, and one with entries that are shared across |
|
288 | 288 | multiple working copies when shared using the share extension. |
|
289 | 289 | |
|
290 | 290 | Entries are stored with NUL bytes as separators. See the journalentry |
|
291 | 291 | class for the per-entry structure. |
|
292 | 292 | |
|
293 | 293 | The file format starts with an integer version, delimited by a NUL. |
|
294 | 294 | |
|
295 | 295 | This storage uses a dedicated lock; this makes it easier to avoid issues |
|
296 | 296 | with adding entries that are added when the regular wlock is unlocked (e.g. |
|
297 | 297 | the dirstate). |
|
298 | 298 | |
|
299 | 299 | """ |
|
300 | 300 | |
|
301 | 301 | _currentcommand = () |
|
302 | 302 | _lockref = None |
|
303 | 303 | |
|
304 | 304 | def __init__(self, repo): |
|
305 | 305 | self.user = procutil.getuser() |
|
306 | 306 | self.ui = repo.ui |
|
307 | 307 | self.vfs = repo.vfs |
|
308 | 308 | |
|
309 | 309 | # is this working copy using a shared storage? |
|
310 | 310 | self.sharedfeatures = self.sharedvfs = None |
|
311 | 311 | if repo.shared(): |
|
312 | 312 | features = _readsharedfeatures(repo) |
|
313 | 313 | sharedrepo = hg.sharedreposource(repo) |
|
314 | 314 | if sharedrepo is not None and b'journal' in features: |
|
315 | 315 | self.sharedvfs = sharedrepo.vfs |
|
316 | 316 | self.sharedfeatures = features |
|
317 | 317 | |
|
318 | 318 | # track the current command for recording in journal entries |
|
319 | 319 | @property |
|
320 | 320 | def command(self): |
|
321 | 321 | commandstr = b' '.join( |
|
322 | 322 | map(procutil.shellquote, journalstorage._currentcommand) |
|
323 | 323 | ) |
|
324 | 324 | if b'\n' in commandstr: |
|
325 | 325 | # truncate multi-line commands |
|
326 | 326 | commandstr = commandstr.partition(b'\n')[0] + b' ...' |
|
327 | 327 | return commandstr |
|
328 | 328 | |
|
329 | 329 | @classmethod |
|
330 | 330 | def recordcommand(cls, *fullargs): |
|
331 | 331 | """Set the current hg arguments, stored with recorded entries""" |
|
332 | 332 | # Set the current command on the class because we may have started |
|
333 | 333 | # with a non-local repo (cloning for example). |
|
334 | 334 | cls._currentcommand = fullargs |
|
335 | 335 | |
|
336 | 336 | def _currentlock(self, lockref): |
|
337 | 337 | """Returns the lock if it's held, or None if it's not. |
|
338 | 338 | |
|
339 | 339 | (This is copied from the localrepo class) |
|
340 | 340 | """ |
|
341 | 341 | if lockref is None: |
|
342 | 342 | return None |
|
343 | 343 | l = lockref() |
|
344 | 344 | if l is None or not l.held: |
|
345 | 345 | return None |
|
346 | 346 | return l |
|
347 | 347 | |
|
348 | 348 | def jlock(self, vfs): |
|
349 | 349 | """Create a lock for the journal file""" |
|
350 | 350 | if self._currentlock(self._lockref) is not None: |
|
351 | 351 | raise error.Abort(_(b'journal lock does not support nesting')) |
|
352 | 352 | desc = _(b'journal of %s') % vfs.base |
|
353 | 353 | try: |
|
354 | 354 | l = lock.lock(vfs, b'namejournal.lock', 0, desc=desc) |
|
355 | 355 | except error.LockHeld as inst: |
|
356 | 356 | self.ui.warn( |
|
357 | 357 | _(b"waiting for lock on %s held by %r\n") % (desc, inst.locker) |
|
358 | 358 | ) |
|
359 | 359 | # default to 600 seconds timeout |
|
360 | 360 | l = lock.lock( |
|
361 | 361 | vfs, |
|
362 | 362 | b'namejournal.lock', |
|
363 | 363 | self.ui.configint(b"ui", b"timeout"), |
|
364 | 364 | desc=desc, |
|
365 | 365 | ) |
|
366 | 366 | self.ui.warn(_(b"got lock after %s seconds\n") % l.delay) |
|
367 | 367 | self._lockref = weakref.ref(l) |
|
368 | 368 | return l |
|
369 | 369 | |
|
370 | 370 | def record(self, namespace, name, oldhashes, newhashes): |
|
371 | 371 | """Record a new journal entry |
|
372 | 372 | |
|
373 | 373 | * namespace: an opaque string; this can be used to filter on the type |
|
374 | 374 | of recorded entries. |
|
375 | 375 | * name: the name defining this entry; for bookmarks, this is the |
|
376 | 376 | bookmark name. Can be filtered on when retrieving entries. |
|
377 | 377 | * oldhashes and newhashes: each a single binary hash, or a list of |
|
378 | 378 | binary hashes. These represent the old and new position of the named |
|
379 | 379 | item. |
|
380 | 380 | |
|
381 | 381 | """ |
|
382 | 382 | if not isinstance(oldhashes, list): |
|
383 | 383 | oldhashes = [oldhashes] |
|
384 | 384 | if not isinstance(newhashes, list): |
|
385 | 385 | newhashes = [newhashes] |
|
386 | 386 | |
|
387 | 387 | entry = journalentry( |
|
388 | 388 | dateutil.makedate(), |
|
389 | 389 | self.user, |
|
390 | 390 | self.command, |
|
391 | 391 | namespace, |
|
392 | 392 | name, |
|
393 | 393 | oldhashes, |
|
394 | 394 | newhashes, |
|
395 | 395 | ) |
|
396 | 396 | |
|
397 | 397 | vfs = self.vfs |
|
398 | 398 | if self.sharedvfs is not None: |
|
399 | 399 | # write to the shared repository if this feature is being |
|
400 | 400 | # shared between working copies. |
|
401 | 401 | if sharednamespaces.get(namespace) in self.sharedfeatures: |
|
402 | 402 | vfs = self.sharedvfs |
|
403 | 403 | |
|
404 | 404 | self._write(vfs, entry) |
|
405 | 405 | |
|
406 | 406 | def _write(self, vfs, entry): |
|
407 | 407 | with self.jlock(vfs): |
|
408 | 408 | # open file in append mode to ensure it is created if missing |
|
409 | 409 | with vfs(b'namejournal', mode=b'a+b') as f: |
|
410 | 410 | f.seek(0, os.SEEK_SET) |
|
411 | 411 | # Read just enough bytes to get a version number (up to 2 |
|
412 | 412 | # digits plus separator) |
|
413 | 413 | version = f.read(3).partition(b'\0')[0] |
|
414 | 414 | if version and version != b"%d" % storageversion: |
|
415 | 415 | # different version of the storage. Exit early (and not |
|
416 | 416 | # write anything) if this is not a version we can handle or |
|
417 | 417 | # the file is corrupt. In future, perhaps rotate the file |
|
418 | 418 | # instead? |
|
419 | 419 | self.ui.warn( |
|
420 | 420 | _(b"unsupported journal file version '%s'\n") % version |
|
421 | 421 | ) |
|
422 | 422 | return |
|
423 | 423 | if not version: |
|
424 | 424 | # empty file, write version first |
|
425 | 425 | f.write((b"%d" % storageversion) + b'\0') |
|
426 | 426 | f.seek(0, os.SEEK_END) |
|
427 | 427 | f.write(bytes(entry) + b'\0') |
|
428 | 428 | |
|
429 | 429 | def filtered(self, namespace=None, name=None): |
|
430 | 430 | """Yield all journal entries with the given namespace or name |
|
431 | 431 | |
|
432 | 432 | Both the namespace and the name are optional; if neither is given all |
|
433 | 433 | entries in the journal are produced. |
|
434 | 434 | |
|
435 | 435 | Matching supports regular expressions by using the `re:` prefix |
|
436 | 436 | (use `literal:` to match names or namespaces that start with `re:`) |
|
437 | 437 | |
|
438 | 438 | """ |
|
439 | 439 | if namespace is not None: |
|
440 | 440 | namespace = stringutil.stringmatcher(namespace)[-1] |
|
441 | 441 | if name is not None: |
|
442 | 442 | name = stringutil.stringmatcher(name)[-1] |
|
443 | 443 | for entry in self: |
|
444 | 444 | if namespace is not None and not namespace(entry.namespace): |
|
445 | 445 | continue |
|
446 | 446 | if name is not None and not name(entry.name): |
|
447 | 447 | continue |
|
448 | 448 | yield entry |
|
449 | 449 | |
|
450 | 450 | def __iter__(self): |
|
451 | 451 | """Iterate over the storage |
|
452 | 452 | |
|
453 | 453 | Yields journalentry instances for each contained journal record. |
|
454 | 454 | |
|
455 | 455 | """ |
|
456 | 456 | local = self._open(self.vfs) |
|
457 | 457 | |
|
458 | 458 | if self.sharedvfs is None: |
|
459 | 459 | return local |
|
460 | 460 | |
|
461 | 461 | # iterate over both local and shared entries, but only those |
|
462 | 462 | # shared entries that are among the currently shared features |
|
463 | 463 | shared = ( |
|
464 | 464 | e |
|
465 | 465 | for e in self._open(self.sharedvfs) |
|
466 | 466 | if sharednamespaces.get(e.namespace) in self.sharedfeatures |
|
467 | 467 | ) |
|
468 | 468 | return _mergeentriesiter(local, shared) |
|
469 | 469 | |
|
470 | 470 | def _open(self, vfs, filename=b'namejournal', _newestfirst=True): |
|
471 | 471 | if not vfs.exists(filename): |
|
472 | 472 | return |
|
473 | 473 | |
|
474 | 474 | with vfs(filename) as f: |
|
475 | 475 | raw = f.read() |
|
476 | 476 | |
|
477 | 477 | lines = raw.split(b'\0') |
|
478 | 478 | version = lines and lines[0] |
|
479 | 479 | if version != b"%d" % storageversion: |
|
480 | 480 | version = version or _(b'not available') |
|
481 | 481 | raise error.Abort(_(b"unknown journal file version '%s'") % version) |
|
482 | 482 | |
|
483 | 483 | # Skip the first line, it's a version number. Normally we iterate over |
|
484 | 484 | # these in reverse order to list newest first; only when copying across |
|
485 | 485 | # a shared storage do we forgo reversing. |
|
486 | 486 | lines = lines[1:] |
|
487 | 487 | if _newestfirst: |
|
488 | 488 | lines = reversed(lines) |
|
489 | 489 | for line in lines: |
|
490 | 490 | if not line: |
|
491 | 491 | continue |
|
492 | 492 | yield journalentry.fromstorage(line) |
|
493 | 493 | |
|
494 | 494 | |
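Taken together with the class docstring, _open() implies a very simple on-disk layout: a version number, then NUL-separated records appended oldest first. A hedged sketch of reading such a file directly (illustrative only; real callers should go through journalstorage):

    def read_namejournal(path):
        """Yield raw journal records, newest first, from a namejournal file."""
        with open(path, 'rb') as f:
            chunks = f.read().split(b'\0')
        version, records = chunks[0], chunks[1:]
        if version != b'0':   # storageversion above is 0
            raise ValueError('unknown journal file version %r' % version)
        # records are appended, so reverse to list the newest first
        for record in reversed(records):
            if record:
                yield record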
|
495 | 495 | # journal reading |
|
496 | 496 | # log options that don't make sense for journal |
|
497 | 497 | _ignoreopts = (b'no-merges', b'graph') |
|
498 | 498 | |
|
499 | 499 | |
|
500 | 500 | @command( |
|
501 | 501 | b'journal', |
|
502 | 502 | [ |
|
503 | 503 | (b'', b'all', None, b'show history for all names'), |
|
504 | 504 | (b'c', b'commits', None, b'show commit metadata'), |
|
505 | 505 | ] |
|
506 | 506 | + [opt for opt in cmdutil.logopts if opt[1] not in _ignoreopts], |
|
507 | 507 | b'[OPTION]... [BOOKMARKNAME]', |
|
508 | 508 | helpcategory=command.CATEGORY_CHANGE_ORGANIZATION, |
|
509 | 509 | ) |
|
510 | 510 | def journal(ui, repo, *args, **opts): |
|
511 | 511 | """show the previous position of bookmarks and the working copy |
|
512 | 512 | |
|
513 | 513 | The journal is used to see the previous commits that bookmarks and the |
|
514 | 514 | working copy pointed to. By default the previous locations of the working |

515 | 515 | copy are shown. Passing a bookmark name will show all the previous positions of |
|
516 | 516 | that bookmark. Use the --all switch to show previous locations for all |
|
517 | 517 | bookmarks and the working copy; each line will then include the bookmark |
|
518 | 518 | name, or '.' for the working copy, as well. |
|
519 | 519 | |
|
520 | 520 | If `name` starts with `re:`, the remainder of the name is treated as |
|
521 | 521 | a regular expression. To match a name that actually starts with `re:`, |
|
522 | 522 | use the prefix `literal:`. |
|
523 | 523 | |
|
524 | 524 | By default hg journal only shows the commit hash and the command that was |
|
525 | 525 | running at that time. -v/--verbose will show the prior hash, the user, and |
|
526 | 526 | the time at which it happened. |
|
527 | 527 | |
|
528 | 528 | Use -c/--commits to output log information on each commit hash; at this |
|
529 | 529 | point you can use the usual `--patch`, `--git`, `--stat` and `--template` |
|
530 | 530 | switches to alter the log output for these. |
|
531 | 531 | |
|
532 | 532 | `hg journal -T json` can be used to produce machine readable output. |
|
533 | 533 | |
|
534 | 534 | """ |
|
535 | 535 | opts = pycompat.byteskwargs(opts) |
|
536 | 536 | name = b'.' |
|
537 | 537 | if opts.get(b'all'): |
|
538 | 538 | if args: |
|
539 | 539 | raise error.Abort( |
|
540 | 540 | _(b"You can't combine --all and filtering on a name") |
|
541 | 541 | ) |
|
542 | 542 | name = None |
|
543 | 543 | if args: |
|
544 | 544 | name = args[0] |
|
545 | 545 | |
|
546 | 546 | fm = ui.formatter(b'journal', opts) |
|
547 | 547 | |
|
548 | 548 | def formatnodes(nodes): |
|
549 | 549 | return fm.formatlist(map(fm.hexfunc, nodes), name=b'node', sep=b',') |
|
550 | 550 | |
|
551 | 551 | if opts.get(b"template") != b"json": |
|
552 | 552 | if name is None: |
|
553 | 553 | displayname = _(b'the working copy and bookmarks') |
|
554 | 554 | else: |
|
555 | 555 | displayname = b"'%s'" % name |
|
556 | 556 | ui.status(_(b"previous locations of %s:\n") % displayname) |
|
557 | 557 | |
|
558 | 558 | limit = logcmdutil.getlimit(opts) |
|
559 | 559 | entry = None |
|
560 | 560 | ui.pager(b'journal') |
|
561 | 561 | for count, entry in enumerate(repo.journal.filtered(name=name)): |
|
562 | 562 | if count == limit: |
|
563 | 563 | break |
|
564 | 564 | |
|
565 | 565 | fm.startitem() |
|
566 | 566 | fm.condwrite( |
|
567 | 567 | ui.verbose, b'oldnodes', b'%s -> ', formatnodes(entry.oldhashes) |
|
568 | 568 | ) |
|
569 | 569 | fm.write(b'newnodes', b'%s', formatnodes(entry.newhashes)) |
|
570 | 570 | fm.condwrite(ui.verbose, b'user', b' %-8s', entry.user) |
|
571 | 571 | fm.condwrite( |
|
572 | 572 | opts.get(b'all') or name.startswith(b're:'), |
|
573 | 573 | b'name', |
|
574 | 574 | b' %-8s', |
|
575 | 575 | entry.name, |
|
576 | 576 | ) |
|
577 | 577 | |
|
578 | 578 | fm.condwrite( |
|
579 | 579 | ui.verbose, |
|
580 | 580 | b'date', |
|
581 | 581 | b' %s', |
|
582 | 582 | fm.formatdate(entry.timestamp, b'%Y-%m-%d %H:%M %1%2'), |
|
583 | 583 | ) |
|
584 | 584 | fm.write(b'command', b' %s\n', entry.command) |
|
585 | 585 | |
|
586 | 586 | if opts.get(b"commits"): |
|
587 | 587 | if fm.isplain(): |
|
588 | 588 | displayer = logcmdutil.changesetdisplayer(ui, repo, opts) |
|
589 | 589 | else: |
|
590 | 590 | displayer = logcmdutil.changesetformatter( |
|
591 | 591 | ui, repo, fm.nested(b'changesets'), diffopts=opts |
|
592 | 592 | ) |
|
593 | 593 | for hash in entry.newhashes: |
|
594 | 594 | try: |
|
595 | 595 | ctx = repo[hash] |
|
596 | 596 | displayer.show(ctx) |
|
597 | 597 | except error.RepoLookupError as e: |
|
598 | 598 | fm.plain(b"%s\n\n" % pycompat.bytestr(e)) |
|
599 | 599 | displayer.close() |
|
600 | 600 | |
|
601 | 601 | fm.end() |
|
602 | 602 | |
|
603 | 603 | if entry is None: |
|
604 | 604 | ui.status(_(b"no recorded locations\n")) |
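Beyond the command above, other extension code could read or extend the journal through the same storage object that reposetup() attaches to the repo. A hedged sketch; the helper names and the b'myext' namespace are made up, only record()/filtered() come from the class above:

    def lastbookmarkmove(repo, mark):
        """Return (oldhashes, newhashes) for the newest move of `mark`."""
        for entry in repo.journal.filtered(namespace=b'bookmark', name=mark):
            # filtered() yields entries newest first
            return entry.oldhashes, entry.newhashes
        return None

    def recordcustom(repo, name, oldnode, newnode):
        # namespaces are opaque strings, so a custom one is fine here
        repo.journal.record(b'myext', name, oldnode, newnode)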
@@ -1,370 +1,370 b'' | |||
|
1 | 1 | # wireprotolfsserver.py - lfs protocol server side implementation |
|
2 | 2 | # |
|
3 | 3 | # Copyright 2018 Matt Harbison <matt_harbison@yahoo.com> |
|
4 | 4 | # |
|
5 | 5 | # This software may be used and distributed according to the terms of the |
|
6 | 6 | # GNU General Public License version 2 or any later version. |
|
7 | 7 | |
|
8 | 8 | from __future__ import absolute_import |
|
9 | 9 | |
|
10 | 10 | import datetime |
|
11 | 11 | import errno |
|
12 | 12 | import json |
|
13 | 13 | import traceback |
|
14 | 14 | |
|
15 | 15 | from mercurial.hgweb import common as hgwebcommon |
|
16 | 16 | |
|
17 | 17 | from mercurial import ( |
|
18 | 18 | exthelper, |
|
19 | 19 | pycompat, |
|
20 | 20 | util, |
|
21 | 21 | wireprotoserver, |
|
22 | 22 | ) |
|
23 | 23 | |
|
24 | 24 | from . import blobstore |
|
25 | 25 | |
|
26 | 26 | HTTP_OK = hgwebcommon.HTTP_OK |
|
27 | 27 | HTTP_CREATED = hgwebcommon.HTTP_CREATED |
|
28 | 28 | HTTP_BAD_REQUEST = hgwebcommon.HTTP_BAD_REQUEST |
|
29 | 29 | HTTP_NOT_FOUND = hgwebcommon.HTTP_NOT_FOUND |
|
30 | 30 | HTTP_METHOD_NOT_ALLOWED = hgwebcommon.HTTP_METHOD_NOT_ALLOWED |
|
31 | 31 | HTTP_NOT_ACCEPTABLE = hgwebcommon.HTTP_NOT_ACCEPTABLE |
|
32 | 32 | HTTP_UNSUPPORTED_MEDIA_TYPE = hgwebcommon.HTTP_UNSUPPORTED_MEDIA_TYPE |
|
33 | 33 | |
|
34 | 34 | eh = exthelper.exthelper() |
|
35 | 35 | |
|
36 | 36 | |
|
37 | 37 | @eh.wrapfunction(wireprotoserver, b'handlewsgirequest') |
|
38 | 38 | def handlewsgirequest(orig, rctx, req, res, checkperm): |
|
39 | 39 | """Wrap wireprotoserver.handlewsgirequest() to possibly process an LFS |
|
40 | 40 | request if it is left unprocessed by the wrapped method. |
|
41 | 41 | """ |
|
42 | 42 | if orig(rctx, req, res, checkperm): |
|
43 | 43 | return True |
|
44 | 44 | |
|
45 | 45 | if not rctx.repo.ui.configbool(b'experimental', b'lfs.serve'): |
|
46 | 46 | return False |
|
47 | 47 | |
|
48 |     | if not util.safehasattr(rctx.repo.svfs, b'lfslocalblobstore'): |

    | 48 | if not util.safehasattr(rctx.repo.svfs, 'lfslocalblobstore'): |
|
49 | 49 | return False |
|
50 | 50 | |
|
51 | 51 | if not req.dispatchpath: |
|
52 | 52 | return False |
|
53 | 53 | |
|
54 | 54 | try: |
|
55 | 55 | if req.dispatchpath == b'.git/info/lfs/objects/batch': |
|
56 | 56 | checkperm(rctx, req, b'pull') |
|
57 | 57 | return _processbatchrequest(rctx.repo, req, res) |
|
58 | 58 | # TODO: reserve and use a path in the proposed http wireprotocol /api/ |
|
59 | 59 | # namespace? |
|
60 | 60 | elif req.dispatchpath.startswith(b'.hg/lfs/objects'): |
|
61 | 61 | return _processbasictransfer( |
|
62 | 62 | rctx.repo, req, res, lambda perm: checkperm(rctx, req, perm) |
|
63 | 63 | ) |
|
64 | 64 | return False |
|
65 | 65 | except hgwebcommon.ErrorResponse as e: |
|
66 | 66 | # XXX: copied from the handler surrounding wireprotoserver._callhttp() |
|
67 | 67 | # in the wrapped function. Should this be moved back to hgweb to |
|
68 | 68 | # be a common handler? |
|
69 | 69 | for k, v in e.headers: |
|
70 | 70 | res.headers[k] = v |
|
71 | 71 | res.status = hgwebcommon.statusmessage(e.code, pycompat.bytestr(e)) |
|
72 | 72 | res.setbodybytes(b'0\n%s\n' % pycompat.bytestr(e)) |
|
73 | 73 | return True |
|
74 | 74 | |
|
75 | 75 | |
|
76 | 76 | def _sethttperror(res, code, message=None): |
|
77 | 77 | res.status = hgwebcommon.statusmessage(code, message=message) |
|
78 | 78 | res.headers[b'Content-Type'] = b'text/plain; charset=utf-8' |
|
79 | 79 | res.setbodybytes(b'') |
|
80 | 80 | |
|
81 | 81 | |
|
82 | 82 | def _logexception(req): |
|
83 | 83 | """Write information about the current exception to wsgi.errors.""" |
|
84 | 84 | tb = pycompat.sysbytes(traceback.format_exc()) |
|
85 | 85 | errorlog = req.rawenv[b'wsgi.errors'] |
|
86 | 86 | |
|
87 | 87 | uri = b'' |
|
88 | 88 | if req.apppath: |
|
89 | 89 | uri += req.apppath |
|
90 | 90 | uri += b'/' + req.dispatchpath |
|
91 | 91 | |
|
92 | 92 | errorlog.write( |
|
93 | 93 | b"Exception happened while processing request '%s':\n%s" % (uri, tb) |
|
94 | 94 | ) |
|
95 | 95 | |
|
96 | 96 | |
|
97 | 97 | def _processbatchrequest(repo, req, res): |
|
98 | 98 | """Handle a request for the Batch API, which is the gateway to granting file |
|
99 | 99 | access. |
|
100 | 100 | |
|
101 | 101 | https://github.com/git-lfs/git-lfs/blob/master/docs/api/batch.md |
|
102 | 102 | """ |
|
103 | 103 | |
|
104 | 104 | # Mercurial client request: |
|
105 | 105 | # |
|
106 | 106 | # HOST: localhost:$HGPORT |
|
107 | 107 | # ACCEPT: application/vnd.git-lfs+json |
|
108 | 108 | # ACCEPT-ENCODING: identity |
|
109 | 109 | # USER-AGENT: git-lfs/2.3.4 (Mercurial 4.5.2+1114-f48b9754f04c+20180316) |
|
110 | 110 | # Content-Length: 125 |
|
111 | 111 | # Content-Type: application/vnd.git-lfs+json |
|
112 | 112 | # |
|
113 | 113 | # { |
|
114 | 114 | # "objects": [ |
|
115 | 115 | # { |
|
116 | 116 | # "oid": "31cf...8e5b" |
|
117 | 117 | # "size": 12 |
|
118 | 118 | # } |
|
119 | 119 | # ] |
|
120 | 120 | # "operation": "upload" |
|
121 | 121 | # } |
|
122 | 122 | |
|
123 | 123 | if req.method != b'POST': |
|
124 | 124 | _sethttperror(res, HTTP_METHOD_NOT_ALLOWED) |
|
125 | 125 | return True |
|
126 | 126 | |
|
127 | 127 | if req.headers[b'Content-Type'] != b'application/vnd.git-lfs+json': |
|
128 | 128 | _sethttperror(res, HTTP_UNSUPPORTED_MEDIA_TYPE) |
|
129 | 129 | return True |
|
130 | 130 | |
|
131 | 131 | if req.headers[b'Accept'] != b'application/vnd.git-lfs+json': |
|
132 | 132 | _sethttperror(res, HTTP_NOT_ACCEPTABLE) |
|
133 | 133 | return True |
|
134 | 134 | |
|
135 | 135 | # XXX: specify an encoding? |
|
136 | 136 | lfsreq = json.loads(req.bodyfh.read()) |
|
137 | 137 | |
|
138 | 138 | # If no transfer handlers are explicitly requested, 'basic' is assumed. |
|
139 | 139 | if r'basic' not in lfsreq.get(r'transfers', [r'basic']): |
|
140 | 140 | _sethttperror( |
|
141 | 141 | res, |
|
142 | 142 | HTTP_BAD_REQUEST, |
|
143 | 143 | b'Only the basic LFS transfer handler is supported', |
|
144 | 144 | ) |
|
145 | 145 | return True |
|
146 | 146 | |
|
147 | 147 | operation = lfsreq.get(r'operation') |
|
148 | 148 | operation = pycompat.bytestr(operation) |
|
149 | 149 | |
|
150 | 150 | if operation not in (b'upload', b'download'): |
|
151 | 151 | _sethttperror( |
|
152 | 152 | res, |
|
153 | 153 | HTTP_BAD_REQUEST, |
|
154 | 154 | b'Unsupported LFS transfer operation: %s' % operation, |
|
155 | 155 | ) |
|
156 | 156 | return True |
|
157 | 157 | |
|
158 | 158 | localstore = repo.svfs.lfslocalblobstore |
|
159 | 159 | |
|
160 | 160 | objects = [ |
|
161 | 161 | p |
|
162 | 162 | for p in _batchresponseobjects( |
|
163 | 163 | req, lfsreq.get(r'objects', []), operation, localstore |
|
164 | 164 | ) |
|
165 | 165 | ] |
|
166 | 166 | |
|
167 | 167 | rsp = { |
|
168 | 168 | r'transfer': r'basic', |
|
169 | 169 | r'objects': objects, |
|
170 | 170 | } |
|
171 | 171 | |
|
172 | 172 | res.status = hgwebcommon.statusmessage(HTTP_OK) |
|
173 | 173 | res.headers[b'Content-Type'] = b'application/vnd.git-lfs+json' |
|
174 | 174 | res.setbodybytes(pycompat.bytestr(json.dumps(rsp))) |
|
175 | 175 | |
|
176 | 176 | return True |
|
177 | 177 | |
|
178 | 178 | |
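The commented request above, plus the header checks in _processbatchrequest(), define the client contract: POST JSON to `.git/info/lfs/objects/batch` under the repository URL, with the git-lfs media type in both Content-Type and Accept. A hedged client-side sketch with a hypothetical repourl/oid (the server side is the handler above):

    import json
    from urllib import request

    def batch_request(repourl, operation, oid, size):
        """Ask the Batch API where to upload or download one object."""
        body = json.dumps({
            'operation': operation,            # 'upload' or 'download'
            'transfers': ['basic'],            # only 'basic' is supported above
            'objects': [{'oid': oid, 'size': size}],
        }).encode('ascii')
        req = request.Request(
            repourl + '/.git/info/lfs/objects/batch',
            data=body,
            headers={
                'Content-Type': 'application/vnd.git-lfs+json',
                'Accept': 'application/vnd.git-lfs+json',
            },
            method='POST',
        )
        with request.urlopen(req) as resp:
            return json.loads(resp.read())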
|
179 | 179 | def _batchresponseobjects(req, objects, action, store): |
|
180 | 180 | """Yield one dictionary of attributes for the Batch API response for each |
|
181 | 181 | object in the list. |
|
182 | 182 | |
|
183 | 183 | req: The parsedrequest for the Batch API request |
|
184 | 184 | objects: The list of objects in the Batch API object request list |
|
185 | 185 | action: 'upload' or 'download' |
|
186 | 186 | store: The local blob store for servicing requests""" |
|
187 | 187 | |
|
188 | 188 | # Successful lfs-test-server response to solicit an upload: |
|
189 | 189 | # { |
|
190 | 190 | # u'objects': [{ |
|
191 | 191 | # u'size': 12, |
|
192 | 192 | # u'oid': u'31cf...8e5b', |
|
193 | 193 | # u'actions': { |
|
194 | 194 | # u'upload': { |
|
195 | 195 | # u'href': u'http://localhost:$HGPORT/objects/31cf...8e5b', |
|
196 | 196 | # u'expires_at': u'0001-01-01T00:00:00Z', |
|
197 | 197 | # u'header': { |
|
198 | 198 | # u'Accept': u'application/vnd.git-lfs' |
|
199 | 199 | # } |
|
200 | 200 | # } |
|
201 | 201 | # } |
|
202 | 202 | # }] |
|
203 | 203 | # } |
|
204 | 204 | |
|
205 | 205 | # TODO: Sort out the expires_at/expires_in/authenticated keys. |
|
206 | 206 | |
|
207 | 207 | for obj in objects: |
|
208 | 208 | # Convert unicode to ASCII to create a filesystem path |
|
209 | 209 | soid = obj.get(r'oid') |
|
210 | 210 | oid = soid.encode(r'ascii') |
|
211 | 211 | rsp = { |
|
212 | 212 | r'oid': soid, |
|
213 | 213 | r'size': obj.get(r'size'), # XXX: should this check the local size? |
|
214 | 214 | # r'authenticated': True, |
|
215 | 215 | } |
|
216 | 216 | |
|
217 | 217 | exists = True |
|
218 | 218 | verifies = False |
|
219 | 219 | |
|
220 | 220 | # Verify an existing file on the upload request, so that the client is |
|
221 | 221 | # solicited to re-upload if it is corrupt locally. Download requests are |
|
222 | 222 | # also verified, so the error can be flagged in the Batch API response. |
|
223 | 223 | # (Maybe we can use this to short circuit the download for `hg verify`, |
|
224 | 224 | # IFF the client can assert that the remote end is an hg server.) |
|
225 | 225 | # Otherwise, it's potentially overkill on download, since it is also |
|
226 | 226 | # verified as the file is streamed to the caller. |
|
227 | 227 | try: |
|
228 | 228 | verifies = store.verify(oid) |
|
229 | 229 | if verifies and action == b'upload': |
|
230 | 230 | # The client will skip this upload, but make sure it remains |
|
231 | 231 | # available locally. |
|
232 | 232 | store.linkfromusercache(oid) |
|
233 | 233 | except IOError as inst: |
|
234 | 234 | if inst.errno != errno.ENOENT: |
|
235 | 235 | _logexception(req) |
|
236 | 236 | |
|
237 | 237 | rsp[r'error'] = { |
|
238 | 238 | r'code': 500, |
|
239 | 239 | r'message': inst.strerror or r'Internal Server Error', |
|
240 | 240 | } |
|
241 | 241 | yield rsp |
|
242 | 242 | continue |
|
243 | 243 | |
|
244 | 244 | exists = False |
|
245 | 245 | |
|
246 | 246 | # Items are always listed for downloads. They are dropped for uploads |
|
247 | 247 | # IFF they already exist locally. |
|
248 | 248 | if action == b'download': |
|
249 | 249 | if not exists: |
|
250 | 250 | rsp[r'error'] = { |
|
251 | 251 | r'code': 404, |
|
252 | 252 | r'message': r"The object does not exist", |
|
253 | 253 | } |
|
254 | 254 | yield rsp |
|
255 | 255 | continue |
|
256 | 256 | |
|
257 | 257 | elif not verifies: |
|
258 | 258 | rsp[r'error'] = { |
|
259 | 259 | r'code': 422, # XXX: is this the right code? |
|
260 | 260 | r'message': r"The object is corrupt", |
|
261 | 261 | } |
|
262 | 262 | yield rsp |
|
263 | 263 | continue |
|
264 | 264 | |
|
265 | 265 | elif verifies: |
|
266 | 266 | yield rsp # Skip 'actions': already uploaded |
|
267 | 267 | continue |
|
268 | 268 | |
|
269 | 269 | expiresat = datetime.datetime.now() + datetime.timedelta(minutes=10) |
|
270 | 270 | |
|
271 | 271 | def _buildheader(): |
|
272 | 272 | # The spec doesn't mention the Accept header here, but avoid |
|
273 | 273 | # a gratuitous deviation from lfs-test-server in the test |
|
274 | 274 | # output. |
|
275 | 275 | hdr = {r'Accept': r'application/vnd.git-lfs'} |
|
276 | 276 | |
|
277 | 277 | auth = req.headers.get(b'Authorization', b'') |
|
278 | 278 | if auth.startswith(b'Basic '): |
|
279 | 279 | hdr[r'Authorization'] = pycompat.strurl(auth) |
|
280 | 280 | |
|
281 | 281 | return hdr |
|
282 | 282 | |
|
283 | 283 | rsp[r'actions'] = { |
|
284 | 284 | r'%s' |
|
285 | 285 | % pycompat.strurl(action): { |
|
286 | 286 | r'href': pycompat.strurl( |
|
287 | 287 | b'%s%s/.hg/lfs/objects/%s' % (req.baseurl, req.apppath, oid) |
|
288 | 288 | ), |
|
289 | 289 | # datetime.isoformat() doesn't include the 'Z' suffix |
|
290 | 290 | r"expires_at": expiresat.strftime(r'%Y-%m-%dT%H:%M:%SZ'), |
|
291 | 291 | r'header': _buildheader(), |
|
292 | 292 | } |
|
293 | 293 | } |
|
294 | 294 | |
|
295 | 295 | yield rsp |
|
296 | 296 | |
|
297 | 297 | |
|
298 | 298 | def _processbasictransfer(repo, req, res, checkperm): |
|
299 | 299 | """Handle a single file upload (PUT) or download (GET) action for the Basic |
|
300 | 300 | Transfer Adapter. |
|
301 | 301 | |
|
302 | 302 | After determining if the request is for an upload or download, the access |
|
303 | 303 | must be checked by calling ``checkperm()`` with either 'pull' or 'upload' |
|
304 | 304 | before accessing the files. |
|
305 | 305 | |
|
306 | 306 | https://github.com/git-lfs/git-lfs/blob/master/docs/api/basic-transfers.md |
|
307 | 307 | """ |
|
308 | 308 | |
|
309 | 309 | method = req.method |
|
310 | 310 | oid = req.dispatchparts[-1] |
|
311 | 311 | localstore = repo.svfs.lfslocalblobstore |
|
312 | 312 | |
|
313 | 313 | if len(req.dispatchparts) != 4: |
|
314 | 314 | _sethttperror(res, HTTP_NOT_FOUND) |
|
315 | 315 | return True |
|
316 | 316 | |
|
317 | 317 | if method == b'PUT': |
|
318 | 318 | checkperm(b'upload') |
|
319 | 319 | |
|
320 | 320 | # TODO: verify Content-Type? |
|
321 | 321 | |
|
322 | 322 | existed = localstore.has(oid) |
|
323 | 323 | |
|
324 | 324 | # TODO: how to handle timeouts? The body proxy handles limiting to |
|
325 | 325 | # Content-Length, but what happens if a client sends less than it |
|
326 | 326 | # says it will? |
|
327 | 327 | |
|
328 | 328 | statusmessage = hgwebcommon.statusmessage |
|
329 | 329 | try: |
|
330 | 330 | localstore.download(oid, req.bodyfh) |
|
331 | 331 | res.status = statusmessage(HTTP_OK if existed else HTTP_CREATED) |
|
332 | 332 | except blobstore.LfsCorruptionError: |
|
333 | 333 | _logexception(req) |
|
334 | 334 | |
|
335 | 335 | # XXX: Is this the right code? |
|
336 | 336 | res.status = statusmessage(422, b'corrupt blob') |
|
337 | 337 | |
|
338 | 338 | # There's no payload here, but this is the header that lfs-test-server |
|
339 | 339 | # sends back. This eliminates some gratuitous test output conditionals. |
|
340 | 340 | res.headers[b'Content-Type'] = b'text/plain; charset=utf-8' |
|
341 | 341 | res.setbodybytes(b'') |
|
342 | 342 | |
|
343 | 343 | return True |
|
344 | 344 | elif method == b'GET': |
|
345 | 345 | checkperm(b'pull') |
|
346 | 346 | |
|
347 | 347 | res.status = hgwebcommon.statusmessage(HTTP_OK) |
|
348 | 348 | res.headers[b'Content-Type'] = b'application/octet-stream' |
|
349 | 349 | |
|
350 | 350 | try: |
|
351 | 351 | # TODO: figure out how to send back the file in chunks, instead of |
|
352 | 352 | # reading the whole thing. (Also figure out how to send back |
|
353 | 353 | # an error status if an IOError occurs after a partial write |
|
354 | 354 | # in that case. Here, everything is read before starting.) |
|
355 | 355 | res.setbodybytes(localstore.read(oid)) |
|
356 | 356 | except blobstore.LfsCorruptionError: |
|
357 | 357 | _logexception(req) |
|
358 | 358 | |
|
359 | 359 | # XXX: Is this the right code? |
|
360 | 360 | res.status = hgwebcommon.statusmessage(422, b'corrupt blob') |
|
361 | 361 | res.setbodybytes(b'') |
|
362 | 362 | |
|
363 | 363 | return True |
|
364 | 364 | else: |
|
365 | 365 | _sethttperror( |
|
366 | 366 | res, |
|
367 | 367 | HTTP_METHOD_NOT_ALLOWED, |
|
368 | 368 | message=b'Unsupported LFS transfer method: %s' % method, |
|
369 | 369 | ) |
|
370 | 370 | return True |
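_processbasictransfer() serves blobs under `<repo>/.hg/lfs/objects/<oid>`: PUT stores a blob (201 when it is new, 200 if it already existed) and GET streams it back. A hedged client sketch against a hypothetical repourl:

    from urllib import request

    def get_blob(repourl, oid):
        """Fetch one blob through the basic transfer GET handler above."""
        url = '%s/.hg/lfs/objects/%s' % (repourl, oid)
        with request.urlopen(url) as resp:
            return resp.read()

    def put_blob(repourl, oid, data):
        """Upload one blob; returns the HTTP status code."""
        url = '%s/.hg/lfs/objects/%s' % (repourl, oid)
        req = request.Request(url, data=data, method='PUT')
        with request.urlopen(req) as resp:
            return resp.status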
@@ -1,360 +1,360 b'' | |||
|
1 | 1 | # narrowbundle2.py - bundle2 extensions for narrow repository support |
|
2 | 2 | # |
|
3 | 3 | # Copyright 2017 Google, Inc. |
|
4 | 4 | # |
|
5 | 5 | # This software may be used and distributed according to the terms of the |
|
6 | 6 | # GNU General Public License version 2 or any later version. |
|
7 | 7 | |
|
8 | 8 | from __future__ import absolute_import |
|
9 | 9 | |
|
10 | 10 | import errno |
|
11 | 11 | import struct |
|
12 | 12 | |
|
13 | 13 | from mercurial.i18n import _ |
|
14 | 14 | from mercurial.node import ( |
|
15 | 15 | bin, |
|
16 | 16 | nullid, |
|
17 | 17 | ) |
|
18 | 18 | from mercurial import ( |
|
19 | 19 | bundle2, |
|
20 | 20 | changegroup, |
|
21 | 21 | error, |
|
22 | 22 | exchange, |
|
23 | 23 | localrepo, |
|
24 | 24 | narrowspec, |
|
25 | 25 | repair, |
|
26 | 26 | util, |
|
27 | 27 | wireprototypes, |
|
28 | 28 | ) |
|
29 | 29 | from mercurial.interfaces import repository |
|
30 | 30 | from mercurial.utils import stringutil |
|
31 | 31 | |
|
32 | 32 | _NARROWACL_SECTION = b'narrowacl' |
|
33 | 33 | _CHANGESPECPART = b'narrow:changespec' |
|
34 | 34 | _RESSPECS = b'narrow:responsespec' |
|
35 | 35 | _SPECPART = b'narrow:spec' |
|
36 | 36 | _SPECPART_INCLUDE = b'include' |
|
37 | 37 | _SPECPART_EXCLUDE = b'exclude' |
|
38 | 38 | _KILLNODESIGNAL = b'KILL' |
|
39 | 39 | _DONESIGNAL = b'DONE' |
|
40 | 40 | _ELIDEDCSHEADER = b'>20s20s20sl' # cset id, p1, p2, len(text) |
|
41 | 41 | _ELIDEDMFHEADER = b'>20s20s20s20sl' # manifest id, p1, p2, link id, len(text) |
|
42 | 42 | _CSHEADERSIZE = struct.calcsize(_ELIDEDCSHEADER) |
|
43 | 43 | _MFHEADERSIZE = struct.calcsize(_ELIDEDMFHEADER) |
|
44 | 44 | |
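The two struct formats above spell out the elided-header layout: three (or four) 20-byte binary nodes followed by a signed 32-bit big-endian text length, 64 and 84 bytes in total. A quick illustration with dummy node values:

    import struct

    ELIDEDCSHEADER = '>20s20s20sl'   # cset id, p1, p2, len(text)

    node = b'\x11' * 20
    p1 = b'\x22' * 20
    p2 = b'\x00' * 20                # null parent
    header = struct.pack(ELIDEDCSHEADER, node, p1, p2, 123)
    assert len(header) == struct.calcsize(ELIDEDCSHEADER) == 64

    # the reader side recovers the same tuple
    assert struct.unpack(ELIDEDCSHEADER, header) == (node, p1, p2, 123)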
|
45 | 45 | # Serve a changegroup for a client with a narrow clone. |
|
46 | 46 | def getbundlechangegrouppart_narrow( |
|
47 | 47 | bundler, |
|
48 | 48 | repo, |
|
49 | 49 | source, |
|
50 | 50 | bundlecaps=None, |
|
51 | 51 | b2caps=None, |
|
52 | 52 | heads=None, |
|
53 | 53 | common=None, |
|
54 | 54 | **kwargs |
|
55 | 55 | ): |
|
56 | 56 | assert repo.ui.configbool(b'experimental', b'narrowservebrokenellipses') |
|
57 | 57 | |
|
58 | 58 | cgversions = b2caps.get(b'changegroup') |
|
59 | 59 | cgversions = [ |
|
60 | 60 | v |
|
61 | 61 | for v in cgversions |
|
62 | 62 | if v in changegroup.supportedoutgoingversions(repo) |
|
63 | 63 | ] |
|
64 | 64 | if not cgversions: |
|
65 | 65 | raise ValueError(_(b'no common changegroup version')) |
|
66 | 66 | version = max(cgversions) |
|
67 | 67 | |
|
68 | 68 | oldinclude = sorted(filter(bool, kwargs.get(r'oldincludepats', []))) |
|
69 | 69 | oldexclude = sorted(filter(bool, kwargs.get(r'oldexcludepats', []))) |
|
70 | 70 | newinclude = sorted(filter(bool, kwargs.get(r'includepats', []))) |
|
71 | 71 | newexclude = sorted(filter(bool, kwargs.get(r'excludepats', []))) |
|
72 | 72 | known = {bin(n) for n in kwargs.get(r'known', [])} |
|
73 | 73 | generateellipsesbundle2( |
|
74 | 74 | bundler, |
|
75 | 75 | repo, |
|
76 | 76 | oldinclude, |
|
77 | 77 | oldexclude, |
|
78 | 78 | newinclude, |
|
79 | 79 | newexclude, |
|
80 | 80 | version, |
|
81 | 81 | common, |
|
82 | 82 | heads, |
|
83 | 83 | known, |
|
84 | 84 | kwargs.get(r'depth', None), |
|
85 | 85 | ) |
|
86 | 86 | |
|
87 | 87 | |
|
88 | 88 | def generateellipsesbundle2( |
|
89 | 89 | bundler, |
|
90 | 90 | repo, |
|
91 | 91 | oldinclude, |
|
92 | 92 | oldexclude, |
|
93 | 93 | newinclude, |
|
94 | 94 | newexclude, |
|
95 | 95 | version, |
|
96 | 96 | common, |
|
97 | 97 | heads, |
|
98 | 98 | known, |
|
99 | 99 | depth, |
|
100 | 100 | ): |
|
101 | 101 | newmatch = narrowspec.match( |
|
102 | 102 | repo.root, include=newinclude, exclude=newexclude |
|
103 | 103 | ) |
|
104 | 104 | if depth is not None: |
|
105 | 105 | depth = int(depth) |
|
106 | 106 | if depth < 1: |
|
107 | 107 | raise error.Abort(_(b'depth must be positive, got %d') % depth) |
|
108 | 108 | |
|
109 | 109 | heads = set(heads or repo.heads()) |
|
110 | 110 | common = set(common or [nullid]) |
|
111 | 111 | if known and (oldinclude != newinclude or oldexclude != newexclude): |
|
112 | 112 | # Steps: |
|
113 | 113 | # 1. Send kill for "$known & ::common" |
|
114 | 114 | # |
|
115 | 115 | # 2. Send changegroup for ::common |
|
116 | 116 | # |
|
117 | 117 | # 3. Proceed. |
|
118 | 118 | # |
|
119 | 119 | # In the future, we can send kills for only the specific |
|
120 | 120 | # nodes we know should go away or change shape, and then |
|
121 | 121 | # send a data stream that tells the client something like this: |
|
122 | 122 | # |
|
123 | 123 | # a) apply this changegroup |
|
124 | 124 | # b) apply nodes XXX, YYY, ZZZ that you already have |
|
125 | 125 | # c) goto a |
|
126 | 126 | # |
|
127 | 127 | # until they've built up the full new state. |
|
128 | 128 | # Convert to revnums and intersect with "common". The client should |
|
129 | 129 | # have made it a subset of "common" already, but let's be safe. |
|
130 | 130 | known = set(repo.revs(b"%ln & ::%ln", known, common)) |
|
131 | 131 | # TODO: we could send only roots() of this set, and the |
|
132 | 132 | # list of nodes in common, and the client could work out |
|
133 | 133 | # what to strip, instead of us explicitly sending every |
|
134 | 134 | # single node. |
|
135 | 135 | deadrevs = known |
|
136 | 136 | |
|
137 | 137 | def genkills(): |
|
138 | 138 | for r in deadrevs: |
|
139 | 139 | yield _KILLNODESIGNAL |
|
140 | 140 | yield repo.changelog.node(r) |
|
141 | 141 | yield _DONESIGNAL |
|
142 | 142 | |
|
143 | 143 | bundler.newpart(_CHANGESPECPART, data=genkills()) |
|
144 | 144 | newvisit, newfull, newellipsis = exchange._computeellipsis( |
|
145 | 145 | repo, set(), common, known, newmatch |
|
146 | 146 | ) |
|
147 | 147 | if newvisit: |
|
148 | 148 | packer = changegroup.getbundler( |
|
149 | 149 | version, |
|
150 | 150 | repo, |
|
151 | 151 | matcher=newmatch, |
|
152 | 152 | ellipses=True, |
|
153 | 153 | shallow=depth is not None, |
|
154 | 154 | ellipsisroots=newellipsis, |
|
155 | 155 | fullnodes=newfull, |
|
156 | 156 | ) |
|
157 | 157 | cgdata = packer.generate(common, newvisit, False, b'narrow_widen') |
|
158 | 158 | |
|
159 | 159 | part = bundler.newpart(b'changegroup', data=cgdata) |
|
160 | 160 | part.addparam(b'version', version) |
|
161 | 161 | if b'treemanifest' in repo.requirements: |
|
162 | 162 | part.addparam(b'treemanifest', b'1') |
|
163 | 163 | |
|
164 | 164 | visitnodes, relevant_nodes, ellipsisroots = exchange._computeellipsis( |
|
165 | 165 | repo, common, heads, set(), newmatch, depth=depth |
|
166 | 166 | ) |
|
167 | 167 | |
|
168 | 168 | repo.ui.debug(b'Found %d relevant revs\n' % len(relevant_nodes)) |
|
169 | 169 | if visitnodes: |
|
170 | 170 | packer = changegroup.getbundler( |
|
171 | 171 | version, |
|
172 | 172 | repo, |
|
173 | 173 | matcher=newmatch, |
|
174 | 174 | ellipses=True, |
|
175 | 175 | shallow=depth is not None, |
|
176 | 176 | ellipsisroots=ellipsisroots, |
|
177 | 177 | fullnodes=relevant_nodes, |
|
178 | 178 | ) |
|
179 | 179 | cgdata = packer.generate(common, visitnodes, False, b'narrow_widen') |
|
180 | 180 | |
|
181 | 181 | part = bundler.newpart(b'changegroup', data=cgdata) |
|
182 | 182 | part.addparam(b'version', version) |
|
183 | 183 | if b'treemanifest' in repo.requirements: |
|
184 | 184 | part.addparam(b'treemanifest', b'1') |
|
185 | 185 | |
|
186 | 186 | |
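
The changespec part that generateellipsesbundle2() emits via genkills() is a flat byte stream: a 4-byte KILL signal followed by a 20-byte changelog node, repeated once per revision to strip, and terminated by a 4-byte DONE signal; _handlechangespec() below consumes it 4 and 20 bytes at a time with readexactly(). A minimal stand-alone parser for that framing, operating on a fully buffered stream and using placeholder node values, might look like this sketch:

    _KILLNODESIGNAL = b'KILL'
    _DONESIGNAL = b'DONE'

    def parsekills(data):
        """Return the 20-byte nodes encoded in a buffered changespec stream."""
        nodes, pos = [], 0
        while True:
            signal, pos = data[pos:pos + 4], pos + 4
            if signal == _DONESIGNAL:
                return nodes
            if signal != _KILLNODESIGNAL:
                raise ValueError('unexpected chunk type: %r' % signal)
            nodes.append(data[pos:pos + 20])
            pos += 20

    stream = (_KILLNODESIGNAL + b'\x01' * 20
              + _KILLNODESIGNAL + b'\x02' * 20
              + _DONESIGNAL)
    assert parsekills(stream) == [b'\x01' * 20, b'\x02' * 20]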
|
187 | 187 | @bundle2.parthandler(_SPECPART, (_SPECPART_INCLUDE, _SPECPART_EXCLUDE)) |
|
188 | 188 | def _handlechangespec_2(op, inpart): |
|
189 | 189 | # XXX: This bundle2 handling is buggy and should be removed after hg5.2 is |
|
190 | 190 | # released. New servers will send a mandatory bundle2 part named |
|
191 | 191 | # 'Narrowspec' and will send specs as data instead of params. |
|
192 | 192 | # Refer to issue5952 and 6019 |
|
193 | 193 | includepats = set(inpart.params.get(_SPECPART_INCLUDE, b'').splitlines()) |
|
194 | 194 | excludepats = set(inpart.params.get(_SPECPART_EXCLUDE, b'').splitlines()) |
|
195 | 195 | narrowspec.validatepatterns(includepats) |
|
196 | 196 | narrowspec.validatepatterns(excludepats) |
|
197 | 197 | |
|
198 | 198 | if not repository.NARROW_REQUIREMENT in op.repo.requirements: |
|
199 | 199 | op.repo.requirements.add(repository.NARROW_REQUIREMENT) |
|
200 | 200 | op.repo._writerequirements() |
|
201 | 201 | op.repo.setnarrowpats(includepats, excludepats) |
|
202 | 202 | narrowspec.copytoworkingcopy(op.repo) |
|
203 | 203 | |
|
204 | 204 | |
|
205 | 205 | @bundle2.parthandler(_RESSPECS) |
|
206 | 206 | def _handlenarrowspecs(op, inpart): |
|
207 | 207 | data = inpart.read() |
|
208 | 208 | inc, exc = data.split(b'\0') |
|
209 | 209 | includepats = set(inc.splitlines()) |
|
210 | 210 | excludepats = set(exc.splitlines()) |
|
211 | 211 | narrowspec.validatepatterns(includepats) |
|
212 | 212 | narrowspec.validatepatterns(excludepats) |
|
213 | 213 | |
|
214 | 214 | if repository.NARROW_REQUIREMENT not in op.repo.requirements: |
|
215 | 215 | op.repo.requirements.add(repository.NARROW_REQUIREMENT) |
|
216 | 216 | op.repo._writerequirements() |
|
217 | 217 | op.repo.setnarrowpats(includepats, excludepats) |
|
218 | 218 | narrowspec.copytoworkingcopy(op.repo) |
|
219 | 219 | |
|
220 | 220 | |
|
221 | 221 | @bundle2.parthandler(_CHANGESPECPART) |
|
222 | 222 | def _handlechangespec(op, inpart): |
|
223 | 223 | repo = op.repo |
|
224 | 224 | cl = repo.changelog |
|
225 | 225 | |
|
226 | 226 | # changesets which need to be stripped entirely. either they're no longer |
|
227 | 227 | # needed in the new narrow spec, or the server is sending a replacement |
|
228 | 228 | # in the changegroup part. |
|
229 | 229 | clkills = set() |
|
230 | 230 | |
|
231 | 231 | # A changespec part contains all the updates to ellipsis nodes |
|
232 | 232 | # that will happen as a result of widening or narrowing a |
|
233 | 233 | # repo. All the changes that this block encounters are ellipsis |
|
234 | 234 | # nodes or flags to kill an existing ellipsis. |
|
235 | 235 | chunksignal = changegroup.readexactly(inpart, 4) |
|
236 | 236 | while chunksignal != _DONESIGNAL: |
|
237 | 237 | if chunksignal == _KILLNODESIGNAL: |
|
238 | 238 | # a node used to be an ellipsis but isn't anymore |
|
239 | 239 | ck = changegroup.readexactly(inpart, 20) |
|
240 | 240 | if cl.hasnode(ck): |
|
241 | 241 | clkills.add(ck) |
|
242 | 242 | else: |
|
243 | 243 | raise error.Abort( |
|
244 | 244 | _(b'unexpected changespec node chunk type: %s') % chunksignal |
|
245 | 245 | ) |
|
246 | 246 | chunksignal = changegroup.readexactly(inpart, 4) |
|
247 | 247 | |
|
248 | 248 | if clkills: |
|
249 | 249 | # preserve bookmarks that repair.strip() would otherwise strip |
|
250 | 250 | op._bookmarksbackup = repo._bookmarks |
|
251 | 251 | |
|
252 | 252 | class dummybmstore(dict): |
|
253 | 253 | def applychanges(self, repo, tr, changes): |
|
254 | 254 | pass |
|
255 | 255 | |
|
256 | 256 | localrepo.localrepository._bookmarks.set(repo, dummybmstore()) |
|
257 | 257 | chgrpfile = repair.strip( |
|
258 | 258 | op.ui, repo, list(clkills), backup=True, topic=b'widen' |
|
259 | 259 | ) |
|
260 | 260 | if chgrpfile: |
|
261 | 261 | op._widen_uninterr = repo.ui.uninterruptible() |
|
262 | 262 | op._widen_uninterr.__enter__() |
|
263 | 263 | # presence of _widen_bundle attribute activates widen handler later |
|
264 | 264 | op._widen_bundle = chgrpfile |
|
265 | 265 | # Set the new narrowspec if we're widening. The setnewnarrowpats() method |
|
266 | 266 | # will currently always be there when using the core+narrowhg server, but |
|
267 | 267 | # other servers may include a changespec part even when not widening (e.g. |
|
268 | 268 | # because we're deepening a shallow repo). |
|
269 |     | if util.safehasattr(repo, b'setnewnarrowpats'):

    | 269 | if util.safehasattr(repo, 'setnewnarrowpats'):
|
270 | 270 | repo.setnewnarrowpats() |
|
271 | 271 | |
|
272 | 272 | |
|
273 | 273 | def handlechangegroup_widen(op, inpart): |
|
274 | 274 | """Changegroup exchange handler which restores temporarily-stripped nodes""" |
|
275 | 275 | # We saved a bundle with stripped node data we must now restore. |
|
276 | 276 | # This approach is based on mercurial/repair.py@6ee26a53c111. |
|
277 | 277 | repo = op.repo |
|
278 | 278 | ui = op.ui |
|
279 | 279 | |
|
280 | 280 | chgrpfile = op._widen_bundle |
|
281 | 281 | del op._widen_bundle |
|
282 | 282 | vfs = repo.vfs |
|
283 | 283 | |
|
284 | 284 | ui.note(_(b"adding branch\n")) |
|
285 | 285 | f = vfs.open(chgrpfile, b"rb") |
|
286 | 286 | try: |
|
287 | 287 | gen = exchange.readbundle(ui, f, chgrpfile, vfs) |
|
288 | 288 | # silence internal shuffling chatter |
|
289 | 289 | override = {(b'ui', b'quiet'): True} |
|
290 | 290 | if ui.verbose: |
|
291 | 291 | override = {} |
|
292 | 292 | with ui.configoverride(override): |
|
293 | 293 | if isinstance(gen, bundle2.unbundle20): |
|
294 | 294 | with repo.transaction(b'strip') as tr: |
|
295 | 295 | bundle2.processbundle(repo, gen, lambda: tr) |
|
296 | 296 | else: |
|
297 | 297 | gen.apply( |
|
298 | 298 | repo, b'strip', b'bundle:' + vfs.join(chgrpfile), True |
|
299 | 299 | ) |
|
300 | 300 | finally: |
|
301 | 301 | f.close() |
|
302 | 302 | |
|
303 | 303 | # remove undo files |
|
304 | 304 | for undovfs, undofile in repo.undofiles(): |
|
305 | 305 | try: |
|
306 | 306 | undovfs.unlink(undofile) |
|
307 | 307 | except OSError as e: |
|
308 | 308 | if e.errno != errno.ENOENT: |
|
309 | 309 | ui.warn( |
|
310 | 310 | _(b'error removing %s: %s\n') |
|
311 | 311 | % (undovfs.join(undofile), stringutil.forcebytestr(e)) |
|
312 | 312 | ) |
|
313 | 313 | |
|
314 | 314 | # Remove partial backup only if there were no exceptions |
|
315 | 315 | op._widen_uninterr.__exit__(None, None, None) |
|
316 | 316 | vfs.unlink(chgrpfile) |
|
317 | 317 | |
|
318 | 318 | |
|
319 | 319 | def setup(): |
|
320 | 320 | """Enable narrow repo support in bundle2-related extension points.""" |
|
321 | 321 | getbundleargs = wireprototypes.GETBUNDLE_ARGUMENTS |
|
322 | 322 | |
|
323 | 323 | getbundleargs[b'narrow'] = b'boolean' |
|
324 | 324 | getbundleargs[b'depth'] = b'plain' |
|
325 | 325 | getbundleargs[b'oldincludepats'] = b'csv' |
|
326 | 326 | getbundleargs[b'oldexcludepats'] = b'csv' |
|
327 | 327 | getbundleargs[b'known'] = b'csv' |
|
328 | 328 | |
|
329 | 329 | # Extend changegroup serving to handle requests from narrow clients. |
|
330 | 330 | origcgfn = exchange.getbundle2partsmapping[b'changegroup'] |
|
331 | 331 | |
|
332 | 332 | def wrappedcgfn(*args, **kwargs): |
|
333 | 333 | repo = args[1] |
|
334 | 334 | if repo.ui.has_section(_NARROWACL_SECTION): |
|
335 | 335 | kwargs = exchange.applynarrowacl(repo, kwargs) |
|
336 | 336 | |
|
337 | 337 | if kwargs.get(r'narrow', False) and repo.ui.configbool( |
|
338 | 338 | b'experimental', b'narrowservebrokenellipses' |
|
339 | 339 | ): |
|
340 | 340 | getbundlechangegrouppart_narrow(*args, **kwargs) |
|
341 | 341 | else: |
|
342 | 342 | origcgfn(*args, **kwargs) |
|
343 | 343 | |
|
344 | 344 | exchange.getbundle2partsmapping[b'changegroup'] = wrappedcgfn |
|
345 | 345 | |
|
346 | 346 | # Extend changegroup receiver so client can fixup after widen requests. |
|
347 | 347 | origcghandler = bundle2.parthandlermapping[b'changegroup'] |
|
348 | 348 | |
|
349 | 349 | def wrappedcghandler(op, inpart): |
|
350 | 350 | origcghandler(op, inpart) |
|
351 |     | if util.safehasattr(op, b'_widen_bundle'):

    | 351 | if util.safehasattr(op, '_widen_bundle'):
|
352 | 352 | handlechangegroup_widen(op, inpart) |
|
353 |     | if util.safehasattr(op, b'_bookmarksbackup'):

    | 353 | if util.safehasattr(op, '_bookmarksbackup'):
|
354 | 354 | localrepo.localrepository._bookmarks.set( |
|
355 | 355 | op.repo, op._bookmarksbackup |
|
356 | 356 | ) |
|
357 | 357 | del op._bookmarksbackup |
|
358 | 358 | |
|
359 | 359 | wrappedcghandler.params = origcghandler.params |
|
360 | 360 | bundle2.parthandlermapping[b'changegroup'] = wrappedcghandler |
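
The only lines changed in this hunk (269, 351 and 353 above, plus the matching safehasattr() calls in the files that follow) drop the b'' prefix from the attribute name. Presumably the point of passing a native str is that attribute lookup in Python 3 refuses bytes names outright: getattr() raises TypeError even when a default is supplied, so a bytes argument can never simply return False. A minimal sketch, assuming util.safehasattr is essentially a getattr-with-sentinel helper (the class name below is made up):

    _notset = object()

    def safehasattr(thing, attr):
        # Approximation of mercurial.util.safehasattr: getattr() with a
        # sentinel default instead of the exception-swallowing builtin.
        return getattr(thing, attr, _notset) is not _notset

    class op(object):
        _widen_bundle = 'bundlefile'

    assert safehasattr(op(), '_widen_bundle')         # str name: works
    assert not safehasattr(op(), '_bookmarksbackup')  # absent attr: False
    try:
        safehasattr(op(), b'_widen_bundle')           # bytes name on Python 3
    except TypeError:
        pass                                          # attribute name must be str
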
@@ -1,88 +1,88 b'' | |||
|
1 | 1 | # connectionpool.py - class for pooling peer connections for reuse |
|
2 | 2 | # |
|
3 | 3 | # Copyright 2017 Facebook, Inc. |
|
4 | 4 | # |
|
5 | 5 | # This software may be used and distributed according to the terms of the |
|
6 | 6 | # GNU General Public License version 2 or any later version. |
|
7 | 7 | |
|
8 | 8 | from __future__ import absolute_import |
|
9 | 9 | |
|
10 | 10 | from mercurial import ( |
|
11 | 11 | extensions, |
|
12 | 12 | hg, |
|
13 | 13 | pycompat, |
|
14 | 14 | sshpeer, |
|
15 | 15 | util, |
|
16 | 16 | ) |
|
17 | 17 | |
|
18 | 18 | _sshv1peer = sshpeer.sshv1peer |
|
19 | 19 | |
|
20 | 20 | |
|
21 | 21 | class connectionpool(object): |
|
22 | 22 | def __init__(self, repo): |
|
23 | 23 | self._repo = repo |
|
24 | 24 | self._pool = dict() |
|
25 | 25 | |
|
26 | 26 | def get(self, path): |
|
27 | 27 | pathpool = self._pool.get(path) |
|
28 | 28 | if pathpool is None: |
|
29 | 29 | pathpool = list() |
|
30 | 30 | self._pool[path] = pathpool |
|
31 | 31 | |
|
32 | 32 | conn = None |
|
33 | 33 | if len(pathpool) > 0: |
|
34 | 34 | try: |
|
35 | 35 | conn = pathpool.pop() |
|
36 | 36 | peer = conn.peer |
|
37 | 37 | # If the connection has died, drop it |
|
38 | 38 | if isinstance(peer, _sshv1peer): |
|
39 | 39 | if peer._subprocess.poll() is not None: |
|
40 | 40 | conn = None |
|
41 | 41 | except IndexError: |
|
42 | 42 | pass |
|
43 | 43 | |
|
44 | 44 | if conn is None: |
|
45 | 45 | |
|
46 | 46 | def _cleanup(orig): |
|
47 | 47 | # close pipee first so peer.cleanup reading it won't deadlock, |
|
48 | 48 | # if there are other processes with pipeo open (i.e. us). |
|
49 | 49 | peer = orig.im_self |
|
50 |    | if util.safehasattr(peer, b'pipee'):

   | 50 | if util.safehasattr(peer, 'pipee'):
|
51 | 51 | peer.pipee.close() |
|
52 | 52 | return orig() |
|
53 | 53 | |
|
54 | 54 | peer = hg.peer(self._repo.ui, {}, path) |
|
55 |    | if util.safehasattr(peer, b'cleanup'):

   | 55 | if util.safehasattr(peer, 'cleanup'):
|
56 | 56 | extensions.wrapfunction(peer, b'cleanup', _cleanup) |
|
57 | 57 | |
|
58 | 58 | conn = connection(pathpool, peer) |
|
59 | 59 | |
|
60 | 60 | return conn |
|
61 | 61 | |
|
62 | 62 | def close(self): |
|
63 | 63 | for pathpool in pycompat.itervalues(self._pool): |
|
64 | 64 | for conn in pathpool: |
|
65 | 65 | conn.close() |
|
66 | 66 | del pathpool[:] |
|
67 | 67 | |
|
68 | 68 | |
|
69 | 69 | class connection(object): |
|
70 | 70 | def __init__(self, pool, peer): |
|
71 | 71 | self._pool = pool |
|
72 | 72 | self.peer = peer |
|
73 | 73 | |
|
74 | 74 | def __enter__(self): |
|
75 | 75 | return self |
|
76 | 76 | |
|
77 | 77 | def __exit__(self, type, value, traceback): |
|
78 | 78 | # Only add the connection back to the pool if there was no exception, |
|
79 | 79 | # since an exception could mean the connection is not in a reusable |
|
80 | 80 | # state. |
|
81 | 81 | if type is None: |
|
82 | 82 | self._pool.append(self) |
|
83 | 83 | else: |
|
84 | 84 | self.close() |
|
85 | 85 | |
|
86 | 86 | def close(self): |
|
87 |    | if util.safehasattr(self.peer, b'cleanup'):

   | 87 | if util.safehasattr(self.peer, 'cleanup'):
|
88 | 88 | self.peer.cleanup() |
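
The connection objects handed out by the pool are context managers: leaving the with-block without an exception appends the connection back onto its per-path free list, while an exception closes it instead (see __exit__ and close() above). The sketch below exercises that behaviour with a stand-in peer; it assumes the connection class above is importable (it lives in remotefilelog's connectionpool.py and pulls in mercurial.util for the safehasattr() call in close()).

    class fakepeer(object):
        """Minimal stand-in peer; only cleanup() is needed by close()."""
        def __init__(self):
            self.cleaned = False
        def cleanup(self):
            self.cleaned = True

    pathpool = []                      # stands in for the pool's per-path list
    conn = connection(pathpool, fakepeer())

    with conn:
        pass                           # no exception: connection is pooled again
    assert pathpool == [conn]

    try:
        with conn:
            raise RuntimeError('simulated network failure')
    except RuntimeError:
        pass
    assert conn.peer.cleaned           # on error the peer is cleaned up instead
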
@@ -1,667 +1,667 b'' | |||
|
1 | 1 | # fileserverclient.py - client for communicating with the cache process |
|
2 | 2 | # |
|
3 | 3 | # Copyright 2013 Facebook, Inc. |
|
4 | 4 | # |
|
5 | 5 | # This software may be used and distributed according to the terms of the |
|
6 | 6 | # GNU General Public License version 2 or any later version. |
|
7 | 7 | |
|
8 | 8 | from __future__ import absolute_import |
|
9 | 9 | |
|
10 | 10 | import hashlib |
|
11 | 11 | import io |
|
12 | 12 | import os |
|
13 | 13 | import threading |
|
14 | 14 | import time |
|
15 | 15 | import zlib |
|
16 | 16 | |
|
17 | 17 | from mercurial.i18n import _ |
|
18 | 18 | from mercurial.node import bin, hex, nullid |
|
19 | 19 | from mercurial import ( |
|
20 | 20 | error, |
|
21 | 21 | node, |
|
22 | 22 | pycompat, |
|
23 | 23 | revlog, |
|
24 | 24 | sshpeer, |
|
25 | 25 | util, |
|
26 | 26 | wireprotov1peer, |
|
27 | 27 | ) |
|
28 | 28 | from mercurial.utils import procutil |
|
29 | 29 | |
|
30 | 30 | from . import ( |
|
31 | 31 | constants, |
|
32 | 32 | contentstore, |
|
33 | 33 | metadatastore, |
|
34 | 34 | ) |
|
35 | 35 | |
|
36 | 36 | _sshv1peer = sshpeer.sshv1peer |
|
37 | 37 | |
|
38 | 38 | # Statistics for debugging |
|
39 | 39 | fetchcost = 0 |
|
40 | 40 | fetches = 0 |
|
41 | 41 | fetched = 0 |
|
42 | 42 | fetchmisses = 0 |
|
43 | 43 | |
|
44 | 44 | _lfsmod = None |
|
45 | 45 | |
|
46 | 46 | |
|
47 | 47 | def getcachekey(reponame, file, id): |
|
48 | 48 | pathhash = node.hex(hashlib.sha1(file).digest()) |
|
49 | 49 | return os.path.join(reponame, pathhash[:2], pathhash[2:], id) |
|
50 | 50 | |
|
51 | 51 | |
|
52 | 52 | def getlocalkey(file, id): |
|
53 | 53 | pathhash = node.hex(hashlib.sha1(file).digest()) |
|
54 | 54 | return os.path.join(pathhash, id) |
|
55 | 55 | |
|
56 | 56 | |
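
getcachekey() above shards the shared on-disk cache by a sha1 of the file path: the resulting key is reponame/<first 2 hex digits>/<remaining 38 digits>/<file node>, so the first path component fans each repo out into at most 256 buckets. A small stdlib-only illustration (repo name, path and node are made up, and hexdigest() stands in for node.hex(...digest())):

    import hashlib
    import os

    def getcachekey(reponame, file, id):
        # Mirrors the helper above without requiring mercurial.node.
        pathhash = hashlib.sha1(file).hexdigest().encode('ascii')
        return os.path.join(reponame, pathhash[:2], pathhash[2:], id)

    key = getcachekey(b'myrepo', b'mercurial/util.py', b'a' * 40)
    print(key)  # e.g. myrepo/<2 hex chars>/<38 hex chars>/aaaa...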
|
57 | 57 | def peersetup(ui, peer): |
|
58 | 58 | class remotefilepeer(peer.__class__): |
|
59 | 59 | @wireprotov1peer.batchable |
|
60 | 60 | def x_rfl_getfile(self, file, node): |
|
61 | 61 | if not self.capable(b'x_rfl_getfile'): |
|
62 | 62 | raise error.Abort( |
|
63 | 63 | b'configured remotefile server does not support getfile' |
|
64 | 64 | ) |
|
65 | 65 | f = wireprotov1peer.future() |
|
66 | 66 | yield {b'file': file, b'node': node}, f |
|
67 | 67 | code, data = f.value.split(b'\0', 1) |
|
68 | 68 | if int(code): |
|
69 | 69 | raise error.LookupError(file, node, data) |
|
70 | 70 | yield data |
|
71 | 71 | |
|
72 | 72 | @wireprotov1peer.batchable |
|
73 | 73 | def x_rfl_getflogheads(self, path): |
|
74 | 74 | if not self.capable(b'x_rfl_getflogheads'): |
|
75 | 75 | raise error.Abort( |
|
76 | 76 | b'configured remotefile server does not ' |
|
77 | 77 | b'support getflogheads' |
|
78 | 78 | ) |
|
79 | 79 | f = wireprotov1peer.future() |
|
80 | 80 | yield {b'path': path}, f |
|
81 | 81 | heads = f.value.split(b'\n') if f.value else [] |
|
82 | 82 | yield heads |
|
83 | 83 | |
|
84 | 84 | def _updatecallstreamopts(self, command, opts): |
|
85 | 85 | if command != b'getbundle': |
|
86 | 86 | return |
|
87 | 87 | if ( |
|
88 | 88 | constants.NETWORK_CAP_LEGACY_SSH_GETFILES |
|
89 | 89 | not in self.capabilities() |
|
90 | 90 | ): |
|
91 | 91 | return |
|
92 |    | if not util.safehasattr(self, b'_localrepo'):

   | 92 | if not util.safehasattr(self, '_localrepo'):
|
93 | 93 | return |
|
94 | 94 | if ( |
|
95 | 95 | constants.SHALLOWREPO_REQUIREMENT |
|
96 | 96 | not in self._localrepo.requirements |
|
97 | 97 | ): |
|
98 | 98 | return |
|
99 | 99 | |
|
100 | 100 | bundlecaps = opts.get(b'bundlecaps') |
|
101 | 101 | if bundlecaps: |
|
102 | 102 | bundlecaps = [bundlecaps] |
|
103 | 103 | else: |
|
104 | 104 | bundlecaps = [] |
|
105 | 105 | |
|
106 | 106 | # shallow, includepattern, and excludepattern are a hacky way of |
|
107 | 107 | # carrying over data from the local repo to this getbundle |
|
108 | 108 | # command. We need to do it this way because bundle1 getbundle |
|
109 | 109 | # doesn't provide any other place we can hook in to manipulate |
|
110 | 110 | # getbundle args before it goes across the wire. Once we get rid |
|
111 | 111 | # of bundle1, we can use bundle2's _pullbundle2extraprepare to |
|
112 | 112 | # do this more cleanly. |
|
113 | 113 | bundlecaps.append(constants.BUNDLE2_CAPABLITY) |
|
114 | 114 | if self._localrepo.includepattern: |
|
115 | 115 | patterns = b'\0'.join(self._localrepo.includepattern) |
|
116 | 116 | includecap = b"includepattern=" + patterns |
|
117 | 117 | bundlecaps.append(includecap) |
|
118 | 118 | if self._localrepo.excludepattern: |
|
119 | 119 | patterns = b'\0'.join(self._localrepo.excludepattern) |
|
120 | 120 | excludecap = b"excludepattern=" + patterns |
|
121 | 121 | bundlecaps.append(excludecap) |
|
122 | 122 | opts[b'bundlecaps'] = b','.join(bundlecaps) |
|
123 | 123 | |
|
124 | 124 | def _sendrequest(self, command, args, **opts): |
|
125 | 125 | self._updatecallstreamopts(command, args) |
|
126 | 126 | return super(remotefilepeer, self)._sendrequest( |
|
127 | 127 | command, args, **opts |
|
128 | 128 | ) |
|
129 | 129 | |
|
130 | 130 | def _callstream(self, command, **opts): |
|
131 | 131 | supertype = super(remotefilepeer, self) |
|
132 |     | if not util.safehasattr(supertype, b'_sendrequest'):

    | 132 | if not util.safehasattr(supertype, '_sendrequest'):
|
133 | 133 | self._updatecallstreamopts(command, pycompat.byteskwargs(opts)) |
|
134 | 134 | return super(remotefilepeer, self)._callstream(command, **opts) |
|
135 | 135 | |
|
136 | 136 | peer.__class__ = remotefilepeer |
|
137 | 137 | |
|
138 | 138 | |
|
139 | 139 | class cacheconnection(object): |
|
140 | 140 | """The connection for communicating with the remote cache. Performs |
|
141 | 141 | gets and sets by communicating with an external process that has the |
|
142 | 142 | cache-specific implementation. |
|
143 | 143 | """ |
|
144 | 144 | |
|
145 | 145 | def __init__(self): |
|
146 | 146 | self.pipeo = self.pipei = self.pipee = None |
|
147 | 147 | self.subprocess = None |
|
148 | 148 | self.connected = False |
|
149 | 149 | |
|
150 | 150 | def connect(self, cachecommand): |
|
151 | 151 | if self.pipeo: |
|
152 | 152 | raise error.Abort(_(b"cache connection already open")) |
|
153 | 153 | self.pipei, self.pipeo, self.pipee, self.subprocess = procutil.popen4( |
|
154 | 154 | cachecommand |
|
155 | 155 | ) |
|
156 | 156 | self.connected = True |
|
157 | 157 | |
|
158 | 158 | def close(self): |
|
159 | 159 | def tryclose(pipe): |
|
160 | 160 | try: |
|
161 | 161 | pipe.close() |
|
162 | 162 | except Exception: |
|
163 | 163 | pass |
|
164 | 164 | |
|
165 | 165 | if self.connected: |
|
166 | 166 | try: |
|
167 | 167 | self.pipei.write(b"exit\n") |
|
168 | 168 | except Exception: |
|
169 | 169 | pass |
|
170 | 170 | tryclose(self.pipei) |
|
171 | 171 | self.pipei = None |
|
172 | 172 | tryclose(self.pipeo) |
|
173 | 173 | self.pipeo = None |
|
174 | 174 | tryclose(self.pipee) |
|
175 | 175 | self.pipee = None |
|
176 | 176 | try: |
|
177 | 177 | # Wait for process to terminate, making sure to avoid deadlock. |
|
178 | 178 | # See https://docs.python.org/2/library/subprocess.html for |
|
179 | 179 | # warnings about wait() and deadlocking. |
|
180 | 180 | self.subprocess.communicate() |
|
181 | 181 | except Exception: |
|
182 | 182 | pass |
|
183 | 183 | self.subprocess = None |
|
184 | 184 | self.connected = False |
|
185 | 185 | |
|
186 | 186 | def request(self, request, flush=True): |
|
187 | 187 | if self.connected: |
|
188 | 188 | try: |
|
189 | 189 | self.pipei.write(request) |
|
190 | 190 | if flush: |
|
191 | 191 | self.pipei.flush() |
|
192 | 192 | except IOError: |
|
193 | 193 | self.close() |
|
194 | 194 | |
|
195 | 195 | def receiveline(self): |
|
196 | 196 | if not self.connected: |
|
197 | 197 | return None |
|
198 | 198 | try: |
|
199 | 199 | result = self.pipeo.readline()[:-1] |
|
200 | 200 | if not result: |
|
201 | 201 | self.close() |
|
202 | 202 | except IOError: |
|
203 | 203 | self.close() |
|
204 | 204 | |
|
205 | 205 | return result |
|
206 | 206 | |
|
207 | 207 | |
|
208 | 208 | def _getfilesbatch( |
|
209 | 209 | remote, receivemissing, progresstick, missed, idmap, batchsize |
|
210 | 210 | ): |
|
211 | 211 | # Over http(s), iterbatch is a streamy method and we can start |
|
212 | 212 | # looking at results early. This means we send one (potentially |
|
213 | 213 | # large) request, but then we show nice progress as we process |
|
214 | 214 | # file results, rather than showing chunks of $batchsize in |
|
215 | 215 | # progress. |
|
216 | 216 | # |
|
217 | 217 | # Over ssh, iterbatch isn't streamy because batch() wasn't |
|
218 | 218 | # explicitly designed as a streaming method. In the future we |
|
219 | 219 | # should probably introduce a streambatch() method upstream and |
|
220 | 220 | # use that for this. |
|
221 | 221 | with remote.commandexecutor() as e: |
|
222 | 222 | futures = [] |
|
223 | 223 | for m in missed: |
|
224 | 224 | futures.append( |
|
225 | 225 | e.callcommand( |
|
226 | 226 | b'x_rfl_getfile', {b'file': idmap[m], b'node': m[-40:]} |
|
227 | 227 | ) |
|
228 | 228 | ) |
|
229 | 229 | |
|
230 | 230 | for i, m in enumerate(missed): |
|
231 | 231 | r = futures[i].result() |
|
232 | 232 | futures[i] = None # release memory |
|
233 | 233 | file_ = idmap[m] |
|
234 | 234 | node = m[-40:] |
|
235 | 235 | receivemissing(io.BytesIO(b'%d\n%s' % (len(r), r)), file_, node) |
|
236 | 236 | progresstick() |
|
237 | 237 | |
|
238 | 238 | |
|
239 | 239 | def _getfiles_optimistic( |
|
240 | 240 | remote, receivemissing, progresstick, missed, idmap, step |
|
241 | 241 | ): |
|
242 | 242 | remote._callstream(b"x_rfl_getfiles") |
|
243 | 243 | i = 0 |
|
244 | 244 | pipeo = remote._pipeo |
|
245 | 245 | pipei = remote._pipei |
|
246 | 246 | while i < len(missed): |
|
247 | 247 | # issue a batch of requests |
|
248 | 248 | start = i |
|
249 | 249 | end = min(len(missed), start + step) |
|
250 | 250 | i = end |
|
251 | 251 | for missingid in missed[start:end]: |
|
252 | 252 | # issue new request |
|
253 | 253 | versionid = missingid[-40:] |
|
254 | 254 | file = idmap[missingid] |
|
255 | 255 | sshrequest = b"%s%s\n" % (versionid, file) |
|
256 | 256 | pipeo.write(sshrequest) |
|
257 | 257 | pipeo.flush() |
|
258 | 258 | |
|
259 | 259 | # receive batch results |
|
260 | 260 | for missingid in missed[start:end]: |
|
261 | 261 | versionid = missingid[-40:] |
|
262 | 262 | file = idmap[missingid] |
|
263 | 263 | receivemissing(pipei, file, versionid) |
|
264 | 264 | progresstick() |
|
265 | 265 | |
|
266 | 266 | # End the command |
|
267 | 267 | pipeo.write(b'\n') |
|
268 | 268 | pipeo.flush() |
|
269 | 269 | |
|
270 | 270 | |
|
271 | 271 | def _getfiles_threaded( |
|
272 | 272 | remote, receivemissing, progresstick, missed, idmap, step |
|
273 | 273 | ): |
|
274 | 274 | remote._callstream(b"getfiles") |
|
275 | 275 | pipeo = remote._pipeo |
|
276 | 276 | pipei = remote._pipei |
|
277 | 277 | |
|
278 | 278 | def writer(): |
|
279 | 279 | for missingid in missed: |
|
280 | 280 | versionid = missingid[-40:] |
|
281 | 281 | file = idmap[missingid] |
|
282 | 282 | sshrequest = b"%s%s\n" % (versionid, file) |
|
283 | 283 | pipeo.write(sshrequest) |
|
284 | 284 | pipeo.flush() |
|
285 | 285 | |
|
286 | 286 | writerthread = threading.Thread(target=writer) |
|
287 | 287 | writerthread.daemon = True |
|
288 | 288 | writerthread.start() |
|
289 | 289 | |
|
290 | 290 | for missingid in missed: |
|
291 | 291 | versionid = missingid[-40:] |
|
292 | 292 | file = idmap[missingid] |
|
293 | 293 | receivemissing(pipei, file, versionid) |
|
294 | 294 | progresstick() |
|
295 | 295 | |
|
296 | 296 | writerthread.join() |
|
297 | 297 | # End the command |
|
298 | 298 | pipeo.write(b'\n') |
|
299 | 299 | pipeo.flush() |
|
300 | 300 | |
|
301 | 301 | |
|
302 | 302 | class fileserverclient(object): |
|
303 | 303 | """A client for requesting files from the remote file server. |
|
304 | 304 | """ |
|
305 | 305 | |
|
306 | 306 | def __init__(self, repo): |
|
307 | 307 | ui = repo.ui |
|
308 | 308 | self.repo = repo |
|
309 | 309 | self.ui = ui |
|
310 | 310 | self.cacheprocess = ui.config(b"remotefilelog", b"cacheprocess") |
|
311 | 311 | if self.cacheprocess: |
|
312 | 312 | self.cacheprocess = util.expandpath(self.cacheprocess) |
|
313 | 313 | |
|
314 | 314 | # This option causes remotefilelog to pass the full file path to the |
|
315 | 315 | # cacheprocess instead of a hashed key. |
|
316 | 316 | self.cacheprocesspasspath = ui.configbool( |
|
317 | 317 | b"remotefilelog", b"cacheprocess.includepath" |
|
318 | 318 | ) |
|
319 | 319 | |
|
320 | 320 | self.debugoutput = ui.configbool(b"remotefilelog", b"debug") |
|
321 | 321 | |
|
322 | 322 | self.remotecache = cacheconnection() |
|
323 | 323 | |
|
324 | 324 | def setstore(self, datastore, historystore, writedata, writehistory): |
|
325 | 325 | self.datastore = datastore |
|
326 | 326 | self.historystore = historystore |
|
327 | 327 | self.writedata = writedata |
|
328 | 328 | self.writehistory = writehistory |
|
329 | 329 | |
|
330 | 330 | def _connect(self): |
|
331 | 331 | return self.repo.connectionpool.get(self.repo.fallbackpath) |
|
332 | 332 | |
|
333 | 333 | def request(self, fileids): |
|
334 | 334 | """Takes a list of filename/node pairs and fetches them from the |
|
335 | 335 | server. Files are stored in the local cache. |
|
336 | 336 | A list of nodes that the server couldn't find is returned. |
|
337 | 337 | If the connection fails, an exception is raised. |
|
338 | 338 | """ |
|
339 | 339 | if not self.remotecache.connected: |
|
340 | 340 | self.connect() |
|
341 | 341 | cache = self.remotecache |
|
342 | 342 | writedata = self.writedata |
|
343 | 343 | |
|
344 | 344 | repo = self.repo |
|
345 | 345 | total = len(fileids) |
|
346 | 346 | request = b"get\n%d\n" % total |
|
347 | 347 | idmap = {} |
|
348 | 348 | reponame = repo.name |
|
349 | 349 | for file, id in fileids: |
|
350 | 350 | fullid = getcachekey(reponame, file, id) |
|
351 | 351 | if self.cacheprocesspasspath: |
|
352 | 352 | request += file + b'\0' |
|
353 | 353 | request += fullid + b"\n" |
|
354 | 354 | idmap[fullid] = file |
|
355 | 355 | |
|
356 | 356 | cache.request(request) |
|
357 | 357 | |
|
358 | 358 | progress = self.ui.makeprogress(_(b'downloading'), total=total) |
|
359 | 359 | progress.update(0) |
|
360 | 360 | |
|
361 | 361 | missed = [] |
|
362 | 362 | while True: |
|
363 | 363 | missingid = cache.receiveline() |
|
364 | 364 | if not missingid: |
|
365 | 365 | missedset = set(missed) |
|
366 | 366 | for missingid in idmap: |
|
367 | 367 | if not missingid in missedset: |
|
368 | 368 | missed.append(missingid) |
|
369 | 369 | self.ui.warn( |
|
370 | 370 | _( |
|
371 | 371 | b"warning: cache connection closed early - " |
|
372 | 372 | + b"falling back to server\n" |
|
373 | 373 | ) |
|
374 | 374 | ) |
|
375 | 375 | break |
|
376 | 376 | if missingid == b"0": |
|
377 | 377 | break |
|
378 | 378 | if missingid.startswith(b"_hits_"): |
|
379 | 379 | # receive progress reports |
|
380 | 380 | parts = missingid.split(b"_") |
|
381 | 381 | progress.increment(int(parts[2])) |
|
382 | 382 | continue |
|
383 | 383 | |
|
384 | 384 | missed.append(missingid) |
|
385 | 385 | |
|
386 | 386 | global fetchmisses |
|
387 | 387 | fetchmisses += len(missed) |
|
388 | 388 | |
|
389 | 389 | fromcache = total - len(missed) |
|
390 | 390 | progress.update(fromcache, total=total) |
|
391 | 391 | self.ui.log( |
|
392 | 392 | b"remotefilelog", |
|
393 | 393 | b"remote cache hit rate is %r of %r\n", |
|
394 | 394 | fromcache, |
|
395 | 395 | total, |
|
396 | 396 | hit=fromcache, |
|
397 | 397 | total=total, |
|
398 | 398 | ) |
|
399 | 399 | |
|
400 | 400 | oldumask = os.umask(0o002) |
|
401 | 401 | try: |
|
402 | 402 | # receive cache misses from master |
|
403 | 403 | if missed: |
|
404 | 404 | # When verbose is true, sshpeer prints 'running ssh...' |
|
405 | 405 | # to stdout, which can interfere with some command |
|
406 | 406 | # outputs |
|
407 | 407 | verbose = self.ui.verbose |
|
408 | 408 | self.ui.verbose = False |
|
409 | 409 | try: |
|
410 | 410 | with self._connect() as conn: |
|
411 | 411 | remote = conn.peer |
|
412 | 412 | if remote.capable( |
|
413 | 413 | constants.NETWORK_CAP_LEGACY_SSH_GETFILES |
|
414 | 414 | ): |
|
415 | 415 | if not isinstance(remote, _sshv1peer): |
|
416 | 416 | raise error.Abort( |
|
417 | 417 | b'remotefilelog requires ssh ' b'servers' |
|
418 | 418 | ) |
|
419 | 419 | step = self.ui.configint( |
|
420 | 420 | b'remotefilelog', b'getfilesstep' |
|
421 | 421 | ) |
|
422 | 422 | getfilestype = self.ui.config( |
|
423 | 423 | b'remotefilelog', b'getfilestype' |
|
424 | 424 | ) |
|
425 | 425 | if getfilestype == b'threaded': |
|
426 | 426 | _getfiles = _getfiles_threaded |
|
427 | 427 | else: |
|
428 | 428 | _getfiles = _getfiles_optimistic |
|
429 | 429 | _getfiles( |
|
430 | 430 | remote, |
|
431 | 431 | self.receivemissing, |
|
432 | 432 | progress.increment, |
|
433 | 433 | missed, |
|
434 | 434 | idmap, |
|
435 | 435 | step, |
|
436 | 436 | ) |
|
437 | 437 | elif remote.capable(b"x_rfl_getfile"): |
|
438 | 438 | if remote.capable(b'batch'): |
|
439 | 439 | batchdefault = 100 |
|
440 | 440 | else: |
|
441 | 441 | batchdefault = 10 |
|
442 | 442 | batchsize = self.ui.configint( |
|
443 | 443 | b'remotefilelog', b'batchsize', batchdefault |
|
444 | 444 | ) |
|
445 | 445 | self.ui.debug( |
|
446 | 446 | b'requesting %d files from ' |
|
447 | 447 | b'remotefilelog server...\n' % len(missed) |
|
448 | 448 | ) |
|
449 | 449 | _getfilesbatch( |
|
450 | 450 | remote, |
|
451 | 451 | self.receivemissing, |
|
452 | 452 | progress.increment, |
|
453 | 453 | missed, |
|
454 | 454 | idmap, |
|
455 | 455 | batchsize, |
|
456 | 456 | ) |
|
457 | 457 | else: |
|
458 | 458 | raise error.Abort( |
|
459 | 459 | b"configured remotefilelog server" |
|
460 | 460 | b" does not support remotefilelog" |
|
461 | 461 | ) |
|
462 | 462 | |
|
463 | 463 | self.ui.log( |
|
464 | 464 | b"remotefilefetchlog", |
|
465 | 465 | b"Success\n", |
|
466 | 466 | fetched_files=progress.pos - fromcache, |
|
467 | 467 | total_to_fetch=total - fromcache, |
|
468 | 468 | ) |
|
469 | 469 | except Exception: |
|
470 | 470 | self.ui.log( |
|
471 | 471 | b"remotefilefetchlog", |
|
472 | 472 | b"Fail\n", |
|
473 | 473 | fetched_files=progress.pos - fromcache, |
|
474 | 474 | total_to_fetch=total - fromcache, |
|
475 | 475 | ) |
|
476 | 476 | raise |
|
477 | 477 | finally: |
|
478 | 478 | self.ui.verbose = verbose |
|
479 | 479 | # send to memcache |
|
480 | 480 | request = b"set\n%d\n%s\n" % (len(missed), b"\n".join(missed)) |
|
481 | 481 | cache.request(request) |
|
482 | 482 | |
|
483 | 483 | progress.complete() |
|
484 | 484 | |
|
485 | 485 | # mark ourselves as a user of this cache |
|
486 | 486 | writedata.markrepo(self.repo.path) |
|
487 | 487 | finally: |
|
488 | 488 | os.umask(oldumask) |
|
489 | 489 | |
|
490 | 490 | def receivemissing(self, pipe, filename, node): |
|
491 | 491 | line = pipe.readline()[:-1] |
|
492 | 492 | if not line: |
|
493 | 493 | raise error.ResponseError( |
|
494 | 494 | _(b"error downloading file contents:"), |
|
495 | 495 | _(b"connection closed early"), |
|
496 | 496 | ) |
|
497 | 497 | size = int(line) |
|
498 | 498 | data = pipe.read(size) |
|
499 | 499 | if len(data) != size: |
|
500 | 500 | raise error.ResponseError( |
|
501 | 501 | _(b"error downloading file contents:"), |
|
502 | 502 | _(b"only received %s of %s bytes") % (len(data), size), |
|
503 | 503 | ) |
|
504 | 504 | |
|
505 | 505 | self.writedata.addremotefilelognode( |
|
506 | 506 | filename, bin(node), zlib.decompress(data) |
|
507 | 507 | ) |
|
508 | 508 | |
|
509 | 509 | def connect(self): |
|
510 | 510 | if self.cacheprocess: |
|
511 | 511 | cmd = b"%s %s" % (self.cacheprocess, self.writedata._path) |
|
512 | 512 | self.remotecache.connect(cmd) |
|
513 | 513 | else: |
|
514 | 514 | # If no cache process is specified, we fake one that always |
|
515 | 515 | # returns cache misses. This enables tests to run easily |
|
516 | 516 | # and may eventually allow us to be a drop in replacement |
|
517 | 517 | # for the largefiles extension. |
|
518 | 518 | class simplecache(object): |
|
519 | 519 | def __init__(self): |
|
520 | 520 | self.missingids = [] |
|
521 | 521 | self.connected = True |
|
522 | 522 | |
|
523 | 523 | def close(self): |
|
524 | 524 | pass |
|
525 | 525 | |
|
526 | 526 | def request(self, value, flush=True): |
|
527 | 527 | lines = value.split(b"\n") |
|
528 | 528 | if lines[0] != b"get": |
|
529 | 529 | return |
|
530 | 530 | self.missingids = lines[2:-1] |
|
531 | 531 | self.missingids.append(b'0') |
|
532 | 532 | |
|
533 | 533 | def receiveline(self): |
|
534 | 534 | if len(self.missingids) > 0: |
|
535 | 535 | return self.missingids.pop(0) |
|
536 | 536 | return None |
|
537 | 537 | |
|
538 | 538 | self.remotecache = simplecache() |
|
539 | 539 | |
|
540 | 540 | def close(self): |
|
541 | 541 | if fetches: |
|
542 | 542 | msg = ( |
|
543 | 543 | b"%d files fetched over %d fetches - " |
|
544 | 544 | + b"(%d misses, %0.2f%% hit ratio) over %0.2fs\n" |
|
545 | 545 | ) % ( |
|
546 | 546 | fetched, |
|
547 | 547 | fetches, |
|
548 | 548 | fetchmisses, |
|
549 | 549 | float(fetched - fetchmisses) / float(fetched) * 100.0, |
|
550 | 550 | fetchcost, |
|
551 | 551 | ) |
|
552 | 552 | if self.debugoutput: |
|
553 | 553 | self.ui.warn(msg) |
|
554 | 554 | self.ui.log( |
|
555 | 555 | b"remotefilelog.prefetch", |
|
556 | 556 | msg.replace(b"%", b"%%"), |
|
557 | 557 | remotefilelogfetched=fetched, |
|
558 | 558 | remotefilelogfetches=fetches, |
|
559 | 559 | remotefilelogfetchmisses=fetchmisses, |
|
560 | 560 | remotefilelogfetchtime=fetchcost * 1000, |
|
561 | 561 | ) |
|
562 | 562 | |
|
563 | 563 | if self.remotecache.connected: |
|
564 | 564 | self.remotecache.close() |
|
565 | 565 | |
|
566 | 566 | def prefetch( |
|
567 | 567 | self, fileids, force=False, fetchdata=True, fetchhistory=False |
|
568 | 568 | ): |
|
569 | 569 | """downloads the given file versions to the cache |
|
570 | 570 | """ |
|
571 | 571 | repo = self.repo |
|
572 | 572 | idstocheck = [] |
|
573 | 573 | for file, id in fileids: |
|
574 | 574 | # hack |
|
575 | 575 | # - we don't use .hgtags |
|
576 | 576 | # - workingctx produces ids with length 42, |
|
577 | 577 | # which we skip since they aren't in any cache |
|
578 | 578 | if ( |
|
579 | 579 | file == b'.hgtags' |
|
580 | 580 | or len(id) == 42 |
|
581 | 581 | or not repo.shallowmatch(file) |
|
582 | 582 | ): |
|
583 | 583 | continue |
|
584 | 584 | |
|
585 | 585 | idstocheck.append((file, bin(id))) |
|
586 | 586 | |
|
587 | 587 | datastore = self.datastore |
|
588 | 588 | historystore = self.historystore |
|
589 | 589 | if force: |
|
590 | 590 | datastore = contentstore.unioncontentstore(*repo.shareddatastores) |
|
591 | 591 | historystore = metadatastore.unionmetadatastore( |
|
592 | 592 | *repo.sharedhistorystores |
|
593 | 593 | ) |
|
594 | 594 | |
|
595 | 595 | missingids = set() |
|
596 | 596 | if fetchdata: |
|
597 | 597 | missingids.update(datastore.getmissing(idstocheck)) |
|
598 | 598 | if fetchhistory: |
|
599 | 599 | missingids.update(historystore.getmissing(idstocheck)) |
|
600 | 600 | |
|
601 | 601 | # partition missing nodes into nullid and not-nullid so we can |
|
602 | 602 | # warn about this filtering potentially shadowing bugs. |
|
603 | 603 | nullids = len([None for unused, id in missingids if id == nullid]) |
|
604 | 604 | if nullids: |
|
605 | 605 | missingids = [(f, id) for f, id in missingids if id != nullid] |
|
606 | 606 | repo.ui.develwarn( |
|
607 | 607 | ( |
|
608 | 608 | b'remotefilelog not fetching %d null revs' |
|
609 | 609 | b' - this is likely hiding bugs' % nullids |
|
610 | 610 | ), |
|
611 | 611 | config=b'remotefilelog-ext', |
|
612 | 612 | ) |
|
613 | 613 | if missingids: |
|
614 | 614 | global fetches, fetched, fetchcost |
|
615 | 615 | fetches += 1 |
|
616 | 616 | |
|
617 | 617 | # We want to be able to detect excess individual file downloads, so |
|
618 | 618 | # let's log that information for debugging. |
|
619 | 619 | if fetches >= 15 and fetches < 18: |
|
620 | 620 | if fetches == 15: |
|
621 | 621 | fetchwarning = self.ui.config( |
|
622 | 622 | b'remotefilelog', b'fetchwarning' |
|
623 | 623 | ) |
|
624 | 624 | if fetchwarning: |
|
625 | 625 | self.ui.warn(fetchwarning + b'\n') |
|
626 | 626 | self.logstacktrace() |
|
627 | 627 | missingids = [(file, hex(id)) for file, id in sorted(missingids)] |
|
628 | 628 | fetched += len(missingids) |
|
629 | 629 | start = time.time() |
|
630 | 630 | missingids = self.request(missingids) |
|
631 | 631 | if missingids: |
|
632 | 632 | raise error.Abort( |
|
633 | 633 | _(b"unable to download %d files") % len(missingids) |
|
634 | 634 | ) |
|
635 | 635 | fetchcost += time.time() - start |
|
636 | 636 | self._lfsprefetch(fileids) |
|
637 | 637 | |
|
638 | 638 | def _lfsprefetch(self, fileids): |
|
639 | 639 | if not _lfsmod or not util.safehasattr( |
|
640 | 640 | self.repo.svfs, b'lfslocalblobstore' |
|
641 | 641 | ): |
|
642 | 642 | return |
|
643 | 643 | if not _lfsmod.wrapper.candownload(self.repo): |
|
644 | 644 | return |
|
645 | 645 | pointers = [] |
|
646 | 646 | store = self.repo.svfs.lfslocalblobstore |
|
647 | 647 | for file, id in fileids: |
|
648 | 648 | node = bin(id) |
|
649 | 649 | rlog = self.repo.file(file) |
|
650 | 650 | if rlog.flags(node) & revlog.REVIDX_EXTSTORED: |
|
651 | 651 | text = rlog.rawdata(node) |
|
652 | 652 | p = _lfsmod.pointer.deserialize(text) |
|
653 | 653 | oid = p.oid() |
|
654 | 654 | if not store.has(oid): |
|
655 | 655 | pointers.append(p) |
|
656 | 656 | if len(pointers) > 0: |
|
657 | 657 | self.repo.svfs.lfsremoteblobstore.readbatch(pointers, store) |
|
658 | 658 | assert all(store.has(p.oid()) for p in pointers) |
|
659 | 659 | |
|
660 | 660 | def logstacktrace(self): |
|
661 | 661 | import traceback |
|
662 | 662 | |
|
663 | 663 | self.ui.log( |
|
664 | 664 | b'remotefilelog', |
|
665 | 665 | b'excess remotefilelog fetching:\n%s\n', |
|
666 | 666 | b''.join(traceback.format_stack()), |
|
667 | 667 | ) |
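
For context, the exchange that request() and close() above drive against the external cacheprocess is line based: the client writes "get", a count, and that many cache keys (each optionally prefixed with the file path and a NUL when cacheprocess.includepath is set); the process answers with one line per missing key, may interleave "_hits_<n>_..." progress lines, and finishes the list with a line containing "0"; keys the client then fetches from the server are reported back with a "set" request, and "exit" ends the session. A deliberately dumb cacheprocess that stores nothing and reports every key as a miss (the same behaviour as the in-process simplecache fallback above) could be sketched like this; it covers only the common case, with text-mode I/O and non-empty key lists:

    #!/usr/bin/env python
    import sys

    def main():
        stdin, stdout = sys.stdin, sys.stdout
        while True:
            command = stdin.readline().strip()
            if not command or command == 'exit':
                return
            count = int(stdin.readline())
            keys = [stdin.readline().rstrip('\n') for _ in range(count)]
            if command == 'get':
                for key in keys:
                    stdout.write(key + '\n')   # report every key as a miss
                stdout.write('0\n')            # end of the miss list
                stdout.flush()
            # 'set' carries keys the client fetched itself; a real cache
            # would store them, this sketch simply ignores them.

    if __name__ == '__main__':
        main()
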
@@ -1,912 +1,912 b'' | |||
|
1 | 1 | from __future__ import absolute_import |
|
2 | 2 | |
|
3 | 3 | import os |
|
4 | 4 | import time |
|
5 | 5 | |
|
6 | 6 | from mercurial.i18n import _ |
|
7 | 7 | from mercurial.node import ( |
|
8 | 8 | nullid, |
|
9 | 9 | short, |
|
10 | 10 | ) |
|
11 | 11 | from mercurial import ( |
|
12 | 12 | encoding, |
|
13 | 13 | error, |
|
14 | 14 | lock as lockmod, |
|
15 | 15 | mdiff, |
|
16 | 16 | policy, |
|
17 | 17 | pycompat, |
|
18 | 18 | scmutil, |
|
19 | 19 | util, |
|
20 | 20 | vfs, |
|
21 | 21 | ) |
|
22 | 22 | from mercurial.utils import procutil |
|
23 | 23 | from . import ( |
|
24 | 24 | constants, |
|
25 | 25 | contentstore, |
|
26 | 26 | datapack, |
|
27 | 27 | historypack, |
|
28 | 28 | metadatastore, |
|
29 | 29 | shallowutil, |
|
30 | 30 | ) |
|
31 | 31 | |
|
32 | 32 | osutil = policy.importmod(r'osutil') |
|
33 | 33 | |
|
34 | 34 | |
|
35 | 35 | class RepackAlreadyRunning(error.Abort): |
|
36 | 36 | pass |
|
37 | 37 | |
|
38 | 38 | |
|
39 | 39 | def backgroundrepack( |
|
40 | 40 | repo, incremental=True, packsonly=False, ensurestart=False |
|
41 | 41 | ): |
|
42 | 42 | cmd = [procutil.hgexecutable(), b'-R', repo.origroot, b'repack'] |
|
43 | 43 | msg = _(b"(running background repack)\n") |
|
44 | 44 | if incremental: |
|
45 | 45 | cmd.append(b'--incremental') |
|
46 | 46 | msg = _(b"(running background incremental repack)\n") |
|
47 | 47 | if packsonly: |
|
48 | 48 | cmd.append(b'--packsonly') |
|
49 | 49 | repo.ui.warn(msg) |
|
50 | 50 | # We know this command will find a binary, so don't block on it starting. |
|
51 | 51 | procutil.runbgcommand(cmd, encoding.environ, ensurestart=ensurestart) |
|
52 | 52 | |
|
53 | 53 | |
|
54 | 54 | def fullrepack(repo, options=None): |
|
55 | 55 | """If ``packsonly`` is True, stores creating only loose objects are skipped. |
|
56 | 56 | """ |
|
57 |    | if util.safehasattr(repo, b'shareddatastores'):

   | 57 | if util.safehasattr(repo, 'shareddatastores'):
|
58 | 58 | datasource = contentstore.unioncontentstore(*repo.shareddatastores) |
|
59 | 59 | historysource = metadatastore.unionmetadatastore( |
|
60 | 60 | *repo.sharedhistorystores, allowincomplete=True |
|
61 | 61 | ) |
|
62 | 62 | |
|
63 | 63 | packpath = shallowutil.getcachepackpath( |
|
64 | 64 | repo, constants.FILEPACK_CATEGORY |
|
65 | 65 | ) |
|
66 | 66 | _runrepack( |
|
67 | 67 | repo, |
|
68 | 68 | datasource, |
|
69 | 69 | historysource, |
|
70 | 70 | packpath, |
|
71 | 71 | constants.FILEPACK_CATEGORY, |
|
72 | 72 | options=options, |
|
73 | 73 | ) |
|
74 | 74 | |
|
75 |    | if util.safehasattr(repo.manifestlog, b'datastore'):

   | 75 | if util.safehasattr(repo.manifestlog, 'datastore'):
|
76 | 76 | localdata, shareddata = _getmanifeststores(repo) |
|
77 | 77 | lpackpath, ldstores, lhstores = localdata |
|
78 | 78 | spackpath, sdstores, shstores = shareddata |
|
79 | 79 | |
|
80 | 80 | # Repack the shared manifest store |
|
81 | 81 | datasource = contentstore.unioncontentstore(*sdstores) |
|
82 | 82 | historysource = metadatastore.unionmetadatastore( |
|
83 | 83 | *shstores, allowincomplete=True |
|
84 | 84 | ) |
|
85 | 85 | _runrepack( |
|
86 | 86 | repo, |
|
87 | 87 | datasource, |
|
88 | 88 | historysource, |
|
89 | 89 | spackpath, |
|
90 | 90 | constants.TREEPACK_CATEGORY, |
|
91 | 91 | options=options, |
|
92 | 92 | ) |
|
93 | 93 | |
|
94 | 94 | # Repack the local manifest store |
|
95 | 95 | datasource = contentstore.unioncontentstore( |
|
96 | 96 | *ldstores, allowincomplete=True |
|
97 | 97 | ) |
|
98 | 98 | historysource = metadatastore.unionmetadatastore( |
|
99 | 99 | *lhstores, allowincomplete=True |
|
100 | 100 | ) |
|
101 | 101 | _runrepack( |
|
102 | 102 | repo, |
|
103 | 103 | datasource, |
|
104 | 104 | historysource, |
|
105 | 105 | lpackpath, |
|
106 | 106 | constants.TREEPACK_CATEGORY, |
|
107 | 107 | options=options, |
|
108 | 108 | ) |
|
109 | 109 | |
|
110 | 110 | |
|
111 | 111 | def incrementalrepack(repo, options=None): |
|
112 | 112 | """This repacks the repo by looking at the distribution of pack files in the |
|
113 | 113 | repo and performing the most minimal repack to keep the repo in good shape. |
|
114 | 114 | """ |
|
115 |     | if util.safehasattr(repo, b'shareddatastores'):

    | 115 | if util.safehasattr(repo, 'shareddatastores'):
|
116 | 116 | packpath = shallowutil.getcachepackpath( |
|
117 | 117 | repo, constants.FILEPACK_CATEGORY |
|
118 | 118 | ) |
|
119 | 119 | _incrementalrepack( |
|
120 | 120 | repo, |
|
121 | 121 | repo.shareddatastores, |
|
122 | 122 | repo.sharedhistorystores, |
|
123 | 123 | packpath, |
|
124 | 124 | constants.FILEPACK_CATEGORY, |
|
125 | 125 | options=options, |
|
126 | 126 | ) |
|
127 | 127 | |
|
128 |     | if util.safehasattr(repo.manifestlog, b'datastore'):

    | 128 | if util.safehasattr(repo.manifestlog, 'datastore'):
|
129 | 129 | localdata, shareddata = _getmanifeststores(repo) |
|
130 | 130 | lpackpath, ldstores, lhstores = localdata |
|
131 | 131 | spackpath, sdstores, shstores = shareddata |
|
132 | 132 | |
|
133 | 133 | # Repack the shared manifest store |
|
134 | 134 | _incrementalrepack( |
|
135 | 135 | repo, |
|
136 | 136 | sdstores, |
|
137 | 137 | shstores, |
|
138 | 138 | spackpath, |
|
139 | 139 | constants.TREEPACK_CATEGORY, |
|
140 | 140 | options=options, |
|
141 | 141 | ) |
|
142 | 142 | |
|
143 | 143 | # Repack the local manifest store |
|
144 | 144 | _incrementalrepack( |
|
145 | 145 | repo, |
|
146 | 146 | ldstores, |
|
147 | 147 | lhstores, |
|
148 | 148 | lpackpath, |
|
149 | 149 | constants.TREEPACK_CATEGORY, |
|
150 | 150 | allowincompletedata=True, |
|
151 | 151 | options=options, |
|
152 | 152 | ) |
|
153 | 153 | |
|
154 | 154 | |
|
155 | 155 | def _getmanifeststores(repo): |
|
156 | 156 | shareddatastores = repo.manifestlog.shareddatastores |
|
157 | 157 | localdatastores = repo.manifestlog.localdatastores |
|
158 | 158 | sharedhistorystores = repo.manifestlog.sharedhistorystores |
|
159 | 159 | localhistorystores = repo.manifestlog.localhistorystores |
|
160 | 160 | |
|
161 | 161 | sharedpackpath = shallowutil.getcachepackpath( |
|
162 | 162 | repo, constants.TREEPACK_CATEGORY |
|
163 | 163 | ) |
|
164 | 164 | localpackpath = shallowutil.getlocalpackpath( |
|
165 | 165 | repo.svfs.vfs.base, constants.TREEPACK_CATEGORY |
|
166 | 166 | ) |
|
167 | 167 | |
|
168 | 168 | return ( |
|
169 | 169 | (localpackpath, localdatastores, localhistorystores), |
|
170 | 170 | (sharedpackpath, shareddatastores, sharedhistorystores), |
|
171 | 171 | ) |
|
172 | 172 | |
|
173 | 173 | |
|
174 | 174 | def _topacks(packpath, files, constructor): |
|
175 | 175 | paths = list(os.path.join(packpath, p) for p in files) |
|
176 | 176 | packs = list(constructor(p) for p in paths) |
|
177 | 177 | return packs |
|
178 | 178 | |
|
179 | 179 | |
|
180 | 180 | def _deletebigpacks(repo, folder, files): |
|
181 | 181 | """Deletes packfiles that are bigger than ``packs.maxpacksize``. |
|
182 | 182 | |
|
183 | 183 | Returns ``files` with the removed files omitted.""" |
|
184 | 184 | maxsize = repo.ui.configbytes(b"packs", b"maxpacksize") |
|
185 | 185 | if maxsize <= 0: |
|
186 | 186 | return files |
|
187 | 187 | |
|
188 | 188 | # This only considers datapacks today, but we could broaden it to include |
|
189 | 189 | # historypacks. |
|
190 | 190 | VALIDEXTS = [b".datapack", b".dataidx"] |
|
191 | 191 | |
|
192 | 192 | # Either an oversize index or datapack will trigger cleanup of the whole |
|
193 | 193 | # pack: |
|
194 | 194 | oversized = { |
|
195 | 195 | os.path.splitext(path)[0] |
|
196 | 196 | for path, ftype, stat in files |
|
197 | 197 | if (stat.st_size > maxsize and (os.path.splitext(path)[1] in VALIDEXTS)) |
|
198 | 198 | } |
|
199 | 199 | |
|
200 | 200 | for rootfname in oversized: |
|
201 | 201 | rootpath = os.path.join(folder, rootfname) |
|
202 | 202 | for ext in VALIDEXTS: |
|
203 | 203 | path = rootpath + ext |
|
204 | 204 | repo.ui.debug( |
|
205 | 205 | b'removing oversize packfile %s (%s)\n' |
|
206 | 206 | % (path, util.bytecount(os.stat(path).st_size)) |
|
207 | 207 | ) |
|
208 | 208 | os.unlink(path) |
|
209 | 209 | return [row for row in files if os.path.basename(row[0]) not in oversized] |
|
210 | 210 | |
|
211 | 211 | |
|
212 | 212 | def _incrementalrepack( |
|
213 | 213 | repo, |
|
214 | 214 | datastore, |
|
215 | 215 | historystore, |
|
216 | 216 | packpath, |
|
217 | 217 | category, |
|
218 | 218 | allowincompletedata=False, |
|
219 | 219 | options=None, |
|
220 | 220 | ): |
|
221 | 221 | shallowutil.mkstickygroupdir(repo.ui, packpath) |
|
222 | 222 | |
|
223 | 223 | files = osutil.listdir(packpath, stat=True) |
|
224 | 224 | files = _deletebigpacks(repo, packpath, files) |
|
225 | 225 | datapacks = _topacks( |
|
226 | 226 | packpath, _computeincrementaldatapack(repo.ui, files), datapack.datapack |
|
227 | 227 | ) |
|
228 | 228 | datapacks.extend( |
|
229 | 229 | s for s in datastore if not isinstance(s, datapack.datapackstore) |
|
230 | 230 | ) |
|
231 | 231 | |
|
232 | 232 | historypacks = _topacks( |
|
233 | 233 | packpath, |
|
234 | 234 | _computeincrementalhistorypack(repo.ui, files), |
|
235 | 235 | historypack.historypack, |
|
236 | 236 | ) |
|
237 | 237 | historypacks.extend( |
|
238 | 238 | s |
|
239 | 239 | for s in historystore |
|
240 | 240 | if not isinstance(s, historypack.historypackstore) |
|
241 | 241 | ) |
|
242 | 242 | |
|
243 | 243 | # ``allhistory{files,packs}`` contains all known history packs, even ones we |
|
244 | 244 | # don't plan to repack. They are used during the datapack repack to ensure |
|
245 | 245 | # good ordering of nodes. |
|
246 | 246 | allhistoryfiles = _allpackfileswithsuffix( |
|
247 | 247 | files, historypack.PACKSUFFIX, historypack.INDEXSUFFIX |
|
248 | 248 | ) |
|
249 | 249 | allhistorypacks = _topacks( |
|
250 | 250 | packpath, |
|
251 | 251 | (f for f, mode, stat in allhistoryfiles), |
|
252 | 252 | historypack.historypack, |
|
253 | 253 | ) |
|
254 | 254 | allhistorypacks.extend( |
|
255 | 255 | s |
|
256 | 256 | for s in historystore |
|
257 | 257 | if not isinstance(s, historypack.historypackstore) |
|
258 | 258 | ) |
|
259 | 259 | _runrepack( |
|
260 | 260 | repo, |
|
261 | 261 | contentstore.unioncontentstore( |
|
262 | 262 | *datapacks, allowincomplete=allowincompletedata |
|
263 | 263 | ), |
|
264 | 264 | metadatastore.unionmetadatastore(*historypacks, allowincomplete=True), |
|
265 | 265 | packpath, |
|
266 | 266 | category, |
|
267 | 267 | fullhistory=metadatastore.unionmetadatastore( |
|
268 | 268 | *allhistorypacks, allowincomplete=True |
|
269 | 269 | ), |
|
270 | 270 | options=options, |
|
271 | 271 | ) |
|
272 | 272 | |
|
273 | 273 | |
|
274 | 274 | def _computeincrementaldatapack(ui, files): |
|
275 | 275 | opts = { |
|
276 | 276 | b'gencountlimit': ui.configint(b'remotefilelog', b'data.gencountlimit'), |
|
277 | 277 | b'generations': ui.configlist(b'remotefilelog', b'data.generations'), |
|
278 | 278 | b'maxrepackpacks': ui.configint( |
|
279 | 279 | b'remotefilelog', b'data.maxrepackpacks' |
|
280 | 280 | ), |
|
281 | 281 | b'repackmaxpacksize': ui.configbytes( |
|
282 | 282 | b'remotefilelog', b'data.repackmaxpacksize' |
|
283 | 283 | ), |
|
284 | 284 | b'repacksizelimit': ui.configbytes( |
|
285 | 285 | b'remotefilelog', b'data.repacksizelimit' |
|
286 | 286 | ), |
|
287 | 287 | } |
|
288 | 288 | |
|
289 | 289 | packfiles = _allpackfileswithsuffix( |
|
290 | 290 | files, datapack.PACKSUFFIX, datapack.INDEXSUFFIX |
|
291 | 291 | ) |
|
292 | 292 | return _computeincrementalpack(packfiles, opts) |
|
293 | 293 | |
|
294 | 294 | |
|
295 | 295 | def _computeincrementalhistorypack(ui, files): |
|
296 | 296 | opts = { |
|
297 | 297 | b'gencountlimit': ui.configint( |
|
298 | 298 | b'remotefilelog', b'history.gencountlimit' |
|
299 | 299 | ), |
|
300 | 300 | b'generations': ui.configlist( |
|
301 | 301 | b'remotefilelog', b'history.generations', [b'100MB'] |
|
302 | 302 | ), |
|
303 | 303 | b'maxrepackpacks': ui.configint( |
|
304 | 304 | b'remotefilelog', b'history.maxrepackpacks' |
|
305 | 305 | ), |
|
306 | 306 | b'repackmaxpacksize': ui.configbytes( |
|
307 | 307 | b'remotefilelog', b'history.repackmaxpacksize', b'400MB' |
|
308 | 308 | ), |
|
309 | 309 | b'repacksizelimit': ui.configbytes( |
|
310 | 310 | b'remotefilelog', b'history.repacksizelimit' |
|
311 | 311 | ), |
|
312 | 312 | } |
|
313 | 313 | |
|
314 | 314 | packfiles = _allpackfileswithsuffix( |
|
315 | 315 | files, historypack.PACKSUFFIX, historypack.INDEXSUFFIX |
|
316 | 316 | ) |
|
317 | 317 | return _computeincrementalpack(packfiles, opts) |
|
318 | 318 | |
|
319 | 319 | |
|
320 | 320 | def _allpackfileswithsuffix(files, packsuffix, indexsuffix): |
|
321 | 321 | result = [] |
|
322 | 322 | fileset = set(fn for fn, mode, stat in files) |
|
323 | 323 | for filename, mode, stat in files: |
|
324 | 324 | if not filename.endswith(packsuffix): |
|
325 | 325 | continue |
|
326 | 326 | |
|
327 | 327 | prefix = filename[: -len(packsuffix)] |
|
328 | 328 | |
|
329 | 329 | # Don't process a pack if it doesn't have an index. |
|
330 | 330 | if (prefix + indexsuffix) not in fileset: |
|
331 | 331 | continue |
|
332 | 332 | result.append((prefix, mode, stat)) |
|
333 | 333 | |
|
334 | 334 | return result |
|
335 | 335 | |
|
336 | 336 | |
|
337 | 337 | def _computeincrementalpack(files, opts): |
|
338 | 338 | """Given a set of pack files along with the configuration options, this |
|
339 | 339 | function computes the list of files that should be packed as part of an |
|
340 | 340 | incremental repack. |
|
341 | 341 | |
|
342 | 342 | It tries to strike a balance between keeping incremental repacks cheap (i.e. |
|
343 | 343 | packing small things when possible, and rolling the packs up to the big ones |
|
344 | 344 | over time). |
|
345 | 345 | """ |
|
346 | 346 | |
|
347 | 347 | limits = list( |
|
348 | 348 | sorted((util.sizetoint(s) for s in opts[b'generations']), reverse=True) |
|
349 | 349 | ) |
|
350 | 350 | limits.append(0) |
|
351 | 351 | |
|
352 | 352 | # Group the packs by generation (i.e. by size) |
|
353 | 353 | generations = [] |
|
354 | 354 | for i in pycompat.xrange(len(limits)): |
|
355 | 355 | generations.append([]) |
|
356 | 356 | |
|
357 | 357 | sizes = {} |
|
358 | 358 | for prefix, mode, stat in files: |
|
359 | 359 | size = stat.st_size |
|
360 | 360 | if size > opts[b'repackmaxpacksize']: |
|
361 | 361 | continue |
|
362 | 362 | |
|
363 | 363 | sizes[prefix] = size |
|
364 | 364 | for i, limit in enumerate(limits): |
|
365 | 365 | if size > limit: |
|
366 | 366 | generations[i].append(prefix) |
|
367 | 367 | break |
|
368 | 368 | |
|
369 | 369 | # Steps for picking what packs to repack: |
|
370 | 370 | # 1. Pick the largest generation with > gencountlimit pack files. |
|
371 | 371 | # 2. Take the smallest three packs. |
|
372 | 372 | # 3. While total-size-of-packs < repacksizelimit: add another pack |
|
373 | 373 | |
|
374 | 374 | # Find the largest generation with more than gencountlimit packs |
|
375 | 375 | genpacks = [] |
|
376 | 376 | for i, limit in enumerate(limits): |
|
377 | 377 | if len(generations[i]) > opts[b'gencountlimit']: |
|
378 | 378 | # Sort to be smallest last, for easy popping later |
|
379 | 379 | genpacks.extend( |
|
380 | 380 | sorted(generations[i], reverse=True, key=lambda x: sizes[x]) |
|
381 | 381 | ) |
|
382 | 382 | break |
|
383 | 383 | |
|
384 | 384 | # Take as many packs from the generation as we can |
|
385 | 385 | chosenpacks = genpacks[-3:] |
|
386 | 386 | genpacks = genpacks[:-3] |
|
387 | 387 | repacksize = sum(sizes[n] for n in chosenpacks) |
|
388 | 388 | while ( |
|
389 | 389 | repacksize < opts[b'repacksizelimit'] |
|
390 | 390 | and genpacks |
|
391 | 391 | and len(chosenpacks) < opts[b'maxrepackpacks'] |
|
392 | 392 | ): |
|
393 | 393 | chosenpacks.append(genpacks.pop()) |
|
394 | 394 | repacksize += sizes[chosenpacks[-1]] |
|
395 | 395 | |
|
396 | 396 | return chosenpacks |
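
A minimal, self-contained sketch of the selection policy above, with hypothetical pack names, sizes and thresholds (the real code additionally skips packs above ``repackmaxpacksize``)::

    def pick_packs(sizes, generations=(100 << 20, 1 << 20),
                   gencountlimit=2, repacksizelimit=100 << 20, maxrepackpacks=50):
        limits = sorted(generations, reverse=True) + [0]
        # bucket packs by generation (i.e. by size)
        buckets = [[] for _ in limits]
        for name, size in sizes.items():
            for i, limit in enumerate(limits):
                if size > limit:
                    buckets[i].append(name)
                    break
        # largest generation with more than gencountlimit packs, smallest last
        candidates = []
        for i in range(len(limits)):
            if len(buckets[i]) > gencountlimit:
                candidates = sorted(buckets[i], key=sizes.get, reverse=True)
                break
        chosen = candidates[-3:]
        candidates = candidates[:-3]
        total = sum(sizes[n] for n in chosen)
        while candidates and total < repacksizelimit and len(chosen) < maxrepackpacks:
            chosen.append(candidates.pop())
            total += sizes[chosen[-1]]
        return chosen

    # three small/medium packs get rolled up; the 500MB pack is alone in its
    # generation and is left untouched
    print(pick_packs({'a': 10 << 20, 'b': 12 << 20, 'c': 30 << 20, 'd': 500 << 20}))
    # -> ['c', 'b', 'a']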
|
397 | 397 | |
|
398 | 398 | |
|
399 | 399 | def _runrepack( |
|
400 | 400 | repo, data, history, packpath, category, fullhistory=None, options=None |
|
401 | 401 | ): |
|
402 | 402 | shallowutil.mkstickygroupdir(repo.ui, packpath) |
|
403 | 403 | |
|
404 | 404 | def isold(repo, filename, node): |
|
405 | 405 | """Check if the file node is older than a limit. |
|
406 | 406 | Unless a limit is specified in the config the default limit is taken. |
|
407 | 407 | """ |
|
408 | 408 | filectx = repo.filectx(filename, fileid=node) |
|
409 | 409 | filetime = repo[filectx.linkrev()].date() |
|
410 | 410 | |
|
411 | 411 | ttl = repo.ui.configint(b'remotefilelog', b'nodettl') |
|
412 | 412 | |
|
413 | 413 | limit = time.time() - ttl |
|
414 | 414 | return filetime[0] < limit |
|
415 | 415 | |
|
416 | 416 | garbagecollect = repo.ui.configbool(b'remotefilelog', b'gcrepack') |
|
417 | 417 | if not fullhistory: |
|
418 | 418 | fullhistory = history |
|
419 | 419 | packer = repacker( |
|
420 | 420 | repo, |
|
421 | 421 | data, |
|
422 | 422 | history, |
|
423 | 423 | fullhistory, |
|
424 | 424 | category, |
|
425 | 425 | gc=garbagecollect, |
|
426 | 426 | isold=isold, |
|
427 | 427 | options=options, |
|
428 | 428 | ) |
|
429 | 429 | |
|
430 | 430 | with datapack.mutabledatapack(repo.ui, packpath) as dpack: |
|
431 | 431 | with historypack.mutablehistorypack(repo.ui, packpath) as hpack: |
|
432 | 432 | try: |
|
433 | 433 | packer.run(dpack, hpack) |
|
434 | 434 | except error.LockHeld: |
|
435 | 435 | raise RepackAlreadyRunning( |
|
436 | 436 | _( |
|
437 | 437 | b"skipping repack - another repack " |
|
438 | 438 | b"is already running" |
|
439 | 439 | ) |
|
440 | 440 | ) |
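
``isold`` above only matters for the garbage-collecting variant of repack, which is gated on ``gcrepack``. A hypothetical configuration enabling it (``nodettl`` is compared against commit dates in seconds; the value here is illustrative)::

    [remotefilelog]
    gcrepack = True
    # drop unreferenced file nodes older than roughly 30 days during repack
    nodettl = 2592000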
|
441 | 441 | |
|
442 | 442 | |
|
443 | 443 | def keepset(repo, keyfn, lastkeepkeys=None): |
|
444 | 444 | """Computes a keepset which is not garbage collected. |
|
445 | 445 | 'keyfn' is a function that maps filename, node to a unique key. |
|
446 | 446 | 'lastkeepkeys' is an optional argument and if provided the keepset |
|
447 | 447 | function updates lastkeepkeys with more keys and returns the result. |
|
448 | 448 | """ |
|
449 | 449 | if not lastkeepkeys: |
|
450 | 450 | keepkeys = set() |
|
451 | 451 | else: |
|
452 | 452 | keepkeys = lastkeepkeys |
|
453 | 453 | |
|
454 | 454 | # We want to keep: |
|
455 | 455 | # 1. Working copy parent |
|
456 | 456 | # 2. Draft commits |
|
457 | 457 | # 3. Parents of draft commits |
|
458 | 458 | # 4. Pullprefetch and bgprefetchrevs revsets if specified |
|
459 | 459 | revs = [b'.', b'draft()', b'parents(draft())'] |
|
460 | 460 | prefetchrevs = repo.ui.config(b'remotefilelog', b'pullprefetch', None) |
|
461 | 461 | if prefetchrevs: |
|
462 | 462 | revs.append(b'(%s)' % prefetchrevs) |
|
463 | 463 | prefetchrevs = repo.ui.config(b'remotefilelog', b'bgprefetchrevs', None) |
|
464 | 464 | if prefetchrevs: |
|
465 | 465 | revs.append(b'(%s)' % prefetchrevs) |
|
466 | 466 | revs = b'+'.join(revs) |
|
467 | 467 | |
|
468 | 468 | revs = [b'sort((%s), "topo")' % revs] |
|
469 | 469 | keep = scmutil.revrange(repo, revs) |
|
470 | 470 | |
|
471 | 471 | processed = set() |
|
472 | 472 | lastmanifest = None |
|
473 | 473 | |
|
474 | 474 | # process the commits in toposorted order starting from the oldest |
|
475 | 475 | for r in reversed(keep._list): |
|
476 | 476 | if repo[r].p1().rev() in processed: |
|
477 | 477 | # if the direct parent has already been processed |
|
478 | 478 | # then we only need to process the delta |
|
479 | 479 | m = repo[r].manifestctx().readdelta() |
|
480 | 480 | else: |
|
481 | 481 | # otherwise take the manifest and diff it |
|
482 | 482 | # with the previous manifest if one exists |
|
483 | 483 | if lastmanifest: |
|
484 | 484 | m = repo[r].manifest().diff(lastmanifest) |
|
485 | 485 | else: |
|
486 | 486 | m = repo[r].manifest() |
|
487 | 487 | lastmanifest = repo[r].manifest() |
|
488 | 488 | processed.add(r) |
|
489 | 489 | |
|
490 | 490 | # populate keepkeys with keys from the current manifest |
|
491 | 491 | if type(m) is dict: |
|
492 | 492 | # m is a result of diff of two manifests and is a dictionary that |
|
493 | 493 | # maps filename to ((newnode, newflag), (oldnode, oldflag)) tuple |
|
494 | 494 | for filename, diff in pycompat.iteritems(m): |
|
495 | 495 | if diff[0][0] is not None: |
|
496 | 496 | keepkeys.add(keyfn(filename, diff[0][0])) |
|
497 | 497 | else: |
|
498 | 498 | # m is a manifest object |
|
499 | 499 | for filename, filenode in pycompat.iteritems(m): |
|
500 | 500 | keepkeys.add(keyfn(filename, filenode)) |
|
501 | 501 | |
|
502 | 502 | return keepkeys |
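
To make the revset construction above concrete, this is what ``revs`` ends up as when both prefetch options are set (the config values here are made up)::

    pullprefetch = b'master'                 # hypothetical remotefilelog.pullprefetch
    bgprefetchrevs = b'draft() & date(-7)'   # hypothetical remotefilelog.bgprefetchrevs
    revs = [b'.', b'draft()', b'parents(draft())',
            b'(%s)' % pullprefetch, b'(%s)' % bgprefetchrevs]
    revs = [b'sort((%s), "topo")' % b'+'.join(revs)]
    # -> [b'sort((.+draft()+parents(draft())+(master)+(draft() & date(-7))), "topo")']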
|
503 | 503 | |
|
504 | 504 | |
|
505 | 505 | class repacker(object): |
|
506 | 506 | """Class for orchestrating the repack of data and history information into a |
|
507 | 507 | new format. |
|
508 | 508 | """ |
|
509 | 509 | |
|
510 | 510 | def __init__( |
|
511 | 511 | self, |
|
512 | 512 | repo, |
|
513 | 513 | data, |
|
514 | 514 | history, |
|
515 | 515 | fullhistory, |
|
516 | 516 | category, |
|
517 | 517 | gc=False, |
|
518 | 518 | isold=None, |
|
519 | 519 | options=None, |
|
520 | 520 | ): |
|
521 | 521 | self.repo = repo |
|
522 | 522 | self.data = data |
|
523 | 523 | self.history = history |
|
524 | 524 | self.fullhistory = fullhistory |
|
525 | 525 | self.unit = constants.getunits(category) |
|
526 | 526 | self.garbagecollect = gc |
|
527 | 527 | self.options = options |
|
528 | 528 | if self.garbagecollect: |
|
529 | 529 | if not isold: |
|
530 | 530 | raise ValueError(b"Function 'isold' is not properly specified") |
|
531 | 531 | # use (filename, node) tuple as a keepset key |
|
532 | 532 | self.keepkeys = keepset(repo, lambda f, n: (f, n)) |
|
533 | 533 | self.isold = isold |
|
534 | 534 | |
|
535 | 535 | def run(self, targetdata, targethistory): |
|
536 | 536 | ledger = repackledger() |
|
537 | 537 | |
|
538 | 538 | with lockmod.lock( |
|
539 | 539 | repacklockvfs(self.repo), b"repacklock", desc=None, timeout=0 |
|
540 | 540 | ): |
|
541 | 541 | self.repo.hook(b'prerepack') |
|
542 | 542 | |
|
543 | 543 | # Populate ledger from source |
|
544 | 544 | self.data.markledger(ledger, options=self.options) |
|
545 | 545 | self.history.markledger(ledger, options=self.options) |
|
546 | 546 | |
|
547 | 547 | # Run repack |
|
548 | 548 | self.repackdata(ledger, targetdata) |
|
549 | 549 | self.repackhistory(ledger, targethistory) |
|
550 | 550 | |
|
551 | 551 | # Call cleanup on each source |
|
552 | 552 | for source in ledger.sources: |
|
553 | 553 | source.cleanup(ledger) |
|
554 | 554 | |
|
555 | 555 | def _chainorphans(self, ui, filename, nodes, orphans, deltabases): |
|
556 | 556 | """Reorders ``orphans`` into a single chain inside ``nodes`` and
|
557 | 557 | ``deltabases``. |
|
558 | 558 | |
|
559 | 559 | We often have orphan entries (nodes without a base that aren't |
|
560 | 560 | referenced by other nodes -- i.e., part of a chain) due to gaps in |
|
561 | 561 | history. Rather than store them as individual fulltexts, we prefer to |
|
562 | 562 | insert them as one chain sorted by size. |
|
563 | 563 | """ |
|
564 | 564 | if not orphans: |
|
565 | 565 | return nodes |
|
566 | 566 | |
|
567 | 567 | def getsize(node, default=0): |
|
568 | 568 | meta = self.data.getmeta(filename, node) |
|
569 | 569 | if constants.METAKEYSIZE in meta: |
|
570 | 570 | return meta[constants.METAKEYSIZE] |
|
571 | 571 | else: |
|
572 | 572 | return default |
|
573 | 573 | |
|
574 | 574 | # Sort orphans by size; biggest first is preferred, since it's more |
|
575 | 575 | # likely to be the newest version assuming files grow over time. |
|
576 | 576 | # (Sort by node first to ensure the sort is stable.) |
|
577 | 577 | orphans = sorted(orphans) |
|
578 | 578 | orphans = list(sorted(orphans, key=getsize, reverse=True)) |
|
579 | 579 | if ui.debugflag: |
|
580 | 580 | ui.debug( |
|
581 | 581 | b"%s: orphan chain: %s\n" |
|
582 | 582 | % (filename, b", ".join([short(s) for s in orphans])) |
|
583 | 583 | ) |
|
584 | 584 | |
|
585 | 585 | # Create one contiguous chain and reassign deltabases. |
|
586 | 586 | for i, node in enumerate(orphans): |
|
587 | 587 | if i == 0: |
|
588 | 588 | deltabases[node] = (nullid, 0) |
|
589 | 589 | else: |
|
590 | 590 | parent = orphans[i - 1] |
|
591 | 591 | deltabases[node] = (parent, deltabases[parent][1] + 1) |
|
592 | 592 | nodes = [n for n in nodes if n not in orphans] |
|
593 | 593 | nodes += orphans |
|
594 | 594 | return nodes |
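
For illustration, running the reassignment loop above over three made-up orphan nodes (already sorted biggest first) produces one chain hanging off the null node::

    nullid = b'\0' * 20
    orphans = [b'n-big', b'n-mid', b'n-small']   # fake node ids, size-sorted
    deltabases = {}
    for i, node in enumerate(orphans):
        if i == 0:
            deltabases[node] = (nullid, 0)
        else:
            parent = orphans[i - 1]
            deltabases[node] = (parent, deltabases[parent][1] + 1)
    # deltabases: n-big -> (nullid, 0), n-mid -> (n-big, 1), n-small -> (n-mid, 2)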
|
595 | 595 | |
|
596 | 596 | def repackdata(self, ledger, target): |
|
597 | 597 | ui = self.repo.ui |
|
598 | 598 | maxchainlen = ui.configint(b'packs', b'maxchainlen', 1000) |
|
599 | 599 | |
|
600 | 600 | byfile = {} |
|
601 | 601 | for entry in pycompat.itervalues(ledger.entries): |
|
602 | 602 | if entry.datasource: |
|
603 | 603 | byfile.setdefault(entry.filename, {})[entry.node] = entry |
|
604 | 604 | |
|
605 | 605 | count = 0 |
|
606 | 606 | repackprogress = ui.makeprogress( |
|
607 | 607 | _(b"repacking data"), unit=self.unit, total=len(byfile) |
|
608 | 608 | ) |
|
609 | 609 | for filename, entries in sorted(pycompat.iteritems(byfile)): |
|
610 | 610 | repackprogress.update(count) |
|
611 | 611 | |
|
612 | 612 | ancestors = {} |
|
613 | 613 | nodes = list(node for node in entries) |
|
614 | 614 | nohistory = [] |
|
615 | 615 | buildprogress = ui.makeprogress( |
|
616 | 616 | _(b"building history"), unit=b'nodes', total=len(nodes) |
|
617 | 617 | ) |
|
618 | 618 | for i, node in enumerate(nodes): |
|
619 | 619 | if node in ancestors: |
|
620 | 620 | continue |
|
621 | 621 | buildprogress.update(i) |
|
622 | 622 | try: |
|
623 | 623 | ancestors.update( |
|
624 | 624 | self.fullhistory.getancestors( |
|
625 | 625 | filename, node, known=ancestors |
|
626 | 626 | ) |
|
627 | 627 | ) |
|
628 | 628 | except KeyError: |
|
629 | 629 | # Since we're packing data entries, we may not have the |
|
630 | 630 | # corresponding history entries for them. It's not a big |
|
631 | 631 | # deal, but the entries won't be delta'd perfectly. |
|
632 | 632 | nohistory.append(node) |
|
633 | 633 | buildprogress.complete() |
|
634 | 634 | |
|
635 | 635 | # Order the nodes children first, so we can produce reverse deltas |
|
636 | 636 | orderednodes = list(reversed(self._toposort(ancestors))) |
|
637 | 637 | if len(nohistory) > 0: |
|
638 | 638 | ui.debug( |
|
639 | 639 | b'repackdata: %d nodes without history\n' % len(nohistory) |
|
640 | 640 | ) |
|
641 | 641 | orderednodes.extend(sorted(nohistory)) |
|
642 | 642 | |
|
643 | 643 | # Filter orderednodes to just the nodes we want to serialize (it |
|
644 | 644 | # currently also has the edge nodes' ancestors). |
|
645 | 645 | orderednodes = list( |
|
646 | 646 | filter(lambda node: node in nodes, orderednodes) |
|
647 | 647 | ) |
|
648 | 648 | |
|
649 | 649 | # Garbage collect old nodes: |
|
650 | 650 | if self.garbagecollect: |
|
651 | 651 | neworderednodes = [] |
|
652 | 652 | for node in orderednodes: |
|
653 | 653 | # If the node is old and is not in the keepset, we skip it, |
|
654 | 654 | # and mark as garbage collected |
|
655 | 655 | if (filename, node) not in self.keepkeys and self.isold( |
|
656 | 656 | self.repo, filename, node |
|
657 | 657 | ): |
|
658 | 658 | entries[node].gced = True |
|
659 | 659 | continue |
|
660 | 660 | neworderednodes.append(node) |
|
661 | 661 | orderednodes = neworderednodes |
|
662 | 662 | |
|
663 | 663 | # Compute delta bases for nodes: |
|
664 | 664 | deltabases = {} |
|
665 | 665 | nobase = set() |
|
666 | 666 | referenced = set() |
|
667 | 667 | nodes = set(nodes) |
|
668 | 668 | processprogress = ui.makeprogress( |
|
669 | 669 | _(b"processing nodes"), unit=b'nodes', total=len(orderednodes) |
|
670 | 670 | ) |
|
671 | 671 | for i, node in enumerate(orderednodes): |
|
672 | 672 | processprogress.update(i) |
|
673 | 673 | # Find delta base |
|
674 | 674 | # TODO: allow delta'ing against most recent descendant instead |
|
675 | 675 | # of immediate child |
|
676 | 676 | deltatuple = deltabases.get(node, None) |
|
677 | 677 | if deltatuple is None: |
|
678 | 678 | deltabase, chainlen = nullid, 0 |
|
679 | 679 | deltabases[node] = (nullid, 0) |
|
680 | 680 | nobase.add(node) |
|
681 | 681 | else: |
|
682 | 682 | deltabase, chainlen = deltatuple |
|
683 | 683 | referenced.add(deltabase) |
|
684 | 684 | |
|
685 | 685 | # Use available ancestor information to inform our delta choices |
|
686 | 686 | ancestorinfo = ancestors.get(node) |
|
687 | 687 | if ancestorinfo: |
|
688 | 688 | p1, p2, linknode, copyfrom = ancestorinfo |
|
689 | 689 | |
|
690 | 690 | # The presence of copyfrom means we're at a point where the |
|
691 | 691 | # file was copied from elsewhere. So don't attempt to do any |
|
692 | 692 | # deltas with the other file. |
|
693 | 693 | if copyfrom: |
|
694 | 694 | p1 = nullid |
|
695 | 695 | |
|
696 | 696 | if chainlen < maxchainlen: |
|
697 | 697 | # Record this child as the delta base for its parents. |
|
698 | 698 | # This may be non optimal, since the parents may have |
|
699 | 699 | # many children, and this will only choose the last one. |
|
700 | 700 | # TODO: record all children and try all deltas to find |
|
701 | 701 | # best |
|
702 | 702 | if p1 != nullid: |
|
703 | 703 | deltabases[p1] = (node, chainlen + 1) |
|
704 | 704 | if p2 != nullid: |
|
705 | 705 | deltabases[p2] = (node, chainlen + 1) |
|
706 | 706 | |
|
707 | 707 | # experimental config: repack.chainorphansbysize |
|
708 | 708 | if ui.configbool(b'repack', b'chainorphansbysize'): |
|
709 | 709 | orphans = nobase - referenced |
|
710 | 710 | orderednodes = self._chainorphans( |
|
711 | 711 | ui, filename, orderednodes, orphans, deltabases |
|
712 | 712 | ) |
|
713 | 713 | |
|
714 | 714 | # Compute deltas and write to the pack |
|
715 | 715 | for i, node in enumerate(orderednodes): |
|
716 | 716 | deltabase, chainlen = deltabases[node] |
|
717 | 717 | # Compute delta |
|
718 | 718 | # TODO: Optimize the deltachain fetching. Since we're |
|
719 | 719 | # iterating over the different versions of the file, we may
|
720 | 720 | # be fetching the same deltachain over and over again. |
|
721 | 721 | if deltabase != nullid: |
|
722 | 722 | deltaentry = self.data.getdelta(filename, node) |
|
723 | 723 | delta, deltabasename, origdeltabase, meta = deltaentry |
|
724 | 724 | size = meta.get(constants.METAKEYSIZE) |
|
725 | 725 | if ( |
|
726 | 726 | deltabasename != filename |
|
727 | 727 | or origdeltabase != deltabase |
|
728 | 728 | or size is None |
|
729 | 729 | ): |
|
730 | 730 | deltabasetext = self.data.get(filename, deltabase) |
|
731 | 731 | original = self.data.get(filename, node) |
|
732 | 732 | size = len(original) |
|
733 | 733 | delta = mdiff.textdiff(deltabasetext, original) |
|
734 | 734 | else: |
|
735 | 735 | delta = self.data.get(filename, node) |
|
736 | 736 | size = len(delta) |
|
737 | 737 | meta = self.data.getmeta(filename, node) |
|
738 | 738 | |
|
739 | 739 | # TODO: don't use the delta if it's larger than the fulltext |
|
740 | 740 | if constants.METAKEYSIZE not in meta: |
|
741 | 741 | meta[constants.METAKEYSIZE] = size |
|
742 | 742 | target.add(filename, node, deltabase, delta, meta) |
|
743 | 743 | |
|
744 | 744 | entries[node].datarepacked = True |
|
745 | 745 | |
|
746 | 746 | processprogress.complete() |
|
747 | 747 | count += 1 |
|
748 | 748 | |
|
749 | 749 | repackprogress.complete() |
|
750 | 750 | target.close(ledger=ledger) |
|
751 | 751 | |
|
752 | 752 | def repackhistory(self, ledger, target): |
|
753 | 753 | ui = self.repo.ui |
|
754 | 754 | |
|
755 | 755 | byfile = {} |
|
756 | 756 | for entry in pycompat.itervalues(ledger.entries): |
|
757 | 757 | if entry.historysource: |
|
758 | 758 | byfile.setdefault(entry.filename, {})[entry.node] = entry |
|
759 | 759 | |
|
760 | 760 | progress = ui.makeprogress( |
|
761 | 761 | _(b"repacking history"), unit=self.unit, total=len(byfile) |
|
762 | 762 | ) |
|
763 | 763 | for filename, entries in sorted(pycompat.iteritems(byfile)): |
|
764 | 764 | ancestors = {} |
|
765 | 765 | nodes = list(node for node in entries) |
|
766 | 766 | |
|
767 | 767 | for node in nodes: |
|
768 | 768 | if node in ancestors: |
|
769 | 769 | continue |
|
770 | 770 | ancestors.update( |
|
771 | 771 | self.history.getancestors(filename, node, known=ancestors) |
|
772 | 772 | ) |
|
773 | 773 | |
|
774 | 774 | # Order the nodes children first |
|
775 | 775 | orderednodes = reversed(self._toposort(ancestors)) |
|
776 | 776 | |
|
777 | 777 | # Write to the pack |
|
778 | 778 | dontprocess = set() |
|
779 | 779 | for node in orderednodes: |
|
780 | 780 | p1, p2, linknode, copyfrom = ancestors[node] |
|
781 | 781 | |
|
782 | 782 | # If the node is marked dontprocess, but it's also in the |
|
783 | 783 | # explicit entries set, that means the node exists both in this |
|
784 | 784 | # file and in another file that was copied to this file. |
|
785 | 785 | # Usually this happens if the file was copied to another file, |
|
786 | 786 | # then the copy was deleted, then reintroduced without copy |
|
787 | 787 | # metadata. The original add and the new add have the same hash |
|
788 | 788 | # since the content is identical and the parents are null. |
|
789 | 789 | if node in dontprocess and node not in entries: |
|
790 | 790 | # If copyfrom == filename, it means the copy history |
|
791 | 791 | # went to some other file, then came back to this one, so we
|
792 | 792 | # should continue processing it. |
|
793 | 793 | if p1 != nullid and copyfrom != filename: |
|
794 | 794 | dontprocess.add(p1) |
|
795 | 795 | if p2 != nullid: |
|
796 | 796 | dontprocess.add(p2) |
|
797 | 797 | continue |
|
798 | 798 | |
|
799 | 799 | if copyfrom: |
|
800 | 800 | dontprocess.add(p1) |
|
801 | 801 | |
|
802 | 802 | target.add(filename, node, p1, p2, linknode, copyfrom) |
|
803 | 803 | |
|
804 | 804 | if node in entries: |
|
805 | 805 | entries[node].historyrepacked = True |
|
806 | 806 | |
|
807 | 807 | progress.increment() |
|
808 | 808 | |
|
809 | 809 | progress.complete() |
|
810 | 810 | target.close(ledger=ledger) |
|
811 | 811 | |
|
812 | 812 | def _toposort(self, ancestors): |
|
813 | 813 | def parentfunc(node): |
|
814 | 814 | p1, p2, linknode, copyfrom = ancestors[node] |
|
815 | 815 | parents = [] |
|
816 | 816 | if p1 != nullid: |
|
817 | 817 | parents.append(p1) |
|
818 | 818 | if p2 != nullid: |
|
819 | 819 | parents.append(p2) |
|
820 | 820 | return parents |
|
821 | 821 | |
|
822 | 822 | sortednodes = shallowutil.sortnodes(ancestors.keys(), parentfunc) |
|
823 | 823 | return sortednodes |
|
824 | 824 | |
|
825 | 825 | |
|
826 | 826 | class repackledger(object): |
|
827 | 827 | """Storage for all the bookkeeping that happens during a repack. It contains |
|
828 | 828 | the list of revisions being repacked, what happened to each revision, and |
|
829 | 829 | which source store contained which revision originally (for later cleanup). |
|
830 | 830 | """ |
|
831 | 831 | |
|
832 | 832 | def __init__(self): |
|
833 | 833 | self.entries = {} |
|
834 | 834 | self.sources = {} |
|
835 | 835 | self.created = set() |
|
836 | 836 | |
|
837 | 837 | def markdataentry(self, source, filename, node): |
|
838 | 838 | """Mark the given filename+node revision as having a data rev in the |
|
839 | 839 | given source. |
|
840 | 840 | """ |
|
841 | 841 | entry = self._getorcreateentry(filename, node) |
|
842 | 842 | entry.datasource = True |
|
843 | 843 | entries = self.sources.get(source) |
|
844 | 844 | if not entries: |
|
845 | 845 | entries = set() |
|
846 | 846 | self.sources[source] = entries |
|
847 | 847 | entries.add(entry) |
|
848 | 848 | |
|
849 | 849 | def markhistoryentry(self, source, filename, node): |
|
850 | 850 | """Mark the given filename+node revision as having a history rev in the |
|
851 | 851 | given source. |
|
852 | 852 | """ |
|
853 | 853 | entry = self._getorcreateentry(filename, node) |
|
854 | 854 | entry.historysource = True |
|
855 | 855 | entries = self.sources.get(source) |
|
856 | 856 | if not entries: |
|
857 | 857 | entries = set() |
|
858 | 858 | self.sources[source] = entries |
|
859 | 859 | entries.add(entry) |
|
860 | 860 | |
|
861 | 861 | def _getorcreateentry(self, filename, node): |
|
862 | 862 | key = (filename, node) |
|
863 | 863 | value = self.entries.get(key) |
|
864 | 864 | if not value: |
|
865 | 865 | value = repackentry(filename, node) |
|
866 | 866 | self.entries[key] = value |
|
867 | 867 | |
|
868 | 868 | return value |
|
869 | 869 | |
|
870 | 870 | def addcreated(self, value): |
|
871 | 871 | self.created.add(value) |
|
872 | 872 | |
|
873 | 873 | |
|
874 | 874 | class repackentry(object): |
|
875 | 875 | """Simple class representing a single revision entry in the repackledger. |
|
876 | 876 | """ |
|
877 | 877 | |
|
878 | 878 | __slots__ = ( |
|
879 | 879 | r'filename', |
|
880 | 880 | r'node', |
|
881 | 881 | r'datasource', |
|
882 | 882 | r'historysource', |
|
883 | 883 | r'datarepacked', |
|
884 | 884 | r'historyrepacked', |
|
885 | 885 | r'gced', |
|
886 | 886 | ) |
|
887 | 887 | |
|
888 | 888 | def __init__(self, filename, node): |
|
889 | 889 | self.filename = filename |
|
890 | 890 | self.node = node |
|
891 | 891 | # If the revision has a data entry in the source |
|
892 | 892 | self.datasource = False |
|
893 | 893 | # If the revision has a history entry in the source |
|
894 | 894 | self.historysource = False |
|
895 | 895 | # If the revision's data entry was repacked into the repack target |
|
896 | 896 | self.datarepacked = False |
|
897 | 897 | # If the revision's history entry was repacked into the repack target |
|
898 | 898 | self.historyrepacked = False |
|
899 | 899 | # If garbage collected |
|
900 | 900 | self.gced = False |
|
901 | 901 | |
|
902 | 902 | |
|
903 | 903 | def repacklockvfs(repo): |
|
904 | 904 | if util.safehasattr(repo, 'name'):
|
905 | 905 | # Lock in the shared cache so repacks across multiple copies of the same |
|
906 | 906 | # repo are coordinated. |
|
907 | 907 | sharedcachepath = shallowutil.getcachepackpath( |
|
908 | 908 | repo, constants.FILEPACK_CATEGORY |
|
909 | 909 | ) |
|
910 | 910 | return vfs.vfs(sharedcachepath) |
|
911 | 911 | else: |
|
912 | 912 | return repo.svfs |
@@ -1,354 +1,354 b'' | |||
|
1 | 1 | # shallowrepo.py - shallow repository that uses remote filelogs |
|
2 | 2 | # |
|
3 | 3 | # Copyright 2013 Facebook, Inc. |
|
4 | 4 | # |
|
5 | 5 | # This software may be used and distributed according to the terms of the |
|
6 | 6 | # GNU General Public License version 2 or any later version. |
|
7 | 7 | from __future__ import absolute_import |
|
8 | 8 | |
|
9 | 9 | import os |
|
10 | 10 | |
|
11 | 11 | from mercurial.i18n import _ |
|
12 | 12 | from mercurial.node import hex, nullid, nullrev |
|
13 | 13 | from mercurial import ( |
|
14 | 14 | encoding, |
|
15 | 15 | error, |
|
16 | 16 | localrepo, |
|
17 | 17 | match, |
|
18 | 18 | pycompat, |
|
19 | 19 | scmutil, |
|
20 | 20 | sparse, |
|
21 | 21 | util, |
|
22 | 22 | ) |
|
23 | 23 | from mercurial.utils import procutil |
|
24 | 24 | from . import ( |
|
25 | 25 | connectionpool, |
|
26 | 26 | constants, |
|
27 | 27 | contentstore, |
|
28 | 28 | datapack, |
|
29 | 29 | fileserverclient, |
|
30 | 30 | historypack, |
|
31 | 31 | metadatastore, |
|
32 | 32 | remotefilectx, |
|
33 | 33 | remotefilelog, |
|
34 | 34 | shallowutil, |
|
35 | 35 | ) |
|
36 | 36 | |
|
37 | 37 | # These make*stores functions are global so that other extensions can replace |
|
38 | 38 | # them. |
|
39 | 39 | def makelocalstores(repo): |
|
40 | 40 | """In-repo stores, like .hg/store/data; cannot be discarded."""
|
41 | 41 | localpath = os.path.join(repo.svfs.vfs.base, b'data') |
|
42 | 42 | if not os.path.exists(localpath): |
|
43 | 43 | os.makedirs(localpath) |
|
44 | 44 | |
|
45 | 45 | # Instantiate local data stores |
|
46 | 46 | localcontent = contentstore.remotefilelogcontentstore( |
|
47 | 47 | repo, localpath, repo.name, shared=False |
|
48 | 48 | ) |
|
49 | 49 | localmetadata = metadatastore.remotefilelogmetadatastore( |
|
50 | 50 | repo, localpath, repo.name, shared=False |
|
51 | 51 | ) |
|
52 | 52 | return localcontent, localmetadata |
|
53 | 53 | |
|
54 | 54 | |
|
55 | 55 | def makecachestores(repo): |
|
56 | 56 | """Typically machine-wide, cache of remote data; can be discarded.""" |
|
57 | 57 | # Instantiate shared cache stores |
|
58 | 58 | cachepath = shallowutil.getcachepath(repo.ui) |
|
59 | 59 | cachecontent = contentstore.remotefilelogcontentstore( |
|
60 | 60 | repo, cachepath, repo.name, shared=True |
|
61 | 61 | ) |
|
62 | 62 | cachemetadata = metadatastore.remotefilelogmetadatastore( |
|
63 | 63 | repo, cachepath, repo.name, shared=True |
|
64 | 64 | ) |
|
65 | 65 | |
|
66 | 66 | repo.sharedstore = cachecontent |
|
67 | 67 | repo.shareddatastores.append(cachecontent) |
|
68 | 68 | repo.sharedhistorystores.append(cachemetadata) |
|
69 | 69 | |
|
70 | 70 | return cachecontent, cachemetadata |
|
71 | 71 | |
|
72 | 72 | |
|
73 | 73 | def makeremotestores(repo, cachecontent, cachemetadata): |
|
74 | 74 | """These stores fetch data from a remote server.""" |
|
75 | 75 | # Instantiate remote stores |
|
76 | 76 | repo.fileservice = fileserverclient.fileserverclient(repo) |
|
77 | 77 | remotecontent = contentstore.remotecontentstore( |
|
78 | 78 | repo.ui, repo.fileservice, cachecontent |
|
79 | 79 | ) |
|
80 | 80 | remotemetadata = metadatastore.remotemetadatastore( |
|
81 | 81 | repo.ui, repo.fileservice, cachemetadata |
|
82 | 82 | ) |
|
83 | 83 | return remotecontent, remotemetadata |
|
84 | 84 | |
|
85 | 85 | |
|
86 | 86 | def makepackstores(repo): |
|
87 | 87 | """Packs are more efficient (to read from) cache stores.""" |
|
88 | 88 | # Instantiate pack stores |
|
89 | 89 | packpath = shallowutil.getcachepackpath(repo, constants.FILEPACK_CATEGORY) |
|
90 | 90 | packcontentstore = datapack.datapackstore(repo.ui, packpath) |
|
91 | 91 | packmetadatastore = historypack.historypackstore(repo.ui, packpath) |
|
92 | 92 | |
|
93 | 93 | repo.shareddatastores.append(packcontentstore) |
|
94 | 94 | repo.sharedhistorystores.append(packmetadatastore) |
|
95 | 95 | shallowutil.reportpackmetrics( |
|
96 | 96 | repo.ui, b'filestore', packcontentstore, packmetadatastore |
|
97 | 97 | ) |
|
98 | 98 | return packcontentstore, packmetadatastore |
|
99 | 99 | |
|
100 | 100 | |
|
101 | 101 | def makeunionstores(repo): |
|
102 | 102 | """Union stores iterate the other stores and return the first result.""" |
|
103 | 103 | repo.shareddatastores = [] |
|
104 | 104 | repo.sharedhistorystores = [] |
|
105 | 105 | |
|
106 | 106 | packcontentstore, packmetadatastore = makepackstores(repo) |
|
107 | 107 | cachecontent, cachemetadata = makecachestores(repo) |
|
108 | 108 | localcontent, localmetadata = makelocalstores(repo) |
|
109 | 109 | remotecontent, remotemetadata = makeremotestores( |
|
110 | 110 | repo, cachecontent, cachemetadata |
|
111 | 111 | ) |
|
112 | 112 | |
|
113 | 113 | # Instantiate union stores |
|
114 | 114 | repo.contentstore = contentstore.unioncontentstore( |
|
115 | 115 | packcontentstore, |
|
116 | 116 | cachecontent, |
|
117 | 117 | localcontent, |
|
118 | 118 | remotecontent, |
|
119 | 119 | writestore=localcontent, |
|
120 | 120 | ) |
|
121 | 121 | repo.metadatastore = metadatastore.unionmetadatastore( |
|
122 | 122 | packmetadatastore, |
|
123 | 123 | cachemetadata, |
|
124 | 124 | localmetadata, |
|
125 | 125 | remotemetadata, |
|
126 | 126 | writestore=localmetadata, |
|
127 | 127 | ) |
|
128 | 128 | |
|
129 | 129 | fileservicedatawrite = cachecontent |
|
130 | 130 | fileservicehistorywrite = cachemetadata |
|
131 | 131 | repo.fileservice.setstore( |
|
132 | 132 | repo.contentstore, |
|
133 | 133 | repo.metadatastore, |
|
134 | 134 | fileservicedatawrite, |
|
135 | 135 | fileservicehistorywrite, |
|
136 | 136 | ) |
|
137 | 137 | shallowutil.reportpackmetrics( |
|
138 | 138 | repo.ui, b'filestore', packcontentstore, packmetadatastore |
|
139 | 139 | ) |
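
Conceptually, the union stores built above try each backing store in the order given (pack cache, loose cache, local, then remote) and return the first hit. A rough sketch of that lookup order, not the actual ``unioncontentstore`` implementation::

    def union_get(stores, name, node):
        # stores are consulted in priority order; a miss raises KeyError
        for store in stores:
            try:
                return store.get(name, node)
            except KeyError:
                continue
        raise KeyError((name, node))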
|
140 | 140 | |
|
141 | 141 | |
|
142 | 142 | def wraprepo(repo): |
|
143 | 143 | class shallowrepository(repo.__class__): |
|
144 | 144 | @util.propertycache |
|
145 | 145 | def name(self): |
|
146 | 146 | return self.ui.config(b'remotefilelog', b'reponame') |
|
147 | 147 | |
|
148 | 148 | @util.propertycache |
|
149 | 149 | def fallbackpath(self): |
|
150 | 150 | path = repo.ui.config( |
|
151 | 151 | b"remotefilelog", |
|
152 | 152 | b"fallbackpath", |
|
153 | 153 | repo.ui.config(b'paths', b'default'), |
|
154 | 154 | ) |
|
155 | 155 | if not path: |
|
156 | 156 | raise error.Abort( |
|
157 | 157 | b"no remotefilelog server " |
|
158 | 158 | b"configured - is your .hg/hgrc trusted?" |
|
159 | 159 | ) |
|
160 | 160 | |
|
161 | 161 | return path |
|
162 | 162 | |
|
163 | 163 | def maybesparsematch(self, *revs, **kwargs): |
|
164 | 164 | ''' |
|
165 | 165 | A wrapper that allows the remotefilelog to invoke sparsematch() if |
|
166 | 166 | this is a sparse repository, or returns None if this is not a |
|
167 | 167 | sparse repository. |
|
168 | 168 | ''' |
|
169 | 169 | if revs: |
|
170 | 170 | ret = sparse.matcher(repo, revs=revs) |
|
171 | 171 | else: |
|
172 | 172 | ret = sparse.matcher(repo) |
|
173 | 173 | |
|
174 | 174 | if ret.always(): |
|
175 | 175 | return None |
|
176 | 176 | return ret |
|
177 | 177 | |
|
178 | 178 | def file(self, f): |
|
179 | 179 | if f[0] == b'/': |
|
180 | 180 | f = f[1:] |
|
181 | 181 | |
|
182 | 182 | if self.shallowmatch(f): |
|
183 | 183 | return remotefilelog.remotefilelog(self.svfs, f, self) |
|
184 | 184 | else: |
|
185 | 185 | return super(shallowrepository, self).file(f) |
|
186 | 186 | |
|
187 | 187 | def filectx(self, path, *args, **kwargs): |
|
188 | 188 | if self.shallowmatch(path): |
|
189 | 189 | return remotefilectx.remotefilectx(self, path, *args, **kwargs) |
|
190 | 190 | else: |
|
191 | 191 | return super(shallowrepository, self).filectx( |
|
192 | 192 | path, *args, **kwargs |
|
193 | 193 | ) |
|
194 | 194 | |
|
195 | 195 | @localrepo.unfilteredmethod |
|
196 | 196 | def commitctx(self, ctx, error=False, origctx=None): |
|
197 | 197 | """Add a new revision to current repository. |
|
198 | 198 | Revision information is passed via the context argument. |
|
199 | 199 | """ |
|
200 | 200 | |
|
201 | 201 | # some contexts already have manifest nodes, they don't need any |
|
202 | 202 | # prefetching (for example if we're just editing a commit message |
|
203 | 203 | # we can reuse the manifest)
|
204 | 204 | if not ctx.manifestnode(): |
|
205 | 205 | # prefetch files that will likely be compared |
|
206 | 206 | m1 = ctx.p1().manifest() |
|
207 | 207 | files = [] |
|
208 | 208 | for f in ctx.modified() + ctx.added(): |
|
209 | 209 | fparent1 = m1.get(f, nullid) |
|
210 | 210 | if fparent1 != nullid: |
|
211 | 211 | files.append((f, hex(fparent1))) |
|
212 | 212 | self.fileservice.prefetch(files) |
|
213 | 213 | return super(shallowrepository, self).commitctx( |
|
214 | 214 | ctx, error=error, origctx=origctx |
|
215 | 215 | ) |
|
216 | 216 | |
|
217 | 217 | def backgroundprefetch( |
|
218 | 218 | self, |
|
219 | 219 | revs, |
|
220 | 220 | base=None, |
|
221 | 221 | repack=False, |
|
222 | 222 | pats=None, |
|
223 | 223 | opts=None, |
|
224 | 224 | ensurestart=False, |
|
225 | 225 | ): |
|
226 | 226 | """Runs prefetch in background with optional repack |
|
227 | 227 | """ |
|
228 | 228 | cmd = [procutil.hgexecutable(), b'-R', repo.origroot, b'prefetch'] |
|
229 | 229 | if repack: |
|
230 | 230 | cmd.append(b'--repack') |
|
231 | 231 | if revs: |
|
232 | 232 | cmd += [b'-r', revs] |
|
233 | 233 | # We know this command will find a binary, so don't block |
|
234 | 234 | # on it starting. |
|
235 | 235 | procutil.runbgcommand( |
|
236 | 236 | cmd, encoding.environ, ensurestart=ensurestart |
|
237 | 237 | ) |
|
238 | 238 | |
|
239 | 239 | def prefetch(self, revs, base=None, pats=None, opts=None): |
|
240 | 240 | """Prefetches all the necessary file revisions for the given revs |
|
241 | 241 | Optionally runs repack in background |
|
242 | 242 | """ |
|
243 | 243 | with repo._lock( |
|
244 | 244 | repo.svfs, |
|
245 | 245 | b'prefetchlock', |
|
246 | 246 | True, |
|
247 | 247 | None, |
|
248 | 248 | None, |
|
249 | 249 | _(b'prefetching in %s') % repo.origroot, |
|
250 | 250 | ): |
|
251 | 251 | self._prefetch(revs, base, pats, opts) |
|
252 | 252 | |
|
253 | 253 | def _prefetch(self, revs, base=None, pats=None, opts=None): |
|
254 | 254 | fallbackpath = self.fallbackpath |
|
255 | 255 | if fallbackpath: |
|
256 | 256 | # If we know a rev is on the server, we should fetch the server |
|
257 | 257 | # version of those files, since our local file versions might |
|
258 | 258 | # become obsolete if the local commits are stripped. |
|
259 | 259 | localrevs = repo.revs(b'outgoing(%s)', fallbackpath) |
|
260 | 260 | if base is not None and base != nullrev: |
|
261 | 261 | serverbase = list( |
|
262 | 262 | repo.revs( |
|
263 | 263 | b'first(reverse(::%s) - %ld)', base, localrevs |
|
264 | 264 | ) |
|
265 | 265 | ) |
|
266 | 266 | if serverbase: |
|
267 | 267 | base = serverbase[0] |
|
268 | 268 | else: |
|
269 | 269 | localrevs = repo |
|
270 | 270 | |
|
271 | 271 | mfl = repo.manifestlog |
|
272 | 272 | mfrevlog = mfl.getstorage(b'') |
|
273 | 273 | if base is not None: |
|
274 | 274 | mfdict = mfl[repo[base].manifestnode()].read() |
|
275 | 275 | skip = set(pycompat.iteritems(mfdict)) |
|
276 | 276 | else: |
|
277 | 277 | skip = set() |
|
278 | 278 | |
|
279 | 279 | # Copy the skip set to start large and avoid constant resizing, |
|
280 | 280 | # and since it's likely to be very similar to the prefetch set. |
|
281 | 281 | files = skip.copy() |
|
282 | 282 | serverfiles = skip.copy() |
|
283 | 283 | visited = set() |
|
284 | 284 | visited.add(nullrev) |
|
285 | 285 | revcount = len(revs) |
|
286 | 286 | progress = self.ui.makeprogress(_(b'prefetching'), total=revcount) |
|
287 | 287 | progress.update(0) |
|
288 | 288 | for rev in sorted(revs): |
|
289 | 289 | ctx = repo[rev] |
|
290 | 290 | if pats: |
|
291 | 291 | m = scmutil.match(ctx, pats, opts) |
|
292 | 292 | sparsematch = repo.maybesparsematch(rev) |
|
293 | 293 | |
|
294 | 294 | mfnode = ctx.manifestnode() |
|
295 | 295 | mfrev = mfrevlog.rev(mfnode) |
|
296 | 296 | |
|
297 | 297 | # Decompressing manifests is expensive. |
|
298 | 298 | # When possible, only read the deltas. |
|
299 | 299 | p1, p2 = mfrevlog.parentrevs(mfrev) |
|
300 | 300 | if p1 in visited and p2 in visited: |
|
301 | 301 | mfdict = mfl[mfnode].readfast() |
|
302 | 302 | else: |
|
303 | 303 | mfdict = mfl[mfnode].read() |
|
304 | 304 | |
|
305 | 305 | diff = pycompat.iteritems(mfdict) |
|
306 | 306 | if pats: |
|
307 | 307 | diff = (pf for pf in diff if m(pf[0])) |
|
308 | 308 | if sparsematch: |
|
309 | 309 | diff = (pf for pf in diff if sparsematch(pf[0])) |
|
310 | 310 | if rev not in localrevs: |
|
311 | 311 | serverfiles.update(diff) |
|
312 | 312 | else: |
|
313 | 313 | files.update(diff) |
|
314 | 314 | |
|
315 | 315 | visited.add(mfrev) |
|
316 | 316 | progress.increment() |
|
317 | 317 | |
|
318 | 318 | files.difference_update(skip) |
|
319 | 319 | serverfiles.difference_update(skip) |
|
320 | 320 | progress.complete() |
|
321 | 321 | |
|
322 | 322 | # Fetch files known to be on the server |
|
323 | 323 | if serverfiles: |
|
324 | 324 | results = [(path, hex(fnode)) for (path, fnode) in serverfiles] |
|
325 | 325 | repo.fileservice.prefetch(results, force=True) |
|
326 | 326 | |
|
327 | 327 | # Fetch files that may or may not be on the server |
|
328 | 328 | if files: |
|
329 | 329 | results = [(path, hex(fnode)) for (path, fnode) in files] |
|
330 | 330 | repo.fileservice.prefetch(results) |
|
331 | 331 | |
|
332 | 332 | def close(self): |
|
333 | 333 | super(shallowrepository, self).close() |
|
334 | 334 | self.connectionpool.close() |
|
335 | 335 | |
|
336 | 336 | repo.__class__ = shallowrepository |
|
337 | 337 | |
|
338 | 338 | repo.shallowmatch = match.always() |
|
339 | 339 | |
|
340 | 340 | makeunionstores(repo) |
|
341 | 341 | |
|
342 | 342 | repo.includepattern = repo.ui.configlist( |
|
343 | 343 | b"remotefilelog", b"includepattern", None |
|
344 | 344 | ) |
|
345 | 345 | repo.excludepattern = repo.ui.configlist( |
|
346 | 346 | b"remotefilelog", b"excludepattern", None |
|
347 | 347 | ) |
|
348 | 348 | if not util.safehasattr(repo, 'connectionpool'):
|
349 | 349 | repo.connectionpool = connectionpool.connectionpool(repo) |
|
350 | 350 | |
|
351 | 351 | if repo.includepattern or repo.excludepattern: |
|
352 | 352 | repo.shallowmatch = match.match( |
|
353 | 353 | repo.root, b'', None, repo.includepattern, repo.excludepattern |
|
354 | 354 | ) |
@@ -1,2555 +1,2555 b'' | |||
|
1 | 1 | # bundle2.py - generic container format to transmit arbitrary data. |
|
2 | 2 | # |
|
3 | 3 | # Copyright 2013 Facebook, Inc. |
|
4 | 4 | # |
|
5 | 5 | # This software may be used and distributed according to the terms of the |
|
6 | 6 | # GNU General Public License version 2 or any later version. |
|
7 | 7 | """Handling of the new bundle2 format |
|
8 | 8 | |
|
9 | 9 | The goal of bundle2 is to act as an atomically packet to transmit a set of |
|
10 | 10 | payloads in an application agnostic way. It consist in a sequence of "parts" |
|
11 | 11 | that will be handed to and processed by the application layer. |
|
12 | 12 | |
|
13 | 13 | |
|
14 | 14 | General format architecture |
|
15 | 15 | =========================== |
|
16 | 16 | |
|
17 | 17 | The format is architected as follows
|
18 | 18 | |
|
19 | 19 | - magic string |
|
20 | 20 | - stream level parameters |
|
21 | 21 | - payload parts (any number) |
|
22 | 22 | - end of stream marker. |
|
23 | 23 | |
|
24 | 24 | the Binary format |
|
25 | 25 | ============================ |
|
26 | 26 | |
|
27 | 27 | All numbers are unsigned and big-endian. |
|
28 | 28 | |
|
29 | 29 | stream level parameters |
|
30 | 30 | ------------------------ |
|
31 | 31 | |
|
32 | 32 | The binary format is as follows
|
33 | 33 | |
|
34 | 34 | :params size: int32 |
|
35 | 35 | |
|
36 | 36 | The total number of Bytes used by the parameters |
|
37 | 37 | |
|
38 | 38 | :params value: arbitrary number of Bytes |
|
39 | 39 | |
|
40 | 40 | A blob of `params size` containing the serialized version of all stream level |
|
41 | 41 | parameters. |
|
42 | 42 | |
|
43 | 43 | The blob contains a space separated list of parameters. Parameters with value |
|
44 | 44 | are stored in the form `<name>=<value>`. Both name and value are urlquoted. |
|
45 | 45 | |
|
46 | 46 | Empty names are obviously forbidden.
|
47 | 47 | |
|
48 | 48 | Names MUST start with a letter. If this first letter is lower case, the

49 | 49 | parameter is advisory and can be safely ignored. However, when the first

50 | 50 | letter is capital, the parameter is mandatory and the bundling process MUST

51 | 51 | stop if it is not able to process it.
|
52 | 52 | |
|
53 | 53 | Stream parameters use a simple textual format for two main reasons: |
|
54 | 54 | |
|
55 | 55 | - Stream level parameters should remain simple and we want to discourage any |
|
56 | 56 | crazy usage. |
|
57 | 57 | - Textual data allows easy human inspection of a bundle2 header in case of
|
58 | 58 | troubles. |
|
59 | 59 | |
|
60 | 60 | Any application-level options MUST go into a bundle2 part instead.
|
61 | 61 | |
|
62 | 62 | Payload part |
|
63 | 63 | ------------------------ |
|
64 | 64 | |
|
65 | 65 | The binary format is as follows
|
66 | 66 | |
|
67 | 67 | :header size: int32 |
|
68 | 68 | |
|
69 | 69 | The total number of Bytes used by the part header. When the header is empty |
|
70 | 70 | (size = 0) this is interpreted as the end of stream marker. |
|
71 | 71 | |
|
72 | 72 | :header: |
|
73 | 73 | |
|
74 | 74 | The header defines how to interpret the part. It contains two pieces of
|
75 | 75 | data: the part type, and the part parameters. |
|
76 | 76 | |
|
77 | 77 | The part type is used to route to an application level handler that can

78 | 78 | interpret the payload.
|
79 | 79 | |
|
80 | 80 | Part parameters are passed to the application level handler. They are |
|
81 | 81 | meant to convey information that will help the application level object to |
|
82 | 82 | interpret the part payload. |
|
83 | 83 | |
|
84 | 84 | The binary format of the header is as follows
|
85 | 85 | |
|
86 | 86 | :typesize: (one byte) |
|
87 | 87 | |
|
88 | 88 | :parttype: alphanumerical part name (restricted to [a-zA-Z0-9_:-]*) |
|
89 | 89 | |
|
90 | 90 | :partid: A 32-bit integer (unique in the bundle) that can be used to refer
|
91 | 91 | to this part. |
|
92 | 92 | |
|
93 | 93 | :parameters: |
|
94 | 94 | |
|
95 | 95 | A part's parameters may have arbitrary content; the binary structure is::
|
96 | 96 | |
|
97 | 97 | <mandatory-count><advisory-count><param-sizes><param-data> |
|
98 | 98 | |
|
99 | 99 | :mandatory-count: 1 byte, number of mandatory parameters |
|
100 | 100 | |
|
101 | 101 | :advisory-count: 1 byte, number of advisory parameters |
|
102 | 102 | |
|
103 | 103 | :param-sizes: |
|
104 | 104 | |
|
105 | 105 | N pairs of bytes, where N is the total number of parameters. Each

106 | 106 | pair contains (<size-of-key>, <size-of-value>) for one parameter.
|
107 | 107 | |
|
108 | 108 | :param-data: |
|
109 | 109 | |
|
110 | 110 | A blob of bytes from which each parameter key and value can be |
|
111 | 111 | retrieved using the list of size couples stored in the previous |
|
112 | 112 | field. |
|
113 | 113 | |
|
114 | 114 | Mandatory parameters come first, then the advisory ones.
|
115 | 115 | |
|
116 | 116 | Each parameter's key MUST be unique within the part. |
|
117 | 117 | |
|
118 | 118 | :payload: |
|
119 | 119 | |
|
120 | 120 | payload is a series of `<chunksize><chunkdata>`. |
|
121 | 121 | |
|
122 | 122 | `chunksize` is an int32, `chunkdata` are plain bytes (as much as |
|
123 | 123 | `chunksize` says). The payload part is concluded by a zero-size chunk.
|
124 | 124 | |
|
125 | 125 | The current implementation always produces either zero or one chunk. |
|
126 | 126 | This is an implementation limitation that will ultimately be lifted. |
|
127 | 127 | |
|
128 | 128 | `chunksize` can be negative to trigger special case processing. No such |
|
129 | 129 | processing is in place yet. |
|
130 | 130 | |
|
131 | 131 | Bundle processing |
|
132 | 132 | ============================ |
|
133 | 133 | |
|
134 | 134 | Each part is processed in order using a "part handler". Handlers are registered
|
135 | 135 | for a certain part type. |
|
136 | 136 | |
|
137 | 137 | The matching of a part to its handler is case insensitive. The case of the |
|
138 | 138 | part type is used to know if a part is mandatory or advisory. If the Part type |
|
139 | 139 | contains any uppercase char it is considered mandatory. When no handler is |
|
140 | 140 | known for a Mandatory part, the process is aborted and an exception is raised. |
|
141 | 141 | If the part is advisory and no handler is known, the part is ignored. When the |
|
142 | 142 | process is aborted, the full bundle is still read from the stream to keep the |
|
143 | 143 | channel usable. But none of the parts read after an abort are processed. In the

144 | 144 | future, dropping the stream may become an option for channels we do not care to
|
145 | 145 | preserve. |
|
146 | 146 | """ |
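
To make the layout above concrete, here is a rough, standalone encoder for a single part header following the description (only a sketch of the wire format, not this module's own API)::

    import struct

    def encodepartheader(parttype, partid, mandatory=(), advisory=()):
        header = struct.pack(b'>B', len(parttype)) + parttype   # typesize, parttype
        header += struct.pack(b'>I', partid)                    # partid
        params = list(mandatory) + list(advisory)
        header += struct.pack(b'>BB', len(mandatory), len(advisory))
        sizes = [n for k, v in params for n in (len(k), len(v))]
        header += struct.pack(b'>' + b'BB' * len(params), *sizes)
        header += b''.join(k + v for k, v in params)            # param-data blob
        return struct.pack(b'>i', len(header)) + header         # int32 header size

    encodepartheader(b'changegroup', 0, mandatory=[(b'version', b'02')])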
|
147 | 147 | |
|
148 | 148 | from __future__ import absolute_import, division |
|
149 | 149 | |
|
150 | 150 | import collections |
|
151 | 151 | import errno |
|
152 | 152 | import os |
|
153 | 153 | import re |
|
154 | 154 | import string |
|
155 | 155 | import struct |
|
156 | 156 | import sys |
|
157 | 157 | |
|
158 | 158 | from .i18n import _ |
|
159 | 159 | from . import ( |
|
160 | 160 | bookmarks, |
|
161 | 161 | changegroup, |
|
162 | 162 | encoding, |
|
163 | 163 | error, |
|
164 | 164 | node as nodemod, |
|
165 | 165 | obsolete, |
|
166 | 166 | phases, |
|
167 | 167 | pushkey, |
|
168 | 168 | pycompat, |
|
169 | 169 | streamclone, |
|
170 | 170 | tags, |
|
171 | 171 | url, |
|
172 | 172 | util, |
|
173 | 173 | ) |
|
174 | 174 | from .utils import stringutil |
|
175 | 175 | |
|
176 | 176 | urlerr = util.urlerr |
|
177 | 177 | urlreq = util.urlreq |
|
178 | 178 | |
|
179 | 179 | _pack = struct.pack |
|
180 | 180 | _unpack = struct.unpack |
|
181 | 181 | |
|
182 | 182 | _fstreamparamsize = b'>i' |
|
183 | 183 | _fpartheadersize = b'>i' |
|
184 | 184 | _fparttypesize = b'>B' |
|
185 | 185 | _fpartid = b'>I' |
|
186 | 186 | _fpayloadsize = b'>i' |
|
187 | 187 | _fpartparamcount = b'>BB' |
|
188 | 188 | |
|
189 | 189 | preferedchunksize = 32768 |
|
190 | 190 | |
|
191 | 191 | _parttypeforbidden = re.compile(b'[^a-zA-Z0-9_:-]') |
|
192 | 192 | |
|
193 | 193 | |
|
194 | 194 | def outdebug(ui, message): |
|
195 | 195 | """debug regarding output stream (bundling)""" |
|
196 | 196 | if ui.configbool(b'devel', b'bundle2.debug'): |
|
197 | 197 | ui.debug(b'bundle2-output: %s\n' % message) |
|
198 | 198 | |
|
199 | 199 | |
|
200 | 200 | def indebug(ui, message): |
|
201 | 201 | """debug on input stream (unbundling)""" |
|
202 | 202 | if ui.configbool(b'devel', b'bundle2.debug'): |
|
203 | 203 | ui.debug(b'bundle2-input: %s\n' % message) |
|
204 | 204 | |
|
205 | 205 | |
|
206 | 206 | def validateparttype(parttype): |
|
207 | 207 | """raise ValueError if a parttype contains invalid character""" |
|
208 | 208 | if _parttypeforbidden.search(parttype): |
|
209 | 209 | raise ValueError(parttype) |
|
210 | 210 | |
|
211 | 211 | |
|
212 | 212 | def _makefpartparamsizes(nbparams): |
|
213 | 213 | """return a struct format to read part parameter sizes |
|
214 | 214 | |
|
215 | 215 | The number parameters is variable so we need to build that format |
|
216 | 216 | dynamically. |
|
217 | 217 | """ |
|
218 | 218 | return b'>' + (b'BB' * nbparams) |
|
219 | 219 | |
|
220 | 220 | |
|
221 | 221 | parthandlermapping = {} |
|
222 | 222 | |
|
223 | 223 | |
|
224 | 224 | def parthandler(parttype, params=()): |
|
225 | 225 | """decorator that register a function as a bundle2 part handler |
|
226 | 226 | |
|
227 | 227 | eg:: |
|
228 | 228 | |
|
229 | 229 | @parthandler('myparttype', ('mandatory', 'param', 'handled')) |
|
230 | 230 | def myparttypehandler(...): |
|
231 | 231 | '''process a part of type "my part".''' |
|
232 | 232 | ... |
|
233 | 233 | """ |
|
234 | 234 | validateparttype(parttype) |
|
235 | 235 | |
|
236 | 236 | def _decorator(func): |
|
237 | 237 | lparttype = parttype.lower() # enforce lower case matching. |
|
238 | 238 | assert lparttype not in parthandlermapping |
|
239 | 239 | parthandlermapping[lparttype] = func |
|
240 | 240 | func.params = frozenset(params) |
|
241 | 241 | return func |
|
242 | 242 | |
|
243 | 243 | return _decorator |
|
244 | 244 | |
|
245 | 245 | |
|
246 | 246 | class unbundlerecords(object): |
|
247 | 247 | """keep a record of what happens during an unbundle
|
248 | 248 | |
|
249 | 249 | New records are added using `records.add('cat', obj)`. Where 'cat' is a |
|
250 | 250 | category of record and obj is an arbitrary object. |
|
251 | 251 | |
|
252 | 252 | `records['cat']` will return all entries of this category 'cat'. |
|
253 | 253 | |
|
254 | 254 | Iterating on the object itself will yield `('category', obj)` tuples |
|
255 | 255 | for all entries. |
|
256 | 256 | |
|
257 | 257 | All iterations happen in chronological order.
|
258 | 258 | """ |
|
259 | 259 | |
|
260 | 260 | def __init__(self): |
|
261 | 261 | self._categories = {} |
|
262 | 262 | self._sequences = [] |
|
263 | 263 | self._replies = {} |
|
264 | 264 | |
|
265 | 265 | def add(self, category, entry, inreplyto=None): |
|
266 | 266 | """add a new record of a given category. |
|
267 | 267 | |
|
268 | 268 | The entry can then be retrieved in the list returned by |
|
269 | 269 | self['category'].""" |
|
270 | 270 | self._categories.setdefault(category, []).append(entry) |
|
271 | 271 | self._sequences.append((category, entry)) |
|
272 | 272 | if inreplyto is not None: |
|
273 | 273 | self.getreplies(inreplyto).add(category, entry) |
|
274 | 274 | |
|
275 | 275 | def getreplies(self, partid): |
|
276 | 276 | """get the records that are replies to a specific part""" |
|
277 | 277 | return self._replies.setdefault(partid, unbundlerecords()) |
|
278 | 278 | |
|
279 | 279 | def __getitem__(self, cat): |
|
280 | 280 | return tuple(self._categories.get(cat, ())) |
|
281 | 281 | |
|
282 | 282 | def __iter__(self): |
|
283 | 283 | return iter(self._sequences) |
|
284 | 284 | |
|
285 | 285 | def __len__(self): |
|
286 | 286 | return len(self._sequences) |
|
287 | 287 | |
|
288 | 288 | def __nonzero__(self): |
|
289 | 289 | return bool(self._sequences) |
|
290 | 290 | |
|
291 | 291 | __bool__ = __nonzero__ |
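
A small usage sketch of the record API described in the docstring above (the category names here are arbitrary)::

    records = unbundlerecords()
    records.add(b'changegroup', {b'return': 1})
    records.add(b'obsmarkers', {b'new': 0})
    records[b'changegroup']   # -> ({b'return': 1},)
    list(records)             # -> [(b'changegroup', {b'return': 1}),
                              #     (b'obsmarkers', {b'new': 0})]
    bool(records)             # -> True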
|
292 | 292 | |
|
293 | 293 | |
|
294 | 294 | class bundleoperation(object): |
|
295 | 295 | """an object that represents a single bundling process |
|
296 | 296 | |
|
297 | 297 | Its purpose is to carry unbundle-related objects and states. |
|
298 | 298 | |
|
299 | 299 | A new object should be created at the beginning of each bundle processing. |
|
300 | 300 | The object is to be returned by the processing function. |
|
301 | 301 | |
|
302 | 302 | The object has very little content now; it will ultimately contain:
|
303 | 303 | * an access to the repo the bundle is applied to, |
|
304 | 304 | * a ui object, |
|
305 | 305 | * a way to retrieve a transaction to add changes to the repo, |
|
306 | 306 | * a way to record the result of processing each part, |
|
307 | 307 | * a way to construct a bundle response when applicable. |
|
308 | 308 | """ |
|
309 | 309 | |
|
310 | 310 | def __init__(self, repo, transactiongetter, captureoutput=True, source=b''): |
|
311 | 311 | self.repo = repo |
|
312 | 312 | self.ui = repo.ui |
|
313 | 313 | self.records = unbundlerecords() |
|
314 | 314 | self.reply = None |
|
315 | 315 | self.captureoutput = captureoutput |
|
316 | 316 | self.hookargs = {} |
|
317 | 317 | self._gettransaction = transactiongetter |
|
318 | 318 | # carries value that can modify part behavior |
|
319 | 319 | self.modes = {} |
|
320 | 320 | self.source = source |
|
321 | 321 | |
|
322 | 322 | def gettransaction(self): |
|
323 | 323 | transaction = self._gettransaction() |
|
324 | 324 | |
|
325 | 325 | if self.hookargs: |
|
326 | 326 | # the ones added to the transaction supersede those added
|
327 | 327 | # to the operation. |
|
328 | 328 | self.hookargs.update(transaction.hookargs) |
|
329 | 329 | transaction.hookargs = self.hookargs |
|
330 | 330 | |
|
331 | 331 | # mark the hookargs as flushed. further attempts to add to |
|
332 | 332 | # hookargs will result in an abort. |
|
333 | 333 | self.hookargs = None |
|
334 | 334 | |
|
335 | 335 | return transaction |
|
336 | 336 | |
|
337 | 337 | def addhookargs(self, hookargs): |
|
338 | 338 | if self.hookargs is None: |
|
339 | 339 | raise error.ProgrammingError( |
|
340 | 340 | b'attempted to add hookargs to ' |
|
341 | 341 | b'operation after transaction started' |
|
342 | 342 | ) |
|
343 | 343 | self.hookargs.update(hookargs) |
|
344 | 344 | |
|
345 | 345 | |
|
346 | 346 | class TransactionUnavailable(RuntimeError): |
|
347 | 347 | pass |
|
348 | 348 | |
|
349 | 349 | |
|
350 | 350 | def _notransaction(): |
|
351 | 351 | """default method to get a transaction while processing a bundle |
|
352 | 352 | |
|
353 | 353 | Raise an exception to highlight the fact that no transaction was expected |
|
354 | 354 | to be created""" |
|
355 | 355 | raise TransactionUnavailable() |
|
356 | 356 | |
|
357 | 357 | |
|
358 | 358 | def applybundle(repo, unbundler, tr, source, url=None, **kwargs): |
|
359 | 359 | # transform me into unbundler.apply() as soon as the freeze is lifted |
|
360 | 360 | if isinstance(unbundler, unbundle20): |
|
361 | 361 | tr.hookargs[b'bundle2'] = b'1' |
|
362 | 362 | if source is not None and b'source' not in tr.hookargs: |
|
363 | 363 | tr.hookargs[b'source'] = source |
|
364 | 364 | if url is not None and b'url' not in tr.hookargs: |
|
365 | 365 | tr.hookargs[b'url'] = url |
|
366 | 366 | return processbundle(repo, unbundler, lambda: tr, source=source) |
|
367 | 367 | else: |
|
368 | 368 | # the transactiongetter won't be used, but we might as well set it |
|
369 | 369 | op = bundleoperation(repo, lambda: tr, source=source) |
|
370 | 370 | _processchangegroup(op, unbundler, tr, source, url, **kwargs) |
|
371 | 371 | return op |
|
372 | 372 | |
|
373 | 373 | |
|
374 | 374 | class partiterator(object): |
|
375 | 375 | def __init__(self, repo, op, unbundler): |
|
376 | 376 | self.repo = repo |
|
377 | 377 | self.op = op |
|
378 | 378 | self.unbundler = unbundler |
|
379 | 379 | self.iterator = None |
|
380 | 380 | self.count = 0 |
|
381 | 381 | self.current = None |
|
382 | 382 | |
|
383 | 383 | def __enter__(self): |
|
384 | 384 | def func(): |
|
385 | 385 | itr = enumerate(self.unbundler.iterparts(), 1) |
|
386 | 386 | for count, p in itr: |
|
387 | 387 | self.count = count |
|
388 | 388 | self.current = p |
|
389 | 389 | yield p |
|
390 | 390 | p.consume() |
|
391 | 391 | self.current = None |
|
392 | 392 | |
|
393 | 393 | self.iterator = func() |
|
394 | 394 | return self.iterator |
|
395 | 395 | |
|
396 | 396 | def __exit__(self, type, exc, tb): |
|
397 | 397 | if not self.iterator: |
|
398 | 398 | return |
|
399 | 399 | |
|
400 | 400 | # Only gracefully abort in a normal exception situation. User aborts |
|
401 | 401 | # like Ctrl+C throw a KeyboardInterrupt which is not a base Exception, |
|
402 | 402 | # and should not gracefully cleanup. |
|
403 | 403 | if isinstance(exc, Exception): |
|
404 | 404 | # Any exceptions seeking to the end of the bundle at this point are |
|
405 | 405 | # almost certainly related to the underlying stream being bad. |
|
406 | 406 | # And, chances are that the exception we're handling is related to |
|
407 | 407 | # getting in that bad state. So, we swallow the seeking error and |
|
408 | 408 | # re-raise the original error. |
|
409 | 409 | seekerror = False |
|
410 | 410 | try: |
|
411 | 411 | if self.current: |
|
412 | 412 | # consume the part content to not corrupt the stream. |
|
413 | 413 | self.current.consume() |
|
414 | 414 | |
|
415 | 415 | for part in self.iterator: |
|
416 | 416 | # consume the bundle content |
|
417 | 417 | part.consume() |
|
418 | 418 | except Exception: |
|
419 | 419 | seekerror = True |
|
420 | 420 | |
|
421 | 421 | # Small hack to let caller code distinguish exceptions from bundle2 |
|
422 | 422 | # processing from processing the old format. This is mostly needed |
|
423 | 423 | # to handle different return codes to unbundle according to the type |
|
424 | 424 | # of bundle. We should probably clean up or drop this return code |
|
425 | 425 | # craziness in a future version. |
|
426 | 426 | exc.duringunbundle2 = True |
|
427 | 427 | salvaged = [] |
|
428 | 428 | replycaps = None |
|
429 | 429 | if self.op.reply is not None: |
|
430 | 430 | salvaged = self.op.reply.salvageoutput() |
|
431 | 431 | replycaps = self.op.reply.capabilities |
|
432 | 432 | exc._replycaps = replycaps |
|
433 | 433 | exc._bundle2salvagedoutput = salvaged |
|
434 | 434 | |
|
435 | 435 | # Re-raising from a variable loses the original stack. So only use |
|
436 | 436 | # that form if we need to. |
|
437 | 437 | if seekerror: |
|
438 | 438 | raise exc |
|
439 | 439 | |
|
440 | 440 | self.repo.ui.debug( |
|
441 | 441 | b'bundle2-input-bundle: %i parts total\n' % self.count |
|
442 | 442 | ) |
|
443 | 443 | |
|
444 | 444 | |
|
445 | 445 | def processbundle(repo, unbundler, transactiongetter=None, op=None, source=b''): |
|
446 | 446 | """This function process a bundle, apply effect to/from a repo |
|
447 | 447 | |
|
448 | 448 | It iterates over each part then searches for and uses the proper handling |
|
449 | 449 | code to process the part. Parts are processed in order. |
|
450 | 450 | |
|
451 | 451 | An unknown mandatory part will abort the process.
|
452 | 452 | |
|
453 | 453 | It is temporarily possible to provide a prebuilt bundleoperation to the |
|
454 | 454 | function. This is used to ensure output is properly propagated in case of |
|
455 | 455 | an error during the unbundling. This output capturing part will likely be |
|
456 | 456 | reworked and this ability will probably go away in the process. |
|
457 | 457 | """ |
|
458 | 458 | if op is None: |
|
459 | 459 | if transactiongetter is None: |
|
460 | 460 | transactiongetter = _notransaction |
|
461 | 461 | op = bundleoperation(repo, transactiongetter, source=source) |
|
462 | 462 | # todo: |
|
463 | 463 | # - replace this with an init function soon.
|
464 | 464 | # - exception catching |
|
465 | 465 | unbundler.params |
|
466 | 466 | if repo.ui.debugflag: |
|
467 | 467 | msg = [b'bundle2-input-bundle:'] |
|
468 | 468 | if unbundler.params: |
|
469 | 469 | msg.append(b' %i params' % len(unbundler.params)) |
|
470 | 470 | if op._gettransaction is None or op._gettransaction is _notransaction: |
|
471 | 471 | msg.append(b' no-transaction') |
|
472 | 472 | else: |
|
473 | 473 | msg.append(b' with-transaction') |
|
474 | 474 | msg.append(b'\n') |
|
475 | 475 | repo.ui.debug(b''.join(msg)) |
|
476 | 476 | |
|
477 | 477 | processparts(repo, op, unbundler) |
|
478 | 478 | |
|
479 | 479 | return op |
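As a usage illustration (not part of the module), the sketch below feeds a bundle2 file through processbundle(), supplying the transaction lazily just like the `lambda: tr` transactiongetter used above; the repository path, bundle file name, and lock/transaction handling are assumptions made for the example.

# Hedged usage sketch (assumptions: mercurial is importable, the current
# directory is a repository, and 'example.hg' is an HG20 bundle file).
from mercurial import bundle2, hg, ui as uimod

ui = uimod.ui.load()
repo = hg.repository(ui, b'.')
with open('example.hg', 'rb') as fh:
    unbundler = bundle2.getunbundler(ui, fh)
    with repo.lock(), repo.transaction(b'example-unbundle') as tr:
        # parts that need a transaction (e.g. changegroups) obtain it lazily
        op = bundle2.processbundle(repo, unbundler, lambda: tr)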
|
480 | 480 | |
|
481 | 481 | |
|
482 | 482 | def processparts(repo, op, unbundler): |
|
483 | 483 | with partiterator(repo, op, unbundler) as parts: |
|
484 | 484 | for part in parts: |
|
485 | 485 | _processpart(op, part) |
|
486 | 486 | |
|
487 | 487 | |
|
488 | 488 | def _processchangegroup(op, cg, tr, source, url, **kwargs): |
|
489 | 489 | ret = cg.apply(op.repo, tr, source, url, **kwargs) |
|
490 | 490 | op.records.add(b'changegroup', {b'return': ret,}) |
|
491 | 491 | return ret |
|
492 | 492 | |
|
493 | 493 | |
|
494 | 494 | def _gethandler(op, part): |
|
495 | 495 | status = b'unknown' # used by debug output |
|
496 | 496 | try: |
|
497 | 497 | handler = parthandlermapping.get(part.type) |
|
498 | 498 | if handler is None: |
|
499 | 499 | status = b'unsupported-type' |
|
500 | 500 | raise error.BundleUnknownFeatureError(parttype=part.type) |
|
501 | 501 | indebug(op.ui, b'found a handler for part %s' % part.type) |
|
502 | 502 | unknownparams = part.mandatorykeys - handler.params |
|
503 | 503 | if unknownparams: |
|
504 | 504 | unknownparams = list(unknownparams) |
|
505 | 505 | unknownparams.sort() |
|
506 | 506 | status = b'unsupported-params (%s)' % b', '.join(unknownparams) |
|
507 | 507 | raise error.BundleUnknownFeatureError( |
|
508 | 508 | parttype=part.type, params=unknownparams |
|
509 | 509 | ) |
|
510 | 510 | status = b'supported' |
|
511 | 511 | except error.BundleUnknownFeatureError as exc: |
|
512 | 512 | if part.mandatory: # mandatory parts |
|
513 | 513 | raise |
|
514 | 514 | indebug(op.ui, b'ignoring unsupported advisory part %s' % exc) |
|
515 | 515 | return # skip to part processing |
|
516 | 516 | finally: |
|
517 | 517 | if op.ui.debugflag: |
|
518 | 518 | msg = [b'bundle2-input-part: "%s"' % part.type] |
|
519 | 519 | if not part.mandatory: |
|
520 | 520 | msg.append(b' (advisory)') |
|
521 | 521 | nbmp = len(part.mandatorykeys) |
|
522 | 522 | nbap = len(part.params) - nbmp |
|
523 | 523 | if nbmp or nbap: |
|
524 | 524 | msg.append(b' (params:') |
|
525 | 525 | if nbmp: |
|
526 | 526 | msg.append(b' %i mandatory' % nbmp) |
|
527 | 527 | if nbap: |
|
528 | 528 | msg.append(b' %i advisory' % nbap)
|
529 | 529 | msg.append(b')') |
|
530 | 530 | msg.append(b' %s\n' % status) |
|
531 | 531 | op.ui.debug(b''.join(msg)) |
|
532 | 532 | |
|
533 | 533 | return handler |
|
534 | 534 | |
|
535 | 535 | |
|
536 | 536 | def _processpart(op, part): |
|
537 | 537 | """process a single part from a bundle |
|
538 | 538 | |
|
539 | 539 | The part is guaranteed to have been fully consumed when the function exits |
|
540 | 540 | (even if an exception is raised).""" |
|
541 | 541 | handler = _gethandler(op, part) |
|
542 | 542 | if handler is None: |
|
543 | 543 | return |
|
544 | 544 | |
|
545 | 545 | # handler is called outside the above try block so that we don't |
|
546 | 546 | # risk catching KeyErrors from anything other than the |
|
547 | 547 | # parthandlermapping lookup (any KeyError raised by handler() |
|
548 | 548 | # itself represents a defect of a different variety). |
|
549 | 549 | output = None |
|
550 | 550 | if op.captureoutput and op.reply is not None: |
|
551 | 551 | op.ui.pushbuffer(error=True, subproc=True) |
|
552 | 552 | output = b'' |
|
553 | 553 | try: |
|
554 | 554 | handler(op, part) |
|
555 | 555 | finally: |
|
556 | 556 | if output is not None: |
|
557 | 557 | output = op.ui.popbuffer() |
|
558 | 558 | if output: |
|
559 | 559 | outpart = op.reply.newpart(b'output', data=output, mandatory=False) |
|
560 | 560 | outpart.addparam( |
|
561 | 561 | b'in-reply-to', pycompat.bytestr(part.id), mandatory=False |
|
562 | 562 | ) |
|
563 | 563 | |
|
564 | 564 | |
|
565 | 565 | def decodecaps(blob): |
|
566 | 566 | """decode a bundle2 caps bytes blob into a dictionary |
|
567 | 567 | |
|
568 | 568 | The blob is a list of capabilities (one per line) |
|
569 | 569 | Capabilities may have values using a line of the form:: |
|
570 | 570 | |
|
571 | 571 | capability=value1,value2,value3 |
|
572 | 572 | |
|
573 | 573 | The values are always a list.""" |
|
574 | 574 | caps = {} |
|
575 | 575 | for line in blob.splitlines(): |
|
576 | 576 | if not line: |
|
577 | 577 | continue |
|
578 | 578 | if b'=' not in line: |
|
579 | 579 | key, vals = line, () |
|
580 | 580 | else: |
|
581 | 581 | key, vals = line.split(b'=', 1) |
|
582 | 582 | vals = vals.split(b',') |
|
583 | 583 | key = urlreq.unquote(key) |
|
584 | 584 | vals = [urlreq.unquote(v) for v in vals] |
|
585 | 585 | caps[key] = vals |
|
586 | 586 | return caps |
|
587 | 587 | |
|
588 | 588 | |
|
589 | 589 | def encodecaps(caps): |
|
590 | 590 | """encode a bundle2 caps dictionary into a bytes blob""" |
|
591 | 591 | chunks = [] |
|
592 | 592 | for ca in sorted(caps): |
|
593 | 593 | vals = caps[ca] |
|
594 | 594 | ca = urlreq.quote(ca) |
|
595 | 595 | vals = [urlreq.quote(v) for v in vals] |
|
596 | 596 | if vals: |
|
597 | 597 | ca = b"%s=%s" % (ca, b','.join(vals)) |
|
598 | 598 | chunks.append(ca) |
|
599 | 599 | return b'\n'.join(chunks) |
|
600 | 600 | |
|
601 | 601 | |
|
602 | 602 | bundletypes = { |
|
603 | 603 | b"": (b"", b'UN'), # only when using unbundle on ssh and old http servers |
|
604 | 604 | # since the unification ssh accepts a header but there |
|
605 | 605 | # is no capability signaling it. |
|
606 | 606 | b"HG20": (), # special-cased below |
|
607 | 607 | b"HG10UN": (b"HG10UN", b'UN'), |
|
608 | 608 | b"HG10BZ": (b"HG10", b'BZ'), |
|
609 | 609 | b"HG10GZ": (b"HG10GZ", b'GZ'), |
|
610 | 610 | } |
|
611 | 611 | |
|
612 | 612 | # hgweb uses this list to communicate its preferred type |
|
613 | 613 | bundlepriority = [b'HG10GZ', b'HG10BZ', b'HG10UN'] |
|
614 | 614 | |
|
615 | 615 | |
|
616 | 616 | class bundle20(object): |
|
617 | 617 | """represent an outgoing bundle2 container |
|
618 | 618 | |
|
619 | 619 | Use the `addparam` method to add a stream level parameter and `newpart` to
|
620 | 620 | populate it. Then call `getchunks` to retrieve all the binary chunks of |
|
621 | 621 | data that compose the bundle2 container.""" |
|
622 | 622 | |
|
623 | 623 | _magicstring = b'HG20' |
|
624 | 624 | |
|
625 | 625 | def __init__(self, ui, capabilities=()): |
|
626 | 626 | self.ui = ui |
|
627 | 627 | self._params = [] |
|
628 | 628 | self._parts = [] |
|
629 | 629 | self.capabilities = dict(capabilities) |
|
630 | 630 | self._compengine = util.compengines.forbundletype(b'UN') |
|
631 | 631 | self._compopts = None |
|
632 | 632 | # If compression is being handled by a consumer of the raw |
|
633 | 633 | # data (e.g. the wire protocol), unsetting this flag tells |
|
634 | 634 | # consumers that the bundle is best left uncompressed. |
|
635 | 635 | self.prefercompressed = True |
|
636 | 636 | |
|
637 | 637 | def setcompression(self, alg, compopts=None): |
|
638 | 638 | """setup core part compression to <alg>""" |
|
639 | 639 | if alg in (None, b'UN'): |
|
640 | 640 | return |
|
641 | 641 | assert not any(n.lower() == b'compression' for n, v in self._params) |
|
642 | 642 | self.addparam(b'Compression', alg) |
|
643 | 643 | self._compengine = util.compengines.forbundletype(alg) |
|
644 | 644 | self._compopts = compopts |
|
645 | 645 | |
|
646 | 646 | @property |
|
647 | 647 | def nbparts(self): |
|
648 | 648 | """total number of parts added to the bundler""" |
|
649 | 649 | return len(self._parts) |
|
650 | 650 | |
|
651 | 651 | # methods used to define the bundle2 content
|
652 | 652 | def addparam(self, name, value=None): |
|
653 | 653 | """add a stream level parameter""" |
|
654 | 654 | if not name: |
|
655 | 655 | raise error.ProgrammingError(b'empty parameter name') |
|
656 | 656 | if name[0:1] not in pycompat.bytestr(string.ascii_letters): |
|
657 | 657 | raise error.ProgrammingError( |
|
658 | 658 | b'non letter first character: %s' % name |
|
659 | 659 | ) |
|
660 | 660 | self._params.append((name, value)) |
|
661 | 661 | |
|
662 | 662 | def addpart(self, part): |
|
663 | 663 | """add a new part to the bundle2 container |
|
664 | 664 | |
|
665 | 665 | Parts contains the actual applicative payload.""" |
|
666 | 666 | assert part.id is None |
|
667 | 667 | part.id = len(self._parts) # very cheap counter |
|
668 | 668 | self._parts.append(part) |
|
669 | 669 | |
|
670 | 670 | def newpart(self, typeid, *args, **kwargs): |
|
671 | 671 | """create a new part and add it to the containers |
|
672 | 672 | |
|
673 | 673 | The part is directly added to the container. For now, this means
|
674 | 674 | that any failure to properly initialize the part after calling |
|
675 | 675 | ``newpart`` should result in a failure of the whole bundling process. |
|
676 | 676 | |
|
677 | 677 | You can still fall back to manually creating and adding the part if you need better
|
678 | 678 | control.""" |
|
679 | 679 | part = bundlepart(typeid, *args, **kwargs) |
|
680 | 680 | self.addpart(part) |
|
681 | 681 | return part |
|
682 | 682 | |
|
683 | 683 | # methods used to generate the bundle2 stream |
|
684 | 684 | def getchunks(self): |
|
685 | 685 | if self.ui.debugflag: |
|
686 | 686 | msg = [b'bundle2-output-bundle: "%s",' % self._magicstring] |
|
687 | 687 | if self._params: |
|
688 | 688 | msg.append(b' (%i params)' % len(self._params)) |
|
689 | 689 | msg.append(b' %i parts total\n' % len(self._parts)) |
|
690 | 690 | self.ui.debug(b''.join(msg)) |
|
691 | 691 | outdebug(self.ui, b'start emission of %s stream' % self._magicstring) |
|
692 | 692 | yield self._magicstring |
|
693 | 693 | param = self._paramchunk() |
|
694 | 694 | outdebug(self.ui, b'bundle parameter: %s' % param) |
|
695 | 695 | yield _pack(_fstreamparamsize, len(param)) |
|
696 | 696 | if param: |
|
697 | 697 | yield param |
|
698 | 698 | for chunk in self._compengine.compressstream( |
|
699 | 699 | self._getcorechunk(), self._compopts |
|
700 | 700 | ): |
|
701 | 701 | yield chunk |
|
702 | 702 | |
|
703 | 703 | def _paramchunk(self): |
|
704 | 704 | """return a encoded version of all stream parameters""" |
|
705 | 705 | blocks = [] |
|
706 | 706 | for par, value in self._params: |
|
707 | 707 | par = urlreq.quote(par) |
|
708 | 708 | if value is not None: |
|
709 | 709 | value = urlreq.quote(value) |
|
710 | 710 | par = b'%s=%s' % (par, value) |
|
711 | 711 | blocks.append(par) |
|
712 | 712 | return b' '.join(blocks) |
|
713 | 713 | |
|
714 | 714 | def _getcorechunk(self): |
|
715 | 715 | """yield chunk for the core part of the bundle |
|
716 | 716 | |
|
717 | 717 | (all but headers and parameters)""" |
|
718 | 718 | outdebug(self.ui, b'start of parts') |
|
719 | 719 | for part in self._parts: |
|
720 | 720 | outdebug(self.ui, b'bundle part: "%s"' % part.type) |
|
721 | 721 | for chunk in part.getchunks(ui=self.ui): |
|
722 | 722 | yield chunk |
|
723 | 723 | outdebug(self.ui, b'end of bundle') |
|
724 | 724 | yield _pack(_fpartheadersize, 0) |
|
725 | 725 | |
|
726 | 726 | def salvageoutput(self): |
|
727 | 727 | """return a list with a copy of all output parts in the bundle |
|
728 | 728 | |
|
729 | 729 | This is meant to be used during error handling to make sure we preserve |
|
730 | 730 | server output""" |
|
731 | 731 | salvaged = [] |
|
732 | 732 | for part in self._parts: |
|
733 | 733 | if part.type.startswith(b'output'): |
|
734 | 734 | salvaged.append(part.copy()) |
|
735 | 735 | return salvaged |
|
736 | 736 | |
|
737 | 737 | |
|
738 | 738 | class unpackermixin(object): |
|
739 | 739 | """A mixin to extract bytes and struct data from a stream""" |
|
740 | 740 | |
|
741 | 741 | def __init__(self, fp): |
|
742 | 742 | self._fp = fp |
|
743 | 743 | |
|
744 | 744 | def _unpack(self, format): |
|
745 | 745 | """unpack this struct format from the stream |
|
746 | 746 | |
|
747 | 747 | This method is meant for internal usage by the bundle2 protocol only. |
|
748 | 748 | It directly manipulates the low level stream, including bundle2 level

749 | 749 | instructions.
|
750 | 750 | |
|
751 | 751 | Do not use it to implement higher-level logic or methods.""" |
|
752 | 752 | data = self._readexact(struct.calcsize(format)) |
|
753 | 753 | return _unpack(format, data) |
|
754 | 754 | |
|
755 | 755 | def _readexact(self, size): |
|
756 | 756 | """read exactly <size> bytes from the stream |
|
757 | 757 | |
|
758 | 758 | This method is meant for internal usage by the bundle2 protocol only. |
|
758 | 758 | It directly manipulates the low level stream, including bundle2 level

759 | 759 | instructions.
|
761 | 761 | |
|
762 | 762 | Do not use it to implement higher-level logic or methods.""" |
|
763 | 763 | return changegroup.readexactly(self._fp, size) |
|
764 | 764 | |
|
765 | 765 | |
|
766 | 766 | def getunbundler(ui, fp, magicstring=None): |
|
767 | 767 | """return a valid unbundler object for a given magicstring""" |
|
768 | 768 | if magicstring is None: |
|
769 | 769 | magicstring = changegroup.readexactly(fp, 4) |
|
770 | 770 | magic, version = magicstring[0:2], magicstring[2:4] |
|
771 | 771 | if magic != b'HG': |
|
772 | 772 | ui.debug( |
|
773 | 773 | b"error: invalid magic: %r (version %r), should be 'HG'\n" |
|
774 | 774 | % (magic, version) |
|
775 | 775 | ) |
|
776 | 776 | raise error.Abort(_(b'not a Mercurial bundle')) |
|
777 | 777 | unbundlerclass = formatmap.get(version) |
|
778 | 778 | if unbundlerclass is None: |
|
779 | 779 | raise error.Abort(_(b'unknown bundle version %s') % version) |
|
780 | 780 | unbundler = unbundlerclass(ui, fp) |
|
781 | 781 | indebug(ui, b'start processing of %s stream' % magicstring) |
|
782 | 782 | return unbundler |
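For illustration only (not part of the module): a bundle built in memory can be read back through getunbundler() and iterparts(); io.BytesIO stands in for a real stream.

import io
from mercurial import bundle2, ui as uimod

ui = uimod.ui.load()
bundler = bundle2.bundle20(ui)
bundler.newpart(b'output', data=b'hello', mandatory=False)
raw = b''.join(bundler.getchunks())

unbundler = bundle2.getunbundler(ui, io.BytesIO(raw))
for part in unbundler.iterparts():
    # read the part while it is current; iterparts() consumes any
    # remainder itself after the yield
    print(part.type, part.read())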
|
783 | 783 | |
|
784 | 784 | |
|
785 | 785 | class unbundle20(unpackermixin): |
|
786 | 786 | """interpret a bundle2 stream |
|
787 | 787 | |
|
788 | 788 | This class is fed with a binary stream and yields parts through its |
|
789 | 789 | `iterparts` method."""
|
790 | 790 | |
|
791 | 791 | _magicstring = b'HG20' |
|
792 | 792 | |
|
793 | 793 | def __init__(self, ui, fp): |
|
794 | 794 | """If header is specified, we do not read it out of the stream.""" |
|
795 | 795 | self.ui = ui |
|
796 | 796 | self._compengine = util.compengines.forbundletype(b'UN') |
|
797 | 797 | self._compressed = None |
|
798 | 798 | super(unbundle20, self).__init__(fp) |
|
799 | 799 | |
|
800 | 800 | @util.propertycache |
|
801 | 801 | def params(self): |
|
802 | 802 | """dictionary of stream level parameters""" |
|
803 | 803 | indebug(self.ui, b'reading bundle2 stream parameters') |
|
804 | 804 | params = {} |
|
805 | 805 | paramssize = self._unpack(_fstreamparamsize)[0] |
|
806 | 806 | if paramssize < 0: |
|
807 | 807 | raise error.BundleValueError( |
|
808 | 808 | b'negative bundle param size: %i' % paramssize |
|
809 | 809 | ) |
|
810 | 810 | if paramssize: |
|
811 | 811 | params = self._readexact(paramssize) |
|
812 | 812 | params = self._processallparams(params) |
|
813 | 813 | return params |
|
814 | 814 | |
|
815 | 815 | def _processallparams(self, paramsblock): |
|
816 | 816 | """""" |
|
817 | 817 | params = util.sortdict() |
|
818 | 818 | for p in paramsblock.split(b' '): |
|
819 | 819 | p = p.split(b'=', 1) |
|
820 | 820 | p = [urlreq.unquote(i) for i in p] |
|
821 | 821 | if len(p) < 2: |
|
822 | 822 | p.append(None) |
|
823 | 823 | self._processparam(*p) |
|
824 | 824 | params[p[0]] = p[1] |
|
825 | 825 | return params |
|
826 | 826 | |
|
827 | 827 | def _processparam(self, name, value): |
|
828 | 828 | """process a parameter, applying its effect if needed |
|
829 | 829 | |
|
830 | 830 | Parameters starting with a lower case letter are advisory and will be

831 | 831 | ignored when unknown. Those starting with an upper case letter are

832 | 832 | mandatory; this function will raise an error when they are unknown.
|
833 | 833 | |
|
834 | 834 | Note: no options are currently supported. Any input will be either

835 | 835 | ignored or rejected.
|
836 | 836 | """ |
|
837 | 837 | if not name: |
|
838 | 838 | raise ValueError(r'empty parameter name') |
|
839 | 839 | if name[0:1] not in pycompat.bytestr(string.ascii_letters): |
|
840 | 840 | raise ValueError(r'non letter first character: %s' % name) |
|
841 | 841 | try: |
|
842 | 842 | handler = b2streamparamsmap[name.lower()] |
|
843 | 843 | except KeyError: |
|
844 | 844 | if name[0:1].islower(): |
|
845 | 845 | indebug(self.ui, b"ignoring unknown parameter %s" % name) |
|
846 | 846 | else: |
|
847 | 847 | raise error.BundleUnknownFeatureError(params=(name,)) |
|
848 | 848 | else: |
|
849 | 849 | handler(self, name, value) |
|
850 | 850 | |
|
851 | 851 | def _forwardchunks(self): |
|
852 | 852 | """utility to transfer a bundle2 as binary |
|
853 | 853 | |
|
854 | 854 | This is made necessary by the fact that the 'getbundle' command over 'ssh'

855 | 855 | has no way to know when the reply ends, relying on the bundle being

856 | 856 | interpreted to find its end. This is terrible and we are sorry, but we
|
857 | 857 | needed to move forward to get general delta enabled. |
|
858 | 858 | """ |
|
859 | 859 | yield self._magicstring |
|
860 | 860 | assert b'params' not in vars(self) |
|
861 | 861 | paramssize = self._unpack(_fstreamparamsize)[0] |
|
862 | 862 | if paramssize < 0: |
|
863 | 863 | raise error.BundleValueError( |
|
864 | 864 | b'negative bundle param size: %i' % paramssize |
|
865 | 865 | ) |
|
866 | 866 | if paramssize: |
|
867 | 867 | params = self._readexact(paramssize) |
|
868 | 868 | self._processallparams(params) |
|
869 | 869 | # The payload itself is decompressed below, so drop |
|
870 | 870 | # the compression parameter passed down to compensate. |
|
871 | 871 | outparams = [] |
|
872 | 872 | for p in params.split(b' '): |
|
873 | 873 | k, v = p.split(b'=', 1) |
|
874 | 874 | if k.lower() != b'compression': |
|
875 | 875 | outparams.append(p) |
|
876 | 876 | outparams = b' '.join(outparams) |
|
877 | 877 | yield _pack(_fstreamparamsize, len(outparams)) |
|
878 | 878 | yield outparams |
|
879 | 879 | else: |
|
880 | 880 | yield _pack(_fstreamparamsize, paramssize) |
|
881 | 881 | # From there, payload might need to be decompressed |
|
882 | 882 | self._fp = self._compengine.decompressorreader(self._fp) |
|
883 | 883 | emptycount = 0 |
|
884 | 884 | while emptycount < 2: |
|
885 | 885 | # so we can brainlessly loop |
|
886 | 886 | assert _fpartheadersize == _fpayloadsize |
|
887 | 887 | size = self._unpack(_fpartheadersize)[0] |
|
888 | 888 | yield _pack(_fpartheadersize, size) |
|
889 | 889 | if size: |
|
890 | 890 | emptycount = 0 |
|
891 | 891 | else: |
|
892 | 892 | emptycount += 1 |
|
893 | 893 | continue |
|
894 | 894 | if size == flaginterrupt: |
|
895 | 895 | continue |
|
896 | 896 | elif size < 0: |
|
897 | 897 | raise error.BundleValueError(b'negative chunk size: %i') |
|
898 | 898 | yield self._readexact(size) |
|
899 | 899 | |
|
900 | 900 | def iterparts(self, seekable=False): |
|
901 | 901 | """yield all parts contained in the stream""" |
|
902 | 902 | cls = seekableunbundlepart if seekable else unbundlepart |
|
903 | 903 | # make sure params have been loaded
|
904 | 904 | self.params |
|
905 | 905 | # From there, the payload needs to be decompressed
|
906 | 906 | self._fp = self._compengine.decompressorreader(self._fp) |
|
907 | 907 | indebug(self.ui, b'start extraction of bundle2 parts') |
|
908 | 908 | headerblock = self._readpartheader() |
|
909 | 909 | while headerblock is not None: |
|
910 | 910 | part = cls(self.ui, headerblock, self._fp) |
|
911 | 911 | yield part |
|
912 | 912 | # Ensure part is fully consumed so we can start reading the next |
|
913 | 913 | # part. |
|
914 | 914 | part.consume() |
|
915 | 915 | |
|
916 | 916 | headerblock = self._readpartheader() |
|
917 | 917 | indebug(self.ui, b'end of bundle2 stream') |
|
918 | 918 | |
|
919 | 919 | def _readpartheader(self): |
|
920 | 920 | """reads a part header size and return the bytes blob |
|
921 | 921 | |
|
922 | 922 | returns None if empty""" |
|
923 | 923 | headersize = self._unpack(_fpartheadersize)[0] |
|
924 | 924 | if headersize < 0: |
|
925 | 925 | raise error.BundleValueError( |
|
926 | 926 | b'negative part header size: %i' % headersize |
|
927 | 927 | ) |
|
928 | 928 | indebug(self.ui, b'part header size: %i' % headersize) |
|
929 | 929 | if headersize: |
|
930 | 930 | return self._readexact(headersize) |
|
931 | 931 | return None |
|
932 | 932 | |
|
933 | 933 | def compressed(self): |
|
934 | 934 | self.params # load params |
|
935 | 935 | return self._compressed |
|
936 | 936 | |
|
937 | 937 | def close(self): |
|
938 | 938 | """close underlying file""" |
|
939 |
if util.safehasattr(self._fp, |
|
|
939 | if util.safehasattr(self._fp, 'close'): | |
|
940 | 940 | return self._fp.close() |
|
941 | 941 | |
|
942 | 942 | |
|
943 | 943 | formatmap = {b'20': unbundle20} |
|
944 | 944 | |
|
945 | 945 | b2streamparamsmap = {} |
|
946 | 946 | |
|
947 | 947 | |
|
948 | 948 | def b2streamparamhandler(name): |
|
949 | 949 | """register a handler for a stream level parameter""" |
|
950 | 950 | |
|
951 | 951 | def decorator(func): |
|
952 | 952 | assert name not in formatmap |
|
953 | 953 | b2streamparamsmap[name] = func |
|
954 | 954 | return func |
|
955 | 955 | |
|
956 | 956 | return decorator |
|
957 | 957 | |
|
958 | 958 | |
|
959 | 959 | @b2streamparamhandler(b'compression') |
|
960 | 960 | def processcompression(unbundler, param, value): |
|
961 | 961 | """read compression parameter and install payload decompression""" |
|
962 | 962 | if value not in util.compengines.supportedbundletypes: |
|
963 | 963 | raise error.BundleUnknownFeatureError(params=(param,), values=(value,)) |
|
964 | 964 | unbundler._compengine = util.compengines.forbundletype(value) |
|
965 | 965 | if value is not None: |
|
966 | 966 | unbundler._compressed = True |
|
967 | 967 | |
|
968 | 968 | |
|
969 | 969 | class bundlepart(object): |
|
970 | 970 | """A bundle2 part contains application level payload |
|
971 | 971 | |
|
972 | 972 | The part `type` is used to route the part to the application level |
|
973 | 973 | handler. |
|
974 | 974 | |
|
975 | 975 | The part payload is contained in ``part.data``. It could be raw bytes or a |
|
976 | 976 | generator of byte chunks. |
|
977 | 977 | |
|
978 | 978 | You can add parameters to the part using the ``addparam`` method. |
|
979 | 979 | Parameters can be either mandatory (default) or advisory. Remote side |
|
980 | 980 | should be able to safely ignore the advisory ones. |
|
981 | 981 | |
|
982 | 982 | Neither data nor parameters can be modified after the generation has begun.
|
983 | 983 | """ |
|
984 | 984 | |
|
985 | 985 | def __init__( |
|
986 | 986 | self, |
|
987 | 987 | parttype, |
|
988 | 988 | mandatoryparams=(), |
|
989 | 989 | advisoryparams=(), |
|
990 | 990 | data=b'', |
|
991 | 991 | mandatory=True, |
|
992 | 992 | ): |
|
993 | 993 | validateparttype(parttype) |
|
994 | 994 | self.id = None |
|
995 | 995 | self.type = parttype |
|
996 | 996 | self._data = data |
|
997 | 997 | self._mandatoryparams = list(mandatoryparams) |
|
998 | 998 | self._advisoryparams = list(advisoryparams) |
|
999 | 999 | # checking for duplicated entries |
|
1000 | 1000 | self._seenparams = set() |
|
1001 | 1001 | for pname, __ in self._mandatoryparams + self._advisoryparams: |
|
1002 | 1002 | if pname in self._seenparams: |
|
1003 | 1003 | raise error.ProgrammingError(b'duplicated params: %s' % pname) |
|
1004 | 1004 | self._seenparams.add(pname) |
|
1005 | 1005 | # status of the part's generation: |
|
1006 | 1006 | # - None: not started, |
|
1007 | 1007 | # - False: currently generated, |
|
1008 | 1008 | # - True: generation done. |
|
1009 | 1009 | self._generated = None |
|
1010 | 1010 | self.mandatory = mandatory |
|
1011 | 1011 | |
|
1012 | 1012 | def __repr__(self): |
|
1013 | 1013 | cls = b"%s.%s" % (self.__class__.__module__, self.__class__.__name__) |
|
1014 | 1014 | return b'<%s object at %x; id: %s; type: %s; mandatory: %s>' % ( |
|
1015 | 1015 | cls, |
|
1016 | 1016 | id(self), |
|
1017 | 1017 | self.id, |
|
1018 | 1018 | self.type, |
|
1019 | 1019 | self.mandatory, |
|
1020 | 1020 | ) |
|
1021 | 1021 | |
|
1022 | 1022 | def copy(self): |
|
1023 | 1023 | """return a copy of the part |
|
1024 | 1024 | |
|
1025 | 1025 | The new part has the very same content but no partid assigned yet.
|
1026 | 1026 | Parts with generated data cannot be copied."""

1027 | 1027 | assert not util.safehasattr(self.data, 'next')

1028 | 1028 | return self.__class__(
|
1029 | 1029 | self.type, |
|
1030 | 1030 | self._mandatoryparams, |
|
1031 | 1031 | self._advisoryparams, |
|
1032 | 1032 | self._data, |
|
1033 | 1033 | self.mandatory, |
|
1034 | 1034 | ) |
|
1035 | 1035 | |
|
1036 | 1036 | # methods used to define the part content
|
1037 | 1037 | @property |
|
1038 | 1038 | def data(self): |
|
1039 | 1039 | return self._data |
|
1040 | 1040 | |
|
1041 | 1041 | @data.setter |
|
1042 | 1042 | def data(self, data): |
|
1043 | 1043 | if self._generated is not None: |
|
1044 | 1044 | raise error.ReadOnlyPartError(b'part is being generated') |
|
1045 | 1045 | self._data = data |
|
1046 | 1046 | |
|
1047 | 1047 | @property |
|
1048 | 1048 | def mandatoryparams(self): |
|
1049 | 1049 | # make it an immutable tuple to force people through ``addparam`` |
|
1050 | 1050 | return tuple(self._mandatoryparams) |
|
1051 | 1051 | |
|
1052 | 1052 | @property |
|
1053 | 1053 | def advisoryparams(self): |
|
1054 | 1054 | # make it an immutable tuple to force people through ``addparam`` |
|
1055 | 1055 | return tuple(self._advisoryparams) |
|
1056 | 1056 | |
|
1057 | 1057 | def addparam(self, name, value=b'', mandatory=True): |
|
1058 | 1058 | """add a parameter to the part |
|
1059 | 1059 | |
|
1060 | 1060 | If 'mandatory' is set to True, the remote handler must claim support |
|
1061 | 1061 | for this parameter or the unbundling will be aborted. |
|
1062 | 1062 | |
|
1063 | 1063 | The 'name' and 'value' cannot exceed 255 bytes each. |
|
1064 | 1064 | """ |
|
1065 | 1065 | if self._generated is not None: |
|
1066 | 1066 | raise error.ReadOnlyPartError(b'part is being generated') |
|
1067 | 1067 | if name in self._seenparams: |
|
1068 | 1068 | raise ValueError(b'duplicated params: %s' % name) |
|
1069 | 1069 | self._seenparams.add(name) |
|
1070 | 1070 | params = self._advisoryparams |
|
1071 | 1071 | if mandatory: |
|
1072 | 1072 | params = self._mandatoryparams |
|
1073 | 1073 | params.append((name, value)) |
|
1074 | 1074 | |
|
1075 | 1075 | # methods used to generate the bundle2 stream
|
1076 | 1076 | def getchunks(self, ui): |
|
1077 | 1077 | if self._generated is not None: |
|
1078 | 1078 | raise error.ProgrammingError(b'part can only be consumed once') |
|
1079 | 1079 | self._generated = False |
|
1080 | 1080 | |
|
1081 | 1081 | if ui.debugflag: |
|
1082 | 1082 | msg = [b'bundle2-output-part: "%s"' % self.type] |
|
1083 | 1083 | if not self.mandatory: |
|
1084 | 1084 | msg.append(b' (advisory)') |
|
1085 | 1085 | nbmp = len(self.mandatoryparams) |
|
1086 | 1086 | nbap = len(self.advisoryparams) |
|
1087 | 1087 | if nbmp or nbap: |
|
1088 | 1088 | msg.append(b' (params:') |
|
1089 | 1089 | if nbmp: |
|
1090 | 1090 | msg.append(b' %i mandatory' % nbmp) |
|
1091 | 1091 | if nbap: |
|
1092 | 1092 | msg.append(b' %i advisory' % nbap)
|
1093 | 1093 | msg.append(b')') |
|
1094 | 1094 | if not self.data: |
|
1095 | 1095 | msg.append(b' empty payload')

1096 | 1096 | elif util.safehasattr(self.data, 'next') or util.safehasattr(

1097 | 1097 | self.data, b'__next__'
|
1098 | 1098 | ): |
|
1099 | 1099 | msg.append(b' streamed payload') |
|
1100 | 1100 | else: |
|
1101 | 1101 | msg.append(b' %i bytes payload' % len(self.data)) |
|
1102 | 1102 | msg.append(b'\n') |
|
1103 | 1103 | ui.debug(b''.join(msg)) |
|
1104 | 1104 | |
|
1105 | 1105 | #### header |
|
1106 | 1106 | if self.mandatory: |
|
1107 | 1107 | parttype = self.type.upper() |
|
1108 | 1108 | else: |
|
1109 | 1109 | parttype = self.type.lower() |
|
1110 | 1110 | outdebug(ui, b'part %s: "%s"' % (pycompat.bytestr(self.id), parttype)) |
|
1111 | 1111 | ## parttype |
|
1112 | 1112 | header = [ |
|
1113 | 1113 | _pack(_fparttypesize, len(parttype)), |
|
1114 | 1114 | parttype, |
|
1115 | 1115 | _pack(_fpartid, self.id), |
|
1116 | 1116 | ] |
|
1117 | 1117 | ## parameters |
|
1118 | 1118 | # count |
|
1119 | 1119 | manpar = self.mandatoryparams |
|
1120 | 1120 | advpar = self.advisoryparams |
|
1121 | 1121 | header.append(_pack(_fpartparamcount, len(manpar), len(advpar))) |
|
1122 | 1122 | # size |
|
1123 | 1123 | parsizes = [] |
|
1124 | 1124 | for key, value in manpar: |
|
1125 | 1125 | parsizes.append(len(key)) |
|
1126 | 1126 | parsizes.append(len(value)) |
|
1127 | 1127 | for key, value in advpar: |
|
1128 | 1128 | parsizes.append(len(key)) |
|
1129 | 1129 | parsizes.append(len(value)) |
|
1130 | 1130 | paramsizes = _pack(_makefpartparamsizes(len(parsizes) // 2), *parsizes) |
|
1131 | 1131 | header.append(paramsizes) |
|
1132 | 1132 | # key, value |
|
1133 | 1133 | for key, value in manpar: |
|
1134 | 1134 | header.append(key) |
|
1135 | 1135 | header.append(value) |
|
1136 | 1136 | for key, value in advpar: |
|
1137 | 1137 | header.append(key) |
|
1138 | 1138 | header.append(value) |
|
1139 | 1139 | ## finalize header |
|
1140 | 1140 | try: |
|
1141 | 1141 | headerchunk = b''.join(header) |
|
1142 | 1142 | except TypeError: |
|
1143 | 1143 | raise TypeError( |
|
1144 | 1144 | r'Found a non-bytes trying to ' |
|
1145 | 1145 | r'build bundle part header: %r' % header |
|
1146 | 1146 | ) |
|
1147 | 1147 | outdebug(ui, b'header chunk size: %i' % len(headerchunk)) |
|
1148 | 1148 | yield _pack(_fpartheadersize, len(headerchunk)) |
|
1149 | 1149 | yield headerchunk |
|
1150 | 1150 | ## payload |
|
1151 | 1151 | try: |
|
1152 | 1152 | for chunk in self._payloadchunks(): |
|
1153 | 1153 | outdebug(ui, b'payload chunk size: %i' % len(chunk)) |
|
1154 | 1154 | yield _pack(_fpayloadsize, len(chunk)) |
|
1155 | 1155 | yield chunk |
|
1156 | 1156 | except GeneratorExit: |
|
1157 | 1157 | # GeneratorExit means that nobody is listening for our |
|
1158 | 1158 | # results anyway, so just bail quickly rather than trying |
|
1159 | 1159 | # to produce an error part. |
|
1160 | 1160 | ui.debug(b'bundle2-generatorexit\n') |
|
1161 | 1161 | raise |
|
1162 | 1162 | except BaseException as exc: |
|
1163 | 1163 | bexc = stringutil.forcebytestr(exc) |
|
1164 | 1164 | # backup exception data for later |
|
1165 | 1165 | ui.debug( |
|
1166 | 1166 | b'bundle2-input-stream-interrupt: encoding exception %s' % bexc |
|
1167 | 1167 | ) |
|
1168 | 1168 | tb = sys.exc_info()[2] |
|
1169 | 1169 | msg = b'unexpected error: %s' % bexc |
|
1170 | 1170 | interpart = bundlepart( |
|
1171 | 1171 | b'error:abort', [(b'message', msg)], mandatory=False |
|
1172 | 1172 | ) |
|
1173 | 1173 | interpart.id = 0 |
|
1174 | 1174 | yield _pack(_fpayloadsize, -1) |
|
1175 | 1175 | for chunk in interpart.getchunks(ui=ui): |
|
1176 | 1176 | yield chunk |
|
1177 | 1177 | outdebug(ui, b'closing payload chunk') |
|
1178 | 1178 | # abort current part payload |
|
1179 | 1179 | yield _pack(_fpayloadsize, 0) |
|
1180 | 1180 | pycompat.raisewithtb(exc, tb) |
|
1181 | 1181 | # end of payload |
|
1182 | 1182 | outdebug(ui, b'closing payload chunk') |
|
1183 | 1183 | yield _pack(_fpayloadsize, 0) |
|
1184 | 1184 | self._generated = True |
|
1185 | 1185 | |
|
1186 | 1186 | def _payloadchunks(self): |
|
1187 | 1187 | """yield chunks of a the part payload |
|
1188 | 1188 | |
|
1189 | 1189 | Exists to handle the different methods to provide data to a part.""" |
|
1190 | 1190 | # we only support fixed size data now. |
|
1191 | 1191 | # This will be improved in the future.

1192 | 1192 | if util.safehasattr(self.data, 'next') or util.safehasattr(

1193 | 1193 | self.data, b'__next__'
|
1194 | 1194 | ): |
|
1195 | 1195 | buff = util.chunkbuffer(self.data) |
|
1196 | 1196 | chunk = buff.read(preferedchunksize) |
|
1197 | 1197 | while chunk: |
|
1198 | 1198 | yield chunk |
|
1199 | 1199 | chunk = buff.read(preferedchunksize) |
|
1200 | 1200 | elif len(self.data): |
|
1201 | 1201 | yield self.data |
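An illustrative sketch (not part of the module) of using bundlepart directly; normally bundle20.addpart()/newpart() assigns the id, so setting it by hand here is only for the standalone example.

from mercurial import bundle2, ui as uimod

ui = uimod.ui.load()
part = bundle2.bundlepart(b'output', data=b'standalone payload', mandatory=False)
part.addparam(b'in-reply-to', b'0', mandatory=False)
part.id = 0                              # normally set by bundle20.addpart()
frames = b''.join(part.getchunks(ui=ui))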
|
1202 | 1202 | |
|
1203 | 1203 | |
|
1204 | 1204 | flaginterrupt = -1 |
|
1205 | 1205 | |
|
1206 | 1206 | |
|
1207 | 1207 | class interrupthandler(unpackermixin): |
|
1208 | 1208 | """read one part and process it with restricted capability |
|
1209 | 1209 | |
|
1210 | 1210 | This allows transmitting exceptions raised on the producer side during part
|
1211 | 1211 | iteration while the consumer is reading a part. |
|
1212 | 1212 | |
|
1213 | 1213 | Parts processed in this manner only have access to a ui object."""
|
1214 | 1214 | |
|
1215 | 1215 | def __init__(self, ui, fp): |
|
1216 | 1216 | super(interrupthandler, self).__init__(fp) |
|
1217 | 1217 | self.ui = ui |
|
1218 | 1218 | |
|
1219 | 1219 | def _readpartheader(self): |
|
1220 | 1220 | """reads a part header size and return the bytes blob |
|
1221 | 1221 | |
|
1222 | 1222 | returns None if empty""" |
|
1223 | 1223 | headersize = self._unpack(_fpartheadersize)[0] |
|
1224 | 1224 | if headersize < 0: |
|
1225 | 1225 | raise error.BundleValueError( |
|
1226 | 1226 | b'negative part header size: %i' % headersize |
|
1227 | 1227 | ) |
|
1228 | 1228 | indebug(self.ui, b'part header size: %i\n' % headersize) |
|
1229 | 1229 | if headersize: |
|
1230 | 1230 | return self._readexact(headersize) |
|
1231 | 1231 | return None |
|
1232 | 1232 | |
|
1233 | 1233 | def __call__(self): |
|
1234 | 1234 | |
|
1235 | 1235 | self.ui.debug( |
|
1236 | 1236 | b'bundle2-input-stream-interrupt:' b' opening out of band context\n' |
|
1237 | 1237 | ) |
|
1238 | 1238 | indebug(self.ui, b'bundle2 stream interruption, looking for a part.') |
|
1239 | 1239 | headerblock = self._readpartheader() |
|
1240 | 1240 | if headerblock is None: |
|
1241 | 1241 | indebug(self.ui, b'no part found during interruption.') |
|
1242 | 1242 | return |
|
1243 | 1243 | part = unbundlepart(self.ui, headerblock, self._fp) |
|
1244 | 1244 | op = interruptoperation(self.ui) |
|
1245 | 1245 | hardabort = False |
|
1246 | 1246 | try: |
|
1247 | 1247 | _processpart(op, part) |
|
1248 | 1248 | except (SystemExit, KeyboardInterrupt): |
|
1249 | 1249 | hardabort = True |
|
1250 | 1250 | raise |
|
1251 | 1251 | finally: |
|
1252 | 1252 | if not hardabort: |
|
1253 | 1253 | part.consume() |
|
1254 | 1254 | self.ui.debug( |
|
1255 | 1255 | b'bundle2-input-stream-interrupt:' b' closing out of band context\n' |
|
1256 | 1256 | ) |
|
1257 | 1257 | |
|
1258 | 1258 | |
|
1259 | 1259 | class interruptoperation(object): |
|
1260 | 1260 | """A limited operation to be use by part handler during interruption |
|
1261 | 1261 | |
|
1262 | 1262 | It only has access to a ui object.
|
1263 | 1263 | """ |
|
1264 | 1264 | |
|
1265 | 1265 | def __init__(self, ui): |
|
1266 | 1266 | self.ui = ui |
|
1267 | 1267 | self.reply = None |
|
1268 | 1268 | self.captureoutput = False |
|
1269 | 1269 | |
|
1270 | 1270 | @property |
|
1271 | 1271 | def repo(self): |
|
1272 | 1272 | raise error.ProgrammingError(b'no repo access from stream interruption') |
|
1273 | 1273 | |
|
1274 | 1274 | def gettransaction(self): |
|
1275 | 1275 | raise TransactionUnavailable(b'no repo access from stream interruption') |
|
1276 | 1276 | |
|
1277 | 1277 | |
|
1278 | 1278 | def decodepayloadchunks(ui, fh): |
|
1279 | 1279 | """Reads bundle2 part payload data into chunks. |
|
1280 | 1280 | |
|
1281 | 1281 | Part payload data consists of framed chunks. This function takes |
|
1282 | 1282 | a file handle and emits those chunks. |
|
1283 | 1283 | """ |
|
1284 | 1284 | dolog = ui.configbool(b'devel', b'bundle2.debug') |
|
1285 | 1285 | debug = ui.debug |
|
1286 | 1286 | |
|
1287 | 1287 | headerstruct = struct.Struct(_fpayloadsize) |
|
1288 | 1288 | headersize = headerstruct.size |
|
1289 | 1289 | unpack = headerstruct.unpack |
|
1290 | 1290 | |
|
1291 | 1291 | readexactly = changegroup.readexactly |
|
1292 | 1292 | read = fh.read |
|
1293 | 1293 | |
|
1294 | 1294 | chunksize = unpack(readexactly(fh, headersize))[0] |
|
1295 | 1295 | indebug(ui, b'payload chunk size: %i' % chunksize) |
|
1296 | 1296 | |
|
1297 | 1297 | # changegroup.readexactly() is inlined below for performance. |
|
1298 | 1298 | while chunksize: |
|
1299 | 1299 | if chunksize >= 0: |
|
1300 | 1300 | s = read(chunksize) |
|
1301 | 1301 | if len(s) < chunksize: |
|
1302 | 1302 | raise error.Abort( |
|
1303 | 1303 | _( |
|
1304 | 1304 | b'stream ended unexpectedly ' |
|
1305 | 1305 | b' (got %d bytes, expected %d)' |
|
1306 | 1306 | ) |
|
1307 | 1307 | % (len(s), chunksize) |
|
1308 | 1308 | ) |
|
1309 | 1309 | |
|
1310 | 1310 | yield s |
|
1311 | 1311 | elif chunksize == flaginterrupt: |
|
1312 | 1312 | # Interrupt "signal" detected. The regular stream is interrupted |
|
1313 | 1313 | # and a bundle2 part follows. Consume it. |
|
1314 | 1314 | interrupthandler(ui, fh)() |
|
1315 | 1315 | else: |
|
1316 | 1316 | raise error.BundleValueError( |
|
1317 | 1317 | b'negative payload chunk size: %s' % chunksize |
|
1318 | 1318 | ) |
|
1319 | 1319 | |
|
1320 | 1320 | s = read(headersize) |
|
1321 | 1321 | if len(s) < headersize: |
|
1322 | 1322 | raise error.Abort( |
|
1323 | 1323 | _(b'stream ended unexpectedly ' b' (got %d bytes, expected %d)') |
|
1324 | 1324 | % (len(s), headersize)
|
1325 | 1325 | ) |
|
1326 | 1326 | |
|
1327 | 1327 | chunksize = unpack(s)[0] |
|
1328 | 1328 | |
|
1329 | 1329 | # indebug() inlined for performance. |
|
1330 | 1330 | if dolog: |
|
1331 | 1331 | debug(b'bundle2-input: payload chunk size: %i\n' % chunksize) |
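The framing consumed above can be pictured with a hand-built payload; this sketch is illustrative only and assumes the size header is a big-endian int32, mirroring _fpayloadsize.

import struct

# one 5-byte chunk, one 6-byte chunk, then a size of 0 closing the payload;
# a size of -1 (flaginterrupt) would announce an out-of-band interrupt part
payload = b''.join([
    struct.pack('>i', 5), b'hello',
    struct.pack('>i', 6), b' world',
    struct.pack('>i', 0),
])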
|
1332 | 1332 | |
|
1333 | 1333 | |
|
1334 | 1334 | class unbundlepart(unpackermixin): |
|
1335 | 1335 | """a bundle part read from a bundle""" |
|
1336 | 1336 | |
|
1337 | 1337 | def __init__(self, ui, header, fp): |
|
1338 | 1338 | super(unbundlepart, self).__init__(fp)

1339 | 1339 | self._seekable = util.safehasattr(fp, 'seek') and util.safehasattr(

1340 | 1340 | fp, b'tell'
|
1341 | 1341 | ) |
|
1342 | 1342 | self.ui = ui |
|
1343 | 1343 | # unbundle state attr |
|
1344 | 1344 | self._headerdata = header |
|
1345 | 1345 | self._headeroffset = 0 |
|
1346 | 1346 | self._initialized = False |
|
1347 | 1347 | self.consumed = False |
|
1348 | 1348 | # part data |
|
1349 | 1349 | self.id = None |
|
1350 | 1350 | self.type = None |
|
1351 | 1351 | self.mandatoryparams = None |
|
1352 | 1352 | self.advisoryparams = None |
|
1353 | 1353 | self.params = None |
|
1354 | 1354 | self.mandatorykeys = () |
|
1355 | 1355 | self._readheader() |
|
1356 | 1356 | self._mandatory = None |
|
1357 | 1357 | self._pos = 0 |
|
1358 | 1358 | |
|
1359 | 1359 | def _fromheader(self, size): |
|
1360 | 1360 | """return the next <size> byte from the header""" |
|
1361 | 1361 | offset = self._headeroffset |
|
1362 | 1362 | data = self._headerdata[offset : (offset + size)] |
|
1363 | 1363 | self._headeroffset = offset + size |
|
1364 | 1364 | return data |
|
1365 | 1365 | |
|
1366 | 1366 | def _unpackheader(self, format): |
|
1367 | 1367 | """read given format from header |
|
1368 | 1368 | |
|
1369 | 1369 | This automatically computes the size of the format to read."""
|
1370 | 1370 | data = self._fromheader(struct.calcsize(format)) |
|
1371 | 1371 | return _unpack(format, data) |
|
1372 | 1372 | |
|
1373 | 1373 | def _initparams(self, mandatoryparams, advisoryparams): |
|
1374 | 1374 | """internal function to setup all logic related parameters""" |
|
1375 | 1375 | # make it read only to prevent people touching it by mistake. |
|
1376 | 1376 | self.mandatoryparams = tuple(mandatoryparams) |
|
1377 | 1377 | self.advisoryparams = tuple(advisoryparams) |
|
1378 | 1378 | # user friendly UI |
|
1379 | 1379 | self.params = util.sortdict(self.mandatoryparams) |
|
1380 | 1380 | self.params.update(self.advisoryparams) |
|
1381 | 1381 | self.mandatorykeys = frozenset(p[0] for p in mandatoryparams) |
|
1382 | 1382 | |
|
1383 | 1383 | def _readheader(self): |
|
1384 | 1384 | """read the header and setup the object""" |
|
1385 | 1385 | typesize = self._unpackheader(_fparttypesize)[0] |
|
1386 | 1386 | self.type = self._fromheader(typesize) |
|
1387 | 1387 | indebug(self.ui, b'part type: "%s"' % self.type) |
|
1388 | 1388 | self.id = self._unpackheader(_fpartid)[0] |
|
1389 | 1389 | indebug(self.ui, b'part id: "%s"' % pycompat.bytestr(self.id)) |
|
1390 | 1390 | # extract mandatory bit from type |
|
1391 | 1391 | self.mandatory = self.type != self.type.lower() |
|
1392 | 1392 | self.type = self.type.lower() |
|
1393 | 1393 | ## reading parameters |
|
1394 | 1394 | # param count |
|
1395 | 1395 | mancount, advcount = self._unpackheader(_fpartparamcount) |
|
1396 | 1396 | indebug(self.ui, b'part parameters: %i' % (mancount + advcount)) |
|
1397 | 1397 | # param size |
|
1398 | 1398 | fparamsizes = _makefpartparamsizes(mancount + advcount) |
|
1399 | 1399 | paramsizes = self._unpackheader(fparamsizes) |
|
1400 | 1400 | # make it a list of pairs again
|
1401 | 1401 | paramsizes = list(zip(paramsizes[::2], paramsizes[1::2])) |
|
1402 | 1402 | # split mandatory from advisory |
|
1403 | 1403 | mansizes = paramsizes[:mancount] |
|
1404 | 1404 | advsizes = paramsizes[mancount:] |
|
1405 | 1405 | # retrieve param value |
|
1406 | 1406 | manparams = [] |
|
1407 | 1407 | for key, value in mansizes: |
|
1408 | 1408 | manparams.append((self._fromheader(key), self._fromheader(value))) |
|
1409 | 1409 | advparams = [] |
|
1410 | 1410 | for key, value in advsizes: |
|
1411 | 1411 | advparams.append((self._fromheader(key), self._fromheader(value))) |
|
1412 | 1412 | self._initparams(manparams, advparams) |
|
1413 | 1413 | ## part payload |
|
1414 | 1414 | self._payloadstream = util.chunkbuffer(self._payloadchunks()) |
|
1415 | 1415 | # we read the data, tell it |
|
1416 | 1416 | self._initialized = True |
|
1417 | 1417 | |
|
1418 | 1418 | def _payloadchunks(self): |
|
1419 | 1419 | """Generator of decoded chunks in the payload.""" |
|
1420 | 1420 | return decodepayloadchunks(self.ui, self._fp) |
|
1421 | 1421 | |
|
1422 | 1422 | def consume(self): |
|
1423 | 1423 | """Read the part payload until completion. |
|
1424 | 1424 | |
|
1425 | 1425 | By consuming the part data, the underlying stream read offset will |
|
1426 | 1426 | be advanced to the next part (or end of stream). |
|
1427 | 1427 | """ |
|
1428 | 1428 | if self.consumed: |
|
1429 | 1429 | return |
|
1430 | 1430 | |
|
1431 | 1431 | chunk = self.read(32768) |
|
1432 | 1432 | while chunk: |
|
1433 | 1433 | self._pos += len(chunk) |
|
1434 | 1434 | chunk = self.read(32768) |
|
1435 | 1435 | |
|
1436 | 1436 | def read(self, size=None): |
|
1437 | 1437 | """read payload data""" |
|
1438 | 1438 | if not self._initialized: |
|
1439 | 1439 | self._readheader() |
|
1440 | 1440 | if size is None: |
|
1441 | 1441 | data = self._payloadstream.read() |
|
1442 | 1442 | else: |
|
1443 | 1443 | data = self._payloadstream.read(size) |
|
1444 | 1444 | self._pos += len(data) |
|
1445 | 1445 | if size is None or len(data) < size: |
|
1446 | 1446 | if not self.consumed and self._pos: |
|
1447 | 1447 | self.ui.debug( |
|
1448 | 1448 | b'bundle2-input-part: total payload size %i\n' % self._pos |
|
1449 | 1449 | ) |
|
1450 | 1450 | self.consumed = True |
|
1451 | 1451 | return data |
|
1452 | 1452 | |
|
1453 | 1453 | |
|
1454 | 1454 | class seekableunbundlepart(unbundlepart): |
|
1455 | 1455 | """A bundle2 part in a bundle that is seekable. |
|
1456 | 1456 | |
|
1457 | 1457 | Regular ``unbundlepart`` instances can only be read once. This class |
|
1458 | 1458 | extends ``unbundlepart`` to enable bi-directional seeking within the |
|
1459 | 1459 | part. |
|
1460 | 1460 | |
|
1461 | 1461 | Bundle2 part data consists of framed chunks. Offsets when seeking |
|
1462 | 1462 | refer to the decoded data, not the offsets in the underlying bundle2 |
|
1463 | 1463 | stream. |
|
1464 | 1464 | |
|
1465 | 1465 | To facilitate quickly seeking within the decoded data, instances of this |
|
1466 | 1466 | class maintain a mapping between offsets in the underlying stream and |
|
1467 | 1467 | the decoded payload. This mapping will consume memory in proportion |
|
1468 | 1468 | to the number of chunks within the payload (which almost certainly |
|
1469 | 1469 | increases in proportion with the size of the part). |
|
1470 | 1470 | """ |
|
1471 | 1471 | |
|
1472 | 1472 | def __init__(self, ui, header, fp): |
|
1473 | 1473 | # (payload, file) offsets for chunk starts. |
|
1474 | 1474 | self._chunkindex = [] |
|
1475 | 1475 | |
|
1476 | 1476 | super(seekableunbundlepart, self).__init__(ui, header, fp) |
|
1477 | 1477 | |
|
1478 | 1478 | def _payloadchunks(self, chunknum=0): |
|
1479 | 1479 | '''seek to specified chunk and start yielding data''' |
|
1480 | 1480 | if len(self._chunkindex) == 0: |
|
1481 | 1481 | assert chunknum == 0, b'Must start with chunk 0' |
|
1482 | 1482 | self._chunkindex.append((0, self._tellfp())) |
|
1483 | 1483 | else: |
|
1484 | 1484 | assert chunknum < len(self._chunkindex), ( |
|
1485 | 1485 | b'Unknown chunk %d' % chunknum |
|
1486 | 1486 | ) |
|
1487 | 1487 | self._seekfp(self._chunkindex[chunknum][1]) |
|
1488 | 1488 | |
|
1489 | 1489 | pos = self._chunkindex[chunknum][0] |
|
1490 | 1490 | |
|
1491 | 1491 | for chunk in decodepayloadchunks(self.ui, self._fp): |
|
1492 | 1492 | chunknum += 1 |
|
1493 | 1493 | pos += len(chunk) |
|
1494 | 1494 | if chunknum == len(self._chunkindex): |
|
1495 | 1495 | self._chunkindex.append((pos, self._tellfp())) |
|
1496 | 1496 | |
|
1497 | 1497 | yield chunk |
|
1498 | 1498 | |
|
1499 | 1499 | def _findchunk(self, pos): |
|
1500 | 1500 | '''for a given payload position, return a chunk number and offset''' |
|
1501 | 1501 | for chunk, (ppos, fpos) in enumerate(self._chunkindex): |
|
1502 | 1502 | if ppos == pos: |
|
1503 | 1503 | return chunk, 0 |
|
1504 | 1504 | elif ppos > pos: |
|
1505 | 1505 | return chunk - 1, pos - self._chunkindex[chunk - 1][0] |
|
1506 | 1506 | raise ValueError(b'Unknown chunk') |
|
1507 | 1507 | |
|
1508 | 1508 | def tell(self): |
|
1509 | 1509 | return self._pos |
|
1510 | 1510 | |
|
1511 | 1511 | def seek(self, offset, whence=os.SEEK_SET): |
|
1512 | 1512 | if whence == os.SEEK_SET: |
|
1513 | 1513 | newpos = offset |
|
1514 | 1514 | elif whence == os.SEEK_CUR: |
|
1515 | 1515 | newpos = self._pos + offset |
|
1516 | 1516 | elif whence == os.SEEK_END: |
|
1517 | 1517 | if not self.consumed: |
|
1518 | 1518 | # Can't use self.consume() here because it advances self._pos. |
|
1519 | 1519 | chunk = self.read(32768) |
|
1520 | 1520 | while chunk: |
|
1521 | 1521 | chunk = self.read(32768) |
|
1522 | 1522 | newpos = self._chunkindex[-1][0] - offset |
|
1523 | 1523 | else: |
|
1524 | 1524 | raise ValueError(b'Unknown whence value: %r' % (whence,)) |
|
1525 | 1525 | |
|
1526 | 1526 | if newpos > self._chunkindex[-1][0] and not self.consumed: |
|
1527 | 1527 | # Can't use self.consume() here because it advances self._pos. |
|
1528 | 1528 | chunk = self.read(32768) |
|
1529 | 1529 | while chunk: |
|
1530 | 1530 | chunk = self.read(32768)
|
1531 | 1531 | |
|
1532 | 1532 | if not 0 <= newpos <= self._chunkindex[-1][0]: |
|
1533 | 1533 | raise ValueError(b'Offset out of range') |
|
1534 | 1534 | |
|
1535 | 1535 | if self._pos != newpos: |
|
1536 | 1536 | chunk, internaloffset = self._findchunk(newpos) |
|
1537 | 1537 | self._payloadstream = util.chunkbuffer(self._payloadchunks(chunk)) |
|
1538 | 1538 | adjust = self.read(internaloffset) |
|
1539 | 1539 | if len(adjust) != internaloffset: |
|
1540 | 1540 | raise error.Abort(_(b'Seek failed\n')) |
|
1541 | 1541 | self._pos = newpos |
|
1542 | 1542 | |
|
1543 | 1543 | def _seekfp(self, offset, whence=0): |
|
1544 | 1544 | """move the underlying file pointer |
|
1545 | 1545 | |
|
1546 | 1546 | This method is meant for internal usage by the bundle2 protocol only. |
|
1547 | 1547 | It directly manipulates the low level stream, including bundle2 level

1548 | 1548 | instructions.
|
1549 | 1549 | |
|
1550 | 1550 | Do not use it to implement higher-level logic or methods.""" |
|
1551 | 1551 | if self._seekable: |
|
1552 | 1552 | return self._fp.seek(offset, whence) |
|
1553 | 1553 | else: |
|
1554 | 1554 | raise NotImplementedError(_(b'File pointer is not seekable')) |
|
1555 | 1555 | |
|
1556 | 1556 | def _tellfp(self): |
|
1557 | 1557 | """return the file offset, or None if file is not seekable |
|
1558 | 1558 | |
|
1559 | 1559 | This method is meant for internal usage by the bundle2 protocol only. |
|
1560 | 1560 | It directly manipulates the low level stream, including bundle2 level

1561 | 1561 | instructions.
|
1562 | 1562 | |
|
1563 | 1563 | Do not use it to implement higher-level logic or methods.""" |
|
1564 | 1564 | if self._seekable: |
|
1565 | 1565 | try: |
|
1566 | 1566 | return self._fp.tell() |
|
1567 | 1567 | except IOError as e: |
|
1568 | 1568 | if e.errno == errno.ESPIPE: |
|
1569 | 1569 | self._seekable = False |
|
1570 | 1570 | else: |
|
1571 | 1571 | raise |
|
1572 | 1572 | return None |
|
1573 | 1573 | |
|
1574 | 1574 | |
|
1575 | 1575 | # These are only the static capabilities. |
|
1576 | 1576 | # Check the 'getrepocaps' function for the rest. |
|
1577 | 1577 | capabilities = { |
|
1578 | 1578 | b'HG20': (), |
|
1579 | 1579 | b'bookmarks': (), |
|
1580 | 1580 | b'error': (b'abort', b'unsupportedcontent', b'pushraced', b'pushkey'), |
|
1581 | 1581 | b'listkeys': (), |
|
1582 | 1582 | b'pushkey': (), |
|
1583 | 1583 | b'digests': tuple(sorted(util.DIGESTS.keys())), |
|
1584 | 1584 | b'remote-changegroup': (b'http', b'https'), |
|
1585 | 1585 | b'hgtagsfnodes': (), |
|
1586 | 1586 | b'rev-branch-cache': (), |
|
1587 | 1587 | b'phases': (b'heads',), |
|
1588 | 1588 | b'stream': (b'v2',), |
|
1589 | 1589 | } |
|
1590 | 1590 | |
|
1591 | 1591 | |
|
1592 | 1592 | def getrepocaps(repo, allowpushback=False, role=None): |
|
1593 | 1593 | """return the bundle2 capabilities for a given repo |
|
1594 | 1594 | |
|
1595 | 1595 | Exists to allow extensions (like evolution) to mutate the capabilities. |
|
1596 | 1596 | |
|
1597 | 1597 | The returned value is used for servers advertising their capabilities as |
|
1598 | 1598 | well as clients advertising their capabilities to servers as part of |
|
1599 | 1599 | bundle2 requests. The ``role`` argument specifies which is which. |
|
1600 | 1600 | """ |
|
1601 | 1601 | if role not in (b'client', b'server'): |
|
1602 | 1602 | raise error.ProgrammingError(b'role argument must be client or server') |
|
1603 | 1603 | |
|
1604 | 1604 | caps = capabilities.copy() |
|
1605 | 1605 | caps[b'changegroup'] = tuple( |
|
1606 | 1606 | sorted(changegroup.supportedincomingversions(repo)) |
|
1607 | 1607 | ) |
|
1608 | 1608 | if obsolete.isenabled(repo, obsolete.exchangeopt): |
|
1609 | 1609 | supportedformat = tuple(b'V%i' % v for v in obsolete.formats) |
|
1610 | 1610 | caps[b'obsmarkers'] = supportedformat |
|
1611 | 1611 | if allowpushback: |
|
1612 | 1612 | caps[b'pushback'] = () |
|
1613 | 1613 | cpmode = repo.ui.config(b'server', b'concurrent-push-mode') |
|
1614 | 1614 | if cpmode == b'check-related': |
|
1615 | 1615 | caps[b'checkheads'] = (b'related',) |
|
1616 | 1616 | if b'phases' in repo.ui.configlist(b'devel', b'legacy.exchange'): |
|
1617 | 1617 | caps.pop(b'phases') |
|
1618 | 1618 | |
|
1619 | 1619 | # Don't advertise stream clone support in server mode if not configured. |
|
1620 | 1620 | if role == b'server': |
|
1621 | 1621 | streamsupported = repo.ui.configbool( |
|
1622 | 1622 | b'server', b'uncompressed', untrusted=True |
|
1623 | 1623 | ) |
|
1624 | 1624 | featuresupported = repo.ui.configbool(b'server', b'bundle2.stream') |
|
1625 | 1625 | |
|
1626 | 1626 | if not streamsupported or not featuresupported: |
|
1627 | 1627 | caps.pop(b'stream') |
|
1628 | 1628 | # Else always advertise support on client, because payload support |
|
1629 | 1629 | # should always be advertised. |
|
1630 | 1630 | |
|
1631 | 1631 | return caps |
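An illustrative call (not part of the module), assuming the current directory is a repository: the resulting dictionary is what encodecaps() turns into the wire blob.

from mercurial import bundle2, hg, ui as uimod

ui = uimod.ui.load()
repo = hg.repository(ui, b'.')
caps = bundle2.getrepocaps(repo, role=b'client')
blob = bundle2.encodecaps(caps)   # advertised to the other side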
|
1632 | 1632 | |
|
1633 | 1633 | |
|
1634 | 1634 | def bundle2caps(remote): |
|
1635 | 1635 | """return the bundle capabilities of a peer as dict""" |
|
1636 | 1636 | raw = remote.capable(b'bundle2') |
|
1637 | 1637 | if not raw and raw != b'': |
|
1638 | 1638 | return {} |
|
1639 | 1639 | capsblob = urlreq.unquote(remote.capable(b'bundle2')) |
|
1640 | 1640 | return decodecaps(capsblob) |
|
1641 | 1641 | |
|
1642 | 1642 | |
|
1643 | 1643 | def obsmarkersversion(caps): |
|
1644 | 1644 | """extract the list of supported obsmarkers versions from a bundle2caps dict |
|
1645 | 1645 | """ |
|
1646 | 1646 | obscaps = caps.get(b'obsmarkers', ()) |
|
1647 | 1647 | return [int(c[1:]) for c in obscaps if c.startswith(b'V')] |
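For example (illustrative only):

from mercurial import bundle2

versions = bundle2.obsmarkersversion({b'obsmarkers': [b'V0', b'V1']})
# versions == [0, 1]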
|
1648 | 1648 | |
|
1649 | 1649 | |
|
1650 | 1650 | def writenewbundle( |
|
1651 | 1651 | ui, |
|
1652 | 1652 | repo, |
|
1653 | 1653 | source, |
|
1654 | 1654 | filename, |
|
1655 | 1655 | bundletype, |
|
1656 | 1656 | outgoing, |
|
1657 | 1657 | opts, |
|
1658 | 1658 | vfs=None, |
|
1659 | 1659 | compression=None, |
|
1660 | 1660 | compopts=None, |
|
1661 | 1661 | ): |
|
1662 | 1662 | if bundletype.startswith(b'HG10'): |
|
1663 | 1663 | cg = changegroup.makechangegroup(repo, outgoing, b'01', source) |
|
1664 | 1664 | return writebundle( |
|
1665 | 1665 | ui, |
|
1666 | 1666 | cg, |
|
1667 | 1667 | filename, |
|
1668 | 1668 | bundletype, |
|
1669 | 1669 | vfs=vfs, |
|
1670 | 1670 | compression=compression, |
|
1671 | 1671 | compopts=compopts, |
|
1672 | 1672 | ) |
|
1673 | 1673 | elif not bundletype.startswith(b'HG20'): |
|
1674 | 1674 | raise error.ProgrammingError(b'unknown bundle type: %s' % bundletype) |
|
1675 | 1675 | |
|
1676 | 1676 | caps = {} |
|
1677 | 1677 | if b'obsolescence' in opts: |
|
1678 | 1678 | caps[b'obsmarkers'] = (b'V1',) |
|
1679 | 1679 | bundle = bundle20(ui, caps) |
|
1680 | 1680 | bundle.setcompression(compression, compopts) |
|
1681 | 1681 | _addpartsfromopts(ui, repo, bundle, source, outgoing, opts) |
|
1682 | 1682 | chunkiter = bundle.getchunks() |
|
1683 | 1683 | |
|
1684 | 1684 | return changegroup.writechunks(ui, chunkiter, filename, vfs=vfs) |
|
1685 | 1685 | |
|
1686 | 1686 | |
|
1687 | 1687 | def _addpartsfromopts(ui, repo, bundler, source, outgoing, opts): |
|
1688 | 1688 | # We should eventually reconcile this logic with the one behind |
|
1689 | 1689 | # 'exchange.getbundle2partsgenerator'. |
|
1690 | 1690 | # |
|
1691 | 1691 | # The type of input from 'getbundle' and 'writenewbundle' are a bit |
|
1692 | 1692 | # different right now. So we keep them separated for now for the sake of |
|
1693 | 1693 | # simplicity. |
|
1694 | 1694 | |
|
1695 | 1695 | # we might not always want a changegroup in such bundle, for example in |
|
1696 | 1696 | # stream bundles |
|
1697 | 1697 | if opts.get(b'changegroup', True): |
|
1698 | 1698 | cgversion = opts.get(b'cg.version') |
|
1699 | 1699 | if cgversion is None: |
|
1700 | 1700 | cgversion = changegroup.safeversion(repo) |
|
1701 | 1701 | cg = changegroup.makechangegroup(repo, outgoing, cgversion, source) |
|
1702 | 1702 | part = bundler.newpart(b'changegroup', data=cg.getchunks()) |
|
1703 | 1703 | part.addparam(b'version', cg.version) |
|
1704 | 1704 | if b'clcount' in cg.extras: |
|
1705 | 1705 | part.addparam( |
|
1706 | 1706 | b'nbchanges', b'%d' % cg.extras[b'clcount'], mandatory=False |
|
1707 | 1707 | ) |
|
1708 | 1708 | if opts.get(b'phases') and repo.revs( |
|
1709 | 1709 | b'%ln and secret()', outgoing.missingheads |
|
1710 | 1710 | ): |
|
1711 | 1711 | part.addparam( |
|
1712 | 1712 | b'targetphase', b'%d' % phases.secret, mandatory=False |
|
1713 | 1713 | ) |
|
1714 | 1714 | |
|
1715 | 1715 | if opts.get(b'streamv2', False): |
|
1716 | 1716 | addpartbundlestream2(bundler, repo, stream=True) |
|
1717 | 1717 | |
|
1718 | 1718 | if opts.get(b'tagsfnodescache', True): |
|
1719 | 1719 | addparttagsfnodescache(repo, bundler, outgoing) |
|
1720 | 1720 | |
|
1721 | 1721 | if opts.get(b'revbranchcache', True): |
|
1722 | 1722 | addpartrevbranchcache(repo, bundler, outgoing) |
|
1723 | 1723 | |
|
1724 | 1724 | if opts.get(b'obsolescence', False): |
|
1725 | 1725 | obsmarkers = repo.obsstore.relevantmarkers(outgoing.missing) |
|
1726 | 1726 | buildobsmarkerspart(bundler, obsmarkers) |
|
1727 | 1727 | |
|
1728 | 1728 | if opts.get(b'phases', False): |
|
1729 | 1729 | headsbyphase = phases.subsetphaseheads(repo, outgoing.missing) |
|
1730 | 1730 | phasedata = phases.binaryencode(headsbyphase) |
|
1731 | 1731 | bundler.newpart(b'phase-heads', data=phasedata) |
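
The part selection above is driven entirely by the opts mapping; here is a sketch of the keys it consults (the values shown are illustrative, not defaults taken from any real caller):

    # Hypothetical opts for _addpartsfromopts; keys mirror the lookups above.
    opts = {
        b'changegroup': True,        # emit a 'changegroup' part
        b'cg.version': b'02',        # explicit changegroup version
        b'streamv2': False,          # no 'stream2' part
        b'tagsfnodescache': True,    # emit 'hgtagsfnodes'
        b'revbranchcache': True,     # emit 'cache:rev-branch-cache'
        b'obsolescence': False,      # no 'obsmarkers' part
        b'phases': True,             # emit 'phase-heads'
    }
    wanted = sorted(k for k, v in opts.items() if v is True)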
|
1732 | 1732 | |
|
1733 | 1733 | |
|
1734 | 1734 | def addparttagsfnodescache(repo, bundler, outgoing): |
|
1735 | 1735 | # we include the tags fnode cache for the bundle changeset |
|
1736 | 1736 | # (as an optional part)
|
1737 | 1737 | cache = tags.hgtagsfnodescache(repo.unfiltered()) |
|
1738 | 1738 | chunks = [] |
|
1739 | 1739 | |
|
1740 | 1740 | # .hgtags fnodes are only relevant for head changesets. While we could |
|
1741 | 1741 | # transfer values for all known nodes, there will likely be little to |
|
1742 | 1742 | # no benefit. |
|
1743 | 1743 | # |
|
1744 | 1744 | # We don't bother using a generator to produce output data because |
|
1745 | 1745 | # a) we only have 40 bytes per head and even esoteric numbers of heads |
|
1746 | 1746 | # consume little memory (1M heads is 40MB) b) we don't want to send the |
|
1747 | 1747 | # part if we don't have entries and knowing if we have entries requires |
|
1748 | 1748 | # cache lookups. |
|
1749 | 1749 | for node in outgoing.missingheads: |
|
1750 | 1750 | # Don't compute missing, as this may slow down serving. |
|
1751 | 1751 | fnode = cache.getfnode(node, computemissing=False) |
|
1752 | 1752 | if fnode is not None: |
|
1753 | 1753 | chunks.extend([node, fnode]) |
|
1754 | 1754 | |
|
1755 | 1755 | if chunks: |
|
1756 | 1756 | bundler.newpart(b'hgtagsfnodes', data=b''.join(chunks)) |
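
The resulting payload is simply node/fnode pairs laid end to end; a small sketch of that layout (the node ids below are placeholders):

    # Sketch: the 'hgtagsfnodes' payload is a flat run of (node, fnode)
    # pairs, each 20 bytes, with no separators.
    node, fnode = b'\x01' * 20, b'\x02' * 20
    payload = b''.join([node, fnode])

    pairs = [
        (payload[i:i + 20], payload[i + 20:i + 40])
        for i in range(0, len(payload), 40)
    ]
    assert pairs == [(node, fnode)]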
|
1757 | 1757 | |
|
1758 | 1758 | |
|
1759 | 1759 | def addpartrevbranchcache(repo, bundler, outgoing): |
|
1760 | 1760 | # we include the rev branch cache for the bundle changeset |
|
1761 | 1761 | # (as an optional part)
|
1762 | 1762 | cache = repo.revbranchcache() |
|
1763 | 1763 | cl = repo.unfiltered().changelog |
|
1764 | 1764 | branchesdata = collections.defaultdict(lambda: (set(), set())) |
|
1765 | 1765 | for node in outgoing.missing: |
|
1766 | 1766 | branch, close = cache.branchinfo(cl.rev(node)) |
|
1767 | 1767 | branchesdata[branch][close].add(node) |
|
1768 | 1768 | |
|
1769 | 1769 | def generate(): |
|
1770 | 1770 | for branch, (nodes, closed) in sorted(branchesdata.items()): |
|
1771 | 1771 | utf8branch = encoding.fromlocal(branch) |
|
1772 | 1772 | yield rbcstruct.pack(len(utf8branch), len(nodes), len(closed)) |
|
1773 | 1773 | yield utf8branch |
|
1774 | 1774 | for n in sorted(nodes): |
|
1775 | 1775 | yield n |
|
1776 | 1776 | for n in sorted(closed): |
|
1777 | 1777 | yield n |
|
1778 | 1778 | |
|
1779 | 1779 | bundler.newpart(b'cache:rev-branch-cache', data=generate(), mandatory=False) |
|
1780 | 1780 | |
|
1781 | 1781 | |
|
1782 | 1782 | def _formatrequirementsspec(requirements): |
|
1783 | 1783 | requirements = [req for req in requirements if req != b"shared"] |
|
1784 | 1784 | return urlreq.quote(b','.join(sorted(requirements))) |
|
1785 | 1785 | |
|
1786 | 1786 | |
|
1787 | 1787 | def _formatrequirementsparams(requirements): |
|
1788 | 1788 | requirements = _formatrequirementsspec(requirements) |
|
1789 | 1789 | params = b"%s%s" % (urlreq.quote(b"requirements="), requirements) |
|
1790 | 1790 | return params |
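
As a rough illustration of the quoting, here is a standalone sketch using the stdlib quote that urlreq wraps (the return type differs slightly from Mercurial's bytes-oriented wrapper):

    # Sketch of the requirements quoting, using urllib directly.
    from urllib.parse import quote

    def format_requirements_spec(requirements):
        requirements = [req for req in requirements if req != b"shared"]
        return quote(b','.join(sorted(requirements)))

    # The comma separator ends up percent-encoded as %2C.
    assert format_requirements_spec([b'store', b'revlogv1', b'shared']) == 'revlogv1%2Cstore'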
|
1791 | 1791 | |
|
1792 | 1792 | |
|
1793 | 1793 | def addpartbundlestream2(bundler, repo, **kwargs): |
|
1794 | 1794 | if not kwargs.get(r'stream', False): |
|
1795 | 1795 | return |
|
1796 | 1796 | |
|
1797 | 1797 | if not streamclone.allowservergeneration(repo): |
|
1798 | 1798 | raise error.Abort( |
|
1799 | 1799 | _( |
|
1800 | 1800 | b'stream data requested but server does not allow ' |
|
1801 | 1801 | b'this feature' |
|
1802 | 1802 | ), |
|
1803 | 1803 | hint=_( |
|
1804 | 1804 | b'well-behaved clients should not be ' |
|
1805 | 1805 | b'requesting stream data from servers not ' |
|
1806 | 1806 | b'advertising it; the client may be buggy' |
|
1807 | 1807 | ), |
|
1808 | 1808 | ) |
|
1809 | 1809 | |
|
1810 | 1810 | # Stream clones don't compress well. And compression undermines a |
|
1811 | 1811 | # goal of stream clones, which is to be fast. Communicate the desire |
|
1812 | 1812 | # to avoid compression to consumers of the bundle. |
|
1813 | 1813 | bundler.prefercompressed = False |
|
1814 | 1814 | |
|
1815 | 1815 | # get the includes and excludes |
|
1816 | 1816 | includepats = kwargs.get(r'includepats') |
|
1817 | 1817 | excludepats = kwargs.get(r'excludepats') |
|
1818 | 1818 | |
|
1819 | 1819 | narrowstream = repo.ui.configbool( |
|
1820 | 1820 | b'experimental', b'server.stream-narrow-clones' |
|
1821 | 1821 | ) |
|
1822 | 1822 | |
|
1823 | 1823 | if (includepats or excludepats) and not narrowstream: |
|
1824 | 1824 | raise error.Abort(_(b'server does not support narrow stream clones')) |
|
1825 | 1825 | |
|
1826 | 1826 | includeobsmarkers = False |
|
1827 | 1827 | if repo.obsstore: |
|
1828 | 1828 | remoteversions = obsmarkersversion(bundler.capabilities) |
|
1829 | 1829 | if not remoteversions: |
|
1830 | 1830 | raise error.Abort( |
|
1831 | 1831 | _( |
|
1832 | 1832 | b'server has obsolescence markers, but client ' |
|
1833 | 1833 | b'cannot receive them via stream clone' |
|
1834 | 1834 | ) |
|
1835 | 1835 | ) |
|
1836 | 1836 | elif repo.obsstore._version in remoteversions: |
|
1837 | 1837 | includeobsmarkers = True |
|
1838 | 1838 | |
|
1839 | 1839 | filecount, bytecount, it = streamclone.generatev2( |
|
1840 | 1840 | repo, includepats, excludepats, includeobsmarkers |
|
1841 | 1841 | ) |
|
1842 | 1842 | requirements = _formatrequirementsspec(repo.requirements) |
|
1843 | 1843 | part = bundler.newpart(b'stream2', data=it) |
|
1844 | 1844 | part.addparam(b'bytecount', b'%d' % bytecount, mandatory=True) |
|
1845 | 1845 | part.addparam(b'filecount', b'%d' % filecount, mandatory=True) |
|
1846 | 1846 | part.addparam(b'requirements', requirements, mandatory=True) |
|
1847 | 1847 | |
|
1848 | 1848 | |
|
1849 | 1849 | def buildobsmarkerspart(bundler, markers): |
|
1850 | 1850 | """add an obsmarker part to the bundler with <markers> |
|
1851 | 1851 | |
|
1852 | 1852 | No part is created if markers is empty. |
|
1853 | 1853 | Raises ValueError if the bundler doesn't support any known obsmarker format. |
|
1854 | 1854 | """ |
|
1855 | 1855 | if not markers: |
|
1856 | 1856 | return None |
|
1857 | 1857 | |
|
1858 | 1858 | remoteversions = obsmarkersversion(bundler.capabilities) |
|
1859 | 1859 | version = obsolete.commonversion(remoteversions) |
|
1860 | 1860 | if version is None: |
|
1861 | 1861 | raise ValueError(b'bundler does not support common obsmarker format') |
|
1862 | 1862 | stream = obsolete.encodemarkers(markers, True, version=version) |
|
1863 | 1863 | return bundler.newpart(b'obsmarkers', data=stream) |
|
1864 | 1864 | |
|
1865 | 1865 | |
|
1866 | 1866 | def writebundle( |
|
1867 | 1867 | ui, cg, filename, bundletype, vfs=None, compression=None, compopts=None |
|
1868 | 1868 | ): |
|
1869 | 1869 | """Write a bundle file and return its filename. |
|
1870 | 1870 | |
|
1871 | 1871 | Existing files will not be overwritten. |
|
1872 | 1872 | If no filename is specified, a temporary file is created. |
|
1873 | 1873 | bz2 compression can be turned off. |
|
1874 | 1874 | The bundle file will be deleted in case of errors. |
|
1875 | 1875 | """ |
|
1876 | 1876 | |
|
1877 | 1877 | if bundletype == b"HG20": |
|
1878 | 1878 | bundle = bundle20(ui) |
|
1879 | 1879 | bundle.setcompression(compression, compopts) |
|
1880 | 1880 | part = bundle.newpart(b'changegroup', data=cg.getchunks()) |
|
1881 | 1881 | part.addparam(b'version', cg.version) |
|
1882 | 1882 | if b'clcount' in cg.extras: |
|
1883 | 1883 | part.addparam( |
|
1884 | 1884 | b'nbchanges', b'%d' % cg.extras[b'clcount'], mandatory=False |
|
1885 | 1885 | ) |
|
1886 | 1886 | chunkiter = bundle.getchunks() |
|
1887 | 1887 | else: |
|
1888 | 1888 | # compression argument is only for the bundle2 case |
|
1889 | 1889 | assert compression is None |
|
1890 | 1890 | if cg.version != b'01': |
|
1891 | 1891 | raise error.Abort( |
|
1892 | 1892 | _(b'old bundle types only support v1 changegroups')
|
1893 | 1893 | ) |
|
1894 | 1894 | header, comp = bundletypes[bundletype] |
|
1895 | 1895 | if comp not in util.compengines.supportedbundletypes: |
|
1896 | 1896 | raise error.Abort(_(b'unknown stream compression type: %s') % comp) |
|
1897 | 1897 | compengine = util.compengines.forbundletype(comp) |
|
1898 | 1898 | |
|
1899 | 1899 | def chunkiter(): |
|
1900 | 1900 | yield header |
|
1901 | 1901 | for chunk in compengine.compressstream(cg.getchunks(), compopts): |
|
1902 | 1902 | yield chunk |
|
1903 | 1903 | |
|
1904 | 1904 | chunkiter = chunkiter() |
|
1905 | 1905 | |
|
1906 | 1906 | # parse the changegroup data, otherwise we will block |
|
1907 | 1907 | # in case of sshrepo because we don't know the end of the stream |
|
1908 | 1908 | return changegroup.writechunks(ui, chunkiter, filename, vfs=vfs) |
|
1909 | 1909 | |
|
1910 | 1910 | |
|
1911 | 1911 | def combinechangegroupresults(op): |
|
1912 | 1912 | """logic to combine 0 or more addchangegroup results into one""" |
|
1913 | 1913 | results = [r.get(b'return', 0) for r in op.records[b'changegroup']] |
|
1914 | 1914 | changedheads = 0 |
|
1915 | 1915 | result = 1 |
|
1916 | 1916 | for ret in results: |
|
1917 | 1917 | # If any changegroup result is 0, return 0 |
|
1918 | 1918 | if ret == 0: |
|
1919 | 1919 | result = 0 |
|
1920 | 1920 | break |
|
1921 | 1921 | if ret < -1: |
|
1922 | 1922 | changedheads += ret + 1 |
|
1923 | 1923 | elif ret > 1: |
|
1924 | 1924 | changedheads += ret - 1 |
|
1925 | 1925 | if changedheads > 0: |
|
1926 | 1926 | result = 1 + changedheads |
|
1927 | 1927 | elif changedheads < 0: |
|
1928 | 1928 | result = -1 + changedheads |
|
1929 | 1929 | return result |
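
The return-value convention being combined here, as far as the arithmetic above implies: 0 means failure, 1 means success with no head-count change, 1+n means n new heads, and -1-n means n heads removed. A simplified standalone reimplementation for illustration, which returns 0 immediately on any failed result:

    # Simplified sketch of combining addchangegroup results.
    def combine(results):
        changedheads = 0
        for ret in results:
            if ret == 0:          # any failure wins
                return 0
            if ret < -1:
                changedheads += ret + 1
            elif ret > 1:
                changedheads += ret - 1
        if changedheads > 0:
            return 1 + changedheads
        if changedheads < 0:
            return -1 + changedheads
        return 1

    assert combine([1, 1]) == 1      # no head-count change
    assert combine([3, 2]) == 4      # 2 + 1 new heads overall
    assert combine([1, 0, 2]) == 0   # a failed changegroup dominates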
|
1930 | 1930 | |
|
1931 | 1931 | |
|
1932 | 1932 | @parthandler( |
|
1933 | 1933 | b'changegroup', (b'version', b'nbchanges', b'treemanifest', b'targetphase') |
|
1934 | 1934 | ) |
|
1935 | 1935 | def handlechangegroup(op, inpart): |
|
1936 | 1936 | """apply a changegroup part on the repo |
|
1937 | 1937 | |
|
1938 | 1938 | This is a very early implementation that will see massive rework before being

1939 | 1939 | inflicted on any end-user.
|
1940 | 1940 | """ |
|
1941 | 1941 | from . import localrepo |
|
1942 | 1942 | |
|
1943 | 1943 | tr = op.gettransaction() |
|
1944 | 1944 | unpackerversion = inpart.params.get(b'version', b'01') |
|
1945 | 1945 | # We should raise an appropriate exception here |
|
1946 | 1946 | cg = changegroup.getunbundler(unpackerversion, inpart, None) |
|
1947 | 1947 | # the source and url passed here are overwritten by the one contained in |
|
1948 | 1948 | # the transaction.hookargs argument. So 'bundle2' is a placeholder |
|
1949 | 1949 | nbchangesets = None |
|
1950 | 1950 | if b'nbchanges' in inpart.params: |
|
1951 | 1951 | nbchangesets = int(inpart.params.get(b'nbchanges')) |
|
1952 | 1952 | if ( |
|
1953 | 1953 | b'treemanifest' in inpart.params |
|
1954 | 1954 | and b'treemanifest' not in op.repo.requirements |
|
1955 | 1955 | ): |
|
1956 | 1956 | if len(op.repo.changelog) != 0: |
|
1957 | 1957 | raise error.Abort( |
|
1958 | 1958 | _( |
|
1959 | 1959 | b"bundle contains tree manifests, but local repo is " |
|
1960 | 1960 | b"non-empty and does not use tree manifests" |
|
1961 | 1961 | ) |
|
1962 | 1962 | ) |
|
1963 | 1963 | op.repo.requirements.add(b'treemanifest') |
|
1964 | 1964 | op.repo.svfs.options = localrepo.resolvestorevfsoptions( |
|
1965 | 1965 | op.repo.ui, op.repo.requirements, op.repo.features |
|
1966 | 1966 | ) |
|
1967 | 1967 | op.repo._writerequirements() |
|
1968 | 1968 | extrakwargs = {} |
|
1969 | 1969 | targetphase = inpart.params.get(b'targetphase') |
|
1970 | 1970 | if targetphase is not None: |
|
1971 | 1971 | extrakwargs[r'targetphase'] = int(targetphase) |
|
1972 | 1972 | ret = _processchangegroup( |
|
1973 | 1973 | op, |
|
1974 | 1974 | cg, |
|
1975 | 1975 | tr, |
|
1976 | 1976 | b'bundle2', |
|
1977 | 1977 | b'bundle2', |
|
1978 | 1978 | expectedtotal=nbchangesets, |
|
1979 | 1979 | **extrakwargs |
|
1980 | 1980 | ) |
|
1981 | 1981 | if op.reply is not None: |
|
1982 | 1982 | # This is definitely not the final form of this |
|
1983 | 1983 | # return. But one needs to start somewhere.
|
1984 | 1984 | part = op.reply.newpart(b'reply:changegroup', mandatory=False) |
|
1985 | 1985 | part.addparam( |
|
1986 | 1986 | b'in-reply-to', pycompat.bytestr(inpart.id), mandatory=False |
|
1987 | 1987 | ) |
|
1988 | 1988 | part.addparam(b'return', b'%i' % ret, mandatory=False) |
|
1989 | 1989 | assert not inpart.read() |
|
1990 | 1990 | |
|
1991 | 1991 | |
|
1992 | 1992 | _remotechangegroupparams = tuple( |
|
1993 | 1993 | [b'url', b'size', b'digests'] |
|
1994 | 1994 | + [b'digest:%s' % k for k in util.DIGESTS.keys()] |
|
1995 | 1995 | ) |
|
1996 | 1996 | |
|
1997 | 1997 | |
|
1998 | 1998 | @parthandler(b'remote-changegroup', _remotechangegroupparams) |
|
1999 | 1999 | def handleremotechangegroup(op, inpart): |
|
2000 | 2000 | """apply a bundle10 on the repo, given a url and validation information
|
2001 | 2001 | |
|
2002 | 2002 | All the information about the remote bundle to import is given as
|
2003 | 2003 | parameters. The parameters include: |
|
2004 | 2004 | - url: the url to the bundle10. |
|
2005 | 2005 | - size: the bundle10 file size. It is used to validate what was |
|
2006 | 2006 | retrieved by the client matches the server knowledge about the bundle. |
|
2007 | 2007 | - digests: a space separated list of the digest types provided as |
|
2008 | 2008 | parameters. |
|
2009 | 2009 | - digest:<digest-type>: the hexadecimal representation of the digest with |
|
2010 | 2010 | that name. Like the size, it is used to validate what was retrieved by |
|
2011 | 2011 | the client matches what the server knows about the bundle. |
|
2012 | 2012 | |
|
2013 | 2013 | When multiple digest types are given, all of them are checked. |
|
2014 | 2014 | """ |
|
2015 | 2015 | try: |
|
2016 | 2016 | raw_url = inpart.params[b'url'] |
|
2017 | 2017 | except KeyError: |
|
2018 | 2018 | raise error.Abort(_(b'remote-changegroup: missing "%s" param') % b'url') |
|
2019 | 2019 | parsed_url = util.url(raw_url) |
|
2020 | 2020 | if parsed_url.scheme not in capabilities[b'remote-changegroup']: |
|
2021 | 2021 | raise error.Abort( |
|
2022 | 2022 | _(b'remote-changegroup does not support %s urls') |
|
2023 | 2023 | % parsed_url.scheme |
|
2024 | 2024 | ) |
|
2025 | 2025 | |
|
2026 | 2026 | try: |
|
2027 | 2027 | size = int(inpart.params[b'size']) |
|
2028 | 2028 | except ValueError: |
|
2029 | 2029 | raise error.Abort( |
|
2030 | 2030 | _(b'remote-changegroup: invalid value for param "%s"') % b'size' |
|
2031 | 2031 | ) |
|
2032 | 2032 | except KeyError: |
|
2033 | 2033 | raise error.Abort( |
|
2034 | 2034 | _(b'remote-changegroup: missing "%s" param') % b'size' |
|
2035 | 2035 | ) |
|
2036 | 2036 | |
|
2037 | 2037 | digests = {} |
|
2038 | 2038 | for typ in inpart.params.get(b'digests', b'').split(): |
|
2039 | 2039 | param = b'digest:%s' % typ |
|
2040 | 2040 | try: |
|
2041 | 2041 | value = inpart.params[param] |
|
2042 | 2042 | except KeyError: |
|
2043 | 2043 | raise error.Abort( |
|
2044 | 2044 | _(b'remote-changegroup: missing "%s" param') % param |
|
2045 | 2045 | ) |
|
2046 | 2046 | digests[typ] = value |
|
2047 | 2047 | |
|
2048 | 2048 | real_part = util.digestchecker(url.open(op.ui, raw_url), size, digests) |
|
2049 | 2049 | |
|
2050 | 2050 | tr = op.gettransaction() |
|
2051 | 2051 | from . import exchange |
|
2052 | 2052 | |
|
2053 | 2053 | cg = exchange.readbundle(op.repo.ui, real_part, raw_url) |
|
2054 | 2054 | if not isinstance(cg, changegroup.cg1unpacker): |
|
2055 | 2055 | raise error.Abort( |
|
2056 | 2056 | _(b'%s: not a bundle version 1.0') % util.hidepassword(raw_url) |
|
2057 | 2057 | ) |
|
2058 | 2058 | ret = _processchangegroup(op, cg, tr, b'bundle2', b'bundle2') |
|
2059 | 2059 | if op.reply is not None: |
|
2060 | 2060 | # This is definitely not the final form of this |
|
2061 | 2061 | # return. But one needs to start somewhere.
|
2062 | 2062 | part = op.reply.newpart(b'reply:changegroup') |
|
2063 | 2063 | part.addparam( |
|
2064 | 2064 | b'in-reply-to', pycompat.bytestr(inpart.id), mandatory=False |
|
2065 | 2065 | ) |
|
2066 | 2066 | part.addparam(b'return', b'%i' % ret, mandatory=False) |
|
2067 | 2067 | try: |
|
2068 | 2068 | real_part.validate() |
|
2069 | 2069 | except error.Abort as e: |
|
2070 | 2070 | raise error.Abort( |
|
2071 | 2071 | _(b'bundle at %s is corrupted:\n%s') |
|
2072 | 2072 | % (util.hidepassword(raw_url), bytes(e)) |
|
2073 | 2073 | ) |
|
2074 | 2074 | assert not inpart.read() |
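
To make the parameter layout described in the docstring concrete, here is a hypothetical params mapping and the digest collection step (all values are made up):

    # Hypothetical remote-changegroup part parameters.
    params = {
        b'url': b'https://example.com/pull.hg',
        b'size': b'12345',
        b'digests': b'sha1 md5',
        b'digest:sha1': b'0' * 40,
        b'digest:md5': b'0' * 32,
    }

    # One expected digest is collected per advertised type.
    digests = {
        typ: params[b'digest:%s' % typ]
        for typ in params.get(b'digests', b'').split()
    }
    assert set(digests) == {b'sha1', b'md5'}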
|
2075 | 2075 | |
|
2076 | 2076 | |
|
2077 | 2077 | @parthandler(b'reply:changegroup', (b'return', b'in-reply-to')) |
|
2078 | 2078 | def handlereplychangegroup(op, inpart): |
|
2079 | 2079 | ret = int(inpart.params[b'return']) |
|
2080 | 2080 | replyto = int(inpart.params[b'in-reply-to']) |
|
2081 | 2081 | op.records.add(b'changegroup', {b'return': ret}, replyto) |
|
2082 | 2082 | |
|
2083 | 2083 | |
|
2084 | 2084 | @parthandler(b'check:bookmarks') |
|
2085 | 2085 | def handlecheckbookmarks(op, inpart): |
|
2086 | 2086 | """check location of bookmarks |
|
2087 | 2087 | |
|
2088 | 2088 | This part is to be used to detect push races regarding bookmarks; it

2089 | 2089 | contains binary encoded (bookmark, node) tuples. If the local state does

2090 | 2090 | not match the one in the part, a PushRaced exception is raised.
|
2091 | 2091 | """ |
|
2092 | 2092 | bookdata = bookmarks.binarydecode(inpart) |
|
2093 | 2093 | |
|
2094 | 2094 | msgstandard = ( |
|
2095 | 2095 | b'remote repository changed while pushing - please try again ' |
|
2096 | 2096 | b'(bookmark "%s" move from %s to %s)' |
|
2097 | 2097 | ) |
|
2098 | 2098 | msgmissing = ( |
|
2099 | 2099 | b'remote repository changed while pushing - please try again ' |
|
2100 | 2100 | b'(bookmark "%s" is missing, expected %s)' |
|
2101 | 2101 | ) |
|
2102 | 2102 | msgexist = ( |
|
2103 | 2103 | b'remote repository changed while pushing - please try again ' |
|
2104 | 2104 | b'(bookmark "%s" set on %s, expected missing)' |
|
2105 | 2105 | ) |
|
2106 | 2106 | for book, node in bookdata: |
|
2107 | 2107 | currentnode = op.repo._bookmarks.get(book) |
|
2108 | 2108 | if currentnode != node: |
|
2109 | 2109 | if node is None: |
|
2110 | 2110 | finalmsg = msgexist % (book, nodemod.short(currentnode)) |
|
2111 | 2111 | elif currentnode is None: |
|
2112 | 2112 | finalmsg = msgmissing % (book, nodemod.short(node)) |
|
2113 | 2113 | else: |
|
2114 | 2114 | finalmsg = msgstandard % ( |
|
2115 | 2115 | book, |
|
2116 | 2116 | nodemod.short(node), |
|
2117 | 2117 | nodemod.short(currentnode), |
|
2118 | 2118 | ) |
|
2119 | 2119 | raise error.PushRaced(finalmsg) |
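
The race check itself reduces to comparing each pushed (bookmark, node) pair against the local bookmark store; a toy sketch with placeholder values:

    # Toy sketch of the bookmark race check (placeholder node ids).
    local = {b'feature': b'\x01' * 20}
    pushed = [(b'feature', b'\x02' * 20)]   # where the client expects it

    races = [(book, node) for book, node in pushed if local.get(book) != node]
    assert races == pushed                  # mismatch -> PushRaced above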
|
2120 | 2120 | |
|
2121 | 2121 | |
|
2122 | 2122 | @parthandler(b'check:heads') |
|
2123 | 2123 | def handlecheckheads(op, inpart): |
|
2124 | 2124 | """check that head of the repo did not change |
|
2125 | 2125 | |
|
2126 | 2126 | This is used to detect a push race when using unbundle. |
|
2127 | 2127 | This replaces the "heads" argument of unbundle.""" |
|
2128 | 2128 | h = inpart.read(20) |
|
2129 | 2129 | heads = [] |
|
2130 | 2130 | while len(h) == 20: |
|
2131 | 2131 | heads.append(h) |
|
2132 | 2132 | h = inpart.read(20) |
|
2133 | 2133 | assert not h |
|
2134 | 2134 | # Trigger a transaction so that we are guaranteed to have the lock now. |
|
2135 | 2135 | if op.ui.configbool(b'experimental', b'bundle2lazylocking'): |
|
2136 | 2136 | op.gettransaction() |
|
2137 | 2137 | if sorted(heads) != sorted(op.repo.heads()): |
|
2138 | 2138 | raise error.PushRaced( |
|
2139 | 2139 | b'remote repository changed while pushing - ' b'please try again' |
|
2140 | 2140 | ) |
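
The check:heads payload is nothing more than the expected head nodes concatenated as raw 20-byte ids; a sketch of producing and re-reading such a payload:

    # Sketch: build and re-parse a check:heads style payload.
    import io

    heads = [b'\xaa' * 20, b'\xbb' * 20]    # placeholder node ids
    payload = io.BytesIO(b''.join(heads))

    parsed = []
    h = payload.read(20)
    while len(h) == 20:
        parsed.append(h)
        h = payload.read(20)
    assert parsed == heads and not h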
|
2141 | 2141 | |
|
2142 | 2142 | |
|
2143 | 2143 | @parthandler(b'check:updated-heads') |
|
2144 | 2144 | def handlecheckupdatedheads(op, inpart): |
|
2145 | 2145 | """check for race on the heads touched by a push |
|
2146 | 2146 | |
|
2147 | 2147 | This is similar to 'check:heads' but focuses on the heads actually updated

2148 | 2148 | during the push. If other activities happen on unrelated heads, they are

2149 | 2149 | ignored.
|
2150 | 2150 | |
|
2151 | 2151 | This allows servers with high traffic to avoid push contention as long as

2152 | 2152 | only unrelated parts of the graph are involved."""
|
2153 | 2153 | h = inpart.read(20) |
|
2154 | 2154 | heads = [] |
|
2155 | 2155 | while len(h) == 20: |
|
2156 | 2156 | heads.append(h) |
|
2157 | 2157 | h = inpart.read(20) |
|
2158 | 2158 | assert not h |
|
2159 | 2159 | # trigger a transaction so that we are guaranteed to have the lock now. |
|
2160 | 2160 | if op.ui.configbool(b'experimental', b'bundle2lazylocking'): |
|
2161 | 2161 | op.gettransaction() |
|
2162 | 2162 | |
|
2163 | 2163 | currentheads = set() |
|
2164 | 2164 | for ls in op.repo.branchmap().iterheads(): |
|
2165 | 2165 | currentheads.update(ls) |
|
2166 | 2166 | |
|
2167 | 2167 | for h in heads: |
|
2168 | 2168 | if h not in currentheads: |
|
2169 | 2169 | raise error.PushRaced( |
|
2170 | 2170 | b'remote repository changed while pushing - ' |
|
2171 | 2171 | b'please try again' |
|
2172 | 2172 | ) |
|
2173 | 2173 | |
|
2174 | 2174 | |
|
2175 | 2175 | @parthandler(b'check:phases') |
|
2176 | 2176 | def handlecheckphases(op, inpart): |
|
2177 | 2177 | """check that phase boundaries of the repository did not change |
|
2178 | 2178 | |
|
2179 | 2179 | This is used to detect a push race. |
|
2180 | 2180 | """ |
|
2181 | 2181 | phasetonodes = phases.binarydecode(inpart) |
|
2182 | 2182 | unfi = op.repo.unfiltered() |
|
2183 | 2183 | cl = unfi.changelog |
|
2184 | 2184 | phasecache = unfi._phasecache |
|
2185 | 2185 | msg = ( |
|
2186 | 2186 | b'remote repository changed while pushing - please try again ' |
|
2187 | 2187 | b'(%s is %s expected %s)' |
|
2188 | 2188 | ) |
|
2189 | 2189 | for expectedphase, nodes in enumerate(phasetonodes): |
|
2190 | 2190 | for n in nodes: |
|
2191 | 2191 | actualphase = phasecache.phase(unfi, cl.rev(n)) |
|
2192 | 2192 | if actualphase != expectedphase: |
|
2193 | 2193 | finalmsg = msg % ( |
|
2194 | 2194 | nodemod.short(n), |
|
2195 | 2195 | phases.phasenames[actualphase], |
|
2196 | 2196 | phases.phasenames[expectedphase], |
|
2197 | 2197 | ) |
|
2198 | 2198 | raise error.PushRaced(finalmsg) |
|
2199 | 2199 | |
|
2200 | 2200 | |
|
2201 | 2201 | @parthandler(b'output') |
|
2202 | 2202 | def handleoutput(op, inpart): |
|
2203 | 2203 | """forward output captured on the server to the client""" |
|
2204 | 2204 | for line in inpart.read().splitlines(): |
|
2205 | 2205 | op.ui.status(_(b'remote: %s\n') % line) |
|
2206 | 2206 | |
|
2207 | 2207 | |
|
2208 | 2208 | @parthandler(b'replycaps') |
|
2209 | 2209 | def handlereplycaps(op, inpart): |
|
2210 | 2210 | """Notify that a reply bundle should be created |
|
2211 | 2211 | |
|
2212 | 2212 | The payload contains the capabilities information for the reply""" |
|
2213 | 2213 | caps = decodecaps(inpart.read()) |
|
2214 | 2214 | if op.reply is None: |
|
2215 | 2215 | op.reply = bundle20(op.ui, caps) |
|
2216 | 2216 | |
|
2217 | 2217 | |
|
2218 | 2218 | class AbortFromPart(error.Abort): |
|
2219 | 2219 | """Sub-class of Abort that denotes an error from a bundle2 part.""" |
|
2220 | 2220 | |
|
2221 | 2221 | |
|
2222 | 2222 | @parthandler(b'error:abort', (b'message', b'hint')) |
|
2223 | 2223 | def handleerrorabort(op, inpart): |
|
2224 | 2224 | """Used to transmit abort error over the wire""" |
|
2225 | 2225 | raise AbortFromPart( |
|
2226 | 2226 | inpart.params[b'message'], hint=inpart.params.get(b'hint') |
|
2227 | 2227 | ) |
|
2228 | 2228 | |
|
2229 | 2229 | |
|
2230 | 2230 | @parthandler( |
|
2231 | 2231 | b'error:pushkey', |
|
2232 | 2232 | (b'namespace', b'key', b'new', b'old', b'ret', b'in-reply-to'), |
|
2233 | 2233 | ) |
|
2234 | 2234 | def handleerrorpushkey(op, inpart): |
|
2235 | 2235 | """Used to transmit failure of a mandatory pushkey over the wire""" |
|
2236 | 2236 | kwargs = {} |
|
2237 | 2237 | for name in (b'namespace', b'key', b'new', b'old', b'ret'): |
|
2238 | 2238 | value = inpart.params.get(name) |
|
2239 | 2239 | if value is not None: |
|
2240 | 2240 | kwargs[name] = value |
|
2241 | 2241 | raise error.PushkeyFailed( |
|
2242 | 2242 | inpart.params[b'in-reply-to'], **pycompat.strkwargs(kwargs) |
|
2243 | 2243 | ) |
|
2244 | 2244 | |
|
2245 | 2245 | |
|
2246 | 2246 | @parthandler(b'error:unsupportedcontent', (b'parttype', b'params')) |
|
2247 | 2247 | def handleerrorunsupportedcontent(op, inpart): |
|
2248 | 2248 | """Used to transmit unknown content error over the wire""" |
|
2249 | 2249 | kwargs = {} |
|
2250 | 2250 | parttype = inpart.params.get(b'parttype') |
|
2251 | 2251 | if parttype is not None: |
|
2252 | 2252 | kwargs[b'parttype'] = parttype |
|
2253 | 2253 | params = inpart.params.get(b'params') |
|
2254 | 2254 | if params is not None: |
|
2255 | 2255 | kwargs[b'params'] = params.split(b'\0') |
|
2256 | 2256 | |
|
2257 | 2257 | raise error.BundleUnknownFeatureError(**pycompat.strkwargs(kwargs)) |
|
2258 | 2258 | |
|
2259 | 2259 | |
|
2260 | 2260 | @parthandler(b'error:pushraced', (b'message',)) |
|
2261 | 2261 | def handleerrorpushraced(op, inpart): |
|
2262 | 2262 | """Used to transmit push race error over the wire""" |
|
2263 | 2263 | raise error.ResponseError(_(b'push failed:'), inpart.params[b'message']) |
|
2264 | 2264 | |
|
2265 | 2265 | |
|
2266 | 2266 | @parthandler(b'listkeys', (b'namespace',)) |
|
2267 | 2267 | def handlelistkeys(op, inpart): |
|
2268 | 2268 | """retrieve pushkey namespace content stored in a bundle2""" |
|
2269 | 2269 | namespace = inpart.params[b'namespace'] |
|
2270 | 2270 | r = pushkey.decodekeys(inpart.read()) |
|
2271 | 2271 | op.records.add(b'listkeys', (namespace, r)) |
|
2272 | 2272 | |
|
2273 | 2273 | |
|
2274 | 2274 | @parthandler(b'pushkey', (b'namespace', b'key', b'old', b'new')) |
|
2275 | 2275 | def handlepushkey(op, inpart): |
|
2276 | 2276 | """process a pushkey request""" |
|
2277 | 2277 | dec = pushkey.decode |
|
2278 | 2278 | namespace = dec(inpart.params[b'namespace']) |
|
2279 | 2279 | key = dec(inpart.params[b'key']) |
|
2280 | 2280 | old = dec(inpart.params[b'old']) |
|
2281 | 2281 | new = dec(inpart.params[b'new']) |
|
2282 | 2282 | # Grab the transaction to ensure that we have the lock before performing the |
|
2283 | 2283 | # pushkey. |
|
2284 | 2284 | if op.ui.configbool(b'experimental', b'bundle2lazylocking'): |
|
2285 | 2285 | op.gettransaction() |
|
2286 | 2286 | ret = op.repo.pushkey(namespace, key, old, new) |
|
2287 | 2287 | record = {b'namespace': namespace, b'key': key, b'old': old, b'new': new} |
|
2288 | 2288 | op.records.add(b'pushkey', record) |
|
2289 | 2289 | if op.reply is not None: |
|
2290 | 2290 | rpart = op.reply.newpart(b'reply:pushkey') |
|
2291 | 2291 | rpart.addparam( |
|
2292 | 2292 | b'in-reply-to', pycompat.bytestr(inpart.id), mandatory=False |
|
2293 | 2293 | ) |
|
2294 | 2294 | rpart.addparam(b'return', b'%i' % ret, mandatory=False) |
|
2295 | 2295 | if inpart.mandatory and not ret: |
|
2296 | 2296 | kwargs = {} |
|
2297 | 2297 | for key in (b'namespace', b'key', b'new', b'old', b'ret'): |
|
2298 | 2298 | if key in inpart.params: |
|
2299 | 2299 | kwargs[key] = inpart.params[key] |
|
2300 | 2300 | raise error.PushkeyFailed( |
|
2301 | 2301 | partid=b'%d' % inpart.id, **pycompat.strkwargs(kwargs) |
|
2302 | 2302 | ) |
|
2303 | 2303 | |
|
2304 | 2304 | |
|
2305 | 2305 | @parthandler(b'bookmarks') |
|
2306 | 2306 | def handlebookmark(op, inpart): |
|
2307 | 2307 | """transmit bookmark information |
|
2308 | 2308 | |
|
2309 | 2309 | The part contains binary encoded bookmark information. |
|
2310 | 2310 | |
|
2311 | 2311 | The exact behavior of this part can be controlled by the 'bookmarks' mode |
|
2312 | 2312 | on the bundle operation. |
|
2313 | 2313 | |
|
2314 | 2314 | When mode is 'apply' (the default) the bookmark information is applied as |
|
2315 | 2315 | is to the unbundling repository. Make sure a 'check:bookmarks' part is |
|
2316 | 2316 | issued earlier to check for push races in such an update. This behavior is
|
2317 | 2317 | suitable for pushing. |
|
2318 | 2318 | |
|
2319 | 2319 | When mode is 'records', the information is recorded into the 'bookmarks' |
|
2320 | 2320 | records of the bundle operation. This behavior is suitable for pulling. |
|
2321 | 2321 | """ |
|
2322 | 2322 | changes = bookmarks.binarydecode(inpart) |
|
2323 | 2323 | |
|
2324 | 2324 | pushkeycompat = op.repo.ui.configbool( |
|
2325 | 2325 | b'server', b'bookmarks-pushkey-compat' |
|
2326 | 2326 | ) |
|
2327 | 2327 | bookmarksmode = op.modes.get(b'bookmarks', b'apply') |
|
2328 | 2328 | |
|
2329 | 2329 | if bookmarksmode == b'apply': |
|
2330 | 2330 | tr = op.gettransaction() |
|
2331 | 2331 | bookstore = op.repo._bookmarks |
|
2332 | 2332 | if pushkeycompat: |
|
2333 | 2333 | allhooks = [] |
|
2334 | 2334 | for book, node in changes: |
|
2335 | 2335 | hookargs = tr.hookargs.copy() |
|
2336 | 2336 | hookargs[b'pushkeycompat'] = b'1' |
|
2337 | 2337 | hookargs[b'namespace'] = b'bookmarks' |
|
2338 | 2338 | hookargs[b'key'] = book |
|
2339 | 2339 | hookargs[b'old'] = nodemod.hex(bookstore.get(book, b'')) |
|
2340 | 2340 | hookargs[b'new'] = nodemod.hex( |
|
2341 | 2341 | node if node is not None else b'' |
|
2342 | 2342 | ) |
|
2343 | 2343 | allhooks.append(hookargs) |
|
2344 | 2344 | |
|
2345 | 2345 | for hookargs in allhooks: |
|
2346 | 2346 | op.repo.hook( |
|
2347 | 2347 | b'prepushkey', throw=True, **pycompat.strkwargs(hookargs) |
|
2348 | 2348 | ) |
|
2349 | 2349 | |
|
2350 | 2350 | bookstore.applychanges(op.repo, op.gettransaction(), changes) |
|
2351 | 2351 | |
|
2352 | 2352 | if pushkeycompat: |
|
2353 | 2353 | |
|
2354 | 2354 | def runhook(): |
|
2355 | 2355 | for hookargs in allhooks: |
|
2356 | 2356 | op.repo.hook(b'pushkey', **pycompat.strkwargs(hookargs)) |
|
2357 | 2357 | |
|
2358 | 2358 | op.repo._afterlock(runhook) |
|
2359 | 2359 | |
|
2360 | 2360 | elif bookmarksmode == b'records': |
|
2361 | 2361 | for book, node in changes: |
|
2362 | 2362 | record = {b'bookmark': book, b'node': node} |
|
2363 | 2363 | op.records.add(b'bookmarks', record) |
|
2364 | 2364 | else: |
|
2365 | 2365 | raise error.ProgrammingError( |
|
2366 | 2366 | b'unknown bookmark mode: %s' % bookmarksmode
|
2367 | 2367 | ) |
|
2368 | 2368 | |
|
2369 | 2369 | |
|
2370 | 2370 | @parthandler(b'phase-heads') |
|
2371 | 2371 | def handlephases(op, inpart): |
|
2372 | 2372 | """apply phases from bundle part to repo""" |
|
2373 | 2373 | headsbyphase = phases.binarydecode(inpart) |
|
2374 | 2374 | phases.updatephases(op.repo.unfiltered(), op.gettransaction, headsbyphase) |
|
2375 | 2375 | |
|
2376 | 2376 | |
|
2377 | 2377 | @parthandler(b'reply:pushkey', (b'return', b'in-reply-to')) |
|
2378 | 2378 | def handlepushkeyreply(op, inpart): |
|
2379 | 2379 | """retrieve the result of a pushkey request""" |
|
2380 | 2380 | ret = int(inpart.params[b'return']) |
|
2381 | 2381 | partid = int(inpart.params[b'in-reply-to']) |
|
2382 | 2382 | op.records.add(b'pushkey', {b'return': ret}, partid) |
|
2383 | 2383 | |
|
2384 | 2384 | |
|
2385 | 2385 | @parthandler(b'obsmarkers') |
|
2386 | 2386 | def handleobsmarker(op, inpart): |
|
2387 | 2387 | """add a stream of obsmarkers to the repo""" |
|
2388 | 2388 | tr = op.gettransaction() |
|
2389 | 2389 | markerdata = inpart.read() |
|
2390 | 2390 | if op.ui.config(b'experimental', b'obsmarkers-exchange-debug'): |
|
2391 | 2391 | op.ui.writenoi18n( |
|
2392 | 2392 | b'obsmarker-exchange: %i bytes received\n' % len(markerdata) |
|
2393 | 2393 | ) |
|
2394 | 2394 | # The mergemarkers call will crash if marker creation is not enabled. |
|
2395 | 2395 | # we want to avoid this if the part is advisory. |
|
2396 | 2396 | if not inpart.mandatory and op.repo.obsstore.readonly: |
|
2397 | 2397 | op.repo.ui.debug( |
|
2398 | 2398 | b'ignoring obsolescence markers, feature not enabled\n' |
|
2399 | 2399 | ) |
|
2400 | 2400 | return |
|
2401 | 2401 | new = op.repo.obsstore.mergemarkers(tr, markerdata) |
|
2402 | 2402 | op.repo.invalidatevolatilesets() |
|
2403 | 2403 | op.records.add(b'obsmarkers', {b'new': new}) |
|
2404 | 2404 | if op.reply is not None: |
|
2405 | 2405 | rpart = op.reply.newpart(b'reply:obsmarkers') |
|
2406 | 2406 | rpart.addparam( |
|
2407 | 2407 | b'in-reply-to', pycompat.bytestr(inpart.id), mandatory=False |
|
2408 | 2408 | ) |
|
2409 | 2409 | rpart.addparam(b'new', b'%i' % new, mandatory=False) |
|
2410 | 2410 | |
|
2411 | 2411 | |
|
2412 | 2412 | @parthandler(b'reply:obsmarkers', (b'new', b'in-reply-to')) |
|
2413 | 2413 | def handleobsmarkerreply(op, inpart): |
|
2414 | 2414 | """retrieve the result of a pushkey request""" |
|
2415 | 2415 | ret = int(inpart.params[b'new']) |
|
2416 | 2416 | partid = int(inpart.params[b'in-reply-to']) |
|
2417 | 2417 | op.records.add(b'obsmarkers', {b'new': ret}, partid) |
|
2418 | 2418 | |
|
2419 | 2419 | |
|
2420 | 2420 | @parthandler(b'hgtagsfnodes') |
|
2421 | 2421 | def handlehgtagsfnodes(op, inpart): |
|
2422 | 2422 | """Applies .hgtags fnodes cache entries to the local repo. |
|
2423 | 2423 | |
|
2424 | 2424 | Payload is pairs of 20 byte changeset nodes and filenodes. |
|
2425 | 2425 | """ |
|
2426 | 2426 | # Grab the transaction so we ensure that we have the lock at this point. |
|
2427 | 2427 | if op.ui.configbool(b'experimental', b'bundle2lazylocking'): |
|
2428 | 2428 | op.gettransaction() |
|
2429 | 2429 | cache = tags.hgtagsfnodescache(op.repo.unfiltered()) |
|
2430 | 2430 | |
|
2431 | 2431 | count = 0 |
|
2432 | 2432 | while True: |
|
2433 | 2433 | node = inpart.read(20) |
|
2434 | 2434 | fnode = inpart.read(20) |
|
2435 | 2435 | if len(node) < 20 or len(fnode) < 20: |
|
2436 | 2436 | op.ui.debug(b'ignoring incomplete received .hgtags fnodes data\n') |
|
2437 | 2437 | break |
|
2438 | 2438 | cache.setfnode(node, fnode) |
|
2439 | 2439 | count += 1 |
|
2440 | 2440 | |
|
2441 | 2441 | cache.write() |
|
2442 | 2442 | op.ui.debug(b'applied %i hgtags fnodes cache entries\n' % count) |
|
2443 | 2443 | |
|
2444 | 2444 | |
|
2445 | 2445 | rbcstruct = struct.Struct(b'>III') |
|
2446 | 2446 | |
|
2447 | 2447 | |
|
2448 | 2448 | @parthandler(b'cache:rev-branch-cache') |
|
2449 | 2449 | def handlerbc(op, inpart): |
|
2450 | 2450 | """receive a rev-branch-cache payload and update the local cache |
|
2451 | 2451 | |
|
2452 | 2452 | The payload is a series of records, one per branch, each containing:
|
2453 | 2453 | |
|
2454 | 2454 | 1) branch name length |
|
2455 | 2455 | 2) number of open heads |
|
2456 | 2456 | 3) number of closed heads |
|
2457 | 2457 | 4) open heads nodes |
|
2458 | 2458 | 5) closed heads nodes |
|
2459 | 2459 | """ |
|
2460 | 2460 | total = 0 |
|
2461 | 2461 | rawheader = inpart.read(rbcstruct.size) |
|
2462 | 2462 | cache = op.repo.revbranchcache() |
|
2463 | 2463 | cl = op.repo.unfiltered().changelog |
|
2464 | 2464 | while rawheader: |
|
2465 | 2465 | header = rbcstruct.unpack(rawheader) |
|
2466 | 2466 | total += header[1] + header[2] |
|
2467 | 2467 | utf8branch = inpart.read(header[0]) |
|
2468 | 2468 | branch = encoding.tolocal(utf8branch) |
|
2469 | 2469 | for x in pycompat.xrange(header[1]): |
|
2470 | 2470 | node = inpart.read(20) |
|
2471 | 2471 | rev = cl.rev(node) |
|
2472 | 2472 | cache.setdata(branch, rev, node, False) |
|
2473 | 2473 | for x in pycompat.xrange(header[2]): |
|
2474 | 2474 | node = inpart.read(20) |
|
2475 | 2475 | rev = cl.rev(node) |
|
2476 | 2476 | cache.setdata(branch, rev, node, True) |
|
2477 | 2477 | rawheader = inpart.read(rbcstruct.size) |
|
2478 | 2478 | cache.write() |
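
Putting the numbered layout together, one record is a >III header (branch-name length, open-head count, closed-head count) followed by the branch name and the raw 20-byte nodes; a small packing sketch with placeholder data:

    # Sketch: pack one rev-branch-cache record per the layout above.
    import struct

    rbc = struct.Struct(b'>III')
    branch = b'default'
    open_heads = [b'\x11' * 20]             # placeholder node ids
    closed_heads = []

    record = rbc.pack(len(branch), len(open_heads), len(closed_heads))
    record += branch + b''.join(open_heads) + b''.join(closed_heads)
    assert len(record) == rbc.size + len(branch) + 20 * len(open_heads)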
|
2479 | 2479 | |
|
2480 | 2480 | |
|
2481 | 2481 | @parthandler(b'pushvars') |
|
2482 | 2482 | def bundle2getvars(op, part): |
|
2483 | 2483 | '''unbundle a bundle2 containing shellvars on the server''' |
|
2484 | 2484 | # An option to disable unbundling on server-side for security reasons |
|
2485 | 2485 | if op.ui.configbool(b'push', b'pushvars.server'): |
|
2486 | 2486 | hookargs = {} |
|
2487 | 2487 | for key, value in part.advisoryparams: |
|
2488 | 2488 | key = key.upper() |
|
2489 | 2489 | # We want pushed variables to have USERVAR_ prepended so we know |
|
2490 | 2490 | # they came from the --pushvar flag. |
|
2491 | 2491 | key = b"USERVAR_" + key |
|
2492 | 2492 | hookargs[key] = value |
|
2493 | 2493 | op.addhookargs(hookargs) |
|
2494 | 2494 | |
|
2495 | 2495 | |
|
2496 | 2496 | @parthandler(b'stream2', (b'requirements', b'filecount', b'bytecount')) |
|
2497 | 2497 | def handlestreamv2bundle(op, part): |
|
2498 | 2498 | |
|
2499 | 2499 | requirements = urlreq.unquote(part.params[b'requirements']).split(b',') |
|
2500 | 2500 | filecount = int(part.params[b'filecount']) |
|
2501 | 2501 | bytecount = int(part.params[b'bytecount']) |
|
2502 | 2502 | |
|
2503 | 2503 | repo = op.repo |
|
2504 | 2504 | if len(repo): |
|
2505 | 2505 | msg = _(b'cannot apply stream clone to non empty repository') |
|
2506 | 2506 | raise error.Abort(msg) |
|
2507 | 2507 | |
|
2508 | 2508 | repo.ui.debug(b'applying stream bundle\n') |
|
2509 | 2509 | streamclone.applybundlev2(repo, part, filecount, bytecount, requirements) |
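
For illustration, here is how the three stream2 parameters read above could be decoded, using the stdlib unquote that urlreq wraps (the values are made up):

    # Sketch: decode hypothetical stream2 part parameters.
    from urllib.parse import unquote

    params = {
        b'requirements': b'revlogv1%2Cstore',
        b'filecount': b'3',
        b'bytecount': b'123456',
    }
    requirements = unquote(params[b'requirements'].decode()).split(',')
    filecount = int(params[b'filecount'])
    bytecount = int(params[b'bytecount'])
    assert requirements == ['revlogv1', 'store'] and filecount == 3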
|
2510 | 2510 | |
|
2511 | 2511 | |
|
2512 | 2512 | def widen_bundle( |
|
2513 | 2513 | bundler, repo, oldmatcher, newmatcher, common, known, cgversion, ellipses |
|
2514 | 2514 | ): |
|
2515 | 2515 | """generates bundle2 for widening a narrow clone |
|
2516 | 2516 | |
|
2517 | 2517 | bundler is the bundle to which data should be added |
|
2518 | 2518 | repo is the localrepository instance |
|
2519 | 2519 | oldmatcher matches what the client already has |
|
2520 | 2520 | newmatcher matches what the client needs (including what it already has) |
|
2521 | 2521 | common is set of common heads between server and client |
|
2522 | 2522 | known is a set of revs known on the client side (used in ellipses) |
|
2523 | 2523 | cgversion is the changegroup version to send |
|
2524 | 2524 | ellipses is a boolean telling whether to send ellipses data or not
|
2525 | 2525 | |
|
2526 | 2526 | returns bundle2 of the data required for extending |
|
2527 | 2527 | """ |
|
2528 | 2528 | commonnodes = set() |
|
2529 | 2529 | cl = repo.changelog |
|
2530 | 2530 | for r in repo.revs(b"::%ln", common): |
|
2531 | 2531 | commonnodes.add(cl.node(r)) |
|
2532 | 2532 | if commonnodes: |
|
2533 | 2533 | # XXX: we should only send the filelogs (and treemanifest). user |
|
2534 | 2534 | # already has the changelog and manifest |
|
2535 | 2535 | packer = changegroup.getbundler( |
|
2536 | 2536 | cgversion, |
|
2537 | 2537 | repo, |
|
2538 | 2538 | oldmatcher=oldmatcher, |
|
2539 | 2539 | matcher=newmatcher, |
|
2540 | 2540 | fullnodes=commonnodes, |
|
2541 | 2541 | ) |
|
2542 | 2542 | cgdata = packer.generate( |
|
2543 | 2543 | {nodemod.nullid}, |
|
2544 | 2544 | list(commonnodes), |
|
2545 | 2545 | False, |
|
2546 | 2546 | b'narrow_widen', |
|
2547 | 2547 | changelog=False, |
|
2548 | 2548 | ) |
|
2549 | 2549 | |
|
2550 | 2550 | part = bundler.newpart(b'changegroup', data=cgdata) |
|
2551 | 2551 | part.addparam(b'version', cgversion) |
|
2552 | 2552 | if b'treemanifest' in repo.requirements: |
|
2553 | 2553 | part.addparam(b'treemanifest', b'1') |
|
2554 | 2554 | |
|
2555 | 2555 | return bundler |
@@ -1,670 +1,670 b'' | |||
|
1 | 1 | # bundlerepo.py - repository class for viewing uncompressed bundles |
|
2 | 2 | # |
|
3 | 3 | # Copyright 2006, 2007 Benoit Boissinot <bboissin@gmail.com> |
|
4 | 4 | # |
|
5 | 5 | # This software may be used and distributed according to the terms of the |
|
6 | 6 | # GNU General Public License version 2 or any later version. |
|
7 | 7 | |
|
8 | 8 | """Repository class for viewing uncompressed bundles. |
|
9 | 9 | |
|
10 | 10 | This provides a read-only repository interface to bundles as if they |
|
11 | 11 | were part of the actual repository. |
|
12 | 12 | """ |
|
13 | 13 | |
|
14 | 14 | from __future__ import absolute_import |
|
15 | 15 | |
|
16 | 16 | import os |
|
17 | 17 | import shutil |
|
18 | 18 | |
|
19 | 19 | from .i18n import _ |
|
20 | 20 | from .node import nullid, nullrev |
|
21 | 21 | |
|
22 | 22 | from . import ( |
|
23 | 23 | bundle2, |
|
24 | 24 | changegroup, |
|
25 | 25 | changelog, |
|
26 | 26 | cmdutil, |
|
27 | 27 | discovery, |
|
28 | 28 | encoding, |
|
29 | 29 | error, |
|
30 | 30 | exchange, |
|
31 | 31 | filelog, |
|
32 | 32 | localrepo, |
|
33 | 33 | manifest, |
|
34 | 34 | mdiff, |
|
35 | 35 | node as nodemod, |
|
36 | 36 | pathutil, |
|
37 | 37 | phases, |
|
38 | 38 | pycompat, |
|
39 | 39 | revlog, |
|
40 | 40 | util, |
|
41 | 41 | vfs as vfsmod, |
|
42 | 42 | ) |
|
43 | 43 | |
|
44 | 44 | |
|
45 | 45 | class bundlerevlog(revlog.revlog): |
|
46 | 46 | def __init__(self, opener, indexfile, cgunpacker, linkmapper): |
|
47 | 47 | # How it works: |
|
48 | 48 | # To retrieve a revision, we need to know the offset of the revision in |
|
49 | 49 | # the bundle (an unbundle object). We store this offset in the index |
|
50 | 50 | # (start). The base of the delta is stored in the base field. |
|
51 | 51 | # |
|
52 | 52 | # To differentiate a rev in the bundle from a rev in the revlog, we |
|
53 | 53 | # check revision against repotiprev. |
|
54 | 54 | opener = vfsmod.readonlyvfs(opener) |
|
55 | 55 | revlog.revlog.__init__(self, opener, indexfile) |
|
56 | 56 | self.bundle = cgunpacker |
|
57 | 57 | n = len(self) |
|
58 | 58 | self.repotiprev = n - 1 |
|
59 | 59 | self.bundlerevs = set() # used by 'bundle()' revset expression |
|
60 | 60 | for deltadata in cgunpacker.deltaiter(): |
|
61 | 61 | node, p1, p2, cs, deltabase, delta, flags = deltadata |
|
62 | 62 | |
|
63 | 63 | size = len(delta) |
|
64 | 64 | start = cgunpacker.tell() - size |
|
65 | 65 | |
|
66 | 66 | link = linkmapper(cs) |
|
67 | 67 | if node in self.nodemap: |
|
68 | 68 | # this can happen if two branches make the same change |
|
69 | 69 | self.bundlerevs.add(self.nodemap[node]) |
|
70 | 70 | continue |
|
71 | 71 | |
|
72 | 72 | for p in (p1, p2): |
|
73 | 73 | if p not in self.nodemap: |
|
74 | 74 | raise error.LookupError( |
|
75 | 75 | p, self.indexfile, _(b"unknown parent") |
|
76 | 76 | ) |
|
77 | 77 | |
|
78 | 78 | if deltabase not in self.nodemap: |
|
79 | 79 | raise LookupError( |
|
80 | 80 | deltabase, self.indexfile, _(b'unknown delta base') |
|
81 | 81 | ) |
|
82 | 82 | |
|
83 | 83 | baserev = self.rev(deltabase) |
|
84 | 84 | # start, size, full unc. size, base (unused), link, p1, p2, node |
|
85 | 85 | e = ( |
|
86 | 86 | revlog.offset_type(start, flags), |
|
87 | 87 | size, |
|
88 | 88 | -1, |
|
89 | 89 | baserev, |
|
90 | 90 | link, |
|
91 | 91 | self.rev(p1), |
|
92 | 92 | self.rev(p2), |
|
93 | 93 | node, |
|
94 | 94 | ) |
|
95 | 95 | self.index.append(e) |
|
96 | 96 | self.nodemap[node] = n |
|
97 | 97 | self.bundlerevs.add(n) |
|
98 | 98 | n += 1 |
|
99 | 99 | |
|
100 | 100 | def _chunk(self, rev, df=None): |
|
101 | 101 | # Warning: in case of bundle, the diff is against what we stored as |
|
102 | 102 | # delta base, not against rev - 1 |
|
103 | 103 | # XXX: could use some caching |
|
104 | 104 | if rev <= self.repotiprev: |
|
105 | 105 | return revlog.revlog._chunk(self, rev) |
|
106 | 106 | self.bundle.seek(self.start(rev)) |
|
107 | 107 | return self.bundle.read(self.length(rev)) |
|
108 | 108 | |
|
109 | 109 | def revdiff(self, rev1, rev2): |
|
110 | 110 | """return or calculate a delta between two revisions""" |
|
111 | 111 | if rev1 > self.repotiprev and rev2 > self.repotiprev: |
|
112 | 112 | # hot path for bundle |
|
113 | 113 | revb = self.index[rev2][3] |
|
114 | 114 | if revb == rev1: |
|
115 | 115 | return self._chunk(rev2) |
|
116 | 116 | elif rev1 <= self.repotiprev and rev2 <= self.repotiprev: |
|
117 | 117 | return revlog.revlog.revdiff(self, rev1, rev2) |
|
118 | 118 | |
|
119 | 119 | return mdiff.textdiff(self.rawdata(rev1), self.rawdata(rev2)) |
|
120 | 120 | |
|
121 | 121 | def _rawtext(self, node, rev, _df=None): |
|
122 | 122 | if rev is None: |
|
123 | 123 | rev = self.rev(node) |
|
124 | 124 | validated = False |
|
125 | 125 | rawtext = None |
|
126 | 126 | chain = [] |
|
127 | 127 | iterrev = rev |
|
128 | 128 | # reconstruct the revision if it is from a changegroup |
|
129 | 129 | while iterrev > self.repotiprev: |
|
130 | 130 | if self._revisioncache and self._revisioncache[1] == iterrev: |
|
131 | 131 | rawtext = self._revisioncache[2] |
|
132 | 132 | break |
|
133 | 133 | chain.append(iterrev) |
|
134 | 134 | iterrev = self.index[iterrev][3] |
|
135 | 135 | if iterrev == nullrev: |
|
136 | 136 | rawtext = b'' |
|
137 | 137 | elif rawtext is None: |
|
138 | 138 | r = super(bundlerevlog, self)._rawtext( |
|
139 | 139 | self.node(iterrev), iterrev, _df=_df |
|
140 | 140 | ) |
|
141 | 141 | __, rawtext, validated = r |
|
142 | 142 | if chain: |
|
143 | 143 | validated = False |
|
144 | 144 | while chain: |
|
145 | 145 | delta = self._chunk(chain.pop()) |
|
146 | 146 | rawtext = mdiff.patches(rawtext, [delta]) |
|
147 | 147 | return rev, rawtext, validated |
|
148 | 148 | |
|
149 | 149 | def addrevision(self, *args, **kwargs): |
|
150 | 150 | raise NotImplementedError |
|
151 | 151 | |
|
152 | 152 | def addgroup(self, *args, **kwargs): |
|
153 | 153 | raise NotImplementedError |
|
154 | 154 | |
|
155 | 155 | def strip(self, *args, **kwargs): |
|
156 | 156 | raise NotImplementedError |
|
157 | 157 | |
|
158 | 158 | def checksize(self): |
|
159 | 159 | raise NotImplementedError |
|
160 | 160 | |
|
161 | 161 | |
|
162 | 162 | class bundlechangelog(bundlerevlog, changelog.changelog): |
|
163 | 163 | def __init__(self, opener, cgunpacker): |
|
164 | 164 | changelog.changelog.__init__(self, opener) |
|
165 | 165 | linkmapper = lambda x: x |
|
166 | 166 | bundlerevlog.__init__( |
|
167 | 167 | self, opener, self.indexfile, cgunpacker, linkmapper |
|
168 | 168 | ) |
|
169 | 169 | |
|
170 | 170 | |
|
171 | 171 | class bundlemanifest(bundlerevlog, manifest.manifestrevlog): |
|
172 | 172 | def __init__( |
|
173 | 173 | self, opener, cgunpacker, linkmapper, dirlogstarts=None, dir=b'' |
|
174 | 174 | ): |
|
175 | 175 | manifest.manifestrevlog.__init__(self, opener, tree=dir) |
|
176 | 176 | bundlerevlog.__init__( |
|
177 | 177 | self, opener, self.indexfile, cgunpacker, linkmapper |
|
178 | 178 | ) |
|
179 | 179 | if dirlogstarts is None: |
|
180 | 180 | dirlogstarts = {} |
|
181 | 181 | if self.bundle.version == b"03": |
|
182 | 182 | dirlogstarts = _getfilestarts(self.bundle) |
|
183 | 183 | self._dirlogstarts = dirlogstarts |
|
184 | 184 | self._linkmapper = linkmapper |
|
185 | 185 | |
|
186 | 186 | def dirlog(self, d): |
|
187 | 187 | if d in self._dirlogstarts: |
|
188 | 188 | self.bundle.seek(self._dirlogstarts[d]) |
|
189 | 189 | return bundlemanifest( |
|
190 | 190 | self.opener, |
|
191 | 191 | self.bundle, |
|
192 | 192 | self._linkmapper, |
|
193 | 193 | self._dirlogstarts, |
|
194 | 194 | dir=d, |
|
195 | 195 | ) |
|
196 | 196 | return super(bundlemanifest, self).dirlog(d) |
|
197 | 197 | |
|
198 | 198 | |
|
199 | 199 | class bundlefilelog(filelog.filelog): |
|
200 | 200 | def __init__(self, opener, path, cgunpacker, linkmapper): |
|
201 | 201 | filelog.filelog.__init__(self, opener, path) |
|
202 | 202 | self._revlog = bundlerevlog( |
|
203 | 203 | opener, self.indexfile, cgunpacker, linkmapper |
|
204 | 204 | ) |
|
205 | 205 | |
|
206 | 206 | |
|
207 | 207 | class bundlepeer(localrepo.localpeer): |
|
208 | 208 | def canpush(self): |
|
209 | 209 | return False |
|
210 | 210 | |
|
211 | 211 | |
|
212 | 212 | class bundlephasecache(phases.phasecache): |
|
213 | 213 | def __init__(self, *args, **kwargs): |
|
214 | 214 | super(bundlephasecache, self).__init__(*args, **kwargs) |
|
215 |     | if util.safehasattr(self,

    | 215 | if util.safehasattr(self, 'opener'):
|
216 | 216 | self.opener = vfsmod.readonlyvfs(self.opener) |
|
217 | 217 | |
|
218 | 218 | def write(self): |
|
219 | 219 | raise NotImplementedError |
|
220 | 220 | |
|
221 | 221 | def _write(self, fp): |
|
222 | 222 | raise NotImplementedError |
|
223 | 223 | |
|
224 | 224 | def _updateroots(self, phase, newroots, tr): |
|
225 | 225 | self.phaseroots[phase] = newroots |
|
226 | 226 | self.invalidate() |
|
227 | 227 | self.dirty = True |
|
228 | 228 | |
|
229 | 229 | |
|
230 | 230 | def _getfilestarts(cgunpacker): |
|
231 | 231 | filespos = {} |
|
232 | 232 | for chunkdata in iter(cgunpacker.filelogheader, {}): |
|
233 | 233 | fname = chunkdata[b'filename'] |
|
234 | 234 | filespos[fname] = cgunpacker.tell() |
|
235 | 235 | for chunk in iter(lambda: cgunpacker.deltachunk(None), {}): |
|
236 | 236 | pass |
|
237 | 237 | return filespos |
|
238 | 238 | |
|
239 | 239 | |
|
240 | 240 | class bundlerepository(object): |
|
241 | 241 | """A repository instance that is a union of a local repo and a bundle. |
|
242 | 242 | |
|
243 | 243 | Instances represent a read-only repository composed of a local repository |
|
244 | 244 | with the contents of a bundle file applied. The repository instance is |
|
245 | 245 | conceptually similar to the state of a repository after an |
|
246 | 246 | ``hg unbundle`` operation. However, the contents of the bundle are never |
|
247 | 247 | applied to the actual base repository. |
|
248 | 248 | |
|
249 | 249 | Instances constructed directly are not usable as repository objects. |
|
250 | 250 | Use instance() or makebundlerepository() to create instances. |
|
251 | 251 | """ |
|
252 | 252 | |
|
253 | 253 | def __init__(self, bundlepath, url, tempparent): |
|
254 | 254 | self._tempparent = tempparent |
|
255 | 255 | self._url = url |
|
256 | 256 | |
|
257 | 257 | self.ui.setconfig(b'phases', b'publish', False, b'bundlerepo') |
|
258 | 258 | |
|
259 | 259 | self.tempfile = None |
|
260 | 260 | f = util.posixfile(bundlepath, b"rb") |
|
261 | 261 | bundle = exchange.readbundle(self.ui, f, bundlepath) |
|
262 | 262 | |
|
263 | 263 | if isinstance(bundle, bundle2.unbundle20): |
|
264 | 264 | self._bundlefile = bundle |
|
265 | 265 | self._cgunpacker = None |
|
266 | 266 | |
|
267 | 267 | cgpart = None |
|
268 | 268 | for part in bundle.iterparts(seekable=True): |
|
269 | 269 | if part.type == b'changegroup': |
|
270 | 270 | if cgpart: |
|
271 | 271 | raise NotImplementedError( |
|
272 | 272 | b"can't process " b"multiple changegroups" |
|
273 | 273 | ) |
|
274 | 274 | cgpart = part |
|
275 | 275 | |
|
276 | 276 | self._handlebundle2part(bundle, part) |
|
277 | 277 | |
|
278 | 278 | if not cgpart: |
|
279 | 279 | raise error.Abort(_(b"No changegroups found")) |
|
280 | 280 | |
|
281 | 281 | # This is required to placate a later consumer, which expects |
|
282 | 282 | # the payload offset to be at the beginning of the changegroup. |
|
283 | 283 | # We need to do this after the iterparts() generator advances |
|
284 | 284 | # because iterparts() will seek to end of payload after the |
|
285 | 285 | # generator returns control to iterparts(). |
|
286 | 286 | cgpart.seek(0, os.SEEK_SET) |
|
287 | 287 | |
|
288 | 288 | elif isinstance(bundle, changegroup.cg1unpacker): |
|
289 | 289 | if bundle.compressed(): |
|
290 | 290 | f = self._writetempbundle( |
|
291 | 291 | bundle.read, b'.hg10un', header=b'HG10UN' |
|
292 | 292 | ) |
|
293 | 293 | bundle = exchange.readbundle(self.ui, f, bundlepath, self.vfs) |
|
294 | 294 | |
|
295 | 295 | self._bundlefile = bundle |
|
296 | 296 | self._cgunpacker = bundle |
|
297 | 297 | else: |
|
298 | 298 | raise error.Abort( |
|
299 | 299 | _(b'bundle type %s cannot be read') % type(bundle) |
|
300 | 300 | ) |
|
301 | 301 | |
|
302 | 302 | # dict with the mapping 'filename' -> position in the changegroup. |
|
303 | 303 | self._cgfilespos = {} |
|
304 | 304 | |
|
305 | 305 | self.firstnewrev = self.changelog.repotiprev + 1 |
|
306 | 306 | phases.retractboundary( |
|
307 | 307 | self, |
|
308 | 308 | None, |
|
309 | 309 | phases.draft, |
|
310 | 310 | [ctx.node() for ctx in self[self.firstnewrev :]], |
|
311 | 311 | ) |
|
312 | 312 | |
|
313 | 313 | def _handlebundle2part(self, bundle, part): |
|
314 | 314 | if part.type != b'changegroup': |
|
315 | 315 | return |
|
316 | 316 | |
|
317 | 317 | cgstream = part |
|
318 | 318 | version = part.params.get(b'version', b'01') |
|
319 | 319 | legalcgvers = changegroup.supportedincomingversions(self) |
|
320 | 320 | if version not in legalcgvers: |
|
321 | 321 | msg = _(b'Unsupported changegroup version: %s') |
|
322 | 322 | raise error.Abort(msg % version) |
|
323 | 323 | if bundle.compressed(): |
|
324 | 324 | cgstream = self._writetempbundle(part.read, b'.cg%sun' % version) |
|
325 | 325 | |
|
326 | 326 | self._cgunpacker = changegroup.getunbundler(version, cgstream, b'UN') |
|
327 | 327 | |
|
328 | 328 | def _writetempbundle(self, readfn, suffix, header=b''): |
|
329 | 329 | """Write a temporary file to disk |
|
330 | 330 | """ |
|
331 | 331 | fdtemp, temp = self.vfs.mkstemp(prefix=b"hg-bundle-", suffix=suffix) |
|
332 | 332 | self.tempfile = temp |
|
333 | 333 | |
|
334 | 334 | with os.fdopen(fdtemp, r'wb') as fptemp: |
|
335 | 335 | fptemp.write(header) |
|
336 | 336 | while True: |
|
337 | 337 | chunk = readfn(2 ** 18) |
|
338 | 338 | if not chunk: |
|
339 | 339 | break |
|
340 | 340 | fptemp.write(chunk) |
|
341 | 341 | |
|
342 | 342 | return self.vfs.open(self.tempfile, mode=b"rb") |
|
343 | 343 | |
|
344 | 344 | @localrepo.unfilteredpropertycache |
|
345 | 345 | def _phasecache(self): |
|
346 | 346 | return bundlephasecache(self, self._phasedefaults) |
|
347 | 347 | |
|
348 | 348 | @localrepo.unfilteredpropertycache |
|
349 | 349 | def changelog(self): |
|
350 | 350 | # consume the header if it exists |
|
351 | 351 | self._cgunpacker.changelogheader() |
|
352 | 352 | c = bundlechangelog(self.svfs, self._cgunpacker) |
|
353 | 353 | self.manstart = self._cgunpacker.tell() |
|
354 | 354 | return c |
|
355 | 355 | |
|
356 | 356 | def _refreshchangelog(self): |
|
357 | 357 | # changelog for bundle repo are not filecache, this method is not |
|
358 | 358 | # applicable. |
|
359 | 359 | pass |
|
360 | 360 | |
|
361 | 361 | @localrepo.unfilteredpropertycache |
|
362 | 362 | def manifestlog(self): |
|
363 | 363 | self._cgunpacker.seek(self.manstart) |
|
364 | 364 | # consume the header if it exists |
|
365 | 365 | self._cgunpacker.manifestheader() |
|
366 | 366 | linkmapper = self.unfiltered().changelog.rev |
|
367 | 367 | rootstore = bundlemanifest(self.svfs, self._cgunpacker, linkmapper) |
|
368 | 368 | self.filestart = self._cgunpacker.tell() |
|
369 | 369 | |
|
370 | 370 | return manifest.manifestlog( |
|
371 | 371 | self.svfs, self, rootstore, self.narrowmatch() |
|
372 | 372 | ) |
|
373 | 373 | |
|
374 | 374 | def _consumemanifest(self): |
|
375 | 375 | """Consumes the manifest portion of the bundle, setting filestart so the |
|
376 | 376 | file portion can be read.""" |
|
377 | 377 | self._cgunpacker.seek(self.manstart) |
|
378 | 378 | self._cgunpacker.manifestheader() |
|
379 | 379 | for delta in self._cgunpacker.deltaiter(): |
|
380 | 380 | pass |
|
381 | 381 | self.filestart = self._cgunpacker.tell() |
|
382 | 382 | |
|
383 | 383 | @localrepo.unfilteredpropertycache |
|
384 | 384 | def manstart(self): |
|
385 | 385 | self.changelog |
|
386 | 386 | return self.manstart |
|
387 | 387 | |
|
388 | 388 | @localrepo.unfilteredpropertycache |
|
389 | 389 | def filestart(self): |
|
390 | 390 | self.manifestlog |
|
391 | 391 | |
|
392 | 392 | # If filestart was not set by self.manifestlog, that means the |
|
393 | 393 | # manifestlog implementation did not consume the manifests from the |
|
394 | 394 | # changegroup (ex: it might be consuming trees from a separate bundle2 |
|
395 | 395 | # part instead). So we need to manually consume it. |
|
396 | 396 | if r'filestart' not in self.__dict__: |
|
397 | 397 | self._consumemanifest() |
|
398 | 398 | |
|
399 | 399 | return self.filestart |
|
400 | 400 | |
|
401 | 401 | def url(self): |
|
402 | 402 | return self._url |
|
403 | 403 | |
|
404 | 404 | def file(self, f): |
|
405 | 405 | if not self._cgfilespos: |
|
406 | 406 | self._cgunpacker.seek(self.filestart) |
|
407 | 407 | self._cgfilespos = _getfilestarts(self._cgunpacker) |
|
408 | 408 | |
|
409 | 409 | if f in self._cgfilespos: |
|
410 | 410 | self._cgunpacker.seek(self._cgfilespos[f]) |
|
411 | 411 | linkmapper = self.unfiltered().changelog.rev |
|
412 | 412 | return bundlefilelog(self.svfs, f, self._cgunpacker, linkmapper) |
|
413 | 413 | else: |
|
414 | 414 | return super(bundlerepository, self).file(f) |
|
415 | 415 | |
|
416 | 416 | def close(self): |
|
417 | 417 | """Close assigned bundle file immediately.""" |
|
418 | 418 | self._bundlefile.close() |
|
419 | 419 | if self.tempfile is not None: |
|
420 | 420 | self.vfs.unlink(self.tempfile) |
|
421 | 421 | if self._tempparent: |
|
422 | 422 | shutil.rmtree(self._tempparent, True) |
|
423 | 423 | |
|
424 | 424 | def cancopy(self): |
|
425 | 425 | return False |
|
426 | 426 | |
|
427 | 427 | def peer(self): |
|
428 | 428 | return bundlepeer(self) |
|
429 | 429 | |
|
430 | 430 | def getcwd(self): |
|
431 | 431 | return encoding.getcwd() # always outside the repo |
|
432 | 432 | |
|
433 | 433 | # Check if parents exist in localrepo before setting |
|
434 | 434 | def setparents(self, p1, p2=nullid): |
|
435 | 435 | p1rev = self.changelog.rev(p1) |
|
436 | 436 | p2rev = self.changelog.rev(p2) |
|
437 | 437 | msg = _(b"setting parent to node %s that only exists in the bundle\n") |
|
438 | 438 | if self.changelog.repotiprev < p1rev: |
|
439 | 439 | self.ui.warn(msg % nodemod.hex(p1)) |
|
440 | 440 | if self.changelog.repotiprev < p2rev: |
|
441 | 441 | self.ui.warn(msg % nodemod.hex(p2)) |
|
442 | 442 | return super(bundlerepository, self).setparents(p1, p2) |
|
443 | 443 | |
|
444 | 444 | |
|
445 | 445 | def instance(ui, path, create, intents=None, createopts=None): |
|
446 | 446 | if create: |
|
447 | 447 | raise error.Abort(_(b'cannot create new bundle repository')) |
|
448 | 448 | # internal config: bundle.mainreporoot |
|
449 | 449 | parentpath = ui.config(b"bundle", b"mainreporoot") |
|
450 | 450 | if not parentpath: |
|
451 | 451 | # try to find the correct path to the working directory repo |
|
452 | 452 | parentpath = cmdutil.findrepo(encoding.getcwd()) |
|
453 | 453 | if parentpath is None: |
|
454 | 454 | parentpath = b'' |
|
455 | 455 | if parentpath: |
|
456 | 456 | # Try to make the full path relative so we get a nice, short URL. |
|
457 | 457 | # In particular, we don't want temp dir names in test outputs. |
|
458 | 458 | cwd = encoding.getcwd() |
|
459 | 459 | if parentpath == cwd: |
|
460 | 460 | parentpath = b'' |
|
461 | 461 | else: |
|
462 | 462 | cwd = pathutil.normasprefix(cwd) |
|
463 | 463 | if parentpath.startswith(cwd): |
|
464 | 464 | parentpath = parentpath[len(cwd) :] |
|
465 | 465 | u = util.url(path) |
|
466 | 466 | path = u.localpath() |
|
467 | 467 | if u.scheme == b'bundle': |
|
468 | 468 | s = path.split(b"+", 1) |
|
469 | 469 | if len(s) == 1: |
|
470 | 470 | repopath, bundlename = parentpath, s[0] |
|
471 | 471 | else: |
|
472 | 472 | repopath, bundlename = s |
|
473 | 473 | else: |
|
474 | 474 | repopath, bundlename = parentpath, path |
|
475 | 475 | |
|
476 | 476 | return makebundlerepository(ui, repopath, bundlename) |
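As a side note, the 'bundle:' URL handling above boils down to splitting an optional parent repo path from the bundle file on the first '+'. A standalone sketch of that convention (the helper name below is invented for illustration):

def splitbundlepath(path, parentpath=b''):
    # "repopath+bundlepath" carries both parts; a bare path means the parent
    # repo comes from elsewhere (config or the working directory search)
    parts = path.split(b"+", 1)
    if len(parts) == 1:
        return parentpath, parts[0]
    return parts[0], parts[1]

assert splitbundlepath(b'/repo+/tmp/foo.hg') == (b'/repo', b'/tmp/foo.hg')
assert splitbundlepath(b'/tmp/foo.hg', b'/repo') == (b'/repo', b'/tmp/foo.hg')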
|
477 | 477 | |
|
478 | 478 | |
|
479 | 479 | def makebundlerepository(ui, repopath, bundlepath): |
|
480 | 480 | """Make a bundle repository object based on repo and bundle paths.""" |
|
481 | 481 | if repopath: |
|
482 | 482 | url = b'bundle:%s+%s' % (util.expandpath(repopath), bundlepath) |
|
483 | 483 | else: |
|
484 | 484 | url = b'bundle:%s' % bundlepath |
|
485 | 485 | |
|
486 | 486 | # Because we can't make any guarantees about the type of the base |
|
487 | 487 | # repository, we can't have a static class representing the bundle |
|
488 | 488 | # repository. We also can't make any guarantees about how to even |
|
489 | 489 | # call the base repository's constructor! |
|
490 | 490 | # |
|
491 | 491 | # So, our strategy is to go through ``localrepo.instance()`` to construct |
|
492 | 492 | # a repo instance. Then, we dynamically create a new type derived from |
|
493 | 493 | # both it and our ``bundlerepository`` class which overrides some |
|
494 | 494 | # functionality. We then change the type of the constructed repository |
|
495 | 495 | # to this new type and initialize the bundle-specific bits of it. |
|
496 | 496 | |
|
497 | 497 | try: |
|
498 | 498 | repo = localrepo.instance(ui, repopath, create=False) |
|
499 | 499 | tempparent = None |
|
500 | 500 | except error.RepoError: |
|
501 | 501 | tempparent = pycompat.mkdtemp() |
|
502 | 502 | try: |
|
503 | 503 | repo = localrepo.instance(ui, tempparent, create=True) |
|
504 | 504 | except Exception: |
|
505 | 505 | shutil.rmtree(tempparent) |
|
506 | 506 | raise |
|
507 | 507 | |
|
508 | 508 | class derivedbundlerepository(bundlerepository, repo.__class__): |
|
509 | 509 | pass |
|
510 | 510 | |
|
511 | 511 | repo.__class__ = derivedbundlerepository |
|
512 | 512 | bundlerepository.__init__(repo, bundlepath, url, tempparent) |
|
513 | 513 | |
|
514 | 514 | return repo |
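The comment block above describes a dynamic-subclassing trick; here is a minimal standalone sketch of the same idea with invented names, independent of Mercurial's classes:

class bundlemixin(object):
    def isbundle(self):
        return True

def tobundlerepo(repo):
    # derive a throwaway type from the mixin and the instance's own class,
    # then retype the instance in place
    class derived(bundlemixin, repo.__class__):
        pass
    repo.__class__ = derived
    return repo

class fakelocalrepo(object):
    pass

r = tobundlerepo(fakelocalrepo())
assert isinstance(r, fakelocalrepo) and r.isbundle()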
|
515 | 515 | |
|
516 | 516 | |
|
517 | 517 | class bundletransactionmanager(object): |
|
518 | 518 | def transaction(self): |
|
519 | 519 | return None |
|
520 | 520 | |
|
521 | 521 | def close(self): |
|
522 | 522 | raise NotImplementedError |
|
523 | 523 | |
|
524 | 524 | def release(self): |
|
525 | 525 | raise NotImplementedError |
|
526 | 526 | |
|
527 | 527 | |
|
528 | 528 | def getremotechanges( |
|
529 | 529 | ui, repo, peer, onlyheads=None, bundlename=None, force=False |
|
530 | 530 | ): |
|
531 | 531 | '''obtains a bundle of changes incoming from peer |
|
532 | 532 | |
|
533 | 533 | "onlyheads" restricts the returned changes to those reachable from the |
|
534 | 534 | specified heads. |
|
535 | 535 | "bundlename", if given, stores the bundle to this file path permanently; |
|
536 | 536 | otherwise it's stored to a temp file and gets deleted again when you call |
|
537 | 537 | the returned "cleanupfn". |
|
538 | 538 | "force" indicates whether to proceed on unrelated repos. |
|
539 | 539 | |
|
540 | 540 | Returns a tuple (local, csets, cleanupfn): |
|
541 | 541 | |
|
542 | 542 | "local" is a local repo from which to obtain the actual incoming |
|
543 | 543 | changesets; it is a bundlerepo for the obtained bundle when the |
|
544 | 544 | original "peer" is remote. |
|
545 | 545 | "csets" lists the incoming changeset node ids. |
|
546 | 546 | "cleanupfn" must be called without arguments when you're done processing |
|
547 | 547 | the changes; it closes both the original "peer" and the one returned |
|
548 | 548 | here. |
|
549 | 549 | ''' |
|
550 | 550 | tmp = discovery.findcommonincoming(repo, peer, heads=onlyheads, force=force) |
|
551 | 551 | common, incoming, rheads = tmp |
|
552 | 552 | if not incoming: |
|
553 | 553 | try: |
|
554 | 554 | if bundlename: |
|
555 | 555 | os.unlink(bundlename) |
|
556 | 556 | except OSError: |
|
557 | 557 | pass |
|
558 | 558 | return repo, [], peer.close |
|
559 | 559 | |
|
560 | 560 | commonset = set(common) |
|
561 | 561 | rheads = [x for x in rheads if x not in commonset] |
|
562 | 562 | |
|
563 | 563 | bundle = None |
|
564 | 564 | bundlerepo = None |
|
565 | 565 | localrepo = peer.local() |
|
566 | 566 | if bundlename or not localrepo: |
|
567 | 567 | # create a bundle (uncompressed if peer repo is not local) |
|
568 | 568 | |
|
569 | 569 | # developer config: devel.legacy.exchange |
|
570 | 570 | legexc = ui.configlist(b'devel', b'legacy.exchange') |
|
571 | 571 | forcebundle1 = b'bundle2' not in legexc and b'bundle1' in legexc |
|
572 | 572 | canbundle2 = ( |
|
573 | 573 | not forcebundle1 |
|
574 | 574 | and peer.capable(b'getbundle') |
|
575 | 575 | and peer.capable(b'bundle2') |
|
576 | 576 | ) |
|
577 | 577 | if canbundle2: |
|
578 | 578 | with peer.commandexecutor() as e: |
|
579 | 579 | b2 = e.callcommand( |
|
580 | 580 | b'getbundle', |
|
581 | 581 | { |
|
582 | 582 | b'source': b'incoming', |
|
583 | 583 | b'common': common, |
|
584 | 584 | b'heads': rheads, |
|
585 | 585 | b'bundlecaps': exchange.caps20to10( |
|
586 | 586 | repo, role=b'client' |
|
587 | 587 | ), |
|
588 | 588 | b'cg': True, |
|
589 | 589 | }, |
|
590 | 590 | ).result() |
|
591 | 591 | |
|
592 | 592 | fname = bundle = changegroup.writechunks( |
|
593 | 593 | ui, b2._forwardchunks(), bundlename |
|
594 | 594 | ) |
|
595 | 595 | else: |
|
596 | 596 | if peer.capable(b'getbundle'): |
|
597 | 597 | with peer.commandexecutor() as e: |
|
598 | 598 | cg = e.callcommand( |
|
599 | 599 | b'getbundle', |
|
600 | 600 | { |
|
601 | 601 | b'source': b'incoming', |
|
602 | 602 | b'common': common, |
|
603 | 603 | b'heads': rheads, |
|
604 | 604 | }, |
|
605 | 605 | ).result() |
|
606 | 606 | elif onlyheads is None and not peer.capable(b'changegroupsubset'): |
|
607 | 607 | # compat with older servers when pulling all remote heads |
|
608 | 608 | |
|
609 | 609 | with peer.commandexecutor() as e: |
|
610 | 610 | cg = e.callcommand( |
|
611 | 611 | b'changegroup', |
|
612 | 612 | {b'nodes': incoming, b'source': b'incoming',}, |
|
613 | 613 | ).result() |
|
614 | 614 | |
|
615 | 615 | rheads = None |
|
616 | 616 | else: |
|
617 | 617 | with peer.commandexecutor() as e: |
|
618 | 618 | cg = e.callcommand( |
|
619 | 619 | b'changegroupsubset', |
|
620 | 620 | { |
|
621 | 621 | b'bases': incoming, |
|
622 | 622 | b'heads': rheads, |
|
623 | 623 | b'source': b'incoming', |
|
624 | 624 | }, |
|
625 | 625 | ).result() |
|
626 | 626 | |
|
627 | 627 | if localrepo: |
|
628 | 628 | bundletype = b"HG10BZ" |
|
629 | 629 | else: |
|
630 | 630 | bundletype = b"HG10UN" |
|
631 | 631 | fname = bundle = bundle2.writebundle(ui, cg, bundlename, bundletype) |
|
632 | 632 | # keep written bundle? |
|
633 | 633 | if bundlename: |
|
634 | 634 | bundle = None |
|
635 | 635 | if not localrepo: |
|
636 | 636 | # use the created uncompressed bundlerepo |
|
637 | 637 | localrepo = bundlerepo = makebundlerepository( |
|
638 | 638 | repo.baseui, repo.root, fname |
|
639 | 639 | ) |
|
640 | 640 | |
|
641 | 641 | # this repo contains local and peer now, so filter out local again |
|
642 | 642 | common = repo.heads() |
|
643 | 643 | if localrepo: |
|
644 | 644 | # Part of common may be remotely filtered |
|
645 | 645 | # So use an unfiltered version |
|
646 | 646 | # The discovery process probably needs cleanup to avoid that
|
647 | 647 | localrepo = localrepo.unfiltered() |
|
648 | 648 | |
|
649 | 649 | csets = localrepo.changelog.findmissing(common, rheads) |
|
650 | 650 | |
|
651 | 651 | if bundlerepo: |
|
652 | 652 | reponodes = [ctx.node() for ctx in bundlerepo[bundlerepo.firstnewrev :]] |
|
653 | 653 | |
|
654 | 654 | with peer.commandexecutor() as e: |
|
655 | 655 | remotephases = e.callcommand( |
|
656 | 656 | b'listkeys', {b'namespace': b'phases',} |
|
657 | 657 | ).result() |
|
658 | 658 | |
|
659 | 659 | pullop = exchange.pulloperation(bundlerepo, peer, heads=reponodes) |
|
660 | 660 | pullop.trmanager = bundletransactionmanager() |
|
661 | 661 | exchange._pullapplyphases(pullop, remotephases) |
|
662 | 662 | |
|
663 | 663 | def cleanup(): |
|
664 | 664 | if bundlerepo: |
|
665 | 665 | bundlerepo.close() |
|
666 | 666 | if bundle: |
|
667 | 667 | os.unlink(bundle) |
|
668 | 668 | peer.close() |
|
669 | 669 | |
|
670 | 670 | return (localrepo, csets, cleanup) |
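For orientation, a hedged sketch of how a caller might consume the (local, csets, cleanupfn) triple documented above; ui, repo and peer are assumed to come from the usual Mercurial APIs:

def printincoming(ui, repo, peer):
    # 'other' is the repo to read the incoming changesets from (a bundlerepo
    # when the peer is remote); cleanupfn must always be called afterwards
    other, csets, cleanupfn = getremotechanges(ui, repo, peer)
    try:
        for n in csets:
            ui.write(b'%s\n' % other[n].hex())
    finally:
        cleanupfn()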
@@ -1,227 +1,227 b'' | |||
|
1 | 1 | # pvec.py - probabilistic vector clocks for Mercurial |
|
2 | 2 | # |
|
3 | 3 | # Copyright 2012 Matt Mackall <mpm@selenic.com> |
|
4 | 4 | # |
|
5 | 5 | # This software may be used and distributed according to the terms of the |
|
6 | 6 | # GNU General Public License version 2 or any later version. |
|
7 | 7 | |
|
8 | 8 | ''' |
|
9 | 9 | A "pvec" is a changeset property based on the theory of vector clocks |
|
10 | 10 | that can be compared to discover relatedness without consulting a |
|
11 | 11 | graph. This can be useful for tasks like determining how a |
|
12 | 12 | disconnected patch relates to a repository. |
|
13 | 13 | |
|
14 | 14 | Currently a pvec consists of 448 bits, of which 24 are 'depth' and the
|
15 | 15 | remainder are a bit vector. It is represented as a 70-character base85 |
|
16 | 16 | string. |
|
17 | 17 | |
|
18 | 18 | Construction: |
|
19 | 19 | |
|
20 | 20 | - a root changeset has a depth of 0 and a bit vector based on its hash |
|
21 | 21 | - a normal commit has a pvec where depth is increased by one and
|
22 | 22 | one bit vector bit is flipped based on its hash
|
23 | 23 | - a merge changeset pvec is constructed by copying changes from one pvec into |
|
24 | 24 | the other to balance its depth |
|
25 | 25 | |
|
26 | 26 | Properties: |
|
27 | 27 | |
|
28 | 28 | - for linear changes, difference in depth is always <= hamming distance |
|
29 | 29 | - otherwise, changes are probably divergent |
|
30 | 30 | - when hamming distance is < 200, we can reliably detect when pvecs are near |
|
31 | 31 | |
|
32 | 32 | Issues: |
|
33 | 33 | |
|
34 | 34 | - hamming distance ceases to work over distances of ~ 200 |
|
35 | 35 | - detecting divergence is less accurate when the common ancestor is very close |
|
36 | 36 | to either revision or total distance is high |
|
37 | 37 | - this could probably be improved by modeling the relation between |
|
38 | 38 | delta and hdist |
|
39 | 39 | |
|
40 | 40 | Uses: |
|
41 | 41 | |
|
42 | 42 | - a patch pvec can be used to locate the nearest available common ancestor for |
|
43 | 43 | resolving conflicts |
|
44 | 44 | - ordering of patches can be established without a DAG |
|
45 | 45 | - two head pvecs can be compared to determine whether push/pull/merge is needed |
|
46 | 46 | and approximately how many changesets are involved |
|
47 | 47 | - can be used to find a heuristic divergence measure between changesets on |
|
48 | 48 | different branches |
|
49 | 49 | ''' |
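As an aside, the ordering rule implied by the properties above (depth delta versus hamming distance) can be illustrated with a tiny standalone sketch; the helpers are illustrative, not this module's API:

def hamming(x, y):
    return bin(x ^ y).count('1')

def canprecede(a, b):
    # a, b are (depth, bitvec) pairs; 'a' can linearly precede 'b' only if
    # the number of differing bits does not exceed the depth difference
    delta = b[0] - a[0]
    return delta >= 0 and hamming(a[1], b[1]) <= delta

root = (0, 0b1011)
child = (1, 0b1010)    # depth +1, one bit flipped: still ordered
cousin = (1, 0b0111)   # two bits differ but depth delta is 1: divergent
assert canprecede(root, child)
assert not canprecede(root, cousin)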
|
50 | 50 | |
|
51 | 51 | from __future__ import absolute_import |
|
52 | 52 | |
|
53 | 53 | from .node import nullrev |
|
54 | 54 | from . import ( |
|
55 | 55 | pycompat, |
|
56 | 56 | util, |
|
57 | 57 | ) |
|
58 | 58 | |
|
59 | 59 | _size = 448 # 70 chars b85-encoded |
|
60 | 60 | _bytes = _size / 8 |
|
61 | 61 | _depthbits = 24 |
|
62 | 62 | _depthbytes = _depthbits / 8 |
|
63 | 63 | _vecbytes = _bytes - _depthbytes |
|
64 | 64 | _vecbits = _vecbytes * 8 |
|
65 | 65 | _radius = (_vecbits - 30) / 2 # high probability vectors are related |
|
66 | 66 | |
|
67 | 67 | |
|
68 | 68 | def _bin(bs): |
|
69 | 69 | '''convert a bytestring to a long''' |
|
70 | 70 | v = 0 |
|
71 | 71 | for b in bs: |
|
72 | 72 | v = v * 256 + ord(b) |
|
73 | 73 | return v |
|
74 | 74 | |
|
75 | 75 | |
|
76 | 76 | def _str(v, l): |
|
77 | 77 | bs = b"" |
|
78 | 78 | for p in pycompat.xrange(l): |
|
79 | 79 | bs = chr(v & 255) + bs |
|
80 | 80 | v >>= 8 |
|
81 | 81 | return bs |
|
82 | 82 | |
|
83 | 83 | |
|
84 | 84 | def _split(b): |
|
85 | 85 | '''depth and bitvec''' |
|
86 | 86 | return _bin(b[:_depthbytes]), _bin(b[_depthbytes:]) |
|
87 | 87 | |
|
88 | 88 | |
|
89 | 89 | def _join(depth, bitvec): |
|
90 | 90 | return _str(depth, _depthbytes) + _str(bitvec, _vecbytes) |
|
91 | 91 | |
|
92 | 92 | |
|
93 | 93 | def _hweight(x): |
|
94 | 94 | c = 0 |
|
95 | 95 | while x: |
|
96 | 96 | if x & 1: |
|
97 | 97 | c += 1 |
|
98 | 98 | x >>= 1 |
|
99 | 99 | return c |
|
100 | 100 | |
|
101 | 101 | |
|
102 | 102 | _htab = [_hweight(x) for x in pycompat.xrange(256)] |
|
103 | 103 | |
|
104 | 104 | |
|
105 | 105 | def _hamming(a, b): |
|
106 | 106 | '''find the hamming distance between two longs''' |
|
107 | 107 | d = a ^ b |
|
108 | 108 | c = 0 |
|
109 | 109 | while d: |
|
110 | 110 | c += _htab[d & 0xFF] |
|
111 | 111 | d >>= 8 |
|
112 | 112 | return c |
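A quick standalone check (illustrative only) that the byte-table lookup used by _hamming() agrees with a naive popcount of the xor:

htab = [bin(i).count('1') for i in range(256)]

def tablehamming(a, b):
    # add up per-byte popcounts of the xor, exactly as _hamming() does
    d, c = a ^ b, 0
    while d:
        c += htab[d & 0xFF]
        d >>= 8
    return c

assert tablehamming(0b101101, 0b100110) == bin(0b101101 ^ 0b100110).count('1') == 3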
|
113 | 113 | |
|
114 | 114 | |
|
115 | 115 | def _mergevec(x, y, c): |
|
116 | 116 | # Ideally, this function would be x ^ y ^ ancestor, but finding |
|
117 | 117 | # ancestors is a nuisance. So instead we find the minimal number |
|
118 | 118 | # of changes to balance the depth and hamming distance |
|
119 | 119 | |
|
120 | 120 | d1, v1 = x |
|
121 | 121 | d2, v2 = y |
|
122 | 122 | if d1 < d2: |
|
123 | 123 | d1, d2, v1, v2 = d2, d1, v2, v1 |
|
124 | 124 | |
|
125 | 125 | hdist = _hamming(v1, v2) |
|
126 | 126 | ddist = d1 - d2 |
|
127 | 127 | v = v1 |
|
128 | 128 | m = v1 ^ v2 # mask of different bits |
|
129 | 129 | i = 1 |
|
130 | 130 | |
|
131 | 131 | if hdist > ddist: |
|
132 | 132 | # if delta = 10 and hdist = 100, then we need to go up 55 steps |
|
133 | 133 | # to the ancestor and down 45 |
|
134 | 134 | changes = (hdist - ddist + 1) / 2 |
|
135 | 135 | else: |
|
136 | 136 | # must make at least one change |
|
137 | 137 | changes = 1 |
|
138 | 138 | depth = d1 + changes |
|
139 | 139 | |
|
140 | 140 | # copy changes from v2 |
|
141 | 141 | if m: |
|
142 | 142 | while changes: |
|
143 | 143 | if m & i: |
|
144 | 144 | v ^= i |
|
145 | 145 | changes -= 1 |
|
146 | 146 | i <<= 1 |
|
147 | 147 | else: |
|
148 | 148 | v = _flipbit(v, c) |
|
149 | 149 | |
|
150 | 150 | return depth, v |
|
151 | 151 | |
|
152 | 152 | |
|
153 | 153 | def _flipbit(v, node): |
|
154 | 154 | # converting bit strings to longs is slow |
|
155 | 155 | bit = (hash(node) & 0xFFFFFFFF) % _vecbits |
|
156 | 156 | return v ^ (1 << bit) |
|
157 | 157 | |
|
158 | 158 | |
|
159 | 159 | def ctxpvec(ctx): |
|
160 | 160 | '''construct a pvec for ctx while filling in the cache''' |
|
161 | 161 | r = ctx.repo() |
|
162 | if not util.safehasattr(r,
|
162 | if not util.safehasattr(r, "_pveccache"):
|
163 | 163 | r._pveccache = {} |
|
164 | 164 | pvc = r._pveccache |
|
165 | 165 | if ctx.rev() not in pvc: |
|
166 | 166 | cl = r.changelog |
|
167 | 167 | for n in pycompat.xrange(ctx.rev() + 1): |
|
168 | 168 | if n not in pvc: |
|
169 | 169 | node = cl.node(n) |
|
170 | 170 | p1, p2 = cl.parentrevs(n) |
|
171 | 171 | if p1 == nullrev: |
|
172 | 172 | # start with a 'random' vector at root |
|
173 | 173 | pvc[n] = (0, _bin((node * 3)[:_vecbytes])) |
|
174 | 174 | elif p2 == nullrev: |
|
175 | 175 | d, v = pvc[p1] |
|
176 | 176 | pvc[n] = (d + 1, _flipbit(v, node)) |
|
177 | 177 | else: |
|
178 | 178 | pvc[n] = _mergevec(pvc[p1], pvc[p2], node) |
|
179 | 179 | bs = _join(*pvc[ctx.rev()]) |
|
180 | 180 | return pvec(util.b85encode(bs)) |
|
181 | 181 | |
|
182 | 182 | |
|
183 | 183 | class pvec(object): |
|
184 | 184 | def __init__(self, hashorctx): |
|
185 | 185 | if isinstance(hashorctx, str): |
|
186 | 186 | self._bs = hashorctx |
|
187 | 187 | self._depth, self._vec = _split(util.b85decode(hashorctx)) |
|
188 | 188 | else: |
|
189 | 189 | self._vec = ctxpvec(hashorctx) |
|
190 | 190 | |
|
191 | 191 | def __str__(self): |
|
192 | 192 | return self._bs |
|
193 | 193 | |
|
194 | 194 | def __eq__(self, b): |
|
195 | 195 | return self._vec == b._vec and self._depth == b._depth |
|
196 | 196 | |
|
197 | 197 | def __lt__(self, b): |
|
198 | 198 | delta = b._depth - self._depth |
|
199 | 199 | if delta < 0: |
|
200 | 200 | return False # always correct |
|
201 | 201 | if _hamming(self._vec, b._vec) > delta: |
|
202 | 202 | return False |
|
203 | 203 | return True |
|
204 | 204 | |
|
205 | 205 | def __gt__(self, b): |
|
206 | 206 | return b < self |
|
207 | 207 | |
|
208 | 208 | def __or__(self, b): |
|
209 | 209 | delta = abs(b._depth - self._depth) |
|
210 | 210 | if _hamming(self._vec, b._vec) <= delta: |
|
211 | 211 | return False |
|
212 | 212 | return True |
|
213 | 213 | |
|
214 | 214 | def __sub__(self, b): |
|
215 | 215 | if self | b: |
|
216 | 216 | raise ValueError(b"concurrent pvecs") |
|
217 | 217 | return self._depth - b._depth |
|
218 | 218 | |
|
219 | 219 | def distance(self, b): |
|
220 | 220 | d = abs(b._depth - self._depth) |
|
221 | 221 | h = _hamming(self._vec, b._vec) |
|
222 | 222 | return max(d, h) |
|
223 | 223 | |
|
224 | 224 | def near(self, b): |
|
225 | 225 | dist = abs(b.depth - self._depth) |
|
226 | 226 | if dist > _radius or _hamming(self._vec, b._vec) > _radius: |
|
227 | 227 | return False |
@@ -1,534 +1,534 b'' | |||
|
1 | 1 | # registrar.py - utilities to register function for specific purpose |
|
2 | 2 | # |
|
3 | 3 | # Copyright FUJIWARA Katsunori <foozy@lares.dti.ne.jp> and others |
|
4 | 4 | # |
|
5 | 5 | # This software may be used and distributed according to the terms of the |
|
6 | 6 | # GNU General Public License version 2 or any later version. |
|
7 | 7 | |
|
8 | 8 | from __future__ import absolute_import |
|
9 | 9 | |
|
10 | 10 | from . import ( |
|
11 | 11 | configitems, |
|
12 | 12 | error, |
|
13 | 13 | pycompat, |
|
14 | 14 | util, |
|
15 | 15 | ) |
|
16 | 16 | |
|
17 | 17 | # unlike the other registered items, config options are neither functions nor
|
18 | 18 | # classes. Registering an option is just a small function call.
|
19 | 19 | # |
|
20 | 20 | # We still add the official API to the registrar module for consistency with |
|
21 | 21 | # the other items extensions might want to register.
|
22 | 22 | configitem = configitems.getitemregister |
|
23 | 23 | |
|
24 | 24 | |
|
25 | 25 | class _funcregistrarbase(object): |
|
26 | 26 | """Base of decorator to register a function for a specific purpose
|
27 | 27 |
|
28 | 28 | This decorator stores decorated functions into its own dict 'table'.
|
29 | 29 | |
|
30 | 30 | The least derived class can be defined by overriding 'formatdoc', |
|
31 | 31 | for example:: |
|
32 | 32 | |
|
33 | 33 | class keyword(_funcregistrarbase): |
|
34 | 34 | _docformat = ":%s: %s" |
|
35 | 35 | |
|
36 | 36 | This should be used as below: |
|
37 | 37 | |
|
38 | 38 | keyword = registrar.keyword() |
|
39 | 39 | |
|
40 | 40 | @keyword('bar') |
|
41 | 41 | def barfunc(*args, **kwargs): |
|
42 | 42 | '''Explanation of bar keyword .... |
|
43 | 43 | ''' |
|
44 | 44 | pass |
|
45 | 45 | |
|
46 | 46 | In this case: |
|
47 | 47 | |
|
48 | 48 | - 'barfunc' is stored as 'bar' in '_table' of an instance 'keyword' above |
|
49 | 49 | - 'barfunc.__doc__' becomes ":bar: Explanation of bar keyword" |
|
50 | 50 | """ |
|
51 | 51 | |
|
52 | 52 | def __init__(self, table=None): |
|
53 | 53 | if table is None: |
|
54 | 54 | self._table = {} |
|
55 | 55 | else: |
|
56 | 56 | self._table = table |
|
57 | 57 | |
|
58 | 58 | def __call__(self, decl, *args, **kwargs): |
|
59 | 59 | return lambda func: self._doregister(func, decl, *args, **kwargs) |
|
60 | 60 | |
|
61 | 61 | def _doregister(self, func, decl, *args, **kwargs): |
|
62 | 62 | name = self._getname(decl) |
|
63 | 63 | |
|
64 | 64 | if name in self._table: |
|
65 | 65 | msg = b'duplicate registration for name: "%s"' % name |
|
66 | 66 | raise error.ProgrammingError(msg) |
|
67 | 67 | |
|
68 | if func.__doc__ and not util.safehasattr(func,
|
68 | if func.__doc__ and not util.safehasattr(func, '_origdoc'):
|
69 | 69 | func._origdoc = func.__doc__.strip() |
|
70 | 70 | doc = pycompat.sysbytes(func._origdoc) |
|
71 | 71 | func.__doc__ = pycompat.sysstr(self._formatdoc(decl, doc)) |
|
72 | 72 | |
|
73 | 73 | self._table[name] = func |
|
74 | 74 | self._extrasetup(name, func, *args, **kwargs) |
|
75 | 75 | |
|
76 | 76 | return func |
|
77 | 77 | |
|
78 | 78 | def _merge(self, registrarbase): |
|
79 | 79 | """Merge the entries of the given registrar object into this one. |
|
80 | 80 | |
|
81 | 81 | The other registrar object must not contain any entries already in the |
|
82 | 82 | current one, or a ProgrammingError is raised. Additionally, the types
|
83 | 83 | of the two registrars must match. |
|
84 | 84 | """ |
|
85 | 85 | if not isinstance(registrarbase, type(self)): |
|
86 | 86 | msg = b"cannot merge different types of registrar" |
|
87 | 87 | raise error.ProgrammingError(msg) |
|
88 | 88 | |
|
89 | 89 | dups = set(registrarbase._table).intersection(self._table) |
|
90 | 90 | |
|
91 | 91 | if dups: |
|
92 | 92 | msg = b'duplicate registration for names: "%s"' % b'", "'.join(dups) |
|
93 | 93 | raise error.ProgrammingError(msg) |
|
94 | 94 | |
|
95 | 95 | self._table.update(registrarbase._table) |
|
96 | 96 | |
|
97 | 97 | def _parsefuncdecl(self, decl): |
|
98 | 98 | """Parse function declaration and return the name of function in it |
|
99 | 99 | """ |
|
100 | 100 | i = decl.find(b'(') |
|
101 | 101 | if i >= 0: |
|
102 | 102 | return decl[:i] |
|
103 | 103 | else: |
|
104 | 104 | return decl |
|
105 | 105 | |
|
106 | 106 | def _getname(self, decl): |
|
107 | 107 | """Return the name of the registered function from decl |
|
108 | 108 | |
|
109 | 109 | A derived class should override this if it allows a more
|
110 | 110 | descriptive 'decl' string than just a name.
|
111 | 111 | """ |
|
112 | 112 | return decl |
|
113 | 113 | |
|
114 | 114 | _docformat = None |
|
115 | 115 | |
|
116 | 116 | def _formatdoc(self, decl, doc): |
|
117 | 117 | """Return formatted document of the registered function for help |
|
118 | 118 | |
|
119 | 119 | 'doc' is '__doc__.strip()' of the registered function. |
|
120 | 120 | """ |
|
121 | 121 | return self._docformat % (decl, doc) |
|
122 | 122 | |
|
123 | 123 | def _extrasetup(self, name, func): |
|
124 | 124 | """Execute extra setup for the registered function, if needed
|
125 | 125 | """ |
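For readers unfamiliar with the pattern, here is a self-contained imitation of the registration scheme described in the class docstring above; it is an illustration only and does not depend on _funcregistrarbase:

class simpleregistrar(object):
    def __init__(self):
        self.table = {}

    def __call__(self, name):
        def register(func):
            # mimic the duplicate-registration guard of _doregister()
            if name in self.table:
                raise ValueError('duplicate registration for name: %s' % name)
            self.table[name] = func
            return func
        return register

keyword = simpleregistrar()

@keyword('bar')
def barfunc():
    '''Explanation of bar keyword'''
    return 'bar'

assert keyword.table['bar'] is barfunc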
|
126 | 126 | |
|
127 | 127 | |
|
128 | 128 | class command(_funcregistrarbase): |
|
129 | 129 | """Decorator to register a command function to table |
|
130 | 130 | |
|
131 | 131 | This class receives a command table as its argument. The table should |
|
132 | 132 | be a dict. |
|
133 | 133 | |
|
134 | 134 | The created object can be used as a decorator for adding commands to |
|
135 | 135 | that command table. This accepts multiple arguments to define a command. |
|
136 | 136 | |
|
137 | 137 | The first argument is the command name (as bytes). |
|
138 | 138 | |
|
139 | 139 | The `options` keyword argument is an iterable of tuples defining command |
|
140 | 140 | arguments. See ``mercurial.fancyopts.fancyopts()`` for the format of each |
|
141 | 141 | tuple. |
|
142 | 142 | |
|
143 | 143 | The `synopsis` argument defines a short, one line summary of how to use the |
|
144 | 144 | command. This shows up in the help output. |
|
145 | 145 | |
|
146 | 146 | There are three arguments that control what repository (if any) is found |
|
147 | 147 | and passed to the decorated function: `norepo`, `optionalrepo`, and |
|
148 | 148 | `inferrepo`. |
|
149 | 149 | |
|
150 | 150 | The `norepo` argument defines whether the command does not require a |
|
151 | 151 | local repository. Most commands operate against a repository, thus the |
|
152 | 152 | default is False. When True, no repository will be passed. |
|
153 | 153 | |
|
154 | 154 | The `optionalrepo` argument defines whether the command optionally requires |
|
155 | 155 | a local repository. If no repository can be found, None will be passed |
|
156 | 156 | to the decorated function. |
|
157 | 157 | |
|
158 | 158 | The `inferrepo` argument defines whether to try to find a repository from |
|
159 | 159 | the command line arguments. If True, arguments will be examined for |
|
160 | 160 | potential repository locations. See ``findrepo()``. If a repository is |
|
161 | 161 | found, it will be used and passed to the decorated function. |
|
162 | 162 | |
|
163 | 163 | The `intents` argument defines a set of intended actions or capabilities |
|
164 | 164 | the command is taking. These intents can be used to affect the construction |
|
165 | 165 | of the repository object passed to the command. For example, commands |
|
166 | 166 | declaring that they are read-only could receive a repository that doesn't |
|
167 | 167 | have any methods allowing repository mutation. Other intents could be used |
|
168 | 168 | to prevent the command from running if the requested intent could not be |
|
169 | 169 | fulfilled. |
|
170 | 170 | |
|
171 | 171 | If `helpcategory` is set (usually to one of the constants in the help |
|
172 | 172 | module), the command will be displayed under that category in the help's |
|
173 | 173 | list of commands. |
|
174 | 174 | |
|
175 | 175 | The following intents are defined: |
|
176 | 176 | |
|
177 | 177 | readonly |
|
178 | 178 | The command is read-only |
|
179 | 179 | |
|
180 | 180 | The signature of the decorated function looks like this: |
|
181 | 181 | def cmd(ui[, repo] [, <args>] [, <options>]) |
|
182 | 182 | |
|
183 | 183 | `repo` is required if `norepo` is False. |
|
184 | 184 | `<args>` are positional args (or `*args`) arguments, of non-option |
|
185 | 185 | arguments from the command line. |
|
186 | 186 | `<options>` are keyword arguments (or `**options`) of option arguments |
|
187 | 187 | from the command line. |
|
188 | 188 | |
|
189 | 189 | See the WritingExtensions and MercurialApi documentation for more exhaustive |
|
190 | 190 | descriptions and examples. |
|
191 | 191 | """ |
|
192 | 192 | |
|
193 | 193 | # Command categories for grouping them in help output. |
|
194 | 194 | # These can also be specified for aliases, like: |
|
195 | 195 | # [alias] |
|
196 | 196 | # myalias = something |
|
197 | 197 | # myalias:category = repo |
|
198 | 198 | CATEGORY_REPO_CREATION = b'repo' |
|
199 | 199 | CATEGORY_REMOTE_REPO_MANAGEMENT = b'remote' |
|
200 | 200 | CATEGORY_COMMITTING = b'commit' |
|
201 | 201 | CATEGORY_CHANGE_MANAGEMENT = b'management' |
|
202 | 202 | CATEGORY_CHANGE_ORGANIZATION = b'organization' |
|
203 | 203 | CATEGORY_FILE_CONTENTS = b'files' |
|
204 | 204 | CATEGORY_CHANGE_NAVIGATION = b'navigation' |
|
205 | 205 | CATEGORY_WORKING_DIRECTORY = b'wdir' |
|
206 | 206 | CATEGORY_IMPORT_EXPORT = b'import' |
|
207 | 207 | CATEGORY_MAINTENANCE = b'maintenance' |
|
208 | 208 | CATEGORY_HELP = b'help' |
|
209 | 209 | CATEGORY_MISC = b'misc' |
|
210 | 210 | CATEGORY_NONE = b'none' |
|
211 | 211 | |
|
212 | 212 | def _doregister( |
|
213 | 213 | self, |
|
214 | 214 | func, |
|
215 | 215 | name, |
|
216 | 216 | options=(), |
|
217 | 217 | synopsis=None, |
|
218 | 218 | norepo=False, |
|
219 | 219 | optionalrepo=False, |
|
220 | 220 | inferrepo=False, |
|
221 | 221 | intents=None, |
|
222 | 222 | helpcategory=None, |
|
223 | 223 | helpbasic=False, |
|
224 | 224 | ): |
|
225 | 225 | func.norepo = norepo |
|
226 | 226 | func.optionalrepo = optionalrepo |
|
227 | 227 | func.inferrepo = inferrepo |
|
228 | 228 | func.intents = intents or set() |
|
229 | 229 | func.helpcategory = helpcategory |
|
230 | 230 | func.helpbasic = helpbasic |
|
231 | 231 | if synopsis: |
|
232 | 232 | self._table[name] = func, list(options), synopsis |
|
233 | 233 | else: |
|
234 | 234 | self._table[name] = func, list(options) |
|
235 | 235 | return func |
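A hedged sketch of how an extension typically uses this decorator; the command name, option tuple and behaviour below are invented, and the option tuples follow fancyopts' (short, long, default, help) shape:

from mercurial import registrar

cmdtable = {}
command = registrar.command(cmdtable)

@command(
    b'hello',
    [(b'g', b'greeting', b'Hello', b'greeting to print')],
    b'hg hello [-g TEXT]',
    norepo=True,
    helpcategory=command.CATEGORY_MISC,
)
def hello(ui, **opts):
    '''print a greeting (illustrative example command)'''
    ui.write(b'%s\n' % opts[r'greeting'])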
|
236 | 236 | |
|
237 | 237 | |
|
238 | 238 | INTENT_READONLY = b'readonly' |
|
239 | 239 | |
|
240 | 240 | |
|
241 | 241 | class revsetpredicate(_funcregistrarbase): |
|
242 | 242 | """Decorator to register revset predicate |
|
243 | 243 | |
|
244 | 244 | Usage:: |
|
245 | 245 | |
|
246 | 246 | revsetpredicate = registrar.revsetpredicate() |
|
247 | 247 | |
|
248 | 248 | @revsetpredicate('mypredicate(arg1, arg2[, arg3])') |
|
249 | 249 | def mypredicatefunc(repo, subset, x): |
|
250 | 250 | '''Explanation of this revset predicate .... |
|
251 | 251 | ''' |
|
252 | 252 | pass |
|
253 | 253 | |
|
254 | 254 | The first string argument is used also in online help. |
|
255 | 255 | |
|
256 | 256 | Optional argument 'safe' indicates whether a predicate is safe for |
|
257 | 257 | DoS attack (False by default). |
|
258 | 258 | |
|
259 | 259 | Optional argument 'takeorder' indicates whether a predicate function |
|
260 | 260 | takes ordering policy as the last argument. |
|
261 | 261 | |
|
262 | 262 | Optional argument 'weight' indicates the estimated run-time cost, useful |
|
263 | 263 | for static optimization, default is 1. Higher weight means more expensive. |
|
264 | 264 | Usually, revsets that are fast and return only one revision have a weight of
|
265 | 265 | 0.5 (ex. a symbol); revsets with O(changelog) complexity and read only the
|
266 | 266 | changelog have weight 10 (ex. author); revsets reading manifest deltas have
|
267 | 267 | weight 30 (ex. adds); revsets reading manifest contents have weight 100
|
268 | 268 | (ex. contains). Note: those values are flexible. If the revset has a |
|
269 | 269 | same big-O time complexity as 'contains', but with a smaller constant, it |
|
270 | 270 | might have a weight of 90. |
|
271 | 271 | |
|
272 | 272 | 'revsetpredicate' instance in example above can be used to |
|
273 | 273 | decorate multiple functions. |
|
274 | 274 | |
|
275 | 275 | Decorated functions are registered automatically at loading |
|
276 | 276 | extension, if an instance named as 'revsetpredicate' is used for |
|
277 | 277 | decorating in extension. |
|
278 | 278 | |
|
279 | 279 | Otherwise, explicit 'revset.loadpredicate()' is needed. |
|
280 | 280 | """ |
|
281 | 281 | |
|
282 | 282 | _getname = _funcregistrarbase._parsefuncdecl |
|
283 | 283 | _docformat = b"``%s``\n %s" |
|
284 | 284 | |
|
285 | 285 | def _extrasetup(self, name, func, safe=False, takeorder=False, weight=1): |
|
286 | 286 | func._safe = safe |
|
287 | 287 | func._takeorder = takeorder |
|
288 | 288 | func._weight = weight |
|
289 | 289 | |
|
290 | 290 | |
|
291 | 291 | class filesetpredicate(_funcregistrarbase): |
|
292 | 292 | """Decorator to register fileset predicate |
|
293 | 293 | |
|
294 | 294 | Usage:: |
|
295 | 295 | |
|
296 | 296 | filesetpredicate = registrar.filesetpredicate() |
|
297 | 297 | |
|
298 | 298 | @filesetpredicate('mypredicate()') |
|
299 | 299 | def mypredicatefunc(mctx, x): |
|
300 | 300 | '''Explanation of this fileset predicate .... |
|
301 | 301 | ''' |
|
302 | 302 | pass |
|
303 | 303 | |
|
304 | 304 | The first string argument is used also in online help. |
|
305 | 305 | |
|
306 | 306 | Optional argument 'callstatus' indicates whether a predicate |
|
307 | 307 | implies 'matchctx.status()' at runtime or not (False, by |
|
308 | 308 | default). |
|
309 | 309 | |
|
310 | 310 | Optional argument 'weight' indicates the estimated run-time cost, useful |
|
311 | 311 | for static optimization, default is 1. Higher weight means more expensive. |
|
312 | 312 | There are predefined weights in the 'filesetlang' module. |
|
313 | 313 | |
|
314 | 314 | ====== ============================================================= |
|
315 | 315 | Weight Description and examples |
|
316 | 316 | ====== ============================================================= |
|
317 | 317 | 0.5 basic match patterns (e.g. a symbol) |
|
318 | 318 | 10 computing status (e.g. added()) or accessing a few files |
|
319 | 319 | 30 reading file content for each (e.g. grep()) |
|
320 | 320 | 50 scanning working directory (ignored()) |
|
321 | 321 | ====== ============================================================= |
|
322 | 322 | |
|
323 | 323 | 'filesetpredicate' instance in example above can be used to |
|
324 | 324 | decorate multiple functions. |
|
325 | 325 | |
|
326 | 326 | Decorated functions are registered automatically at loading |
|
327 | 327 | extension, if an instance named as 'filesetpredicate' is used for |
|
328 | 328 | decorating in extension. |
|
329 | 329 | |
|
330 | 330 | Otherwise, explicit 'fileset.loadpredicate()' is needed. |
|
331 | 331 | """ |
|
332 | 332 | |
|
333 | 333 | _getname = _funcregistrarbase._parsefuncdecl |
|
334 | 334 | _docformat = b"``%s``\n %s" |
|
335 | 335 | |
|
336 | 336 | def _extrasetup(self, name, func, callstatus=False, weight=1): |
|
337 | 337 | func._callstatus = callstatus |
|
338 | 338 | func._weight = weight |
|
339 | 339 | |
|
340 | 340 | |
|
341 | 341 | class _templateregistrarbase(_funcregistrarbase): |
|
342 | 342 | """Base decorator class to register template-specific functions
|
343 | 343 | """ |
|
344 | 344 | |
|
345 | 345 | _docformat = b":%s: %s" |
|
346 | 346 | |
|
347 | 347 | |
|
348 | 348 | class templatekeyword(_templateregistrarbase): |
|
349 | 349 | """Decorator to register template keyword |
|
350 | 350 | |
|
351 | 351 | Usage:: |
|
352 | 352 | |
|
353 | 353 | templatekeyword = registrar.templatekeyword() |
|
354 | 354 | |
|
355 | 355 | # new API (since Mercurial 4.6) |
|
356 | 356 | @templatekeyword('mykeyword', requires={'repo', 'ctx'}) |
|
357 | 357 | def mykeywordfunc(context, mapping): |
|
358 | 358 | '''Explanation of this template keyword .... |
|
359 | 359 | ''' |
|
360 | 360 | pass |
|
361 | 361 | |
|
362 | 362 | The first string argument is used also in online help. |
|
363 | 363 | |
|
364 | 364 | Optional argument 'requires' should be a collection of resource names |
|
365 | 365 | which the template keyword depends on. |
|
366 | 366 | |
|
367 | 367 | 'templatekeyword' instance in example above can be used to |
|
368 | 368 | decorate multiple functions. |
|
369 | 369 | |
|
370 | 370 | Decorated functions are registered automatically at loading |
|
371 | 371 | extension, if an instance named as 'templatekeyword' is used for |
|
372 | 372 | decorating in extension. |
|
373 | 373 | |
|
374 | 374 | Otherwise, explicit 'templatekw.loadkeyword()' is needed. |
|
375 | 375 | """ |
|
376 | 376 | |
|
377 | 377 | def _extrasetup(self, name, func, requires=()): |
|
378 | 378 | func._requires = requires |
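A hedged sketch of registering a keyword with the new-style API documented above; the keyword name and body are invented, and context.resource() is assumed to expose the declared 'ctx' resource:

from mercurial import registrar

templatekeyword = registrar.templatekeyword()

@templatekeyword('shortid', requires={'ctx'})
def showshortid(context, mapping):
    '''Short form of the changeset hash. (illustrative)'''
    # pull the changectx declared in 'requires' out of the template mapping
    ctx = context.resource(mapping, 'ctx')
    return ctx.hex()[:12]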
|
379 | 379 | |
|
380 | 380 | |
|
381 | 381 | class templatefilter(_templateregistrarbase): |
|
382 | 382 | """Decorator to register template filter
|
383 | 383 | |
|
384 | 384 | Usage:: |
|
385 | 385 | |
|
386 | 386 | templatefilter = registrar.templatefilter() |
|
387 | 387 | |
|
388 | 388 | @templatefilter('myfilter', intype=bytes) |
|
389 | 389 | def myfilterfunc(text): |
|
390 | 390 | '''Explanation of this template filter .... |
|
391 | 391 | ''' |
|
392 | 392 | pass |
|
393 | 393 | |
|
394 | 394 | The first string argument is used also in online help. |
|
395 | 395 | |
|
396 | 396 | Optional argument 'intype' defines the type of the input argument, |
|
397 | 397 | which should be (bytes, int, templateutil.date, or None for any.) |
|
398 | 398 | |
|
399 | 399 | 'templatefilter' instance in example above can be used to |
|
400 | 400 | decorate multiple functions. |
|
401 | 401 | |
|
402 | 402 | Decorated functions are registered automatically at loading |
|
403 | 403 | extension, if an instance named as 'templatefilter' is used for |
|
404 | 404 | decorating in extension. |
|
405 | 405 | |
|
406 | 406 | Otherwise, explicit 'templatefilters.loadkeyword()' is needed. |
|
407 | 407 | """ |
|
408 | 408 | |
|
409 | 409 | def _extrasetup(self, name, func, intype=None): |
|
410 | 410 | func._intype = intype |
|
411 | 411 | |
|
412 | 412 | |
|
413 | 413 | class templatefunc(_templateregistrarbase): |
|
414 | 414 | """Decorator to register template function |
|
415 | 415 | |
|
416 | 416 | Usage:: |
|
417 | 417 | |
|
418 | 418 | templatefunc = registrar.templatefunc() |
|
419 | 419 | |
|
420 | 420 | @templatefunc('myfunc(arg1, arg2[, arg3])', argspec='arg1 arg2 arg3', |
|
421 | 421 | requires={'ctx'}) |
|
422 | 422 | def myfuncfunc(context, mapping, args): |
|
423 | 423 | '''Explanation of this template function .... |
|
424 | 424 | ''' |
|
425 | 425 | pass |
|
426 | 426 | |
|
427 | 427 | The first string argument is used also in online help. |
|
428 | 428 | |
|
429 | 429 | If optional 'argspec' is defined, the function will receive 'args' as |
|
430 | 430 | a dict of named arguments. Otherwise 'args' is a list of positional |
|
431 | 431 | arguments. |
|
432 | 432 | |
|
433 | 433 | Optional argument 'requires' should be a collection of resource names |
|
434 | 434 | which the template function depends on. |
|
435 | 435 | |
|
436 | 436 | 'templatefunc' instance in example above can be used to |
|
437 | 437 | decorate multiple functions. |
|
438 | 438 | |
|
439 | 439 | Decorated functions are registered automatically at loading |
|
440 | 440 | extension, if an instance named as 'templatefunc' is used for |
|
441 | 441 | decorating in extension. |
|
442 | 442 | |
|
443 | 443 | Otherwise, explicit 'templatefuncs.loadfunction()' is needed. |
|
444 | 444 | """ |
|
445 | 445 | |
|
446 | 446 | _getname = _funcregistrarbase._parsefuncdecl |
|
447 | 447 | |
|
448 | 448 | def _extrasetup(self, name, func, argspec=None, requires=()): |
|
449 | 449 | func._argspec = argspec |
|
450 | 450 | func._requires = requires |
|
451 | 451 | |
|
452 | 452 | |
|
453 | 453 | class internalmerge(_funcregistrarbase): |
|
454 | 454 | """Decorator to register in-process merge tool |
|
455 | 455 | |
|
456 | 456 | Usage:: |
|
457 | 457 | |
|
458 | 458 | internalmerge = registrar.internalmerge() |
|
459 | 459 | |
|
460 | 460 | @internalmerge('mymerge', internalmerge.mergeonly, |
|
461 | 461 | onfailure=None, precheck=None, |
|
462 | 462 | binary=False, symlink=False): |
|
463 | 463 | def mymergefunc(repo, mynode, orig, fcd, fco, fca, |
|
464 | 464 | toolconf, files, labels=None): |
|
465 | 465 | '''Explanation of this internal merge tool .... |
|
466 | 466 | ''' |
|
467 | 467 | return 1, False # means "conflicted", "no deletion needed" |
|
468 | 468 | |
|
469 | 469 | The first string argument is used to compose actual merge tool name, |
|
470 | 470 | ":name" and "internal:name" (the latter is historical one). |
|
471 | 471 | |
|
472 | 472 | The second argument is one of merge types below: |
|
473 | 473 | |
|
474 | 474 | ========== ======== ======== ========= |
|
475 | 475 | merge type precheck premerge fullmerge |
|
476 | 476 | ========== ======== ======== ========= |
|
477 | 477 | nomerge x x x |
|
478 | 478 | mergeonly o x o |
|
479 | 479 | fullmerge o o o |
|
480 | 480 | ========== ======== ======== ========= |
|
481 | 481 | |
|
482 | 482 | Optional argument 'onfailure' is the format of warning message |
|
483 | 483 | to be used at failure of merging (the target filename is supplied when
|
484 | 484 | formatting), or None if the warning message should be
|
485 | 485 | suppressed.
|
486 | 486 | |
|
487 | 487 | Optional argument 'precheck' is the function to be used |
|
488 | 488 | before actual invocation of internal merge tool itself. |
|
489 | 489 | It takes the same arguments as the internal merge tool does, other than
|
490 | 490 | 'files' and 'labels'. If it returns a false value, merging is aborted
|
491 | 491 | immediately (and the file is marked as "unresolved").
|
492 | 492 | |
|
493 | 493 | Optional argument 'binary' is a binary files capability of internal |
|
494 | 494 | merge tool. 'nomerge' merge type implies binary=True. |
|
495 | 495 | |
|
496 | 496 | Optional argument 'symlink' is the symlink capability of the internal
|
497 | 497 | merge function. 'nomerge' merge type implies symlink=True. |
|
498 | 498 | |
|
499 | 499 | 'internalmerge' instance in example above can be used to |
|
500 | 500 | decorate multiple functions. |
|
501 | 501 | |
|
502 | 502 | Decorated functions are registered automatically at loading |
|
503 | 503 | extension, if an instance named as 'internalmerge' is used for |
|
504 | 504 | decorating in extension. |
|
505 | 505 | |
|
506 | 506 | Otherwise, explicit 'filemerge.loadinternalmerge()' is needed. |
|
507 | 507 | """ |
|
508 | 508 | |
|
509 | 509 | _docformat = b"``:%s``\n %s" |
|
510 | 510 | |
|
511 | 511 | # merge type definitions: |
|
512 | 512 | nomerge = None |
|
513 | 513 | mergeonly = b'mergeonly' # just the full merge, no premerge |
|
514 | 514 | fullmerge = b'fullmerge' # both premerge and merge |
|
515 | 515 | |
|
516 | 516 | def _extrasetup( |
|
517 | 517 | self, |
|
518 | 518 | name, |
|
519 | 519 | func, |
|
520 | 520 | mergetype, |
|
521 | 521 | onfailure=None, |
|
522 | 522 | precheck=None, |
|
523 | 523 | binary=False, |
|
524 | 524 | symlink=False, |
|
525 | 525 | ): |
|
526 | 526 | func.mergetype = mergetype |
|
527 | 527 | func.onfailure = onfailure |
|
528 | 528 | func.precheck = precheck |
|
529 | 529 | |
|
530 | 530 | binarycap = binary or mergetype == self.nomerge |
|
531 | 531 | symlinkcap = symlink or mergetype == self.nomerge |
|
532 | 532 | |
|
533 | 533 | # actual capabilities, which this internal merge tool has |
|
534 | 534 | func.capabilities = {b"binary": binarycap, b"symlink": symlinkcap} |
@@ -1,633 +1,633 b'' | |||
|
1 | 1 | # procutil.py - utility for managing processes and executable environment |
|
2 | 2 | # |
|
3 | 3 | # Copyright 2005 K. Thananchayan <thananck@yahoo.com> |
|
4 | 4 | # Copyright 2005-2007 Matt Mackall <mpm@selenic.com> |
|
5 | 5 | # Copyright 2006 Vadim Gelfer <vadim.gelfer@gmail.com> |
|
6 | 6 | # |
|
7 | 7 | # This software may be used and distributed according to the terms of the |
|
8 | 8 | # GNU General Public License version 2 or any later version. |
|
9 | 9 | |
|
10 | 10 | from __future__ import absolute_import |
|
11 | 11 | |
|
12 | 12 | import contextlib |
|
13 | 13 | import errno |
|
14 | 14 | import imp |
|
15 | 15 | import io |
|
16 | 16 | import os |
|
17 | 17 | import signal |
|
18 | 18 | import subprocess |
|
19 | 19 | import sys |
|
20 | 20 | import time |
|
21 | 21 | |
|
22 | 22 | from ..i18n import _ |
|
23 | 23 | from ..pycompat import ( |
|
24 | 24 | getattr, |
|
25 | 25 | open, |
|
26 | 26 | ) |
|
27 | 27 | |
|
28 | 28 | from .. import ( |
|
29 | 29 | encoding, |
|
30 | 30 | error, |
|
31 | 31 | policy, |
|
32 | 32 | pycompat, |
|
33 | 33 | ) |
|
34 | 34 | |
|
35 | 35 | osutil = policy.importmod(r'osutil') |
|
36 | 36 | |
|
37 | 37 | stderr = pycompat.stderr |
|
38 | 38 | stdin = pycompat.stdin |
|
39 | 39 | stdout = pycompat.stdout |
|
40 | 40 | |
|
41 | 41 | |
|
42 | 42 | def isatty(fp): |
|
43 | 43 | try: |
|
44 | 44 | return fp.isatty() |
|
45 | 45 | except AttributeError: |
|
46 | 46 | return False |
|
47 | 47 | |
|
48 | 48 | |
|
49 | 49 | # glibc determines buffering on first write to stdout - if we replace a TTY |
|
50 | 50 | # destined stdout with a pipe destined stdout (e.g. pager), we want line |
|
51 | 51 | # buffering (or unbuffered, on Windows) |
|
52 | 52 | if isatty(stdout): |
|
53 | 53 | if pycompat.iswindows: |
|
54 | 54 | # Windows doesn't support line buffering |
|
55 | 55 | stdout = os.fdopen(stdout.fileno(), r'wb', 0) |
|
56 | 56 | else: |
|
57 | 57 | stdout = os.fdopen(stdout.fileno(), r'wb', 1) |
|
58 | 58 | |
|
59 | 59 | if pycompat.iswindows: |
|
60 | 60 | from .. import windows as platform |
|
61 | 61 | |
|
62 | 62 | stdout = platform.winstdout(stdout) |
|
63 | 63 | else: |
|
64 | 64 | from .. import posix as platform |
|
65 | 65 | |
|
66 | 66 | findexe = platform.findexe |
|
67 | 67 | _gethgcmd = platform.gethgcmd |
|
68 | 68 | getuser = platform.getuser |
|
69 | 69 | getpid = os.getpid |
|
70 | 70 | hidewindow = platform.hidewindow |
|
71 | 71 | quotecommand = platform.quotecommand |
|
72 | 72 | readpipe = platform.readpipe |
|
73 | 73 | setbinary = platform.setbinary |
|
74 | 74 | setsignalhandler = platform.setsignalhandler |
|
75 | 75 | shellquote = platform.shellquote |
|
76 | 76 | shellsplit = platform.shellsplit |
|
77 | 77 | spawndetached = platform.spawndetached |
|
78 | 78 | sshargs = platform.sshargs |
|
79 | 79 | testpid = platform.testpid |
|
80 | 80 | |
|
81 | 81 | try: |
|
82 | 82 | setprocname = osutil.setprocname |
|
83 | 83 | except AttributeError: |
|
84 | 84 | pass |
|
85 | 85 | try: |
|
86 | 86 | unblocksignal = osutil.unblocksignal |
|
87 | 87 | except AttributeError: |
|
88 | 88 | pass |
|
89 | 89 | |
|
90 | 90 | closefds = pycompat.isposix |
|
91 | 91 | |
|
92 | 92 | |
|
93 | 93 | def explainexit(code): |
|
94 | 94 | """return a message describing a subprocess status |
|
95 | 95 | (codes from kill are negative - not os.system/wait encoding)""" |
|
96 | 96 | if code >= 0: |
|
97 | 97 | return _(b"exited with status %d") % code |
|
98 | 98 | return _(b"killed by signal %d") % -code |
|
99 | 99 | |
|
100 | 100 | |
|
101 | 101 | class _pfile(object): |
|
102 | 102 | """File-like wrapper for a stream opened by subprocess.Popen()""" |
|
103 | 103 | |
|
104 | 104 | def __init__(self, proc, fp): |
|
105 | 105 | self._proc = proc |
|
106 | 106 | self._fp = fp |
|
107 | 107 | |
|
108 | 108 | def close(self): |
|
109 | 109 | # unlike os.popen(), this returns an integer in subprocess coding |
|
110 | 110 | self._fp.close() |
|
111 | 111 | return self._proc.wait() |
|
112 | 112 | |
|
113 | 113 | def __iter__(self): |
|
114 | 114 | return iter(self._fp) |
|
115 | 115 | |
|
116 | 116 | def __getattr__(self, attr): |
|
117 | 117 | return getattr(self._fp, attr) |
|
118 | 118 | |
|
119 | 119 | def __enter__(self): |
|
120 | 120 | return self |
|
121 | 121 | |
|
122 | 122 | def __exit__(self, exc_type, exc_value, exc_tb): |
|
123 | 123 | self.close() |
|
124 | 124 | |
|
125 | 125 | |
|
126 | 126 | def popen(cmd, mode=b'rb', bufsize=-1): |
|
127 | 127 | if mode == b'rb': |
|
128 | 128 | return _popenreader(cmd, bufsize) |
|
129 | 129 | elif mode == b'wb': |
|
130 | 130 | return _popenwriter(cmd, bufsize) |
|
131 | 131 | raise error.ProgrammingError(b'unsupported mode: %r' % mode) |
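A hedged usage sketch for popen() above: the returned _pfile wrapper iterates like a file and close() (also invoked by the context manager) reports the subprocess exit status; the 'ls' command is just an example:

from mercurial.utils import procutil

with procutil.popen(b'ls', b'rb') as fp:
    for line in fp:
        pass  # each 'line' is a bytes line of the command's stdout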
|
132 | 132 | |
|
133 | 133 | |
|
134 | 134 | def _popenreader(cmd, bufsize): |
|
135 | 135 | p = subprocess.Popen( |
|
136 | 136 | tonativestr(quotecommand(cmd)), |
|
137 | 137 | shell=True, |
|
138 | 138 | bufsize=bufsize, |
|
139 | 139 | close_fds=closefds, |
|
140 | 140 | stdout=subprocess.PIPE, |
|
141 | 141 | ) |
|
142 | 142 | return _pfile(p, p.stdout) |
|
143 | 143 | |
|
144 | 144 | |
|
145 | 145 | def _popenwriter(cmd, bufsize): |
|
146 | 146 | p = subprocess.Popen( |
|
147 | 147 | tonativestr(quotecommand(cmd)), |
|
148 | 148 | shell=True, |
|
149 | 149 | bufsize=bufsize, |
|
150 | 150 | close_fds=closefds, |
|
151 | 151 | stdin=subprocess.PIPE, |
|
152 | 152 | ) |
|
153 | 153 | return _pfile(p, p.stdin) |
|
154 | 154 | |
|
155 | 155 | |
|
156 | 156 | def popen2(cmd, env=None): |
|
157 | 157 | # Setting bufsize to -1 lets the system decide the buffer size. |
|
158 | 158 | # The default for bufsize is 0, meaning unbuffered. This leads to |
|
159 | 159 | # poor performance on Mac OS X: http://bugs.python.org/issue4194 |
|
160 | 160 | p = subprocess.Popen( |
|
161 | 161 | tonativestr(cmd), |
|
162 | 162 | shell=True, |
|
163 | 163 | bufsize=-1, |
|
164 | 164 | close_fds=closefds, |
|
165 | 165 | stdin=subprocess.PIPE, |
|
166 | 166 | stdout=subprocess.PIPE, |
|
167 | 167 | env=tonativeenv(env), |
|
168 | 168 | ) |
|
169 | 169 | return p.stdin, p.stdout |
|
170 | 170 | |
|
171 | 171 | |
|
172 | 172 | def popen3(cmd, env=None): |
|
173 | 173 | stdin, stdout, stderr, p = popen4(cmd, env) |
|
174 | 174 | return stdin, stdout, stderr |
|
175 | 175 | |
|
176 | 176 | |
|
177 | 177 | def popen4(cmd, env=None, bufsize=-1): |
|
178 | 178 | p = subprocess.Popen( |
|
179 | 179 | tonativestr(cmd), |
|
180 | 180 | shell=True, |
|
181 | 181 | bufsize=bufsize, |
|
182 | 182 | close_fds=closefds, |
|
183 | 183 | stdin=subprocess.PIPE, |
|
184 | 184 | stdout=subprocess.PIPE, |
|
185 | 185 | stderr=subprocess.PIPE, |
|
186 | 186 | env=tonativeenv(env), |
|
187 | 187 | ) |
|
188 | 188 | return p.stdin, p.stdout, p.stderr, p |
|
189 | 189 | |
|
190 | 190 | |
|
191 | 191 | def pipefilter(s, cmd): |
|
192 | 192 | '''filter string S through command CMD, returning its output''' |
|
193 | 193 | p = subprocess.Popen( |
|
194 | 194 | tonativestr(cmd), |
|
195 | 195 | shell=True, |
|
196 | 196 | close_fds=closefds, |
|
197 | 197 | stdin=subprocess.PIPE, |
|
198 | 198 | stdout=subprocess.PIPE, |
|
199 | 199 | ) |
|
200 | 200 | pout, perr = p.communicate(s) |
|
201 | 201 | return pout |
|
202 | 202 | |
|
203 | 203 | |
|
204 | 204 | def tempfilter(s, cmd): |
|
205 | 205 | '''filter string S through a pair of temporary files with CMD. |
|
206 | 206 | CMD is used as a template to create the real command to be run, |
|
207 | 207 | with the strings INFILE and OUTFILE replaced by the real names of |
|
208 | 208 | the temporary files generated.''' |
|
209 | 209 | inname, outname = None, None |
|
210 | 210 | try: |
|
211 | 211 | infd, inname = pycompat.mkstemp(prefix=b'hg-filter-in-') |
|
212 | 212 | fp = os.fdopen(infd, r'wb') |
|
213 | 213 | fp.write(s) |
|
214 | 214 | fp.close() |
|
215 | 215 | outfd, outname = pycompat.mkstemp(prefix=b'hg-filter-out-') |
|
216 | 216 | os.close(outfd) |
|
217 | 217 | cmd = cmd.replace(b'INFILE', inname) |
|
218 | 218 | cmd = cmd.replace(b'OUTFILE', outname) |
|
219 | 219 | code = system(cmd) |
|
220 | 220 | if pycompat.sysplatform == b'OpenVMS' and code & 1: |
|
221 | 221 | code = 0 |
|
222 | 222 | if code: |
|
223 | 223 | raise error.Abort( |
|
224 | 224 | _(b"command '%s' failed: %s") % (cmd, explainexit(code)) |
|
225 | 225 | ) |
|
226 | 226 | with open(outname, b'rb') as fp: |
|
227 | 227 | return fp.read() |
|
228 | 228 | finally: |
|
229 | 229 | try: |
|
230 | 230 | if inname: |
|
231 | 231 | os.unlink(inname) |
|
232 | 232 | except OSError: |
|
233 | 233 | pass |
|
234 | 234 | try: |
|
235 | 235 | if outname: |
|
236 | 236 | os.unlink(outname) |
|
237 | 237 | except OSError: |
|
238 | 238 | pass |
|
239 | 239 | |
|
240 | 240 | |
|
241 | 241 | _filtertable = { |
|
242 | 242 | b'tempfile:': tempfilter, |
|
243 | 243 | b'pipe:': pipefilter, |
|
244 | 244 | } |
|
245 | 245 | |
|
246 | 246 | |
|
247 | 247 | def filter(s, cmd): |
|
248 | 248 | b"filter a string through a command that transforms its input to its output" |
|
249 | 249 | for name, fn in pycompat.iteritems(_filtertable): |
|
250 | 250 | if cmd.startswith(name): |
|
251 | 251 | return fn(s, cmd[len(name) :].lstrip()) |
|
252 | 252 | return pipefilter(s, cmd) |
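A hedged example of the prefix dispatch in filter() above: a 'pipe:' or 'tempfile:' prefix selects the strategy, anything else falls back to pipefilter(); this assumes a Unix-like 'sort' command is available:

from mercurial.utils import procutil

out = procutil.filter(b'banana\napple\n', b'pipe: sort')
assert out == b'apple\nbanana\n'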
|
253 | 253 | |
|
254 | 254 | |
|
255 | 255 | def mainfrozen(): |
|
256 | 256 | """return True if we are a frozen executable. |
|
257 | 257 | |
|
258 | 258 | The code supports py2exe (most common, Windows only) and tools/freeze |
|
259 | 259 | (portable, not much used). |
|
260 | 260 | """ |
|
261 | 261 | return ( |
|
262 | pycompat.safehasattr(sys,
|
263 | or pycompat.safehasattr(sys,
|
262 | pycompat.safehasattr(sys, "frozen")
|
263 | or pycompat.safehasattr(sys, "importers") # new py2exe
|
264 | 264 | or imp.is_frozen(r"__main__") # old py2exe |
|
265 | 265 | ) # tools/freeze |
|
266 | 266 | |
|
267 | 267 | |
|
268 | 268 | _hgexecutable = None |
|
269 | 269 | |
|
270 | 270 | |
|
271 | 271 | def hgexecutable(): |
|
272 | 272 | """return location of the 'hg' executable. |
|
273 | 273 | |
|
274 | 274 | Defaults to $HG or 'hg' in the search path. |
|
275 | 275 | """ |
|
276 | 276 | if _hgexecutable is None: |
|
277 | 277 | hg = encoding.environ.get(b'HG') |
|
278 | 278 | mainmod = sys.modules[r'__main__'] |
|
279 | 279 | if hg: |
|
280 | 280 | _sethgexecutable(hg) |
|
281 | 281 | elif mainfrozen(): |
|
282 | 282 | if getattr(sys, 'frozen', None) == b'macosx_app': |
|
283 | 283 | # Env variable set by py2app |
|
284 | 284 | _sethgexecutable(encoding.environ[b'EXECUTABLEPATH']) |
|
285 | 285 | else: |
|
286 | 286 | _sethgexecutable(pycompat.sysexecutable) |
|
287 | 287 | elif ( |
|
288 | 288 | not pycompat.iswindows |
|
289 | 289 | and os.path.basename( |
|
290 | 290 | pycompat.fsencode(getattr(mainmod, '__file__', b'')) |
|
291 | 291 | ) |
|
292 | 292 | == b'hg' |
|
293 | 293 | ): |
|
294 | 294 | _sethgexecutable(pycompat.fsencode(mainmod.__file__)) |
|
295 | 295 | else: |
|
296 | 296 | _sethgexecutable( |
|
297 | 297 | findexe(b'hg') or os.path.basename(pycompat.sysargv[0]) |
|
298 | 298 | ) |
|
299 | 299 | return _hgexecutable |
|
300 | 300 | |
|
301 | 301 | |
|
302 | 302 | def _sethgexecutable(path): |
|
303 | 303 | """set location of the 'hg' executable""" |
|
304 | 304 | global _hgexecutable |
|
305 | 305 | _hgexecutable = path |
|
306 | 306 | |
|
307 | 307 | |
|
308 | 308 | def _testfileno(f, stdf): |
|
309 | 309 | fileno = getattr(f, 'fileno', None) |
|
310 | 310 | try: |
|
311 | 311 | return fileno and fileno() == stdf.fileno() |
|
312 | 312 | except io.UnsupportedOperation: |
|
313 | 313 | return False # fileno() raised UnsupportedOperation |
|
314 | 314 | |
|
315 | 315 | |
|
316 | 316 | def isstdin(f): |
|
317 | 317 | return _testfileno(f, sys.__stdin__) |
|
318 | 318 | |
|
319 | 319 | |
|
320 | 320 | def isstdout(f): |
|
321 | 321 | return _testfileno(f, sys.__stdout__) |
|
322 | 322 | |
|
323 | 323 | |
|
324 | 324 | def protectstdio(uin, uout): |
|
325 | 325 | """Duplicate streams and redirect original if (uin, uout) are stdio |
|
326 | 326 | |
|
327 | 327 | If uin is stdin, it's redirected to /dev/null. If uout is stdout, it's |
|
328 | 328 | redirected to stderr so the output is still readable. |
|
329 | 329 | |
|
330 | 330 | Returns (fin, fout) which point to the original (uin, uout) fds, but |
|
331 | 331 | may be copies of (uin, uout). The returned streams can be considered
|
332 | 332 | "owned" in that print(), exec(), etc. never reach them.
|
333 | 333 | """ |
|
334 | 334 | uout.flush() |
|
335 | 335 | fin, fout = uin, uout |
|
336 | 336 | if _testfileno(uin, stdin): |
|
337 | 337 | newfd = os.dup(uin.fileno()) |
|
338 | 338 | nullfd = os.open(os.devnull, os.O_RDONLY) |
|
339 | 339 | os.dup2(nullfd, uin.fileno()) |
|
340 | 340 | os.close(nullfd) |
|
341 | 341 | fin = os.fdopen(newfd, r'rb') |
|
342 | 342 | if _testfileno(uout, stdout): |
|
343 | 343 | newfd = os.dup(uout.fileno()) |
|
344 | 344 | os.dup2(stderr.fileno(), uout.fileno()) |
|
345 | 345 | fout = os.fdopen(newfd, r'wb') |
|
346 | 346 | return fin, fout |
|
347 | 347 | |
|
348 | 348 | |
|
349 | 349 | def restorestdio(uin, uout, fin, fout): |
|
350 | 350 | """Restore (uin, uout) streams from possibly duplicated (fin, fout)""" |
|
351 | 351 | uout.flush() |
|
352 | 352 | for f, uif in [(fin, uin), (fout, uout)]: |
|
353 | 353 | if f is not uif: |
|
354 | 354 | os.dup2(f.fileno(), uif.fileno()) |
|
355 | 355 | f.close() |
|
356 | 356 | |
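A standalone sketch of the fd juggling the pair above performs for stdout: keep a private duplicate of fd 1, point fd 1 at stderr for the duration, then restore it:

    import os
    import sys

    uout = sys.stdout
    uout.flush()
    saved = os.dup(uout.fileno())                 # private copy of the real stdout
    os.dup2(sys.stderr.fileno(), uout.fileno())   # stray prints now land on stderr
    try:
        os.write(saved, b'still reaches the original stdout\n')
    finally:
        uout.flush()
        os.dup2(saved, uout.fileno())             # put the original stdout back
        os.close(saved)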
|
357 | 357 | |
|
358 | 358 | def shellenviron(environ=None): |
|
359 | 359 | """return environ with optional override, useful for shelling out""" |
|
360 | 360 | |
|
361 | 361 | def py2shell(val): |
|
362 | 362 | b'convert python object into string that is useful to shell' |
|
363 | 363 | if val is None or val is False: |
|
364 | 364 | return b'0' |
|
365 | 365 | if val is True: |
|
366 | 366 | return b'1' |
|
367 | 367 | return pycompat.bytestr(val) |
|
368 | 368 | |
|
369 | 369 | env = dict(encoding.environ) |
|
370 | 370 | if environ: |
|
371 | 371 | env.update((k, py2shell(v)) for k, v in pycompat.iteritems(environ)) |
|
372 | 372 | env[b'HG'] = hgexecutable() |
|
373 | 373 | return env |
|
374 | 374 | |
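The nested py2shell() maps Python values onto strings a shell can test cheaply; the same rules in a standalone, str-based sketch:

    import os

    def py2shell(val):
        # None/False -> '0', True -> '1', anything else -> its string form
        if val is None or val is False:
            return '0'
        if val is True:
            return '1'
        return str(val)

    env = dict(os.environ)
    env.update((k, py2shell(v)) for k, v in
               {'HGPLAIN': True, 'PAGER': None, 'COLUMNS': 80}.items())
    print(env['HGPLAIN'], env['PAGER'], env['COLUMNS'])  # 1 0 80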
|
375 | 375 | |
|
376 | 376 | if pycompat.iswindows: |
|
377 | 377 | |
|
378 | 378 | def shelltonative(cmd, env): |
|
379 | 379 | return platform.shelltocmdexe(cmd, shellenviron(env)) |
|
380 | 380 | |
|
381 | 381 | tonativestr = encoding.strfromlocal |
|
382 | 382 | else: |
|
383 | 383 | |
|
384 | 384 | def shelltonative(cmd, env): |
|
385 | 385 | return cmd |
|
386 | 386 | |
|
387 | 387 | tonativestr = pycompat.identity |
|
388 | 388 | |
|
389 | 389 | |
|
390 | 390 | def tonativeenv(env): |
|
391 | 391 | '''convert the environment from bytes to strings suitable for Popen(), etc. |
|
392 | 392 | ''' |
|
393 | 393 | return pycompat.rapply(tonativestr, env) |
|
394 | 394 | |
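For a flat bytes-keyed environment, the recursive apply boils down to decoding every key and value; a simplified POSIX-flavoured sketch (the Windows path in the real code goes through encoding.strfromlocal instead):

    import os

    def bytesenv_to_native(env):
        # Decode both keys and values so the dict is acceptable to Popen(env=...).
        return {os.fsdecode(k): os.fsdecode(v) for k, v in env.items()}

    print(bytesenv_to_native({b'HG': b'/usr/bin/hg'}))  # {'HG': '/usr/bin/hg'}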
|
395 | 395 | |
|
396 | 396 | def system(cmd, environ=None, cwd=None, out=None): |
|
397 | 397 | '''enhanced shell command execution. |
|
398 | 398 | run with the environment possibly modified, possibly in a different dir.
|
399 | 399 | |
|
400 | 400 | if out is specified, it is assumed to be a file-like object that has a |
|
401 | 401 | write() method. stdout and stderr will be redirected to out.''' |
|
402 | 402 | try: |
|
403 | 403 | stdout.flush() |
|
404 | 404 | except Exception: |
|
405 | 405 | pass |
|
406 | 406 | cmd = quotecommand(cmd) |
|
407 | 407 | env = shellenviron(environ) |
|
408 | 408 | if out is None or isstdout(out): |
|
409 | 409 | rc = subprocess.call( |
|
410 | 410 | tonativestr(cmd), |
|
411 | 411 | shell=True, |
|
412 | 412 | close_fds=closefds, |
|
413 | 413 | env=tonativeenv(env), |
|
414 | 414 | cwd=pycompat.rapply(tonativestr, cwd), |
|
415 | 415 | ) |
|
416 | 416 | else: |
|
417 | 417 | proc = subprocess.Popen( |
|
418 | 418 | tonativestr(cmd), |
|
419 | 419 | shell=True, |
|
420 | 420 | close_fds=closefds, |
|
421 | 421 | env=tonativeenv(env), |
|
422 | 422 | cwd=pycompat.rapply(tonativestr, cwd), |
|
423 | 423 | stdout=subprocess.PIPE, |
|
424 | 424 | stderr=subprocess.STDOUT, |
|
425 | 425 | ) |
|
426 | 426 | for line in iter(proc.stdout.readline, b''): |
|
427 | 427 | out.write(line) |
|
428 | 428 | proc.wait() |
|
429 | 429 | rc = proc.returncode |
|
430 | 430 | if pycompat.sysplatform == b'OpenVMS' and rc & 1: |
|
431 | 431 | rc = 0 |
|
432 | 432 | return rc |
|
433 | 433 | |
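The out= branch streams the child's combined stdout/stderr line by line into any object with a write() method; the core of that loop, reduced to a standalone snippet:

    import io
    import subprocess

    out = io.BytesIO()
    proc = subprocess.Popen(
        'echo captured', shell=True,
        stdout=subprocess.PIPE, stderr=subprocess.STDOUT,
    )
    for line in iter(proc.stdout.readline, b''):
        out.write(line)
    proc.wait()
    print(proc.returncode, out.getvalue())  # 0 b'captured\n' (line ending varies)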
|
434 | 434 | |
|
435 | 435 | def gui(): |
|
436 | 436 | '''Are we running in a GUI?''' |
|
437 | 437 | if pycompat.isdarwin: |
|
438 | 438 | if b'SSH_CONNECTION' in encoding.environ: |
|
439 | 439 | # handle SSH access to a box where the user is logged in |
|
440 | 440 | return False |
|
441 | 441 | elif getattr(osutil, 'isgui', None): |
|
442 | 442 | # check if a CoreGraphics session is available |
|
443 | 443 | return osutil.isgui() |
|
444 | 444 | else: |
|
445 | 445 | # pure build; use a safe default |
|
446 | 446 | return True |
|
447 | 447 | else: |
|
448 | 448 | return pycompat.iswindows or encoding.environ.get(b"DISPLAY") |
|
449 | 449 | |
|
450 | 450 | |
|
451 | 451 | def hgcmd(): |
|
452 | 452 | """Return the command used to execute current hg |
|
453 | 453 | |
|
454 | 454 | This is different from hgexecutable() because on Windows we want |
|
455 | 455 | to avoid things opening new shell windows like batch files, so we |
|
456 | 456 | get either the python call or current executable. |
|
457 | 457 | """ |
|
458 | 458 | if mainfrozen(): |
|
459 | 459 | if getattr(sys, 'frozen', None) == b'macosx_app': |
|
460 | 460 | # Env variable set by py2app |
|
461 | 461 | return [encoding.environ[b'EXECUTABLEPATH']] |
|
462 | 462 | else: |
|
463 | 463 | return [pycompat.sysexecutable] |
|
464 | 464 | return _gethgcmd() |
|
465 | 465 | |
|
466 | 466 | |
|
467 | 467 | def rundetached(args, condfn): |
|
468 | 468 | """Execute the argument list in a detached process. |
|
469 | 469 | |
|
470 | 470 | condfn is a callable which is called repeatedly and should return |
|
471 | 471 | True once the child process is known to have started successfully. |
|
472 | 472 | At this point, the child process PID is returned. If the child |
|
473 | 473 | process fails to start or finishes before condfn() evaluates to |
|
474 | 474 | True, return -1. |
|
475 | 475 | """ |
|
476 | 476 | # Windows case is easier because the child process is either |
|
477 | 477 | # successfully starting and validating the condition or exiting |
|
478 | 478 | # on failure. We just poll on its PID. On Unix, if the child |
|
479 | 479 | # process fails to start, it will be left in a zombie state until |
|
480 | 480 | # the parent wait on it, which we cannot do since we expect a long |
|
481 | 481 | # the parent waits on it, which we cannot do since we expect a long
|
482 | 482 | # us our child process terminated. |
|
483 | 483 | terminated = set() |
|
484 | 484 | |
|
485 | 485 | def handler(signum, frame): |
|
486 | 486 | terminated.add(os.wait()) |
|
487 | 487 | |
|
488 | 488 | prevhandler = None |
|
489 | 489 | SIGCHLD = getattr(signal, 'SIGCHLD', None) |
|
490 | 490 | if SIGCHLD is not None: |
|
491 | 491 | prevhandler = signal.signal(SIGCHLD, handler) |
|
492 | 492 | try: |
|
493 | 493 | pid = spawndetached(args) |
|
494 | 494 | while not condfn(): |
|
495 | 495 | if (pid in terminated or not testpid(pid)) and not condfn(): |
|
496 | 496 | return -1 |
|
497 | 497 | time.sleep(0.1) |
|
498 | 498 | return pid |
|
499 | 499 | finally: |
|
500 | 500 | if prevhandler is not None: |
|
501 | 501 | signal.signal(signal.SIGCHLD, prevhandler) |
|
502 | 502 | |
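A hypothetical condfn for the polling loop above, treating the daemon as started once its pid file exists; the path and the commented-out invocation are purely illustrative:

    import os.path

    pidfile = '/tmp/hg-serve.pid'  # illustrative path

    def condfn():
        # rundetached() keeps polling until this returns True or the child dies.
        return os.path.exists(pidfile)

    # pid = rundetached([b'hg', b'serve', b'--pid-file', pidfile.encode()], condfn)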
|
503 | 503 | |
|
504 | 504 | @contextlib.contextmanager |
|
505 | 505 | def uninterruptible(warn): |
|
506 | 506 | """Inhibit SIGINT handling on a region of code. |
|
507 | 507 | |
|
508 | 508 | Note that if this is called in a non-main thread, it turns into a no-op. |
|
509 | 509 | |
|
510 | 510 | Args: |
|
511 | 511 | warn: A callable which takes no arguments, and returns True if the |
|
512 | 512 | previous signal handling should be restored. |
|
513 | 513 | """ |
|
514 | 514 | |
|
515 | 515 | oldsiginthandler = [signal.getsignal(signal.SIGINT)] |
|
516 | 516 | shouldbail = [] |
|
517 | 517 | |
|
518 | 518 | def disabledsiginthandler(*args): |
|
519 | 519 | if warn(): |
|
520 | 520 | signal.signal(signal.SIGINT, oldsiginthandler[0]) |
|
521 | 521 | del oldsiginthandler[0] |
|
522 | 522 | shouldbail.append(True) |
|
523 | 523 | |
|
524 | 524 | try: |
|
525 | 525 | try: |
|
526 | 526 | signal.signal(signal.SIGINT, disabledsiginthandler) |
|
527 | 527 | except ValueError: |
|
528 | 528 | # wrong thread, oh well, we tried |
|
529 | 529 | del oldsiginthandler[0] |
|
530 | 530 | yield |
|
531 | 531 | finally: |
|
532 | 532 | if oldsiginthandler: |
|
533 | 533 | signal.signal(signal.SIGINT, oldsiginthandler[0]) |
|
534 | 534 | if shouldbail: |
|
535 | 535 | raise KeyboardInterrupt |
|
536 | 536 | |
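A trimmed-down, standalone version of the same idea (without the warn() hook or the deferred KeyboardInterrupt re-raise), just to show the handler swap around a critical section:

    import contextlib
    import signal

    @contextlib.contextmanager
    def ignoring_sigint():
        # Park SIGINT on SIG_IGN for the duration of the block, then restore.
        old = signal.signal(signal.SIGINT, signal.SIG_IGN)
        try:
            yield
        finally:
            signal.signal(signal.SIGINT, old)

    with ignoring_sigint():
        pass  # critical section: Ctrl-C is ignored here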
|
537 | 537 | |
|
538 | 538 | if pycompat.iswindows: |
|
539 | 539 | # no fork on Windows, but we can create a detached process |
|
540 | 540 | # https://msdn.microsoft.com/en-us/library/windows/desktop/ms684863.aspx |
|
541 | 541 | # No stdlib constant exists for this value |
|
542 | 542 | DETACHED_PROCESS = 0x00000008 |
|
543 | 543 | # The following creation flags might create a console GUI window.

544 | 544 | # Using subprocess.CREATE_NEW_CONSOLE might help.
|
545 | 545 | # See https://phab.mercurial-scm.org/D1701 for discussion |
|
546 | 546 | _creationflags = DETACHED_PROCESS | subprocess.CREATE_NEW_PROCESS_GROUP |
|
547 | 547 | |
|
548 | 548 | def runbgcommand( |
|
549 | 549 | script, env, shell=False, stdout=None, stderr=None, ensurestart=True |
|
550 | 550 | ): |
|
551 | 551 | '''Spawn a command without waiting for it to finish.''' |
|
552 | 552 | # we can't use close_fds *and* redirect stdin. I'm not sure that we |
|
553 | 553 | # need to because the detached process has no console connection. |
|
554 | 554 | subprocess.Popen( |
|
555 | 555 | tonativestr(script), |
|
556 | 556 | shell=shell, |
|
557 | 557 | env=tonativeenv(env), |
|
558 | 558 | close_fds=True, |
|
559 | 559 | creationflags=_creationflags, |
|
560 | 560 | stdout=stdout, |
|
561 | 561 | stderr=stderr, |
|
562 | 562 | ) |
|
563 | 563 | |
|
564 | 564 | |
|
565 | 565 | else: |
|
566 | 566 | |
|
567 | 567 | def runbgcommand( |
|
568 | 568 | cmd, env, shell=False, stdout=None, stderr=None, ensurestart=True |
|
569 | 569 | ): |
|
570 | 570 | '''Spawn a command without waiting for it to finish.''' |
|
571 | 571 | # double-fork to completely detach from the parent process |
|
572 | 572 | # based on http://code.activestate.com/recipes/278731 |
|
573 | 573 | pid = os.fork() |
|
574 | 574 | if pid: |
|
575 | 575 | if not ensurestart: |
|
576 | 576 | return |
|
577 | 577 | # Parent process |
|
578 | 578 | (_pid, status) = os.waitpid(pid, 0) |
|
579 | 579 | if os.WIFEXITED(status): |
|
580 | 580 | returncode = os.WEXITSTATUS(status) |
|
581 | 581 | else: |
|
582 | 582 | returncode = -(os.WTERMSIG(status)) |
|
583 | 583 | if returncode != 0: |
|
584 | 584 | # The child process's return code is 0 on success, an errno |
|
585 | 585 | # value on failure, or 255 if we don't have a valid errno |
|
586 | 586 | # value. |
|
587 | 587 | # |
|
588 | 588 | # (It would be slightly nicer to return the full exception info |
|
589 | 589 | # over a pipe as the subprocess module does. For now it |
|
590 | 590 | # doesn't seem worth adding that complexity here, though.) |
|
591 | 591 | if returncode == 255: |
|
592 | 592 | returncode = errno.EINVAL |
|
593 | 593 | raise OSError( |
|
594 | 594 | returncode, |
|
595 | 595 | b'error running %r: %s' % (cmd, os.strerror(returncode)), |
|
596 | 596 | ) |
|
597 | 597 | return |
|
598 | 598 | |
|
599 | 599 | returncode = 255 |
|
600 | 600 | try: |
|
601 | 601 | # Start a new session |
|
602 | 602 | os.setsid() |
|
603 | 603 | |
|
604 | 604 | stdin = open(os.devnull, b'r') |
|
605 | 605 | if stdout is None: |
|
606 | 606 | stdout = open(os.devnull, b'w') |
|
607 | 607 | if stderr is None: |
|
608 | 608 | stderr = open(os.devnull, b'w') |
|
609 | 609 | |
|
610 | 610 | # connect stdin to devnull to make sure the subprocess can't |
|
611 | 611 | # muck up that stream for mercurial. |
|
612 | 612 | subprocess.Popen( |
|
613 | 613 | cmd, |
|
614 | 614 | shell=shell, |
|
615 | 615 | env=env, |
|
616 | 616 | close_fds=True, |
|
617 | 617 | stdin=stdin, |
|
618 | 618 | stdout=stdout, |
|
619 | 619 | stderr=stderr, |
|
620 | 620 | ) |
|
621 | 621 | returncode = 0 |
|
622 | 622 | except EnvironmentError as ex: |
|
623 | 623 | returncode = ex.errno & 0xFF |
|
624 | 624 | if returncode == 0: |
|
625 | 625 | # This shouldn't happen, but just in case make sure the |
|
626 | 626 | # return code is never 0 here. |
|
627 | 627 | returncode = 255 |
|
628 | 628 | except Exception: |
|
629 | 629 | returncode = 255 |
|
630 | 630 | finally: |
|
631 | 631 | # mission accomplished, this child needs to exit and not |
|
632 | 632 | # continue the hg process here. |
|
633 | 633 | os._exit(returncode) |
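The POSIX branch is a double fork; a minimal standalone sketch of that shape (POSIX-only, and unlike the real function it does not report the child's errno back through the exit status):

    import os
    import subprocess

    def spawn_detached(cmd):
        pid = os.fork()
        if pid:
            os.waitpid(pid, 0)  # reap the intermediate child and return
            return
        try:
            # Intermediate child: new session, start the real command with
            # stdin on /dev/null, then exit so the grandchild is reparented.
            os.setsid()
            with open(os.devnull, 'rb') as nullin:
                subprocess.Popen(cmd, close_fds=True, stdin=nullin)
        finally:
            os._exit(0)

    spawn_detached(['sleep', '1'])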