py3: use pycompat.byteskwargs in hgext/convert/...
Pulkit Goyal
r36347:93943eef default
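This change threads **kwargs through pycompat.byteskwargs so that keyword
argument keys, which arrive as unicode str under Python 3, are converted back
to bytes before the extension's byte-keyed dict lookups. A minimal sketch of
that conversion (editorial illustration; the real helper lives in
mercurial/pycompat.py):

    def byteskwargs(dic):
        # Re-encode str keys produced by **kwargs on Python 3 as bytes so
        # callers can keep using b'...' keys uniformly across Python 2 and 3.
        return dict((k.encode('latin-1'), v) for k, v in dic.items())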
@@ -1,493 +1,495 b''
1 1 # common.py - common code for the convert extension
2 2 #
3 3 # Copyright 2005-2009 Matt Mackall <mpm@selenic.com> and others
4 4 #
5 5 # This software may be used and distributed according to the terms of the
6 6 # GNU General Public License version 2 or any later version.
7 7 from __future__ import absolute_import
8 8
9 9 import base64
10 10 import datetime
11 11 import errno
12 12 import os
13 13 import re
14 14 import subprocess
15 15
16 16 from mercurial.i18n import _
17 17 from mercurial import (
18 18 encoding,
19 19 error,
20 20 phases,
21 pycompat,
21 22 util,
22 23 )
23 24
24 25 pickle = util.pickle
25 26 propertycache = util.propertycache
26 27
27 28 def encodeargs(args):
28 29 def encodearg(s):
29 30 lines = base64.encodestring(s)
30 31 lines = [l.splitlines()[0] for l in lines]
31 32 return ''.join(lines)
32 33
33 34 s = pickle.dumps(args)
34 35 return encodearg(s)
35 36
36 37 def decodeargs(s):
37 38 s = base64.decodestring(s)
38 39 return pickle.loads(s)
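# Editorial illustration (not part of this change): encodeargs/decodeargs are
# a pickle+base64 round-trip used to smuggle structured arguments through a
# child-process command line, e.g.:
#   s = encodeargs(['rev1', {'full': True}])  # one newline-free base64 line
#   assert decodeargs(s) == ['rev1', {'full': True}]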
39 40
40 41 class MissingTool(Exception):
41 42 pass
42 43
43 44 def checktool(exe, name=None, abort=True):
44 45 name = name or exe
45 46 if not util.findexe(exe):
46 47 if abort:
47 48 exc = error.Abort
48 49 else:
49 50 exc = MissingTool
50 51 raise exc(_('cannot find required "%s" tool') % name)
51 52
52 53 class NoRepo(Exception):
53 54 pass
54 55
55 56 SKIPREV = 'SKIP'
56 57
57 58 class commit(object):
58 59 def __init__(self, author, date, desc, parents, branch=None, rev=None,
59 60 extra=None, sortkey=None, saverev=True, phase=phases.draft,
60 61 optparents=None):
61 62 self.author = author or 'unknown'
62 63 self.date = date or '0 0'
63 64 self.desc = desc
64 65 self.parents = parents # will be converted and used as parents
65 66 self.optparents = optparents or [] # will be used if already converted
66 67 self.branch = branch
67 68 self.rev = rev
68 69 self.extra = extra or {}
69 70 self.sortkey = sortkey
70 71 self.saverev = saverev
71 72 self.phase = phase
72 73
73 74 class converter_source(object):
74 75 """Conversion source interface"""
75 76
76 77 def __init__(self, ui, repotype, path=None, revs=None):
77 78 """Initialize conversion source (or raise NoRepo("message")
78 79 exception if path is not a valid repository)"""
79 80 self.ui = ui
80 81 self.path = path
81 82 self.revs = revs
82 83 self.repotype = repotype
83 84
84 85 self.encoding = 'utf-8'
85 86
86 87 def checkhexformat(self, revstr, mapname='splicemap'):
87 88 """ fails if revstr is not a 40 byte hex. mercurial and git both uses
88 89 such format for their revision numbering
89 90 """
90 91 if not re.match(r'[0-9a-fA-F]{40,40}$', revstr):
91 92 raise error.Abort(_('%s entry %s is not a valid revision'
92 93 ' identifier') % (mapname, revstr))
93 94
94 95 def before(self):
95 96 pass
96 97
97 98 def after(self):
98 99 pass
99 100
100 101 def targetfilebelongstosource(self, targetfilename):
101 102 """Returns true if the given targetfile belongs to the source repo. This
102 103 is useful when only a subdirectory of the target belongs to the source
103 104 repo."""
104 105 # For normal full repo converts, this is always True.
105 106 return True
106 107
107 108 def setrevmap(self, revmap):
108 109 """set the map of already-converted revisions"""
109 110
110 111 def getheads(self):
111 112 """Return a list of this repository's heads"""
112 113 raise NotImplementedError
113 114
114 115 def getfile(self, name, rev):
115 116 """Return a pair (data, mode) where data is the file content
116 117 as a string and mode one of '', 'x' or 'l'. rev is the
117 118 identifier returned by a previous call to getchanges().
118 119 Data is None if file is missing/deleted in rev.
119 120 """
120 121 raise NotImplementedError
121 122
122 123 def getchanges(self, version, full):
123 124 """Returns a tuple of (files, copies, cleanp2).
124 125
125 126 files is a sorted list of (filename, id) tuples for all files
126 127 changed between version and its first parent returned by
127 128 getcommit(). If full, all files in that revision are returned.
128 129 id is the source revision id of the file.
129 130
130 131 copies is a dictionary of dest: source
131 132
132 133 cleanp2 is the set of filenames that are clean against p2.
133 134 (Files that are clean against p1 are already not in files (unless
134 135 full). This makes it possible to handle p2 clean files similarly.)
135 136 """
136 137 raise NotImplementedError
137 138
138 139 def getcommit(self, version):
139 140 """Return the commit object for version"""
140 141 raise NotImplementedError
141 142
142 143 def numcommits(self):
143 144 """Return the number of commits in this source.
144 145
145 146 If unknown, return None.
146 147 """
147 148 return None
148 149
149 150 def gettags(self):
150 151 """Return the tags as a dictionary of name: revision
151 152
152 153 Tag names must be UTF-8 strings.
153 154 """
154 155 raise NotImplementedError
155 156
156 157 def recode(self, s, encoding=None):
157 158 if not encoding:
158 159 encoding = self.encoding or 'utf-8'
159 160
160 161 if isinstance(s, unicode):
161 162 return s.encode("utf-8")
162 163 try:
163 164 return s.decode(encoding).encode("utf-8")
164 165 except UnicodeError:
165 166 try:
166 167 return s.decode("latin-1").encode("utf-8")
167 168 except UnicodeError:
168 169 return s.decode(encoding, "replace").encode("utf-8")
169 170
170 171 def getchangedfiles(self, rev, i):
171 172 """Return the files changed by rev compared to parent[i].
172 173
173 174 i is an index selecting one of the parents of rev. The return
174 175 value should be the list of files that are different in rev and
175 176 this parent.
176 177
177 178 If rev has no parents, i is None.
178 179
179 180 This function is only needed to support --filemap
180 181 """
181 182 raise NotImplementedError
182 183
183 184 def converted(self, rev, sinkrev):
184 185 '''Notify the source that a revision has been converted.'''
185 186
186 187 def hasnativeorder(self):
187 188 """Return true if this source has a meaningful, native revision
188 189 order. For instance, Mercurial revisions are stored sequentially
189 190 while there is no such global ordering with Darcs.
190 191 """
191 192 return False
192 193
193 194 def hasnativeclose(self):
194 195 """Return true if this source has ability to close branch.
195 196 """
196 197 return False
197 198
198 199 def lookuprev(self, rev):
199 200 """If rev is a meaningful revision reference in source, return
200 201 the referenced identifier in the same format used by getcommit().
201 202 return None otherwise.
202 203 """
203 204 return None
204 205
205 206 def getbookmarks(self):
206 207 """Return the bookmarks as a dictionary of name: revision
207 208
208 209 Bookmark names are to be UTF-8 strings.
209 210 """
210 211 return {}
211 212
212 213 def checkrevformat(self, revstr, mapname='splicemap'):
213 214 """revstr is a string that describes a revision in the given
214 215 source control system. Return true if revstr has correct
215 216 format.
216 217 """
217 218 return True
218 219
219 220 class converter_sink(object):
220 221 """Conversion sink (target) interface"""
221 222
222 223 def __init__(self, ui, repotype, path):
223 224 """Initialize conversion sink (or raise NoRepo("message")
224 225 exception if path is not a valid repository)
225 226
226 227 created is a list of paths to remove if a fatal error occurs
227 228 later"""
228 229 self.ui = ui
229 230 self.path = path
230 231 self.created = []
231 232 self.repotype = repotype
232 233
233 234 def revmapfile(self):
234 235 """Path to a file that will contain lines
235 236 source_rev_id sink_rev_id
236 237 mapping equivalent revision identifiers for each system."""
237 238 raise NotImplementedError
238 239
239 240 def authorfile(self):
240 241 """Path to a file that will contain lines
241 242 srcauthor=dstauthor
242 243 mapping equivalent author identifiers for each system."""
243 244 return None
244 245
245 246 def putcommit(self, files, copies, parents, commit, source, revmap, full,
246 247 cleanp2):
247 248 """Create a revision with all changed files listed in 'files'
248 249 and having listed parents. 'commit' is a commit object
249 250 containing at a minimum the author, date, and message for this
250 251 changeset. 'files' is a list of (path, version) tuples,
251 252 'copies' is a dictionary mapping destinations to sources,
252 253 'source' is the source repository, and 'revmap' is a mapfile
253 254 of source revisions to converted revisions. Only getfile() and
254 255 lookuprev() should be called on 'source'. 'full' means that 'files'
255 256 is complete and all other files should be removed.
256 257 'cleanp2' is a set of the filenames that are unchanged from p2
257 258 (only in the common merge case where there are two parents).
258 259
259 260 Note that the sink repository is not told to update itself to
260 261 a particular revision (or even what that revision would be)
261 262 before it receives the file data.
262 263 """
263 264 raise NotImplementedError
264 265
265 266 def puttags(self, tags):
266 267 """Put tags into sink.
267 268
268 269 tags: {tagname: sink_rev_id, ...} where tagname is a UTF-8 string.
269 270 Return a pair (tag_revision, tag_parent_revision), or (None, None)
270 271 if nothing was changed.
271 272 """
272 273 raise NotImplementedError
273 274
274 275 def setbranch(self, branch, pbranches):
275 276 """Set the current branch name. Called before the first putcommit
276 277 on the branch.
277 278 branch: branch name for subsequent commits
278 279 pbranches: (converted parent revision, parent branch) tuples"""
279 280
280 281 def setfilemapmode(self, active):
281 282 """Tell the destination that we're using a filemap
282 283
283 284 Some converter_sources (svn in particular) can claim that a file
284 285 was changed in a revision, even if there was no change. This method
285 286 tells the destination that we're using a filemap and that it should
286 287 filter empty revisions.
287 288 """
288 289
289 290 def before(self):
290 291 pass
291 292
292 293 def after(self):
293 294 pass
294 295
295 296 def putbookmarks(self, bookmarks):
296 297 """Put bookmarks into sink.
297 298
298 299 bookmarks: {bookmarkname: sink_rev_id, ...}
299 300 where bookmarkname is a UTF-8 string.
300 301 """
301 302
302 303 def hascommitfrommap(self, rev):
303 304 """Return False if a rev mentioned in a filemap is known to not be
304 305 present."""
305 306 raise NotImplementedError
306 307
307 308 def hascommitforsplicemap(self, rev):
308 309 """This method is for the special needs for splicemap handling and not
309 310 for general use. Returns True if the sink contains rev, aborts on some
310 311 special cases."""
311 312 raise NotImplementedError
312 313
313 314 class commandline(object):
314 315 def __init__(self, ui, command):
315 316 self.ui = ui
316 317 self.command = command
317 318
318 319 def prerun(self):
319 320 pass
320 321
321 322 def postrun(self):
322 323 pass
323 324
324 325 def _cmdline(self, cmd, *args, **kwargs):
326 kwargs = pycompat.byteskwargs(kwargs)
325 327 cmdline = [self.command, cmd] + list(args)
326 328 for k, v in kwargs.iteritems():
327 329 if len(k) == 1:
328 330 cmdline.append('-' + k)
329 331 else:
330 332 cmdline.append('--' + k.replace('_', '-'))
331 333 try:
332 334 if len(k) == 1:
333 335 cmdline.append('' + v)
334 336 else:
335 337 cmdline[-1] += '=' + v
336 338 except TypeError:
337 339 pass
338 340 cmdline = [util.shellquote(arg) for arg in cmdline]
339 341 if not self.ui.debugflag:
340 342 cmdline += ['2>', os.devnull]
341 343 cmdline = ' '.join(cmdline)
342 344 return cmdline
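# Editorial example: with self.command = 'cvs', a call like
#   self._cmdline('log', 'file.c', r=True, branch='stable')
# shell-quotes and joins to roughly
#   cvs log file.c -r --branch=stable 2> /dev/null
# Boolean values hit the TypeError branch when concatenated, so they become
# bare flags; kwargs order follows dict iteration order.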
343 345
344 346 def _run(self, cmd, *args, **kwargs):
345 347 def popen(cmdline):
346 348 p = subprocess.Popen(cmdline, shell=True, bufsize=-1,
347 349 close_fds=util.closefds,
348 350 stdout=subprocess.PIPE)
349 351 return p
350 352 return self._dorun(popen, cmd, *args, **kwargs)
351 353
352 354 def _run2(self, cmd, *args, **kwargs):
353 355 return self._dorun(util.popen2, cmd, *args, **kwargs)
354 356
355 357 def _run3(self, cmd, *args, **kwargs):
356 358 return self._dorun(util.popen3, cmd, *args, **kwargs)
357 359
358 360 def _dorun(self, openfunc, cmd, *args, **kwargs):
359 361 cmdline = self._cmdline(cmd, *args, **kwargs)
360 362 self.ui.debug('running: %s\n' % (cmdline,))
361 363 self.prerun()
362 364 try:
363 365 return openfunc(cmdline)
364 366 finally:
365 367 self.postrun()
366 368
367 369 def run(self, cmd, *args, **kwargs):
368 370 p = self._run(cmd, *args, **kwargs)
369 371 output = p.communicate()[0]
370 372 self.ui.debug(output)
371 373 return output, p.returncode
372 374
373 375 def runlines(self, cmd, *args, **kwargs):
374 376 p = self._run(cmd, *args, **kwargs)
375 377 output = p.stdout.readlines()
376 378 p.wait()
377 379 self.ui.debug(''.join(output))
378 380 return output, p.returncode
379 381
380 382 def checkexit(self, status, output=''):
381 383 if status:
382 384 if output:
383 385 self.ui.warn(_('%s error:\n') % self.command)
384 386 self.ui.warn(output)
385 387 msg = util.explainexit(status)[0]
386 388 raise error.Abort('%s %s' % (self.command, msg))
387 389
388 390 def run0(self, cmd, *args, **kwargs):
389 391 output, status = self.run(cmd, *args, **kwargs)
390 392 self.checkexit(status, output)
391 393 return output
392 394
393 395 def runlines0(self, cmd, *args, **kwargs):
394 396 output, status = self.runlines(cmd, *args, **kwargs)
395 397 self.checkexit(status, ''.join(output))
396 398 return output
397 399
398 400 @propertycache
399 401 def argmax(self):
400 402 # POSIX requires at least 4096 bytes for ARG_MAX
401 403 argmax = 4096
402 404 try:
403 405 argmax = os.sysconf("SC_ARG_MAX")
404 406 except (AttributeError, ValueError):
405 407 pass
406 408
407 409 # Windows shells impose their own limits on command line length,
408 410 # down to 2047 bytes for cmd.exe under Windows NT/2k and 2500 bytes
409 411 # for older 4nt.exe. See http://support.microsoft.com/kb/830473 for
410 412 # details about cmd.exe limitations.
411 413
412 414 # Since ARG_MAX is for command line _and_ environment, lower our limit
413 415 # (and make happy Windows shells while doing this).
414 416 return argmax // 2 - 1
415 417
416 418 def _limit_arglist(self, arglist, cmd, *args, **kwargs):
417 419 cmdlen = len(self._cmdline(cmd, *args, **kwargs))
418 420 limit = self.argmax - cmdlen
419 421 bytes = 0
420 422 fl = []
421 423 for fn in arglist:
422 424 b = len(fn) + 3
423 425 if bytes + b < limit or len(fl) == 0:
424 426 fl.append(fn)
425 427 bytes += b
426 428 else:
427 429 yield fl
428 430 fl = [fn]
429 431 bytes = b
430 432 if fl:
431 433 yield fl
432 434
433 435 def xargs(self, arglist, cmd, *args, **kwargs):
434 436 for l in self._limit_arglist(arglist, cmd, *args, **kwargs):
435 437 self.run0(cmd, *(list(args) + l), **kwargs)
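# Editorial note: xargs() mirrors xargs(1). _limit_arglist() splits a long
# file list into chunks whose combined quoted length stays under argmax, and
# run0() executes once per chunk, e.g. (hypothetical sink with command 'cvs'):
#   self.xargs(files, 'add')    # runs "cvs add f1 f2 ..." once per chunk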
436 438
437 439 class mapfile(dict):
438 440 def __init__(self, ui, path):
439 441 super(mapfile, self).__init__()
440 442 self.ui = ui
441 443 self.path = path
442 444 self.fp = None
443 445 self.order = []
444 446 self._read()
445 447
446 448 def _read(self):
447 449 if not self.path:
448 450 return
449 451 try:
450 452 fp = open(self.path, 'rb')
451 453 except IOError as err:
452 454 if err.errno != errno.ENOENT:
453 455 raise
454 456 return
455 457 for i, line in enumerate(util.iterfile(fp)):
456 458 line = line.splitlines()[0].rstrip()
457 459 if not line:
458 460 # Ignore blank lines
459 461 continue
460 462 try:
461 463 key, value = line.rsplit(' ', 1)
462 464 except ValueError:
463 465 raise error.Abort(
464 466 _('syntax error in %s(%d): key/value pair expected')
465 467 % (self.path, i + 1))
466 468 if key not in self:
467 469 self.order.append(key)
468 470 super(mapfile, self).__setitem__(key, value)
469 471 fp.close()
470 472
471 473 def __setitem__(self, key, value):
472 474 if self.fp is None:
473 475 try:
474 476 self.fp = open(self.path, 'ab')
475 477 except IOError as err:
476 478 raise error.Abort(
477 479 _('could not open map file %r: %s') %
478 480 (self.path, encoding.strtolocal(err.strerror)))
479 481 self.fp.write(util.tonativeeol('%s %s\n' % (key, value)))
480 482 self.fp.flush()
481 483 super(mapfile, self).__setitem__(key, value)
482 484
483 485 def close(self):
484 486 if self.fp:
485 487 self.fp.close()
486 488 self.fp = None
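# Editorial sketch of the mapfile format: one "key value" pair per line,
# appended on assignment and replayed by _read() when the map is reopened:
#   m = mapfile(ui, b'rev-map')
#   m[b'srcrev'] = b'dstrev'    # appends "srcrev dstrev\n" and flushes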
487 489
488 490 def makedatetimestamp(t):
489 491 """Like util.makedate() but for time t instead of current time"""
490 492 delta = (datetime.datetime.utcfromtimestamp(t) -
491 493 datetime.datetime.fromtimestamp(t))
492 494 tz = delta.days * 86400 + delta.seconds
493 495 return t, tz
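makedatetimestamp() above recovers the local UTC offset in effect at time t by
differencing the naive UTC and local datetimes. A quick sanity check of the
idea (editorial sketch; assumes a fixed-offset local zone):

    import datetime
    t = 1200000000.0
    delta = (datetime.datetime.utcfromtimestamp(t)
             - datetime.datetime.fromtimestamp(t))
    tz = delta.days * 86400 + delta.seconds
    # On a UTC+2 machine tz == -7200: offsets are stored as seconds west of
    # UTC, matching the (unixtime, offset) pairs produced by util.makedate().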
@@ -1,617 +1,618 b''
1 1 # convcmd - convert extension commands definition
2 2 #
3 3 # Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
4 4 #
5 5 # This software may be used and distributed according to the terms of the
6 6 # GNU General Public License version 2 or any later version.
7 7 from __future__ import absolute_import
8 8
9 9 import collections
10 10 import os
11 11 import shlex
12 12 import shutil
13 13
14 14 from mercurial.i18n import _
15 15 from mercurial import (
16 16 encoding,
17 17 error,
18 18 hg,
19 19 pycompat,
20 20 scmutil,
21 21 util,
22 22 )
23 23
24 24 from . import (
25 25 bzr,
26 26 common,
27 27 cvs,
28 28 darcs,
29 29 filemap,
30 30 git,
31 31 gnuarch,
32 32 hg as hgconvert,
33 33 monotone,
34 34 p4,
35 35 subversion,
36 36 )
37 37
38 38 mapfile = common.mapfile
39 39 MissingTool = common.MissingTool
40 40 NoRepo = common.NoRepo
41 41 SKIPREV = common.SKIPREV
42 42
43 43 bzr_source = bzr.bzr_source
44 44 convert_cvs = cvs.convert_cvs
45 45 convert_git = git.convert_git
46 46 darcs_source = darcs.darcs_source
47 47 gnuarch_source = gnuarch.gnuarch_source
48 48 mercurial_sink = hgconvert.mercurial_sink
49 49 mercurial_source = hgconvert.mercurial_source
50 50 monotone_source = monotone.monotone_source
51 51 p4_source = p4.p4_source
52 52 svn_sink = subversion.svn_sink
53 53 svn_source = subversion.svn_source
54 54
55 55 orig_encoding = 'ascii'
56 56
57 57 def recode(s):
58 58 if isinstance(s, unicode):
59 59 return s.encode(pycompat.sysstr(orig_encoding), 'replace')
60 60 else:
61 61 return s.decode('utf-8').encode(
62 62 pycompat.sysstr(orig_encoding), 'replace')
63 63
64 64 def mapbranch(branch, branchmap):
65 65 '''
66 66 >>> bmap = {b'default': b'branch1'}
67 67 >>> for i in [b'', None]:
68 68 ... mapbranch(i, bmap)
69 69 'branch1'
70 70 'branch1'
71 71 >>> bmap = {b'None': b'branch2'}
72 72 >>> for i in [b'', None]:
73 73 ... mapbranch(i, bmap)
74 74 'branch2'
75 75 'branch2'
76 76 >>> bmap = {b'None': b'branch3', b'default': b'branch4'}
77 77 >>> for i in [b'None', b'', None, b'default', b'branch5']:
78 78 ... mapbranch(i, bmap)
79 79 'branch3'
80 80 'branch4'
81 81 'branch4'
82 82 'branch4'
83 83 'branch5'
84 84 '''
85 85 # If branch is None or empty, this commit is coming from the source
86 86 # repository's default branch and destined for the default branch in the
87 87 # destination repository. For such commits, using a literal "default"
88 88 # in branchmap below allows the user to map "default" to an alternate
89 89 # default branch in the destination repository.
90 90 branch = branchmap.get(branch or 'default', branch)
91 91 # At some point we used "None" literal to denote the default branch,
92 92 # attempt to use that for backward compatibility.
93 93 if (not branch):
94 94 branch = branchmap.get('None', branch)
95 95 return branch
96 96
97 97 source_converters = [
98 98 ('cvs', convert_cvs, 'branchsort'),
99 99 ('git', convert_git, 'branchsort'),
100 100 ('svn', svn_source, 'branchsort'),
101 101 ('hg', mercurial_source, 'sourcesort'),
102 102 ('darcs', darcs_source, 'branchsort'),
103 103 ('mtn', monotone_source, 'branchsort'),
104 104 ('gnuarch', gnuarch_source, 'branchsort'),
105 105 ('bzr', bzr_source, 'branchsort'),
106 106 ('p4', p4_source, 'branchsort'),
107 107 ]
108 108
109 109 sink_converters = [
110 110 ('hg', mercurial_sink),
111 111 ('svn', svn_sink),
112 112 ]
113 113
114 114 def convertsource(ui, path, type, revs):
115 115 exceptions = []
116 116 if type and type not in [s[0] for s in source_converters]:
117 117 raise error.Abort(_('%s: invalid source repository type') % type)
118 118 for name, source, sortmode in source_converters:
119 119 try:
120 120 if not type or name == type:
121 121 return source(ui, name, path, revs), sortmode
122 122 except (NoRepo, MissingTool) as inst:
123 123 exceptions.append(inst)
124 124 if not ui.quiet:
125 125 for inst in exceptions:
126 126 ui.write("%s\n" % inst)
127 127 raise error.Abort(_('%s: missing or unsupported repository') % path)
128 128
129 129 def convertsink(ui, path, type):
130 130 if type and type not in [s[0] for s in sink_converters]:
131 131 raise error.Abort(_('%s: invalid destination repository type') % type)
132 132 for name, sink in sink_converters:
133 133 try:
134 134 if not type or name == type:
135 135 return sink(ui, name, path)
136 136 except NoRepo as inst:
137 137 ui.note(_("convert: %s\n") % inst)
138 138 except MissingTool as inst:
139 139 raise error.Abort('%s\n' % inst)
140 140 raise error.Abort(_('%s: unknown repository type') % path)
141 141
142 142 class progresssource(object):
143 143 def __init__(self, ui, source, filecount):
144 144 self.ui = ui
145 145 self.source = source
146 146 self.filecount = filecount
147 147 self.retrieved = 0
148 148
149 149 def getfile(self, file, rev):
150 150 self.retrieved += 1
151 151 self.ui.progress(_('getting files'), self.retrieved,
152 152 item=file, total=self.filecount, unit=_('files'))
153 153 return self.source.getfile(file, rev)
154 154
155 155 def targetfilebelongstosource(self, targetfilename):
156 156 return self.source.targetfilebelongstosource(targetfilename)
157 157
158 158 def lookuprev(self, rev):
159 159 return self.source.lookuprev(rev)
160 160
161 161 def close(self):
162 162 self.ui.progress(_('getting files'), None)
163 163
164 164 class converter(object):
165 165 def __init__(self, ui, source, dest, revmapfile, opts):
166 166
167 167 self.source = source
168 168 self.dest = dest
169 169 self.ui = ui
170 170 self.opts = opts
171 171 self.commitcache = {}
172 172 self.authors = {}
173 173 self.authorfile = None
174 174
175 175 # Record converted revisions persistently: maps source revision
176 176 # ID to target revision ID (both strings). (This is how
177 177 # incremental conversions work.)
178 178 self.map = mapfile(ui, revmapfile)
179 179
180 180 # Read first the dst author map if any
181 181 authorfile = self.dest.authorfile()
182 182 if authorfile and os.path.exists(authorfile):
183 183 self.readauthormap(authorfile)
184 184 # Extend/Override with new author map if necessary
185 185 if opts.get('authormap'):
186 186 self.readauthormap(opts.get('authormap'))
187 187 self.authorfile = self.dest.authorfile()
188 188
189 189 self.splicemap = self.parsesplicemap(opts.get('splicemap'))
190 190 self.branchmap = mapfile(ui, opts.get('branchmap'))
191 191
192 192 def parsesplicemap(self, path):
193 193 """ check and validate the splicemap format and
194 194 return a child/parents dictionary.
195 195 Format checking has two parts.
196 196 1. generic format which is same across all source types
197 197 2. specific format checking which may be different for
198 198 different source type. This logic is implemented in
199 199 checkrevformat function in source files like
200 200 hg.py, subversion.py etc.
201 201 """
202 202
203 203 if not path:
204 204 return {}
205 205 m = {}
206 206 try:
207 207 fp = open(path, 'rb')
208 208 for i, line in enumerate(util.iterfile(fp)):
209 209 line = line.splitlines()[0].rstrip()
210 210 if not line:
211 211 # Ignore blank lines
212 212 continue
213 213 # split line
214 214 lex = shlex.shlex(line, posix=True)
215 215 lex.whitespace_split = True
216 216 lex.whitespace += ','
217 217 line = list(lex)
218 218 # check number of parents
219 219 if not (2 <= len(line) <= 3):
220 220 raise error.Abort(_('syntax error in %s(%d): child parent1'
221 221 '[,parent2] expected') % (path, i + 1))
222 222 for part in line:
223 223 self.source.checkrevformat(part)
224 224 child, p1, p2 = line[0], line[1:2], line[2:]
225 225 if p1 == p2:
226 226 m[child] = p1
227 227 else:
228 228 m[child] = p1 + p2
229 229 # if file does not exist or error reading, exit
230 230 except IOError:
231 231 raise error.Abort(_('splicemap file not found or error reading %s:')
232 232 % path)
233 233 return m
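# Editorial recap of the splicemap format the parser above accepts: one entry
# per line, a child revision followed by one or two parents, separated by
# whitespace or commas:
#   <child-rev> <parent1-rev>[,<parent2-rev>]
# Every identifier is validated via the source's checkrevformat().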
234 234
235 235
236 236 def walktree(self, heads):
237 237 '''Return a mapping that identifies the uncommitted parents of every
238 238 uncommitted changeset.'''
239 239 visit = heads
240 240 known = set()
241 241 parents = {}
242 242 numcommits = self.source.numcommits()
243 243 while visit:
244 244 n = visit.pop(0)
245 245 if n in known:
246 246 continue
247 247 if n in self.map:
248 248 m = self.map[n]
249 249 if m == SKIPREV or self.dest.hascommitfrommap(m):
250 250 continue
251 251 known.add(n)
252 252 self.ui.progress(_('scanning'), len(known), unit=_('revisions'),
253 253 total=numcommits)
254 254 commit = self.cachecommit(n)
255 255 parents[n] = []
256 256 for p in commit.parents:
257 257 parents[n].append(p)
258 258 visit.append(p)
259 259 self.ui.progress(_('scanning'), None)
260 260
261 261 return parents
262 262
263 263 def mergesplicemap(self, parents, splicemap):
264 264 """A splicemap redefines child/parent relationships. Check the
265 265 map contains valid revision identifiers and merge the new
266 266 links in the source graph.
267 267 """
268 268 for c in sorted(splicemap):
269 269 if c not in parents:
270 270 if not self.dest.hascommitforsplicemap(self.map.get(c, c)):
271 271 # Could be in source but not converted during this run
272 272 self.ui.warn(_('splice map revision %s is not being '
273 273 'converted, ignoring\n') % c)
274 274 continue
275 275 pc = []
276 276 for p in splicemap[c]:
277 277 # We do not have to wait for nodes already in dest.
278 278 if self.dest.hascommitforsplicemap(self.map.get(p, p)):
279 279 continue
280 280 # Parent is not in dest and not being converted, not good
281 281 if p not in parents:
282 282 raise error.Abort(_('unknown splice map parent: %s') % p)
283 283 pc.append(p)
284 284 parents[c] = pc
285 285
286 286 def toposort(self, parents, sortmode):
287 287 '''Return an ordering such that every uncommitted changeset is
288 288 preceded by all its uncommitted ancestors.'''
289 289
290 290 def mapchildren(parents):
291 291 """Return a (children, roots) tuple where 'children' maps parent
292 292 revision identifiers to children ones, and 'roots' is the list of
293 293 revisions without parents. 'parents' must be a mapping from each
294 294 revision identifier to its parent revisions.
295 295 """
296 296 visit = collections.deque(sorted(parents))
297 297 seen = set()
298 298 children = {}
299 299 roots = []
300 300
301 301 while visit:
302 302 n = visit.popleft()
303 303 if n in seen:
304 304 continue
305 305 seen.add(n)
306 306 # Ensure that nodes without parents are present in the
307 307 # 'children' mapping.
308 308 children.setdefault(n, [])
309 309 hasparent = False
310 310 for p in parents[n]:
311 311 if p not in self.map:
312 312 visit.append(p)
313 313 hasparent = True
314 314 children.setdefault(p, []).append(n)
315 315 if not hasparent:
316 316 roots.append(n)
317 317
318 318 return children, roots
319 319
320 320 # Sort functions are supposed to take a list of revisions which
321 321 # can be converted immediately and pick one
322 322
323 323 def makebranchsorter():
324 324 """If the previously converted revision has a child in the
325 325 eligible revisions list, pick it. Return the list head
326 326 otherwise. Branch sort attempts to minimize branch
327 327 switching, which is harmful for Mercurial backend
328 328 compression.
329 329 """
330 330 prev = [None]
331 331 def picknext(nodes):
332 332 next = nodes[0]
333 333 for n in nodes:
334 334 if prev[0] in parents[n]:
335 335 next = n
336 336 break
337 337 prev[0] = next
338 338 return next
339 339 return picknext
340 340
341 341 def makesourcesorter():
342 342 """Source specific sort."""
343 343 keyfn = lambda n: self.commitcache[n].sortkey
344 344 def picknext(nodes):
345 345 return sorted(nodes, key=keyfn)[0]
346 346 return picknext
347 347
348 348 def makeclosesorter():
349 349 """Close order sort."""
350 350 keyfn = lambda n: ('close' not in self.commitcache[n].extra,
351 351 self.commitcache[n].sortkey)
352 352 def picknext(nodes):
353 353 return sorted(nodes, key=keyfn)[0]
354 354 return picknext
355 355
356 356 def makedatesorter():
357 357 """Sort revisions by date."""
358 358 dates = {}
359 359 def getdate(n):
360 360 if n not in dates:
361 361 dates[n] = util.parsedate(self.commitcache[n].date)
362 362 return dates[n]
363 363
364 364 def picknext(nodes):
365 365 return min([(getdate(n), n) for n in nodes])[1]
366 366
367 367 return picknext
368 368
369 369 if sortmode == 'branchsort':
370 370 picknext = makebranchsorter()
371 371 elif sortmode == 'datesort':
372 372 picknext = makedatesorter()
373 373 elif sortmode == 'sourcesort':
374 374 picknext = makesourcesorter()
375 375 elif sortmode == 'closesort':
376 376 picknext = makeclosesorter()
377 377 else:
378 378 raise error.Abort(_('unknown sort mode: %s') % sortmode)
379 379
380 380 children, actives = mapchildren(parents)
381 381
382 382 s = []
383 383 pendings = {}
384 384 while actives:
385 385 n = picknext(actives)
386 386 actives.remove(n)
387 387 s.append(n)
388 388
389 389 # Update dependents list
390 390 for c in children.get(n, []):
391 391 if c not in pendings:
392 392 pendings[c] = [p for p in parents[c] if p not in self.map]
393 393 try:
394 394 pendings[c].remove(n)
395 395 except ValueError:
396 396 raise error.Abort(_('cycle detected between %s and %s')
397 397 % (recode(c), recode(n)))
398 398 if not pendings[c]:
399 399 # Parents are converted, node is eligible
400 400 actives.insert(0, c)
401 401 pendings[c] = None
402 402
403 403 if len(s) != len(parents):
404 404 raise error.Abort(_("not all revisions were sorted"))
405 405
406 406 return s
407 407
408 408 def writeauthormap(self):
409 409 authorfile = self.authorfile
410 410 if authorfile:
411 411 self.ui.status(_('writing author map file %s\n') % authorfile)
412 412 ofile = open(authorfile, 'wb+')
413 413 for author in self.authors:
414 414 ofile.write(util.tonativeeol("%s=%s\n"
415 415 % (author, self.authors[author])))
416 416 ofile.close()
417 417
418 418 def readauthormap(self, authorfile):
419 419 afile = open(authorfile, 'rb')
420 420 for line in afile:
421 421
422 422 line = line.strip()
423 423 if not line or line.startswith('#'):
424 424 continue
425 425
426 426 try:
427 427 srcauthor, dstauthor = line.split('=', 1)
428 428 except ValueError:
429 429 msg = _('ignoring bad line in author map file %s: %s\n')
430 430 self.ui.warn(msg % (authorfile, line.rstrip()))
431 431 continue
432 432
433 433 srcauthor = srcauthor.strip()
434 434 dstauthor = dstauthor.strip()
435 435 if self.authors.get(srcauthor) in (None, dstauthor):
436 436 msg = _('mapping author %s to %s\n')
437 437 self.ui.debug(msg % (srcauthor, dstauthor))
438 438 self.authors[srcauthor] = dstauthor
439 439 continue
440 440
441 441 m = _('overriding mapping for author %s, was %s, will be %s\n')
442 442 self.ui.status(m % (srcauthor, self.authors[srcauthor], dstauthor))
443 443
444 444 afile.close()
445 445
446 446 def cachecommit(self, rev):
447 447 commit = self.source.getcommit(rev)
448 448 commit.author = self.authors.get(commit.author, commit.author)
449 449 commit.branch = mapbranch(commit.branch, self.branchmap)
450 450 self.commitcache[rev] = commit
451 451 return commit
452 452
453 453 def copy(self, rev):
454 454 commit = self.commitcache[rev]
455 455 full = self.opts.get('full')
456 456 changes = self.source.getchanges(rev, full)
457 457 if isinstance(changes, bytes):
458 458 if changes == SKIPREV:
459 459 dest = SKIPREV
460 460 else:
461 461 dest = self.map[changes]
462 462 self.map[rev] = dest
463 463 return
464 464 files, copies, cleanp2 = changes
465 465 pbranches = []
466 466 if commit.parents:
467 467 for prev in commit.parents:
468 468 if prev not in self.commitcache:
469 469 self.cachecommit(prev)
470 470 pbranches.append((self.map[prev],
471 471 self.commitcache[prev].branch))
472 472 self.dest.setbranch(commit.branch, pbranches)
473 473 try:
474 474 parents = self.splicemap[rev]
475 475 self.ui.status(_('spliced in %s as parents of %s\n') %
476 476 (_(' and ').join(parents), rev))
477 477 parents = [self.map.get(p, p) for p in parents]
478 478 except KeyError:
479 479 parents = [b[0] for b in pbranches]
480 480 parents.extend(self.map[x]
481 481 for x in commit.optparents
482 482 if x in self.map)
483 483 if len(pbranches) != 2:
484 484 cleanp2 = set()
485 485 if len(parents) < 3:
486 486 source = progresssource(self.ui, self.source, len(files))
487 487 else:
488 488 # For an octopus merge, we end up traversing the list of
489 489 # changed files N-1 times. This tweak to the number of
490 490 # files makes it so the progress bar doesn't overflow
491 491 # itself.
492 492 source = progresssource(self.ui, self.source,
493 493 len(files) * (len(parents) - 1))
494 494 newnode = self.dest.putcommit(files, copies, parents, commit,
495 495 source, self.map, full, cleanp2)
496 496 source.close()
497 497 self.source.converted(rev, newnode)
498 498 self.map[rev] = newnode
499 499
500 500 def convert(self, sortmode):
501 501 try:
502 502 self.source.before()
503 503 self.dest.before()
504 504 self.source.setrevmap(self.map)
505 505 self.ui.status(_("scanning source...\n"))
506 506 heads = self.source.getheads()
507 507 parents = self.walktree(heads)
508 508 self.mergesplicemap(parents, self.splicemap)
509 509 self.ui.status(_("sorting...\n"))
510 510 t = self.toposort(parents, sortmode)
511 511 num = len(t)
512 512 c = None
513 513
514 514 self.ui.status(_("converting...\n"))
515 515 for i, c in enumerate(t):
516 516 num -= 1
517 517 desc = self.commitcache[c].desc
518 518 if "\n" in desc:
519 519 desc = desc.splitlines()[0]
520 520 # convert log message to local encoding without using
521 521 # tolocal() because the encoding.encoding convert()
522 522 # uses is 'utf-8'
523 523 self.ui.status("%d %s\n" % (num, recode(desc)))
524 524 self.ui.note(_("source: %s\n") % recode(c))
525 525 self.ui.progress(_('converting'), i, unit=_('revisions'),
526 526 total=len(t))
527 527 self.copy(c)
528 528 self.ui.progress(_('converting'), None)
529 529
530 530 if not self.ui.configbool('convert', 'skiptags'):
531 531 tags = self.source.gettags()
532 532 ctags = {}
533 533 for k in tags:
534 534 v = tags[k]
535 535 if self.map.get(v, SKIPREV) != SKIPREV:
536 536 ctags[k] = self.map[v]
537 537
538 538 if c and ctags:
539 539 nrev, tagsparent = self.dest.puttags(ctags)
540 540 if nrev and tagsparent:
541 541 # write another hash correspondence to override the
542 542 # previous one so we don't end up with extra tag heads
543 543 tagsparents = [e for e in self.map.iteritems()
544 544 if e[1] == tagsparent]
545 545 if tagsparents:
546 546 self.map[tagsparents[0][0]] = nrev
547 547
548 548 bookmarks = self.source.getbookmarks()
549 549 cbookmarks = {}
550 550 for k in bookmarks:
551 551 v = bookmarks[k]
552 552 if self.map.get(v, SKIPREV) != SKIPREV:
553 553 cbookmarks[k] = self.map[v]
554 554
555 555 if c and cbookmarks:
556 556 self.dest.putbookmarks(cbookmarks)
557 557
558 558 self.writeauthormap()
559 559 finally:
560 560 self.cleanup()
561 561
562 562 def cleanup(self):
563 563 try:
564 564 self.dest.after()
565 565 finally:
566 566 self.source.after()
567 567 self.map.close()
568 568
569 569 def convert(ui, src, dest=None, revmapfile=None, **opts):
570 opts = pycompat.byteskwargs(opts)
570 571 global orig_encoding
571 572 orig_encoding = encoding.encoding
572 573 encoding.encoding = 'UTF-8'
573 574
574 575 # support --authors as an alias for --authormap
575 576 if not opts.get('authormap'):
576 577 opts['authormap'] = opts.get('authors')
577 578
578 579 if not dest:
579 580 dest = hg.defaultdest(src) + "-hg"
580 581 ui.status(_("assuming destination %s\n") % dest)
581 582
582 583 destc = convertsink(ui, dest, opts.get('dest_type'))
583 584 destc = scmutil.wrapconvertsink(destc)
584 585
585 586 try:
586 587 srcc, defaultsort = convertsource(ui, src, opts.get('source_type'),
587 588 opts.get('rev'))
588 589 except Exception:
589 590 for path in destc.created:
590 591 shutil.rmtree(path, True)
591 592 raise
592 593
593 594 sortmodes = ('branchsort', 'datesort', 'sourcesort', 'closesort')
594 595 sortmode = [m for m in sortmodes if opts.get(m)]
595 596 if len(sortmode) > 1:
596 597 raise error.Abort(_('more than one sort mode specified'))
597 598 if sortmode:
598 599 sortmode = sortmode[0]
599 600 else:
600 601 sortmode = defaultsort
601 602
602 603 if sortmode == 'sourcesort' and not srcc.hasnativeorder():
603 604 raise error.Abort(_('--sourcesort is not supported by this data source')
604 605 )
605 606 if sortmode == 'closesort' and not srcc.hasnativeclose():
606 607 raise error.Abort(_('--closesort is not supported by this data source'))
607 608
608 609 fmap = opts.get('filemap')
609 610 if fmap:
610 611 srcc = filemap.filemap_source(ui, srcc, fmap)
611 612 destc.setfilemapmode(True)
612 613
613 614 if not revmapfile:
614 615 revmapfile = destc.revmapfile()
615 616
616 617 c = converter(ui, srcc, destc, revmapfile, opts)
617 618 c.convert(sortmode)
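The convert() entry point above is where pycompat.byteskwargs earns its keep:
opts arrives from the command parser with str keys on Python 3 and is
normalized to bytes keys before lookups such as opts.get('authormap'). A
typical invocation exercising the sort-mode and sink-selection logic
(editorial example):

    hg convert --source-type cvs --datesort /path/to/cvs/module converted-hg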
@@ -1,951 +1,952 b''
1 1 # Mercurial built-in replacement for cvsps.
2 2 #
3 3 # Copyright 2008, Frank Kingswood <frank@kingswood-consulting.co.uk>
4 4 #
5 5 # This software may be used and distributed according to the terms of the
6 6 # GNU General Public License version 2 or any later version.
7 7 from __future__ import absolute_import
8 8
9 9 import os
10 10 import re
11 11
12 12 from mercurial.i18n import _
13 13 from mercurial import (
14 14 encoding,
15 15 error,
16 16 hook,
17 17 pycompat,
18 18 util,
19 19 )
20 20
21 21 pickle = util.pickle
22 22
23 23 class logentry(object):
24 24 '''Class logentry has the following attributes:
25 25 .author - author name as CVS knows it
26 26 .branch - name of branch this revision is on
27 27 .branches - revision tuple of branches starting at this revision
28 28 .comment - commit message
29 29 .commitid - CVS commitid or None
30 30 .date - the commit date as a (time, tz) tuple
31 31 .dead - true if file revision is dead
32 32 .file - Name of file
33 33 .lines - a tuple (+lines, -lines) or None
34 34 .parent - Previous revision of this entry
35 35 .rcs - name of file as returned from CVS
36 36 .revision - revision number as tuple
37 37 .tags - list of tags on the file
38 38 .synthetic - is this a synthetic "file ... added on ..." revision?
39 39 .mergepoint - the branch that has been merged from (if present in
40 40 rlog output) or None
41 41 .branchpoints - the branches that start at the current entry or empty
42 42 '''
43 43 def __init__(self, **entries):
44 44 self.synthetic = False
45 45 self.__dict__.update(entries)
46 46
47 47 def __repr__(self):
48 48 items = ("%s=%r"%(k, self.__dict__[k]) for k in sorted(self.__dict__))
49 49 return "%s(%s)"%(type(self).__name__, ", ".join(items))
50 50
51 51 class logerror(Exception):
52 52 pass
53 53
54 54 def getrepopath(cvspath):
55 55 """Return the repository path from a CVS path.
56 56
57 57 >>> getrepopath(b'/foo/bar')
58 58 '/foo/bar'
59 59 >>> getrepopath(b'c:/foo/bar')
60 60 '/foo/bar'
61 61 >>> getrepopath(b':pserver:10/foo/bar')
62 62 '/foo/bar'
63 63 >>> getrepopath(b':pserver:10c:/foo/bar')
64 64 '/foo/bar'
65 65 >>> getrepopath(b':pserver:/foo/bar')
66 66 '/foo/bar'
67 67 >>> getrepopath(b':pserver:c:/foo/bar')
68 68 '/foo/bar'
69 69 >>> getrepopath(b':pserver:truc@foo.bar:/foo/bar')
70 70 '/foo/bar'
71 71 >>> getrepopath(b':pserver:truc@foo.bar:c:/foo/bar')
72 72 '/foo/bar'
73 73 >>> getrepopath(b'user@server/path/to/repository')
74 74 '/path/to/repository'
75 75 """
76 76 # According to CVS manual, CVS paths are expressed like:
77 77 # [:method:][[user][:password]@]hostname[:[port]]/path/to/repository
78 78 #
79 79 # The CVS path is split into parts, and the position of the first
80 80 # occurrence of the '/' char after the '@' is located. The result is the
81 81 # rest of the string from that '/' sign on, including it.
82 82
83 83 parts = cvspath.split(':')
84 84 atposition = parts[-1].find('@')
85 85 start = 0
86 86
87 87 if atposition != -1:
88 88 start = atposition
89 89
90 90 repopath = parts[-1][parts[-1].find('/', start):]
91 91 return repopath
92 92
93 93 def createlog(ui, directory=None, root="", rlog=True, cache=None):
94 94 '''Collect the CVS rlog'''
95 95
96 96 # Because we store many duplicate commit log messages, reusing strings
97 97 # saves a lot of memory and pickle storage space.
98 98 _scache = {}
99 99 def scache(s):
100 100 "return a shared version of a string"
101 101 return _scache.setdefault(s, s)
102 102
103 103 ui.status(_('collecting CVS rlog\n'))
104 104
105 105 log = [] # list of logentry objects containing the CVS state
106 106
107 107 # patterns to match in CVS (r)log output, by state of use
108 108 re_00 = re.compile('RCS file: (.+)$')
109 109 re_01 = re.compile('cvs \\[r?log aborted\\]: (.+)$')
110 110 re_02 = re.compile('cvs (r?log|server): (.+)\n$')
111 111 re_03 = re.compile("(Cannot access.+CVSROOT)|"
112 112 "(can't create temporary directory.+)$")
113 113 re_10 = re.compile('Working file: (.+)$')
114 114 re_20 = re.compile('symbolic names:')
115 115 re_30 = re.compile('\t(.+): ([\\d.]+)$')
116 116 re_31 = re.compile('----------------------------$')
117 117 re_32 = re.compile('======================================='
118 118 '======================================$')
119 119 re_50 = re.compile('revision ([\\d.]+)(\s+locked by:\s+.+;)?$')
120 120 re_60 = re.compile(r'date:\s+(.+);\s+author:\s+(.+);\s+state:\s+(.+?);'
121 121 r'(\s+lines:\s+(\+\d+)?\s+(-\d+)?;)?'
122 122 r'(\s+commitid:\s+([^;]+);)?'
123 123 r'(.*mergepoint:\s+([^;]+);)?')
124 124 re_70 = re.compile('branches: (.+);$')
125 125
126 126 file_added_re = re.compile(r'file [^/]+ was (initially )?added on branch')
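# Editorial, abridged samples of the rlog output these patterns target:
#   RCS file: /cvsroot/proj/src/foo.c,v                          (re_00)
#   revision 1.2                                                 (re_50)
#   date: 2008/03/10 12:00:00;  author: frank;  state: Exp;  lines: +1 -0;
#                                                                (re_60)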
127 127
128 128 prefix = '' # leading path to strip off what we get from CVS
129 129
130 130 if directory is None:
131 131 # Current working directory
132 132
133 133 # Get the real directory in the repository
134 134 try:
135 135 prefix = open(os.path.join('CVS','Repository'), 'rb').read().strip()
136 136 directory = prefix
137 137 if prefix == ".":
138 138 prefix = ""
139 139 except IOError:
140 140 raise logerror(_('not a CVS sandbox'))
141 141
142 142 if prefix and not prefix.endswith(pycompat.ossep):
143 143 prefix += pycompat.ossep
144 144
145 145 # Use the Root file in the sandbox, if it exists
146 146 try:
147 147 root = open(os.path.join('CVS','Root'), 'rb').read().strip()
148 148 except IOError:
149 149 pass
150 150
151 151 if not root:
152 152 root = encoding.environ.get('CVSROOT', '')
153 153
154 154 # read log cache if one exists
155 155 oldlog = []
156 156 date = None
157 157
158 158 if cache:
159 159 cachedir = os.path.expanduser('~/.hg.cvsps')
160 160 if not os.path.exists(cachedir):
161 161 os.mkdir(cachedir)
162 162
163 163 # The cvsps cache pickle needs a uniquified name, based on the
164 164 # repository location. The address may have all sorts of nasties
165 165 # in it, slashes, colons and such. So here we take just the
166 166 # alphanumeric characters, concatenated in a way that does not
167 167 # mix up the various components, so that
168 168 # :pserver:user@server:/path
169 169 # and
170 170 # /pserver/user/server/path
171 171 # are mapped to different cache file names.
172 172 cachefile = root.split(":") + [directory, "cache"]
173 173 cachefile = ['-'.join(re.findall(r'\w+', s)) for s in cachefile if s]
174 174 cachefile = os.path.join(cachedir,
175 175 '.'.join([s for s in cachefile if s]))
176 176
177 177 if cache == 'update':
178 178 try:
179 179 ui.note(_('reading cvs log cache %s\n') % cachefile)
180 180 oldlog = pickle.load(open(cachefile, 'rb'))
181 181 for e in oldlog:
182 182 if not (util.safehasattr(e, 'branchpoints') and
183 183 util.safehasattr(e, 'commitid') and
184 184 util.safehasattr(e, 'mergepoint')):
185 185 ui.status(_('ignoring old cache\n'))
186 186 oldlog = []
187 187 break
188 188
189 189 ui.note(_('cache has %d log entries\n') % len(oldlog))
190 190 except Exception as e:
191 191 ui.note(_('error reading cache: %r\n') % e)
192 192
193 193 if oldlog:
194 194 date = oldlog[-1].date # last commit date as a (time,tz) tuple
195 195 date = util.datestr(date, '%Y/%m/%d %H:%M:%S %1%2')
196 196
197 197 # build the CVS commandline
198 198 cmd = ['cvs', '-q']
199 199 if root:
200 200 cmd.append('-d%s' % root)
201 201 p = util.normpath(getrepopath(root))
202 202 if not p.endswith('/'):
203 203 p += '/'
204 204 if prefix:
205 205 # looks like normpath replaces "" by "."
206 206 prefix = p + util.normpath(prefix)
207 207 else:
208 208 prefix = p
209 209 cmd.append(['log', 'rlog'][rlog])
210 210 if date:
211 211 # no space between option and date string
212 212 cmd.append('-d>%s' % date)
213 213 cmd.append(directory)
214 214
215 215 # state machine begins here
216 216 tags = {} # dictionary of revisions on current file with their tags
217 217 branchmap = {} # mapping between branch names and revision numbers
218 218 rcsmap = {}
219 219 state = 0
220 220 store = False # set when a new record can be appended
221 221
222 222 cmd = [util.shellquote(arg) for arg in cmd]
223 223 ui.note(_("running %s\n") % (' '.join(cmd)))
224 224 ui.debug("prefix=%r directory=%r root=%r\n" % (prefix, directory, root))
225 225
226 226 pfp = util.popen(' '.join(cmd))
227 227 peek = pfp.readline()
228 228 while True:
229 229 line = peek
230 230 if line == '':
231 231 break
232 232 peek = pfp.readline()
233 233 if line.endswith('\n'):
234 234 line = line[:-1]
235 235 #ui.debug('state=%d line=%r\n' % (state, line))
236 236
237 237 if state == 0:
238 238 # initial state, consume input until we see 'RCS file'
239 239 match = re_00.match(line)
240 240 if match:
241 241 rcs = match.group(1)
242 242 tags = {}
243 243 if rlog:
244 244 filename = util.normpath(rcs[:-2])
245 245 if filename.startswith(prefix):
246 246 filename = filename[len(prefix):]
247 247 if filename.startswith('/'):
248 248 filename = filename[1:]
249 249 if filename.startswith('Attic/'):
250 250 filename = filename[6:]
251 251 else:
252 252 filename = filename.replace('/Attic/', '/')
253 253 state = 2
254 254 continue
255 255 state = 1
256 256 continue
257 257 match = re_01.match(line)
258 258 if match:
259 259 raise logerror(match.group(1))
260 260 match = re_02.match(line)
261 261 if match:
262 262 raise logerror(match.group(2))
263 263 if re_03.match(line):
264 264 raise logerror(line)
265 265
266 266 elif state == 1:
267 267 # expect 'Working file' (only when using log instead of rlog)
268 268 match = re_10.match(line)
269 269 assert match, _('RCS file must be followed by working file')
270 270 filename = util.normpath(match.group(1))
271 271 state = 2
272 272
273 273 elif state == 2:
274 274 # expect 'symbolic names'
275 275 if re_20.match(line):
276 276 branchmap = {}
277 277 state = 3
278 278
279 279 elif state == 3:
280 280 # read the symbolic names and store as tags
281 281 match = re_30.match(line)
282 282 if match:
283 283 rev = [int(x) for x in match.group(2).split('.')]
284 284
285 285 # Convert magic branch number to an odd-numbered one
286 286 revn = len(rev)
287 287 if revn > 3 and (revn % 2) == 0 and rev[-2] == 0:
288 288 rev = rev[:-2] + rev[-1:]
289 289 rev = tuple(rev)
290 290
291 291 if rev not in tags:
292 292 tags[rev] = []
293 293 tags[rev].append(match.group(1))
294 294 branchmap[match.group(1)] = match.group(2)
295 295
296 296 elif re_31.match(line):
297 297 state = 5
298 298 elif re_32.match(line):
299 299 state = 0
300 300
301 301 elif state == 4:
302 302 # expecting '------' separator before first revision
303 303 if re_31.match(line):
304 304 state = 5
305 305 else:
306 306 assert not re_32.match(line), _('must have at least '
307 307 'some revisions')
308 308
309 309 elif state == 5:
310 310 # expecting revision number and possibly (ignored) lock indication
311 311 # we create the logentry here from values stored in states 0 to 4,
312 312 # as this state is re-entered for subsequent revisions of a file.
313 313 match = re_50.match(line)
314 314 assert match, _('expected revision number')
315 315 e = logentry(rcs=scache(rcs),
316 316 file=scache(filename),
317 317 revision=tuple([int(x) for x in
318 318 match.group(1).split('.')]),
319 319 branches=[],
320 320 parent=None,
321 321 commitid=None,
322 322 mergepoint=None,
323 323 branchpoints=set())
324 324
325 325 state = 6
326 326
327 327 elif state == 6:
328 328 # expecting date, author, state, lines changed
329 329 match = re_60.match(line)
330 330 assert match, _('revision must be followed by date line')
331 331 d = match.group(1)
332 332 if d[2] == '/':
333 333 # Y2K
334 334 d = '19' + d
335 335
336 336 if len(d.split()) != 3:
337 337 # cvs log dates always in GMT
338 338 d = d + ' UTC'
339 339 e.date = util.parsedate(d, ['%y/%m/%d %H:%M:%S',
340 340 '%Y/%m/%d %H:%M:%S',
341 341 '%Y-%m-%d %H:%M:%S'])
342 342 e.author = scache(match.group(2))
343 343 e.dead = match.group(3).lower() == 'dead'
344 344
345 345 if match.group(5):
346 346 if match.group(6):
347 347 e.lines = (int(match.group(5)), int(match.group(6)))
348 348 else:
349 349 e.lines = (int(match.group(5)), 0)
350 350 elif match.group(6):
351 351 e.lines = (0, int(match.group(6)))
352 352 else:
353 353 e.lines = None
354 354
355 355 if match.group(7): # cvs 1.12 commitid
356 356 e.commitid = match.group(8)
357 357
358 358 if match.group(9): # cvsnt mergepoint
359 359 myrev = match.group(10).split('.')
360 360 if len(myrev) == 2: # head
361 361 e.mergepoint = 'HEAD'
362 362 else:
363 363 myrev = '.'.join(myrev[:-2] + ['0', myrev[-2]])
364 364 branches = [b for b in branchmap if branchmap[b] == myrev]
365 365 assert len(branches) == 1, ('unknown branch: %s'
366 366 % e.mergepoint)
367 367 e.mergepoint = branches[0]
368 368
369 369 e.comment = []
370 370 state = 7
371 371
372 372 elif state == 7:
373 373 # read the revision numbers of branches that start at this revision
374 374 # or store the commit log message otherwise
375 375 m = re_70.match(line)
376 376 if m:
377 377 e.branches = [tuple([int(y) for y in x.strip().split('.')])
378 378 for x in m.group(1).split(';')]
379 379 state = 8
380 380 elif re_31.match(line) and re_50.match(peek):
381 381 state = 5
382 382 store = True
383 383 elif re_32.match(line):
384 384 state = 0
385 385 store = True
386 386 else:
387 387 e.comment.append(line)
388 388
389 389 elif state == 8:
390 390 # store commit log message
391 391 if re_31.match(line):
392 392 cpeek = peek
393 393 if cpeek.endswith('\n'):
394 394 cpeek = cpeek[:-1]
395 395 if re_50.match(cpeek):
396 396 state = 5
397 397 store = True
398 398 else:
399 399 e.comment.append(line)
400 400 elif re_32.match(line):
401 401 state = 0
402 402 store = True
403 403 else:
404 404 e.comment.append(line)
405 405
406 406 # When a file is added on a branch B1, CVS creates a synthetic
407 407 # dead trunk revision 1.1 so that the branch has a root.
408 408 # Likewise, if you merge such a file to a later branch B2 (one
409 409 # that already existed when the file was added on B1), CVS
410 410 # creates a synthetic dead revision 1.1.x.1 on B2. Don't drop
411 411 # these revisions now, but mark them synthetic so
412 412 # createchangeset() can take care of them.
413 413 if (store and
414 414 e.dead and
415 415 e.revision[-1] == 1 and # 1.1 or 1.1.x.1
416 416 len(e.comment) == 1 and
417 417 file_added_re.match(e.comment[0])):
418 418 ui.debug('found synthetic revision in %s: %r\n'
419 419 % (e.rcs, e.comment[0]))
420 420 e.synthetic = True
421 421
422 422 if store:
423 423 # clean up the results and save in the log.
424 424 store = False
425 425 e.tags = sorted([scache(x) for x in tags.get(e.revision, [])])
426 426 e.comment = scache('\n'.join(e.comment))
427 427
428 428 revn = len(e.revision)
429 429 if revn > 3 and (revn % 2) == 0:
430 430 e.branch = tags.get(e.revision[:-1], [None])[0]
431 431 else:
432 432 e.branch = None
433 433
434 434 # find the branches starting from this revision
435 435 branchpoints = set()
436 436 for branch, revision in branchmap.iteritems():
437 437 revparts = tuple([int(i) for i in revision.split('.')])
438 438 if len(revparts) < 2: # bad tags
439 439 continue
440 440 if revparts[-2] == 0 and revparts[-1] % 2 == 0:
441 441 # normal branch
442 442 if revparts[:-2] == e.revision:
443 443 branchpoints.add(branch)
444 444 elif revparts == (1, 1, 1): # vendor branch
445 445 if revparts in e.branches:
446 446 branchpoints.add(branch)
447 447 e.branchpoints = branchpoints
448 448
449 449 log.append(e)
450 450
451 451 rcsmap[e.rcs.replace('/Attic/', '/')] = e.rcs
452 452
453 453 if len(log) % 100 == 0:
454 454 ui.status(util.ellipsis('%d %s' % (len(log), e.file), 80)+'\n')
455 455
456 456 log.sort(key=lambda x: (x.rcs, x.revision))
457 457
458 458 # find parent revisions of individual files
459 459 versions = {}
460 460 for e in sorted(oldlog, key=lambda x: (x.rcs, x.revision)):
461 461 rcs = e.rcs.replace('/Attic/', '/')
462 462 if rcs in rcsmap:
463 463 e.rcs = rcsmap[rcs]
464 464 branch = e.revision[:-1]
465 465 versions[(e.rcs, branch)] = e.revision
466 466
467 467 for e in log:
468 468 branch = e.revision[:-1]
469 469 p = versions.get((e.rcs, branch), None)
470 470 if p is None:
471 471 p = e.revision[:-2]
472 472 e.parent = p
473 473 versions[(e.rcs, branch)] = e.revision
474 474
475 475 # update the log cache
476 476 if cache:
477 477 if log:
478 478 # join up the old and new logs
479 479 log.sort(key=lambda x: x.date)
480 480
481 481 if oldlog and oldlog[-1].date >= log[0].date:
482 482 raise logerror(_('log cache overlaps with new log entries,'
483 483 ' re-run without cache.'))
484 484
485 485 log = oldlog + log
486 486
487 487 # write the new cachefile
488 488 ui.note(_('writing cvs log cache %s\n') % cachefile)
489 489 pickle.dump(log, open(cachefile, 'wb'))
490 490 else:
491 491 log = oldlog
492 492
493 493 ui.status(_('%d log entries\n') % len(log))
494 494
495 495 encodings = ui.configlist('convert', 'cvsps.logencoding')
496 496 if encodings:
497 497 def revstr(r):
498 498 # this is needed, because logentry.revision is a tuple of "int"
499 499 # (e.g. (1, 2) for "1.2")
500 500 return '.'.join(pycompat.maplist(pycompat.bytestr, r))
501 501
502 502 for entry in log:
503 503 comment = entry.comment
504 504 for e in encodings:
505 505 try:
506 506 entry.comment = comment.decode(e).encode('utf-8')
507 507 if ui.debugflag:
508 508 ui.debug("transcoding by %s: %s of %s\n" %
509 509 (e, revstr(entry.revision), entry.file))
510 510 break
511 511 except UnicodeDecodeError:
512 512 pass # try next encoding
513 513 except LookupError as inst: # unknown encoding, maybe
514 514 raise error.Abort(inst,
515 515 hint=_('check convert.cvsps.logencoding'
516 516 ' configuration'))
517 517 else:
518 518 raise error.Abort(_("no encoding can transcode"
519 519 " CVS log message for %s of %s")
520 520 % (revstr(entry.revision), entry.file),
521 521 hint=_('check convert.cvsps.logencoding'
522 522 ' configuration'))
523 523
524 524 hook.hook(ui, None, "cvslog", True, log=log)
525 525
526 526 return log
527 527
528 528
529 529 class changeset(object):
530 530 '''Class changeset has the following attributes:
531 531 .id - integer identifying this changeset (list index)
532 532 .author - author name as CVS knows it
533 533 .branch - name of branch this changeset is on, or None
534 534 .comment - commit message
535 535 .commitid - CVS commitid or None
536 536 .date - the commit date as a (time,tz) tuple
537 537 .entries - list of logentry objects in this changeset
538 538 .parents - list of one or two parent changesets
539 539 .tags - list of tags on this changeset
540 540 .synthetic - from synthetic revision "file ... added on branch ..."
541 541 .mergepoint - the branch that has been merged from or None
542 542 .branchpoints - the branches that start at the current entry or empty
543 543 '''
544 544 def __init__(self, **entries):
545 545 self.id = None
546 546 self.synthetic = False
547 547 self.__dict__.update(entries)
548 548
549 549 def __repr__(self):
550 550 items = ("%s=%r"%(k, self.__dict__[k]) for k in sorted(self.__dict__))
551 551 return "%s(%s)"%(type(self).__name__, ", ".join(items))
552 552
553 553 def createchangeset(ui, log, fuzz=60, mergefrom=None, mergeto=None):
554 554 '''Convert log into changesets.'''
555 555
556 556 ui.status(_('creating changesets\n'))
557 557
558 558 # try to order commitids by date
559 559 mindate = {}
560 560 for e in log:
561 561 if e.commitid:
562 562            mindate[e.commitid] = min(e.date, mindate.get(e.commitid, e.date))
563 563
564 564 # Merge changesets
565 565 log.sort(key=lambda x: (mindate.get(x.commitid), x.commitid, x.comment,
566 566 x.author, x.branch, x.date, x.branchpoints))
567 567
568 568 changesets = []
569 569 files = set()
570 570 c = None
571 571 for i, e in enumerate(log):
572 572
573 573 # Check if log entry belongs to the current changeset or not.
574 574
575 575 # Since CVS is file-centric, two different file revisions with
576 576 # different branchpoints should be treated as belonging to two
577 577 # different changesets (and the ordering is important and not
578 578 # honoured by cvsps at this point).
579 579 #
580 580 # Consider the following case:
581 581 # foo 1.1 branchpoints: [MYBRANCH]
582 582 # bar 1.1 branchpoints: [MYBRANCH, MYBRANCH2]
583 583 #
584 584 # Here foo is part only of MYBRANCH, but not MYBRANCH2, e.g. a
585 585 # later version of foo may be in MYBRANCH2, so foo should be the
586 586 # first changeset and bar the next and MYBRANCH and MYBRANCH2
587 587 # should both start off of the bar changeset. No provisions are
588 588 # made to ensure that this is, in fact, what happens.
589 589 if not (c and e.branchpoints == c.branchpoints and
590 590 (# cvs commitids
591 591 (e.commitid is not None and e.commitid == c.commitid) or
592 592 (# no commitids, use fuzzy commit detection
593 593 (e.commitid is None or c.commitid is None) and
594 594 e.comment == c.comment and
595 595 e.author == c.author and
596 596 e.branch == c.branch and
597 597 ((c.date[0] + c.date[1]) <=
598 598 (e.date[0] + e.date[1]) <=
599 599 (c.date[0] + c.date[1]) + fuzz) and
600 600 e.file not in files))):
601 601 c = changeset(comment=e.comment, author=e.author,
602 602 branch=e.branch, date=e.date,
603 603 entries=[], mergepoint=e.mergepoint,
604 604 branchpoints=e.branchpoints, commitid=e.commitid)
605 605 changesets.append(c)
606 606
607 607 files = set()
608 608 if len(changesets) % 100 == 0:
609 609 t = '%d %s' % (len(changesets), repr(e.comment)[1:-1])
610 610 ui.status(util.ellipsis(t, 80) + '\n')
611 611
612 612 c.entries.append(e)
613 613 files.add(e.file)
614 614 c.date = e.date # changeset date is date of latest commit in it
615 615
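The date clause of that grouping test is the easiest part to misread; restated on its own (infuzzwindow is an illustrative helper, not in the source):

    def infuzzwindow(c, e, fuzz=60):
        # e may join changeset c only if it was committed no earlier
        # than c and at most `fuzz` seconds after it; dates are
        # (timestamp, tzoffset) pairs, hence the sums
        base = c.date[0] + c.date[1]
        return base <= e.date[0] + e.date[1] <= base + fuzz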
616 616 # Mark synthetic changesets
617 617
618 618 for c in changesets:
619 619 # Synthetic revisions always get their own changeset, because
620 620 # the log message includes the filename. E.g. if you add file3
621 621 # and file4 on a branch, you get four log entries and three
622 622 # changesets:
623 623 # "File file3 was added on branch ..." (synthetic, 1 entry)
624 624 # "File file4 was added on branch ..." (synthetic, 1 entry)
625 625 # "Add file3 and file4 to fix ..." (real, 2 entries)
626 626 # Hence the check for 1 entry here.
627 627 c.synthetic = len(c.entries) == 1 and c.entries[0].synthetic
628 628
629 629 # Sort files in each changeset
630 630
631 631 def entitycompare(l, r):
632 632 'Mimic cvsps sorting order'
633 633 l = l.file.split('/')
634 634 r = r.file.split('/')
635 635 nl = len(l)
636 636 nr = len(r)
637 637 n = min(nl, nr)
638 638 for i in range(n):
639 639 if i + 1 == nl and nl < nr:
640 640 return -1
641 641 elif i + 1 == nr and nl > nr:
642 642 return +1
643 643 elif l[i] < r[i]:
644 644 return -1
645 645 elif l[i] > r[i]:
646 646 return +1
647 647 return 0
648 648
649 649 for c in changesets:
650 650 c.entries.sort(entitycompare)
651 651
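Note that c.entries.sort(entitycompare) uses the cmp-function form of list.sort, which only exists on Python 2; a Python 3 port would presumably spell the loop with functools.cmp_to_key (a porting sketch, not part of this change):

    import functools

    for c in changesets:
        c.entries.sort(key=functools.cmp_to_key(entitycompare))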
652 652 # Sort changesets by date
653 653
654 654 odd = set()
655 655 def cscmp(l, r):
656 656 d = sum(l.date) - sum(r.date)
657 657 if d:
658 658 return d
659 659
660 660 # detect vendor branches and initial commits on a branch
661 661 le = {}
662 662 for e in l.entries:
663 663 le[e.rcs] = e.revision
664 664 re = {}
665 665 for e in r.entries:
666 666 re[e.rcs] = e.revision
667 667
668 668 d = 0
669 669 for e in l.entries:
670 670 if re.get(e.rcs, None) == e.parent:
671 671 assert not d
672 672 d = 1
673 673 break
674 674
675 675 for e in r.entries:
676 676 if le.get(e.rcs, None) == e.parent:
677 677 if d:
678 678 odd.add((l, r))
679 679 d = -1
680 680 break
681 681 # By this point, the changesets are sufficiently compared that
682 682 # we don't really care about ordering. However, this leaves
683 683 # some race conditions in the tests, so we compare on the
684 684 # number of files modified, the files contained in each
685 685 # changeset, and the branchpoints in the change to ensure test
686 686 # output remains stable.
687 687
688 688 # recommended replacement for cmp from
689 689 # https://docs.python.org/3.0/whatsnew/3.0.html
690 690 c = lambda x, y: (x > y) - (x < y)
691 691 # Sort bigger changes first.
692 692 if not d:
693 693 d = c(len(l.entries), len(r.entries))
694 694 # Try sorting by filename in the change.
695 695 if not d:
696 696 d = c([e.file for e in l.entries], [e.file for e in r.entries])
697 697 # Try and put changes without a branch point before ones with
698 698 # a branch point.
699 699 if not d:
700 700 d = c(len(l.branchpoints), len(r.branchpoints))
701 701 return d
702 702
703 703 changesets.sort(cscmp)
704 704
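The lambda inside cscmp is the standard cmp() replacement: comparisons return bools, and subtracting them yields -1, 0 or +1. A quick standalone check:

    cmp3 = lambda x, y: (x > y) - (x < y)
    assert cmp3(1, 2) == -1
    assert cmp3(2, 2) == 0
    assert cmp3(3, 2) == +1

(changesets.sort(cscmp) has the same Python-2-only shape as the entry sort above.)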
705 705 # Collect tags
706 706
707 707 globaltags = {}
708 708 for c in changesets:
709 709 for e in c.entries:
710 710 for tag in e.tags:
711 711 # remember which is the latest changeset to have this tag
712 712 globaltags[tag] = c
713 713
714 714 for c in changesets:
715 715 tags = set()
716 716 for e in c.entries:
717 717 tags.update(e.tags)
718 718 # remember tags only if this is the latest changeset to have it
719 719 c.tags = sorted(tag for tag in tags if globaltags[tag] is c)
720 720
721 721 # Find parent changesets, handle {{mergetobranch BRANCHNAME}}
722 722 # by inserting dummy changesets with two parents, and handle
723 723 # {{mergefrombranch BRANCHNAME}} by setting two parents.
724 724
725 725 if mergeto is None:
726 726 mergeto = r'{{mergetobranch ([-\w]+)}}'
727 727 if mergeto:
728 728 mergeto = re.compile(mergeto)
729 729
730 730 if mergefrom is None:
731 731 mergefrom = r'{{mergefrombranch ([-\w]+)}}'
732 732 if mergefrom:
733 733 mergefrom = re.compile(mergefrom)
734 734
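For reference, the default markers matched here are literal {{mergetobranch BRANCHNAME}} / {{mergefrombranch BRANCHNAME}} strings embedded in commit messages. With the pattern compiled above and a made-up message:

    import re

    mergeto = re.compile(r'{{mergetobranch ([-\w]+)}}')
    m = mergeto.search('backport fix\n\n{{mergetobranch RELEASE_1_0}}')
    print(m.group(1))   # RELEASE_1_0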
735 735 versions = {} # changeset index where we saw any particular file version
736 736 branches = {} # changeset index where we saw a branch
737 737 n = len(changesets)
738 738 i = 0
739 739 while i < n:
740 740 c = changesets[i]
741 741
742 742 for f in c.entries:
743 743 versions[(f.rcs, f.revision)] = i
744 744
745 745 p = None
746 746 if c.branch in branches:
747 747 p = branches[c.branch]
748 748 else:
749 749 # first changeset on a new branch
750 750 # the parent is a changeset with the branch in its
751 751 # branchpoints such that it is the latest possible
752 752 # commit without any intervening, unrelated commits.
753 753
754 754 for candidate in xrange(i):
755 755 if c.branch not in changesets[candidate].branchpoints:
756 756 if p is not None:
757 757 break
758 758 continue
759 759 p = candidate
760 760
761 761 c.parents = []
762 762 if p is not None:
763 763 p = changesets[p]
764 764
765 765 # Ensure no changeset has a synthetic changeset as a parent.
766 766 while p.synthetic:
767 767 assert len(p.parents) <= 1, \
768 768 _('synthetic changeset cannot have multiple parents')
769 769 if p.parents:
770 770 p = p.parents[0]
771 771 else:
772 772 p = None
773 773 break
774 774
775 775 if p is not None:
776 776 c.parents.append(p)
777 777
778 778 if c.mergepoint:
779 779 if c.mergepoint == 'HEAD':
780 780 c.mergepoint = None
781 781 c.parents.append(changesets[branches[c.mergepoint]])
782 782
783 783 if mergefrom:
784 784 m = mergefrom.search(c.comment)
785 785 if m:
786 786 m = m.group(1)
787 787 if m == 'HEAD':
788 788 m = None
789 789 try:
790 790 candidate = changesets[branches[m]]
791 791 except KeyError:
792 792 ui.warn(_("warning: CVS commit message references "
793 793 "non-existent branch %r:\n%s\n")
794 794 % (m, c.comment))
795 795 if m in branches and c.branch != m and not candidate.synthetic:
796 796 c.parents.append(candidate)
797 797
798 798 if mergeto:
799 799 m = mergeto.search(c.comment)
800 800 if m:
801 801 if m.groups():
802 802 m = m.group(1)
803 803 if m == 'HEAD':
804 804 m = None
805 805 else:
806 806 m = None # if no group found then merge to HEAD
807 807 if m in branches and c.branch != m:
808 808 # insert empty changeset for merge
809 809 cc = changeset(
810 810 author=c.author, branch=m, date=c.date,
811 811 comment='convert-repo: CVS merge from branch %s'
812 812 % c.branch,
813 813 entries=[], tags=[],
814 814 parents=[changesets[branches[m]], c])
815 815 changesets.insert(i + 1, cc)
816 816 branches[m] = i + 1
817 817
818 818 # adjust our loop counters now we have inserted a new entry
819 819 n += 1
820 820 i += 2
821 821 continue
822 822
823 823 branches[c.branch] = i
824 824 i += 1
825 825
826 826 # Drop synthetic changesets (safe now that we have ensured no other
827 827 # changesets can have them as parents).
828 828 i = 0
829 829 while i < len(changesets):
830 830 if changesets[i].synthetic:
831 831 del changesets[i]
832 832 else:
833 833 i += 1
834 834
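The delete-in-place loop is quadratic in the worst case, since each del shifts the tail; an equivalent linear rewrite would be the one-liner below (a sketch, not what this revision does):

    changesets[:] = [c for c in changesets if not c.synthetic]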
835 835 # Number changesets
836 836
837 837 for i, c in enumerate(changesets):
838 838 c.id = i + 1
839 839
840 840 if odd:
841 841 for l, r in odd:
842 842 if l.id is not None and r.id is not None:
843 843 ui.warn(_('changeset %d is both before and after %d\n')
844 844 % (l.id, r.id))
845 845
846 846 ui.status(_('%d changeset entries\n') % len(changesets))
847 847
848 848 hook.hook(ui, None, "cvschangesets", True, changesets=changesets)
849 849
850 850 return changesets
851 851
852 852
853 853 def debugcvsps(ui, *args, **opts):
854 854 '''Read CVS rlog for current directory or named path in
855 855 repository, and convert the log to changesets based on matching
856 856 commit log entries and dates.
857 857 '''
858 opts = pycompat.byteskwargs(opts)
858 859 if opts["new_cache"]:
859 860 cache = "write"
860 861 elif opts["update_cache"]:
861 862 cache = "update"
862 863 else:
863 864 cache = None
864 865
865 866 revisions = opts["revisions"]
866 867
867 868 try:
868 869 if args:
869 870 log = []
870 871 for d in args:
871 872 log += createlog(ui, d, root=opts["root"], cache=cache)
872 873 else:
873 874 log = createlog(ui, root=opts["root"], cache=cache)
874 875 except logerror as e:
875 876 ui.write("%r\n"%e)
876 877 return
877 878
878 879 changesets = createchangeset(ui, log, opts["fuzz"])
879 880 del log
880 881
881 882 # Print changesets (optionally filtered)
882 883
883 884 off = len(revisions)
884 885 branches = {} # latest version number in each branch
885 886 ancestors = {} # parent branch
886 887 for cs in changesets:
887 888
888 889 if opts["ancestors"]:
889 890 if cs.branch not in branches and cs.parents and cs.parents[0].id:
890 891 ancestors[cs.branch] = (changesets[cs.parents[0].id - 1].branch,
891 892 cs.parents[0].id)
892 893 branches[cs.branch] = cs.id
893 894
894 895 # limit by branches
895 896 if opts["branches"] and (cs.branch or 'HEAD') not in opts["branches"]:
896 897 continue
897 898
898 899 if not off:
899 900 # Note: trailing spaces on several lines here are needed to have
900 901 # bug-for-bug compatibility with cvsps.
901 902 ui.write('---------------------\n')
902 903 ui.write(('PatchSet %d \n' % cs.id))
903 904 ui.write(('Date: %s\n' % util.datestr(cs.date,
904 905 '%Y/%m/%d %H:%M:%S %1%2')))
905 906 ui.write(('Author: %s\n' % cs.author))
906 907 ui.write(('Branch: %s\n' % (cs.branch or 'HEAD')))
907 908 ui.write(('Tag%s: %s \n' % (['', 's'][len(cs.tags) > 1],
908 909 ','.join(cs.tags) or '(none)')))
909 910 if cs.branchpoints:
910 911 ui.write(('Branchpoints: %s \n') %
911 912 ', '.join(sorted(cs.branchpoints)))
912 913 if opts["parents"] and cs.parents:
913 914 if len(cs.parents) > 1:
914 915 ui.write(('Parents: %s\n' %
915 916 (','.join([str(p.id) for p in cs.parents]))))
916 917 else:
917 918 ui.write(('Parent: %d\n' % cs.parents[0].id))
918 919
919 920 if opts["ancestors"]:
920 921 b = cs.branch
921 922 r = []
922 923 while b:
923 924 b, c = ancestors[b]
924 925 r.append('%s:%d:%d' % (b or "HEAD", c, branches[b]))
925 926 if r:
926 927 ui.write(('Ancestors: %s\n' % (','.join(r))))
927 928
928 929 ui.write(('Log:\n'))
929 930 ui.write('%s\n\n' % cs.comment)
930 931 ui.write(('Members: \n'))
931 932 for f in cs.entries:
932 933 fn = f.file
933 934 if fn.startswith(opts["prefix"]):
934 935 fn = fn[len(opts["prefix"]):]
935 936 ui.write('\t%s:%s->%s%s \n' % (
936 937 fn, '.'.join([str(x) for x in f.parent]) or 'INITIAL',
937 938 '.'.join([str(x) for x in f.revision]),
938 939 ['', '(DEAD)'][f.dead]))
939 940 ui.write('\n')
940 941
941 942 # have we seen the start tag?
942 943 if revisions and off:
943 944 if revisions[0] == str(cs.id) or \
944 945 revisions[0] in cs.tags:
945 946 off = False
946 947
947 948 # see if we reached the end tag
948 949 if len(revisions) > 1 and not off:
949 950 if revisions[1] == str(cs.id) or \
950 951 revisions[1] in cs.tags:
951 952 break
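The added opts = pycompat.byteskwargs(opts) is the point of this changeset: on Python 3, **opts keys arrive as unicode str, while the code above indexes opts with bytes keys. The real helper lives in mercurial/pycompat.py; paraphrased, its Python 3 behaviour is roughly the following (on Python 2 it is an identity function):

    def byteskwargs(dic):
        # convert str keys back to the bytes keys the callee expects
        return dict((k.encode('latin-1'), v) for k, v in dic.items())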
@@ -1,371 +1,373 b''
1 1 # monotone.py - monotone support for the convert extension
2 2 #
3 3 # Copyright 2008, 2009 Mikkel Fahnoe Jorgensen <mikkel@dvide.com> and
4 4 # others
5 5 #
6 6 # This software may be used and distributed according to the terms of the
7 7 # GNU General Public License version 2 or any later version.
8 8 from __future__ import absolute_import
9 9
10 10 import os
11 11 import re
12 12
13 13 from mercurial.i18n import _
14 14 from mercurial import (
15 15 error,
16 pycompat,
16 17 util,
17 18 )
18 19
19 20 from . import common
20 21
21 22 class monotone_source(common.converter_source, common.commandline):
22 23 def __init__(self, ui, repotype, path=None, revs=None):
23 24 common.converter_source.__init__(self, ui, repotype, path, revs)
24 25 if revs and len(revs) > 1:
25 26 raise error.Abort(_('monotone source does not support specifying '
26 27 'multiple revs'))
27 28 common.commandline.__init__(self, ui, 'mtn')
28 29
29 30 self.ui = ui
30 31 self.path = path
31 32 self.automatestdio = False
32 33 self.revs = revs
33 34
34 35 norepo = common.NoRepo(_("%s does not look like a monotone repository")
35 36 % path)
36 37 if not os.path.exists(os.path.join(path, '_MTN')):
37 38 # Could be a monotone repository (SQLite db file)
38 39 try:
39 40                f = open(path, 'rb')
40 41 header = f.read(16)
41 42 f.close()
42 43 except IOError:
43 44 header = ''
44 45 if header != 'SQLite format 3\x00':
45 46 raise norepo
46 47
47 48 # regular expressions for parsing monotone output
48 49 space = r'\s*'
49 50 name = r'\s+"((?:\\"|[^"])*)"\s*'
50 51 value = name
51 52 revision = r'\s+\[(\w+)\]\s*'
52 53 lines = r'(?:.|\n)+'
53 54
54 55 self.dir_re = re.compile(space + "dir" + name)
55 56 self.file_re = re.compile(space + "file" + name +
56 57 "content" + revision)
57 58 self.add_file_re = re.compile(space + "add_file" + name +
58 59 "content" + revision)
59 60 self.patch_re = re.compile(space + "patch" + name +
60 61 "from" + revision + "to" + revision)
61 62 self.rename_re = re.compile(space + "rename" + name + "to" + name)
62 63 self.delete_re = re.compile(space + "delete" + name)
63 64 self.tag_re = re.compile(space + "tag" + name + "revision" +
64 65 revision)
65 66 self.cert_re = re.compile(lines + space + "name" + name +
66 67 "value" + value)
67 68
68 69 attr = space + "file" + lines + space + "attr" + space
69 70 self.attr_execute_re = re.compile(attr + '"mtn:execute"' +
70 71 space + '"true"')
71 72
72 73 # cached data
73 74 self.manifest_rev = None
74 75 self.manifest = None
75 76 self.files = None
76 77 self.dirs = None
77 78
78 79 common.checktool('mtn', abort=False)
79 80
80 81 def mtnrun(self, *args, **kwargs):
81 82 if self.automatestdio:
82 83 return self.mtnrunstdio(*args, **kwargs)
83 84 else:
84 85 return self.mtnrunsingle(*args, **kwargs)
85 86
86 87 def mtnrunsingle(self, *args, **kwargs):
87 88 kwargs['d'] = self.path
88 89 return self.run0('automate', *args, **kwargs)
89 90
90 91 def mtnrunstdio(self, *args, **kwargs):
91 92 # Prepare the command in automate stdio format
93 kwargs = pycompat.byteskwargs(kwargs)
92 94 command = []
93 95 for k, v in kwargs.iteritems():
94 96 command.append("%s:%s" % (len(k), k))
95 97 if v:
96 98 command.append("%s:%s" % (len(v), v))
97 99 if command:
98 100 command.insert(0, 'o')
99 101 command.append('e')
100 102
101 103 command.append('l')
102 104 for arg in args:
103 105            command.append("%s:%s" % (len(arg), arg))
104 106 command.append('e')
105 107 command = ''.join(command)
106 108
107 109 self.ui.debug("mtn: sending '%s'\n" % command)
108 110 self.mtnwritefp.write(command)
109 111 self.mtnwritefp.flush()
110 112
111 113 return self.mtnstdioreadcommandoutput(command)
112 114
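The framing built here is netstring-like: every token is encoded as '<length>:<value>', with options wrapped in an 'o' ... 'e' block and arguments in an 'l' ... 'e' block. A standalone re-derivation (encodestdio is an illustrative name):

    def encodestdio(args, options):
        out = []
        if options:
            out.append('o')
            for k, v in options.items():
                out.append('%d:%s' % (len(k), k))
                if v:
                    out.append('%d:%s' % (len(v), v))
            out.append('e')
        out.append('l')
        for arg in args:
            out.append('%d:%s' % (len(arg), arg))
        out.append('e')
        return ''.join(out)

    print(encodestdio(['leaves'], {}))   # l6:leavese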
113 115 def mtnstdioreadpacket(self):
114 116 read = None
115 117 commandnbr = ''
116 118 while read != ':':
117 119 read = self.mtnreadfp.read(1)
118 120 if not read:
119 121 raise error.Abort(_('bad mtn packet - no end of commandnbr'))
120 122 commandnbr += read
121 123 commandnbr = commandnbr[:-1]
122 124
123 125 stream = self.mtnreadfp.read(1)
124 126 if stream not in 'mewptl':
125 127 raise error.Abort(_('bad mtn packet - bad stream type %s') % stream)
126 128
127 129 read = self.mtnreadfp.read(1)
128 130 if read != ':':
129 131 raise error.Abort(_('bad mtn packet - no divider before size'))
130 132
131 133 read = None
132 134 lengthstr = ''
133 135 while read != ':':
134 136 read = self.mtnreadfp.read(1)
135 137 if not read:
136 138 raise error.Abort(_('bad mtn packet - no end of packet size'))
137 139 lengthstr += read
138 140 try:
139 141            length = int(lengthstr[:-1])
140 142        except ValueError:
141 143 raise error.Abort(_('bad mtn packet - bad packet size %s')
142 144 % lengthstr)
143 145
144 146 read = self.mtnreadfp.read(length)
145 147 if len(read) != length:
146 148 raise error.Abort(_("bad mtn packet - unable to read full packet "
147 149 "read %s of %s") % (len(read), length))
148 150
149 151 return (commandnbr, stream, length, read)
150 152
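Going the other way, each reply packet has the shape '<commandnbr>:<stream>:<length>:<payload>'. A toy parser over a complete buffer (the reader above necessarily works byte by byte on a pipe):

    def parsepacket(data):
        cmdnbr, stream, rest = data.split(':', 2)
        size, payload = rest.split(':', 1)
        return cmdnbr, stream, int(size), payload[:int(size)]

    print(parsepacket('0:m:6:leaves'))   # ('0', 'm', 6, 'leaves')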
151 153 def mtnstdioreadcommandoutput(self, command):
152 154 retval = []
153 155 while True:
154 156 commandnbr, stream, length, output = self.mtnstdioreadpacket()
155 157 self.ui.debug('mtn: read packet %s:%s:%s\n' %
156 158 (commandnbr, stream, length))
157 159
158 160 if stream == 'l':
159 161 # End of command
160 162 if output != '0':
161 163 raise error.Abort(_("mtn command '%s' returned %s") %
162 164 (command, output))
163 165 break
164 166 elif stream in 'ew':
165 167 # Error, warning output
166 168 self.ui.warn(_('%s error:\n') % self.command)
167 169 self.ui.warn(output)
168 170 elif stream == 'p':
169 171 # Progress messages
170 172 self.ui.debug('mtn: ' + output)
171 173 elif stream == 'm':
172 174 # Main stream - command output
173 175 retval.append(output)
174 176
175 177 return ''.join(retval)
176 178
177 179 def mtnloadmanifest(self, rev):
178 180 if self.manifest_rev == rev:
179 181 return
180 182 self.manifest = self.mtnrun("get_manifest_of", rev).split("\n\n")
181 183 self.manifest_rev = rev
182 184 self.files = {}
183 185 self.dirs = {}
184 186
185 187 for e in self.manifest:
186 188 m = self.file_re.match(e)
187 189 if m:
188 190 attr = ""
189 191 name = m.group(1)
190 192 node = m.group(2)
191 193 if self.attr_execute_re.match(e):
192 194 attr += "x"
193 195 self.files[name] = (node, attr)
194 196 m = self.dir_re.match(e)
195 197 if m:
196 198 self.dirs[m.group(1)] = True
197 199
198 200 def mtnisfile(self, name, rev):
199 201 # a non-file could be a directory or a deleted or renamed file
200 202 self.mtnloadmanifest(rev)
201 203 return name in self.files
202 204
203 205 def mtnisdir(self, name, rev):
204 206 self.mtnloadmanifest(rev)
205 207 return name in self.dirs
206 208
207 209 def mtngetcerts(self, rev):
208 210 certs = {"author":"<missing>", "date":"<missing>",
209 211 "changelog":"<missing>", "branch":"<missing>"}
210 212 certlist = self.mtnrun("certs", rev)
211 213 # mtn < 0.45:
212 214 # key "test@selenic.com"
213 215 # mtn >= 0.45:
214 216 # key [ff58a7ffb771907c4ff68995eada1c4da068d328]
215 217 certlist = re.split('\n\n key ["\[]', certlist)
216 218 for e in certlist:
217 219 m = self.cert_re.match(e)
218 220 if m:
219 221 name, value = m.groups()
220 222 value = value.replace(r'\"', '"')
221 223 value = value.replace(r'\\', '\\')
222 224 certs[name] = value
223 225 # Monotone may have subsecond dates: 2005-02-05T09:39:12.364306
224 226 # and all times are stored in UTC
225 227 certs["date"] = certs["date"].split('.')[0] + " UTC"
226 228 return certs
227 229
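The subsecond handling at the end is plain string surgery on the date cert; with the sample value from the comment above:

    date = "2005-02-05T09:39:12.364306"
    print(date.split('.')[0] + " UTC")   # 2005-02-05T09:39:12 UTC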
228 230 # implement the converter_source interface:
229 231
230 232 def getheads(self):
231 233 if not self.revs:
232 234 return self.mtnrun("leaves").splitlines()
233 235 else:
234 236 return self.revs
235 237
236 238 def getchanges(self, rev, full):
237 239 if full:
238 240 raise error.Abort(_("convert from monotone does not support "
239 241 "--full"))
240 242 revision = self.mtnrun("get_revision", rev).split("\n\n")
241 243 files = {}
242 244 ignoremove = {}
243 245 renameddirs = []
244 246 copies = {}
245 247 for e in revision:
246 248 m = self.add_file_re.match(e)
247 249 if m:
248 250 files[m.group(1)] = rev
249 251 ignoremove[m.group(1)] = rev
250 252 m = self.patch_re.match(e)
251 253 if m:
252 254 files[m.group(1)] = rev
253 255 # Delete/rename is handled later when the convert engine
254 256 # discovers an IOError exception from getfile,
255 257 # but only if we add the "from" file to the list of changes.
256 258 m = self.delete_re.match(e)
257 259 if m:
258 260 files[m.group(1)] = rev
259 261 m = self.rename_re.match(e)
260 262 if m:
261 263 toname = m.group(2)
262 264 fromname = m.group(1)
263 265 if self.mtnisfile(toname, rev):
264 266 ignoremove[toname] = 1
265 267 copies[toname] = fromname
266 268 files[toname] = rev
267 269 files[fromname] = rev
268 270 elif self.mtnisdir(toname, rev):
269 271 renameddirs.append((fromname, toname))
270 272
271 273 # Directory renames can be handled only once we have recorded
272 274 # all new files
273 275 for fromdir, todir in renameddirs:
274 276 renamed = {}
275 277 for tofile in self.files:
276 278 if tofile in ignoremove:
277 279 continue
278 280 if tofile.startswith(todir + '/'):
279 281 renamed[tofile] = fromdir + tofile[len(todir):]
280 282 # Avoid chained moves like:
281 283 # d1(/a) => d3/d1(/a)
282 284 # d2 => d3
283 285 ignoremove[tofile] = 1
284 286 for tofile, fromfile in renamed.items():
285 287                self.ui.debug(_("copying file in renamed directory "
286 288                                "from '%s' to '%s'")
287 289                              % (fromfile, tofile), '\n')
288 290 files[tofile] = rev
289 291 copies[tofile] = fromfile
290 292 for fromfile in renamed.values():
291 293 files[fromfile] = rev
292 294
293 295 return (files.items(), copies, set())
294 296
295 297 def getfile(self, name, rev):
296 298 if not self.mtnisfile(name, rev):
297 299 return None, None
298 300 try:
299 301 data = self.mtnrun("get_file_of", name, r=rev)
300 302 except Exception:
301 303 return None, None
302 304 self.mtnloadmanifest(rev)
303 305 node, attr = self.files.get(name, (None, ""))
304 306 return data, attr
305 307
306 308 def getcommit(self, rev):
307 309 extra = {}
308 310 certs = self.mtngetcerts(rev)
309 311 if certs.get('suspend') == certs["branch"]:
310 312 extra['close'] = 1
311 313 return common.commit(
312 314 author=certs["author"],
313 315 date=util.datestr(util.strdate(certs["date"], "%Y-%m-%dT%H:%M:%S")),
314 316 desc=certs["changelog"],
315 317 rev=rev,
316 318 parents=self.mtnrun("parents", rev).splitlines(),
317 319 branch=certs["branch"],
318 320 extra=extra)
319 321
320 322 def gettags(self):
321 323 tags = {}
322 324 for e in self.mtnrun("tags").split("\n\n"):
323 325 m = self.tag_re.match(e)
324 326 if m:
325 327 tags[m.group(1)] = m.group(2)
326 328 return tags
327 329
328 330 def getchangedfiles(self, rev, i):
329 331 # This function is only needed to support --filemap
330 332 # ... and we don't support that
331 333 raise NotImplementedError
332 334
333 335 def before(self):
334 336 # Check if we have a new enough version to use automate stdio
335 337 version = 0.0
336 338 try:
337 339 versionstr = self.mtnrunsingle("interface_version")
338 340 version = float(versionstr)
339 341 except Exception:
340 342 raise error.Abort(_("unable to determine mtn automate interface "
341 343 "version"))
342 344
343 345 if version >= 12.0:
344 346 self.automatestdio = True
345 347 self.ui.debug("mtn automate version %s - using automate stdio\n" %
346 348 version)
347 349
348 350 # launch the long-running automate stdio process
349 351 self.mtnwritefp, self.mtnreadfp = self._run2('automate', 'stdio',
350 352 '-d', self.path)
351 353 # read the headers
352 354 read = self.mtnreadfp.readline()
353 355 if read != 'format-version: 2\n':
354 356 raise error.Abort(_('mtn automate stdio header unexpected: %s')
355 357 % read)
356 358 while read != '\n':
357 359 read = self.mtnreadfp.readline()
358 360 if not read:
359 361 raise error.Abort(_("failed to reach end of mtn automate "
360 362 "stdio headers"))
361 363 else:
362 364 self.ui.debug("mtn automate version %s - not using automate stdio "
363 365 "(automate >= 12.0 - mtn >= 0.46 is needed)\n" % version)
364 366
365 367 def after(self):
366 368 if self.automatestdio:
367 369 self.mtnwritefp.close()
368 370 self.mtnwritefp = None
369 371 self.mtnreadfp.close()
370 372 self.mtnreadfp = None
371 373