##// END OF EJS Templates
convert: use set instead of dict
Benoit Boissinot -
r8456:e9e2a2c9 default
parent child Browse files
Show More
@@ -1,351 +1,351
1 1 # convcmd - convert extension commands definition
2 2 #
3 3 # Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
4 4 #
5 5 # This software may be used and distributed according to the terms of the
6 6 # GNU General Public License version 2, incorporated herein by reference.
7 7
8 8 from common import NoRepo, MissingTool, SKIPREV, mapfile
9 9 from cvs import convert_cvs
10 10 from darcs import darcs_source
11 11 from git import convert_git
12 12 from hg import mercurial_source, mercurial_sink
13 13 from subversion import svn_source, svn_sink
14 14 from monotone import monotone_source
15 15 from gnuarch import gnuarch_source
16 16 from bzr import bzr_source
17 17 from p4 import p4_source
18 18 import filemap
19 19
20 20 import os, shutil
21 21 from mercurial import hg, util, encoding
22 22 from mercurial.i18n import _
23 23
# Local encoding in effect before convert() switches encoding.encoding to
# UTF-8; recode() uses it to render log messages back in the user's encoding.
orig_encoding = 'ascii'
25 25
def recode(s):
    """Return *s* re-encoded into the pre-convert local encoding.

    Unicode input is encoded directly; byte strings are assumed to be
    UTF-8 and transcoded.  Unrepresentable characters are replaced.
    """
    if not isinstance(s, unicode):
        s = s.decode('utf-8')
    return s.encode(orig_encoding, 'replace')
31 31
# Ordered (name, constructor) pairs tried by convertsource().  Order matters:
# when no explicit source type is requested, the first converter that accepts
# the path wins.
source_converters = [
    ('cvs', convert_cvs),
    ('git', convert_git),
    ('svn', svn_source),
    ('hg', mercurial_source),
    ('darcs', darcs_source),
    ('mtn', monotone_source),
    ('gnuarch', gnuarch_source),
    ('bzr', bzr_source),
    ('p4', p4_source),
    ]

# Ordered (name, constructor) pairs tried by convertsink().
sink_converters = [
    ('hg', mercurial_sink),
    ('svn', svn_sink),
    ]
48 48
49 49 def convertsource(ui, path, type, rev):
50 50 exceptions = []
51 51 for name, source in source_converters:
52 52 try:
53 53 if not type or name == type:
54 54 return source(ui, path, rev)
55 55 except (NoRepo, MissingTool), inst:
56 56 exceptions.append(inst)
57 57 if not ui.quiet:
58 58 for inst in exceptions:
59 59 ui.write("%s\n" % inst)
60 60 raise util.Abort(_('%s: missing or unsupported repository') % path)
61 61
62 62 def convertsink(ui, path, type):
63 63 for name, sink in sink_converters:
64 64 try:
65 65 if not type or name == type:
66 66 return sink(ui, path)
67 67 except NoRepo, inst:
68 68 ui.note(_("convert: %s\n") % inst)
69 69 raise util.Abort(_('%s: unknown repository type') % path)
70 70
class converter(object):
    """Drive a conversion: walk the source history, topologically sort it,
    and replay each revision into the sink, maintaining a persistent
    source-rev -> sink-rev map for incremental runs."""

    def __init__(self, ui, source, dest, revmapfile, opts):

        self.source = source
        self.dest = dest
        self.ui = ui
        self.opts = opts
        self.commitcache = {}
        self.authors = {}
        self.authorfile = None

        # Record converted revisions persistently: maps source revision
        # ID to target revision ID (both strings).  (This is how
        # incremental conversions work.)
        self.map = mapfile(ui, revmapfile)

        # Read first the dst author map if any
        authorfile = self.dest.authorfile()
        if authorfile and os.path.exists(authorfile):
            self.readauthormap(authorfile)
        # Extend/Override with new author map if necessary
        if opts.get('authors'):
            self.readauthormap(opts.get('authors'))
            self.authorfile = self.dest.authorfile()

        self.splicemap = mapfile(ui, opts.get('splicemap'))
        self.branchmap = mapfile(ui, opts.get('branchmap'))

    def walktree(self, heads):
        '''Return a mapping that identifies the uncommitted parents of every
        uncommitted changeset.'''
        visit = heads
        # use a set for membership tests; already-converted revs (in
        # self.map) are skipped so incremental conversion works
        known = set()
        parents = {}
        while visit:
            n = visit.pop(0)
            if n in known or n in self.map:
                continue
            known.add(n)
            commit = self.cachecommit(n)
            parents[n] = []
            for p in commit.parents:
                parents[n].append(p)
                visit.append(p)

        return parents

    def toposort(self, parents):
        '''Return an ordering such that every uncommitted changeset is
        preceeded by all its uncommitted ancestors.'''
        visit = parents.keys()
        seen = set()
        children = {}
        actives = []

        while visit:
            n = visit.pop(0)
            if n in seen:
                continue
            seen.add(n)
            # Ensure that nodes without parents are present in the 'children'
            # mapping.
            children.setdefault(n, [])
            hasparent = False
            for p in parents[n]:
                if not p in self.map:
                    visit.append(p)
                    hasparent = True
                children.setdefault(p, []).append(n)
            if not hasparent:
                actives.append(n)

        del seen
        del visit

        if self.opts.get('datesort'):
            dates = {}
            def getdate(n):
                # memoize parsed dates; parsing is not free
                if n not in dates:
                    dates[n] = util.parsedate(self.commitcache[n].date)
                return dates[n]

            def picknext(nodes):
                return min([(getdate(n), n) for n in nodes])[1]
        else:
            prev = [None]
            def picknext(nodes):
                # Return the first eligible child of the previously converted
                # revision, or any of them.
                next = nodes[0]
                for n in nodes:
                    if prev[0] in parents[n]:
                        next = n
                        break
                prev[0] = next
                return next

        s = []
        pendings = {}
        while actives:
            n = picknext(actives)
            actives.remove(n)
            s.append(n)

            # Update dependents list
            for c in children.get(n, []):
                if c not in pendings:
                    pendings[c] = [p for p in parents[c] if p not in self.map]
                try:
                    pendings[c].remove(n)
                except ValueError:
                    raise util.Abort(_('cycle detected between %s and %s')
                                       % (recode(c), recode(n)))
                if not pendings[c]:
                    # Parents are converted, node is eligible
                    actives.insert(0, c)
                    pendings[c] = None

        if len(s) != len(parents):
            raise util.Abort(_("not all revisions were sorted"))

        return s

    def writeauthormap(self):
        """Persist the accumulated author map to self.authorfile, if set."""
        authorfile = self.authorfile
        if authorfile:
            self.ui.status(_('Writing author map file %s\n') % authorfile)
            ofile = open(authorfile, 'w+')
            for author in self.authors:
                ofile.write("%s=%s\n" % (author, self.authors[author]))
            ofile.close()

    def readauthormap(self, authorfile):
        """Merge 'src=dst' author mappings from *authorfile* into
        self.authors, warning on malformed lines and reporting overrides."""
        afile = open(authorfile, 'r')
        for line in afile:

            line = line.strip()
            if not line or line.startswith('#'):
                continue

            try:
                srcauthor, dstauthor = line.split('=', 1)
            except ValueError:
                msg = _('Ignoring bad line in author map file %s: %s\n')
                self.ui.warn(msg % (authorfile, line.rstrip()))
                continue

            srcauthor = srcauthor.strip()
            dstauthor = dstauthor.strip()
            # unseen key or identical remapping: just record it
            if self.authors.get(srcauthor) in (None, dstauthor):
                msg = _('mapping author %s to %s\n')
                self.ui.debug(msg % (srcauthor, dstauthor))
                self.authors[srcauthor] = dstauthor
                continue

            m = _('overriding mapping for author %s, was %s, will be %s\n')
            self.ui.status(m % (srcauthor, self.authors[srcauthor], dstauthor))

        afile.close()

    def cachecommit(self, rev):
        """Fetch *rev* from the source, apply author/branch maps, cache it."""
        commit = self.source.getcommit(rev)
        commit.author = self.authors.get(commit.author, commit.author)
        commit.branch = self.branchmap.get(commit.branch, commit.branch)
        self.commitcache[rev] = commit
        return commit

    def copy(self, rev):
        """Replay source revision *rev* into the sink and record the
        resulting node in self.map."""
        commit = self.commitcache[rev]

        changes = self.source.getchanges(rev)
        # a string result means "reuse/skip": SKIPREV or an alias rev
        if isinstance(changes, basestring):
            if changes == SKIPREV:
                dest = SKIPREV
            else:
                dest = self.map[changes]
            self.map[rev] = dest
            return
        files, copies = changes
        pbranches = []
        if commit.parents:
            for prev in commit.parents:
                if prev not in self.commitcache:
                    self.cachecommit(prev)
                pbranches.append((self.map[prev],
                                  self.commitcache[prev].branch))
        self.dest.setbranch(commit.branch, pbranches)
        try:
            # splicemap overrides parents; KeyError means no splice for rev
            parents = self.splicemap[rev].replace(',', ' ').split()
            self.ui.status(_('spliced in %s as parents of %s\n') %
                           (parents, rev))
            parents = [self.map.get(p, p) for p in parents]
        except KeyError:
            parents = [b[0] for b in pbranches]
        newnode = self.dest.putcommit(files, copies, parents, commit, self.source)
        self.source.converted(rev, newnode)
        self.map[rev] = newnode

    def convert(self):
        """Run the whole conversion: scan, sort, copy revisions, tags and
        author map; always clean up source/sink state afterwards."""
        try:
            self.source.before()
            self.dest.before()
            self.source.setrevmap(self.map)
            self.ui.status(_("scanning source...\n"))
            heads = self.source.getheads()
            parents = self.walktree(heads)
            self.ui.status(_("sorting...\n"))
            t = self.toposort(parents)
            num = len(t)
            c = None

            self.ui.status(_("converting...\n"))
            for c in t:
                num -= 1
                desc = self.commitcache[c].desc
                if "\n" in desc:
                    desc = desc.splitlines()[0]
                # convert log message to local encoding without using
                # tolocal() because encoding.encoding conver() use it as
                # 'utf-8'
                self.ui.status("%d %s\n" % (num, recode(desc)))
                self.ui.note(_("source: %s\n") % recode(c))
                self.copy(c)

            tags = self.source.gettags()
            ctags = {}
            for k in tags:
                v = tags[k]
                if self.map.get(v, SKIPREV) != SKIPREV:
                    ctags[k] = self.map[v]

            if c and ctags:
                nrev = self.dest.puttags(ctags)
                # write another hash correspondence to override the previous
                # one so we don't end up with extra tag heads
                if nrev:
                    self.map[c] = nrev

            self.writeauthormap()
        finally:
            self.cleanup()

    def cleanup(self):
        """Tear down sink then source, then close the revision map."""
        try:
            self.dest.after()
        finally:
            self.source.after()
        self.map.close()
318 318
def convert(ui, src, dest=None, revmapfile=None, **opts):
    """Entry point: convert repository *src* into *dest*.

    *dest* defaults to "<defaultdest>-hg"; *revmapfile* defaults to the
    sink's own revmap location.  Runs the whole pipeline under a UTF-8
    internal encoding, restoring log output via recode().
    """
    global orig_encoding
    orig_encoding = encoding.encoding
    encoding.encoding = 'UTF-8'

    if not dest:
        dest = hg.defaultdest(src) + "-hg"
        ui.status(_("assuming destination %s\n") % dest)

    destc = convertsink(ui, dest, opts.get('dest_type'))

    try:
        srcc = convertsource(ui, src, opts.get('source_type'),
                             opts.get('rev'))
    except Exception:
        # remove anything the sink created before failing
        for path in destc.created:
            shutil.rmtree(path, True)
        raise

    fmap = opts.get('filemap')
    if fmap:
        srcc = filemap.filemap_source(ui, srcc, fmap)
        destc.setfilemapmode(True)

    if not revmapfile:
        try:
            revmapfile = destc.revmapfile()
        # narrowed from a bare "except:" which also swallowed
        # KeyboardInterrupt/SystemExit
        except Exception:
            revmapfile = os.path.join(destc, "map")

    c = converter(ui, srcc, destc, revmapfile, opts)
    c.convert()
351 351
@@ -1,782 +1,781
1 1 #
2 2 # Mercurial built-in replacement for cvsps.
3 3 #
4 4 # Copyright 2008, Frank Kingswood <frank@kingswood-consulting.co.uk>
5 5 #
6 6 # This software may be used and distributed according to the terms of the
7 7 # GNU General Public License version 2, incorporated herein by reference.
8 8
9 9 import os
10 10 import re
11 11 import cPickle as pickle
12 12 from mercurial import util
13 13 from mercurial.i18n import _
14 14
def listsort(list, key):
    """Sort *list* in place by *key*, tolerating Python 2.3.

    Python 2.3's list.sort() lacks the key= argument; when it is
    rejected with TypeError, emulate it with a comparison function.
    """
    try:
        list.sort(key=key)
    except TypeError:
        # pre-2.4 fallback: derive a cmp function from the key
        list.sort(lambda a, b: cmp(key(a), key(b)))
21 21
class logentry(object):
    '''A single CVS file revision parsed from (r)log output.

    Attributes:
    .author    - author name as CVS knows it
    .branch    - name of branch this revision is on
    .branches  - revision tuple of branches starting at this revision
    .comment   - commit message
    .date      - the commit date as a (time, tz) tuple
    .dead      - true if file revision is dead
    .file      - name of file
    .lines     - a tuple (+lines, -lines) or None
    .parent    - previous revision of this entry
    .rcs       - name of file as returned from CVS
    .revision  - revision number as tuple
    .tags      - list of tags on the file
    .synthetic - is this a synthetic "file ... added on ..." revision?
    .mergepoint- the branch that has been merged from (if present in rlog output)
    '''
    def __init__(self, **entries):
        self.__dict__.update(entries)

    def __repr__(self):
        rev = ".".join(map(str, self.revision))
        return "<%s at 0x%x: %s %s>" % (self.__class__.__name__,
                                        id(self), self.file, rev)
47 47
class logerror(Exception):
    """Raised when CVS (r)log output cannot be collected or parsed."""
50 50
def getrepopath(cvspath):
    """Return the repository path from a CVS path.

    >>> getrepopath('/foo/bar')
    '/foo/bar'
    >>> getrepopath('c:/foo/bar')
    'c:/foo/bar'
    >>> getrepopath(':pserver:10/foo/bar')
    '/foo/bar'
    >>> getrepopath(':pserver:10c:/foo/bar')
    '/foo/bar'
    >>> getrepopath(':pserver:/foo/bar')
    '/foo/bar'
    >>> getrepopath(':pserver:c:/foo/bar')
    'c:/foo/bar'
    >>> getrepopath(':pserver:truc@foo.bar:/foo/bar')
    '/foo/bar'
    >>> getrepopath(':pserver:truc@foo.bar:c:/foo/bar')
    'c:/foo/bar'
    """
    # According to CVS manual, CVS paths are expressed like:
    # [:method:][[user][:password]@]hostname[:[port]]/path/to/repository
    #
    # Windows absolute paths start with a one-letter drive component
    # ('c:'), while every other CVS component before the repository path
    # is at least 2 characters long; that asymmetry disambiguates.
    pieces = cvspath.split(':')
    if len(pieces) == 1:
        return pieces[0]
    tail = pieces[-1]
    penultimate = pieces[-2]
    if len(penultimate) > 1:
        # ordinary CVS component before the path; a leading port number
        # fused onto the path is stripped (ambiguous port+drive case is
        # assumed never to happen)
        return tail.lstrip('0123456789')
    # one-character component: a Windows drive letter, rejoin it
    return penultimate + ':' + tail
89 89
def createlog(ui, directory=None, root="", rlog=True, cache=None):
    '''Collect the CVS rlog.

    Runs 'cvs rlog' (or 'cvs log' when rlog is False) for *directory*
    under repository *root* and parses the output with a line-oriented
    state machine, returning a list of logentry objects.  With
    cache='update', a previously pickled log is loaded and only newer
    entries are fetched and appended.
    '''

    # Because we store many duplicate commit log messages, reusing strings
    # saves a lot of memory and pickle storage space.
    _scache = {}
    def scache(s):
        "return a shared version of a string"
        return _scache.setdefault(s, s)

    ui.status(_('collecting CVS rlog\n'))

    log = []      # list of logentry objects containing the CVS state

    # patterns to match in CVS (r)log output, by state of use
    re_00 = re.compile('RCS file: (.+)$')
    re_01 = re.compile('cvs \\[r?log aborted\\]: (.+)$')
    re_02 = re.compile('cvs (r?log|server): (.+)\n$')
    re_03 = re.compile("(Cannot access.+CVSROOT)|(can't create temporary directory.+)$")
    re_10 = re.compile('Working file: (.+)$')
    re_20 = re.compile('symbolic names:')
    re_30 = re.compile('\t(.+): ([\\d.]+)$')
    re_31 = re.compile('----------------------------$')
    re_32 = re.compile('=============================================================================$')
    re_50 = re.compile('revision ([\\d.]+)(\s+locked by:\s+.+;)?$')
    re_60 = re.compile(r'date:\s+(.+);\s+author:\s+(.+);\s+state:\s+(.+?);(\s+lines:\s+(\+\d+)?\s+(-\d+)?;)?(.*mergepoint:\s+([^;]+);)?')
    re_70 = re.compile('branches: (.+);$')

    file_added_re = re.compile(r'file [^/]+ was (initially )?added on branch')

    prefix = ''   # leading path to strip of what we get from CVS

    if directory is None:
        # Current working directory

        # Get the real directory in the repository
        try:
            prefix = file(os.path.join('CVS','Repository')).read().strip()
            if prefix == ".":
                prefix = ""
            directory = prefix
        except IOError:
            raise logerror('Not a CVS sandbox')

        if prefix and not prefix.endswith(os.sep):
            prefix += os.sep

        # Use the Root file in the sandbox, if it exists
        try:
            root = file(os.path.join('CVS','Root')).read().strip()
        except IOError:
            pass

    if not root:
        root = os.environ.get('CVSROOT', '')

    # read log cache if one exists
    oldlog = []
    date = None

    if cache:
        cachedir = os.path.expanduser('~/.hg.cvsps')
        if not os.path.exists(cachedir):
            os.mkdir(cachedir)

        # The cvsps cache pickle needs a uniquified name, based on the
        # repository location. The address may have all sort of nasties
        # in it, slashes, colons and such. So here we take just the
        # alphanumerics, concatenated in a way that does not mix up the
        # various components, so that
        #    :pserver:user@server:/path
        # and
        #    /pserver/user/server/path
        # are mapped to different cache file names.
        cachefile = root.split(":") + [directory, "cache"]
        cachefile = ['-'.join(re.findall(r'\w+', s)) for s in cachefile if s]
        cachefile = os.path.join(cachedir,
                                 '.'.join([s for s in cachefile if s]))

        if cache == 'update':
            try:
                ui.note(_('reading cvs log cache %s\n') % cachefile)
                oldlog = pickle.load(file(cachefile))
                ui.note(_('cache has %d log entries\n') % len(oldlog))
            except Exception, e:
                # best-effort cache: any load failure just means a full fetch
                ui.note(_('error reading cache: %r\n') % e)

            if oldlog:
                date = oldlog[-1].date    # last commit date as a (time,tz) tuple
                date = util.datestr(date, '%Y/%m/%d %H:%M:%S %1%2')

    # build the CVS commandline
    cmd = ['cvs', '-q']
    if root:
        cmd.append('-d%s' % root)
        p = util.normpath(getrepopath(root))
        if not p.endswith('/'):
            p += '/'
        prefix = p + util.normpath(prefix)
    cmd.append(['log', 'rlog'][rlog])
    if date:
        # no space between option and date string
        cmd.append('-d>%s' % date)
    cmd.append(directory)

    # state machine begins here
    # states: 0 wait for 'RCS file', 1 wait for 'Working file',
    # 2 wait for 'symbolic names', 3 read tags, 4 wait for separator,
    # 5 read revision number, 6 read date/author line,
    # 7 read branches or comment, 8 read comment
    tags = {}     # dictionary of revisions on current file with their tags
    branchmap = {} # mapping between branch names and revision numbers
    state = 0
    store = False # set when a new record can be appended

    cmd = [util.shellquote(arg) for arg in cmd]
    ui.note(_("running %s\n") % (' '.join(cmd)))
    ui.debug(_("prefix=%r directory=%r root=%r\n") % (prefix, directory, root))

    pfp = util.popen(' '.join(cmd))
    peek = pfp.readline()
    while True:
        line = peek
        if line == '':
            break
        peek = pfp.readline()
        if line.endswith('\n'):
            line = line[:-1]
        #ui.debug('state=%d line=%r\n' % (state, line))

        if state == 0:
            # initial state, consume input until we see 'RCS file'
            match = re_00.match(line)
            if match:
                rcs = match.group(1)
                tags = {}
                if rlog:
                    # strip repository prefix and Attic/ component to get
                    # the working file name
                    filename = util.normpath(rcs[:-2])
                    if filename.startswith(prefix):
                        filename = filename[len(prefix):]
                    if filename.startswith('/'):
                        filename = filename[1:]
                    if filename.startswith('Attic/'):
                        filename = filename[6:]
                    else:
                        filename = filename.replace('/Attic/', '/')
                    state = 2
                    continue
                state = 1
                continue
            match = re_01.match(line)
            if match:
                raise Exception(match.group(1))
            match = re_02.match(line)
            if match:
                raise Exception(match.group(2))
            if re_03.match(line):
                raise Exception(line)

        elif state == 1:
            # expect 'Working file' (only when using log instead of rlog)
            match = re_10.match(line)
            assert match, _('RCS file must be followed by working file')
            filename = util.normpath(match.group(1))
            state = 2

        elif state == 2:
            # expect 'symbolic names'
            if re_20.match(line):
                branchmap = {}
                state = 3

        elif state == 3:
            # read the symbolic names and store as tags
            match = re_30.match(line)
            if match:
                rev = [int(x) for x in match.group(2).split('.')]

                # Convert magic branch number to an odd-numbered one
                revn = len(rev)
                if revn > 3 and (revn % 2) == 0 and rev[-2] == 0:
                    rev = rev[:-2] + rev[-1:]
                rev = tuple(rev)

                if rev not in tags:
                    tags[rev] = []
                tags[rev].append(match.group(1))
                branchmap[match.group(1)] = match.group(2)

            elif re_31.match(line):
                state = 5
            elif re_32.match(line):
                state = 0

        elif state == 4:
            # expecting '------' separator before first revision
            if re_31.match(line):
                state = 5
            else:
                assert not re_32.match(line), _('must have at least some revisions')

        elif state == 5:
            # expecting revision number and possibly (ignored) lock indication
            # we create the logentry here from values stored in states 0 to 4,
            # as this state is re-entered for subsequent revisions of a file.
            match = re_50.match(line)
            assert match, _('expected revision number')
            e = logentry(rcs=scache(rcs), file=scache(filename),
                    revision=tuple([int(x) for x in match.group(1).split('.')]),
                    branches=[], parent=None,
                    synthetic=False)
            state = 6

        elif state == 6:
            # expecting date, author, state, lines changed
            match = re_60.match(line)
            assert match, _('revision must be followed by date line')
            d = match.group(1)
            if d[2] == '/':
                # Y2K
                d = '19' + d

            if len(d.split()) != 3:
                # cvs log dates always in GMT
                d = d + ' UTC'
            e.date = util.parsedate(d, ['%y/%m/%d %H:%M:%S', '%Y/%m/%d %H:%M:%S', '%Y-%m-%d %H:%M:%S'])
            e.author = scache(match.group(2))
            e.dead = match.group(3).lower() == 'dead'

            if match.group(5):
                if match.group(6):
                    e.lines = (int(match.group(5)), int(match.group(6)))
                else:
                    e.lines = (int(match.group(5)), 0)
            elif match.group(6):
                e.lines = (0, int(match.group(6)))
            else:
                e.lines = None

            if match.group(7): # cvsnt mergepoint
                myrev = match.group(8).split('.')
                if len(myrev) == 2: # head
                    e.mergepoint = 'HEAD'
                else:
                    myrev = '.'.join(myrev[:-2] + ['0', myrev[-2]])
                    branches = [b for b in branchmap if branchmap[b] == myrev]
                    assert len(branches) == 1, 'unknown branch: %s' % e.mergepoint
                    e.mergepoint = branches[0]
            else:
                e.mergepoint = None
            e.comment = []
            state = 7

        elif state == 7:
            # read the revision numbers of branches that start at this revision
            # or store the commit log message otherwise
            m = re_70.match(line)
            if m:
                e.branches = [tuple([int(y) for y in x.strip().split('.')])
                              for x in m.group(1).split(';')]
                state = 8
            elif re_31.match(line) and re_50.match(peek):
                state = 5
                store = True
            elif re_32.match(line):
                state = 0
                store = True
            else:
                e.comment.append(line)

        elif state == 8:
            # store commit log message
            if re_31.match(line):
                state = 5
                store = True
            elif re_32.match(line):
                state = 0
                store = True
            else:
                e.comment.append(line)

        # When a file is added on a branch B1, CVS creates a synthetic
        # dead trunk revision 1.1 so that the branch has a root.
        # Likewise, if you merge such a file to a later branch B2 (one
        # that already existed when the file was added on B1), CVS
        # creates a synthetic dead revision 1.1.x.1 on B2.  Don't drop
        # these revisions now, but mark them synthetic so
        # createchangeset() can take care of them.
        if (store and
              e.dead and
              e.revision[-1] == 1 and      # 1.1 or 1.1.x.1
              len(e.comment) == 1 and
              file_added_re.match(e.comment[0])):
            ui.debug(_('found synthetic revision in %s: %r\n')
                     % (e.rcs, e.comment[0]))
            e.synthetic = True

        if store:
            # clean up the results and save in the log.
            store = False
            e.tags = sorted([scache(x) for x in tags.get(e.revision, [])])
            e.comment = scache('\n'.join(e.comment))

            revn = len(e.revision)
            if revn > 3 and (revn % 2) == 0:
                e.branch = tags.get(e.revision[:-1], [None])[0]
            else:
                e.branch = None

            log.append(e)

            if len(log) % 100 == 0:
                ui.status(util.ellipsis('%d %s' % (len(log), e.file), 80)+'\n')

    listsort(log, key=lambda x:(x.rcs, x.revision))

    # find parent revisions of individual files
    versions = {}
    for e in log:
        branch = e.revision[:-1]
        p = versions.get((e.rcs, branch), None)
        if p is None:
            p = e.revision[:-2]
        e.parent = p
        versions[(e.rcs, branch)] = e.revision

    # update the log cache
    if cache:
        if log:
            # join up the old and new logs
            listsort(log, key=lambda x:x.date)

            if oldlog and oldlog[-1].date >= log[0].date:
                raise logerror('Log cache overlaps with new log entries,'
                               ' re-run without cache.')

            log = oldlog + log

            # write the new cachefile
            ui.note(_('writing cvs log cache %s\n') % cachefile)
            pickle.dump(log, file(cachefile, 'w'))
        else:
            log = oldlog

    ui.status(_('%d log entries\n') % len(log))

    return log
433 433
434 434
class changeset(object):
    '''A converted changeset grouping one or more logentries.

    Attributes:
    .id        - integer identifying this changeset (list index)
    .author    - author name as CVS knows it
    .branch    - name of branch this changeset is on, or None
    .comment   - commit message
    .date      - the commit date as a (time,tz) tuple
    .entries   - list of logentry objects in this changeset
    .parents   - list of one or two parent changesets
    .tags      - list of tags on this changeset
    .synthetic - from synthetic revision "file ... added on branch ..."
    .mergepoint- the branch that has been merged from (if present in rlog output)
    '''
    def __init__(self, **entries):
        self.__dict__.update(entries)

    def __repr__(self):
        ident = getattr(self, 'id', "(no id)")
        return "<%s at 0x%x: %s>" % (self.__class__.__name__,
                                     id(self), ident)
455 455
456 456 def createchangeset(ui, log, fuzz=60, mergefrom=None, mergeto=None):
457 457 '''Convert log into changesets.'''
458 458
459 459 ui.status(_('creating changesets\n'))
460 460
461 461 # Merge changesets
462 462
463 463 listsort(log, key=lambda x:(x.comment, x.author, x.branch, x.date))
464 464
465 465 changesets = []
466 files = {}
466 files = set()
467 467 c = None
468 468 for i, e in enumerate(log):
469 469
470 470 # Check if log entry belongs to the current changeset or not.
471 471 if not (c and
472 472 e.comment == c.comment and
473 473 e.author == c.author and
474 474 e.branch == c.branch and
475 475 ((c.date[0] + c.date[1]) <=
476 476 (e.date[0] + e.date[1]) <=
477 477 (c.date[0] + c.date[1]) + fuzz) and
478 478 e.file not in files):
479 479 c = changeset(comment=e.comment, author=e.author,
480 480 branch=e.branch, date=e.date, entries=[],
481 481 mergepoint=getattr(e, 'mergepoint', None))
482 482 changesets.append(c)
483 files = {}
483 files = set()
484 484 if len(changesets) % 100 == 0:
485 485 t = '%d %s' % (len(changesets), repr(e.comment)[1:-1])
486 486 ui.status(util.ellipsis(t, 80) + '\n')
487 487
488 488 c.entries.append(e)
489 files[e.file] = True
489 files.add(e.file)
490 490 c.date = e.date # changeset date is date of latest commit in it
491 491
492 492 # Mark synthetic changesets
493 493
494 494 for c in changesets:
495 495 # Synthetic revisions always get their own changeset, because
496 496 # the log message includes the filename. E.g. if you add file3
497 497 # and file4 on a branch, you get four log entries and three
498 498 # changesets:
499 499 # "File file3 was added on branch ..." (synthetic, 1 entry)
500 500 # "File file4 was added on branch ..." (synthetic, 1 entry)
501 501 # "Add file3 and file4 to fix ..." (real, 2 entries)
502 502 # Hence the check for 1 entry here.
503 503 synth = getattr(c.entries[0], 'synthetic', None)
504 504 c.synthetic = (len(c.entries) == 1 and synth)
505 505
506 506 # Sort files in each changeset
507 507
508 508 for c in changesets:
509 509 def pathcompare(l, r):
510 510 'Mimic cvsps sorting order'
511 511 l = l.split('/')
512 512 r = r.split('/')
513 513 nl = len(l)
514 514 nr = len(r)
515 515 n = min(nl, nr)
516 516 for i in range(n):
517 517 if i + 1 == nl and nl < nr:
518 518 return -1
519 519 elif i + 1 == nr and nl > nr:
520 520 return +1
521 521 elif l[i] < r[i]:
522 522 return -1
523 523 elif l[i] > r[i]:
524 524 return +1
525 525 return 0
526 526 def entitycompare(l, r):
527 527 return pathcompare(l.file, r.file)
528 528
529 529 c.entries.sort(entitycompare)
530 530
531 531 # Sort changesets by date
532 532
533 533 def cscmp(l, r):
534 534 d = sum(l.date) - sum(r.date)
535 535 if d:
536 536 return d
537 537
538 538 # detect vendor branches and initial commits on a branch
539 539 le = {}
540 540 for e in l.entries:
541 541 le[e.rcs] = e.revision
542 542 re = {}
543 543 for e in r.entries:
544 544 re[e.rcs] = e.revision
545 545
546 546 d = 0
547 547 for e in l.entries:
548 548 if re.get(e.rcs, None) == e.parent:
549 549 assert not d
550 550 d = 1
551 551 break
552 552
553 553 for e in r.entries:
554 554 if le.get(e.rcs, None) == e.parent:
555 555 assert not d
556 556 d = -1
557 557 break
558 558
559 559 return d
560 560
561 561 changesets.sort(cscmp)
562 562
563 563 # Collect tags
564 564
565 565 globaltags = {}
566 566 for c in changesets:
567 tags = {}
568 567 for e in c.entries:
569 568 for tag in e.tags:
570 569 # remember which is the latest changeset to have this tag
571 570 globaltags[tag] = c
572 571
573 572 for c in changesets:
574 tags = {}
573 tags = set()
575 574 for e in c.entries:
576 575 for tag in e.tags:
577 tags[tag] = True
576 tags.add(tag)
578 577 # remember tags only if this is the latest changeset to have it
579 c.tags = sorted([tag for tag in tags if globaltags[tag] is c])
578 c.tags = sorted(tag for tag in tags if globaltags[tag] is c)
580 579
581 580 # Find parent changesets, handle {{mergetobranch BRANCHNAME}}
582 581 # by inserting dummy changesets with two parents, and handle
583 582 # {{mergefrombranch BRANCHNAME}} by setting two parents.
584 583
585 584 if mergeto is None:
586 585 mergeto = r'{{mergetobranch ([-\w]+)}}'
587 586 if mergeto:
588 587 mergeto = re.compile(mergeto)
589 588
590 589 if mergefrom is None:
591 590 mergefrom = r'{{mergefrombranch ([-\w]+)}}'
592 591 if mergefrom:
593 592 mergefrom = re.compile(mergefrom)
594 593
595 594 versions = {} # changeset index where we saw any particular file version
596 595 branches = {} # changeset index where we saw a branch
597 596 n = len(changesets)
598 597 i = 0
599 598 while i<n:
600 599 c = changesets[i]
601 600
602 601 for f in c.entries:
603 602 versions[(f.rcs, f.revision)] = i
604 603
605 604 p = None
606 605 if c.branch in branches:
607 606 p = branches[c.branch]
608 607 else:
609 608 for f in c.entries:
610 609 p = max(p, versions.get((f.rcs, f.parent), None))
611 610
612 611 c.parents = []
613 612 if p is not None:
614 613 p = changesets[p]
615 614
616 615 # Ensure no changeset has a synthetic changeset as a parent.
617 616 while p.synthetic:
618 617 assert len(p.parents) <= 1, \
619 618 _('synthetic changeset cannot have multiple parents')
620 619 if p.parents:
621 620 p = p.parents[0]
622 621 else:
623 622 p = None
624 623 break
625 624
626 625 if p is not None:
627 626 c.parents.append(p)
628 627
629 628 if c.mergepoint:
630 629 if c.mergepoint == 'HEAD':
631 630 c.mergepoint = None
632 631 c.parents.append(changesets[branches[c.mergepoint]])
633 632
634 633 if mergefrom:
635 634 m = mergefrom.search(c.comment)
636 635 if m:
637 636 m = m.group(1)
638 637 if m == 'HEAD':
639 638 m = None
640 639 try:
641 640 candidate = changesets[branches[m]]
642 641 except KeyError:
643 642 ui.warn(_("warning: CVS commit message references "
644 643 "non-existent branch %r:\n%s\n")
645 644 % (m, c.comment))
646 645 if m in branches and c.branch != m and not candidate.synthetic:
647 646 c.parents.append(candidate)
648 647
649 648 if mergeto:
650 649 m = mergeto.search(c.comment)
651 650 if m:
652 651 try:
653 652 m = m.group(1)
654 653 if m == 'HEAD':
655 654 m = None
656 655 except:
657 656 m = None # if no group found then merge to HEAD
658 657 if m in branches and c.branch != m:
659 658 # insert empty changeset for merge
660 659 cc = changeset(author=c.author, branch=m, date=c.date,
661 660 comment='convert-repo: CVS merge from branch %s' % c.branch,
662 661 entries=[], tags=[], parents=[changesets[branches[m]], c])
663 662 changesets.insert(i + 1, cc)
664 663 branches[m] = i + 1
665 664
666 665 # adjust our loop counters now we have inserted a new entry
667 666 n += 1
668 667 i += 2
669 668 continue
670 669
671 670 branches[c.branch] = i
672 671 i += 1
673 672
674 673 # Drop synthetic changesets (safe now that we have ensured no other
675 674 # changesets can have them as parents).
676 675 i = 0
677 676 while i < len(changesets):
678 677 if changesets[i].synthetic:
679 678 del changesets[i]
680 679 else:
681 680 i += 1
682 681
683 682 # Number changesets
684 683
685 684 for i, c in enumerate(changesets):
686 685 c.id = i + 1
687 686
688 687 ui.status(_('%d changeset entries\n') % len(changesets))
689 688
690 689 return changesets
691 690
692 691
def debugcvsps(ui, *args, **opts):
    '''Read CVS rlog for current directory or named path in repository, and
    convert the log to changesets based on matching commit log entries and dates.'''

    # Map the mutually exclusive cache options onto createlog()'s cache mode.
    if opts["new_cache"]:
        cache = "write"
    elif opts["update_cache"]:
        cache = "update"
    else:
        cache = None

    revisions = opts["revisions"]

    try:
        if args:
            # Concatenate the logs of every named path.
            log = []
            for d in args:
                log += createlog(ui, d, root=opts["root"], cache=cache)
        else:
            log = createlog(ui, root=opts["root"], cache=cache)
    except logerror, e:
        ui.write("%r\n"%e)
        return

    changesets = createchangeset(ui, log, opts["fuzz"])
    # The raw log can be very large; release it before printing.
    del log

    # Print changesets (optionally filtered)

    # off is truthy until the start revision/tag (if any) has been seen.
    off = len(revisions)
    branches = {} # latest version number in each branch
    ancestors = {} # parent branch
    for cs in changesets:

        if opts["ancestors"]:
            # Record where each branch forked off its parent branch.
            if cs.branch not in branches and cs.parents and cs.parents[0].id:
                ancestors[cs.branch] = changesets[cs.parents[0].id-1].branch, cs.parents[0].id
            branches[cs.branch] = cs.id

        # limit by branches
        if opts["branches"] and (cs.branch or 'HEAD') not in opts["branches"]:
            continue

        if not off:
            # Note: trailing spaces on several lines here are needed to have
            # bug-for-bug compatibility with cvsps.
            ui.write('---------------------\n')
            ui.write('PatchSet %d \n' % cs.id)
            ui.write('Date: %s\n' % util.datestr(cs.date, '%Y/%m/%d %H:%M:%S %1%2'))
            ui.write('Author: %s\n' % cs.author)
            ui.write('Branch: %s\n' % (cs.branch or 'HEAD'))
            ui.write('Tag%s: %s \n' % (['', 's'][len(cs.tags)>1],
                                  ','.join(cs.tags) or '(none)'))
            if opts["parents"] and cs.parents:
                if len(cs.parents)>1:
                    ui.write('Parents: %s\n' % (','.join([str(p.id) for p in cs.parents])))
                else:
                    ui.write('Parent: %d\n' % cs.parents[0].id)

            if opts["ancestors"]:
                # Walk the ancestors map back to HEAD, printing each hop.
                b = cs.branch
                r = []
                while b:
                    b, c = ancestors[b]
                    r.append('%s:%d:%d' % (b or "HEAD", c, branches[b]))
                if r:
                    ui.write('Ancestors: %s\n' % (','.join(r)))

            ui.write('Log:\n')
            ui.write('%s\n\n' % cs.comment)
            ui.write('Members: \n')
            for f in cs.entries:
                fn = f.file
                if fn.startswith(opts["prefix"]):
                    fn = fn[len(opts["prefix"]):]
                ui.write('\t%s:%s->%s%s \n' % (fn, '.'.join([str(x) for x in f.parent]) or 'INITIAL',
                                          '.'.join([str(x) for x in f.revision]), ['', '(DEAD)'][f.dead]))
            ui.write('\n')

        # have we seen the start tag?
        if revisions and off:
            if revisions[0] == str(cs.id) or \
                revisions[0] in cs.tags:
                off = False

        # see if we reached the end tag
        if len(revisions)>1 and not off:
            if revisions[1] == str(cs.id) or \
                revisions[1] in cs.tags:
                break
@@ -1,152 +1,152
1 1 # git.py - git support for the convert extension
2 2 #
3 3 # Copyright 2005-2009 Matt Mackall <mpm@selenic.com> and others
4 4 #
5 5 # This software may be used and distributed according to the terms of the
6 6 # GNU General Public License version 2, incorporated herein by reference.
7 7
8 8 import os
9 9 from mercurial import util
10 10
11 11 from common import NoRepo, commit, converter_source, checktool
12 12
class convert_git(converter_source):
    # Source converter that reads history out of a git repository by
    # shelling out to the git command-line tools.
    #
    # Windows does not support GIT_DIR= construct while other systems
    # cannot remove environment variable. Just assume none have
    # both issues.
    if hasattr(os, 'unsetenv'):
        def gitcmd(self, s):
            # Run a git command with GIT_DIR pointing at our repo,
            # restoring the previous environment afterwards.
            prevgitdir = os.environ.get('GIT_DIR')
            os.environ['GIT_DIR'] = self.path
            try:
                return util.popen(s, 'rb')
            finally:
                if prevgitdir is None:
                    del os.environ['GIT_DIR']
                else:
                    os.environ['GIT_DIR'] = prevgitdir
    else:
        def gitcmd(self, s):
            # No unsetenv: pass GIT_DIR through the shell command line instead.
            return util.popen('GIT_DIR=%s %s' % (self.path, s), 'rb')

    def __init__(self, ui, path, rev=None):
        super(convert_git, self).__init__(ui, path, rev=rev)

        # Accept both a work tree (containing .git) and a bare repo path.
        if os.path.isdir(path + "/.git"):
            path += "/.git"
        if not os.path.exists(path + "/objects"):
            raise NoRepo("%s does not look like a Git repo" % path)

        checktool('git', 'git')

        self.path = path

    def getheads(self):
        # All branch/remote heads, or just the requested revision.
        if not self.rev:
            return self.gitcmd('git rev-parse --branches --remotes').read().splitlines()
        else:
            fh = self.gitcmd("git rev-parse --verify %s" % self.rev)
            return [fh.read()[:-1]]

    def catfile(self, rev, type):
        # The null hash marks a deleted file; signal that with IOError.
        if rev == "0" * 40: raise IOError()
        fh = self.gitcmd("git cat-file %s %s" % (type, rev))
        return fh.read()

    def getfile(self, name, rev):
        return self.catfile(rev, "blob")

    def getmode(self, name, rev):
        # modecache is populated by getchanges() for the same version.
        return self.modecache[(name, rev)]

    def getchanges(self, version):
        self.modecache = {}
        fh = self.gitcmd("git diff-tree -z --root -m -r %s" % version)
        changes = []
        seen = set()
        entry = None
        # diff-tree -z alternates metadata entries and filenames,
        # NUL-separated; pair them up as we go.
        for l in fh.read().split('\x00'):
            if not entry:
                if not l.startswith(':'):
                    continue
                entry = l
                continue
            f = l
            if f not in seen:
                seen.add(f)
                entry = entry.split()
                h = entry[3]
                # entry[1] is the destination mode: 100755 executable,
                # 120000 symlink.
                p = (entry[1] == "100755")
                s = (entry[1] == "120000")
                self.modecache[(f, h)] = (p and "x") or (s and "l") or ""
                changes.append((f, h))
            entry = None
        return (changes, {})

    def getcommit(self, version):
        c = self.catfile(version, "commit") # read the commit hash
        # Headers and message are separated by a blank line.
        end = c.find("\n\n")
        message = c[end+2:]
        message = self.recode(message)
        l = c[:end].splitlines()
        parents = []
        author = committer = None
        for e in l[1:]:
            n, v = e.split(" ", 1)
            if n == "author":
                p = v.split()
                tm, tz = p[-2:]
                author = " ".join(p[:-2])
                if author[0] == "<": author = author[1:-1]
                author = self.recode(author)
            if n == "committer":
                p = v.split()
                tm, tz = p[-2:]
                committer = " ".join(p[:-2])
                if committer[0] == "<": committer = committer[1:-1]
                committer = self.recode(committer)
            if n == "parent": parents.append(v)

        if committer and committer != author:
            message += "\ncommitter: %s\n" % committer
        # Convert git's +HHMM / -HHMM timezone into signed seconds.
        tzs, tzh, tzm = tz[-5:-4] + "1", tz[-4:-2], tz[-2:]
        tz = -int(tzs) * (int(tzh) * 3600 + int(tzm))
        date = tm + " " + str(tz)

        c = commit(parents=parents, date=date, author=author, desc=message,
                   rev=version)
        return c

    def gettags(self):
        tags = {}
        fh = self.gitcmd('git ls-remote --tags "%s"' % self.path)
        prefix = 'refs/tags/'
        for line in fh:
            line = line.strip()
            # Only dereferenced tag objects ("^{}" suffix) point at commits.
            if not line.endswith("^{}"):
                continue
            node, tag = line.split(None, 1)
            if not tag.startswith(prefix):
                continue
            tag = tag[len(prefix):-3]
            tags[tag] = node

        return tags

    def getchangedfiles(self, version, i):
        changes = []
        if i is None:
            # Files changed against the first parent.
            fh = self.gitcmd("git diff-tree --root -m -r %s" % version)
            for l in fh:
                if "\t" not in l:
                    continue
                m, f = l[:-1].split("\t")
                changes.append(f)
            fh.close()
        else:
            # Files changed against parent i+1 (merge parents).
            fh = self.gitcmd('git diff-tree --name-only --root -r %s "%s^%s" --'
                             % (version, version, i+1))
            changes = [f.rstrip('\n') for f in fh]
            fh.close()

        return changes
@@ -1,338 +1,338
1 1 # hg.py - hg backend for convert extension
2 2 #
3 3 # Copyright 2005-2009 Matt Mackall <mpm@selenic.com> and others
4 4 #
5 5 # This software may be used and distributed according to the terms of the
6 6 # GNU General Public License version 2, incorporated herein by reference.
7 7
8 8 # Notes for hg->hg conversion:
9 9 #
10 10 # * Old versions of Mercurial didn't trim the whitespace from the ends
11 11 # of commit messages, but new versions do. Changesets created by
12 12 # those older versions, then converted, may thus have different
13 13 # hashes for changesets that are otherwise identical.
14 14 #
15 15 # * By default, the source revision is stored in the converted
16 16 # revision. This will cause the converted revision to have a
17 17 # different identity than the source. To avoid this, use the
18 18 # following option: "--config convert.hg.saverev=false"
19 19
20 20
21 21 import os, time
22 22 from mercurial.i18n import _
23 23 from mercurial.node import bin, hex, nullid
24 24 from mercurial import hg, util, context, error
25 25
26 26 from common import NoRepo, commit, converter_source, converter_sink
27 27
28 28 class mercurial_sink(converter_sink):
29 29 def __init__(self, ui, path):
30 30 converter_sink.__init__(self, ui, path)
31 31 self.branchnames = ui.configbool('convert', 'hg.usebranchnames', True)
32 32 self.clonebranches = ui.configbool('convert', 'hg.clonebranches', False)
33 33 self.tagsbranch = ui.config('convert', 'hg.tagsbranch', 'default')
34 34 self.lastbranch = None
35 35 if os.path.isdir(path) and len(os.listdir(path)) > 0:
36 36 try:
37 37 self.repo = hg.repository(self.ui, path)
38 38 if not self.repo.local():
39 39 raise NoRepo(_('%s is not a local Mercurial repo') % path)
40 40 except error.RepoError, err:
41 41 ui.traceback()
42 42 raise NoRepo(err.args[0])
43 43 else:
44 44 try:
45 45 ui.status(_('initializing destination %s repository\n') % path)
46 46 self.repo = hg.repository(self.ui, path, create=True)
47 47 if not self.repo.local():
48 48 raise NoRepo(_('%s is not a local Mercurial repo') % path)
49 49 self.created.append(path)
50 50 except error.RepoError:
51 51 ui.traceback()
52 52 raise NoRepo("could not create hg repo %s as sink" % path)
53 53 self.lock = None
54 54 self.wlock = None
55 55 self.filemapmode = False
56 56
57 57 def before(self):
58 58 self.ui.debug(_('run hg sink pre-conversion action\n'))
59 59 self.wlock = self.repo.wlock()
60 60 self.lock = self.repo.lock()
61 61
62 62 def after(self):
63 63 self.ui.debug(_('run hg sink post-conversion action\n'))
64 64 self.lock.release()
65 65 self.wlock.release()
66 66
67 67 def revmapfile(self):
68 68 return os.path.join(self.path, ".hg", "shamap")
69 69
70 70 def authorfile(self):
71 71 return os.path.join(self.path, ".hg", "authormap")
72 72
73 73 def getheads(self):
74 74 h = self.repo.changelog.heads()
75 75 return [ hex(x) for x in h ]
76 76
77 77 def setbranch(self, branch, pbranches):
78 78 if not self.clonebranches:
79 79 return
80 80
81 81 setbranch = (branch != self.lastbranch)
82 82 self.lastbranch = branch
83 83 if not branch:
84 84 branch = 'default'
85 85 pbranches = [(b[0], b[1] and b[1] or 'default') for b in pbranches]
86 86 pbranch = pbranches and pbranches[0][1] or 'default'
87 87
88 88 branchpath = os.path.join(self.path, branch)
89 89 if setbranch:
90 90 self.after()
91 91 try:
92 92 self.repo = hg.repository(self.ui, branchpath)
93 93 except:
94 94 self.repo = hg.repository(self.ui, branchpath, create=True)
95 95 self.before()
96 96
97 97 # pbranches may bring revisions from other branches (merge parents)
98 98 # Make sure we have them, or pull them.
99 99 missings = {}
100 100 for b in pbranches:
101 101 try:
102 102 self.repo.lookup(b[0])
103 103 except:
104 104 missings.setdefault(b[1], []).append(b[0])
105 105
106 106 if missings:
107 107 self.after()
108 108 for pbranch, heads in missings.iteritems():
109 109 pbranchpath = os.path.join(self.path, pbranch)
110 110 prepo = hg.repository(self.ui, pbranchpath)
111 111 self.ui.note(_('pulling from %s into %s\n') % (pbranch, branch))
112 112 self.repo.pull(prepo, [prepo.lookup(h) for h in heads])
113 113 self.before()
114 114
115 115 def putcommit(self, files, copies, parents, commit, source):
116 116
117 117 files = dict(files)
118 118 def getfilectx(repo, memctx, f):
119 119 v = files[f]
120 120 data = source.getfile(f, v)
121 121 e = source.getmode(f, v)
122 122 return context.memfilectx(f, data, 'l' in e, 'x' in e, copies.get(f))
123 123
124 124 pl = []
125 125 for p in parents:
126 126 if p not in pl:
127 127 pl.append(p)
128 128 parents = pl
129 129 nparents = len(parents)
130 130 if self.filemapmode and nparents == 1:
131 131 m1node = self.repo.changelog.read(bin(parents[0]))[0]
132 132 parent = parents[0]
133 133
134 134 if len(parents) < 2: parents.append("0" * 40)
135 135 if len(parents) < 2: parents.append("0" * 40)
136 136 p2 = parents.pop(0)
137 137
138 138 text = commit.desc
139 139 extra = commit.extra.copy()
140 140 if self.branchnames and commit.branch:
141 141 extra['branch'] = commit.branch
142 142 if commit.rev:
143 143 extra['convert_revision'] = commit.rev
144 144
145 145 while parents:
146 146 p1 = p2
147 147 p2 = parents.pop(0)
148 148 ctx = context.memctx(self.repo, (p1, p2), text, files.keys(), getfilectx,
149 149 commit.author, commit.date, extra)
150 150 self.repo.commitctx(ctx)
151 151 text = "(octopus merge fixup)\n"
152 152 p2 = hex(self.repo.changelog.tip())
153 153
154 154 if self.filemapmode and nparents == 1:
155 155 man = self.repo.manifest
156 156 mnode = self.repo.changelog.read(bin(p2))[0]
157 157 if not man.cmp(m1node, man.revision(mnode)):
158 158 self.repo.rollback()
159 159 return parent
160 160 return p2
161 161
162 162 def puttags(self, tags):
163 163 try:
164 164 parentctx = self.repo[self.tagsbranch]
165 165 tagparent = parentctx.node()
166 166 except error.RepoError:
167 167 parentctx = None
168 168 tagparent = nullid
169 169
170 170 try:
171 171 oldlines = sorted(parentctx['.hgtags'].data().splitlines(1))
172 172 except:
173 173 oldlines = []
174 174
175 175 newlines = sorted([("%s %s\n" % (tags[tag], tag)) for tag in tags])
176 176 if newlines == oldlines:
177 177 return None
178 178 data = "".join(newlines)
179 179 def getfilectx(repo, memctx, f):
180 180 return context.memfilectx(f, data, False, False, None)
181 181
182 182 self.ui.status(_("updating tags\n"))
183 183 date = "%s 0" % int(time.mktime(time.gmtime()))
184 184 extra = {'branch': self.tagsbranch}
185 185 ctx = context.memctx(self.repo, (tagparent, None), "update tags",
186 186 [".hgtags"], getfilectx, "convert-repo", date,
187 187 extra)
188 188 self.repo.commitctx(ctx)
189 189 return hex(self.repo.changelog.tip())
190 190
191 191 def setfilemapmode(self, active):
192 192 self.filemapmode = active
193 193
194 194 class mercurial_source(converter_source):
195 195 def __init__(self, ui, path, rev=None):
196 196 converter_source.__init__(self, ui, path, rev)
197 197 self.ignoreerrors = ui.configbool('convert', 'hg.ignoreerrors', False)
198 self.ignored = {}
198 self.ignored = set()
199 199 self.saverev = ui.configbool('convert', 'hg.saverev', False)
200 200 try:
201 201 self.repo = hg.repository(self.ui, path)
202 202 # try to provoke an exception if this isn't really a hg
203 203 # repo, but some other bogus compatible-looking url
204 204 if not self.repo.local():
205 205 raise error.RepoError()
206 206 except error.RepoError:
207 207 ui.traceback()
208 208 raise NoRepo("%s is not a local Mercurial repo" % path)
209 209 self.lastrev = None
210 210 self.lastctx = None
211 211 self._changescache = None
212 212 self.convertfp = None
213 213 # Restrict converted revisions to startrev descendants
214 214 startnode = ui.config('convert', 'hg.startrev')
215 215 if startnode is not None:
216 216 try:
217 217 startnode = self.repo.lookup(startnode)
218 218 except error.RepoError:
219 219 raise util.Abort(_('%s is not a valid start revision')
220 220 % startnode)
221 221 startrev = self.repo.changelog.rev(startnode)
222 222 children = {startnode: 1}
223 223 for rev in self.repo.changelog.descendants(startrev):
224 224 children[self.repo.changelog.node(rev)] = 1
225 225 self.keep = children.__contains__
226 226 else:
227 227 self.keep = util.always
228 228
229 229 def changectx(self, rev):
230 230 if self.lastrev != rev:
231 231 self.lastctx = self.repo[rev]
232 232 self.lastrev = rev
233 233 return self.lastctx
234 234
235 235 def parents(self, ctx):
236 236 return [p.node() for p in ctx.parents()
237 237 if p and self.keep(p.node())]
238 238
239 239 def getheads(self):
240 240 if self.rev:
241 241 heads = [self.repo[self.rev].node()]
242 242 else:
243 243 heads = self.repo.heads()
244 244 return [hex(h) for h in heads if self.keep(h)]
245 245
246 246 def getfile(self, name, rev):
247 247 try:
248 248 return self.changectx(rev)[name].data()
249 249 except error.LookupError, err:
250 250 raise IOError(err)
251 251
252 252 def getmode(self, name, rev):
253 253 return self.changectx(rev).manifest().flags(name)
254 254
255 255 def getchanges(self, rev):
256 256 ctx = self.changectx(rev)
257 257 parents = self.parents(ctx)
258 258 if not parents:
259 259 files = sorted(ctx.manifest())
260 260 if self.ignoreerrors:
261 261 # calling getcopies() is a simple way to detect missing
262 262 # revlogs and populate self.ignored
263 263 self.getcopies(ctx, files)
264 264 return [(f, rev) for f in files if f not in self.ignored], {}
265 265 if self._changescache and self._changescache[0] == rev:
266 266 m, a, r = self._changescache[1]
267 267 else:
268 268 m, a, r = self.repo.status(parents[0], ctx.node())[:3]
269 269 # getcopies() detects missing revlogs early, run it before
270 270 # filtering the changes.
271 271 copies = self.getcopies(ctx, m + a)
272 272 changes = [(name, rev) for name in m + a + r
273 273 if name not in self.ignored]
274 274 return sorted(changes), copies
275 275
276 276 def getcopies(self, ctx, files):
277 277 copies = {}
278 278 for name in files:
279 279 if name in self.ignored:
280 280 continue
281 281 try:
282 282 copysource, copynode = ctx.filectx(name).renamed()
283 283 if copysource in self.ignored or not self.keep(copynode):
284 284 continue
285 285 copies[name] = copysource
286 286 except TypeError:
287 287 pass
288 288 except error.LookupError, e:
289 289 if not self.ignoreerrors:
290 290 raise
291 self.ignored[name] = 1
291 self.ignored.add(name)
292 292 self.ui.warn(_('ignoring: %s\n') % e)
293 293 return copies
294 294
295 295 def getcommit(self, rev):
296 296 ctx = self.changectx(rev)
297 297 parents = [hex(p) for p in self.parents(ctx)]
298 298 if self.saverev:
299 299 crev = rev
300 300 else:
301 301 crev = None
302 302 return commit(author=ctx.user(), date=util.datestr(ctx.date()),
303 303 desc=ctx.description(), rev=crev, parents=parents,
304 304 branch=ctx.branch(), extra=ctx.extra())
305 305
306 306 def gettags(self):
307 307 tags = [t for t in self.repo.tagslist() if t[0] != 'tip']
308 308 return dict([(name, hex(node)) for name, node in tags
309 309 if self.keep(node)])
310 310
311 311 def getchangedfiles(self, rev, i):
312 312 ctx = self.changectx(rev)
313 313 parents = self.parents(ctx)
314 314 if not parents and i is None:
315 315 i = 0
316 316 changes = [], ctx.manifest().keys(), []
317 317 else:
318 318 i = i or 0
319 319 changes = self.repo.status(parents[i], ctx.node())[:3]
320 320 changes = [[f for f in l if f not in self.ignored] for l in changes]
321 321
322 322 if i == 0:
323 323 self._changescache = (rev, changes)
324 324
325 325 return changes[0] + changes[1] + changes[2]
326 326
327 327 def converted(self, rev, destrev):
328 328 if self.convertfp is None:
329 329 self.convertfp = open(os.path.join(self.path, '.hg', 'shamap'),
330 330 'a')
331 331 self.convertfp.write('%s %s\n' % (destrev, rev))
332 332 self.convertfp.flush()
333 333
334 334 def before(self):
335 335 self.ui.debug(_('run hg source pre-conversion action\n'))
336 336
337 337 def after(self):
338 338 self.ui.debug(_('run hg source post-conversion action\n'))
General Comments 0
You need to be logged in to leave comments. Login now