upstream/mercurial-mirror Files · mercurial/repair.py

localrepo.commit: normalize commit message even for rawcommit....

localrepo.commit: normalize commit message even for rawcommit.

This normalization consists of:
- stripping trailing whitespace
- always using "\n" as the line separator

I think the main reason rawcommit was skipping this normalization was an attempt to preserve hashes during an hg->hg conversion. While this is a nice goal, it's not particularly interesting in practice. Since SHA-1 is so strong, the only safe way to do it is to have absolutely identical revisions. But:

- if the original revision was created with a recent version of hg, the commit message will be the same, with or without that normalization
- if it was created with an ancient version of hg that didn't do any normalization, even if the commit message is identical, the file list in the changelog is likely to be different (e.g. no removed files), and there were some old issues with e.g. extra file merging, which will end up changing the hash anyway
- in any case, if one *really* has to preserve hashes, it's easier (and faster) to fake a partial conversion using something like:

      hg clone -U -r rev orig-repo new-repo
      hg -R new-repo log --template '#node# #node#\n' > new-repo/.hg/shamap

Additionally, we've had some reports of problems arising from this lack of normalization - e.g. issue871, and a user who was wondering why hg export/hg import was not preserving hashes when there was nothing unusual going on (it was just import doing the normalization that had been skipped).

This also means that it's even more unlikely to get identical revisions when going $VCS->hg->$VCS.

Joel Rosdahl - - Load All Authors

File last commit:

r6211:f89fd07f default


                r6254:3667b6e4

default

Download file

             repair.py
        
                    136 lines
            
             | 4.6 KiB
            
                | text/x-python
            
             |
                PythonLexer
            
             / mercurial / repair.py
          
                    History
                
                 |
                  Annotation
                 | Raw
                 |Copy content
                 |Copy permalink

      # repair.py - functions for repository repair for mercurial

      #

      # Copyright 2005, 2006 Chris Mason <mason@suse.com>

      # Copyright 2007 Matt Mackall

      #

      # This software may be used and distributed according to the terms

      # of the GNU General Public License, incorporated herein by reference.

      import changegroup, os

      from node import nullrev, short

      def _bundle(repo, bases, heads, node, suffix, extranodes=None):
          """save the given revisions to a bundle file used as a backup

          The changegroup comes from repo.changegroupsubset(bases, heads,
          'strip', extranodes).  It is written to a file named
          "<short(node)>-<suffix>" inside the directory
          repo.join("strip-backup"), which is created when it does not exist
          yet.  Returns whatever changegroup.writebundle() returns.
          """
          group = repo.changegroupsubset(bases, heads, 'strip', extranodes)

          target_dir = repo.join("strip-backup")
          if not os.path.isdir(target_dir):
              os.mkdir(target_dir)

          bundle_name = "%s-%s" % (short(node), suffix)
          bundle_path = os.path.join(target_dir, bundle_name)
          repo.ui.warn("saving bundle to %s\n" % bundle_path)
          return changegroup.writebundle(group, bundle_path, "HG10BZ")

      def _collectfiles(repo, striprev):
          """list the files touched by striprev and every later revision

          Walks the changelog revisions from striprev up to
          repo.changelog.count() and gathers the names reported by
          repo.changectx(rev).files().  Each name appears once in the returned
          list, which is sorted.
          """
          # a dict stands in for a set: assigning an existing key is a no-op
          touched = {}
          for rev in xrange(striprev, repo.changelog.count()):
              for fname in repo.changectx(rev).files():
                  touched[fname] = 1

          names = touched.keys()
          names.sort()
          return names

      def _collectextranodes(repo, files, link):
          """find revlog entries that must be saved before stripping at link

          For the manifest and for the filelog of each name in files, look for
          entries that are stored after the first entry whose linkrev is
          >= link but whose own linkrev is < link.

          Returns a dict mapping the key 1 (for repo.manifest) or a file name
          to a non-empty list of (node, changelog node of its linkrev) pairs.
          Revlogs without such entries get no key at all.
          """
          changelog = repo.changelog

          def orphans(rlog):
              total = rlog.count()

              # locate the truncation point: one past the first entry that is
              # linked to a changelog revision >= link (or the end if none is)
              first_after = total
              for idx in xrange(total):
                  if rlog.linkrev(rlog.node(idx)) >= link:
                      first_after = idx + 1
                      break

              # anything stored past that point but linked to a revision
              # before link has to be saved by hand
              found = []
              for idx in xrange(first_after, total):
                  entry = rlog.node(idx)
                  linked = rlog.linkrev(entry)
                  if linked < link:
                      found.append((entry, changelog.node(linked)))
              return found

          result = {}

          manifest_extra = orphans(repo.manifest)
          if manifest_extra:
              # manifest entries are stored under the key 1
              result[1] = manifest_extra

          for fname in files:
              file_extra = orphans(repo.file(fname))
              if file_extra:
                  result[fname] = file_extra

          return result

      def strip(ui, repo, node, backup="all"):
          """strip node and its descendants from the repository

          Revisions numbered above node that do not descend from it are saved
          to a temporary bundle, the changelog, manifest and affected filelogs
          are truncated at node's revision through their strip() methods, and
          the saved bundle is then added back with repo.addchangegroup().

          ui     -- receives the "adding branch" status message
          repo   -- repository to operate on
          node   -- changelog node of the first revision to remove
          backup -- "all" also writes a 'backup' bundle covering node up to
                    the current heads before anything is stripped.  The
                    temporary bundle is deleted after it has been re-added
                    unless backup is "strip".
          """
          cl = repo.changelog
          # TODO delete the undo files, and handle undo of merge sets
          striprev = cl.rev(node)

          # Some revisions with rev > striprev may not be descendants of striprev.
          # We have to find these revisions and put them in a bundle, so that
          # we can restore them after the truncations.
          # To create the bundle we use repo.changegroupsubset which requires
          # the list of heads and bases of the set of interesting revisions.
          # (head = revision in the set that has no descendant in the set;
          #  base = revision in the set that has no ancestor in the set)
          tostrip = {striprev: 1}
          saveheads = {}
          savebases = []
          for r in xrange(striprev + 1, cl.count()):
              parents = cl.parentrevs(r)
              if parents[0] in tostrip or parents[1] in tostrip:
                  # r is a descendant of striprev
                  tostrip[r] = 1
                  # if this is a merge and one of the parents does not descend
                  # from striprev, mark that parent as a savehead.
                  if parents[1] != nullrev:
                      for p in parents:
                          if p not in tostrip and p > striprev:
                              saveheads[p] = 1
              else:
                  # if no parents of this revision will be stripped, mark it as
                  # a savebase
                  if parents[0] < striprev and parents[1] < striprev:
                      savebases.append(cl.node(r))

                  # r supersedes its parents as a head of the saved set
                  for p in parents:
                      if p in saveheads:
                          del saveheads[p]
                  saveheads[r] = 1

          saveheads = [cl.node(r) for r in saveheads]
          files = _collectfiles(repo, striprev)

          extranodes = _collectextranodes(repo, files, striprev)

          # create a changegroup for all the branches we need to keep
          if backup == "all":
              _bundle(repo, [node], cl.heads(), node, 'backup')
          if saveheads or extranodes:
              chgrpfile = _bundle(repo, savebases, saveheads, node, 'temp',
                                  extranodes)

          cl.strip(striprev)
          repo.manifest.strip(striprev)
          for name in files:
              f = repo.file(name)
              f.strip(striprev)

          if saveheads or extranodes:
              ui.status("adding branch\n")
              f = open(chgrpfile, "rb")
              try:
                  gen = changegroup.readbundle(f, chgrpfile)
                  repo.addchangegroup(gen, 'strip', 'bundle:' + chgrpfile, True)
              finally:
                  # release the file handle even if re-adding the bundle fails
                  f.close()
              # only reached on success, so a failed restore leaves the
              # temporary bundle on disk
              if backup != "strip":
                  os.unlink(chgrpfile)

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

				# repair.py - functions for repository repair for mercurial
				#
				# Copyright 2005, 2006 Chris Mason <mason@suse.com>
				# Copyright 2007 Matt Mackall
				#
				# This software may be used and distributed according to the terms
				# of the GNU General Public License, incorporated herein by reference.

				import changegroup, os
				from node import nullrev, short

				def _bundle(repo, bases, heads, node, suffix, extranodes=None):
				    """save the given revisions to a bundle file used as a backup

				    The changegroup comes from repo.changegroupsubset(bases, heads,
				    'strip', extranodes).  It is written to a file named
				    "<short(node)>-<suffix>" inside the directory
				    repo.join("strip-backup"), which is created when it does not exist
				    yet.  Returns whatever changegroup.writebundle() returns.
				    """
				    group = repo.changegroupsubset(bases, heads, 'strip', extranodes)

				    target_dir = repo.join("strip-backup")
				    if not os.path.isdir(target_dir):
				        os.mkdir(target_dir)

				    bundle_name = "%s-%s" % (short(node), suffix)
				    bundle_path = os.path.join(target_dir, bundle_name)
				    repo.ui.warn("saving bundle to %s\n" % bundle_path)
				    return changegroup.writebundle(group, bundle_path, "HG10BZ")

				def _collectfiles(repo, striprev):
				    """list the files touched by striprev and every later revision

				    Walks the changelog revisions from striprev up to
				    repo.changelog.count() and gathers the names reported by
				    repo.changectx(rev).files().  Each name appears once in the returned
				    list, which is sorted.
				    """
				    # a dict stands in for a set: assigning an existing key is a no-op
				    touched = {}
				    for rev in xrange(striprev, repo.changelog.count()):
				        for fname in repo.changectx(rev).files():
				            touched[fname] = 1

				    names = touched.keys()
				    names.sort()
				    return names

				def _collectextranodes(repo, files, link):
				    """find revlog entries that must be saved before stripping at link

				    For the manifest and for the filelog of each name in files, look for
				    entries that are stored after the first entry whose linkrev is
				    >= link but whose own linkrev is < link.

				    Returns a dict mapping the key 1 (for repo.manifest) or a file name
				    to a non-empty list of (node, changelog node of its linkrev) pairs.
				    Revlogs without such entries get no key at all.
				    """
				    changelog = repo.changelog

				    def orphans(rlog):
				        total = rlog.count()

				        # locate the truncation point: one past the first entry that is
				        # linked to a changelog revision >= link (or the end if none is)
				        first_after = total
				        for idx in xrange(total):
				            if rlog.linkrev(rlog.node(idx)) >= link:
				                first_after = idx + 1
				                break

				        # anything stored past that point but linked to a revision
				        # before link has to be saved by hand
				        found = []
				        for idx in xrange(first_after, total):
				            entry = rlog.node(idx)
				            linked = rlog.linkrev(entry)
				            if linked < link:
				                found.append((entry, changelog.node(linked)))
				        return found

				    result = {}

				    manifest_extra = orphans(repo.manifest)
				    if manifest_extra:
				        # manifest entries are stored under the key 1
				        result[1] = manifest_extra

				    for fname in files:
				        file_extra = orphans(repo.file(fname))
				        if file_extra:
				            result[fname] = file_extra

				    return result

				def strip(ui, repo, node, backup="all"):
				    """strip node and its descendants from the repository

				    Revisions numbered above node that do not descend from it are saved
				    to a temporary bundle, the changelog, manifest and affected filelogs
				    are truncated at node's revision through their strip() methods, and
				    the saved bundle is then added back with repo.addchangegroup().

				    ui     -- receives the "adding branch" status message
				    repo   -- repository to operate on
				    node   -- changelog node of the first revision to remove
				    backup -- "all" also writes a 'backup' bundle covering node up to
				              the current heads before anything is stripped.  The
				              temporary bundle is deleted after it has been re-added
				              unless backup is "strip".
				    """
				    cl = repo.changelog
				    # TODO delete the undo files, and handle undo of merge sets
				    striprev = cl.rev(node)

				    # Some revisions with rev > striprev may not be descendants of striprev.
				    # We have to find these revisions and put them in a bundle, so that
				    # we can restore them after the truncations.
				    # To create the bundle we use repo.changegroupsubset which requires
				    # the list of heads and bases of the set of interesting revisions.
				    # (head = revision in the set that has no descendant in the set;
				    #  base = revision in the set that has no ancestor in the set)
				    tostrip = {striprev: 1}
				    saveheads = {}
				    savebases = []
				    for r in xrange(striprev + 1, cl.count()):
				        parents = cl.parentrevs(r)
				        if parents[0] in tostrip or parents[1] in tostrip:
				            # r is a descendant of striprev
				            tostrip[r] = 1
				            # if this is a merge and one of the parents does not descend
				            # from striprev, mark that parent as a savehead.
				            if parents[1] != nullrev:
				                for p in parents:
				                    if p not in tostrip and p > striprev:
				                        saveheads[p] = 1
				        else:
				            # if no parents of this revision will be stripped, mark it as
				            # a savebase
				            if parents[0] < striprev and parents[1] < striprev:
				                savebases.append(cl.node(r))

				            # r supersedes its parents as a head of the saved set
				            for p in parents:
				                if p in saveheads:
				                    del saveheads[p]
				            saveheads[r] = 1

				    saveheads = [cl.node(r) for r in saveheads]
				    files = _collectfiles(repo, striprev)

				    extranodes = _collectextranodes(repo, files, striprev)

				    # create a changegroup for all the branches we need to keep
				    if backup == "all":
				        _bundle(repo, [node], cl.heads(), node, 'backup')
				    if saveheads or extranodes:
				        chgrpfile = _bundle(repo, savebases, saveheads, node, 'temp',
				                            extranodes)

				    cl.strip(striprev)
				    repo.manifest.strip(striprev)
				    for name in files:
				        f = repo.file(name)
				        f.strip(striprev)

				    if saveheads or extranodes:
				        ui.status("adding branch\n")
				        f = open(chgrpfile, "rb")
				        try:
				            gen = changegroup.readbundle(f, chgrpfile)
				            repo.addchangegroup(gen, 'strip', 'bundle:' + chgrpfile, True)
				        finally:
				            # release the file handle even if re-adding the bundle fails
				            f.close()
				        # only reached on success, so a failed restore leaves the
				        # temporary bundle on disk
				        if backup != "strip":
				            os.unlink(chgrpfile)