upstream/mercurial-mirror Files · mercurial/filelog.py

filelog: add hash-based comparisons...

filelog: add hash-based comparisons. For status, rather than reconstructing full file versions from the revlog for comparison, compare hashes.

Matt Mackall - - Load All Authors

File last commit:

r2887:05257fd2 default


                r2887:05257fd2

default

Download file

             filelog.py
        
                    128 lines
            
             | 3.9 KiB
            
                | text/x-python
            
             |
                PythonLexer
            
             / mercurial / filelog.py
          
                    History
                
                 |
                  Annotation
                 | Raw
                 |Copy content
                 |Copy permalink

      # filelog.py - file history class for mercurial

      #

      # Copyright 2005, 2006 Matt Mackall <mpm@selenic.com>

      #

      # This software may be used and distributed according to the terms

      # of the GNU General Public License, incorporated herein by reference.

      from revlog import *

      from demandload import *

      demandload(globals(), "bdiff os")

      class filelog(revlog):
          """File history class: the revlog holding the revisions of one file."""

          # A stored revision may start with a metadata header: the marker
          # '\1\n', zero or more "key: value" lines, and a closing '\1\n'.
          # add() writes that header, read() strips it, readmeta() parses it.

          def __init__(self, opener, path, defversion=REVLOG_DEFAULT_VERSION):
              """Set up the revlog files for path.

              The index and data file names are the encoded path plus ".i"
              and ".d", both under "data"; opener and defversion are passed
              to revlog.__init__ unchanged.
              """
              revlog.__init__(self, opener,
                              os.path.join("data", self.encodedir(path + ".i")),
                              os.path.join("data", self.encodedir(path + ".d")),
                              defversion)

          # This avoids a collision between a file named foo and a dir named
          # foo.i or foo.d
          def encodedir(self, path):
              """Return path with every ".hg/", ".i/" and ".d/" escaped."""
              # ".hg/" has to be handled first: the other two replacements
              # insert ".hg/" themselves and must not be escaped again.
              return (path
                      .replace(".hg/", ".hg.hg/")
                      .replace(".i/", ".i.hg/")
                      .replace(".d/", ".d.hg/"))

          def decodedir(self, path):
              """Undo encodedir(), applying the inverse replacements in
              reverse order."""
              return (path
                      .replace(".d.hg/", ".d/")
                      .replace(".i.hg/", ".i/")
                      .replace(".hg.hg/", ".hg/"))

          def read(self, node):
              """Return the text of revision node without its metadata header."""
              t = self.revision(node)
              if not t.startswith('\1\n'):
                  # no header, the stored text is the file contents
                  return t
              # look for the closing marker after the two-character opening one
              s = t.index('\1\n', 2)
              return t[s+2:]

          def readmeta(self, node):
              """Return the metadata header of revision node as a dict.

              The dict is empty when the revision has no header.  Each
              header line is split at the first ": " into key and value.
              """
              t = self.revision(node)
              if not t.startswith('\1\n'):
                  return {}
              s = t.index('\1\n', 2)
              mt = t[2:s]
              m = {}
              for l in mt.splitlines():
                  k, v = l.split(": ", 1)
                  m[k] = v
              return m

          def add(self, text, meta, transaction, link, p1=None, p2=None):
              """Store text as a new revision and return addrevision()'s result.

              A metadata header is written when meta is non-empty.  An empty
              header is also written when text itself starts with the marker,
              so that read() does not take the beginning of the contents for
              a header.
              """
              if meta or text.startswith('\1\n'):
                  mt = []
                  if meta:
                      mt = ["%s: %s\n" % (k, v) for k, v in meta.items()]
                  text = "\1\n%s\1\n%s" % ("".join(mt), text)
              return self.addrevision(text, transaction, link, p1, p2)

          def renamed(self, node):
              """Return the copy information recorded for node, or False.

              Only revisions whose first parent is nullid are examined.  For
              those, if the metadata has a "copy" entry, the result is the
              tuple (value of "copy", bin(value of "copyrev")).
              """
              if self.parents(node)[0] != nullid:
                  return False
              m = self.readmeta(node)
              if "copy" in m:
                  return (m["copy"], bin(m["copyrev"]))
              return False

          def cmp(self, node, text):
              """compare text with a given file revision

              Returns True if text differs from the contents of node and
              False if it is the same (makenode() relies on this)."""

              # for renames, we have to go the slow way
              # NOTE(review): presumably because the node of such a revision
              # was computed over the text including its metadata header, so
              # hashing the bare text would not match -- confirm in revlog.
              if self.renamed(node):
                  t2 = self.read(node)
                  # True means "different", same as the hash test below
                  return t2 != text

              p1, p2 = self.parents(node)
              h = hash(text, p1, p2)

              return h != node

          def makenode(self, node, text):
              """calculate a file nodeid for text, descended or possibly
              unchanged from node"""

              if self.cmp(node, text):
                  # text changed: hash it as a child of node
                  return hash(text, node, nullid)
              return node

          def annotate(self, node):
              """Return a list of (linkrev, line) pairs for revision node.

              Each line of the file is paired with the linkrev of the file
              revision it is attributed to; lines keep their line endings.
              """

              def decorate(text, rev):
                  # start by attributing every line of text to rev
                  return ([rev] * len(text.splitlines()), text)

              def pair(parent, child):
                  # for every block reported by bdiff.blocks (assumed to be
                  # matching line ranges a1:a2 in parent and b1:b2 in child),
                  # the child lines take over the parent's attribution
                  for a1, a2, b1, b2 in bdiff.blocks(parent[1], child[1]):
                      child[0][b1:b2] = parent[0][a1:a2]
                  return child

              # find all ancestors
              needed = {node:1}
              visit = [node]
              while visit:
                  # every node is expanded exactly once, so the order in
                  # which they are taken does not change the counts
                  n = visit.pop()
                  for p in self.parents(n):
                      if p not in needed:
                          needed[p] = 1
                          visit.append(p)
                      else:
                          # count how many times we'll use this
                          needed[p] += 1

              # sort by revision which is a topological order
              visit = [ (self.rev(n), n) for n in needed.keys() ]
              visit.sort()
              hist = {}

              for r,n in visit:
                  curr = decorate(self.read(n), self.linkrev(n))
                  for p in self.parents(n):
                      if p != nullid:
                          curr = pair(hist[p], curr)
                          # trim the history of unneeded revs
                          needed[p] -= 1
                          if not needed[p]:
                              del hist[p]
                  hist[n] = curr

              # n is the last entry of the sorted list, i.e. the highest
              # revision that was visited
              return zip(hist[n][0], hist[n][1].splitlines(1))

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

				# filelog.py - file history class for mercurial
				#
				# Copyright 2005, 2006 Matt Mackall <mpm@selenic.com>
				#
				# This software may be used and distributed according to the terms
				# of the GNU General Public License, incorporated herein by reference.

				from revlog import *
				from demandload import *
				demandload(globals(), "bdiff os")

				class filelog(revlog):
				    """File history class: the revlog holding the revisions of one file."""

				    # A stored revision may start with a metadata header: the marker
				    # '\1\n', zero or more "key: value" lines, and a closing '\1\n'.
				    # add() writes that header, read() strips it, readmeta() parses it.

				    def __init__(self, opener, path, defversion=REVLOG_DEFAULT_VERSION):
				        """Set up the revlog files for path.

				        The index and data file names are the encoded path plus ".i"
				        and ".d", both under "data"; opener and defversion are passed
				        to revlog.__init__ unchanged.
				        """
				        revlog.__init__(self, opener,
				                        os.path.join("data", self.encodedir(path + ".i")),
				                        os.path.join("data", self.encodedir(path + ".d")),
				                        defversion)

				    # This avoids a collision between a file named foo and a dir named
				    # foo.i or foo.d
				    def encodedir(self, path):
				        """Return path with every ".hg/", ".i/" and ".d/" escaped."""
				        # ".hg/" has to be handled first: the other two replacements
				        # insert ".hg/" themselves and must not be escaped again.
				        return (path
				                .replace(".hg/", ".hg.hg/")
				                .replace(".i/", ".i.hg/")
				                .replace(".d/", ".d.hg/"))

				    def decodedir(self, path):
				        """Undo encodedir(), applying the inverse replacements in
				        reverse order."""
				        return (path
				                .replace(".d.hg/", ".d/")
				                .replace(".i.hg/", ".i/")
				                .replace(".hg.hg/", ".hg/"))

				    def read(self, node):
				        """Return the text of revision node without its metadata header."""
				        t = self.revision(node)
				        if not t.startswith('\1\n'):
				            # no header, the stored text is the file contents
				            return t
				        # look for the closing marker after the two-character opening one
				        s = t.index('\1\n', 2)
				        return t[s+2:]

				    def readmeta(self, node):
				        """Return the metadata header of revision node as a dict.

				        The dict is empty when the revision has no header.  Each
				        header line is split at the first ": " into key and value.
				        """
				        t = self.revision(node)
				        if not t.startswith('\1\n'):
				            return {}
				        s = t.index('\1\n', 2)
				        mt = t[2:s]
				        m = {}
				        for l in mt.splitlines():
				            k, v = l.split(": ", 1)
				            m[k] = v
				        return m

				    def add(self, text, meta, transaction, link, p1=None, p2=None):
				        """Store text as a new revision and return addrevision()'s result.

				        A metadata header is written when meta is non-empty.  An empty
				        header is also written when text itself starts with the marker,
				        so that read() does not take the beginning of the contents for
				        a header.
				        """
				        if meta or text.startswith('\1\n'):
				            mt = []
				            if meta:
				                mt = ["%s: %s\n" % (k, v) for k, v in meta.items()]
				            text = "\1\n%s\1\n%s" % ("".join(mt), text)
				        return self.addrevision(text, transaction, link, p1, p2)

				    def renamed(self, node):
				        """Return the copy information recorded for node, or False.

				        Only revisions whose first parent is nullid are examined.  For
				        those, if the metadata has a "copy" entry, the result is the
				        tuple (value of "copy", bin(value of "copyrev")).
				        """
				        if self.parents(node)[0] != nullid:
				            return False
				        m = self.readmeta(node)
				        if "copy" in m:
				            return (m["copy"], bin(m["copyrev"]))
				        return False

				    def cmp(self, node, text):
				        """compare text with a given file revision

				        Returns True if text differs from the contents of node and
				        False if it is the same (makenode() relies on this)."""

				        # for renames, we have to go the slow way
				        # NOTE(review): presumably because the node of such a revision
				        # was computed over the text including its metadata header, so
				        # hashing the bare text would not match -- confirm in revlog.
				        if self.renamed(node):
				            t2 = self.read(node)
				            # True means "different", same as the hash test below
				            return t2 != text

				        p1, p2 = self.parents(node)
				        h = hash(text, p1, p2)

				        return h != node

				    def makenode(self, node, text):
				        """calculate a file nodeid for text, descended or possibly
				        unchanged from node"""

				        if self.cmp(node, text):
				            # text changed: hash it as a child of node
				            return hash(text, node, nullid)
				        return node

				    def annotate(self, node):
				        """Return a list of (linkrev, line) pairs for revision node.

				        Each line of the file is paired with the linkrev of the file
				        revision it is attributed to; lines keep their line endings.
				        """

				        def decorate(text, rev):
				            # start by attributing every line of text to rev
				            return ([rev] * len(text.splitlines()), text)

				        def pair(parent, child):
				            # for every block reported by bdiff.blocks (assumed to be
				            # matching line ranges a1:a2 in parent and b1:b2 in child),
				            # the child lines take over the parent's attribution
				            for a1, a2, b1, b2 in bdiff.blocks(parent[1], child[1]):
				                child[0][b1:b2] = parent[0][a1:a2]
				            return child

				        # find all ancestors
				        needed = {node:1}
				        visit = [node]
				        while visit:
				            # every node is expanded exactly once, so the order in
				            # which they are taken does not change the counts
				            n = visit.pop()
				            for p in self.parents(n):
				                if p not in needed:
				                    needed[p] = 1
				                    visit.append(p)
				                else:
				                    # count how many times we'll use this
				                    needed[p] += 1

				        # sort by revision which is a topological order
				        visit = [ (self.rev(n), n) for n in needed.keys() ]
				        visit.sort()
				        hist = {}

				        for r,n in visit:
				            curr = decorate(self.read(n), self.linkrev(n))
				            for p in self.parents(n):
				                if p != nullid:
				                    curr = pair(hist[p], curr)
				                    # trim the history of unneeded revs
				                    needed[p] -= 1
				                    if not needed[p]:
				                        del hist[p]
				            hist[n] = curr

				        # n is the last entry of the sorted list, i.e. the highest
				        # revision that was visited
				        return zip(hist[n][0], hist[n][1].splitlines(1))