upstream/mercurial-mirror Commit - r22788:160efd22

1

# manifest.py - manifest revision class for mercurial

1

# manifest.py - manifest revision class for mercurial

2

#

2

#

3

4

#

4

#

5

# This software may be used and distributed according to the terms of the

5

# This software may be used and distributed according to the terms of the

6

# GNU General Public License version 2 or any later version.

6

# GNU General Public License version 2 or any later version.

7

8

from i18n import _

8

from i18n import _

9

import mdiff, parsers, error, revlog, util, dicthelpers

9

import mdiff, parsers, error, revlog, util, dicthelpers

10

import array, struct

10

import array, struct

11

12

class manifestdict(dict):

12

class manifestdict(dict):

13

def __init__(self, mapping=None, flags=None):

13

def __init__(self, mapping=None, flags=None):

14

if mapping is None:

14

if mapping is None:

15

mapping = {}

15

mapping = {}

16

if flags is None:

16

if flags is None:

17

flags = {}

17

flags = {}

18

dict.__init__(self, mapping)

18

dict.__init__(self, mapping)

19

self._flags = flags

19

self._flags = flags

20

def flags(self, f):

20

def flags(self, f):

21

return self._flags.get(f, "")

21

return self._flags.get(f, "")

22

def withflags(self):

22

def withflags(self):

23

return set(self._flags.keys())

23

return set(self._flags.keys())

24

def set(self, f, flags):

24

def set(self, f, flags):

25

self._flags[f] = flags

25

self._flags[f] = flags

26

def copy(self):

26

def copy(self):

27

return manifestdict(self, dict.copy(self._flags))

27

return manifestdict(self, dict.copy(self._flags))

28

def intersectfiles(self, files):

28

def intersectfiles(self, files):

29

'''make a new manifestdict with the intersection of self with files

29

'''make a new manifestdict with the intersection of self with files

30

31

The algorithm assumes that files is much smaller than self.'''

31

The algorithm assumes that files is much smaller than self.'''

32

ret = manifestdict()

32

ret = manifestdict()

33

for fn in files:

33

for fn in files:

34

if fn in self:

34

if fn in self:

35

ret[fn] = self[fn]

35

ret[fn] = self[fn]

36

flags = self._flags.get(fn, None)

36

flags = self._flags.get(fn, None)

37

if flags:

37

if flags:

38

ret._flags[fn] = flags

38

ret._flags[fn] = flags

39

return ret

39

return ret

40

def flagsdiff(self, d2):

40

def flagsdiff(self, d2):

41

return dicthelpers.diff(self._flags, d2._flags, "")

41

return dicthelpers.diff(self._flags, d2._flags, "")

42

43

44

def _checkforbidden(l):

44

def _checkforbidden(l):

45

"""Check filenames for illegal characters."""

45

"""Check filenames for illegal characters."""

46

for f in l:

46

for f in l:

47

if '\n' in f or '\r' in f:

47

if '\n' in f or '\r' in f:

48

raise error.RevlogError(

48

raise error.RevlogError(

49

_("'\\n' and '\\r' disallowed in filenames: %r") % f)

49

_("'\\n' and '\\r' disallowed in filenames: %r") % f)

50

51

52

# apply the changes collected during the bisect loop to our addlist

52

# apply the changes collected during the bisect loop to our addlist

53

# return a delta suitable for addrevision

53

# return a delta suitable for addrevision

54

def _addlistdelta(addlist, x):

54

def _addlistdelta(addlist, x):

55

# for large addlist arrays, building a new array is cheaper

55

# for large addlist arrays, building a new array is cheaper

56

# than repeatedly modifying the existing one

56

# than repeatedly modifying the existing one

57

currentposition = 0

57

currentposition = 0

58

newaddlist = array.array('c')

58

newaddlist = array.array('c')

59

60

for start, end, content in x:

60

for start, end, content in x:

61

newaddlist += addlist[currentposition:start]

61

newaddlist += addlist[currentposition:start]

62

if content:

62

if content:

63

newaddlist += array.array('c', content)

63

newaddlist += array.array('c', content)

64

65

currentposition = end

65

currentposition = end

66

67

newaddlist += addlist[currentposition:]

67

newaddlist += addlist[currentposition:]

68

69

deltatext = "".join(struct.pack(">lll", start, end, len(content))

69

deltatext = "".join(struct.pack(">lll", start, end, len(content))

70

+ content for start, end, content in x)

70

+ content for start, end, content in x)

71

return deltatext, newaddlist

71

return deltatext, newaddlist

72

73

def _parse(lines):

73

def _parse(lines):

74

mfdict = manifestdict()

74

mfdict = manifestdict()

75

parsers.parse_manifest(mfdict, mfdict._flags, lines)

75

parsers.parse_manifest(mfdict, mfdict._flags, lines)

76

return mfdict

76

return mfdict

77

78

class manifest(revlog.revlog):

78

class manifest(revlog.revlog):

79

def __init__(self, opener):

79

def __init__(self, opener):

80

# we expect to deal with not more than four revs at a time,

80

# we expect to deal with not more than four revs at a time,

81

# during a commit --amend

81

# during a commit --amend

82

self._mancache = util.lrucachedict(4)

82

self._mancache = util.lrucachedict(4)

83

revlog.revlog.__init__(self, opener, "00manifest.i")

83

revlog.revlog.__init__(self, opener, "00manifest.i")

84

85

def readdelta(self, node):

85

def readdelta(self, node):

86

r = self.rev(node)

86

r = self.rev(node)

87

return _parse(mdiff.patchtext(self.revdiff(self.deltaparent(r), r)))

87

return _parse(mdiff.patchtext(self.revdiff(self.deltaparent(r), r)))

88

89

def readfast(self, node):

89

def readfast(self, node):

90

'''use the faster of readdelta or read'''

90

'''use the faster of readdelta or read'''

91

r = self.rev(node)

91

r = self.rev(node)

92

deltaparent = self.deltaparent(r)

92

deltaparent = self.deltaparent(r)

93

if deltaparent != revlog.nullrev and deltaparent in self.parentrevs(r):

93

if deltaparent != revlog.nullrev and deltaparent in self.parentrevs(r):

94

return self.readdelta(node)

94

return self.readdelta(node)

95

return self.read(node)

95

return self.read(node)

96

97

def read(self, node):

97

def read(self, node):

98

if node == revlog.nullid:

98

if node == revlog.nullid:

99

return manifestdict() # don't upset local cache

99

return manifestdict() # don't upset local cache

100

if node in self._mancache:

100

if node in self._mancache:

101

return self._mancache[node][0]

101

return self._mancache[node][0]

102

text = self.revision(node)

102

text = self.revision(node)

103

arraytext = array.array('c', text)

103

arraytext = array.array('c', text)

104

mapping = _parse(text)

104

mapping = _parse(text)

105

self._mancache[node] = (mapping, arraytext)

105

self._mancache[node] = (mapping, arraytext)

106

return mapping

106

return mapping

107

108

def _search(self, m, s, lo=0, hi=None):

108

def _search(self, m, s, lo=0, hi=None):

109

'''return a tuple (start, end) that says where to find s within m.

109

'''return a tuple (start, end) that says where to find s within m.

110

111

If the string is found m[start:end] are the line containing

111

If the string is found m[start:end] are the line containing

112

that string. If start == end the string was not found and

112

that string. If start == end the string was not found and

113

they indicate the proper sorted insertion point.

113

they indicate the proper sorted insertion point.

114

115

m should be a buffer or a string

115

m should be a buffer or a string

116

s is a string'''

116

s is a string'''

117

def advance(i, c):

117

def advance(i, c):

118

while i < lenm and m[i] != c:

118

while i < lenm and m[i] != c:

119

i += 1

119

i += 1

120

return i

120

return i

121

if not s:

121

if not s:

122

return (lo, lo)

122

return (lo, lo)

123

lenm = len(m)

123

lenm = len(m)

124

if not hi:

124

if not hi:

125

hi = lenm

125

hi = lenm

126

while lo < hi:

126

while lo < hi:

127

mid = (lo + hi) // 2

127

mid = (lo + hi) // 2

128

start = mid

128

start = mid

129

while start > 0 and m[start - 1] != '\n':

129

while start > 0 and m[start - 1] != '\n':

130

start -= 1

130

start -= 1

131

end = advance(start, '\0')

131

end = advance(start, '\0')

132

if m[start:end] < s:

132

if m[start:end] < s:

133

# we know that after the null there are 40 bytes of sha1

133

# we know that after the null there are 40 bytes of sha1

134

# this translates to the bisect lo = mid + 1

134

# this translates to the bisect lo = mid + 1

135

lo = advance(end + 40, '\n') + 1

135

lo = advance(end + 40, '\n') + 1

136

else:

136

else:

137

# this translates to the bisect hi = mid

137

# this translates to the bisect hi = mid

138

hi = start

138

hi = start

139

end = advance(lo, '\0')

139

end = advance(lo, '\0')

140

found = m[lo:end]

140

found = m[lo:end]

141

if s == found:

141

if s == found:

142

# we know that after the null there are 40 bytes of sha1

142

# we know that after the null there are 40 bytes of sha1

143

end = advance(end + 40, '\n')

143

end = advance(end + 40, '\n')

144

return (lo, end + 1)

144

return (lo, end + 1)

145

else:

145

else:

146

return (lo, lo)

146

return (lo, lo)

147

148

def find(self, node, f):

148

def find(self, node, f):

149

'''look up entry for a single file efficiently.

149

'''look up entry for a single file efficiently.

150

return (node, flags) pair if found, (None, None) if not.'''

150

return (node, flags) pair if found, (None, None) if not.'''

151

if node in self._mancache:

151

if node in self._mancache:

152

mapping = self._mancache[node][0]

152

mapping = self._mancache[node][0]

153

return mapping.get(f), mapping.flags(f)

153

return mapping.get(f), mapping.flags(f)

154

text = self.revision(node)

154

text = self.revision(node)

155

start, end = self._search(text, f)

155

start, end = self._search(text, f)

156

if start == end:

156

if start == end:

157

return None, None

157

return None, None

158

l = text[start:end]

158

l = text[start:end]

159

f, n = l.split('\0')

159

f, n = l.split('\0')

160

return revlog.bin(n[:40]), n[40:-1]

160

return revlog.bin(n[:40]), n[40:-1]

161

162

def add(self, map, transaction, link, p1, p2, added, removed):

162

def add(self, map, transaction, link, p1, p2, added, removed):

163

# if we're using the cache, make sure it is valid and

163

if p1 in self._mancache:

164

# parented by the same node we're diffing against

164

# If our first parent is in the manifest cache, we can

165

if not (p1 and (p1 in self._mancache)):

165

# compute a delta here using properties we know about the

166

files = sorted(map)

166

# manifest up-front, which may save time later for the

167

_checkforbidden(files)

167

# revlog layer.

168

169

# if this is changed to support newlines in filenames,

170

# be sure to check the templates/ dir again (especially *-raw.tmpl)

171

hex, flags = revlog.hex, map.flags

172

text = ''.join("%s\0%s%s\n" % (f, hex(map[f]), flags(f))

173

for f in files)

174

arraytext = array.array('c', text)

175

cachedelta = None

176

else:

177

addlist = self._mancache[p1][1]

168

addlist = self._mancache[p1][1]

178

169

179

_checkforbidden(added)

170

_checkforbidden(added)

180

# combine the changed lists into one list for sorting

171

# combine the changed lists into one list for sorting

181

work = [(x, False) for x in added]

172

work = [(x, False) for x in added]

182

work.extend((x, True) for x in removed)

173

work.extend((x, True) for x in removed)

183

# this could use heapq.merge() (from Python 2.6+) or equivalent

174

# this could use heapq.merge() (from Python 2.6+) or equivalent

184

# since the lists are already sorted

175

# since the lists are already sorted

185

work.sort()

176

work.sort()

186

177

187

delta = []

178

delta = []

188

dstart = None

179

dstart = None

189

dend = None

180

dend = None

190

dline = [""]

181

dline = [""]

191

start = 0

182

start = 0

192

# zero copy representation of addlist as a buffer

183

# zero copy representation of addlist as a buffer

193

addbuf = util.buffer(addlist)

184

addbuf = util.buffer(addlist)

194

185

195

# start with a readonly loop that finds the offset of

186

# start with a readonly loop that finds the offset of

196

# each line and creates the deltas

187

# each line and creates the deltas

197

for f, todelete in work:

188

for f, todelete in work:

198

# bs will either be the index of the item or the insert point

189

# bs will either be the index of the item or the insert point

199

start, end = self._search(addbuf, f, start)

190

start, end = self._search(addbuf, f, start)

200

if not todelete:

191

if not todelete:

201

l = "%s\0%s%s\n" % (f, revlog.hex(map[f]), map.flags(f))

192

l = "%s\0%s%s\n" % (f, revlog.hex(map[f]), map.flags(f))

202

else:

193

else:

203

if start == end:

194

if start == end:

204

# item we want to delete was not found, error out

195

# item we want to delete was not found, error out

205

raise AssertionError(

196

raise AssertionError(

206

_("failed to remove %s from manifest") % f)

197

_("failed to remove %s from manifest") % f)

207

l = ""

198

l = ""

208

if dstart is not None and dstart <= start and dend >= start:

199

if dstart is not None and dstart <= start and dend >= start:

209

if dend < end:

200

if dend < end:

210

dend = end

201

dend = end

211

if l:

202

if l:

212

dline.append(l)

203

dline.append(l)

213

else:

204

else:

214

if dstart is not None:

205

if dstart is not None:

215

delta.append([dstart, dend, "".join(dline)])

206

delta.append([dstart, dend, "".join(dline)])

216

dstart = start

207

dstart = start

217

dend = end

208

dend = end

218

dline = [l]

209

dline = [l]

219

210

220

if dstart is not None:

211

if dstart is not None:

221

delta.append([dstart, dend, "".join(dline)])

212

delta.append([dstart, dend, "".join(dline)])

222

# apply the delta to the addlist, and get a delta for addrevision

213

# apply the delta to the addlist, and get a delta for addrevision

223

deltatext, addlist = _addlistdelta(addlist, delta)

214

deltatext, addlist = _addlistdelta(addlist, delta)

224

cachedelta = (self.rev(p1), deltatext)

215

cachedelta = (self.rev(p1), deltatext)

225

arraytext = addlist

216

arraytext = addlist

226

text = util.buffer(arraytext)

217

text = util.buffer(arraytext)

218

else:

219

# The first parent manifest isn't already loaded, so we'll

220

# just encode a fulltext of the manifest and pass that

221

# through to the revlog layer, and let it handle the delta

222

# process.

223

files = sorted(map)

224

_checkforbidden(files)

225

226

# if this is changed to support newlines in filenames,

227

# be sure to check the templates/ dir again (especially *-raw.tmpl)

228

hex, flags = revlog.hex, map.flags

229

text = ''.join("%s\0%s%s\n" % (f, hex(map[f]), flags(f))

230

for f in files)

231

arraytext = array.array('c', text)

232

cachedelta = None

227

233

228

n = self.addrevision(text, transaction, link, p1, p2, cachedelta)

234

n = self.addrevision(text, transaction, link, p1, p2, cachedelta)

229

self._mancache[n] = (map, arraytext)

235

self._mancache[n] = (map, arraytext)

230

236

231

return n

237

return n

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

             # manifest.py - manifest revision class for mercurial
             #
             # Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
             #
             # This software may be used and distributed according to the terms of the
             # GNU General Public License version 2 or any later version.
             from i18n import _
             import mdiff, parsers, error, revlog, util, dicthelpers
             import array, struct
             class manifestdict(dict):
                 '''dict of manifest entries with a side table of per-file flags

                 The dict part holds whatever ``mapping`` provides, keyed by file
                 name; ``_flags`` maps file names to their flag string.'''

                 def __init__(self, mapping=None, flags=None):
                     # None stands for "start empty"; a flags dict supplied by the
                     # caller is stored as-is, not copied
                     dict.__init__(self, {} if mapping is None else mapping)
                     self._flags = {} if flags is None else flags

                 def flags(self, f):
                     '''return the flags recorded for f, or "" if there are none'''
                     return self._flags.get(f, "")

                 def withflags(self):
                     '''return the set of file names present in the flags table'''
                     return set(self._flags)

                 def set(self, f, flags):
                     '''record flags for f (the entry table itself is not touched)'''
                     self._flags[f] = flags

                 def copy(self):
                     '''return a new manifestdict with its own entry and flags tables'''
                     flagscopy = dict.copy(self._flags)
                     return manifestdict(self, flagscopy)

                 def intersectfiles(self, files):
                     '''make a new manifestdict holding only the names from files
                     that are present in self

                     The algorithm assumes that files is much smaller than self.'''
                     subset = manifestdict()
                     for name in files:
                         if name not in self:
                             continue
                         subset[name] = self[name]
                         # only non-empty flags are carried over
                         fileflags = self._flags.get(name, None)
                         if fileflags:
                             subset._flags[name] = fileflags
                     return subset

                 def flagsdiff(self, d2):
                     '''return dicthelpers.diff() of the two flags tables, passing ""
                     as its third argument'''
                     return dicthelpers.diff(self._flags, d2._flags, "")
             def _checkforbidden(l):
                 """Check filenames for illegal characters."""
                 for f in l:
                     if '\n' in f or '\r' in f:
                         raise error.RevlogError(
                             _("'\\n' and '\\r' disallowed in filenames: %r") % f)
             # apply the changes collected during the bisect loop to our addlist
             # return a delta suitable for addrevision
             def _addlistdelta(addlist, x):
                 """Apply the edits in ``x`` to ``addlist`` and encode them as a delta.

                 ``x`` is iterated twice and yields (start, end, content) triples;
                 each one replaces addlist[start:end] with content.  The triples
                 are presumably in ascending, non-overlapping order (TODO confirm):
                 the copy below only ever walks forward from one ``end`` to the
                 next ``start``.

                 Returns (deltatext, newaddlist): for every triple a ">lll" packed
                 (start, end, len(content)) header followed by content, all joined
                 together, and a new 'c' array holding the edited text.
                 """
                 # for large arrays, assembling a fresh array is cheaper than
                 # editing the existing one in place over and over
                 rebuilt = array.array('c')
                 cursor = 0
                 for start, end, content in x:
                     # untouched bytes between the previous edit and this one
                     rebuilt += addlist[cursor:start]
                     if content:
                         rebuilt += array.array('c', content)
                     cursor = end
                 # whatever follows the last edit is carried over unchanged
                 rebuilt += addlist[cursor:]

                 pack = struct.pack
                 hunks = []
                 for start, end, content in x:
                     hunks.append(pack(">lll", start, end, len(content)) + content)
                 return "".join(hunks), rebuilt
             def _parse(lines):
                 """Return a new manifestdict filled in by parsers.parse_manifest.

                 The parser is handed the dict itself and its ``_flags`` table along
                 with ``lines``, and populates both in place.
                 """
                 parsed = manifestdict()
                 flagtable = parsed._flags
                 parsers.parse_manifest(parsed, flagtable, lines)
                 return parsed
             class manifest(revlog.revlog):
                 def __init__(self, opener):
                     '''set up the node cache and initialise the underlying revlog

                     opener is passed straight to revlog.revlog.__init__ together
                     with the index file name "00manifest.i".'''
                     # we expect to deal with not more than four revs at a time,
                     # during a commit --amend
                     # (cache values are (manifestdict, array text) pairs keyed by
                     # node, as stored by read() and add())
                     self._mancache = util.lrucachedict(4)
                     revlog.revlog.__init__(self, opener, "00manifest.i")
                 def readdelta(self, node):
                     '''parse the delta stored for node instead of its full text

                     The revdiff between node's delta parent and node is converted
                     with mdiff.patchtext and parsed into a manifestdict.  NOTE:
                     presumably this yields only the entries the delta introduces --
                     confirm against mdiff.patchtext.'''
                     rev = self.rev(node)
                     base = self.deltaparent(rev)
                     patch = self.revdiff(base, rev)
                     return _parse(mdiff.patchtext(patch))
                 def readfast(self, node):
                     '''use the faster of readdelta or read

                     readdelta is picked only when the delta parent is a real
                     revision (not nullrev) that is also one of the revision's
                     parents; in every other case the full manifest is read.'''
                     rev = self.rev(node)
                     base = self.deltaparent(rev)
                     if base == revlog.nullrev or base not in self.parentrevs(rev):
                         return self.read(node)
                     return self.readdelta(node)
                 def read(self, node):
                     '''return the manifestdict for node, caching the parsed result

                     The cache entry stores the parsed mapping together with the
                     raw text as a 'c' array.'''
                     if node == revlog.nullid:
                         # empty manifest for the null node; deliberately kept out
                         # of the local cache
                         return manifestdict()
                     if node in self._mancache:
                         cached = self._mancache[node]
                         return cached[0]
                     fulltext = self.revision(node)
                     rawarray = array.array('c', fulltext)
                     parsed = _parse(fulltext)
                     self._mancache[node] = (parsed, rawarray)
                     return parsed
                 def _search(self, m, s, lo=0, hi=None):
                     '''return a tuple (start, end) that says where to find s within m.
                     If the string is found m[start:end] are the line containing
                     that string.  If start == end the string was not found and
                     they indicate the proper sorted insertion point.
                     m should be a buffer or a string
                     s is a string'''
                     def advance(i, c):
                         while i < lenm and m[i] != c:
                             i += 1
                         return i
                     if not s:
                         return (lo, lo)
                     lenm = len(m)
                     if not hi:
                         hi = lenm
                     while lo < hi:
                         mid = (lo + hi) // 2
                         start = mid
                         while start > 0 and m[start - 1] != '\n':
                             start -= 1
                         end = advance(start, '\0')
                         if m[start:end] < s:
                             # we know that after the null there are 40 bytes of sha1
                             # this translates to the bisect lo = mid + 1
                             lo = advance(end + 40, '\n') + 1
                         else:
                             # this translates to the bisect hi = mid
                             hi = start
                     end = advance(lo, '\0')
                     found = m[lo:end]
                     if s == found:
                         # we know that after the null there are 40 bytes of sha1
                         end = advance(end + 40, '\n')
                         return (lo, end + 1)
                     else:
                         return (lo, lo)
                 def find(self, node, f):
                     '''look up entry for a single file efficiently.

                     node is the manifest node to look in, f the file name.
                     return (node, flags) pair if found, (None, None) if not.

                     A cached, already parsed manifest is consulted first; otherwise
                     the raw revision text is bisected with _search so the whole
                     manifest does not have to be parsed.'''
                     if node in self._mancache:
                         mapping = self._mancache[node][0]
                         if f not in mapping:
                             # honour the documented "not found" result here too;
                             # mapping.flags(f) on its own would report "" rather
                             # than None for a missing file
                             return None, None
                         return mapping[f], mapping.flags(f)
                     text = self.revision(node)
                     start, end = self._search(text, f)
                     if start == end:
                         return None, None
                     # the matched line is "<name>\0<40 hex digits><flags>\n"
                     line = text[start:end]
                     _name, rest = line.split('\0')
                     # drop the trailing newline from the flags
                     return revlog.bin(rest[:40]), rest[40:-1]
                 def add(self, map, transaction, link, p1, p2, added, removed):
-                    # if we're using the cache, make sure it is valid and
+                    if p1 in self._mancache:
-                    # parented by the same node we're diffing against
+                        # If our first parent is in the manifest cache, we can
-                    if not (p1 and (p1 in self._mancache)):
+                        # compute a delta here using properties we know about the
-                        files = sorted(map)
+                        # manifest up-front, which may save time later for the
-                        _checkforbidden(files)
+                        # revlog layer.
-                        # if this is changed to support newlines in filenames,
-                        # be sure to check the templates/ dir again (especially *-raw.tmpl)
-                        hex, flags = revlog.hex, map.flags
-                        text = ''.join("%s\0%s%s\n" % (f, hex(map[f]), flags(f))
-                                       for f in files)
-                        arraytext = array.array('c', text)
-                        cachedelta = None
-                    else:
                         addlist = self._mancache[p1][1]
                         _checkforbidden(added)
                         # combine the changed lists into one list for sorting
                         work = [(x, False) for x in added]
                         work.extend((x, True) for x in removed)
                         # this could use heapq.merge() (from Python 2.6+) or equivalent
                         # since the lists are already sorted
                         work.sort()
                         delta = []
                         dstart = None
                         dend = None
                         dline = [""]
                         start = 0
                         # zero copy representation of addlist as a buffer
                         addbuf = util.buffer(addlist)
                         # start with a readonly loop that finds the offset of
                         # each line and creates the deltas
                         for f, todelete in work:
                             # start/end will either span the item's line or, when
                             # they are equal, mark the insert point
                             start, end = self._search(addbuf, f, start)
                             if not todelete:
                                 l = "%s\0%s%s\n" % (f, revlog.hex(map[f]), map.flags(f))
                             else:
                                 if start == end:
                                     # item we want to delete was not found, error out
                                     raise AssertionError(
                                             _("failed to remove %s from manifest") % f)
                                 l = ""
                             if dstart is not None and dstart <= start and dend >= start:
                                 if dend < end:
                                     dend = end
                                 if l:
                                     dline.append(l)
                             else:
                                 if dstart is not None:
                                     delta.append([dstart, dend, "".join(dline)])
                                 dstart = start
                                 dend = end
                                 dline = [l]
                         if dstart is not None:
                             delta.append([dstart, dend, "".join(dline)])
                         # apply the delta to the addlist, and get a delta for addrevision
                         deltatext, addlist = _addlistdelta(addlist, delta)
                         cachedelta = (self.rev(p1), deltatext)
                         arraytext = addlist
                         text = util.buffer(arraytext)
+                    else:
+                        # The first parent manifest isn't already loaded, so we'll
+                        # just encode a fulltext of the manifest and pass that
+                        # through to the revlog layer, and let it handle the delta
+                        # process.
+                        files = sorted(map)
+                        _checkforbidden(files)
+                        # if this is changed to support newlines in filenames,
+                        # be sure to check the templates/ dir again (especially *-raw.tmpl)
+                        hex, flags = revlog.hex, map.flags
+                        text = ''.join("%s\0%s%s\n" % (f, hex(map[f]), flags(f))
+                                       for f in files)
+                        arraytext = array.array('c', text)
+                        cachedelta = None
                     n = self.addrevision(text, transaction, link, p1, p2, cachedelta)
                     self._mancache[n] = (map, arraytext)
                     return n