##// END OF EJS Templates
manifest: leave a TODO where we may have more work for sha1 portability...
Augie Fackler -
r45198:f0d88d20 default draft
parent child Browse files
Show More
@@ -1,2297 +1,2298 b''
1 # manifest.py - manifest revision class for mercurial
1 # manifest.py - manifest revision class for mercurial
2 #
2 #
3 # Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
3 # Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
4 #
4 #
5 # This software may be used and distributed according to the terms of the
5 # This software may be used and distributed according to the terms of the
6 # GNU General Public License version 2 or any later version.
6 # GNU General Public License version 2 or any later version.
7
7
8 from __future__ import absolute_import
8 from __future__ import absolute_import
9
9
10 import heapq
10 import heapq
11 import itertools
11 import itertools
12 import struct
12 import struct
13 import weakref
13 import weakref
14
14
15 from .i18n import _
15 from .i18n import _
16 from .node import (
16 from .node import (
17 bin,
17 bin,
18 hex,
18 hex,
19 nullid,
19 nullid,
20 nullrev,
20 nullrev,
21 )
21 )
22 from .pycompat import getattr
22 from .pycompat import getattr
23 from . import (
23 from . import (
24 encoding,
24 encoding,
25 error,
25 error,
26 match as matchmod,
26 match as matchmod,
27 mdiff,
27 mdiff,
28 pathutil,
28 pathutil,
29 policy,
29 policy,
30 pycompat,
30 pycompat,
31 revlog,
31 revlog,
32 util,
32 util,
33 )
33 )
34 from .interfaces import (
34 from .interfaces import (
35 repository,
35 repository,
36 util as interfaceutil,
36 util as interfaceutil,
37 )
37 )
38
38
39 parsers = policy.importmod('parsers')
39 parsers = policy.importmod('parsers')
40 propertycache = util.propertycache
40 propertycache = util.propertycache
41
41
42 # Allow tests to more easily test the alternate path in manifestdict.fastdelta()
42 # Allow tests to more easily test the alternate path in manifestdict.fastdelta()
43 FASTDELTA_TEXTDIFF_THRESHOLD = 1000
43 FASTDELTA_TEXTDIFF_THRESHOLD = 1000
44
44
45
45
46 def _parse(data):
46 def _parse(data):
47 # This method does a little bit of excessive-looking
47 # This method does a little bit of excessive-looking
48 # precondition checking. This is so that the behavior of this
48 # precondition checking. This is so that the behavior of this
49 # class exactly matches its C counterpart to try and help
49 # class exactly matches its C counterpart to try and help
50 # prevent surprise breakage for anyone that develops against
50 # prevent surprise breakage for anyone that develops against
51 # the pure version.
51 # the pure version.
52 if data and data[-1:] != b'\n':
52 if data and data[-1:] != b'\n':
53 raise ValueError(b'Manifest did not end in a newline.')
53 raise ValueError(b'Manifest did not end in a newline.')
54 prev = None
54 prev = None
55 for l in data.splitlines():
55 for l in data.splitlines():
56 if prev is not None and prev > l:
56 if prev is not None and prev > l:
57 raise ValueError(b'Manifest lines not in sorted order.')
57 raise ValueError(b'Manifest lines not in sorted order.')
58 prev = l
58 prev = l
59 f, n = l.split(b'\0')
59 f, n = l.split(b'\0')
60 nl = len(n)
60 nl = len(n)
61 if 64 < nl:
61 if 64 < nl:
62 # modern hash, full width
62 # modern hash, full width
63 yield f, bin(n[:64]), n[64:]
63 yield f, bin(n[:64]), n[64:]
64 if 40 < nl < 45:
64 if 40 < nl < 45:
65 # legacy hash, always sha1
65 # legacy hash, always sha1
66 yield f, bin(n[:40]), n[40:]
66 yield f, bin(n[:40]), n[40:]
67 else:
67 else:
68 yield f, bin(n), b''
68 yield f, bin(n), b''
69
69
70
70
71 def _text(it):
71 def _text(it):
72 files = []
72 files = []
73 lines = []
73 lines = []
74 for f, n, fl in it:
74 for f, n, fl in it:
75 files.append(f)
75 files.append(f)
76 # if this is changed to support newlines in filenames,
76 # if this is changed to support newlines in filenames,
77 # be sure to check the templates/ dir again (especially *-raw.tmpl)
77 # be sure to check the templates/ dir again (especially *-raw.tmpl)
78 lines.append(b"%s\0%s%s\n" % (f, hex(n), fl))
78 lines.append(b"%s\0%s%s\n" % (f, hex(n), fl))
79
79
80 _checkforbidden(files)
80 _checkforbidden(files)
81 return b''.join(lines)
81 return b''.join(lines)
82
82
83
83
84 class lazymanifestiter(object):
84 class lazymanifestiter(object):
85 def __init__(self, lm):
85 def __init__(self, lm):
86 self.pos = 0
86 self.pos = 0
87 self.lm = lm
87 self.lm = lm
88
88
89 def __iter__(self):
89 def __iter__(self):
90 return self
90 return self
91
91
92 def next(self):
92 def next(self):
93 try:
93 try:
94 data, pos = self.lm._get(self.pos)
94 data, pos = self.lm._get(self.pos)
95 except IndexError:
95 except IndexError:
96 raise StopIteration
96 raise StopIteration
97 if pos == -1:
97 if pos == -1:
98 self.pos += 1
98 self.pos += 1
99 return data[0]
99 return data[0]
100 self.pos += 1
100 self.pos += 1
101 zeropos = data.find(b'\x00', pos)
101 zeropos = data.find(b'\x00', pos)
102 return data[pos:zeropos]
102 return data[pos:zeropos]
103
103
104 __next__ = next
104 __next__ = next
105
105
106
106
107 class lazymanifestiterentries(object):
107 class lazymanifestiterentries(object):
108 def __init__(self, lm):
108 def __init__(self, lm):
109 self.lm = lm
109 self.lm = lm
110 self.pos = 0
110 self.pos = 0
111
111
112 def __iter__(self):
112 def __iter__(self):
113 return self
113 return self
114
114
115 def next(self):
115 def next(self):
116 try:
116 try:
117 data, pos = self.lm._get(self.pos)
117 data, pos = self.lm._get(self.pos)
118 except IndexError:
118 except IndexError:
119 raise StopIteration
119 raise StopIteration
120 if pos == -1:
120 if pos == -1:
121 self.pos += 1
121 self.pos += 1
122 return data
122 return data
123 zeropos = data.find(b'\x00', pos)
123 zeropos = data.find(b'\x00', pos)
124 hashval = unhexlify(data, self.lm.extrainfo[self.pos], zeropos + 1, 40)
124 hashval = unhexlify(data, self.lm.extrainfo[self.pos], zeropos + 1, 40)
125 flags = self.lm._getflags(data, self.pos, zeropos)
125 flags = self.lm._getflags(data, self.pos, zeropos)
126 self.pos += 1
126 self.pos += 1
127 return (data[pos:zeropos], hashval, flags)
127 return (data[pos:zeropos], hashval, flags)
128
128
129 __next__ = next
129 __next__ = next
130
130
131
131
132 def unhexlify(data, extra, pos, length):
132 def unhexlify(data, extra, pos, length):
133 s = bin(data[pos : pos + length])
133 s = bin(data[pos : pos + length])
134 if extra:
134 if extra:
135 s += chr(extra & 0xFF)
135 s += chr(extra & 0xFF)
136 return s
136 return s
137
137
138
138
139 def _cmp(a, b):
139 def _cmp(a, b):
140 return (a > b) - (a < b)
140 return (a > b) - (a < b)
141
141
142
142
143 class _lazymanifest(object):
143 class _lazymanifest(object):
144 """A pure python manifest backed by a byte string. It is supplimented with
144 """A pure python manifest backed by a byte string. It is supplimented with
145 internal lists as it is modified, until it is compacted back to a pure byte
145 internal lists as it is modified, until it is compacted back to a pure byte
146 string.
146 string.
147
147
148 ``data`` is the initial manifest data.
148 ``data`` is the initial manifest data.
149
149
150 ``positions`` is a list of offsets, one per manifest entry. Positive
150 ``positions`` is a list of offsets, one per manifest entry. Positive
151 values are offsets into ``data``, negative values are offsets into the
151 values are offsets into ``data``, negative values are offsets into the
152 ``extradata`` list. When an entry is removed, its entry is dropped from
152 ``extradata`` list. When an entry is removed, its entry is dropped from
153 ``positions``. The values are encoded such that when walking the list and
153 ``positions``. The values are encoded such that when walking the list and
154 indexing into ``data`` or ``extradata`` as appropriate, the entries are
154 indexing into ``data`` or ``extradata`` as appropriate, the entries are
155 sorted by filename.
155 sorted by filename.
156
156
157 ``extradata`` is a list of (key, hash, flags) for entries that were added or
157 ``extradata`` is a list of (key, hash, flags) for entries that were added or
158 modified since the manifest was created or compacted.
158 modified since the manifest was created or compacted.
159 """
159 """
160
160
161 def __init__(
161 def __init__(
162 self,
162 self,
163 data,
163 data,
164 positions=None,
164 positions=None,
165 extrainfo=None,
165 extrainfo=None,
166 extradata=None,
166 extradata=None,
167 hasremovals=False,
167 hasremovals=False,
168 ):
168 ):
169 if positions is None:
169 if positions is None:
170 self.positions = self.findlines(data)
170 self.positions = self.findlines(data)
171 self.extrainfo = [0] * len(self.positions)
171 self.extrainfo = [0] * len(self.positions)
172 self.data = data
172 self.data = data
173 self.extradata = []
173 self.extradata = []
174 self.hasremovals = False
174 self.hasremovals = False
175 else:
175 else:
176 self.positions = positions[:]
176 self.positions = positions[:]
177 self.extrainfo = extrainfo[:]
177 self.extrainfo = extrainfo[:]
178 self.extradata = extradata[:]
178 self.extradata = extradata[:]
179 self.data = data
179 self.data = data
180 self.hasremovals = hasremovals
180 self.hasremovals = hasremovals
181
181
182 def findlines(self, data):
182 def findlines(self, data):
183 if not data:
183 if not data:
184 return []
184 return []
185 pos = data.find(b"\n")
185 pos = data.find(b"\n")
186 if pos == -1 or data[-1:] != b'\n':
186 if pos == -1 or data[-1:] != b'\n':
187 raise ValueError(b"Manifest did not end in a newline.")
187 raise ValueError(b"Manifest did not end in a newline.")
188 positions = [0]
188 positions = [0]
189 prev = data[: data.find(b'\x00')]
189 prev = data[: data.find(b'\x00')]
190 while pos < len(data) - 1 and pos != -1:
190 while pos < len(data) - 1 and pos != -1:
191 positions.append(pos + 1)
191 positions.append(pos + 1)
192 nexts = data[pos + 1 : data.find(b'\x00', pos + 1)]
192 nexts = data[pos + 1 : data.find(b'\x00', pos + 1)]
193 if nexts < prev:
193 if nexts < prev:
194 raise ValueError(b"Manifest lines not in sorted order.")
194 raise ValueError(b"Manifest lines not in sorted order.")
195 prev = nexts
195 prev = nexts
196 pos = data.find(b"\n", pos + 1)
196 pos = data.find(b"\n", pos + 1)
197 return positions
197 return positions
198
198
199 def _get(self, index):
199 def _get(self, index):
200 # get the position encoded in pos:
200 # get the position encoded in pos:
201 # positive number is an index in 'data'
201 # positive number is an index in 'data'
202 # negative number is in extrapieces
202 # negative number is in extrapieces
203 pos = self.positions[index]
203 pos = self.positions[index]
204 if pos >= 0:
204 if pos >= 0:
205 return self.data, pos
205 return self.data, pos
206 return self.extradata[-pos - 1], -1
206 return self.extradata[-pos - 1], -1
207
207
208 def _getkey(self, pos):
208 def _getkey(self, pos):
209 if pos >= 0:
209 if pos >= 0:
210 return self.data[pos : self.data.find(b'\x00', pos + 1)]
210 return self.data[pos : self.data.find(b'\x00', pos + 1)]
211 return self.extradata[-pos - 1][0]
211 return self.extradata[-pos - 1][0]
212
212
213 def bsearch(self, key):
213 def bsearch(self, key):
214 first = 0
214 first = 0
215 last = len(self.positions) - 1
215 last = len(self.positions) - 1
216
216
217 while first <= last:
217 while first <= last:
218 midpoint = (first + last) // 2
218 midpoint = (first + last) // 2
219 nextpos = self.positions[midpoint]
219 nextpos = self.positions[midpoint]
220 candidate = self._getkey(nextpos)
220 candidate = self._getkey(nextpos)
221 r = _cmp(key, candidate)
221 r = _cmp(key, candidate)
222 if r == 0:
222 if r == 0:
223 return midpoint
223 return midpoint
224 else:
224 else:
225 if r < 0:
225 if r < 0:
226 last = midpoint - 1
226 last = midpoint - 1
227 else:
227 else:
228 first = midpoint + 1
228 first = midpoint + 1
229 return -1
229 return -1
230
230
231 def bsearch2(self, key):
231 def bsearch2(self, key):
232 # same as the above, but will always return the position
232 # same as the above, but will always return the position
233 # done for performance reasons
233 # done for performance reasons
234 first = 0
234 first = 0
235 last = len(self.positions) - 1
235 last = len(self.positions) - 1
236
236
237 while first <= last:
237 while first <= last:
238 midpoint = (first + last) // 2
238 midpoint = (first + last) // 2
239 nextpos = self.positions[midpoint]
239 nextpos = self.positions[midpoint]
240 candidate = self._getkey(nextpos)
240 candidate = self._getkey(nextpos)
241 r = _cmp(key, candidate)
241 r = _cmp(key, candidate)
242 if r == 0:
242 if r == 0:
243 return (midpoint, True)
243 return (midpoint, True)
244 else:
244 else:
245 if r < 0:
245 if r < 0:
246 last = midpoint - 1
246 last = midpoint - 1
247 else:
247 else:
248 first = midpoint + 1
248 first = midpoint + 1
249 return (first, False)
249 return (first, False)
250
250
251 def __contains__(self, key):
251 def __contains__(self, key):
252 return self.bsearch(key) != -1
252 return self.bsearch(key) != -1
253
253
254 def _getflags(self, data, needle, pos):
254 def _getflags(self, data, needle, pos):
255 start = pos + 41
255 start = pos + 41
256 end = data.find(b"\n", start)
256 end = data.find(b"\n", start)
257 if end == -1:
257 if end == -1:
258 end = len(data) - 1
258 end = len(data) - 1
259 if start == end:
259 if start == end:
260 return b''
260 return b''
261 return self.data[start:end]
261 return self.data[start:end]
262
262
263 def __getitem__(self, key):
263 def __getitem__(self, key):
264 if not isinstance(key, bytes):
264 if not isinstance(key, bytes):
265 raise TypeError(b"getitem: manifest keys must be a bytes.")
265 raise TypeError(b"getitem: manifest keys must be a bytes.")
266 needle = self.bsearch(key)
266 needle = self.bsearch(key)
267 if needle == -1:
267 if needle == -1:
268 raise KeyError
268 raise KeyError
269 data, pos = self._get(needle)
269 data, pos = self._get(needle)
270 if pos == -1:
270 if pos == -1:
271 return (data[1], data[2])
271 return (data[1], data[2])
272 zeropos = data.find(b'\x00', pos)
272 zeropos = data.find(b'\x00', pos)
273 nlpos = data.find(b'\n', zeropos)
273 nlpos = data.find(b'\n', zeropos)
274 assert 0 <= needle <= len(self.positions)
274 assert 0 <= needle <= len(self.positions)
275 assert len(self.extrainfo) == len(self.positions)
275 assert len(self.extrainfo) == len(self.positions)
276 hlen = nlpos - zeropos - 1
276 hlen = nlpos - zeropos - 1
277 # Hashes sometimes have an extra byte tucked on the end, so
277 # Hashes sometimes have an extra byte tucked on the end, so
278 # detect that.
278 # detect that.
279 if hlen % 2:
279 if hlen % 2:
280 hlen -= 1
280 hlen -= 1
281 hashval = unhexlify(data, self.extrainfo[needle], zeropos + 1, hlen)
281 hashval = unhexlify(data, self.extrainfo[needle], zeropos + 1, hlen)
282 flags = self._getflags(data, needle, zeropos)
282 flags = self._getflags(data, needle, zeropos)
283 return (hashval, flags)
283 return (hashval, flags)
284
284
285 def __delitem__(self, key):
285 def __delitem__(self, key):
286 needle, found = self.bsearch2(key)
286 needle, found = self.bsearch2(key)
287 if not found:
287 if not found:
288 raise KeyError
288 raise KeyError
289 cur = self.positions[needle]
289 cur = self.positions[needle]
290 self.positions = self.positions[:needle] + self.positions[needle + 1 :]
290 self.positions = self.positions[:needle] + self.positions[needle + 1 :]
291 self.extrainfo = self.extrainfo[:needle] + self.extrainfo[needle + 1 :]
291 self.extrainfo = self.extrainfo[:needle] + self.extrainfo[needle + 1 :]
292 if cur >= 0:
292 if cur >= 0:
293 # This does NOT unsort the list as far as the search functions are
293 # This does NOT unsort the list as far as the search functions are
294 # concerned, as they only examine lines mapped by self.positions.
294 # concerned, as they only examine lines mapped by self.positions.
295 self.data = self.data[:cur] + b'\x00' + self.data[cur + 1 :]
295 self.data = self.data[:cur] + b'\x00' + self.data[cur + 1 :]
296 self.hasremovals = True
296 self.hasremovals = True
297
297
298 def __setitem__(self, key, value):
298 def __setitem__(self, key, value):
299 if not isinstance(key, bytes):
299 if not isinstance(key, bytes):
300 raise TypeError(b"setitem: manifest keys must be a byte string.")
300 raise TypeError(b"setitem: manifest keys must be a byte string.")
301 if not isinstance(value, tuple) or len(value) != 2:
301 if not isinstance(value, tuple) or len(value) != 2:
302 raise TypeError(
302 raise TypeError(
303 b"Manifest values must be a tuple of (node, flags)."
303 b"Manifest values must be a tuple of (node, flags)."
304 )
304 )
305 hashval = value[0]
305 hashval = value[0]
306 # hashes are either 20 or 32 bytes (sha1 or its replacement),
306 # hashes are either 20 or 32 bytes (sha1 or its replacement),
307 # and allow one extra byte taht won't be persisted to disk but
307 # and allow one extra byte taht won't be persisted to disk but
308 # is sometimes used in memory.
308 # is sometimes used in memory.
309 if not isinstance(hashval, bytes) or not (
309 if not isinstance(hashval, bytes) or not (
310 20 <= len(hashval) <= 22 or 32 <= len(hashval) <= 34
310 20 <= len(hashval) <= 22 or 32 <= len(hashval) <= 34
311 ):
311 ):
312 raise TypeError(b"node must be a 20-byte or 32-byte byte string")
312 raise TypeError(b"node must be a 20-byte or 32-byte byte string")
313 flags = value[1]
313 flags = value[1]
314 if len(hashval) == 22:
314 if len(hashval) == 22:
315 hashval = hashval[:-1]
315 hashval = hashval[:-1]
316 if not isinstance(flags, bytes) or len(flags) > 1:
316 if not isinstance(flags, bytes) or len(flags) > 1:
317 raise TypeError(b"flags must a 0 or 1 byte string, got %r", flags)
317 raise TypeError(b"flags must a 0 or 1 byte string, got %r", flags)
318 needle, found = self.bsearch2(key)
318 needle, found = self.bsearch2(key)
319 if found:
319 if found:
320 # put the item
320 # put the item
321 pos = self.positions[needle]
321 pos = self.positions[needle]
322 if pos < 0:
322 if pos < 0:
323 self.extradata[-pos - 1] = (key, hashval, value[1])
323 self.extradata[-pos - 1] = (key, hashval, value[1])
324 else:
324 else:
325 # just don't bother
325 # just don't bother
326 self.extradata.append((key, hashval, value[1]))
326 self.extradata.append((key, hashval, value[1]))
327 self.positions[needle] = -len(self.extradata)
327 self.positions[needle] = -len(self.extradata)
328 else:
328 else:
329 # not found, put it in with extra positions
329 # not found, put it in with extra positions
330 self.extradata.append((key, hashval, value[1]))
330 self.extradata.append((key, hashval, value[1]))
331 self.positions = (
331 self.positions = (
332 self.positions[:needle]
332 self.positions[:needle]
333 + [-len(self.extradata)]
333 + [-len(self.extradata)]
334 + self.positions[needle:]
334 + self.positions[needle:]
335 )
335 )
336 self.extrainfo = (
336 self.extrainfo = (
337 self.extrainfo[:needle] + [0] + self.extrainfo[needle:]
337 self.extrainfo[:needle] + [0] + self.extrainfo[needle:]
338 )
338 )
339
339
340 def copy(self):
340 def copy(self):
341 # XXX call _compact like in C?
341 # XXX call _compact like in C?
342 return _lazymanifest(
342 return _lazymanifest(
343 self.data,
343 self.data,
344 self.positions,
344 self.positions,
345 self.extrainfo,
345 self.extrainfo,
346 self.extradata,
346 self.extradata,
347 self.hasremovals,
347 self.hasremovals,
348 )
348 )
349
349
350 def _compact(self):
350 def _compact(self):
351 # hopefully not called TOO often
351 # hopefully not called TOO often
352 if len(self.extradata) == 0 and not self.hasremovals:
352 if len(self.extradata) == 0 and not self.hasremovals:
353 return
353 return
354 l = []
354 l = []
355 i = 0
355 i = 0
356 offset = 0
356 offset = 0
357 self.extrainfo = [0] * len(self.positions)
357 self.extrainfo = [0] * len(self.positions)
358 while i < len(self.positions):
358 while i < len(self.positions):
359 if self.positions[i] >= 0:
359 if self.positions[i] >= 0:
360 cur = self.positions[i]
360 cur = self.positions[i]
361 last_cut = cur
361 last_cut = cur
362
362
363 # Collect all contiguous entries in the buffer at the current
363 # Collect all contiguous entries in the buffer at the current
364 # offset, breaking out only for added/modified items held in
364 # offset, breaking out only for added/modified items held in
365 # extradata, or a deleted line prior to the next position.
365 # extradata, or a deleted line prior to the next position.
366 while True:
366 while True:
367 self.positions[i] = offset
367 self.positions[i] = offset
368 i += 1
368 i += 1
369 if i == len(self.positions) or self.positions[i] < 0:
369 if i == len(self.positions) or self.positions[i] < 0:
370 break
370 break
371
371
372 # A removed file has no positions[] entry, but does have an
372 # A removed file has no positions[] entry, but does have an
373 # overwritten first byte. Break out and find the end of the
373 # overwritten first byte. Break out and find the end of the
374 # current good entry/entries if there is a removed file
374 # current good entry/entries if there is a removed file
375 # before the next position.
375 # before the next position.
376 if (
376 if (
377 self.hasremovals
377 self.hasremovals
378 and self.data.find(b'\n\x00', cur, self.positions[i])
378 and self.data.find(b'\n\x00', cur, self.positions[i])
379 != -1
379 != -1
380 ):
380 ):
381 break
381 break
382
382
383 offset += self.positions[i] - cur
383 offset += self.positions[i] - cur
384 cur = self.positions[i]
384 cur = self.positions[i]
385 end_cut = self.data.find(b'\n', cur)
385 end_cut = self.data.find(b'\n', cur)
386 if end_cut != -1:
386 if end_cut != -1:
387 end_cut += 1
387 end_cut += 1
388 offset += end_cut - cur
388 offset += end_cut - cur
389 l.append(self.data[last_cut:end_cut])
389 l.append(self.data[last_cut:end_cut])
390 else:
390 else:
391 while i < len(self.positions) and self.positions[i] < 0:
391 while i < len(self.positions) and self.positions[i] < 0:
392 cur = self.positions[i]
392 cur = self.positions[i]
393 t = self.extradata[-cur - 1]
393 t = self.extradata[-cur - 1]
394 l.append(self._pack(t))
394 l.append(self._pack(t))
395 self.positions[i] = offset
395 self.positions[i] = offset
396 # Hashes are either 20 bytes (old sha1s) or 32
396 # Hashes are either 20 bytes (old sha1s) or 32
397 # bytes (new non-sha1).
397 # bytes (new non-sha1).
398 hlen = 20
398 hlen = 20
399 if len(t[1]) > 25:
399 if len(t[1]) > 25:
400 hlen = 32
400 hlen = 32
401 if len(t[1]) > hlen:
401 if len(t[1]) > hlen:
402 self.extrainfo[i] = ord(t[1][hlen + 1])
402 self.extrainfo[i] = ord(t[1][hlen + 1])
403 offset += len(l[-1])
403 offset += len(l[-1])
404 i += 1
404 i += 1
405 self.data = b''.join(l)
405 self.data = b''.join(l)
406 self.hasremovals = False
406 self.hasremovals = False
407 self.extradata = []
407 self.extradata = []
408
408
409 def _pack(self, d):
409 def _pack(self, d):
410 n = d[1]
410 n = d[1]
411 if len(n) == 21 or len(n) == 33:
411 if len(n) == 21 or len(n) == 33:
412 n = n[:-1]
412 n = n[:-1]
413 assert len(n) == 20 or len(n) == 32
413 assert len(n) == 20 or len(n) == 32
414 return d[0] + b'\x00' + hex(n) + d[2] + b'\n'
414 return d[0] + b'\x00' + hex(n) + d[2] + b'\n'
415
415
416 def text(self):
416 def text(self):
417 self._compact()
417 self._compact()
418 return self.data
418 return self.data
419
419
420 def diff(self, m2, clean=False):
420 def diff(self, m2, clean=False):
421 '''Finds changes between the current manifest and m2.'''
421 '''Finds changes between the current manifest and m2.'''
422 # XXX think whether efficiency matters here
422 # XXX think whether efficiency matters here
423 diff = {}
423 diff = {}
424
424
425 for fn, e1, flags in self.iterentries():
425 for fn, e1, flags in self.iterentries():
426 if fn not in m2:
426 if fn not in m2:
427 diff[fn] = (e1, flags), (None, b'')
427 diff[fn] = (e1, flags), (None, b'')
428 else:
428 else:
429 e2 = m2[fn]
429 e2 = m2[fn]
430 if (e1, flags) != e2:
430 if (e1, flags) != e2:
431 diff[fn] = (e1, flags), e2
431 diff[fn] = (e1, flags), e2
432 elif clean:
432 elif clean:
433 diff[fn] = None
433 diff[fn] = None
434
434
435 for fn, e2, flags in m2.iterentries():
435 for fn, e2, flags in m2.iterentries():
436 if fn not in self:
436 if fn not in self:
437 diff[fn] = (None, b''), (e2, flags)
437 diff[fn] = (None, b''), (e2, flags)
438
438
439 return diff
439 return diff
440
440
441 def iterentries(self):
441 def iterentries(self):
442 return lazymanifestiterentries(self)
442 return lazymanifestiterentries(self)
443
443
444 def iterkeys(self):
444 def iterkeys(self):
445 return lazymanifestiter(self)
445 return lazymanifestiter(self)
446
446
447 def __iter__(self):
447 def __iter__(self):
448 return lazymanifestiter(self)
448 return lazymanifestiter(self)
449
449
450 def __len__(self):
450 def __len__(self):
451 return len(self.positions)
451 return len(self.positions)
452
452
453 def filtercopy(self, filterfn):
453 def filtercopy(self, filterfn):
454 # XXX should be optimized
454 # XXX should be optimized
455 c = _lazymanifest(b'')
455 c = _lazymanifest(b'')
456 for f, n, fl in self.iterentries():
456 for f, n, fl in self.iterentries():
457 if filterfn(f):
457 if filterfn(f):
458 c[f] = n, fl
458 c[f] = n, fl
459 return c
459 return c
460
460
461
461
462 try:
462 try:
463 _lazymanifest = parsers.lazymanifest
463 _lazymanifest = parsers.lazymanifest
464 except AttributeError:
464 except AttributeError:
465 pass
465 pass
466
466
467
467
468 @interfaceutil.implementer(repository.imanifestdict)
468 @interfaceutil.implementer(repository.imanifestdict)
469 class manifestdict(object):
469 class manifestdict(object):
470 def __init__(self, data=b''):
470 def __init__(self, data=b''):
471 self._lm = _lazymanifest(data)
471 self._lm = _lazymanifest(data)
472
472
473 def __getitem__(self, key):
473 def __getitem__(self, key):
474 return self._lm[key][0]
474 return self._lm[key][0]
475
475
476 def find(self, key):
476 def find(self, key):
477 return self._lm[key]
477 return self._lm[key]
478
478
479 def __len__(self):
479 def __len__(self):
480 return len(self._lm)
480 return len(self._lm)
481
481
482 def __nonzero__(self):
482 def __nonzero__(self):
483 # nonzero is covered by the __len__ function, but implementing it here
483 # nonzero is covered by the __len__ function, but implementing it here
484 # makes it easier for extensions to override.
484 # makes it easier for extensions to override.
485 return len(self._lm) != 0
485 return len(self._lm) != 0
486
486
487 __bool__ = __nonzero__
487 __bool__ = __nonzero__
488
488
489 def __setitem__(self, key, node):
489 def __setitem__(self, key, node):
490 self._lm[key] = node, self.flags(key)
490 self._lm[key] = node, self.flags(key)
491
491
492 def __contains__(self, key):
492 def __contains__(self, key):
493 if key is None:
493 if key is None:
494 return False
494 return False
495 return key in self._lm
495 return key in self._lm
496
496
497 def __delitem__(self, key):
497 def __delitem__(self, key):
498 del self._lm[key]
498 del self._lm[key]
499
499
500 def __iter__(self):
500 def __iter__(self):
501 return self._lm.__iter__()
501 return self._lm.__iter__()
502
502
503 def iterkeys(self):
503 def iterkeys(self):
504 return self._lm.iterkeys()
504 return self._lm.iterkeys()
505
505
506 def keys(self):
506 def keys(self):
507 return list(self.iterkeys())
507 return list(self.iterkeys())
508
508
509 def filesnotin(self, m2, match=None):
509 def filesnotin(self, m2, match=None):
510 '''Set of files in this manifest that are not in the other'''
510 '''Set of files in this manifest that are not in the other'''
511 if match is not None:
511 if match is not None:
512 match = matchmod.badmatch(match, lambda path, msg: None)
512 match = matchmod.badmatch(match, lambda path, msg: None)
513 sm2 = set(m2.walk(match))
513 sm2 = set(m2.walk(match))
514 return {f for f in self.walk(match) if f not in sm2}
514 return {f for f in self.walk(match) if f not in sm2}
515 return {f for f in self if f not in m2}
515 return {f for f in self if f not in m2}
516
516
517 @propertycache
517 @propertycache
518 def _dirs(self):
518 def _dirs(self):
519 return pathutil.dirs(self)
519 return pathutil.dirs(self)
520
520
521 def dirs(self):
521 def dirs(self):
522 return self._dirs
522 return self._dirs
523
523
524 def hasdir(self, dir):
524 def hasdir(self, dir):
525 return dir in self._dirs
525 return dir in self._dirs
526
526
527 def _filesfastpath(self, match):
527 def _filesfastpath(self, match):
528 '''Checks whether we can correctly and quickly iterate over matcher
528 '''Checks whether we can correctly and quickly iterate over matcher
529 files instead of over manifest files.'''
529 files instead of over manifest files.'''
530 files = match.files()
530 files = match.files()
531 return len(files) < 100 and (
531 return len(files) < 100 and (
532 match.isexact()
532 match.isexact()
533 or (match.prefix() and all(fn in self for fn in files))
533 or (match.prefix() and all(fn in self for fn in files))
534 )
534 )
535
535
536 def walk(self, match):
536 def walk(self, match):
537 '''Generates matching file names.
537 '''Generates matching file names.
538
538
539 Equivalent to manifest.matches(match).iterkeys(), but without creating
539 Equivalent to manifest.matches(match).iterkeys(), but without creating
540 an entirely new manifest.
540 an entirely new manifest.
541
541
542 It also reports nonexistent files by marking them bad with match.bad().
542 It also reports nonexistent files by marking them bad with match.bad().
543 '''
543 '''
544 if match.always():
544 if match.always():
545 for f in iter(self):
545 for f in iter(self):
546 yield f
546 yield f
547 return
547 return
548
548
549 fset = set(match.files())
549 fset = set(match.files())
550
550
551 # avoid the entire walk if we're only looking for specific files
551 # avoid the entire walk if we're only looking for specific files
552 if self._filesfastpath(match):
552 if self._filesfastpath(match):
553 for fn in sorted(fset):
553 for fn in sorted(fset):
554 if fn in self:
554 if fn in self:
555 yield fn
555 yield fn
556 return
556 return
557
557
558 for fn in self:
558 for fn in self:
559 if fn in fset:
559 if fn in fset:
560 # specified pattern is the exact name
560 # specified pattern is the exact name
561 fset.remove(fn)
561 fset.remove(fn)
562 if match(fn):
562 if match(fn):
563 yield fn
563 yield fn
564
564
565 # for dirstate.walk, files=[''] means "walk the whole tree".
565 # for dirstate.walk, files=[''] means "walk the whole tree".
566 # follow that here, too
566 # follow that here, too
567 fset.discard(b'')
567 fset.discard(b'')
568
568
569 for fn in sorted(fset):
569 for fn in sorted(fset):
570 if not self.hasdir(fn):
570 if not self.hasdir(fn):
571 match.bad(fn, None)
571 match.bad(fn, None)
572
572
573 def _matches(self, match):
573 def _matches(self, match):
574 '''generate a new manifest filtered by the match argument'''
574 '''generate a new manifest filtered by the match argument'''
575 if match.always():
575 if match.always():
576 return self.copy()
576 return self.copy()
577
577
578 if self._filesfastpath(match):
578 if self._filesfastpath(match):
579 m = manifestdict()
579 m = manifestdict()
580 lm = self._lm
580 lm = self._lm
581 for fn in match.files():
581 for fn in match.files():
582 if fn in lm:
582 if fn in lm:
583 m._lm[fn] = lm[fn]
583 m._lm[fn] = lm[fn]
584 return m
584 return m
585
585
586 m = manifestdict()
586 m = manifestdict()
587 m._lm = self._lm.filtercopy(match)
587 m._lm = self._lm.filtercopy(match)
588 return m
588 return m
589
589
590 def diff(self, m2, match=None, clean=False):
590 def diff(self, m2, match=None, clean=False):
591 '''Finds changes between the current manifest and m2.
591 '''Finds changes between the current manifest and m2.
592
592
593 Args:
593 Args:
594 m2: the manifest to which this manifest should be compared.
594 m2: the manifest to which this manifest should be compared.
595 clean: if true, include files unchanged between these manifests
595 clean: if true, include files unchanged between these manifests
596 with a None value in the returned dictionary.
596 with a None value in the returned dictionary.
597
597
598 The result is returned as a dict with filename as key and
598 The result is returned as a dict with filename as key and
599 values of the form ((n1,fl1),(n2,fl2)), where n1/n2 is the
599 values of the form ((n1,fl1),(n2,fl2)), where n1/n2 is the
600 nodeid in the current/other manifest and fl1/fl2 is the flag
600 nodeid in the current/other manifest and fl1/fl2 is the flag
601 in the current/other manifest. Where the file does not exist,
601 in the current/other manifest. Where the file does not exist,
602 the nodeid will be None and the flags will be the empty
602 the nodeid will be None and the flags will be the empty
603 string.
603 string.
604 '''
604 '''
605 if match:
605 if match:
606 m1 = self._matches(match)
606 m1 = self._matches(match)
607 m2 = m2._matches(match)
607 m2 = m2._matches(match)
608 return m1.diff(m2, clean=clean)
608 return m1.diff(m2, clean=clean)
609 return self._lm.diff(m2._lm, clean)
609 return self._lm.diff(m2._lm, clean)
610
610
611 def setflag(self, key, flag):
611 def setflag(self, key, flag):
612 self._lm[key] = self[key], flag
612 self._lm[key] = self[key], flag
613
613
614 def get(self, key, default=None):
614 def get(self, key, default=None):
615 try:
615 try:
616 return self._lm[key][0]
616 return self._lm[key][0]
617 except KeyError:
617 except KeyError:
618 return default
618 return default
619
619
620 def flags(self, key):
620 def flags(self, key):
621 try:
621 try:
622 return self._lm[key][1]
622 return self._lm[key][1]
623 except KeyError:
623 except KeyError:
624 return b''
624 return b''
625
625
626 def copy(self):
626 def copy(self):
627 c = manifestdict()
627 c = manifestdict()
628 c._lm = self._lm.copy()
628 c._lm = self._lm.copy()
629 return c
629 return c
630
630
631 def items(self):
631 def items(self):
632 return (x[:2] for x in self._lm.iterentries())
632 return (x[:2] for x in self._lm.iterentries())
633
633
634 def iteritems(self):
634 def iteritems(self):
635 return (x[:2] for x in self._lm.iterentries())
635 return (x[:2] for x in self._lm.iterentries())
636
636
637 def iterentries(self):
637 def iterentries(self):
638 return self._lm.iterentries()
638 return self._lm.iterentries()
639
639
640 def text(self):
640 def text(self):
641 # most likely uses native version
641 # most likely uses native version
642 return self._lm.text()
642 return self._lm.text()
643
643
644 def fastdelta(self, base, changes):
644 def fastdelta(self, base, changes):
645 """Given a base manifest text as a bytearray and a list of changes
645 """Given a base manifest text as a bytearray and a list of changes
646 relative to that text, compute a delta that can be used by revlog.
646 relative to that text, compute a delta that can be used by revlog.
647 """
647 """
648 delta = []
648 delta = []
649 dstart = None
649 dstart = None
650 dend = None
650 dend = None
651 dline = [b""]
651 dline = [b""]
652 start = 0
652 start = 0
653 # zero copy representation of base as a buffer
653 # zero copy representation of base as a buffer
654 addbuf = util.buffer(base)
654 addbuf = util.buffer(base)
655
655
656 changes = list(changes)
656 changes = list(changes)
657 if len(changes) < FASTDELTA_TEXTDIFF_THRESHOLD:
657 if len(changes) < FASTDELTA_TEXTDIFF_THRESHOLD:
658 # start with a readonly loop that finds the offset of
658 # start with a readonly loop that finds the offset of
659 # each line and creates the deltas
659 # each line and creates the deltas
660 for f, todelete in changes:
660 for f, todelete in changes:
661 # bs will either be the index of the item or the insert point
661 # bs will either be the index of the item or the insert point
662 start, end = _msearch(addbuf, f, start)
662 start, end = _msearch(addbuf, f, start)
663 if not todelete:
663 if not todelete:
664 h, fl = self._lm[f]
664 h, fl = self._lm[f]
665 l = b"%s\0%s%s\n" % (f, hex(h), fl)
665 l = b"%s\0%s%s\n" % (f, hex(h), fl)
666 else:
666 else:
667 if start == end:
667 if start == end:
668 # item we want to delete was not found, error out
668 # item we want to delete was not found, error out
669 raise AssertionError(
669 raise AssertionError(
670 _(b"failed to remove %s from manifest") % f
670 _(b"failed to remove %s from manifest") % f
671 )
671 )
672 l = b""
672 l = b""
673 if dstart is not None and dstart <= start and dend >= start:
673 if dstart is not None and dstart <= start and dend >= start:
674 if dend < end:
674 if dend < end:
675 dend = end
675 dend = end
676 if l:
676 if l:
677 dline.append(l)
677 dline.append(l)
678 else:
678 else:
679 if dstart is not None:
679 if dstart is not None:
680 delta.append([dstart, dend, b"".join(dline)])
680 delta.append([dstart, dend, b"".join(dline)])
681 dstart = start
681 dstart = start
682 dend = end
682 dend = end
683 dline = [l]
683 dline = [l]
684
684
685 if dstart is not None:
685 if dstart is not None:
686 delta.append([dstart, dend, b"".join(dline)])
686 delta.append([dstart, dend, b"".join(dline)])
687 # apply the delta to the base, and get a delta for addrevision
687 # apply the delta to the base, and get a delta for addrevision
688 deltatext, arraytext = _addlistdelta(base, delta)
688 deltatext, arraytext = _addlistdelta(base, delta)
689 else:
689 else:
690 # For large changes, it's much cheaper to just build the text and
690 # For large changes, it's much cheaper to just build the text and
691 # diff it.
691 # diff it.
692 arraytext = bytearray(self.text())
692 arraytext = bytearray(self.text())
693 deltatext = mdiff.textdiff(
693 deltatext = mdiff.textdiff(
694 util.buffer(base), util.buffer(arraytext)
694 util.buffer(base), util.buffer(arraytext)
695 )
695 )
696
696
697 return arraytext, deltatext
697 return arraytext, deltatext
698
698
699
699
700 def _msearch(m, s, lo=0, hi=None):
700 def _msearch(m, s, lo=0, hi=None):
701 '''return a tuple (start, end) that says where to find s within m.
701 '''return a tuple (start, end) that says where to find s within m.
702
702
703 If the string is found m[start:end] are the line containing
703 If the string is found m[start:end] are the line containing
704 that string. If start == end the string was not found and
704 that string. If start == end the string was not found and
705 they indicate the proper sorted insertion point.
705 they indicate the proper sorted insertion point.
706
706
707 m should be a buffer, a memoryview or a byte string.
707 m should be a buffer, a memoryview or a byte string.
708 s is a byte string'''
708 s is a byte string'''
709
709
710 def advance(i, c):
710 def advance(i, c):
711 while i < lenm and m[i : i + 1] != c:
711 while i < lenm and m[i : i + 1] != c:
712 i += 1
712 i += 1
713 return i
713 return i
714
714
715 if not s:
715 if not s:
716 return (lo, lo)
716 return (lo, lo)
717 lenm = len(m)
717 lenm = len(m)
718 if not hi:
718 if not hi:
719 hi = lenm
719 hi = lenm
720 while lo < hi:
720 while lo < hi:
721 mid = (lo + hi) // 2
721 mid = (lo + hi) // 2
722 start = mid
722 start = mid
723 while start > 0 and m[start - 1 : start] != b'\n':
723 while start > 0 and m[start - 1 : start] != b'\n':
724 start -= 1
724 start -= 1
725 end = advance(start, b'\0')
725 end = advance(start, b'\0')
726 if bytes(m[start:end]) < s:
726 if bytes(m[start:end]) < s:
727 # we know that after the null there are 40 bytes of sha1
727 # we know that after the null there are 40 bytes of sha1
728 # this translates to the bisect lo = mid + 1
728 # this translates to the bisect lo = mid + 1
729 lo = advance(end + 40, b'\n') + 1
729 lo = advance(end + 40, b'\n') + 1
730 else:
730 else:
731 # this translates to the bisect hi = mid
731 # this translates to the bisect hi = mid
732 hi = start
732 hi = start
733 end = advance(lo, b'\0')
733 end = advance(lo, b'\0')
734 found = m[lo:end]
734 found = m[lo:end]
735 if s == found:
735 if s == found:
736 # we know that after the null there are 40 bytes of sha1
736 # we know that after the null there are 40 bytes of sha1
737 end = advance(end + 40, b'\n')
737 end = advance(end + 40, b'\n')
738 return (lo, end + 1)
738 return (lo, end + 1)
739 else:
739 else:
740 return (lo, lo)
740 return (lo, lo)
741
741
742
742
743 def _checkforbidden(l):
743 def _checkforbidden(l):
744 """Check filenames for illegal characters."""
744 """Check filenames for illegal characters."""
745 for f in l:
745 for f in l:
746 if b'\n' in f or b'\r' in f:
746 if b'\n' in f or b'\r' in f:
747 raise error.StorageError(
747 raise error.StorageError(
748 _(b"'\\n' and '\\r' disallowed in filenames: %r")
748 _(b"'\\n' and '\\r' disallowed in filenames: %r")
749 % pycompat.bytestr(f)
749 % pycompat.bytestr(f)
750 )
750 )
751
751
752
752
753 # apply the changes collected during the bisect loop to our addlist
753 # apply the changes collected during the bisect loop to our addlist
754 # return a delta suitable for addrevision
754 # return a delta suitable for addrevision
755 def _addlistdelta(addlist, x):
755 def _addlistdelta(addlist, x):
756 # for large addlist arrays, building a new array is cheaper
756 # for large addlist arrays, building a new array is cheaper
757 # than repeatedly modifying the existing one
757 # than repeatedly modifying the existing one
758 currentposition = 0
758 currentposition = 0
759 newaddlist = bytearray()
759 newaddlist = bytearray()
760
760
761 for start, end, content in x:
761 for start, end, content in x:
762 newaddlist += addlist[currentposition:start]
762 newaddlist += addlist[currentposition:start]
763 if content:
763 if content:
764 newaddlist += bytearray(content)
764 newaddlist += bytearray(content)
765
765
766 currentposition = end
766 currentposition = end
767
767
768 newaddlist += addlist[currentposition:]
768 newaddlist += addlist[currentposition:]
769
769
770 deltatext = b"".join(
770 deltatext = b"".join(
771 struct.pack(b">lll", start, end, len(content)) + content
771 struct.pack(b">lll", start, end, len(content)) + content
772 for start, end, content in x
772 for start, end, content in x
773 )
773 )
774 return deltatext, newaddlist
774 return deltatext, newaddlist
775
775
776
776
777 def _splittopdir(f):
777 def _splittopdir(f):
778 if b'/' in f:
778 if b'/' in f:
779 dir, subpath = f.split(b'/', 1)
779 dir, subpath = f.split(b'/', 1)
780 return dir + b'/', subpath
780 return dir + b'/', subpath
781 else:
781 else:
782 return b'', f
782 return b'', f
783
783
784
784
785 _noop = lambda s: None
785 _noop = lambda s: None
786
786
787
787
788 @interfaceutil.implementer(repository.imanifestdict)
788 @interfaceutil.implementer(repository.imanifestdict)
789 class treemanifest(object):
789 class treemanifest(object):
790 def __init__(self, dir=b'', text=b''):
790 def __init__(self, dir=b'', text=b''):
791 self._dir = dir
791 self._dir = dir
792 self._node = nullid
792 self._node = nullid
793 self._loadfunc = _noop
793 self._loadfunc = _noop
794 self._copyfunc = _noop
794 self._copyfunc = _noop
795 self._dirty = False
795 self._dirty = False
796 self._dirs = {}
796 self._dirs = {}
797 self._lazydirs = {}
797 self._lazydirs = {}
798 # Using _lazymanifest here is a little slower than plain old dicts
798 # Using _lazymanifest here is a little slower than plain old dicts
799 self._files = {}
799 self._files = {}
800 self._flags = {}
800 self._flags = {}
801 if text:
801 if text:
802
802
803 def readsubtree(subdir, subm):
803 def readsubtree(subdir, subm):
804 raise AssertionError(
804 raise AssertionError(
805 b'treemanifest constructor only accepts flat manifests'
805 b'treemanifest constructor only accepts flat manifests'
806 )
806 )
807
807
808 self.parse(text, readsubtree)
808 self.parse(text, readsubtree)
809 self._dirty = True # Mark flat manifest dirty after parsing
809 self._dirty = True # Mark flat manifest dirty after parsing
810
810
811 def _subpath(self, path):
811 def _subpath(self, path):
812 return self._dir + path
812 return self._dir + path
813
813
814 def _loadalllazy(self):
814 def _loadalllazy(self):
815 selfdirs = self._dirs
815 selfdirs = self._dirs
816 for d, (path, node, readsubtree, docopy) in pycompat.iteritems(
816 for d, (path, node, readsubtree, docopy) in pycompat.iteritems(
817 self._lazydirs
817 self._lazydirs
818 ):
818 ):
819 if docopy:
819 if docopy:
820 selfdirs[d] = readsubtree(path, node).copy()
820 selfdirs[d] = readsubtree(path, node).copy()
821 else:
821 else:
822 selfdirs[d] = readsubtree(path, node)
822 selfdirs[d] = readsubtree(path, node)
823 self._lazydirs = {}
823 self._lazydirs = {}
824
824
825 def _loadlazy(self, d):
825 def _loadlazy(self, d):
826 v = self._lazydirs.get(d)
826 v = self._lazydirs.get(d)
827 if v:
827 if v:
828 path, node, readsubtree, docopy = v
828 path, node, readsubtree, docopy = v
829 if docopy:
829 if docopy:
830 self._dirs[d] = readsubtree(path, node).copy()
830 self._dirs[d] = readsubtree(path, node).copy()
831 else:
831 else:
832 self._dirs[d] = readsubtree(path, node)
832 self._dirs[d] = readsubtree(path, node)
833 del self._lazydirs[d]
833 del self._lazydirs[d]
834
834
835 def _loadchildrensetlazy(self, visit):
835 def _loadchildrensetlazy(self, visit):
836 if not visit:
836 if not visit:
837 return None
837 return None
838 if visit == b'all' or visit == b'this':
838 if visit == b'all' or visit == b'this':
839 self._loadalllazy()
839 self._loadalllazy()
840 return None
840 return None
841
841
842 loadlazy = self._loadlazy
842 loadlazy = self._loadlazy
843 for k in visit:
843 for k in visit:
844 loadlazy(k + b'/')
844 loadlazy(k + b'/')
845 return visit
845 return visit
846
846
847 def _loaddifflazy(self, t1, t2):
847 def _loaddifflazy(self, t1, t2):
848 """load items in t1 and t2 if they're needed for diffing.
848 """load items in t1 and t2 if they're needed for diffing.
849
849
850 The criteria currently is:
850 The criteria currently is:
851 - if it's not present in _lazydirs in either t1 or t2, load it in the
851 - if it's not present in _lazydirs in either t1 or t2, load it in the
852 other (it may already be loaded or it may not exist, doesn't matter)
852 other (it may already be loaded or it may not exist, doesn't matter)
853 - if it's present in _lazydirs in both, compare the nodeid; if it
853 - if it's present in _lazydirs in both, compare the nodeid; if it
854 differs, load it in both
854 differs, load it in both
855 """
855 """
856 toloadlazy = []
856 toloadlazy = []
857 for d, v1 in pycompat.iteritems(t1._lazydirs):
857 for d, v1 in pycompat.iteritems(t1._lazydirs):
858 v2 = t2._lazydirs.get(d)
858 v2 = t2._lazydirs.get(d)
859 if not v2 or v2[1] != v1[1]:
859 if not v2 or v2[1] != v1[1]:
860 toloadlazy.append(d)
860 toloadlazy.append(d)
861 for d, v1 in pycompat.iteritems(t2._lazydirs):
861 for d, v1 in pycompat.iteritems(t2._lazydirs):
862 if d not in t1._lazydirs:
862 if d not in t1._lazydirs:
863 toloadlazy.append(d)
863 toloadlazy.append(d)
864
864
865 for d in toloadlazy:
865 for d in toloadlazy:
866 t1._loadlazy(d)
866 t1._loadlazy(d)
867 t2._loadlazy(d)
867 t2._loadlazy(d)
868
868
869 def __len__(self):
869 def __len__(self):
870 self._load()
870 self._load()
871 size = len(self._files)
871 size = len(self._files)
872 self._loadalllazy()
872 self._loadalllazy()
873 for m in self._dirs.values():
873 for m in self._dirs.values():
874 size += m.__len__()
874 size += m.__len__()
875 return size
875 return size
876
876
877 def __nonzero__(self):
877 def __nonzero__(self):
878 # Faster than "__len() != 0" since it avoids loading sub-manifests
878 # Faster than "__len() != 0" since it avoids loading sub-manifests
879 return not self._isempty()
879 return not self._isempty()
880
880
881 __bool__ = __nonzero__
881 __bool__ = __nonzero__
882
882
883 def _isempty(self):
883 def _isempty(self):
884 self._load() # for consistency; already loaded by all callers
884 self._load() # for consistency; already loaded by all callers
885 # See if we can skip loading everything.
885 # See if we can skip loading everything.
886 if self._files or (
886 if self._files or (
887 self._dirs and any(not m._isempty() for m in self._dirs.values())
887 self._dirs and any(not m._isempty() for m in self._dirs.values())
888 ):
888 ):
889 return False
889 return False
890 self._loadalllazy()
890 self._loadalllazy()
891 return not self._dirs or all(m._isempty() for m in self._dirs.values())
891 return not self._dirs or all(m._isempty() for m in self._dirs.values())
892
892
893 @encoding.strmethod
893 @encoding.strmethod
894 def __repr__(self):
894 def __repr__(self):
895 return (
895 return (
896 b'<treemanifest dir=%s, node=%s, loaded=%r, dirty=%r at 0x%x>'
896 b'<treemanifest dir=%s, node=%s, loaded=%r, dirty=%r at 0x%x>'
897 % (
897 % (
898 self._dir,
898 self._dir,
899 hex(self._node),
899 hex(self._node),
900 bool(self._loadfunc is _noop),
900 bool(self._loadfunc is _noop),
901 self._dirty,
901 self._dirty,
902 id(self),
902 id(self),
903 )
903 )
904 )
904 )
905
905
906 def dir(self):
906 def dir(self):
907 '''The directory that this tree manifest represents, including a
907 '''The directory that this tree manifest represents, including a
908 trailing '/'. Empty string for the repo root directory.'''
908 trailing '/'. Empty string for the repo root directory.'''
909 return self._dir
909 return self._dir
910
910
911 def node(self):
911 def node(self):
912 '''This node of this instance. nullid for unsaved instances. Should
912 '''This node of this instance. nullid for unsaved instances. Should
913 be updated when the instance is read or written from a revlog.
913 be updated when the instance is read or written from a revlog.
914 '''
914 '''
915 assert not self._dirty
915 assert not self._dirty
916 return self._node
916 return self._node
917
917
918 def setnode(self, node):
918 def setnode(self, node):
919 self._node = node
919 self._node = node
920 self._dirty = False
920 self._dirty = False
921
921
922 def iterentries(self):
922 def iterentries(self):
923 self._load()
923 self._load()
924 self._loadalllazy()
924 self._loadalllazy()
925 for p, n in sorted(
925 for p, n in sorted(
926 itertools.chain(self._dirs.items(), self._files.items())
926 itertools.chain(self._dirs.items(), self._files.items())
927 ):
927 ):
928 if p in self._files:
928 if p in self._files:
929 yield self._subpath(p), n, self._flags.get(p, b'')
929 yield self._subpath(p), n, self._flags.get(p, b'')
930 else:
930 else:
931 for x in n.iterentries():
931 for x in n.iterentries():
932 yield x
932 yield x
933
933
934 def items(self):
934 def items(self):
935 self._load()
935 self._load()
936 self._loadalllazy()
936 self._loadalllazy()
937 for p, n in sorted(
937 for p, n in sorted(
938 itertools.chain(self._dirs.items(), self._files.items())
938 itertools.chain(self._dirs.items(), self._files.items())
939 ):
939 ):
940 if p in self._files:
940 if p in self._files:
941 yield self._subpath(p), n
941 yield self._subpath(p), n
942 else:
942 else:
943 for f, sn in pycompat.iteritems(n):
943 for f, sn in pycompat.iteritems(n):
944 yield f, sn
944 yield f, sn
945
945
946 iteritems = items
946 iteritems = items
947
947
948 def iterkeys(self):
948 def iterkeys(self):
949 self._load()
949 self._load()
950 self._loadalllazy()
950 self._loadalllazy()
951 for p in sorted(itertools.chain(self._dirs, self._files)):
951 for p in sorted(itertools.chain(self._dirs, self._files)):
952 if p in self._files:
952 if p in self._files:
953 yield self._subpath(p)
953 yield self._subpath(p)
954 else:
954 else:
955 for f in self._dirs[p]:
955 for f in self._dirs[p]:
956 yield f
956 yield f
957
957
958 def keys(self):
958 def keys(self):
959 return list(self.iterkeys())
959 return list(self.iterkeys())
960
960
961 def __iter__(self):
961 def __iter__(self):
962 return self.iterkeys()
962 return self.iterkeys()
963
963
964 def __contains__(self, f):
964 def __contains__(self, f):
965 if f is None:
965 if f is None:
966 return False
966 return False
967 self._load()
967 self._load()
968 dir, subpath = _splittopdir(f)
968 dir, subpath = _splittopdir(f)
969 if dir:
969 if dir:
970 self._loadlazy(dir)
970 self._loadlazy(dir)
971
971
972 if dir not in self._dirs:
972 if dir not in self._dirs:
973 return False
973 return False
974
974
975 return self._dirs[dir].__contains__(subpath)
975 return self._dirs[dir].__contains__(subpath)
976 else:
976 else:
977 return f in self._files
977 return f in self._files
978
978
979 def get(self, f, default=None):
979 def get(self, f, default=None):
980 self._load()
980 self._load()
981 dir, subpath = _splittopdir(f)
981 dir, subpath = _splittopdir(f)
982 if dir:
982 if dir:
983 self._loadlazy(dir)
983 self._loadlazy(dir)
984
984
985 if dir not in self._dirs:
985 if dir not in self._dirs:
986 return default
986 return default
987 return self._dirs[dir].get(subpath, default)
987 return self._dirs[dir].get(subpath, default)
988 else:
988 else:
989 return self._files.get(f, default)
989 return self._files.get(f, default)
990
990
991 def __getitem__(self, f):
991 def __getitem__(self, f):
992 self._load()
992 self._load()
993 dir, subpath = _splittopdir(f)
993 dir, subpath = _splittopdir(f)
994 if dir:
994 if dir:
995 self._loadlazy(dir)
995 self._loadlazy(dir)
996
996
997 return self._dirs[dir].__getitem__(subpath)
997 return self._dirs[dir].__getitem__(subpath)
998 else:
998 else:
999 return self._files[f]
999 return self._files[f]
1000
1000
1001 def flags(self, f):
1001 def flags(self, f):
1002 self._load()
1002 self._load()
1003 dir, subpath = _splittopdir(f)
1003 dir, subpath = _splittopdir(f)
1004 if dir:
1004 if dir:
1005 self._loadlazy(dir)
1005 self._loadlazy(dir)
1006
1006
1007 if dir not in self._dirs:
1007 if dir not in self._dirs:
1008 return b''
1008 return b''
1009 return self._dirs[dir].flags(subpath)
1009 return self._dirs[dir].flags(subpath)
1010 else:
1010 else:
1011 if f in self._lazydirs or f in self._dirs:
1011 if f in self._lazydirs or f in self._dirs:
1012 return b''
1012 return b''
1013 return self._flags.get(f, b'')
1013 return self._flags.get(f, b'')
1014
1014
1015 def find(self, f):
1015 def find(self, f):
1016 self._load()
1016 self._load()
1017 dir, subpath = _splittopdir(f)
1017 dir, subpath = _splittopdir(f)
1018 if dir:
1018 if dir:
1019 self._loadlazy(dir)
1019 self._loadlazy(dir)
1020
1020
1021 return self._dirs[dir].find(subpath)
1021 return self._dirs[dir].find(subpath)
1022 else:
1022 else:
1023 return self._files[f], self._flags.get(f, b'')
1023 return self._files[f], self._flags.get(f, b'')
1024
1024
1025 def __delitem__(self, f):
1025 def __delitem__(self, f):
1026 self._load()
1026 self._load()
1027 dir, subpath = _splittopdir(f)
1027 dir, subpath = _splittopdir(f)
1028 if dir:
1028 if dir:
1029 self._loadlazy(dir)
1029 self._loadlazy(dir)
1030
1030
1031 self._dirs[dir].__delitem__(subpath)
1031 self._dirs[dir].__delitem__(subpath)
1032 # If the directory is now empty, remove it
1032 # If the directory is now empty, remove it
1033 if self._dirs[dir]._isempty():
1033 if self._dirs[dir]._isempty():
1034 del self._dirs[dir]
1034 del self._dirs[dir]
1035 else:
1035 else:
1036 del self._files[f]
1036 del self._files[f]
1037 if f in self._flags:
1037 if f in self._flags:
1038 del self._flags[f]
1038 del self._flags[f]
1039 self._dirty = True
1039 self._dirty = True
1040
1040
1041 def __setitem__(self, f, n):
1041 def __setitem__(self, f, n):
1042 assert n is not None
1042 assert n is not None
1043 self._load()
1043 self._load()
1044 dir, subpath = _splittopdir(f)
1044 dir, subpath = _splittopdir(f)
1045 if dir:
1045 if dir:
1046 self._loadlazy(dir)
1046 self._loadlazy(dir)
1047 if dir not in self._dirs:
1047 if dir not in self._dirs:
1048 self._dirs[dir] = treemanifest(self._subpath(dir))
1048 self._dirs[dir] = treemanifest(self._subpath(dir))
1049 self._dirs[dir].__setitem__(subpath, n)
1049 self._dirs[dir].__setitem__(subpath, n)
1050 else:
1050 else:
1051 # manifest nodes are either 20 bytes or 32 bytes,
1051 # manifest nodes are either 20 bytes or 32 bytes,
1052 # depending on the hash in use. An extra byte is
1052 # depending on the hash in use. An extra byte is
1053 # occasionally used by hg, but won't ever be
1053 # occasionally used by hg, but won't ever be
1054 # persisted. Trim to 21 or 33 bytes as appropriate.
1054 # persisted. Trim to 21 or 33 bytes as appropriate.
1055 trim = 21 if len(n) < 25 else 33
1055 trim = 21 if len(n) < 25 else 33
1056 self._files[f] = n[:trim] # to match manifestdict's behavior
1056 self._files[f] = n[:trim] # to match manifestdict's behavior
1057 self._dirty = True
1057 self._dirty = True
1058
1058
1059 def _load(self):
1059 def _load(self):
1060 if self._loadfunc is not _noop:
1060 if self._loadfunc is not _noop:
1061 lf, self._loadfunc = self._loadfunc, _noop
1061 lf, self._loadfunc = self._loadfunc, _noop
1062 lf(self)
1062 lf(self)
1063 elif self._copyfunc is not _noop:
1063 elif self._copyfunc is not _noop:
1064 cf, self._copyfunc = self._copyfunc, _noop
1064 cf, self._copyfunc = self._copyfunc, _noop
1065 cf(self)
1065 cf(self)
1066
1066
1067 def setflag(self, f, flags):
1067 def setflag(self, f, flags):
1068 """Set the flags (symlink, executable) for path f."""
1068 """Set the flags (symlink, executable) for path f."""
1069 self._load()
1069 self._load()
1070 dir, subpath = _splittopdir(f)
1070 dir, subpath = _splittopdir(f)
1071 if dir:
1071 if dir:
1072 self._loadlazy(dir)
1072 self._loadlazy(dir)
1073 if dir not in self._dirs:
1073 if dir not in self._dirs:
1074 self._dirs[dir] = treemanifest(self._subpath(dir))
1074 self._dirs[dir] = treemanifest(self._subpath(dir))
1075 self._dirs[dir].setflag(subpath, flags)
1075 self._dirs[dir].setflag(subpath, flags)
1076 else:
1076 else:
1077 self._flags[f] = flags
1077 self._flags[f] = flags
1078 self._dirty = True
1078 self._dirty = True
1079
1079
1080 def copy(self):
1080 def copy(self):
1081 copy = treemanifest(self._dir)
1081 copy = treemanifest(self._dir)
1082 copy._node = self._node
1082 copy._node = self._node
1083 copy._dirty = self._dirty
1083 copy._dirty = self._dirty
1084 if self._copyfunc is _noop:
1084 if self._copyfunc is _noop:
1085
1085
1086 def _copyfunc(s):
1086 def _copyfunc(s):
1087 self._load()
1087 self._load()
1088 s._lazydirs = {
1088 s._lazydirs = {
1089 d: (p, n, r, True)
1089 d: (p, n, r, True)
1090 for d, (p, n, r, c) in pycompat.iteritems(self._lazydirs)
1090 for d, (p, n, r, c) in pycompat.iteritems(self._lazydirs)
1091 }
1091 }
1092 sdirs = s._dirs
1092 sdirs = s._dirs
1093 for d, v in pycompat.iteritems(self._dirs):
1093 for d, v in pycompat.iteritems(self._dirs):
1094 sdirs[d] = v.copy()
1094 sdirs[d] = v.copy()
1095 s._files = dict.copy(self._files)
1095 s._files = dict.copy(self._files)
1096 s._flags = dict.copy(self._flags)
1096 s._flags = dict.copy(self._flags)
1097
1097
1098 if self._loadfunc is _noop:
1098 if self._loadfunc is _noop:
1099 _copyfunc(copy)
1099 _copyfunc(copy)
1100 else:
1100 else:
1101 copy._copyfunc = _copyfunc
1101 copy._copyfunc = _copyfunc
1102 else:
1102 else:
1103 copy._copyfunc = self._copyfunc
1103 copy._copyfunc = self._copyfunc
1104 return copy
1104 return copy
1105
1105
1106 def filesnotin(self, m2, match=None):
1106 def filesnotin(self, m2, match=None):
1107 '''Set of files in this manifest that are not in the other'''
1107 '''Set of files in this manifest that are not in the other'''
1108 if match and not match.always():
1108 if match and not match.always():
1109 m1 = self._matches(match)
1109 m1 = self._matches(match)
1110 m2 = m2._matches(match)
1110 m2 = m2._matches(match)
1111 return m1.filesnotin(m2)
1111 return m1.filesnotin(m2)
1112
1112
1113 files = set()
1113 files = set()
1114
1114
1115 def _filesnotin(t1, t2):
1115 def _filesnotin(t1, t2):
1116 if t1._node == t2._node and not t1._dirty and not t2._dirty:
1116 if t1._node == t2._node and not t1._dirty and not t2._dirty:
1117 return
1117 return
1118 t1._load()
1118 t1._load()
1119 t2._load()
1119 t2._load()
1120 self._loaddifflazy(t1, t2)
1120 self._loaddifflazy(t1, t2)
1121 for d, m1 in pycompat.iteritems(t1._dirs):
1121 for d, m1 in pycompat.iteritems(t1._dirs):
1122 if d in t2._dirs:
1122 if d in t2._dirs:
1123 m2 = t2._dirs[d]
1123 m2 = t2._dirs[d]
1124 _filesnotin(m1, m2)
1124 _filesnotin(m1, m2)
1125 else:
1125 else:
1126 files.update(m1.iterkeys())
1126 files.update(m1.iterkeys())
1127
1127
1128 for fn in t1._files:
1128 for fn in t1._files:
1129 if fn not in t2._files:
1129 if fn not in t2._files:
1130 files.add(t1._subpath(fn))
1130 files.add(t1._subpath(fn))
1131
1131
1132 _filesnotin(self, m2)
1132 _filesnotin(self, m2)
1133 return files
1133 return files
1134
1134
1135 @propertycache
1135 @propertycache
1136 def _alldirs(self):
1136 def _alldirs(self):
1137 return pathutil.dirs(self)
1137 return pathutil.dirs(self)
1138
1138
1139 def dirs(self):
1139 def dirs(self):
1140 return self._alldirs
1140 return self._alldirs
1141
1141
1142 def hasdir(self, dir):
1142 def hasdir(self, dir):
1143 self._load()
1143 self._load()
1144 topdir, subdir = _splittopdir(dir)
1144 topdir, subdir = _splittopdir(dir)
1145 if topdir:
1145 if topdir:
1146 self._loadlazy(topdir)
1146 self._loadlazy(topdir)
1147 if topdir in self._dirs:
1147 if topdir in self._dirs:
1148 return self._dirs[topdir].hasdir(subdir)
1148 return self._dirs[topdir].hasdir(subdir)
1149 return False
1149 return False
1150 dirslash = dir + b'/'
1150 dirslash = dir + b'/'
1151 return dirslash in self._dirs or dirslash in self._lazydirs
1151 return dirslash in self._dirs or dirslash in self._lazydirs
1152
1152
1153 def walk(self, match):
1153 def walk(self, match):
1154 '''Generates matching file names.
1154 '''Generates matching file names.
1155
1155
1156 It also reports nonexistent files by marking them bad with match.bad().
1156 It also reports nonexistent files by marking them bad with match.bad().
1157 '''
1157 '''
1158 if match.always():
1158 if match.always():
1159 for f in iter(self):
1159 for f in iter(self):
1160 yield f
1160 yield f
1161 return
1161 return
1162
1162
1163 fset = set(match.files())
1163 fset = set(match.files())
1164
1164
1165 for fn in self._walk(match):
1165 for fn in self._walk(match):
1166 if fn in fset:
1166 if fn in fset:
1167 # specified pattern is the exact name
1167 # specified pattern is the exact name
1168 fset.remove(fn)
1168 fset.remove(fn)
1169 yield fn
1169 yield fn
1170
1170
1171 # for dirstate.walk, files=[''] means "walk the whole tree".
1171 # for dirstate.walk, files=[''] means "walk the whole tree".
1172 # follow that here, too
1172 # follow that here, too
1173 fset.discard(b'')
1173 fset.discard(b'')
1174
1174
1175 for fn in sorted(fset):
1175 for fn in sorted(fset):
1176 if not self.hasdir(fn):
1176 if not self.hasdir(fn):
1177 match.bad(fn, None)
1177 match.bad(fn, None)
1178
1178
1179 def _walk(self, match):
1179 def _walk(self, match):
1180 '''Recursively generates matching file names for walk().'''
1180 '''Recursively generates matching file names for walk().'''
1181 visit = match.visitchildrenset(self._dir[:-1])
1181 visit = match.visitchildrenset(self._dir[:-1])
1182 if not visit:
1182 if not visit:
1183 return
1183 return
1184
1184
1185 # yield this dir's files and walk its submanifests
1185 # yield this dir's files and walk its submanifests
1186 self._load()
1186 self._load()
1187 visit = self._loadchildrensetlazy(visit)
1187 visit = self._loadchildrensetlazy(visit)
1188 for p in sorted(list(self._dirs) + list(self._files)):
1188 for p in sorted(list(self._dirs) + list(self._files)):
1189 if p in self._files:
1189 if p in self._files:
1190 fullp = self._subpath(p)
1190 fullp = self._subpath(p)
1191 if match(fullp):
1191 if match(fullp):
1192 yield fullp
1192 yield fullp
1193 else:
1193 else:
1194 if not visit or p[:-1] in visit:
1194 if not visit or p[:-1] in visit:
1195 for f in self._dirs[p]._walk(match):
1195 for f in self._dirs[p]._walk(match):
1196 yield f
1196 yield f
1197
1197
1198 def _matches(self, match):
1198 def _matches(self, match):
1199 '''recursively generate a new manifest filtered by the match argument.
1199 '''recursively generate a new manifest filtered by the match argument.
1200 '''
1200 '''
1201 if match.always():
1201 if match.always():
1202 return self.copy()
1202 return self.copy()
1203 return self._matches_inner(match)
1203 return self._matches_inner(match)
1204
1204
1205 def _matches_inner(self, match):
1205 def _matches_inner(self, match):
1206 if match.always():
1206 if match.always():
1207 return self.copy()
1207 return self.copy()
1208
1208
1209 visit = match.visitchildrenset(self._dir[:-1])
1209 visit = match.visitchildrenset(self._dir[:-1])
1210 if visit == b'all':
1210 if visit == b'all':
1211 return self.copy()
1211 return self.copy()
1212 ret = treemanifest(self._dir)
1212 ret = treemanifest(self._dir)
1213 if not visit:
1213 if not visit:
1214 return ret
1214 return ret
1215
1215
1216 self._load()
1216 self._load()
1217 for fn in self._files:
1217 for fn in self._files:
1218 # While visitchildrenset *usually* lists only subdirs, this is
1218 # While visitchildrenset *usually* lists only subdirs, this is
1219 # actually up to the matcher and may have some files in the set().
1219 # actually up to the matcher and may have some files in the set().
1220 # If visit == 'this', we should obviously look at the files in this
1220 # If visit == 'this', we should obviously look at the files in this
1221 # directory; if visit is a set, and fn is in it, we should inspect
1221 # directory; if visit is a set, and fn is in it, we should inspect
1222 # fn (but no need to inspect things not in the set).
1222 # fn (but no need to inspect things not in the set).
1223 if visit != b'this' and fn not in visit:
1223 if visit != b'this' and fn not in visit:
1224 continue
1224 continue
1225 fullp = self._subpath(fn)
1225 fullp = self._subpath(fn)
1226 # visitchildrenset isn't perfect, we still need to call the regular
1226 # visitchildrenset isn't perfect, we still need to call the regular
1227 # matcher code to further filter results.
1227 # matcher code to further filter results.
1228 if not match(fullp):
1228 if not match(fullp):
1229 continue
1229 continue
1230 ret._files[fn] = self._files[fn]
1230 ret._files[fn] = self._files[fn]
1231 if fn in self._flags:
1231 if fn in self._flags:
1232 ret._flags[fn] = self._flags[fn]
1232 ret._flags[fn] = self._flags[fn]
1233
1233
1234 visit = self._loadchildrensetlazy(visit)
1234 visit = self._loadchildrensetlazy(visit)
1235 for dir, subm in pycompat.iteritems(self._dirs):
1235 for dir, subm in pycompat.iteritems(self._dirs):
1236 if visit and dir[:-1] not in visit:
1236 if visit and dir[:-1] not in visit:
1237 continue
1237 continue
1238 m = subm._matches_inner(match)
1238 m = subm._matches_inner(match)
1239 if not m._isempty():
1239 if not m._isempty():
1240 ret._dirs[dir] = m
1240 ret._dirs[dir] = m
1241
1241
1242 if not ret._isempty():
1242 if not ret._isempty():
1243 ret._dirty = True
1243 ret._dirty = True
1244 return ret
1244 return ret
1245
1245
1246 def fastdelta(self, base, changes):
1246 def fastdelta(self, base, changes):
1247 raise FastdeltaUnavailable()
1247 raise FastdeltaUnavailable()
1248
1248
1249 def diff(self, m2, match=None, clean=False):
1249 def diff(self, m2, match=None, clean=False):
1250 '''Finds changes between the current manifest and m2.
1250 '''Finds changes between the current manifest and m2.
1251
1251
1252 Args:
1252 Args:
1253 m2: the manifest to which this manifest should be compared.
1253 m2: the manifest to which this manifest should be compared.
1254 clean: if true, include files unchanged between these manifests
1254 clean: if true, include files unchanged between these manifests
1255 with a None value in the returned dictionary.
1255 with a None value in the returned dictionary.
1256
1256
1257 The result is returned as a dict with filename as key and
1257 The result is returned as a dict with filename as key and
1258 values of the form ((n1,fl1),(n2,fl2)), where n1/n2 is the
1258 values of the form ((n1,fl1),(n2,fl2)), where n1/n2 is the
1259 nodeid in the current/other manifest and fl1/fl2 is the flag
1259 nodeid in the current/other manifest and fl1/fl2 is the flag
1260 in the current/other manifest. Where the file does not exist,
1260 in the current/other manifest. Where the file does not exist,
1261 the nodeid will be None and the flags will be the empty
1261 the nodeid will be None and the flags will be the empty
1262 string.
1262 string.
1263 '''
1263 '''
1264 if match and not match.always():
1264 if match and not match.always():
1265 m1 = self._matches(match)
1265 m1 = self._matches(match)
1266 m2 = m2._matches(match)
1266 m2 = m2._matches(match)
1267 return m1.diff(m2, clean=clean)
1267 return m1.diff(m2, clean=clean)
1268 result = {}
1268 result = {}
1269 emptytree = treemanifest()
1269 emptytree = treemanifest()
1270
1270
1271 def _iterativediff(t1, t2, stack):
1271 def _iterativediff(t1, t2, stack):
1272 """compares two tree manifests and append new tree-manifests which
1272 """compares two tree manifests and append new tree-manifests which
1273 needs to be compared to stack"""
1273 needs to be compared to stack"""
1274 if t1._node == t2._node and not t1._dirty and not t2._dirty:
1274 if t1._node == t2._node and not t1._dirty and not t2._dirty:
1275 return
1275 return
1276 t1._load()
1276 t1._load()
1277 t2._load()
1277 t2._load()
1278 self._loaddifflazy(t1, t2)
1278 self._loaddifflazy(t1, t2)
1279
1279
1280 for d, m1 in pycompat.iteritems(t1._dirs):
1280 for d, m1 in pycompat.iteritems(t1._dirs):
1281 m2 = t2._dirs.get(d, emptytree)
1281 m2 = t2._dirs.get(d, emptytree)
1282 stack.append((m1, m2))
1282 stack.append((m1, m2))
1283
1283
1284 for d, m2 in pycompat.iteritems(t2._dirs):
1284 for d, m2 in pycompat.iteritems(t2._dirs):
1285 if d not in t1._dirs:
1285 if d not in t1._dirs:
1286 stack.append((emptytree, m2))
1286 stack.append((emptytree, m2))
1287
1287
1288 for fn, n1 in pycompat.iteritems(t1._files):
1288 for fn, n1 in pycompat.iteritems(t1._files):
1289 fl1 = t1._flags.get(fn, b'')
1289 fl1 = t1._flags.get(fn, b'')
1290 n2 = t2._files.get(fn, None)
1290 n2 = t2._files.get(fn, None)
1291 fl2 = t2._flags.get(fn, b'')
1291 fl2 = t2._flags.get(fn, b'')
1292 if n1 != n2 or fl1 != fl2:
1292 if n1 != n2 or fl1 != fl2:
1293 result[t1._subpath(fn)] = ((n1, fl1), (n2, fl2))
1293 result[t1._subpath(fn)] = ((n1, fl1), (n2, fl2))
1294 elif clean:
1294 elif clean:
1295 result[t1._subpath(fn)] = None
1295 result[t1._subpath(fn)] = None
1296
1296
1297 for fn, n2 in pycompat.iteritems(t2._files):
1297 for fn, n2 in pycompat.iteritems(t2._files):
1298 if fn not in t1._files:
1298 if fn not in t1._files:
1299 fl2 = t2._flags.get(fn, b'')
1299 fl2 = t2._flags.get(fn, b'')
1300 result[t2._subpath(fn)] = ((None, b''), (n2, fl2))
1300 result[t2._subpath(fn)] = ((None, b''), (n2, fl2))
1301
1301
1302 stackls = []
1302 stackls = []
1303 _iterativediff(self, m2, stackls)
1303 _iterativediff(self, m2, stackls)
1304 while stackls:
1304 while stackls:
1305 t1, t2 = stackls.pop()
1305 t1, t2 = stackls.pop()
1306 # stackls is populated in the function call
1306 # stackls is populated in the function call
1307 _iterativediff(t1, t2, stackls)
1307 _iterativediff(t1, t2, stackls)
1308 return result
1308 return result
1309
1309
1310 def unmodifiedsince(self, m2):
1310 def unmodifiedsince(self, m2):
1311 return not self._dirty and not m2._dirty and self._node == m2._node
1311 return not self._dirty and not m2._dirty and self._node == m2._node
1312
1312
1313 def parse(self, text, readsubtree):
1313 def parse(self, text, readsubtree):
1314 selflazy = self._lazydirs
1314 selflazy = self._lazydirs
1315 subpath = self._subpath
1315 subpath = self._subpath
1316 for f, n, fl in _parse(text):
1316 for f, n, fl in _parse(text):
1317 if fl == b't':
1317 if fl == b't':
1318 f = f + b'/'
1318 f = f + b'/'
1319 # False below means "doesn't need to be copied" and can use the
1319 # False below means "doesn't need to be copied" and can use the
1320 # cached value from readsubtree directly.
1320 # cached value from readsubtree directly.
1321 selflazy[f] = (subpath(f), n, readsubtree, False)
1321 selflazy[f] = (subpath(f), n, readsubtree, False)
1322 elif b'/' in f:
1322 elif b'/' in f:
1323 # This is a flat manifest, so use __setitem__ and setflag rather
1323 # This is a flat manifest, so use __setitem__ and setflag rather
1324 # than assigning directly to _files and _flags, so we can
1324 # than assigning directly to _files and _flags, so we can
1325 # assign a path in a subdirectory, and to mark dirty (compared
1325 # assign a path in a subdirectory, and to mark dirty (compared
1326 # to nullid).
1326 # to nullid).
1327 self[f] = n
1327 self[f] = n
1328 if fl:
1328 if fl:
1329 self.setflag(f, fl)
1329 self.setflag(f, fl)
1330 else:
1330 else:
1331 # Assigning to _files and _flags avoids marking as dirty,
1331 # Assigning to _files and _flags avoids marking as dirty,
1332 # and should be a little faster.
1332 # and should be a little faster.
1333 self._files[f] = n
1333 self._files[f] = n
1334 if fl:
1334 if fl:
1335 self._flags[f] = fl
1335 self._flags[f] = fl
1336
1336
1337 def text(self):
1337 def text(self):
1338 """Get the full data of this manifest as a bytestring."""
1338 """Get the full data of this manifest as a bytestring."""
1339 self._load()
1339 self._load()
1340 return _text(self.iterentries())
1340 return _text(self.iterentries())
1341
1341
1342 def dirtext(self):
1342 def dirtext(self):
1343 """Get the full data of this directory as a bytestring. Make sure that
1343 """Get the full data of this directory as a bytestring. Make sure that
1344 any submanifests have been written first, so their nodeids are correct.
1344 any submanifests have been written first, so their nodeids are correct.
1345 """
1345 """
1346 self._load()
1346 self._load()
1347 flags = self.flags
1347 flags = self.flags
1348 lazydirs = [
1348 lazydirs = [
1349 (d[:-1], v[1], b't') for d, v in pycompat.iteritems(self._lazydirs)
1349 (d[:-1], v[1], b't') for d, v in pycompat.iteritems(self._lazydirs)
1350 ]
1350 ]
1351 dirs = [(d[:-1], self._dirs[d]._node, b't') for d in self._dirs]
1351 dirs = [(d[:-1], self._dirs[d]._node, b't') for d in self._dirs]
1352 files = [(f, self._files[f], flags(f)) for f in self._files]
1352 files = [(f, self._files[f], flags(f)) for f in self._files]
1353 return _text(sorted(dirs + files + lazydirs))
1353 return _text(sorted(dirs + files + lazydirs))
1354
1354
1355 def read(self, gettext, readsubtree):
1355 def read(self, gettext, readsubtree):
1356 def _load_for_read(s):
1356 def _load_for_read(s):
1357 s.parse(gettext(), readsubtree)
1357 s.parse(gettext(), readsubtree)
1358 s._dirty = False
1358 s._dirty = False
1359
1359
1360 self._loadfunc = _load_for_read
1360 self._loadfunc = _load_for_read
1361
1361
1362 def writesubtrees(self, m1, m2, writesubtree, match):
1362 def writesubtrees(self, m1, m2, writesubtree, match):
1363 self._load() # for consistency; should never have any effect here
1363 self._load() # for consistency; should never have any effect here
1364 m1._load()
1364 m1._load()
1365 m2._load()
1365 m2._load()
1366 emptytree = treemanifest()
1366 emptytree = treemanifest()
1367
1367
1368 def getnode(m, d):
1368 def getnode(m, d):
1369 ld = m._lazydirs.get(d)
1369 ld = m._lazydirs.get(d)
1370 if ld:
1370 if ld:
1371 return ld[1]
1371 return ld[1]
1372 return m._dirs.get(d, emptytree)._node
1372 return m._dirs.get(d, emptytree)._node
1373
1373
1374 # let's skip investigating things that `match` says we do not need.
1374 # let's skip investigating things that `match` says we do not need.
1375 visit = match.visitchildrenset(self._dir[:-1])
1375 visit = match.visitchildrenset(self._dir[:-1])
1376 visit = self._loadchildrensetlazy(visit)
1376 visit = self._loadchildrensetlazy(visit)
1377 if visit == b'this' or visit == b'all':
1377 if visit == b'this' or visit == b'all':
1378 visit = None
1378 visit = None
1379 for d, subm in pycompat.iteritems(self._dirs):
1379 for d, subm in pycompat.iteritems(self._dirs):
1380 if visit and d[:-1] not in visit:
1380 if visit and d[:-1] not in visit:
1381 continue
1381 continue
1382 subp1 = getnode(m1, d)
1382 subp1 = getnode(m1, d)
1383 subp2 = getnode(m2, d)
1383 subp2 = getnode(m2, d)
1384 if subp1 == nullid:
1384 if subp1 == nullid:
1385 subp1, subp2 = subp2, subp1
1385 subp1, subp2 = subp2, subp1
1386 writesubtree(subm, subp1, subp2, match)
1386 writesubtree(subm, subp1, subp2, match)
1387
1387
1388 def walksubtrees(self, matcher=None):
1388 def walksubtrees(self, matcher=None):
1389 """Returns an iterator of the subtrees of this manifest, including this
1389 """Returns an iterator of the subtrees of this manifest, including this
1390 manifest itself.
1390 manifest itself.
1391
1391
1392 If `matcher` is provided, it only returns subtrees that match.
1392 If `matcher` is provided, it only returns subtrees that match.
1393 """
1393 """
1394 if matcher and not matcher.visitdir(self._dir[:-1]):
1394 if matcher and not matcher.visitdir(self._dir[:-1]):
1395 return
1395 return
1396 if not matcher or matcher(self._dir[:-1]):
1396 if not matcher or matcher(self._dir[:-1]):
1397 yield self
1397 yield self
1398
1398
1399 self._load()
1399 self._load()
1400 # OPT: use visitchildrenset to avoid loading everything.
1400 # OPT: use visitchildrenset to avoid loading everything.
1401 self._loadalllazy()
1401 self._loadalllazy()
1402 for d, subm in pycompat.iteritems(self._dirs):
1402 for d, subm in pycompat.iteritems(self._dirs):
1403 for subtree in subm.walksubtrees(matcher=matcher):
1403 for subtree in subm.walksubtrees(matcher=matcher):
1404 yield subtree
1404 yield subtree
1405
1405
1406
1406
1407 class manifestfulltextcache(util.lrucachedict):
1407 class manifestfulltextcache(util.lrucachedict):
1408 """File-backed LRU cache for the manifest cache
1408 """File-backed LRU cache for the manifest cache
1409
1409
1410 File consists of entries, up to EOF:
1410 File consists of entries, up to EOF:
1411
1411
1412 - 20 bytes node, 4 bytes length, <length> manifest data
1412 - 20 bytes node, 4 bytes length, <length> manifest data
1413
1413
1414 These are written in reverse cache order (oldest to newest).
1414 These are written in reverse cache order (oldest to newest).
1415
1415
1416 """
1416 """
1417
1417
1418 _file = b'manifestfulltextcache'
1418 _file = b'manifestfulltextcache'
1419
1419
1420 def __init__(self, max):
1420 def __init__(self, max):
1421 super(manifestfulltextcache, self).__init__(max)
1421 super(manifestfulltextcache, self).__init__(max)
1422 self._dirty = False
1422 self._dirty = False
1423 self._read = False
1423 self._read = False
1424 self._opener = None
1424 self._opener = None
1425
1425
1426 def read(self):
1426 def read(self):
1427 if self._read or self._opener is None:
1427 if self._read or self._opener is None:
1428 return
1428 return
1429
1429
1430 try:
1430 try:
1431 with self._opener(self._file) as fp:
1431 with self._opener(self._file) as fp:
1432 set = super(manifestfulltextcache, self).__setitem__
1432 set = super(manifestfulltextcache, self).__setitem__
1433 # ignore trailing data, this is a cache, corruption is skipped
1433 # ignore trailing data, this is a cache, corruption is skipped
1434 while True:
1434 while True:
1435 # TODO do we need to do work here for sha1 portability?
1435 node = fp.read(20)
1436 node = fp.read(20)
1436 if len(node) < 20:
1437 if len(node) < 20:
1437 break
1438 break
1438 try:
1439 try:
1439 size = struct.unpack(b'>L', fp.read(4))[0]
1440 size = struct.unpack(b'>L', fp.read(4))[0]
1440 except struct.error:
1441 except struct.error:
1441 break
1442 break
1442 value = bytearray(fp.read(size))
1443 value = bytearray(fp.read(size))
1443 if len(value) != size:
1444 if len(value) != size:
1444 break
1445 break
1445 set(node, value)
1446 set(node, value)
1446 except IOError:
1447 except IOError:
1447 # the file is allowed to be missing
1448 # the file is allowed to be missing
1448 pass
1449 pass
1449
1450
1450 self._read = True
1451 self._read = True
1451 self._dirty = False
1452 self._dirty = False
1452
1453
1453 def write(self):
1454 def write(self):
1454 if not self._dirty or self._opener is None:
1455 if not self._dirty or self._opener is None:
1455 return
1456 return
1456 # rotate backwards to the first used node
1457 # rotate backwards to the first used node
1457 with self._opener(
1458 with self._opener(
1458 self._file, b'w', atomictemp=True, checkambig=True
1459 self._file, b'w', atomictemp=True, checkambig=True
1459 ) as fp:
1460 ) as fp:
1460 node = self._head.prev
1461 node = self._head.prev
1461 while True:
1462 while True:
1462 if node.key in self._cache:
1463 if node.key in self._cache:
1463 fp.write(node.key)
1464 fp.write(node.key)
1464 fp.write(struct.pack(b'>L', len(node.value)))
1465 fp.write(struct.pack(b'>L', len(node.value)))
1465 fp.write(node.value)
1466 fp.write(node.value)
1466 if node is self._head:
1467 if node is self._head:
1467 break
1468 break
1468 node = node.prev
1469 node = node.prev
1469
1470
1470 def __len__(self):
1471 def __len__(self):
1471 if not self._read:
1472 if not self._read:
1472 self.read()
1473 self.read()
1473 return super(manifestfulltextcache, self).__len__()
1474 return super(manifestfulltextcache, self).__len__()
1474
1475
1475 def __contains__(self, k):
1476 def __contains__(self, k):
1476 if not self._read:
1477 if not self._read:
1477 self.read()
1478 self.read()
1478 return super(manifestfulltextcache, self).__contains__(k)
1479 return super(manifestfulltextcache, self).__contains__(k)
1479
1480
1480 def __iter__(self):
1481 def __iter__(self):
1481 if not self._read:
1482 if not self._read:
1482 self.read()
1483 self.read()
1483 return super(manifestfulltextcache, self).__iter__()
1484 return super(manifestfulltextcache, self).__iter__()
1484
1485
1485 def __getitem__(self, k):
1486 def __getitem__(self, k):
1486 if not self._read:
1487 if not self._read:
1487 self.read()
1488 self.read()
1488 # the cache lru order can change on read
1489 # the cache lru order can change on read
1489 setdirty = self._cache.get(k) is not self._head
1490 setdirty = self._cache.get(k) is not self._head
1490 value = super(manifestfulltextcache, self).__getitem__(k)
1491 value = super(manifestfulltextcache, self).__getitem__(k)
1491 if setdirty:
1492 if setdirty:
1492 self._dirty = True
1493 self._dirty = True
1493 return value
1494 return value
1494
1495
1495 def __setitem__(self, k, v):
1496 def __setitem__(self, k, v):
1496 if not self._read:
1497 if not self._read:
1497 self.read()
1498 self.read()
1498 super(manifestfulltextcache, self).__setitem__(k, v)
1499 super(manifestfulltextcache, self).__setitem__(k, v)
1499 self._dirty = True
1500 self._dirty = True
1500
1501
1501 def __delitem__(self, k):
1502 def __delitem__(self, k):
1502 if not self._read:
1503 if not self._read:
1503 self.read()
1504 self.read()
1504 super(manifestfulltextcache, self).__delitem__(k)
1505 super(manifestfulltextcache, self).__delitem__(k)
1505 self._dirty = True
1506 self._dirty = True
1506
1507
1507 def get(self, k, default=None):
1508 def get(self, k, default=None):
1508 if not self._read:
1509 if not self._read:
1509 self.read()
1510 self.read()
1510 return super(manifestfulltextcache, self).get(k, default=default)
1511 return super(manifestfulltextcache, self).get(k, default=default)
1511
1512
1512 def clear(self, clear_persisted_data=False):
1513 def clear(self, clear_persisted_data=False):
1513 super(manifestfulltextcache, self).clear()
1514 super(manifestfulltextcache, self).clear()
1514 if clear_persisted_data:
1515 if clear_persisted_data:
1515 self._dirty = True
1516 self._dirty = True
1516 self.write()
1517 self.write()
1517 self._read = False
1518 self._read = False
1518
1519
1519
1520
1520 # and upper bound of what we expect from compression
1521 # and upper bound of what we expect from compression
1521 # (real live value seems to be "3")
1522 # (real live value seems to be "3")
1522 MAXCOMPRESSION = 3
1523 MAXCOMPRESSION = 3
1523
1524
1524
1525
1525 class FastdeltaUnavailable(Exception):
1526 class FastdeltaUnavailable(Exception):
1526 """Exception raised when fastdelta isn't usable on a manifest."""
1527 """Exception raised when fastdelta isn't usable on a manifest."""
1527
1528
1528
1529
1529 @interfaceutil.implementer(repository.imanifeststorage)
1530 @interfaceutil.implementer(repository.imanifeststorage)
1530 class manifestrevlog(object):
1531 class manifestrevlog(object):
1531 '''A revlog that stores manifest texts. This is responsible for caching the
1532 '''A revlog that stores manifest texts. This is responsible for caching the
1532 full-text manifest contents.
1533 full-text manifest contents.
1533 '''
1534 '''
1534
1535
1535 def __init__(
1536 def __init__(
1536 self,
1537 self,
1537 opener,
1538 opener,
1538 tree=b'',
1539 tree=b'',
1539 dirlogcache=None,
1540 dirlogcache=None,
1540 indexfile=None,
1541 indexfile=None,
1541 treemanifest=False,
1542 treemanifest=False,
1542 ):
1543 ):
1543 """Constructs a new manifest revlog
1544 """Constructs a new manifest revlog
1544
1545
1545 `indexfile` - used by extensions to have two manifests at once, like
1546 `indexfile` - used by extensions to have two manifests at once, like
1546 when transitioning between flatmanifeset and treemanifests.
1547 when transitioning between flatmanifeset and treemanifests.
1547
1548
1548 `treemanifest` - used to indicate this is a tree manifest revlog. Opener
1549 `treemanifest` - used to indicate this is a tree manifest revlog. Opener
1549 options can also be used to make this a tree manifest revlog. The opener
1550 options can also be used to make this a tree manifest revlog. The opener
1550 option takes precedence, so if it is set to True, we ignore whatever
1551 option takes precedence, so if it is set to True, we ignore whatever
1551 value is passed in to the constructor.
1552 value is passed in to the constructor.
1552 """
1553 """
1553 # During normal operations, we expect to deal with not more than four
1554 # During normal operations, we expect to deal with not more than four
1554 # revs at a time (such as during commit --amend). When rebasing large
1555 # revs at a time (such as during commit --amend). When rebasing large
1555 # stacks of commits, the number can go up, hence the config knob below.
1556 # stacks of commits, the number can go up, hence the config knob below.
1556 cachesize = 4
1557 cachesize = 4
1557 optiontreemanifest = False
1558 optiontreemanifest = False
1558 opts = getattr(opener, 'options', None)
1559 opts = getattr(opener, 'options', None)
1559 if opts is not None:
1560 if opts is not None:
1560 cachesize = opts.get(b'manifestcachesize', cachesize)
1561 cachesize = opts.get(b'manifestcachesize', cachesize)
1561 optiontreemanifest = opts.get(b'treemanifest', False)
1562 optiontreemanifest = opts.get(b'treemanifest', False)
1562
1563
1563 self._treeondisk = optiontreemanifest or treemanifest
1564 self._treeondisk = optiontreemanifest or treemanifest
1564
1565
1565 self._fulltextcache = manifestfulltextcache(cachesize)
1566 self._fulltextcache = manifestfulltextcache(cachesize)
1566
1567
1567 if tree:
1568 if tree:
1568 assert self._treeondisk, b'opts is %r' % opts
1569 assert self._treeondisk, b'opts is %r' % opts
1569
1570
1570 if indexfile is None:
1571 if indexfile is None:
1571 indexfile = b'00manifest.i'
1572 indexfile = b'00manifest.i'
1572 if tree:
1573 if tree:
1573 indexfile = b"meta/" + tree + indexfile
1574 indexfile = b"meta/" + tree + indexfile
1574
1575
1575 self.tree = tree
1576 self.tree = tree
1576
1577
1577 # The dirlogcache is kept on the root manifest log
1578 # The dirlogcache is kept on the root manifest log
1578 if tree:
1579 if tree:
1579 self._dirlogcache = dirlogcache
1580 self._dirlogcache = dirlogcache
1580 else:
1581 else:
1581 self._dirlogcache = {b'': self}
1582 self._dirlogcache = {b'': self}
1582
1583
1583 self._revlog = revlog.revlog(
1584 self._revlog = revlog.revlog(
1584 opener,
1585 opener,
1585 indexfile,
1586 indexfile,
1586 # only root indexfile is cached
1587 # only root indexfile is cached
1587 checkambig=not bool(tree),
1588 checkambig=not bool(tree),
1588 mmaplargeindex=True,
1589 mmaplargeindex=True,
1589 upperboundcomp=MAXCOMPRESSION,
1590 upperboundcomp=MAXCOMPRESSION,
1590 )
1591 )
1591
1592
1592 self.index = self._revlog.index
1593 self.index = self._revlog.index
1593 self.version = self._revlog.version
1594 self.version = self._revlog.version
1594 self._generaldelta = self._revlog._generaldelta
1595 self._generaldelta = self._revlog._generaldelta
1595
1596
1596 def _setupmanifestcachehooks(self, repo):
1597 def _setupmanifestcachehooks(self, repo):
1597 """Persist the manifestfulltextcache on lock release"""
1598 """Persist the manifestfulltextcache on lock release"""
1598 if not util.safehasattr(repo, b'_wlockref'):
1599 if not util.safehasattr(repo, b'_wlockref'):
1599 return
1600 return
1600
1601
1601 self._fulltextcache._opener = repo.wcachevfs
1602 self._fulltextcache._opener = repo.wcachevfs
1602 if repo._currentlock(repo._wlockref) is None:
1603 if repo._currentlock(repo._wlockref) is None:
1603 return
1604 return
1604
1605
1605 reporef = weakref.ref(repo)
1606 reporef = weakref.ref(repo)
1606 manifestrevlogref = weakref.ref(self)
1607 manifestrevlogref = weakref.ref(self)
1607
1608
1608 def persistmanifestcache(success):
1609 def persistmanifestcache(success):
1609 # Repo is in an unknown state, do not persist.
1610 # Repo is in an unknown state, do not persist.
1610 if not success:
1611 if not success:
1611 return
1612 return
1612
1613
1613 repo = reporef()
1614 repo = reporef()
1614 self = manifestrevlogref()
1615 self = manifestrevlogref()
1615 if repo is None or self is None:
1616 if repo is None or self is None:
1616 return
1617 return
1617 if repo.manifestlog.getstorage(b'') is not self:
1618 if repo.manifestlog.getstorage(b'') is not self:
1618 # there's a different manifest in play now, abort
1619 # there's a different manifest in play now, abort
1619 return
1620 return
1620 self._fulltextcache.write()
1621 self._fulltextcache.write()
1621
1622
1622 repo._afterlock(persistmanifestcache)
1623 repo._afterlock(persistmanifestcache)
1623
1624
1624 @property
1625 @property
1625 def fulltextcache(self):
1626 def fulltextcache(self):
1626 return self._fulltextcache
1627 return self._fulltextcache
1627
1628
1628 def clearcaches(self, clear_persisted_data=False):
1629 def clearcaches(self, clear_persisted_data=False):
1629 self._revlog.clearcaches()
1630 self._revlog.clearcaches()
1630 self._fulltextcache.clear(clear_persisted_data=clear_persisted_data)
1631 self._fulltextcache.clear(clear_persisted_data=clear_persisted_data)
1631 self._dirlogcache = {self.tree: self}
1632 self._dirlogcache = {self.tree: self}
1632
1633
1633 def dirlog(self, d):
1634 def dirlog(self, d):
1634 if d:
1635 if d:
1635 assert self._treeondisk
1636 assert self._treeondisk
1636 if d not in self._dirlogcache:
1637 if d not in self._dirlogcache:
1637 mfrevlog = manifestrevlog(
1638 mfrevlog = manifestrevlog(
1638 self.opener, d, self._dirlogcache, treemanifest=self._treeondisk
1639 self.opener, d, self._dirlogcache, treemanifest=self._treeondisk
1639 )
1640 )
1640 self._dirlogcache[d] = mfrevlog
1641 self._dirlogcache[d] = mfrevlog
1641 return self._dirlogcache[d]
1642 return self._dirlogcache[d]
1642
1643
1643 def add(
1644 def add(
1644 self,
1645 self,
1645 m,
1646 m,
1646 transaction,
1647 transaction,
1647 link,
1648 link,
1648 p1,
1649 p1,
1649 p2,
1650 p2,
1650 added,
1651 added,
1651 removed,
1652 removed,
1652 readtree=None,
1653 readtree=None,
1653 match=None,
1654 match=None,
1654 ):
1655 ):
1655 try:
1656 try:
1656 if p1 not in self.fulltextcache:
1657 if p1 not in self.fulltextcache:
1657 raise FastdeltaUnavailable()
1658 raise FastdeltaUnavailable()
1658 # If our first parent is in the manifest cache, we can
1659 # If our first parent is in the manifest cache, we can
1659 # compute a delta here using properties we know about the
1660 # compute a delta here using properties we know about the
1660 # manifest up-front, which may save time later for the
1661 # manifest up-front, which may save time later for the
1661 # revlog layer.
1662 # revlog layer.
1662
1663
1663 _checkforbidden(added)
1664 _checkforbidden(added)
1664 # combine the changed lists into one sorted iterator
1665 # combine the changed lists into one sorted iterator
1665 work = heapq.merge(
1666 work = heapq.merge(
1666 [(x, False) for x in sorted(added)],
1667 [(x, False) for x in sorted(added)],
1667 [(x, True) for x in sorted(removed)],
1668 [(x, True) for x in sorted(removed)],
1668 )
1669 )
1669
1670
1670 arraytext, deltatext = m.fastdelta(self.fulltextcache[p1], work)
1671 arraytext, deltatext = m.fastdelta(self.fulltextcache[p1], work)
1671 cachedelta = self._revlog.rev(p1), deltatext
1672 cachedelta = self._revlog.rev(p1), deltatext
1672 text = util.buffer(arraytext)
1673 text = util.buffer(arraytext)
1673 n = self._revlog.addrevision(
1674 n = self._revlog.addrevision(
1674 text, transaction, link, p1, p2, cachedelta
1675 text, transaction, link, p1, p2, cachedelta
1675 )
1676 )
1676 except FastdeltaUnavailable:
1677 except FastdeltaUnavailable:
1677 # The first parent manifest isn't already loaded or the
1678 # The first parent manifest isn't already loaded or the
1678 # manifest implementation doesn't support fastdelta, so
1679 # manifest implementation doesn't support fastdelta, so
1679 # we'll just encode a fulltext of the manifest and pass
1680 # we'll just encode a fulltext of the manifest and pass
1680 # that through to the revlog layer, and let it handle the
1681 # that through to the revlog layer, and let it handle the
1681 # delta process.
1682 # delta process.
1682 if self._treeondisk:
1683 if self._treeondisk:
1683 assert readtree, b"readtree must be set for treemanifest writes"
1684 assert readtree, b"readtree must be set for treemanifest writes"
1684 assert match, b"match must be specified for treemanifest writes"
1685 assert match, b"match must be specified for treemanifest writes"
1685 m1 = readtree(self.tree, p1)
1686 m1 = readtree(self.tree, p1)
1686 m2 = readtree(self.tree, p2)
1687 m2 = readtree(self.tree, p2)
1687 n = self._addtree(
1688 n = self._addtree(
1688 m, transaction, link, m1, m2, readtree, match=match
1689 m, transaction, link, m1, m2, readtree, match=match
1689 )
1690 )
1690 arraytext = None
1691 arraytext = None
1691 else:
1692 else:
1692 text = m.text()
1693 text = m.text()
1693 n = self._revlog.addrevision(text, transaction, link, p1, p2)
1694 n = self._revlog.addrevision(text, transaction, link, p1, p2)
1694 arraytext = bytearray(text)
1695 arraytext = bytearray(text)
1695
1696
1696 if arraytext is not None:
1697 if arraytext is not None:
1697 self.fulltextcache[n] = arraytext
1698 self.fulltextcache[n] = arraytext
1698
1699
1699 return n
1700 return n
1700
1701
1701 def _addtree(self, m, transaction, link, m1, m2, readtree, match):
1702 def _addtree(self, m, transaction, link, m1, m2, readtree, match):
1702 # If the manifest is unchanged compared to one parent,
1703 # If the manifest is unchanged compared to one parent,
1703 # don't write a new revision
1704 # don't write a new revision
1704 if self.tree != b'' and (
1705 if self.tree != b'' and (
1705 m.unmodifiedsince(m1) or m.unmodifiedsince(m2)
1706 m.unmodifiedsince(m1) or m.unmodifiedsince(m2)
1706 ):
1707 ):
1707 return m.node()
1708 return m.node()
1708
1709
1709 def writesubtree(subm, subp1, subp2, match):
1710 def writesubtree(subm, subp1, subp2, match):
1710 sublog = self.dirlog(subm.dir())
1711 sublog = self.dirlog(subm.dir())
1711 sublog.add(
1712 sublog.add(
1712 subm,
1713 subm,
1713 transaction,
1714 transaction,
1714 link,
1715 link,
1715 subp1,
1716 subp1,
1716 subp2,
1717 subp2,
1717 None,
1718 None,
1718 None,
1719 None,
1719 readtree=readtree,
1720 readtree=readtree,
1720 match=match,
1721 match=match,
1721 )
1722 )
1722
1723
1723 m.writesubtrees(m1, m2, writesubtree, match)
1724 m.writesubtrees(m1, m2, writesubtree, match)
1724 text = m.dirtext()
1725 text = m.dirtext()
1725 n = None
1726 n = None
1726 if self.tree != b'':
1727 if self.tree != b'':
1727 # Double-check whether contents are unchanged to one parent
1728 # Double-check whether contents are unchanged to one parent
1728 if text == m1.dirtext():
1729 if text == m1.dirtext():
1729 n = m1.node()
1730 n = m1.node()
1730 elif text == m2.dirtext():
1731 elif text == m2.dirtext():
1731 n = m2.node()
1732 n = m2.node()
1732
1733
1733 if not n:
1734 if not n:
1734 n = self._revlog.addrevision(
1735 n = self._revlog.addrevision(
1735 text, transaction, link, m1.node(), m2.node()
1736 text, transaction, link, m1.node(), m2.node()
1736 )
1737 )
1737
1738
1738 # Save nodeid so parent manifest can calculate its nodeid
1739 # Save nodeid so parent manifest can calculate its nodeid
1739 m.setnode(n)
1740 m.setnode(n)
1740 return n
1741 return n
1741
1742
1742 def __len__(self):
1743 def __len__(self):
1743 return len(self._revlog)
1744 return len(self._revlog)
1744
1745
1745 def __iter__(self):
1746 def __iter__(self):
1746 return self._revlog.__iter__()
1747 return self._revlog.__iter__()
1747
1748
1748 def rev(self, node):
1749 def rev(self, node):
1749 return self._revlog.rev(node)
1750 return self._revlog.rev(node)
1750
1751
1751 def node(self, rev):
1752 def node(self, rev):
1752 return self._revlog.node(rev)
1753 return self._revlog.node(rev)
1753
1754
1754 def lookup(self, value):
1755 def lookup(self, value):
1755 return self._revlog.lookup(value)
1756 return self._revlog.lookup(value)
1756
1757
1757 def parentrevs(self, rev):
1758 def parentrevs(self, rev):
1758 return self._revlog.parentrevs(rev)
1759 return self._revlog.parentrevs(rev)
1759
1760
1760 def parents(self, node):
1761 def parents(self, node):
1761 return self._revlog.parents(node)
1762 return self._revlog.parents(node)
1762
1763
1763 def linkrev(self, rev):
1764 def linkrev(self, rev):
1764 return self._revlog.linkrev(rev)
1765 return self._revlog.linkrev(rev)
1765
1766
1766 def checksize(self):
1767 def checksize(self):
1767 return self._revlog.checksize()
1768 return self._revlog.checksize()
1768
1769
1769 def revision(self, node, _df=None, raw=False):
1770 def revision(self, node, _df=None, raw=False):
1770 return self._revlog.revision(node, _df=_df, raw=raw)
1771 return self._revlog.revision(node, _df=_df, raw=raw)
1771
1772
1772 def rawdata(self, node, _df=None):
1773 def rawdata(self, node, _df=None):
1773 return self._revlog.rawdata(node, _df=_df)
1774 return self._revlog.rawdata(node, _df=_df)
1774
1775
1775 def revdiff(self, rev1, rev2):
1776 def revdiff(self, rev1, rev2):
1776 return self._revlog.revdiff(rev1, rev2)
1777 return self._revlog.revdiff(rev1, rev2)
1777
1778
1778 def cmp(self, node, text):
1779 def cmp(self, node, text):
1779 return self._revlog.cmp(node, text)
1780 return self._revlog.cmp(node, text)
1780
1781
1781 def deltaparent(self, rev):
1782 def deltaparent(self, rev):
1782 return self._revlog.deltaparent(rev)
1783 return self._revlog.deltaparent(rev)
1783
1784
1784 def emitrevisions(
1785 def emitrevisions(
1785 self,
1786 self,
1786 nodes,
1787 nodes,
1787 nodesorder=None,
1788 nodesorder=None,
1788 revisiondata=False,
1789 revisiondata=False,
1789 assumehaveparentrevisions=False,
1790 assumehaveparentrevisions=False,
1790 deltamode=repository.CG_DELTAMODE_STD,
1791 deltamode=repository.CG_DELTAMODE_STD,
1791 ):
1792 ):
1792 return self._revlog.emitrevisions(
1793 return self._revlog.emitrevisions(
1793 nodes,
1794 nodes,
1794 nodesorder=nodesorder,
1795 nodesorder=nodesorder,
1795 revisiondata=revisiondata,
1796 revisiondata=revisiondata,
1796 assumehaveparentrevisions=assumehaveparentrevisions,
1797 assumehaveparentrevisions=assumehaveparentrevisions,
1797 deltamode=deltamode,
1798 deltamode=deltamode,
1798 )
1799 )
1799
1800
1800 def addgroup(self, deltas, linkmapper, transaction, addrevisioncb=None):
1801 def addgroup(self, deltas, linkmapper, transaction, addrevisioncb=None):
1801 return self._revlog.addgroup(
1802 return self._revlog.addgroup(
1802 deltas, linkmapper, transaction, addrevisioncb=addrevisioncb
1803 deltas, linkmapper, transaction, addrevisioncb=addrevisioncb
1803 )
1804 )
1804
1805
1805 def rawsize(self, rev):
1806 def rawsize(self, rev):
1806 return self._revlog.rawsize(rev)
1807 return self._revlog.rawsize(rev)
1807
1808
1808 def getstrippoint(self, minlink):
1809 def getstrippoint(self, minlink):
1809 return self._revlog.getstrippoint(minlink)
1810 return self._revlog.getstrippoint(minlink)
1810
1811
1811 def strip(self, minlink, transaction):
1812 def strip(self, minlink, transaction):
1812 return self._revlog.strip(minlink, transaction)
1813 return self._revlog.strip(minlink, transaction)
1813
1814
1814 def files(self):
1815 def files(self):
1815 return self._revlog.files()
1816 return self._revlog.files()
1816
1817
1817 def clone(self, tr, destrevlog, **kwargs):
1818 def clone(self, tr, destrevlog, **kwargs):
1818 if not isinstance(destrevlog, manifestrevlog):
1819 if not isinstance(destrevlog, manifestrevlog):
1819 raise error.ProgrammingError(b'expected manifestrevlog to clone()')
1820 raise error.ProgrammingError(b'expected manifestrevlog to clone()')
1820
1821
1821 return self._revlog.clone(tr, destrevlog._revlog, **kwargs)
1822 return self._revlog.clone(tr, destrevlog._revlog, **kwargs)
1822
1823
1823 def storageinfo(
1824 def storageinfo(
1824 self,
1825 self,
1825 exclusivefiles=False,
1826 exclusivefiles=False,
1826 sharedfiles=False,
1827 sharedfiles=False,
1827 revisionscount=False,
1828 revisionscount=False,
1828 trackedsize=False,
1829 trackedsize=False,
1829 storedsize=False,
1830 storedsize=False,
1830 ):
1831 ):
1831 return self._revlog.storageinfo(
1832 return self._revlog.storageinfo(
1832 exclusivefiles=exclusivefiles,
1833 exclusivefiles=exclusivefiles,
1833 sharedfiles=sharedfiles,
1834 sharedfiles=sharedfiles,
1834 revisionscount=revisionscount,
1835 revisionscount=revisionscount,
1835 trackedsize=trackedsize,
1836 trackedsize=trackedsize,
1836 storedsize=storedsize,
1837 storedsize=storedsize,
1837 )
1838 )
1838
1839
1839 @property
1840 @property
1840 def indexfile(self):
1841 def indexfile(self):
1841 return self._revlog.indexfile
1842 return self._revlog.indexfile
1842
1843
1843 @indexfile.setter
1844 @indexfile.setter
1844 def indexfile(self, value):
1845 def indexfile(self, value):
1845 self._revlog.indexfile = value
1846 self._revlog.indexfile = value
1846
1847
1847 @property
1848 @property
1848 def opener(self):
1849 def opener(self):
1849 return self._revlog.opener
1850 return self._revlog.opener
1850
1851
1851 @opener.setter
1852 @opener.setter
1852 def opener(self, value):
1853 def opener(self, value):
1853 self._revlog.opener = value
1854 self._revlog.opener = value
1854
1855
1855
1856
1856 @interfaceutil.implementer(repository.imanifestlog)
1857 @interfaceutil.implementer(repository.imanifestlog)
1857 class manifestlog(object):
1858 class manifestlog(object):
1858 """A collection class representing the collection of manifest snapshots
1859 """A collection class representing the collection of manifest snapshots
1859 referenced by commits in the repository.
1860 referenced by commits in the repository.
1860
1861
1861 In this situation, 'manifest' refers to the abstract concept of a snapshot
1862 In this situation, 'manifest' refers to the abstract concept of a snapshot
1862 of the list of files in the given commit. Consumers of the output of this
1863 of the list of files in the given commit. Consumers of the output of this
1863 class do not care about the implementation details of the actual manifests
1864 class do not care about the implementation details of the actual manifests
1864 they receive (i.e. tree or flat or lazily loaded, etc)."""
1865 they receive (i.e. tree or flat or lazily loaded, etc)."""
1865
1866
1866 def __init__(self, opener, repo, rootstore, narrowmatch):
1867 def __init__(self, opener, repo, rootstore, narrowmatch):
1867 usetreemanifest = False
1868 usetreemanifest = False
1868 cachesize = 4
1869 cachesize = 4
1869
1870
1870 opts = getattr(opener, 'options', None)
1871 opts = getattr(opener, 'options', None)
1871 if opts is not None:
1872 if opts is not None:
1872 usetreemanifest = opts.get(b'treemanifest', usetreemanifest)
1873 usetreemanifest = opts.get(b'treemanifest', usetreemanifest)
1873 cachesize = opts.get(b'manifestcachesize', cachesize)
1874 cachesize = opts.get(b'manifestcachesize', cachesize)
1874
1875
1875 self._treemanifests = usetreemanifest
1876 self._treemanifests = usetreemanifest
1876
1877
1877 self._rootstore = rootstore
1878 self._rootstore = rootstore
1878 self._rootstore._setupmanifestcachehooks(repo)
1879 self._rootstore._setupmanifestcachehooks(repo)
1879 self._narrowmatch = narrowmatch
1880 self._narrowmatch = narrowmatch
1880
1881
1881 # A cache of the manifestctx or treemanifestctx for each directory
1882 # A cache of the manifestctx or treemanifestctx for each directory
1882 self._dirmancache = {}
1883 self._dirmancache = {}
1883 self._dirmancache[b''] = util.lrucachedict(cachesize)
1884 self._dirmancache[b''] = util.lrucachedict(cachesize)
1884
1885
1885 self._cachesize = cachesize
1886 self._cachesize = cachesize
1886
1887
1887 def __getitem__(self, node):
1888 def __getitem__(self, node):
1888 """Retrieves the manifest instance for the given node. Throws a
1889 """Retrieves the manifest instance for the given node. Throws a
1889 LookupError if not found.
1890 LookupError if not found.
1890 """
1891 """
1891 return self.get(b'', node)
1892 return self.get(b'', node)
1892
1893
1893 def get(self, tree, node, verify=True):
1894 def get(self, tree, node, verify=True):
1894 """Retrieves the manifest instance for the given node. Throws a
1895 """Retrieves the manifest instance for the given node. Throws a
1895 LookupError if not found.
1896 LookupError if not found.
1896
1897
1897 `verify` - if True an exception will be thrown if the node is not in
1898 `verify` - if True an exception will be thrown if the node is not in
1898 the revlog
1899 the revlog
1899 """
1900 """
1900 if node in self._dirmancache.get(tree, ()):
1901 if node in self._dirmancache.get(tree, ()):
1901 return self._dirmancache[tree][node]
1902 return self._dirmancache[tree][node]
1902
1903
1903 if not self._narrowmatch.always():
1904 if not self._narrowmatch.always():
1904 if not self._narrowmatch.visitdir(tree[:-1]):
1905 if not self._narrowmatch.visitdir(tree[:-1]):
1905 return excludeddirmanifestctx(tree, node)
1906 return excludeddirmanifestctx(tree, node)
1906 if tree:
1907 if tree:
1907 if self._rootstore._treeondisk:
1908 if self._rootstore._treeondisk:
1908 if verify:
1909 if verify:
1909 # Side-effect is LookupError is raised if node doesn't
1910 # Side-effect is LookupError is raised if node doesn't
1910 # exist.
1911 # exist.
1911 self.getstorage(tree).rev(node)
1912 self.getstorage(tree).rev(node)
1912
1913
1913 m = treemanifestctx(self, tree, node)
1914 m = treemanifestctx(self, tree, node)
1914 else:
1915 else:
1915 raise error.Abort(
1916 raise error.Abort(
1916 _(
1917 _(
1917 b"cannot ask for manifest directory '%s' in a flat "
1918 b"cannot ask for manifest directory '%s' in a flat "
1918 b"manifest"
1919 b"manifest"
1919 )
1920 )
1920 % tree
1921 % tree
1921 )
1922 )
1922 else:
1923 else:
1923 if verify:
1924 if verify:
1924 # Side-effect is LookupError is raised if node doesn't exist.
1925 # Side-effect is LookupError is raised if node doesn't exist.
1925 self._rootstore.rev(node)
1926 self._rootstore.rev(node)
1926
1927
1927 if self._treemanifests:
1928 if self._treemanifests:
1928 m = treemanifestctx(self, b'', node)
1929 m = treemanifestctx(self, b'', node)
1929 else:
1930 else:
1930 m = manifestctx(self, node)
1931 m = manifestctx(self, node)
1931
1932
1932 if node != nullid:
1933 if node != nullid:
1933 mancache = self._dirmancache.get(tree)
1934 mancache = self._dirmancache.get(tree)
1934 if not mancache:
1935 if not mancache:
1935 mancache = util.lrucachedict(self._cachesize)
1936 mancache = util.lrucachedict(self._cachesize)
1936 self._dirmancache[tree] = mancache
1937 self._dirmancache[tree] = mancache
1937 mancache[node] = m
1938 mancache[node] = m
1938 return m
1939 return m
1939
1940
1940 def getstorage(self, tree):
1941 def getstorage(self, tree):
1941 return self._rootstore.dirlog(tree)
1942 return self._rootstore.dirlog(tree)
1942
1943
1943 def clearcaches(self, clear_persisted_data=False):
1944 def clearcaches(self, clear_persisted_data=False):
1944 self._dirmancache.clear()
1945 self._dirmancache.clear()
1945 self._rootstore.clearcaches(clear_persisted_data=clear_persisted_data)
1946 self._rootstore.clearcaches(clear_persisted_data=clear_persisted_data)
1946
1947
1947 def rev(self, node):
1948 def rev(self, node):
1948 return self._rootstore.rev(node)
1949 return self._rootstore.rev(node)
1949
1950
1950
1951
1951 @interfaceutil.implementer(repository.imanifestrevisionwritable)
1952 @interfaceutil.implementer(repository.imanifestrevisionwritable)
1952 class memmanifestctx(object):
1953 class memmanifestctx(object):
1953 def __init__(self, manifestlog):
1954 def __init__(self, manifestlog):
1954 self._manifestlog = manifestlog
1955 self._manifestlog = manifestlog
1955 self._manifestdict = manifestdict()
1956 self._manifestdict = manifestdict()
1956
1957
1957 def _storage(self):
1958 def _storage(self):
1958 return self._manifestlog.getstorage(b'')
1959 return self._manifestlog.getstorage(b'')
1959
1960
1960 def copy(self):
1961 def copy(self):
1961 memmf = memmanifestctx(self._manifestlog)
1962 memmf = memmanifestctx(self._manifestlog)
1962 memmf._manifestdict = self.read().copy()
1963 memmf._manifestdict = self.read().copy()
1963 return memmf
1964 return memmf
1964
1965
1965 def read(self):
1966 def read(self):
1966 return self._manifestdict
1967 return self._manifestdict
1967
1968
1968 def write(self, transaction, link, p1, p2, added, removed, match=None):
1969 def write(self, transaction, link, p1, p2, added, removed, match=None):
1969 return self._storage().add(
1970 return self._storage().add(
1970 self._manifestdict,
1971 self._manifestdict,
1971 transaction,
1972 transaction,
1972 link,
1973 link,
1973 p1,
1974 p1,
1974 p2,
1975 p2,
1975 added,
1976 added,
1976 removed,
1977 removed,
1977 match=match,
1978 match=match,
1978 )
1979 )
1979
1980
1980
1981
1981 @interfaceutil.implementer(repository.imanifestrevisionstored)
1982 @interfaceutil.implementer(repository.imanifestrevisionstored)
1982 class manifestctx(object):
1983 class manifestctx(object):
1983 """A class representing a single revision of a manifest, including its
1984 """A class representing a single revision of a manifest, including its
1984 contents, its parent revs, and its linkrev.
1985 contents, its parent revs, and its linkrev.
1985 """
1986 """
1986
1987
1987 def __init__(self, manifestlog, node):
1988 def __init__(self, manifestlog, node):
1988 self._manifestlog = manifestlog
1989 self._manifestlog = manifestlog
1989 self._data = None
1990 self._data = None
1990
1991
1991 self._node = node
1992 self._node = node
1992
1993
1993 # TODO: We eventually want p1, p2, and linkrev exposed on this class,
1994 # TODO: We eventually want p1, p2, and linkrev exposed on this class,
1994 # but let's add it later when something needs it and we can load it
1995 # but let's add it later when something needs it and we can load it
1995 # lazily.
1996 # lazily.
1996 # self.p1, self.p2 = store.parents(node)
1997 # self.p1, self.p2 = store.parents(node)
1997 # rev = store.rev(node)
1998 # rev = store.rev(node)
1998 # self.linkrev = store.linkrev(rev)
1999 # self.linkrev = store.linkrev(rev)
1999
2000
2000 def _storage(self):
2001 def _storage(self):
2001 return self._manifestlog.getstorage(b'')
2002 return self._manifestlog.getstorage(b'')
2002
2003
2003 def node(self):
2004 def node(self):
2004 return self._node
2005 return self._node
2005
2006
2006 def copy(self):
2007 def copy(self):
2007 memmf = memmanifestctx(self._manifestlog)
2008 memmf = memmanifestctx(self._manifestlog)
2008 memmf._manifestdict = self.read().copy()
2009 memmf._manifestdict = self.read().copy()
2009 return memmf
2010 return memmf
2010
2011
2011 @propertycache
2012 @propertycache
2012 def parents(self):
2013 def parents(self):
2013 return self._storage().parents(self._node)
2014 return self._storage().parents(self._node)
2014
2015
2015 def read(self):
2016 def read(self):
2016 if self._data is None:
2017 if self._data is None:
2017 if self._node == nullid:
2018 if self._node == nullid:
2018 self._data = manifestdict()
2019 self._data = manifestdict()
2019 else:
2020 else:
2020 store = self._storage()
2021 store = self._storage()
2021 if self._node in store.fulltextcache:
2022 if self._node in store.fulltextcache:
2022 text = pycompat.bytestr(store.fulltextcache[self._node])
2023 text = pycompat.bytestr(store.fulltextcache[self._node])
2023 else:
2024 else:
2024 text = store.revision(self._node)
2025 text = store.revision(self._node)
2025 arraytext = bytearray(text)
2026 arraytext = bytearray(text)
2026 store.fulltextcache[self._node] = arraytext
2027 store.fulltextcache[self._node] = arraytext
2027 self._data = manifestdict(text)
2028 self._data = manifestdict(text)
2028 return self._data
2029 return self._data
2029
2030
2030 def readfast(self, shallow=False):
2031 def readfast(self, shallow=False):
2031 '''Calls either readdelta or read, based on which would be less work.
2032 '''Calls either readdelta or read, based on which would be less work.
2032 readdelta is called if the delta is against the p1, and therefore can be
2033 readdelta is called if the delta is against the p1, and therefore can be
2033 read quickly.
2034 read quickly.
2034
2035
2035 If `shallow` is True, nothing changes since this is a flat manifest.
2036 If `shallow` is True, nothing changes since this is a flat manifest.
2036 '''
2037 '''
2037 store = self._storage()
2038 store = self._storage()
2038 r = store.rev(self._node)
2039 r = store.rev(self._node)
2039 deltaparent = store.deltaparent(r)
2040 deltaparent = store.deltaparent(r)
2040 if deltaparent != nullrev and deltaparent in store.parentrevs(r):
2041 if deltaparent != nullrev and deltaparent in store.parentrevs(r):
2041 return self.readdelta()
2042 return self.readdelta()
2042 return self.read()
2043 return self.read()
2043
2044
2044 def readdelta(self, shallow=False):
2045 def readdelta(self, shallow=False):
2045 '''Returns a manifest containing just the entries that are present
2046 '''Returns a manifest containing just the entries that are present
2046 in this manifest, but not in its p1 manifest. This is efficient to read
2047 in this manifest, but not in its p1 manifest. This is efficient to read
2047 if the revlog delta is already p1.
2048 if the revlog delta is already p1.
2048
2049
2049 Changing the value of `shallow` has no effect on flat manifests.
2050 Changing the value of `shallow` has no effect on flat manifests.
2050 '''
2051 '''
2051 store = self._storage()
2052 store = self._storage()
2052 r = store.rev(self._node)
2053 r = store.rev(self._node)
2053 d = mdiff.patchtext(store.revdiff(store.deltaparent(r), r))
2054 d = mdiff.patchtext(store.revdiff(store.deltaparent(r), r))
2054 return manifestdict(d)
2055 return manifestdict(d)
2055
2056
2056 def find(self, key):
2057 def find(self, key):
2057 return self.read().find(key)
2058 return self.read().find(key)
2058
2059
2059
2060
2060 @interfaceutil.implementer(repository.imanifestrevisionwritable)
2061 @interfaceutil.implementer(repository.imanifestrevisionwritable)
2061 class memtreemanifestctx(object):
2062 class memtreemanifestctx(object):
2062 def __init__(self, manifestlog, dir=b''):
2063 def __init__(self, manifestlog, dir=b''):
2063 self._manifestlog = manifestlog
2064 self._manifestlog = manifestlog
2064 self._dir = dir
2065 self._dir = dir
2065 self._treemanifest = treemanifest()
2066 self._treemanifest = treemanifest()
2066
2067
2067 def _storage(self):
2068 def _storage(self):
2068 return self._manifestlog.getstorage(b'')
2069 return self._manifestlog.getstorage(b'')
2069
2070
2070 def copy(self):
2071 def copy(self):
2071 memmf = memtreemanifestctx(self._manifestlog, dir=self._dir)
2072 memmf = memtreemanifestctx(self._manifestlog, dir=self._dir)
2072 memmf._treemanifest = self._treemanifest.copy()
2073 memmf._treemanifest = self._treemanifest.copy()
2073 return memmf
2074 return memmf
2074
2075
2075 def read(self):
2076 def read(self):
2076 return self._treemanifest
2077 return self._treemanifest
2077
2078
2078 def write(self, transaction, link, p1, p2, added, removed, match=None):
2079 def write(self, transaction, link, p1, p2, added, removed, match=None):
2079 def readtree(dir, node):
2080 def readtree(dir, node):
2080 return self._manifestlog.get(dir, node).read()
2081 return self._manifestlog.get(dir, node).read()
2081
2082
2082 return self._storage().add(
2083 return self._storage().add(
2083 self._treemanifest,
2084 self._treemanifest,
2084 transaction,
2085 transaction,
2085 link,
2086 link,
2086 p1,
2087 p1,
2087 p2,
2088 p2,
2088 added,
2089 added,
2089 removed,
2090 removed,
2090 readtree=readtree,
2091 readtree=readtree,
2091 match=match,
2092 match=match,
2092 )
2093 )
2093
2094
2094
2095
2095 @interfaceutil.implementer(repository.imanifestrevisionstored)
2096 @interfaceutil.implementer(repository.imanifestrevisionstored)
2096 class treemanifestctx(object):
2097 class treemanifestctx(object):
2097 def __init__(self, manifestlog, dir, node):
2098 def __init__(self, manifestlog, dir, node):
2098 self._manifestlog = manifestlog
2099 self._manifestlog = manifestlog
2099 self._dir = dir
2100 self._dir = dir
2100 self._data = None
2101 self._data = None
2101
2102
2102 self._node = node
2103 self._node = node
2103
2104
2104 # TODO: Load p1/p2/linkrev lazily. They need to be lazily loaded so that
2105 # TODO: Load p1/p2/linkrev lazily. They need to be lazily loaded so that
2105 # we can instantiate treemanifestctx objects for directories we don't
2106 # we can instantiate treemanifestctx objects for directories we don't
2106 # have on disk.
2107 # have on disk.
2107 # self.p1, self.p2 = store.parents(node)
2108 # self.p1, self.p2 = store.parents(node)
2108 # rev = store.rev(node)
2109 # rev = store.rev(node)
2109 # self.linkrev = store.linkrev(rev)
2110 # self.linkrev = store.linkrev(rev)
2110
2111
2111 def _storage(self):
2112 def _storage(self):
2112 narrowmatch = self._manifestlog._narrowmatch
2113 narrowmatch = self._manifestlog._narrowmatch
2113 if not narrowmatch.always():
2114 if not narrowmatch.always():
2114 if not narrowmatch.visitdir(self._dir[:-1]):
2115 if not narrowmatch.visitdir(self._dir[:-1]):
2115 return excludedmanifestrevlog(self._dir)
2116 return excludedmanifestrevlog(self._dir)
2116 return self._manifestlog.getstorage(self._dir)
2117 return self._manifestlog.getstorage(self._dir)
2117
2118
2118 def read(self):
2119 def read(self):
2119 if self._data is None:
2120 if self._data is None:
2120 store = self._storage()
2121 store = self._storage()
2121 if self._node == nullid:
2122 if self._node == nullid:
2122 self._data = treemanifest()
2123 self._data = treemanifest()
2123 # TODO accessing non-public API
2124 # TODO accessing non-public API
2124 elif store._treeondisk:
2125 elif store._treeondisk:
2125 m = treemanifest(dir=self._dir)
2126 m = treemanifest(dir=self._dir)
2126
2127
2127 def gettext():
2128 def gettext():
2128 return store.revision(self._node)
2129 return store.revision(self._node)
2129
2130
2130 def readsubtree(dir, subm):
2131 def readsubtree(dir, subm):
2131 # Set verify to False since we need to be able to create
2132 # Set verify to False since we need to be able to create
2132 # subtrees for trees that don't exist on disk.
2133 # subtrees for trees that don't exist on disk.
2133 return self._manifestlog.get(dir, subm, verify=False).read()
2134 return self._manifestlog.get(dir, subm, verify=False).read()
2134
2135
2135 m.read(gettext, readsubtree)
2136 m.read(gettext, readsubtree)
2136 m.setnode(self._node)
2137 m.setnode(self._node)
2137 self._data = m
2138 self._data = m
2138 else:
2139 else:
2139 if self._node in store.fulltextcache:
2140 if self._node in store.fulltextcache:
2140 text = pycompat.bytestr(store.fulltextcache[self._node])
2141 text = pycompat.bytestr(store.fulltextcache[self._node])
2141 else:
2142 else:
2142 text = store.revision(self._node)
2143 text = store.revision(self._node)
2143 arraytext = bytearray(text)
2144 arraytext = bytearray(text)
2144 store.fulltextcache[self._node] = arraytext
2145 store.fulltextcache[self._node] = arraytext
2145 self._data = treemanifest(dir=self._dir, text=text)
2146 self._data = treemanifest(dir=self._dir, text=text)
2146
2147
2147 return self._data
2148 return self._data
2148
2149
2149 def node(self):
2150 def node(self):
2150 return self._node
2151 return self._node
2151
2152
2152 def copy(self):
2153 def copy(self):
2153 memmf = memtreemanifestctx(self._manifestlog, dir=self._dir)
2154 memmf = memtreemanifestctx(self._manifestlog, dir=self._dir)
2154 memmf._treemanifest = self.read().copy()
2155 memmf._treemanifest = self.read().copy()
2155 return memmf
2156 return memmf
2156
2157
2157 @propertycache
2158 @propertycache
2158 def parents(self):
2159 def parents(self):
2159 return self._storage().parents(self._node)
2160 return self._storage().parents(self._node)
2160
2161
2161 def readdelta(self, shallow=False):
2162 def readdelta(self, shallow=False):
2162 '''Returns a manifest containing just the entries that are present
2163 '''Returns a manifest containing just the entries that are present
2163 in this manifest, but not in its p1 manifest. This is efficient to read
2164 in this manifest, but not in its p1 manifest. This is efficient to read
2164 if the revlog delta is already p1.
2165 if the revlog delta is already p1.
2165
2166
2166 If `shallow` is True, this will read the delta for this directory,
2167 If `shallow` is True, this will read the delta for this directory,
2167 without recursively reading subdirectory manifests. Instead, any
2168 without recursively reading subdirectory manifests. Instead, any
2168 subdirectory entry will be reported as it appears in the manifest, i.e.
2169 subdirectory entry will be reported as it appears in the manifest, i.e.
2169 the subdirectory will be reported among files and distinguished only by
2170 the subdirectory will be reported among files and distinguished only by
2170 its 't' flag.
2171 its 't' flag.
2171 '''
2172 '''
2172 store = self._storage()
2173 store = self._storage()
2173 if shallow:
2174 if shallow:
2174 r = store.rev(self._node)
2175 r = store.rev(self._node)
2175 d = mdiff.patchtext(store.revdiff(store.deltaparent(r), r))
2176 d = mdiff.patchtext(store.revdiff(store.deltaparent(r), r))
2176 return manifestdict(d)
2177 return manifestdict(d)
2177 else:
2178 else:
2178 # Need to perform a slow delta
2179 # Need to perform a slow delta
2179 r0 = store.deltaparent(store.rev(self._node))
2180 r0 = store.deltaparent(store.rev(self._node))
2180 m0 = self._manifestlog.get(self._dir, store.node(r0)).read()
2181 m0 = self._manifestlog.get(self._dir, store.node(r0)).read()
2181 m1 = self.read()
2182 m1 = self.read()
2182 md = treemanifest(dir=self._dir)
2183 md = treemanifest(dir=self._dir)
2183 for f, ((n0, fl0), (n1, fl1)) in pycompat.iteritems(m0.diff(m1)):
2184 for f, ((n0, fl0), (n1, fl1)) in pycompat.iteritems(m0.diff(m1)):
2184 if n1:
2185 if n1:
2185 md[f] = n1
2186 md[f] = n1
2186 if fl1:
2187 if fl1:
2187 md.setflag(f, fl1)
2188 md.setflag(f, fl1)
2188 return md
2189 return md
2189
2190
2190 def readfast(self, shallow=False):
2191 def readfast(self, shallow=False):
2191 '''Calls either readdelta or read, based on which would be less work.
2192 '''Calls either readdelta or read, based on which would be less work.
2192 readdelta is called if the delta is against the p1, and therefore can be
2193 readdelta is called if the delta is against the p1, and therefore can be
2193 read quickly.
2194 read quickly.
2194
2195
2195 If `shallow` is True, it only returns the entries from this manifest,
2196 If `shallow` is True, it only returns the entries from this manifest,
2196 and not any submanifests.
2197 and not any submanifests.
2197 '''
2198 '''
2198 store = self._storage()
2199 store = self._storage()
2199 r = store.rev(self._node)
2200 r = store.rev(self._node)
2200 deltaparent = store.deltaparent(r)
2201 deltaparent = store.deltaparent(r)
2201 if deltaparent != nullrev and deltaparent in store.parentrevs(r):
2202 if deltaparent != nullrev and deltaparent in store.parentrevs(r):
2202 return self.readdelta(shallow=shallow)
2203 return self.readdelta(shallow=shallow)
2203
2204
2204 if shallow:
2205 if shallow:
2205 return manifestdict(store.revision(self._node))
2206 return manifestdict(store.revision(self._node))
2206 else:
2207 else:
2207 return self.read()
2208 return self.read()
2208
2209
2209 def find(self, key):
2210 def find(self, key):
2210 return self.read().find(key)
2211 return self.read().find(key)
2211
2212
2212
2213
2213 class excludeddir(treemanifest):
2214 class excludeddir(treemanifest):
2214 """Stand-in for a directory that is excluded from the repository.
2215 """Stand-in for a directory that is excluded from the repository.
2215
2216
2216 With narrowing active on a repository that uses treemanifests,
2217 With narrowing active on a repository that uses treemanifests,
2217 some of the directory revlogs will be excluded from the resulting
2218 some of the directory revlogs will be excluded from the resulting
2218 clone. This is a huge storage win for clients, but means we need
2219 clone. This is a huge storage win for clients, but means we need
2219 some sort of pseudo-manifest to surface to internals so we can
2220 some sort of pseudo-manifest to surface to internals so we can
2220 detect a merge conflict outside the narrowspec. That's what this
2221 detect a merge conflict outside the narrowspec. That's what this
2221 class is: it stands in for a directory whose node is known, but
2222 class is: it stands in for a directory whose node is known, but
2222 whose contents are unknown.
2223 whose contents are unknown.
2223 """
2224 """
2224
2225
2225 def __init__(self, dir, node):
2226 def __init__(self, dir, node):
2226 super(excludeddir, self).__init__(dir)
2227 super(excludeddir, self).__init__(dir)
2227 self._node = node
2228 self._node = node
2228 # Add an empty file, which will be included by iterators and such,
2229 # Add an empty file, which will be included by iterators and such,
2229 # appearing as the directory itself (i.e. something like "dir/")
2230 # appearing as the directory itself (i.e. something like "dir/")
2230 self._files[b''] = node
2231 self._files[b''] = node
2231 self._flags[b''] = b't'
2232 self._flags[b''] = b't'
2232
2233
2233 # Manifests outside the narrowspec should never be modified, so avoid
2234 # Manifests outside the narrowspec should never be modified, so avoid
2234 # copying. This makes a noticeable difference when there are very many
2235 # copying. This makes a noticeable difference when there are very many
2235 # directories outside the narrowspec. Also, it makes sense for the copy to
2236 # directories outside the narrowspec. Also, it makes sense for the copy to
2236 # be of the same type as the original, which would not happen with the
2237 # be of the same type as the original, which would not happen with the
2237 # super type's copy().
2238 # super type's copy().
2238 def copy(self):
2239 def copy(self):
2239 return self
2240 return self
2240
2241
2241
2242
2242 class excludeddirmanifestctx(treemanifestctx):
2243 class excludeddirmanifestctx(treemanifestctx):
2243 """context wrapper for excludeddir - see that docstring for rationale"""
2244 """context wrapper for excludeddir - see that docstring for rationale"""
2244
2245
2245 def __init__(self, dir, node):
2246 def __init__(self, dir, node):
2246 self._dir = dir
2247 self._dir = dir
2247 self._node = node
2248 self._node = node
2248
2249
2249 def read(self):
2250 def read(self):
2250 return excludeddir(self._dir, self._node)
2251 return excludeddir(self._dir, self._node)
2251
2252
2252 def write(self, *args):
2253 def write(self, *args):
2253 raise error.ProgrammingError(
2254 raise error.ProgrammingError(
2254 b'attempt to write manifest from excluded dir %s' % self._dir
2255 b'attempt to write manifest from excluded dir %s' % self._dir
2255 )
2256 )
2256
2257
2257
2258
2258 class excludedmanifestrevlog(manifestrevlog):
2259 class excludedmanifestrevlog(manifestrevlog):
2259 """Stand-in for excluded treemanifest revlogs.
2260 """Stand-in for excluded treemanifest revlogs.
2260
2261
2261 When narrowing is active on a treemanifest repository, we'll have
2262 When narrowing is active on a treemanifest repository, we'll have
2262 references to directories we can't see due to the revlog being
2263 references to directories we can't see due to the revlog being
2263 skipped. This class exists to conform to the manifestrevlog
2264 skipped. This class exists to conform to the manifestrevlog
2264 interface for those directories and proactively prevent writes to
2265 interface for those directories and proactively prevent writes to
2265 outside the narrowspec.
2266 outside the narrowspec.
2266 """
2267 """
2267
2268
2268 def __init__(self, dir):
2269 def __init__(self, dir):
2269 self._dir = dir
2270 self._dir = dir
2270
2271
2271 def __len__(self):
2272 def __len__(self):
2272 raise error.ProgrammingError(
2273 raise error.ProgrammingError(
2273 b'attempt to get length of excluded dir %s' % self._dir
2274 b'attempt to get length of excluded dir %s' % self._dir
2274 )
2275 )
2275
2276
2276 def rev(self, node):
2277 def rev(self, node):
2277 raise error.ProgrammingError(
2278 raise error.ProgrammingError(
2278 b'attempt to get rev from excluded dir %s' % self._dir
2279 b'attempt to get rev from excluded dir %s' % self._dir
2279 )
2280 )
2280
2281
2281 def linkrev(self, node):
2282 def linkrev(self, node):
2282 raise error.ProgrammingError(
2283 raise error.ProgrammingError(
2283 b'attempt to get linkrev from excluded dir %s' % self._dir
2284 b'attempt to get linkrev from excluded dir %s' % self._dir
2284 )
2285 )
2285
2286
2286 def node(self, rev):
2287 def node(self, rev):
2287 raise error.ProgrammingError(
2288 raise error.ProgrammingError(
2288 b'attempt to get node from excluded dir %s' % self._dir
2289 b'attempt to get node from excluded dir %s' % self._dir
2289 )
2290 )
2290
2291
2291 def add(self, *args, **kwargs):
2292 def add(self, *args, **kwargs):
2292 # We should never write entries in dirlogs outside the narrow clone.
2293 # We should never write entries in dirlogs outside the narrow clone.
2293 # However, the method still gets called from writesubtree() in
2294 # However, the method still gets called from writesubtree() in
2294 # _addtree(), so we need to handle it. We should possibly make that
2295 # _addtree(), so we need to handle it. We should possibly make that
2295 # avoid calling add() with a clean manifest (_dirty is always False
2296 # avoid calling add() with a clean manifest (_dirty is always False
2296 # in excludeddir instances).
2297 # in excludeddir instances).
2297 pass
2298 pass
General Comments 0
You need to be logged in to leave comments. Login now