##// END OF EJS Templates
re2: exit `_checkre2` early if calling it is useless...
marmoute -
r51580:82cf392c stable
parent child Browse files
Show More
@@ -1,3316 +1,3319 b''
1 # util.py - Mercurial utility functions and platform specific implementations
1 # util.py - Mercurial utility functions and platform specific implementations
2 #
2 #
3 # Copyright 2005 K. Thananchayan <thananck@yahoo.com>
3 # Copyright 2005 K. Thananchayan <thananck@yahoo.com>
4 # Copyright 2005-2007 Olivia Mackall <olivia@selenic.com>
4 # Copyright 2005-2007 Olivia Mackall <olivia@selenic.com>
5 # Copyright 2006 Vadim Gelfer <vadim.gelfer@gmail.com>
5 # Copyright 2006 Vadim Gelfer <vadim.gelfer@gmail.com>
6 #
6 #
7 # This software may be used and distributed according to the terms of the
7 # This software may be used and distributed according to the terms of the
8 # GNU General Public License version 2 or any later version.
8 # GNU General Public License version 2 or any later version.
9
9
10 """Mercurial utility functions and platform specific implementations.
10 """Mercurial utility functions and platform specific implementations.
11
11
12 This contains helper routines that are independent of the SCM core and
12 This contains helper routines that are independent of the SCM core and
13 hide platform-specific details from the core.
13 hide platform-specific details from the core.
14 """
14 """
15
15
16
16
17 import abc
17 import abc
18 import collections
18 import collections
19 import contextlib
19 import contextlib
20 import errno
20 import errno
21 import gc
21 import gc
22 import hashlib
22 import hashlib
23 import io
23 import io
24 import itertools
24 import itertools
25 import locale
25 import locale
26 import mmap
26 import mmap
27 import os
27 import os
28 import pickle # provides util.pickle symbol
28 import pickle # provides util.pickle symbol
29 import re as remod
29 import re as remod
30 import shutil
30 import shutil
31 import stat
31 import stat
32 import sys
32 import sys
33 import time
33 import time
34 import traceback
34 import traceback
35 import warnings
35 import warnings
36
36
37 from .node import hex
37 from .node import hex
38 from .thirdparty import attr
38 from .thirdparty import attr
39 from .pycompat import (
39 from .pycompat import (
40 delattr,
40 delattr,
41 getattr,
41 getattr,
42 open,
42 open,
43 setattr,
43 setattr,
44 )
44 )
45 from hgdemandimport import tracing
45 from hgdemandimport import tracing
46 from . import (
46 from . import (
47 encoding,
47 encoding,
48 error,
48 error,
49 i18n,
49 i18n,
50 policy,
50 policy,
51 pycompat,
51 pycompat,
52 urllibcompat,
52 urllibcompat,
53 )
53 )
54 from .utils import (
54 from .utils import (
55 compression,
55 compression,
56 hashutil,
56 hashutil,
57 procutil,
57 procutil,
58 stringutil,
58 stringutil,
59 )
59 )
60
60
61 if pycompat.TYPE_CHECKING:
61 if pycompat.TYPE_CHECKING:
62 from typing import (
62 from typing import (
63 Iterable,
63 Iterable,
64 Iterator,
64 Iterator,
65 List,
65 List,
66 Optional,
66 Optional,
67 Tuple,
67 Tuple,
68 )
68 )
69
69
70
70
71 base85 = policy.importmod('base85')
71 base85 = policy.importmod('base85')
72 osutil = policy.importmod('osutil')
72 osutil = policy.importmod('osutil')
73
73
74 b85decode = base85.b85decode
74 b85decode = base85.b85decode
75 b85encode = base85.b85encode
75 b85encode = base85.b85encode
76
76
77 cookielib = pycompat.cookielib
77 cookielib = pycompat.cookielib
78 httplib = pycompat.httplib
78 httplib = pycompat.httplib
79 safehasattr = pycompat.safehasattr
79 safehasattr = pycompat.safehasattr
80 socketserver = pycompat.socketserver
80 socketserver = pycompat.socketserver
81 bytesio = io.BytesIO
81 bytesio = io.BytesIO
82 # TODO deprecate stringio name, as it is a lie on Python 3.
82 # TODO deprecate stringio name, as it is a lie on Python 3.
83 stringio = bytesio
83 stringio = bytesio
84 xmlrpclib = pycompat.xmlrpclib
84 xmlrpclib = pycompat.xmlrpclib
85
85
86 httpserver = urllibcompat.httpserver
86 httpserver = urllibcompat.httpserver
87 urlerr = urllibcompat.urlerr
87 urlerr = urllibcompat.urlerr
88 urlreq = urllibcompat.urlreq
88 urlreq = urllibcompat.urlreq
89
89
90 # workaround for win32mbcs
90 # workaround for win32mbcs
91 _filenamebytestr = pycompat.bytestr
91 _filenamebytestr = pycompat.bytestr
92
92
93 if pycompat.iswindows:
93 if pycompat.iswindows:
94 from . import windows as platform
94 from . import windows as platform
95 else:
95 else:
96 from . import posix as platform
96 from . import posix as platform
97
97
98 _ = i18n._
98 _ = i18n._
99
99
100 abspath = platform.abspath
100 abspath = platform.abspath
101 bindunixsocket = platform.bindunixsocket
101 bindunixsocket = platform.bindunixsocket
102 cachestat = platform.cachestat
102 cachestat = platform.cachestat
103 checkexec = platform.checkexec
103 checkexec = platform.checkexec
104 checklink = platform.checklink
104 checklink = platform.checklink
105 copymode = platform.copymode
105 copymode = platform.copymode
106 expandglobs = platform.expandglobs
106 expandglobs = platform.expandglobs
107 getfsmountpoint = platform.getfsmountpoint
107 getfsmountpoint = platform.getfsmountpoint
108 getfstype = platform.getfstype
108 getfstype = platform.getfstype
109 get_password = platform.get_password
109 get_password = platform.get_password
110 groupmembers = platform.groupmembers
110 groupmembers = platform.groupmembers
111 groupname = platform.groupname
111 groupname = platform.groupname
112 isexec = platform.isexec
112 isexec = platform.isexec
113 isowner = platform.isowner
113 isowner = platform.isowner
114 listdir = osutil.listdir
114 listdir = osutil.listdir
115 localpath = platform.localpath
115 localpath = platform.localpath
116 lookupreg = platform.lookupreg
116 lookupreg = platform.lookupreg
117 makedir = platform.makedir
117 makedir = platform.makedir
118 nlinks = platform.nlinks
118 nlinks = platform.nlinks
119 normpath = platform.normpath
119 normpath = platform.normpath
120 normcase = platform.normcase
120 normcase = platform.normcase
121 normcasespec = platform.normcasespec
121 normcasespec = platform.normcasespec
122 normcasefallback = platform.normcasefallback
122 normcasefallback = platform.normcasefallback
123 openhardlinks = platform.openhardlinks
123 openhardlinks = platform.openhardlinks
124 oslink = platform.oslink
124 oslink = platform.oslink
125 parsepatchoutput = platform.parsepatchoutput
125 parsepatchoutput = platform.parsepatchoutput
126 pconvert = platform.pconvert
126 pconvert = platform.pconvert
127 poll = platform.poll
127 poll = platform.poll
128 posixfile = platform.posixfile
128 posixfile = platform.posixfile
129 readlink = platform.readlink
129 readlink = platform.readlink
130 rename = platform.rename
130 rename = platform.rename
131 removedirs = platform.removedirs
131 removedirs = platform.removedirs
132 samedevice = platform.samedevice
132 samedevice = platform.samedevice
133 samefile = platform.samefile
133 samefile = platform.samefile
134 samestat = platform.samestat
134 samestat = platform.samestat
135 setflags = platform.setflags
135 setflags = platform.setflags
136 split = platform.split
136 split = platform.split
137 statfiles = getattr(osutil, 'statfiles', platform.statfiles)
137 statfiles = getattr(osutil, 'statfiles', platform.statfiles)
138 statisexec = platform.statisexec
138 statisexec = platform.statisexec
139 statislink = platform.statislink
139 statislink = platform.statislink
140 umask = platform.umask
140 umask = platform.umask
141 unlink = platform.unlink
141 unlink = platform.unlink
142 username = platform.username
142 username = platform.username
143
143
144
144
def setumask(val):
    # type: (int) -> None
    """Install ``val`` as the process umask and refresh the cached copies.

    Used by the chg server. This is a no-op on Windows. The values cached
    in ``platform.umask`` and in this module's ``umask`` only keep the
    permission bits (``val & 0o777``).
    """
    global umask
    if not pycompat.iswindows:
        os.umask(val)
        permbits = val & 0o777
        platform.umask = permbits
        umask = permbits
153
153
154
154
155 # small compat layer
155 # small compat layer
156 compengines = compression.compengines
156 compengines = compression.compengines
157 SERVERROLE = compression.SERVERROLE
157 SERVERROLE = compression.SERVERROLE
158 CLIENTROLE = compression.CLIENTROLE
158 CLIENTROLE = compression.CLIENTROLE
159
159
160 # Python compatibility
160 # Python compatibility
161
161
162 _notset = object()
162 _notset = object()
163
163
164
164
def bitsfrom(container):
    """Return the bitwise OR of every item yielded by ``container``.

    An empty ``container`` yields ``0``.
    """
    mask = 0
    for flag in container:
        mask |= flag
    return mask
170
170
171
171
# Python 2.6 still has deprecation warnings enabled by default. We do not want
# to display anything to standard users, so detect whether we are running
# tests (HGEMITWARNINGS is set) and only use Python deprecation warnings in
# that case.
_dowarn = bool(encoding.environ.get(b'HGEMITWARNINGS'))
if _dowarn:
    # explicitly unfilter our warning for python 2.7
    #
    # The option of setting PYTHONWARNINGS in the test runner was investigated.
    # However, module name set through PYTHONWARNINGS was exactly matched, so
    # we cannot set 'mercurial' and have it match eg: 'mercurial.scmutil'. This
    # makes the whole PYTHONWARNINGS thing useless for our usecase.
    warnings.filterwarnings('default', '', DeprecationWarning, 'mercurial')
    warnings.filterwarnings('default', '', DeprecationWarning, 'hgext')
    warnings.filterwarnings('default', '', DeprecationWarning, 'hgext3rd')
if _dowarn:
    # silence warning emitted by passing user string to re.sub()
    warnings.filterwarnings(
        'ignore', 'bad escape', DeprecationWarning, 'mercurial'
    )
    warnings.filterwarnings(
        'ignore', 'invalid escape sequence', DeprecationWarning, 'mercurial'
    )
    # TODO: reinvent imp.is_frozen()
    warnings.filterwarnings(
        'ignore',
        'the imp module is deprecated',
        DeprecationWarning,
        'mercurial',
    )
201
201
202
202
def nouideprecwarn(msg, version, stacklevel=1):
    """Issue a native Python deprecation warning.

    ``msg`` is a bytes message; a note naming the Mercurial ``version``
    after which compatibility is dropped gets appended to it.
    ``stacklevel`` is counted relative to the caller of this function.

    This is a noop outside of tests, use 'ui.deprecwarn' when possible.
    """
    if not _dowarn:
        return
    suffix = (
        b"\n(compatibility will be dropped after Mercurial-%s,"
        b" update your code.)"
    ) % version
    msg += suffix
    # one extra level so the warning does not point at this helper itself
    warnings.warn(pycompat.sysstr(msg), DeprecationWarning, stacklevel + 1)
    # on python 3 with chg, we will need to explicitly flush the output
    sys.stderr.flush()
216
216
217
217
# Supported digest names mapped to the constructor producing a fresh hash
# object for that digest.
DIGESTS = {
    b'md5': hashlib.md5,
    b'sha1': hashutil.sha1,
    b'sha512': hashlib.sha512,
}
# List of digest types from strongest to weakest
DIGESTS_BY_STRENGTH = [b'sha512', b'sha1', b'md5']

# Sanity check: every digest ranked above must have an entry in DIGESTS.
# NOTE: the loop variable ``k`` stays defined at module level afterwards.
for k in DIGESTS_BY_STRENGTH:
    assert k in DIGESTS
228
228
229
229
class digester:
    """helper to compute digests.

    This helper can be used to compute one or more digests given their name.

    >>> d = digester([b'md5', b'sha1'])
    >>> d.update(b'foo')
    >>> [k for k in sorted(d)]
    ['md5', 'sha1']
    >>> d[b'md5']
    'acbd18db4cc2f85cedef654fccc4a4d8'
    >>> d[b'sha1']
    '0beec7b5ea3f0fdbc95d0dd47f3c5bc275da8a33'
    >>> digester.preferred([b'md5', b'sha1'])
    'sha1'
    """

    def __init__(self, digests, s=b''):
        """Create one hash object per name in ``digests``.

        ``s`` is optional initial data fed to every hash. Raises
        ``error.Abort`` when a name is not a key of ``DIGESTS``.
        """
        self._hashes = {}
        for k in digests:
            if k not in DIGESTS:
                raise error.Abort(_(b'unknown digest type: %s') % k)
            self._hashes[k] = DIGESTS[k]()
        if s:
            self.update(s)

    def update(self, data):
        """Feed ``data`` to every hash object being tracked."""
        for h in self._hashes.values():
            h.update(data)

    def __getitem__(self, key):
        """Return the hex digest computed so far for digest type ``key``.

        Raises ``error.Abort`` when ``key`` is not a key of ``DIGESTS``.
        """
        if key not in DIGESTS:
            # Report the key that was actually requested. This used to
            # format an unrelated ``k`` name instead of ``key``.
            raise error.Abort(_(b'unknown digest type: %s') % key)
        return hex(self._hashes[key].digest())

    def __iter__(self):
        """Iterate over the digest names tracked by this instance."""
        return iter(self._hashes)

    @staticmethod
    def preferred(supported):
        """returns the strongest digest type in both supported and DIGESTS."""

        for k in DIGESTS_BY_STRENGTH:
            if k in supported:
                return k
        # no known digest type is supported
        return None
276
276
277
277
class digestchecker:
    """file handle wrapper that additionally checks content against a given
    size and digests.

        d = digestchecker(fh, size, {'md5': '...'})

    When multiple digests are given, all of them are validated.
    """

    def __init__(self, fh, size, digests):
        self._fh = fh
        # expected total size, and the amount read through this wrapper so far
        self._size = size
        self._got = 0
        # expected digest values keyed by digest name
        self._digests = dict(digests)
        self._digester = digester(self._digests.keys())

    def read(self, length=-1):
        """Read from the wrapped handle, accounting for the returned data."""
        chunk = self._fh.read(length)
        self._digester.update(chunk)
        self._got += len(chunk)
        return chunk

    def validate(self):
        """Raise ``error.Abort`` if the size or any digest does not match."""
        if self._size != self._got:
            raise error.Abort(
                _(b'size mismatch: expected %d, got %d')
                % (self._size, self._got)
            )
        for name, expected in self._digests.items():
            actual = self._digester[name]
            if expected == actual:
                continue
            # i18n: first parameter is a digest name
            raise error.Abort(
                _(b'%s mismatch: expected %s, got %s')
                % (name, expected, actual)
            )
313
313
314
314
try:
    buffer = buffer  # pytype: disable=name-error
except NameError:

    def buffer(sliceable, offset=0, length=None):
        """Return a memoryview over ``sliceable`` starting at ``offset``.

        When ``length`` is given the view spans at most ``length`` items,
        otherwise it runs to the end of ``sliceable``.
        """
        view = memoryview(sliceable)
        if length is None:
            return view[offset:]
        return view[offset : offset + length]
323
323
324
324
_chunksize = 4096


class bufferedinputpipe:
    """a manually buffered input pipe

    Python will not let us use buffered IO and lazy reading with 'polling' at
    the same time. We cannot probe the buffer state and select will not detect
    that data are ready to read if they are already buffered.

    This class lets us work around that by implementing its own buffering
    (allowing efficient readline) while offering a way to know if the buffer is
    empty from the output (allowing collaboration of the buffer with polling).

    This class lives in the 'util' module because it makes use of the 'os'
    module from the python stdlib.
    """

    def __new__(cls, fh):
        # If we receive a fileobjectproxy, we need to use a variation of this
        # class that notifies observers about activity.
        if isinstance(fh, fileobjectproxy):
            target = observedbufferedinputpipe
        else:
            target = cls
        return super(bufferedinputpipe, target).__new__(target)

    def __init__(self, input):
        # pending chunks, and the total number of bytes they hold
        self._buffer = []
        self._lenbuf = 0
        # set once a read on the underlying descriptor returned no data
        self._eof = False
        self._input = input

    @property
    def hasbuffer(self):
        """True if any data is currently buffered

        This will be used externally as a pre-step for polling IO. If there
        is already data then no polling should be set in place."""
        return len(self._buffer) > 0

    @property
    def closed(self):
        return self._input.closed

    def fileno(self):
        return self._input.fileno()

    def close(self):
        return self._input.close()

    def read(self, size):
        """Return up to ``size`` bytes, reading until enough data or EOF."""
        while not (self._eof or self._lenbuf >= size):
            self._fillbuffer()
        return self._frombuffer(size)

    def unbufferedread(self, size):
        """Return up to ``size`` bytes, doing at most one underlying read.

        The underlying read only happens when nothing is buffered yet.
        """
        nothingpending = not self._eof and self._lenbuf == 0
        if nothingpending:
            self._fillbuffer(max(size, _chunksize))
        return self._frombuffer(min(self._lenbuf, size))

    def readline(self, *args, **kwargs):
        """Return data up to and including the next newline (or up to EOF)."""
        if len(self._buffer) > 1:
            # this should not happen because both read and readline end with a
            # _frombuffer call that collapses it.
            merged = b''.join(self._buffer)
            self._buffer = [merged]
            self._lenbuf = len(merged)

        # position of the newline within the most recent chunk
        newline = self._buffer[-1].find(b'\n') if self._buffer else -1
        while (not self._eof) and newline < 0:
            self._fillbuffer()
            if self._buffer:
                newline = self._buffer[-1].find(b'\n')

        if newline < 0:
            # end of file: hand out whatever is left
            size = self._lenbuf
        else:
            size = newline + 1
            if len(self._buffer) > 1:
                # we need to take previous chunks into account
                size += self._lenbuf - len(self._buffer[-1])
        return self._frombuffer(size)

    def _frombuffer(self, size):
        """return at most 'size' data from the buffer

        The data are removed from the buffer."""
        if size == 0 or not self._buffer:
            return b''
        if len(self._buffer) > 1:
            pending = b''.join(self._buffer)
        else:
            pending = self._buffer[0]

        data = pending[:size]
        rest = pending[len(data) :]
        # keep the leftover as a single chunk (or nothing at all)
        self._buffer = [rest] if rest else []
        self._lenbuf = len(rest)
        return data

    def _fillbuffer(self, size=_chunksize):
        """read data to the buffer"""
        data = os.read(self._input.fileno(), size)
        if data:
            self._lenbuf += len(data)
            self._buffer.append(data)
        else:
            self._eof = True

        return data
436
436
437
437
def mmapread(fp, size=None):
    """Return a read-only memory map of ``fp``'s content.

    ``fp`` is either an object with a ``fileno()`` method or a raw file
    descriptor. ``size`` limits the mapping to that many bytes; ``None``
    maps the whole file and ``0`` returns ``b''`` without mapping anything.
    An empty file also yields ``b''``.
    """
    if size == 0:
        # size of 0 to mmap.mmap() means "all data"
        # rather than "zero bytes", so special case that.
        return b''
    length = 0 if size is None else size

    try:
        fileno = fp.fileno
    except AttributeError:
        # not a file object: treat it as a file descriptor
        fd = fp
    else:
        fd = fileno()

    try:
        return mmap.mmap(fd, length, access=mmap.ACCESS_READ)
    except ValueError:
        # Empty files cannot be mmapped, but mmapread should still work. Check
        # if the file is empty, and if so, return an empty buffer.
        if os.fstat(fd).st_size != 0:
            raise
        return b''
454
454
455
455
456 class fileobjectproxy:
456 class fileobjectproxy:
457 """A proxy around file objects that tells a watcher when events occur.
457 """A proxy around file objects that tells a watcher when events occur.
458
458
459 This type is intended to only be used for testing purposes. Think hard
459 This type is intended to only be used for testing purposes. Think hard
460 before using it in important code.
460 before using it in important code.
461 """
461 """
462
462
463 __slots__ = (
463 __slots__ = (
464 '_orig',
464 '_orig',
465 '_observer',
465 '_observer',
466 )
466 )
467
467
468 def __init__(self, fh, observer):
468 def __init__(self, fh, observer):
469 object.__setattr__(self, '_orig', fh)
469 object.__setattr__(self, '_orig', fh)
470 object.__setattr__(self, '_observer', observer)
470 object.__setattr__(self, '_observer', observer)
471
471
472 def __getattribute__(self, name):
472 def __getattribute__(self, name):
473 ours = {
473 ours = {
474 '_observer',
474 '_observer',
475 # IOBase
475 # IOBase
476 'close',
476 'close',
477 # closed if a property
477 # closed if a property
478 'fileno',
478 'fileno',
479 'flush',
479 'flush',
480 'isatty',
480 'isatty',
481 'readable',
481 'readable',
482 'readline',
482 'readline',
483 'readlines',
483 'readlines',
484 'seek',
484 'seek',
485 'seekable',
485 'seekable',
486 'tell',
486 'tell',
487 'truncate',
487 'truncate',
488 'writable',
488 'writable',
489 'writelines',
489 'writelines',
490 # RawIOBase
490 # RawIOBase
491 'read',
491 'read',
492 'readall',
492 'readall',
493 'readinto',
493 'readinto',
494 'write',
494 'write',
495 # BufferedIOBase
495 # BufferedIOBase
496 # raw is a property
496 # raw is a property
497 'detach',
497 'detach',
498 # read defined above
498 # read defined above
499 'read1',
499 'read1',
500 # readinto defined above
500 # readinto defined above
501 # write defined above
501 # write defined above
502 }
502 }
503
503
504 # We only observe some methods.
504 # We only observe some methods.
505 if name in ours:
505 if name in ours:
506 return object.__getattribute__(self, name)
506 return object.__getattribute__(self, name)
507
507
508 return getattr(object.__getattribute__(self, '_orig'), name)
508 return getattr(object.__getattribute__(self, '_orig'), name)
509
509
510 def __nonzero__(self):
510 def __nonzero__(self):
511 return bool(object.__getattribute__(self, '_orig'))
511 return bool(object.__getattribute__(self, '_orig'))
512
512
513 __bool__ = __nonzero__
513 __bool__ = __nonzero__
514
514
515 def __delattr__(self, name):
515 def __delattr__(self, name):
516 return delattr(object.__getattribute__(self, '_orig'), name)
516 return delattr(object.__getattribute__(self, '_orig'), name)
517
517
518 def __setattr__(self, name, value):
518 def __setattr__(self, name, value):
519 return setattr(object.__getattribute__(self, '_orig'), name, value)
519 return setattr(object.__getattribute__(self, '_orig'), name, value)
520
520
521 def __iter__(self):
521 def __iter__(self):
522 return object.__getattribute__(self, '_orig').__iter__()
522 return object.__getattribute__(self, '_orig').__iter__()
523
523
524 def _observedcall(self, name, *args, **kwargs):
524 def _observedcall(self, name, *args, **kwargs):
525 # Call the original object.
525 # Call the original object.
526 orig = object.__getattribute__(self, '_orig')
526 orig = object.__getattribute__(self, '_orig')
527 res = getattr(orig, name)(*args, **kwargs)
527 res = getattr(orig, name)(*args, **kwargs)
528
528
529 # Call a method on the observer of the same name with arguments
529 # Call a method on the observer of the same name with arguments
530 # so it can react, log, etc.
530 # so it can react, log, etc.
531 observer = object.__getattribute__(self, '_observer')
531 observer = object.__getattribute__(self, '_observer')
532 fn = getattr(observer, name, None)
532 fn = getattr(observer, name, None)
533 if fn:
533 if fn:
534 fn(res, *args, **kwargs)
534 fn(res, *args, **kwargs)
535
535
536 return res
536 return res
537
537
538 def close(self, *args, **kwargs):
538 def close(self, *args, **kwargs):
539 return object.__getattribute__(self, '_observedcall')(
539 return object.__getattribute__(self, '_observedcall')(
540 'close', *args, **kwargs
540 'close', *args, **kwargs
541 )
541 )
542
542
543 def fileno(self, *args, **kwargs):
543 def fileno(self, *args, **kwargs):
544 return object.__getattribute__(self, '_observedcall')(
544 return object.__getattribute__(self, '_observedcall')(
545 'fileno', *args, **kwargs
545 'fileno', *args, **kwargs
546 )
546 )
547
547
548 def flush(self, *args, **kwargs):
548 def flush(self, *args, **kwargs):
549 return object.__getattribute__(self, '_observedcall')(
549 return object.__getattribute__(self, '_observedcall')(
550 'flush', *args, **kwargs
550 'flush', *args, **kwargs
551 )
551 )
552
552
553 def isatty(self, *args, **kwargs):
553 def isatty(self, *args, **kwargs):
554 return object.__getattribute__(self, '_observedcall')(
554 return object.__getattribute__(self, '_observedcall')(
555 'isatty', *args, **kwargs
555 'isatty', *args, **kwargs
556 )
556 )
557
557
558 def readable(self, *args, **kwargs):
558 def readable(self, *args, **kwargs):
559 return object.__getattribute__(self, '_observedcall')(
559 return object.__getattribute__(self, '_observedcall')(
560 'readable', *args, **kwargs
560 'readable', *args, **kwargs
561 )
561 )
562
562
563 def readline(self, *args, **kwargs):
563 def readline(self, *args, **kwargs):
564 return object.__getattribute__(self, '_observedcall')(
564 return object.__getattribute__(self, '_observedcall')(
565 'readline', *args, **kwargs
565 'readline', *args, **kwargs
566 )
566 )
567
567
568 def readlines(self, *args, **kwargs):
568 def readlines(self, *args, **kwargs):
569 return object.__getattribute__(self, '_observedcall')(
569 return object.__getattribute__(self, '_observedcall')(
570 'readlines', *args, **kwargs
570 'readlines', *args, **kwargs
571 )
571 )
572
572
573 def seek(self, *args, **kwargs):
573 def seek(self, *args, **kwargs):
574 return object.__getattribute__(self, '_observedcall')(
574 return object.__getattribute__(self, '_observedcall')(
575 'seek', *args, **kwargs
575 'seek', *args, **kwargs
576 )
576 )
577
577
def seekable(self, *args, **kwargs):
    """Route ``seekable`` through ``_observedcall`` and return its result.

    All positional and keyword arguments are passed along unchanged.
    """
    # Fetch the helper with object.__getattribute__ so the lookup does not
    # go through any __getattribute__ override on the proxy class.
    observed = object.__getattribute__(self, '_observedcall')
    return observed('seekable', *args, **kwargs)
582
582
def tell(self, *args, **kwargs):
    """Route ``tell`` through ``_observedcall`` and return its result.

    All positional and keyword arguments are passed along unchanged.
    """
    # Fetch the helper with object.__getattribute__ so the lookup does not
    # go through any __getattribute__ override on the proxy class.
    observed = object.__getattribute__(self, '_observedcall')
    return observed('tell', *args, **kwargs)
587
587
def truncate(self, *args, **kwargs):
    """Route ``truncate`` through ``_observedcall`` and return its result.

    All positional and keyword arguments are passed along unchanged.
    """
    # Fetch the helper with object.__getattribute__ so the lookup does not
    # go through any __getattribute__ override on the proxy class.
    observed = object.__getattribute__(self, '_observedcall')
    return observed('truncate', *args, **kwargs)
592
592
def writable(self, *args, **kwargs):
    """Route ``writable`` through ``_observedcall`` and return its result.

    All positional and keyword arguments are passed along unchanged.
    """
    # Fetch the helper with object.__getattribute__ so the lookup does not
    # go through any __getattribute__ override on the proxy class.
    observed = object.__getattribute__(self, '_observedcall')
    return observed('writable', *args, **kwargs)
597
597
def writelines(self, *args, **kwargs):
    """Route ``writelines`` through ``_observedcall`` and return its result.

    All positional and keyword arguments are passed along unchanged.
    """
    # Fetch the helper with object.__getattribute__ so the lookup does not
    # go through any __getattribute__ override on the proxy class.
    observed = object.__getattribute__(self, '_observedcall')
    return observed('writelines', *args, **kwargs)
602
602
def read(self, *args, **kwargs):
    """Route ``read`` through ``_observedcall`` and return its result.

    All positional and keyword arguments are passed along unchanged.
    """
    # Fetch the helper with object.__getattribute__ so the lookup does not
    # go through any __getattribute__ override on the proxy class.
    observed = object.__getattribute__(self, '_observedcall')
    return observed('read', *args, **kwargs)
607
607
def readall(self, *args, **kwargs):
    """Route ``readall`` through ``_observedcall`` and return its result.

    All positional and keyword arguments are passed along unchanged.
    """
    # Fetch the helper with object.__getattribute__ so the lookup does not
    # go through any __getattribute__ override on the proxy class.
    observed = object.__getattribute__(self, '_observedcall')
    return observed('readall', *args, **kwargs)
612
612
def readinto(self, *args, **kwargs):
    """Route ``readinto`` through ``_observedcall`` and return its result.

    All positional and keyword arguments are passed along unchanged.
    """
    # Fetch the helper with object.__getattribute__ so the lookup does not
    # go through any __getattribute__ override on the proxy class.
    observed = object.__getattribute__(self, '_observedcall')
    return observed('readinto', *args, **kwargs)
617
617
def write(self, *args, **kwargs):
    """Route ``write`` through ``_observedcall`` and return its result.

    All positional and keyword arguments are passed along unchanged.
    """
    # Fetch the helper with object.__getattribute__ so the lookup does not
    # go through any __getattribute__ override on the proxy class.
    observed = object.__getattribute__(self, '_observedcall')
    return observed('write', *args, **kwargs)
622
622
def detach(self, *args, **kwargs):
    """Route ``detach`` through ``_observedcall`` and return its result.

    All positional and keyword arguments are passed along unchanged.
    """
    # Fetch the helper with object.__getattribute__ so the lookup does not
    # go through any __getattribute__ override on the proxy class.
    observed = object.__getattribute__(self, '_observedcall')
    return observed('detach', *args, **kwargs)
627
627
def read1(self, *args, **kwargs):
    """Route ``read1`` through ``_observedcall`` and return its result.

    All positional and keyword arguments are passed along unchanged.
    """
    # Fetch the helper with object.__getattribute__ so the lookup does not
    # go through any __getattribute__ override on the proxy class.
    observed = object.__getattribute__(self, '_observedcall')
    return observed('read1', *args, **kwargs)
632
632
633
633
class observedbufferedinputpipe(bufferedinputpipe):
    """A ``bufferedinputpipe`` that reports its activity to an observer.

    ``bufferedinputpipe`` performs low-level ``os.read()`` calls that do not
    go through ``fileobjectproxy``, so the proxy's observer would otherwise
    never hear about them. This subclass closes that gap: after each
    operation it looks for a matching hook on ``self._input._observer`` and,
    when one exists, calls it with the result.

    The hooks are named differently from the plain file methods
    (``osread``, ``bufferedread``, ``bufferedreadline``) because the
    operation happens on this object rather than on the underlying file
    object.
    """

    def _fillbuffer(self, size=_chunksize):
        """Fill the buffer via the parent class, then report ``osread``."""
        data = super()._fillbuffer(size=size)

        notify = getattr(self._input._observer, 'osread', None)
        if notify:
            notify(data, size)
        return data

    def read(self, size):
        """Read via the parent class, then report ``bufferedread``."""
        data = super().read(size)

        notify = getattr(self._input._observer, 'bufferedread', None)
        if notify:
            notify(data, size)
        return data

    def readline(self, *args, **kwargs):
        """Read a line via the parent class, then report ``bufferedreadline``."""
        line = super().readline(*args, **kwargs)

        notify = getattr(self._input._observer, 'bufferedreadline', None)
        if notify:
            notify(line)
        return line
674
674
675
675
# Names that ``socketproxy.__getattribute__`` resolves on the proxy itself;
# every other attribute lookup is forwarded to the wrapped socket.
PROXIED_SOCKET_METHODS = {
    # state / configuration
    'gettimeout',
    'makefile',
    'setblocking',
    'setsockopt',
    'settimeout',
    # receiving
    'recv',
    'recv_into',
    'recvfrom',
    'recvfrom_into',
    # sending
    'send',
    'sendall',
    'sendto',
}
690
690
691
691
class socketproxy:
    """A proxy around a socket that tells a watcher when events occur.

    This is like ``fileobjectproxy`` except for sockets.

    Attribute reads, writes and deletions are forwarded to the wrapped
    socket, except for the names in ``PROXIED_SOCKET_METHODS``, which are
    served by the wrapper methods defined here. Each wrapper calls the real
    socket method and then, if the observer has a method of the same name,
    calls it with the result followed by the original arguments.

    This type is intended to only be used for testing purposes. Think hard
    before using it in important code.
    """

    __slots__ = (
        '_orig',
        '_observer',
    )

    def __init__(self, sock, observer):
        """Wrap ``sock`` and report its activity to ``observer``."""
        # __setattr__ below forwards to the wrapped socket, so the proxy's
        # own slots have to be populated through object.__setattr__.
        object.__setattr__(self, '_orig', sock)
        object.__setattr__(self, '_observer', observer)

    def __getattribute__(self, name):
        """Serve proxied method names locally; forward everything else."""
        if name in PROXIED_SOCKET_METHODS:
            return object.__getattribute__(self, name)

        return getattr(object.__getattribute__(self, '_orig'), name)

    def __delattr__(self, name):
        """Delete ``name`` on the wrapped socket."""
        return delattr(object.__getattribute__(self, '_orig'), name)

    def __setattr__(self, name, value):
        """Set ``name`` on the wrapped socket."""
        return setattr(object.__getattribute__(self, '_orig'), name, value)

    def __nonzero__(self):
        """Return the truth value of the wrapped socket."""
        return bool(object.__getattribute__(self, '_orig'))

    __bool__ = __nonzero__

    def _observedcall(self, name, *args, **kwargs):
        """Call ``name`` on the wrapped socket, then notify the observer.

        Returns whatever the wrapped socket's method returned. The observer
        hook, when present, receives ``(result, *args, **kwargs)``; its own
        return value is ignored.
        """
        # Call the original object.
        orig = object.__getattribute__(self, '_orig')
        res = getattr(orig, name)(*args, **kwargs)

        # Call a method on the observer of the same name with arguments
        # so it can react, log, etc.
        observer = object.__getattribute__(self, '_observer')
        fn = getattr(observer, name, None)
        if fn:
            fn(res, *args, **kwargs)

        return res

    def makefile(self, *args, **kwargs):
        """Observed ``makefile()`` whose result is itself a logging proxy."""
        res = object.__getattribute__(self, '_observedcall')(
            'makefile', *args, **kwargs
        )

        # The file object may be used for I/O. So we turn it into a
        # proxy using our observer.
        observer = object.__getattribute__(self, '_observer')
        return makeloggingfileobject(
            observer.fh,
            res,
            observer.name,
            reads=observer.reads,
            writes=observer.writes,
            logdata=observer.logdata,
            logdataapis=observer.logdataapis,
        )

    def recv(self, *args, **kwargs):
        """Observed ``recv()``."""
        return object.__getattribute__(self, '_observedcall')(
            'recv', *args, **kwargs
        )

    def recvfrom(self, *args, **kwargs):
        """Observed ``recvfrom()``."""
        return object.__getattribute__(self, '_observedcall')(
            'recvfrom', *args, **kwargs
        )

    def recvfrom_into(self, *args, **kwargs):
        """Observed ``recvfrom_into()``."""
        return object.__getattribute__(self, '_observedcall')(
            'recvfrom_into', *args, **kwargs
        )

    def recv_into(self, *args, **kwargs):
        """Observed ``recv_into()``."""
        # The forwarded name must match the socket method exactly: it is
        # used both to find the method on the wrapped socket and to find
        # the hook on the observer.
        return object.__getattribute__(self, '_observedcall')(
            'recv_into', *args, **kwargs
        )

    def send(self, *args, **kwargs):
        """Observed ``send()``."""
        return object.__getattribute__(self, '_observedcall')(
            'send', *args, **kwargs
        )

    def sendall(self, *args, **kwargs):
        """Observed ``sendall()``."""
        return object.__getattribute__(self, '_observedcall')(
            'sendall', *args, **kwargs
        )

    def sendto(self, *args, **kwargs):
        """Observed ``sendto()``."""
        return object.__getattribute__(self, '_observedcall')(
            'sendto', *args, **kwargs
        )

    def setblocking(self, *args, **kwargs):
        """Observed ``setblocking()``."""
        return object.__getattribute__(self, '_observedcall')(
            'setblocking', *args, **kwargs
        )

    def settimeout(self, *args, **kwargs):
        """Observed ``settimeout()``."""
        return object.__getattribute__(self, '_observedcall')(
            'settimeout', *args, **kwargs
        )

    def gettimeout(self, *args, **kwargs):
        """Observed ``gettimeout()``."""
        return object.__getattribute__(self, '_observedcall')(
            'gettimeout', *args, **kwargs
        )

    def setsockopt(self, *args, **kwargs):
        """Observed ``setsockopt()``."""
        return object.__getattribute__(self, '_observedcall')(
            'setsockopt', *args, **kwargs
        )
813
813
814
814
class baseproxyobserver:
    """Shared state and payload formatting for proxy observers.

    ``fh`` is the handle log output is written to (bytes are written and
    the handle is flushed), ``name`` is the bytes prefix used on payload
    lines, ``logdata`` selects whether payloads are logged at all, and
    ``logdataapis`` says whether the caller has already written an API
    header (without a trailing newline) that the payload should continue.
    """

    def __init__(self, fh, name, logdata, logdataapis):
        self.fh = fh
        self.name = name
        self.logdata = logdata
        self.logdataapis = logdataapis

    def _writedata(self, data):
        """Write ``data`` to the log in the configured format, then flush.

        With ``logdata`` off, only the newline terminating a pending API
        header is written (and nothing at all when ``logdataapis`` is off
        too). Otherwise single-line data goes on one line and data that
        contains newlines is written one escaped line per output line.
        """
        out = self.fh

        if not self.logdata:
            # Nothing to log beyond finishing the API header line.
            if self.logdataapis:
                out.write(b'\n')
                out.flush()
            return

        if b'\n' in data:
            # Multi-line payload: close the header, then one line each.
            if self.logdataapis:
                out.write(b':\n')

            for chunk in data.splitlines(True):
                out.write(
                    b'%s> %s\n' % (self.name, stringutil.escapestr(chunk))
                )
        elif self.logdataapis:
            # Single-line payload appended to the pending API header.
            out.write(b': %s\n' % stringutil.escapestr(data))
        else:
            # Single-line payload on a line of its own.
            out.write(b'%s> %s\n' % (self.name, stringutil.escapestr(data)))

        out.flush()
850
850
851
851
class fileobjectobserver(baseproxyobserver):
    """Observer that writes a log of file object calls to ``fh``.

    ``reads`` and ``writes`` switch logging of the read-side and write-side
    hooks on or off. Every hook receives the call's result as ``res``
    followed by the arguments the call was made with.
    """

    def __init__(
        self, fh, name, reads=True, writes=True, logdata=False, logdataapis=True
    ):
        super().__init__(fh, name, logdata, logdataapis)
        self.reads = reads
        self.writes = writes

    def read(self, res, size=-1):
        """Log a ``read(size)`` call that returned ``res``."""
        if not self.reads:
            return

        # Python 3 can return None from reads at EOF instead of empty strings.
        payload = b'' if res is None else res

        # Suppress pointless read(-1) calls that return nothing. These
        # happen _a lot_ on Python 3, and there doesn't seem to be a
        # better workaround to have matching Python 2 and 3 behavior. :(
        if size == -1 and payload == b'':
            return

        if self.logdataapis:
            header = b'%s> read(%d) -> %d' % (self.name, size, len(payload))
            self.fh.write(header)

        self._writedata(payload)

    def readline(self, res, limit=-1):
        """Log a ``readline()`` call that returned ``res``."""
        if self.reads:
            if self.logdataapis:
                header = b'%s> readline() -> %d' % (self.name, len(res))
                self.fh.write(header)

            self._writedata(res)

    def readinto(self, res, dest):
        """Log a ``readinto(dest)`` call that reported ``res`` bytes."""
        if not self.reads:
            return

        if self.logdataapis:
            header = b'%s> readinto(%d) -> %r' % (self.name, len(dest), res)
            self.fh.write(header)

        if res is None:
            data = b''
        else:
            data = dest[0:res]

        # _writedata() uses "in" operator and is confused by memoryview because
        # characters are ints on Python 3.
        if isinstance(data, memoryview):
            data = data.tobytes()

        self._writedata(data)

    def write(self, res, data):
        """Log a ``write(data)`` call that returned ``res``."""
        if not self.writes:
            return

        # Python 2 returns None from some write() calls. Python 3 (reasonably)
        # returns the integer bytes written.
        if res is None and data:
            res = len(data)

        if self.logdataapis:
            header = b'%s> write(%d) -> %r' % (self.name, len(data), res)
            self.fh.write(header)

        self._writedata(data)

    def flush(self, res):
        """Log a ``flush()`` call that returned ``res``."""
        if self.writes:
            self.fh.write(b'%s> flush() -> %r\n' % (self.name, res))

    # For observedbufferedinputpipe.
    def bufferedread(self, res, size):
        """Log a buffered ``read(size)`` that returned ``res``."""
        if not self.reads:
            return

        if self.logdataapis:
            header = b'%s> bufferedread(%d) -> %d' % (
                self.name,
                size,
                len(res),
            )
            self.fh.write(header)

        self._writedata(res)

    def bufferedreadline(self, res):
        """Log a buffered ``readline()`` that returned ``res``."""
        if not self.reads:
            return

        if self.logdataapis:
            header = b'%s> bufferedreadline() -> %d' % (self.name, len(res))
            self.fh.write(header)

        self._writedata(res)
950
950
951
951
def makeloggingfileobject(
    logh, fh, name, reads=True, writes=True, logdata=False, logdataapis=True
):
    """Wrap ``fh`` in a ``fileobjectproxy`` that logs to ``logh``.

    A ``fileobjectobserver`` is built from ``logh``, ``name`` and the
    logging switches, and the returned proxy pairs it with ``fh``.
    """
    options = {
        'reads': reads,
        'writes': writes,
        'logdata': logdata,
        'logdataapis': logdataapis,
    }
    return fileobjectproxy(fh, fileobjectobserver(logh, name, **options))
966
966
967
967
class socketobserver(baseproxyobserver):
    """Logs socket activity.

    ``reads``, ``writes`` and ``states`` switch logging of receive calls,
    send calls, and configuration calls (``makefile``, ``setblocking``,
    timeouts, ``setsockopt``) on or off. Every hook receives the socket
    call's result as ``res`` followed by the arguments the call was made
    with, mirroring the corresponding ``socket`` method signature.
    """

    def __init__(
        self,
        fh,
        name,
        reads=True,
        writes=True,
        states=True,
        logdata=False,
        logdataapis=True,
    ):
        super(socketobserver, self).__init__(fh, name, logdata, logdataapis)
        self.reads = reads
        self.writes = writes
        self.states = states

    def makefile(self, res, mode=None, bufsize=None):
        """Log a ``makefile()`` call."""
        if not self.states:
            return

        self.fh.write(b'%s> makefile(%r, %r)\n' % (self.name, mode, bufsize))

    def recv(self, res, size, flags=0):
        """Log a ``recv()`` call that returned the bytes ``res``."""
        if not self.reads:
            return

        if self.logdataapis:
            self.fh.write(
                b'%s> recv(%d, %d) -> %d' % (self.name, size, flags, len(res))
            )
        self._writedata(res)

    def recvfrom(self, res, size, flags=0):
        """Log a ``recvfrom()`` call; ``res[0]`` is the received data."""
        if not self.reads:
            return

        if self.logdataapis:
            self.fh.write(
                b'%s> recvfrom(%d, %d) -> %d'
                % (self.name, size, flags, len(res[0]))
            )

        self._writedata(res[0])

    def recvfrom_into(self, res, buf, size=0, flags=0):
        """Log a ``recvfrom_into()`` call; ``res[0]`` is the byte count.

        ``size`` defaults to 0 because the socket method allows the byte
        count to be omitted, and this hook is called with exactly the
        arguments the caller passed.
        """
        if not self.reads:
            return

        if self.logdataapis:
            self.fh.write(
                b'%s> recvfrom_into(%d, %d) -> %d'
                % (self.name, size, flags, res[0])
            )

        # Normalize the slice to bytes: _writedata()'s "in" test is confused
        # by memoryview (see fileobjectobserver.readinto).
        self._writedata(bytes(buf[0 : res[0]]))

    def recv_into(self, res, buf, size=0, flags=0):
        """Log a ``recv_into()`` call that stored ``res`` bytes in ``buf``."""
        if not self.reads:
            return

        if self.logdataapis:
            self.fh.write(
                b'%s> recv_into(%d, %d) -> %d' % (self.name, size, flags, res)
            )

        # Normalize the slice to bytes: _writedata()'s "in" test is confused
        # by memoryview (see fileobjectobserver.readinto).
        self._writedata(bytes(buf[0:res]))

    def send(self, res, data, flags=0):
        """Log a ``send()`` call; ``res`` is the number of bytes sent."""
        if not self.writes:
            return

        # socket.send() returns an integer byte count, so it is formatted
        # directly. The header is only written when API logging is on, like
        # every other data hook, so _writedata() output stays well formed.
        if self.logdataapis:
            self.fh.write(
                b'%s> send(%d, %d) -> %d' % (self.name, len(data), flags, res)
            )
        self._writedata(data)

    def sendall(self, res, data, flags=0):
        """Log a ``sendall()`` call."""
        if not self.writes:
            return

        if self.logdataapis:
            # Returns None on success. So don't bother reporting return value.
            self.fh.write(
                b'%s> sendall(%d, %d)' % (self.name, len(data), flags)
            )

        self._writedata(data)

    def sendto(self, res, data, flagsoraddress, address=None):
        """Log a ``sendto()`` call in either of its two call forms.

        ``sendto(data, address)`` passes the address in the second
        position; ``sendto(data, flags, address)`` passes flags there.
        """
        if not self.writes:
            return

        if address is not None:
            flags = flagsoraddress
        else:
            # Two-argument form: the positional slot holds the address.
            flags = 0
            address = flagsoraddress

        if self.logdataapis:
            self.fh.write(
                b'%s> sendto(%d, %d, %r) -> %d'
                % (self.name, len(data), flags, address, res)
            )

        self._writedata(data)

    def setblocking(self, res, flag):
        """Log a ``setblocking()`` call."""
        if not self.states:
            return

        self.fh.write(b'%s> setblocking(%r)\n' % (self.name, flag))

    def settimeout(self, res, value):
        """Log a ``settimeout()`` call."""
        if not self.states:
            return

        self.fh.write(b'%s> settimeout(%r)\n' % (self.name, value))

    def gettimeout(self, res):
        """Log a ``gettimeout()`` call that returned ``res``."""
        if not self.states:
            return

        if res is None:
            # No timeout is set; %f cannot format None.
            self.fh.write(b'%s> gettimeout() -> None\n' % self.name)
        else:
            self.fh.write(b'%s> gettimeout() -> %f\n' % (self.name, res))

    def setsockopt(self, res, level, optname, value):
        """Log a ``setsockopt()`` call and its result."""
        if not self.states:
            return

        self.fh.write(
            b'%s> setsockopt(%r, %r, %r) -> %r\n'
            % (self.name, level, optname, value, res)
        )
1101
1101
1102
1102
def makeloggingsocket(
    logh,
    fh,
    name,
    reads=True,
    writes=True,
    states=True,
    logdata=False,
    logdataapis=True,
):
    """Wrap the socket ``fh`` in a ``socketproxy`` that logs to ``logh``.

    A ``socketobserver`` is built from ``logh``, ``name`` and the logging
    switches, and the returned proxy pairs it with ``fh``.
    """
    options = {
        'reads': reads,
        'writes': writes,
        'states': states,
        'logdata': logdata,
        'logdataapis': logdataapis,
    }
    return socketproxy(fh, socketobserver(logh, name, **options))
1125
1125
1126
1126
def version():
    """Return ``__version__.version`` from this package.

    Falls back to ``b'unknown'`` when importing or reading the
    ``__version__`` module raises ``ImportError``.
    """
    try:
        from . import __version__

        # The attribute read stays inside the ``try`` so that an
        # ImportError raised at this point is handled as well.
        found = __version__.version
    except ImportError:
        found = b'unknown'
    return found
1135
1135
1136
1136
def versiontuple(v=None, n=4):
    """Parses a Mercurial version string into an N-tuple.

    ``v`` is the version string (bytes) to parse; when it is empty or not
    given, the result of ``version()`` is parsed instead.

    ``n`` can be 2, 3, or 4 and selects how many fields are returned:
    up to three leading dot-separated integers, then (for ``n == 4``) the
    remaining text after an optional ``+`` or ``-`` separator. Missing
    fields are ``None``. Any other ``n`` raises ``error.ProgrammingError``.

    Here is how some version strings map to returned values:

    >>> v = b'3.6.1+190-df9b73d2d444'
    >>> versiontuple(v, 2)
    (3, 6)
    >>> versiontuple(v, 3)
    (3, 6, 1)
    >>> versiontuple(v, 4)
    (3, 6, 1, '190-df9b73d2d444')

    >>> versiontuple(b'3.6.1+190-df9b73d2d444+20151118')
    (3, 6, 1, '190-df9b73d2d444+20151118')

    >>> v = b'3.6'
    >>> versiontuple(v, 2)
    (3, 6)
    >>> versiontuple(v, 3)
    (3, 6, None)
    >>> versiontuple(v, 4)
    (3, 6, None, None)

    >>> v = b'3.9-rc'
    >>> versiontuple(v, 2)
    (3, 9)
    >>> versiontuple(v, 3)
    (3, 9, None)
    >>> versiontuple(v, 4)
    (3, 9, None, 'rc')

    >>> v = b'3.9-rc+2-02a8fea4289b'
    >>> versiontuple(v, 2)
    (3, 9)
    >>> versiontuple(v, 3)
    (3, 9, None)
    >>> versiontuple(v, 4)
    (3, 9, None, 'rc+2-02a8fea4289b')

    >>> versiontuple(b'4.6rc0')
    (4, 6, None, 'rc0')
    >>> versiontuple(b'4.6rc0+12-425d55e54f98')
    (4, 6, None, 'rc0+12-425d55e54f98')
    >>> versiontuple(b'.1.2.3')
    (None, None, None, '.1.2.3')
    >>> versiontuple(b'12.34..5')
    (12, 34, None, '..5')
    >>> versiontuple(b'1.2.3.4.5.6')
    (1, 2, 3, '.4.5.6')
    """
    if not v:
        v = version()

    matched = remod.match(br'(\d+(?:\.\d+){,2})[+-]?(.*)', v)
    if matched is None:
        # No leading number at all: everything is "extra".
        numeric, extra = b'', v
    else:
        numeric = matched.group(1)
        # An empty remainder is reported as None rather than b''.
        extra = matched.group(2) or None

    assert numeric is not None  # help pytype

    numbers = []
    for piece in numeric.split(b'.'):
        try:
            numbers.append(int(piece))
        except ValueError:
            break
    # (3, 6) -> (3, 6, None)
    numbers.extend([None] * (3 - len(numbers)))

    major, minor, patch = numbers[:3]
    if n == 2:
        return (major, minor)
    if n == 3:
        return (major, minor, patch)
    if n == 4:
        return (major, minor, patch, extra)

    raise error.ProgrammingError(b"invalid version part request: %d" % n)
1222
1222
1223
1223
def cachefunc(func):
    """Return a memoizing wrapper around ``func``.

    Results are kept for the lifetime of the wrapper and are keyed on the
    positional arguments, which therefore have to be hashable.
    """
    # XXX doesn't handle keywords args
    argcount = func.__code__.co_argcount

    if argcount == 0:
        # A one-slot list doubles as the "already computed" flag, so a
        # cached falsy result (None, 0, ...) is still recognised as cached.
        slot = []

        def f():
            if not slot:
                slot.append(func())
            return slot[0]

        return f

    memo = {}

    if argcount == 1:
        # we gain a small amount of time because
        # we don't need to pack/unpack the list
        def f(arg):
            if arg in memo:
                return memo[arg]
            value = memo[arg] = func(arg)
            return value

    else:

        def f(*args):
            if args in memo:
                return memo[args]
            value = memo[args] = func(*args)
            return value

    return f
1253
1253
1254
1254
class cow:
    """mixin that makes copy-on-write easier

    copy() hands back the very same object and merely counts how many
    logical copies are outstanding. The real duplication is deferred until
    preparewrite() is called while such a copy is pending.

    Call preparewrite before doing any writes.
    """

    def preparewrite(self):
        """call this before writes, return self or a copied new object"""
        pending = getattr(self, '_copied', 0)
        if not pending:
            # Nobody else shares this object: it can be written in place.
            return self
        self._copied = pending - 1
        # Function cow.__init__ expects 1 arg(s), got 2 [wrong-arg-count]
        return self.__class__(self)  # pytype: disable=wrong-arg-count

    def copy(self):
        """always do a cheap copy"""
        outstanding = getattr(self, '_copied', 0)
        self._copied = outstanding + 1
        return self
1273
1273
1274
1274
class sortdict(collections.OrderedDict):
    """an ordered dictionary that moves a key to the end whenever it is set

    >>> d1 = sortdict([(b'a', 0), (b'b', 1)])
    >>> d2 = d1.copy()
    >>> d2
    sortdict([('a', 0), ('b', 1)])
    >>> d2.update([(b'a', 2)])
    >>> list(d2.keys()) # should still be in last-set order
    ['b', 'a']
    >>> d1.insert(1, b'a.5', 0.5)
    >>> d1
    sortdict([('a', 0), ('a.5', 0.5), ('b', 1)])
    """

    def __setitem__(self, key, value):
        # Dropping an existing key first is what moves it to the end.
        if key in self:
            del self[key]
        super().__setitem__(key, value)

    if pycompat.ispypy:
        # __setitem__() isn't called as of PyPy 5.8.0
        def update(self, src, **f):
            pairs = src.items() if isinstance(src, dict) else src
            for k, v in pairs:
                self[k] = v
            for k, v in f.items():
                self[k] = v

    def insert(self, position, key, value):
        """Place ``key`` so that it ends up at index ``position``.

        The item is set when the item currently at ``position`` is reached;
        that item and every later one are then re-set so they move behind
        it. Nothing is inserted when no existing item has index
        ``position`` (for instance when it equals ``len(self)``).
        """
        snapshot = list(self.items())
        for index, (oldkey, oldvalue) in enumerate(snapshot):
            if index < position:
                continue
            if index == position:
                self[key] = value
            del self[oldkey]
            self[oldkey] = oldvalue
1312
1312
1313
1313
class cowdict(cow, dict):
    """copy-on-write dict

    Be sure to call d = d.preparewrite() before writing to d.

    copy() returns the very same object and only records that a copy is
    outstanding; preparewrite() creates a real new dict while such a copy
    is pending, as the session below shows.

    >>> a = cowdict()
    >>> a is a.preparewrite()
    True
    >>> b = a.copy()
    >>> b is a
    True
    >>> c = b.copy()
    >>> c is a
    True
    >>> a = a.preparewrite()
    >>> b is a
    False
    >>> a is a.preparewrite()
    True
    >>> c = c.preparewrite()
    >>> b is c
    False
    >>> b is b.preparewrite()
    True
    """
1339
1339
1340
1340
class cowsortdict(cow, sortdict):
    """copy-on-write sortdict

    Combines the deferred copying of ``cow`` with the ordering behaviour of
    ``sortdict``.

    Be sure to call d = d.preparewrite() before writing to d.
    """
1346
1346
1347
1347
class transactional:  # pytype: disable=ignored-metaclass
    """Base class for making a transactional type into a context manager.

    Subclasses provide close() and release(). Used in a ``with`` statement,
    the object is closed when the body finishes without an exception and is
    always released afterwards.

    Note that ``__metaclass__`` is the Python 2 spelling and is ignored by
    Python 3, so the abstract methods are not enforced at instantiation.
    """

    __metaclass__ = abc.ABCMeta

    @abc.abstractmethod
    def close(self):
        """Successfully closes the transaction."""

    @abc.abstractmethod
    def release(self):
        """Marks the end of the transaction.

        If the transaction has not been closed, it will be aborted.
        """

    def __enter__(self):
        return self

    def __exit__(self, exc_type, exc_val, exc_tb):
        # Only a body that completed normally gets its transaction closed;
        # release() runs in every case, including when close() itself fails.
        succeeded = exc_type is None
        try:
            if succeeded:
                self.close()
        finally:
            self.release()
1373
1373
1374
1374
@contextlib.contextmanager
def acceptintervention(tr=None):
    """A context manager that closes the transaction on InterventionRequired

    The transaction is also closed when the body completes normally, and it
    is released in every case. Any other exception leaves it unclosed before
    the release.

    If no transaction was provided, this simply runs the body and returns
    """
    if tr:
        try:
            yield
            tr.close()
        except error.InterventionRequired:
            # The user is expected to step in and resume later, so what
            # has been done so far is kept.
            tr.close()
            raise
        finally:
            tr.release()
    else:
        yield
1392
1392
1393
1393
@contextlib.contextmanager
def nullcontextmanager(enter_result=None):
    """A context manager that does nothing on entry or exit.

    ``enter_result`` is the value a ``with`` statement binds to its ``as``
    target.
    """
    yield enter_result
1397
1397
1398
1398
class _lrucachenode:
    """A node in a doubly linked list.

    Each node links to its two neighbours and carries the key, value and
    cost of one dictionary entry. A node whose key is ``_notset`` is empty.
    """

    __slots__ = ('next', 'prev', 'key', 'value', 'cost')

    def __init__(self):
        # A fresh node is a one-element circular list...
        self.prev = self
        self.next = self
        # ...that holds no entry yet.
        self.markempty()

    def markempty(self):
        """Mark the node as emptied."""
        self.key = _notset
        self.value = None
        self.cost = 0
1421
1421
1422
1422
class lrucachedict:
    """Dict that caches most recent accesses and sets.

    The dict consists of an actual backing dict - indexed by original
    key - and a doubly linked circular list defining the order of entries in
    the cache.

    The head node is the newest entry in the cache. If the cache is full,
    we recycle head.prev and make it the new head. Cache accesses result in
    the node being moved to before the existing head and being marked as the
    new head node.

    Items in the cache can be inserted with an optional "cost" value. This is
    simply an integer that is specified by the caller. The cache can be queried
    for the total cost of all items presently in the cache.

    The cache can also define a maximum cost. If a cache insertion would
    cause the total cost of the cache to go beyond the maximum cost limit,
    nodes will be evicted to make room for the new node. This can be used
    to e.g. set a max memory limit and associate an estimated bytes size
    cost to each item in the cache. By default, no maximum cost is enforced.
    """

    def __init__(self, max, maxcost=0):
        """Create an empty cache.

        ``max`` is stored as ``capacity`` and bounds how many nodes the
        linked list is allowed to grow to. ``maxcost`` is the total cost
        limit; a falsy value (the default) disables cost enforcement.
        """
        self._cache = {}

        # The list always contains at least one node, initially empty.
        self._head = _lrucachenode()
        self._size = 1
        self.capacity = max
        self.totalcost = 0
        self.maxcost = maxcost

    def __len__(self):
        """Return the number of entries currently stored."""
        return len(self._cache)

    def __contains__(self, k):
        """Test for membership without touching the access order."""
        return k in self._cache

    def __iter__(self):
        """Yield the cached keys, from the head node along ``next`` links."""
        # We don't have to iterate in cache order, but why not.
        n = self._head
        for i in range(len(self._cache)):
            yield n.key
            n = n.next

    def __getitem__(self, k):
        """Return the value stored for ``k`` and mark it as the newest entry.

        Raises KeyError if ``k`` is not cached.
        """
        node = self._cache[k]
        self._movetohead(node)
        return node.value

    def insert(self, k, v, cost=0):
        """Insert a new item in the cache with optional cost value.

        If ``k`` is already cached, its value and cost are replaced.
        Otherwise a node is added while the list is below capacity, or the
        last node is recycled. Either way the entry becomes the newest one
        and, when a maximum cost is set, the cost limit is enforced.
        """
        node = self._cache.get(k)
        # Replace existing value and mark as newest.
        if node is not None:
            self.totalcost -= node.cost
            node.value = v
            node.cost = cost
            self.totalcost += cost
            self._movetohead(node)

            if self.maxcost:
                self._enforcecostlimit()

            return

        if self._size < self.capacity:
            node = self._addcapacity()
        else:
            # Grab the last/oldest item.
            node = self._head.prev

        # At capacity. Kill the old entry.
        if node.key is not _notset:
            self.totalcost -= node.cost
            del self._cache[node.key]

        node.key = k
        node.value = v
        node.cost = cost
        self.totalcost += cost
        self._cache[k] = node
        # And mark it as newest entry. No need to adjust order since it
        # is already self._head.prev.
        self._head = node

        if self.maxcost:
            self._enforcecostlimit()

    def __setitem__(self, k, v):
        """Insert ``k`` with the default cost of 0."""
        self.insert(k, v)

    def __delitem__(self, k):
        """Remove ``k``; raises KeyError if it is not cached."""
        self.pop(k)

    def pop(self, k, default=_notset):
        """Remove ``k`` and return its value.

        If ``k`` is missing, ``default`` is returned when one was given and
        KeyError is raised otherwise. The emptied node stays in the linked
        list, repositioned as the oldest node.
        """
        try:
            node = self._cache.pop(k)
        except KeyError:
            if default is _notset:
                raise
            return default

        assert node is not None  # help pytype
        value = node.value
        self.totalcost -= node.cost
        node.markempty()

        # Temporarily mark as newest item before re-adjusting head to make
        # this node the oldest item.
        self._movetohead(node)
        self._head = node.next

        return value

    # Additional dict methods.

    def get(self, k, default=None):
        """Return the value for ``k``, or ``default`` if it is not cached.

        Like ``__getitem__``, a hit marks the entry as the newest one.
        """
        try:
            return self.__getitem__(k)
        except KeyError:
            return default

    def peek(self, k, default=_notset):
        """Get the specified item without moving it to the head

        Unlike get(), this doesn't mutate the internal state. But be aware
        that it doesn't mean peek() is thread safe.
        """
        try:
            node = self._cache[k]
            assert node is not None  # help pytype
            return node.value
        except KeyError:
            if default is _notset:
                raise
            return default

    def clear(self):
        """Drop every entry, subtracting each one's cost from the total.

        The linked-list nodes are marked empty and kept rather than removed.
        """
        # Walk from the head along ``next`` until the first empty node.
        n = self._head
        while n.key is not _notset:
            self.totalcost -= n.cost
            n.markempty()
            n = n.next

        self._cache.clear()

    def copy(self, capacity=None, maxcost=0):
        """Create a new cache as a copy of the current one.

        By default, the new cache has the same capacity as the existing one.
        But, the cache capacity can be changed as part of performing the
        copy.

        Items in the copy have an insertion/access order matching this
        instance.
        """

        # Falsy arguments fall back to this instance's own settings.
        capacity = capacity or self.capacity
        maxcost = maxcost or self.maxcost
        result = lrucachedict(capacity, maxcost=maxcost)

        # We copy entries by iterating in oldest-to-newest order so the copy
        # has the correct ordering.

        # Find the first non-empty entry.
        n = self._head.prev
        while n.key is _notset and n is not self._head:
            n = n.prev

        # We could potentially skip the first N items when decreasing capacity.
        # But let's keep it simple unless it is a performance problem.
        for i in range(len(self._cache)):
            result.insert(n.key, n.value, cost=n.cost)
            n = n.prev

        return result

    def popoldest(self):
        """Remove the oldest item from the cache.

        Returns the (key, value) describing the removed cache entry, or
        None when the cache is empty.
        """
        if not self._cache:
            return

        # Walk the linked list backwards starting at tail node until we hit
        # a non-empty node.
        n = self._head.prev

        assert n is not None  # help pytype

        while n.key is _notset:
            n = n.prev

        assert n is not None  # help pytype

        key, value = n.key, n.value

        # And remove it from the cache and mark it as empty.
        del self._cache[n.key]
        self.totalcost -= n.cost
        n.markempty()

        return key, value

    def _movetohead(self, node):
        """Mark a node as the newest, making it the new head.

        When a node is accessed, it becomes the freshest entry in the LRU
        list, which is denoted by self._head.

        Visually, let's make ``N`` the new head node (* denotes head):

            previous/oldest <-> head <-> next/next newest

            ----<->--- A* ---<->-----
            |                       |
            E <-> D <-> N <-> C <-> B

        To:

            ----<->--- N* ---<->-----
            |                       |
            E <-> D <-> C <-> B <-> A

        This requires the following moves:

           C.next = D  (node.prev.next = node.next)
           D.prev = C  (node.next.prev = node.prev)
           E.next = N  (head.prev.next = node)
           N.prev = E  (node.prev = head.prev)
           N.next = A  (node.next = head)
           A.prev = N  (head.prev = node)
        """
        head = self._head
        # C.next = D
        node.prev.next = node.next
        # D.prev = C
        node.next.prev = node.prev
        # N.prev = E
        node.prev = head.prev
        # N.next = A
        # It is tempting to do just "head" here, however if node is
        # adjacent to head, this will do bad things.
        node.next = head.prev.next
        # A.prev = N (node.next is A at this point)
        node.next.prev = node
        # E.next = N (node.prev is E at this point)
        node.prev.next = node

        self._head = node

    def _addcapacity(self):
        """Add a node to the circular linked list.

        The new node is inserted before the head node.
        """
        head = self._head
        node = _lrucachenode()
        head.prev.next = node
        node.prev = head.prev
        node.next = head
        head.prev = node
        self._size += 1
        return node

    def _enforcecostlimit(self):
        """Evict old entries once the total cost exceeds ``maxcost``.

        Eviction continues until the total cost is at most 75% of
        ``maxcost`` or only a single entry is left.
        """
        # This should run after an insertion. It should only be called if total
        # cost limits are being enforced.
        # The most recently inserted node is never evicted.
        if len(self) <= 1 or self.totalcost <= self.maxcost:
            return

        # This is logically equivalent to calling popoldest() until we
        # free up enough cost. We don't do that since popoldest() needs
        # to walk the linked list and doing this in a loop would be
        # quadratic. So we find the first non-empty node and then
        # walk nodes until we free up enough capacity.
        #
        # If we only removed the minimum number of nodes to free enough
        # cost at insert time, chances are high that the next insert would
        # also require pruning. This would effectively constitute quadratic
        # behavior for insert-heavy workloads. To mitigate this, we set a
        # target cost that is a percentage of the max cost. This will tend
        # to free more nodes when the high water mark is reached, which
        # lowers the chances of needing to prune on the subsequent insert.
        targetcost = int(self.maxcost * 0.75)

        n = self._head.prev
        while n.key is _notset:
            n = n.prev

        while len(self) > 1 and self.totalcost > targetcost:
            del self._cache[n.key]
            self.totalcost -= n.cost
            n.markempty()
            n = n.prev
1721
1721
1722
1722
def lrucachefunc(func):
    """cache most recent results of function calls

    Results are keyed on the positional arguments. Once more than 20 results
    are stored, the least recently used one is dropped before a new result
    is computed.
    """
    results = {}
    # Keys ordered from least to most recently used.
    recency = collections.deque()

    if func.__code__.co_argcount != 1:

        def f(*args):
            if args in results:
                # Hit: take the key out so it is re-queued as the newest.
                recency.remove(args)
            else:
                if len(results) > 20:
                    del results[recency.popleft()]
                results[args] = func(*args)
            recency.append(args)
            return results[args]

    else:

        def f(arg):
            if arg in results:
                # Hit: take the key out so it is re-queued as the newest.
                recency.remove(arg)
            else:
                if len(results) > 20:
                    del results[recency.popleft()]
                results[arg] = func(arg)
            recency.append(arg)
            return results[arg]

    return f
1752
1752
1753
1753
class propertycache:
    """Descriptor computing an attribute on access and caching the result.

    The computed value is written into the instance ``__dict__`` under the
    name of the wrapped function. As this class defines no ``__set__``, that
    entry takes precedence on later lookups and the function is not called
    again for the same instance.
    """

    def __init__(self, func):
        self.name = func.__name__
        self.func = func

    def __get__(self, obj, type=None):
        value = self.func(obj)
        self.cachevalue(obj, value)
        return value

    def cachevalue(self, obj, value):
        """Store ``value`` on ``obj`` as the cached result."""
        # __dict__ assignment required to bypass __setattr__ (eg: repoview)
        obj.__dict__[self.name] = value
1767
1767
1768
1768
def clearcachedproperty(obj, prop):
    """clear a cached property value, if one has been set

    ``prop`` is converted with ``pycompat.sysstr`` before being looked up in
    the instance ``__dict__``.
    """
    name = pycompat.sysstr(prop)
    cached = obj.__dict__
    if name in cached:
        del cached[name]
1774
1774
1775
1775
def increasingchunks(source, min=1024, max=65536):
    """return no less than min bytes per chunk while data remains,
    doubling min after each chunk until it reaches max

    Chunks from ``source`` are buffered and joined into one bytes object
    once at least ``min`` bytes have accumulated. Whatever is still buffered
    when ``source`` is exhausted is yielded as a final, possibly smaller,
    chunk.
    """
    pending = []
    pendinglen = 0
    for chunk in source:
        pending.append(chunk)
        pendinglen += len(chunk)
        if pendinglen < min:
            continue
        if min < max:
            # Grow the threshold: double it, or jump straight to the largest
            # power of two not above what was just buffered, capped at max.
            min <<= 1
            floorpow2 = 1 << (pendinglen.bit_length() - 1) if pendinglen else 1
            if floorpow2 > min:
                min = floorpow2
            if min > max:
                min = max
        yield b''.join(pending)
        pending = []
        pendinglen = 0
    if pending:
        yield b''.join(pending)
1807
1807
1808
1808
def always(fn):
    """Predicate accepting everything: ignore ``fn`` and return True."""
    return True
1811
1811
1812
1812
def never(fn):
    """Predicate rejecting everything: ignore ``fn`` and return False."""
    return False
1815
1815
1816
1816
def nogc(func):
    """disable garbage collector

    Python's garbage collector triggers a GC each time a certain number of
    container objects (the number being defined by gc.get_threshold()) are
    allocated even when marked not to be tracked by the collector. Tracking has
    no effect on when GCs are triggered, only on what objects the GC looks
    into. As a workaround, disable GC while building complex (huge)
    containers.

    This garbage collector issue has been fixed in 2.7, but it still affects
    CPython's performance.

    Returns a wrapper that calls ``func`` with the collector disabled and
    re-enables it afterwards only if it was enabled on entry. The wrapper
    keeps the name and docstring of ``func``.
    """
    # Imported here so the block does not depend on a module-level import.
    import functools

    @functools.wraps(func)
    def wrapper(*args, **kwargs):
        gcenabled = gc.isenabled()
        gc.disable()
        try:
            return func(*args, **kwargs)
        finally:
            # Restore the previous state even when func raises; never turn
            # the collector on for a caller that had it off.
            if gcenabled:
                gc.enable()

    return wrapper
1841
1841
1842
1842
if pycompat.ispypy:
    # PyPy runs slower with gc disabled, so replace the decorator with one
    # that hands the function back unchanged.
    nogc = lambda x: x
1846
1846
1847
1847
def pathto(root, n1, n2):
    # type: (bytes, bytes, bytes) -> bytes
    """Compute the relative path leading from n1 to n2.

    root should use os.sep to separate directories
    n1 should use os.sep to separate directories
    n2 should use "/" to separate directories
    returns an os.sep-separated path.

    A relative n1 is taken to be relative to root; n2 must always be
    relative to root. An empty n1 yields n2 converted to a local path, and
    the result is b'.' when both locations coincide.
    """
    if not n1:
        return localpath(n2)
    if os.path.isabs(n1):
        rootdrive = os.path.splitdrive(root)[0]
        if rootdrive != os.path.splitdrive(n1)[0]:
            # different drives: no relative path exists between them
            return os.path.join(root, localpath(n2))
        n2 = b'/'.join((pconvert(root), n2))
    srcparts = splitpath(n1)
    dstparts = n2.split(b'/')
    # count the leading components shared by both paths
    shared = 0
    while (
        shared < len(srcparts)
        and shared < len(dstparts)
        and srcparts[shared] == dstparts[shared]
    ):
        shared += 1
    climb = [b'..'] * (len(srcparts) - shared)
    return pycompat.ossep.join(climb + dstparts[shared:]) or b'.'
1874
1874
1875
1875
def checksignature(func, depth=1):
    '''Wrap ``func`` so that a bad call is reported as a SignatureError.

    A TypeError whose traceback is exactly ``depth`` frames long is taken
    to come from the call itself and is replaced by error.SignatureError;
    any other TypeError is propagated untouched.'''

    def check(*args, **kwargs):
        try:
            return func(*args, **kwargs)
        except TypeError as exc:
            frames = traceback.extract_tb(exc.__traceback__)
            if len(frames) != depth:
                raise
            raise error.SignatureError

    return check
1888
1888
1889
1889
# a whitelist of known filesystems where hardlink works reliably
# (copyfile() only hardlinks when the destination filesystem type is listed)
_hardlinkfswhitelist = {
    b'apfs',
    b'btrfs',
    b'ext2',
    b'ext3',
    b'ext4',
    b'hfs',
    b'jfs',
    b'NTFS',
    b'reiserfs',
    b'tmpfs',
    b'ufs',
    b'xfs',
    b'zfs',
}
1906
1906
1907
1907
def copyfile(
    src,
    dest,
    hardlink=False,
    copystat=False,
    checkambig=False,
    nb_bytes=None,
    no_hardlink_cb=None,
    check_fs_hardlink=True,
):
    """copy a file, preserving mode and optionally other stat info like
    atime/mtime

    An existing ``dest`` is unlinked first. When ``hardlink`` is set, a
    hardlink is attempted before falling back to a regular copy; a source
    symlink is recreated as a symlink rather than copied.

    checkambig argument is used with filestat, and is useful only if
    destination file is guarded by any lock (e.g. repo.lock or
    repo.wlock).

    copystat and checkambig should be exclusive.

    nb_bytes: if set only copy the first `nb_bytes` of the source file.
    It raises error.ProgrammingError when the file ended up hardlinked or
    when the source is a symlink.

    no_hardlink_cb: optional callable invoked when a requested hardlink is
    not performed (filesystem not whitelisted, or linking failed with an
    error other than EEXIST).

    check_fs_hardlink: when true, only hardlink if the filesystem holding
    ``dest`` is listed in ``_hardlinkfswhitelist``.

    Raises error.Abort when shutil reports a copy error.
    """
    assert not (copystat and checkambig)
    oldstat = None
    if os.path.lexists(dest):
        if checkambig:
            # remember the stat of the file being replaced so that an
            # ambiguous timestamp can be detected after the copy
            oldstat = checkambig and filestat.frompath(dest)
        unlink(dest)
    if hardlink and check_fs_hardlink:
        # Hardlinks are problematic on CIFS (issue4546), do not allow hardlinks
        # unless we are confident that dest is on a whitelisted filesystem.
        try:
            fstype = getfstype(os.path.dirname(dest))
        except OSError:
            # unknown filesystem type: treated as not whitelisted below
            fstype = None
        if fstype not in _hardlinkfswhitelist:
            if no_hardlink_cb is not None:
                no_hardlink_cb()
            hardlink = False
    if hardlink:
        try:
            oslink(src, dest)
            # NOTE: this check runs after the link has been created
            if nb_bytes is not None:
                m = "the `nb_bytes` argument is incompatible with `hardlink`"
                raise error.ProgrammingError(m)
            return
        except (IOError, OSError) as exc:
            if exc.errno != errno.EEXIST and no_hardlink_cb is not None:
                no_hardlink_cb()
            # fall back to normal copy
    if os.path.islink(src):
        os.symlink(os.readlink(src), dest)
        # copytime is ignored for symlinks, but in general copytime isn't needed
        # for them anyway
        if nb_bytes is not None:
            m = "cannot use `nb_bytes` on a symlink"
            raise error.ProgrammingError(m)
    else:
        try:
            shutil.copyfile(src, dest)
            if copystat:
                # copystat also copies mode
                shutil.copystat(src, dest)
            else:
                shutil.copymode(src, dest)
                if oldstat and oldstat.stat:
                    newstat = filestat.frompath(dest)
                    if newstat.isambig(oldstat):
                        # stat of copied file is ambiguous to original one
                        # so move mtime one second past the old one, kept
                        # within 31 bits
                        advanced = (
                            oldstat.stat[stat.ST_MTIME] + 1
                        ) & 0x7FFFFFFF
                        os.utime(dest, (advanced, advanced))
            # We could do something smarter using `copy_file_range` call or similar
            if nb_bytes is not None:
                # the whole file was copied above; cut it down afterwards
                with open(dest, mode='r+') as f:
                    f.truncate(nb_bytes)
        except shutil.Error as inst:
            raise error.Abort(stringutil.forcebytestr(inst))
1986
1986
1987
1987
def copyfiles(src, dst, hardlink=None, progress=None):
    """Copy a directory tree using hardlinks if possible.

    ``hardlink`` may be None, in which case linking is attempted when the
    source and the parent directory of the destination report the same
    ``st_dev``. ``progress``, when given, has its ``topic`` set and is
    incremented once per file.

    Returns a ``(hardlink, num)`` tuple: whether hardlinking is still in
    use after this call, and the number of files copied or linked.
    """
    num = 0

    def settopic():
        # reads the current value of ``hardlink`` from the enclosing scope
        if progress:
            progress.topic = _(b'linking') if hardlink else _(b'copying')

    if os.path.isdir(src):
        if hardlink is None:
            hardlink = (
                os.stat(src).st_dev == os.stat(os.path.dirname(dst)).st_dev
            )
        settopic()
        os.mkdir(dst)
        for name, kind in listdir(src):
            srcname = os.path.join(src, name)
            dstname = os.path.join(dst, name)
            # the recursive call may turn hardlinking off; carry that on to
            # the remaining entries
            hardlink, n = copyfiles(srcname, dstname, hardlink, progress)
            num += n
    else:
        if hardlink is None:
            hardlink = (
                os.stat(os.path.dirname(src)).st_dev
                == os.stat(os.path.dirname(dst)).st_dev
            )
        settopic()

        if hardlink:
            try:
                oslink(src, dst)
            except (IOError, OSError) as exc:
                # stop trying to link after any failure other than EEXIST
                if exc.errno != errno.EEXIST:
                    hardlink = False
                # XXX maybe try to relink if the file exist ?
                shutil.copy(src, dst)
        else:
            shutil.copy(src, dst)
        num += 1
        if progress:
            progress.increment()

    return hardlink, num
2031
2031
2032
2032
# Lowercase names that checkwinfilename() rejects when they match the part
# of a path component that precedes its first '.'.
_winreservednames = {
    b'con',
    b'prn',
    b'aux',
    b'nul',
    b'com1',
    b'com2',
    b'com3',
    b'com4',
    b'com5',
    b'com6',
    b'com7',
    b'com8',
    b'com9',
    b'lpt1',
    b'lpt2',
    b'lpt3',
    b'lpt4',
    b'lpt5',
    b'lpt6',
    b'lpt7',
    b'lpt8',
    b'lpt9',
}
# Characters that checkwinfilename() rejects anywhere in a path component.
_winreservedchars = b':*?"<>|'
2058
2058
2059
2059
def checkwinfilename(path):
    # type: (bytes) -> Optional[bytes]
    r"""Validate a base-relative path against Windows filename rules.

    The result is None for an acceptable path, otherwise a UI string that
    describes the first problem found.

    >>> checkwinfilename(b"just/a/normal/path")
    >>> checkwinfilename(b"foo/bar/con.xml")
    "filename contains 'con', which is reserved on Windows"
    >>> checkwinfilename(b"foo/con.xml/bar")
    "filename contains 'con', which is reserved on Windows"
    >>> checkwinfilename(b"foo/bar/xml.con")
    >>> checkwinfilename(b"foo/bar/AUX/bla.txt")
    "filename contains 'AUX', which is reserved on Windows"
    >>> checkwinfilename(b"foo/bar/bla:.txt")
    "filename contains ':', which is reserved on Windows"
    >>> checkwinfilename(b"foo/bar/b\07la.txt")
    "filename contains '\\x07', which is invalid on Windows"
    >>> checkwinfilename(b"foo/bar/bla ")
    "filename ends with ' ', which is not allowed on Windows"
    >>> checkwinfilename(b"../bar")
    >>> checkwinfilename(b"foo\\")
    "filename ends with '\\', which is invalid on Windows"
    >>> checkwinfilename(b"foo\\/bar")
    "directory name ends with '\\', which is invalid on Windows"
    """
    if path.endswith(b'\\'):
        return _(b"filename ends with '\\', which is invalid on Windows")
    if b'\\/' in path:
        return _(b"directory name ends with '\\', which is invalid on Windows")
    for component in path.replace(b'\\', b'/').split(b'/'):
        if not component:
            continue
        for char in _filenamebytestr(component):
            if char in _winreservedchars:
                msg = _(b"filename contains '%s', which is reserved on Windows")
                return msg % char
            if ord(char) <= 31:
                # control characters are reported in escaped form
                msg = _(b"filename contains '%s', which is invalid on Windows")
                return msg % stringutil.escapestr(char)
        # only the part before the first dot is compared to device names
        stem = component.partition(b'.')[0]
        if stem and stem.lower() in _winreservednames:
            msg = _(b"filename contains '%s', which is reserved on Windows")
            return msg % stem
        lastchar = component[-1:]
        # b'.' and b'..' themselves are fine, hence the second test
        if lastchar in b'. ' and component not in b'..':
            msg = _(b"filename ends with '%s', which is not allowed on Windows")
            return msg % lastchar
2120
2120
2121
2121
# Use time.perf_counter when the time module provides it; the platform
# branches below only pick a fallback when it is missing.
timer = getattr(time, "perf_counter", None)

if pycompat.iswindows:
    checkosfilename = checkwinfilename
    if not timer:
        # only reached when time.perf_counter is unavailable
        timer = time.clock
else:
    # mercurial.windows doesn't have platform.checkosfilename
    checkosfilename = platform.checkosfilename  # pytype: disable=module-attr
    if not timer:
        # only reached when time.perf_counter is unavailable
        timer = time.time
2133
2133
2134
2134
def makelock(info, pathname):
    """Create a lock file atomically if possible

    The lock is first attempted as a symlink at ``pathname`` whose target
    is ``info``. If that fails for any reason other than the lock already
    existing, or if ``os.symlink`` is missing, a regular file is created
    exclusively and ``info`` is written into it.

    This may leave a stale lock file if symlink isn't supported and signal
    interrupt is enabled.

    Raises OSError (errno EEXIST) when the lock already exists.
    """
    try:
        return os.symlink(info, pathname)
    except OSError as why:
        if why.errno == errno.EEXIST:
            raise
    except AttributeError:  # no symlink in os
        pass

    flags = os.O_CREAT | os.O_WRONLY | os.O_EXCL | getattr(os, 'O_BINARY', 0)
    ld = os.open(pathname, flags)
    try:
        os.write(ld, info)
    finally:
        # release the descriptor even when the write fails
        os.close(ld)
2153
2153
2154
2154
def readlock(pathname):
    # type: (bytes) -> bytes
    """Return the information stored in the lock at ``pathname``.

    The lock is read as a symlink target when possible. If reading the
    link fails with EINVAL or ENOSYS, or the symlink support is missing
    (AttributeError), the content of the file is returned instead. Other
    OSErrors are propagated.
    """
    fallbackerrnos = (errno.EINVAL, errno.ENOSYS)
    try:
        return readlink(pathname)
    except OSError as exc:
        if exc.errno not in fallbackerrnos:
            raise
    except AttributeError:  # no symlink in os
        pass
    with posixfile(pathname, b'rb') as lockfile:
        return lockfile.read()
2166
2166
2167
2167
def fstat(fp):
    '''Stat a file object, by descriptor when it has one, else by name.

    Objects lacking a ``fileno`` method are stat'ed through ``fp.name``.'''
    try:
        descriptor = fp.fileno()
        return os.fstat(descriptor)
    except AttributeError:
        return os.stat(fp.name)
2174
2174
2175
2175
2176 # File system features
2176 # File system features
2177
2177
2178
2178
def fscasesensitive(path):
    # type: (bytes) -> bool
    """
    Tell whether the given path lives on a case-sensitive filesystem

    Requires a path (like /foo/.hg) ending with a foldable final
    directory component. The final component is looked up again with its
    case flipped; getting the very same stat result back means the
    filesystem ignores case.
    """
    reference = os.lstat(path)
    parent, base = os.path.split(path)
    flipped = base.upper()
    if flipped == base:
        flipped = base.lower()
    if flipped == base:
        return True  # no evidence against case sensitivity
    sibling = os.path.join(parent, flipped)
    try:
        return not (os.lstat(sibling) == reference)
    except OSError:
        # the case-flipped name does not resolve: case matters
        return True
2202
2202
2203
2203
# Conversion applied to a pattern before it is handed to re2; the identity
# unless _re._checkre2() replaces it with pycompat.sysstr.
_re2_input = lambda x: x
try:
    import re2  # pytype: disable=import-error

    # None: re2 could be imported but has not been checked yet
    _re2 = None
except ImportError:
    # False: re2 must not be used
    _re2 = False
2211
2211
2212
2212
class _re:
    """Regular expression front-end that prefers re2 over the stdlib re.

    Whether re2 can be used is recorded in the module-level ``_re2``
    (None: not checked yet, True/False: verdict) and the conversion to
    apply to patterns handed to re2 is kept in ``_re2_input``.
    """

    def _checkre2(self):
        """Check once whether the imported re2 module actually works.

        Sets the module-level ``_re2`` to the verdict. When re2 rejects
        bytes input with a TypeError, the check is retried with native
        strings and ``_re2_input`` is switched to ``pycompat.sysstr``.
        """
        global _re2
        global _re2_input
        if _re2 is not None:
            # we already have the answer
            return

        check_pattern = br'\[([^\[]+)\]'
        check_input = b'[ui]'
        try:
            # check if match works, see issue3964
            _re2 = bool(re2.match(check_pattern, check_input))
        except ImportError:
            _re2 = False
        except TypeError:
            # the `pyre-2` project provides a re2 module that accepts bytes
            # the `fb-re2` project provides a re2 module that accepts sysstr
            check_pattern = pycompat.sysstr(check_pattern)
            check_input = pycompat.sysstr(check_input)
            _re2 = bool(re2.match(check_pattern, check_input))
            _re2_input = pycompat.sysstr

    def compile(self, pat, flags=0):
        """Compile a regular expression, using re2 if possible

        For best performance, use only re2-compatible regexp features. The
        only flags from the re module that are re2-compatible are
        IGNORECASE and MULTILINE.

        When re2 is unavailable, the flags are not re2-compatible, or re2
        rejects the pattern, the stdlib ``re`` module compiles ``pat`` with
        ``flags`` instead."""
        if _re2 is None:
            self._checkre2()
        if _re2 and (flags & ~(remod.IGNORECASE | remod.MULTILINE)) == 0:
            # re2 takes flags inline; build its pattern separately so the
            # fallback below still compiles the caller's own pattern
            re2pat = pat
            if flags & remod.IGNORECASE:
                re2pat = b'(?i)' + re2pat
            if flags & remod.MULTILINE:
                re2pat = b'(?m)' + re2pat
            try:
                return re2.compile(_re2_input(re2pat))
            except re2.error:
                pass
        return remod.compile(pat, flags)

    @propertycache
    def escape(self):
        """Return the version of escape corresponding to self.compile.

        This is imperfect because whether re2 or re is used for a particular
        function depends on the flags, etc, but it's the best we can do.
        """
        if _re2 is None:
            self._checkre2()
        if _re2:
            return re2.escape
        else:
            return remod.escape
2269
2267
2270
2268 re = _re()
# Shared instance: util.re.compile / util.re.escape
re = _re()

# Per-directory cache used by fspath(): maps a directory to a
# {normcase(entry): entry} dict of its listing.
_fspathcache = {}
2273 _fspathcache = {}
2271
2274
2272
2275
2273 def fspath(name, root):
def fspath(name, root):
    # type: (bytes, bytes) -> bytes
    """Get name in the case stored in the filesystem

    The name should be relative to root, and be normcase-ed for efficiency.

    Note that this function is unnecessary, and should not be
    called, for case-sensitive filesystems (simply because it's expensive).

    The root should be normcase-ed, too.

    Each component of ``name`` is looked up in the (cached) listing of the
    directory containing it; components that cannot be found are kept as
    given, and separators are preserved as they appear in ``name``.
    """

    def _makefspathcacheentry(dir):
        return {normcase(n): n for n in os.listdir(dir)}

    seps = pycompat.ossep
    if pycompat.osaltsep:
        seps = seps + pycompat.osaltsep
    # Protect backslashes. This gets silly very quickly.
    # bytes.replace returns a new object, so the result must be kept;
    # otherwise a backslash separator escapes the next character of the
    # character class instead of being part of it.
    seps = seps.replace(b'\\', b'\\\\')
    pattern = remod.compile(br'([^%s]+)|([%s]+)' % (seps, seps))
    curdir = os.path.normpath(root)
    result = []
    for part, sep in pattern.findall(name):
        if sep:
            result.append(sep)
            continue

        if curdir not in _fspathcache:
            _fspathcache[curdir] = _makefspathcacheentry(curdir)
        contents = _fspathcache[curdir]

        found = contents.get(part)
        if not found:
            # retry "once per directory" per "dirstate.walk" which
            # may take place for each patches of "hg qpush", for example
            _fspathcache[curdir] = contents = _makefspathcacheentry(curdir)
            found = contents.get(part)

        result.append(found or part)
        curdir = os.path.join(curdir, part)

    return b''.join(result)
2319
2317
2320
2318 def checknlink(testfile):
def checknlink(testfile):
    # type: (bytes) -> bool
    '''Tell whether hardlink counts are reported properly beside testfile.

    Two temporary files are hardlinked together in the directory of
    ``testfile`` and the link count of the second one is inspected while it
    is open. Any OSError along the way yields False. The temporary files
    are removed before returning.'''

    # testfile may be open, so we need a separate file for checking to
    # work around issue2543 (or testfile may get lost on Samba shares)
    first = second = opened = None
    try:
        tmpfd, first = pycompat.mkstemp(
            prefix=b'.%s-' % os.path.basename(testfile),
            suffix=b'1~',
            dir=os.path.dirname(testfile),
        )
        os.close(tmpfd)
        # same name with the trailing b'1~' turned into b'2~'
        second = b'%s2~' % first[:-2]

        oslink(first, second)
        # nlinks() may behave differently for files on Windows shares if
        # the file is open.
        opened = posixfile(second)
        return nlinks(second) > 1
    except OSError:
        return False
    finally:
        if opened is not None:
            opened.close()
        for leftover in (first, second):
            if leftover is None:
                continue
            try:
                os.unlink(leftover)
            except OSError:
                pass
2353
2351
2354
2352 def endswithsep(path):
def endswithsep(path):
    # type: (bytes) -> bool
    '''Tell whether path ends with os.sep or, when defined, os.altsep.'''
    if path.endswith(pycompat.ossep):
        return True
    altsep = pycompat.osaltsep
    return bool(altsep and path.endswith(altsep))  # help pytype
2363
2361
2364
2362 def splitpath(path):
def splitpath(path):
    # type: (bytes) -> List[bytes]
    """Break path into its os.sep-separated components.

    os.altsep is deliberately not taken into account: this is meant as a
    replacement for a plain "xxx.split(os.sep)". Run the path through
    os.path.normpath() first if that matters."""
    separator = pycompat.ossep
    return path.split(separator)
2373
2371
2374
2372 def mktempcopy(name, emptyok=False, createmode=None, enforcewritable=False):
def mktempcopy(name, emptyok=False, createmode=None, enforcewritable=False):
    """Create a temporary file with the same contents from name

    The temporary file is created in the directory of ``name``.

    The permission bits are copied from the original file.

    If the temporary file is going to be truncated immediately, you
    can use emptyok=True as an optimization.

    A missing ``name`` is not an error: the temporary file is then left
    empty. On any other failure the temporary file is removed and the
    exception is re-raised.

    Returns the name of the temporary file.
    """
    d, fn = os.path.split(name)
    fd, temp = pycompat.mkstemp(prefix=b'.%s-' % fn, suffix=b'~', dir=d)
    os.close(fd)
    try:
        # Temporary files are created with mode 0600, which is usually not
        # what we want.  If the original file already exists, just copy
        # its mode.  Otherwise, manually obey umask.
        copymode(name, temp, createmode, enforcewritable)

        if emptyok:
            return temp
        try:
            ifp = posixfile(name, b"rb")
        except IOError as inst:
            if inst.errno == errno.ENOENT:
                return temp
            if not getattr(inst, 'filename', None):
                inst.filename = name
            raise
        # close both files before the cleanup below runs, so they are not
        # leaked on error and the temporary file is no longer open when it
        # gets unlinked
        with ifp, posixfile(temp, b"wb") as ofp:
            for chunk in filechunkiter(ifp):
                ofp.write(chunk)
    except:  # re-raises
        try:
            os.unlink(temp)
        except OSError:
            pass
        raise
    return temp
2416
2414
2417
class filestat:
    """help to exactly detect change of a file

    'stat' attribute is result of 'os.stat()' if specified 'path'
    exists. Otherwise, it is None. This can avoid preparative
    'exists()' examination on client side of this class.
    """

    def __init__(self, stat):
        # os.stat()-like result, or None when the file does not exist
        self.stat = stat

    @classmethod
    def frompath(cls, path):
        """Build a filestat for ``path`` (``stat`` is None if it is missing)"""
        try:
            stat = os.stat(path)
        except FileNotFoundError:
            stat = None
        return cls(stat)

    @classmethod
    def fromfp(cls, fp):
        """Build a filestat from the open file object ``fp`` (uses fstat)"""
        stat = os.fstat(fp.fileno())
        return cls(stat)

    # __eq__ is customized below, so identity hashing is kept explicitly
    __hash__ = object.__hash__

    def __eq__(self, old):
        try:
            # if ambiguity between stat of new and old file is
            # avoided, comparison of size, ctime and mtime is enough
            # to exactly detect change of a file regardless of platform
            return (
                self.stat.st_size == old.stat.st_size
                and self.stat[stat.ST_CTIME] == old.stat[stat.ST_CTIME]
                and self.stat[stat.ST_MTIME] == old.stat[stat.ST_MTIME]
            )
        except AttributeError:
            # at least one side has no usable stat (e.g. stat is None)
            pass
        try:
            # two "missing file" states compare equal
            return self.stat is None and old.stat is None
        except AttributeError:
            return False

    def isambig(self, old):
        """Examine whether new (= self) stat is ambiguous against old one

        "S[N]" below means stat of a file at N-th change:

        - S[n-1].ctime  < S[n].ctime: can detect change of a file
        - S[n-1].ctime == S[n].ctime
          - S[n-1].ctime  < S[n].mtime: means natural advancing (*1)
          - S[n-1].ctime == S[n].mtime: is ambiguous (*2)
          - S[n-1].ctime  > S[n].mtime: never occurs naturally (don't care)
        - S[n-1].ctime  > S[n].ctime: never occurs naturally (don't care)

        Case (*2) above means that a file was changed twice or more at
        same time in sec (= S[n-1].ctime), and comparison of timestamp
        is ambiguous.

        Base idea to avoid such ambiguity is "advance mtime 1 sec, if
        timestamp is ambiguous".

        But advancing mtime only in case (*2) doesn't work as
        expected, because naturally advanced S[n].mtime in case (*1)
        might be equal to manually advanced S[n-1 or earlier].mtime.

        Therefore, all "S[n-1].ctime == S[n].ctime" cases should be
        treated as ambiguous regardless of mtime, to avoid overlooking
        by confliction between such mtime.

        Advancing mtime "if isambig(oldstat)" ensures "S[n-1].mtime !=
        S[n].mtime", even if size of a file isn't changed.

        Returns False when either side has no stat (missing file, or
        ``old`` is not a filestat), since there is nothing to compare.
        """
        oldstat = getattr(old, 'stat', None)
        # Subscripting a None stat raises TypeError, not AttributeError,
        # so the "no stat" case is checked explicitly.
        if self.stat is None or oldstat is None:
            return False
        return self.stat[stat.ST_CTIME] == oldstat[stat.ST_CTIME]

    def avoidambig(self, path, old):
        """Change file stat of specified path to avoid ambiguity

        'old' should be previous filestat of 'path'.

        This skips avoiding ambiguity, if a process doesn't have
        appropriate privileges for 'path'. This returns False in this
        case.

        Otherwise, this returns True, as "ambiguity is avoided".
        """
        # one second past the old mtime, masked to 31 bits
        advanced = (old.stat[stat.ST_MTIME] + 1) & 0x7FFFFFFF
        try:
            os.utime(path, (advanced, advanced))
        except PermissionError:
            # utime() on the file created by another user causes EPERM,
            # if a process doesn't have appropriate privileges
            return False
        return True

    def __ne__(self, other):
        return not self == other
2515
2518
2516
2519
class atomictempfile:
    """writable file object that atomically updates a file

    Every write lands in a temporary copy of the target file.  Calling
    close() renames that copy over the permanent name, which is what
    makes the changes visible.  An instance that is destroyed (or
    discarded) without close() throws all writes away.

    The ``checkambig`` constructor argument is used together with
    filestat; it is only useful when the target file is guarded by a
    lock (e.g. repo.lock or repo.wlock).
    """

    def __init__(self, name, mode=b'w+b', createmode=None, checkambig=False):
        truncating = b'w' in mode
        self.__name = name  # permanent name
        self._tempname = mktempcopy(
            name,
            emptyok=truncating,
            createmode=createmode,
            enforcewritable=truncating,
        )

        self._fp = posixfile(self._tempname, mode)
        self._checkambig = checkambig

        # delegated methods
        fp = self._fp
        self.read = fp.read
        self.write = fp.write
        self.writelines = fp.writelines
        self.seek = fp.seek
        self.tell = fp.tell
        self.fileno = fp.fileno

    def close(self):
        """Close the temporary file and rename it over the permanent name"""
        if self._fp.closed:
            return
        self._fp.close()
        target = localpath(self.__name)
        # the previous stat must be taken before the rename replaces it
        previous = self._checkambig and filestat.frompath(target)
        rename(self._tempname, target)
        if not (previous and previous.stat):
            return
        current = filestat.frompath(target)
        if current.isambig(previous):
            # stat of changed file is ambiguous to original one
            bumped = (previous.stat[stat.ST_MTIME] + 1) & 0x7FFFFFFF
            os.utime(target, (bumped, bumped))

    def discard(self):
        """Drop the temporary file without touching the permanent one"""
        if self._fp.closed:
            return
        try:
            os.unlink(self._tempname)
        except OSError:
            pass
        self._fp.close()

    def __del__(self):
        if safehasattr(self, '_fp'):  # constructor actually did something
            self.discard()

    def __enter__(self):
        return self

    def __exit__(self, exctype, excvalue, traceback):
        # commit on a clean exit, throw the writes away on error
        if exctype is None:
            self.close()
        else:
            self.discard()
2586
2589
2587
2590
def tryrmdir(f):
    """Call removedirs() on ``f``, ignoring ENOENT and ENOTEMPTY errors."""
    tolerated = (errno.ENOENT, errno.ENOTEMPTY)
    try:
        removedirs(f)
    except OSError as err:
        if err.errno not in tolerated:
            raise
2594
2597
2595
2598
def unlinkpath(f, ignoremissing=False, rmdir=True):
    # type: (bytes, bool, bool) -> None
    """unlink and remove the directory if it is empty

    With ``ignoremissing`` the removal goes through tryunlink(), so a
    missing file is not an error.  With ``rmdir`` the parent directory
    is handed to removedirs() afterwards; any OSError from that step is
    ignored.
    """
    remove = tryunlink if ignoremissing else unlink
    remove(f)
    if not rmdir:
        return
    # try removing directories that might now be empty
    try:
        removedirs(os.path.dirname(f))
    except OSError:
        pass
2609
2612
2610
2613
def tryunlink(f):
    # type: (bytes) -> None
    """Attempt to remove a file, ignoring FileNotFoundError."""
    with contextlib.suppress(FileNotFoundError):
        unlink(f)
2618
2621
2619
2622
def makedirs(name, mode=None, notindexed=False):
    # type: (bytes, Optional[int], bool) -> None
    """recursive directory creation with parent mode inheritance

    Newly created directories are marked as "not to be indexed by
    the content indexing service", if ``notindexed`` is specified
    for "write" mode access.

    An already existing ``name`` is left untouched (no chmod).  When
    ``mode`` is given, it is applied to each directory created here.
    """
    try:
        makedir(name, notindexed)
    except OSError as first_err:
        code = first_err.errno
        if code == errno.EEXIST:
            return
        # only a missing parent can be repaired by recursing
        if not name or code != errno.ENOENT:
            raise
        updir = os.path.dirname(abspath(name))
        if updir == name:
            raise
        makedirs(updir, mode, notindexed)
        try:
            makedir(name, notindexed)
        except OSError as retry_err:
            # Catch EEXIST to handle races
            if retry_err.errno != errno.EEXIST:
                raise
            return
    if mode is not None:
        os.chmod(name, mode)
2648
2651
2649
2652
def readfile(path):
    # type: (bytes) -> bytes
    """Return the whole content of the file at ``path`` as bytes."""
    with open(path, b'rb') as source:
        content = source.read()
    return content
2654
2657
2655
2658
def writefile(path, text):
    # type: (bytes, bytes) -> None
    """Write ``text`` to the file at ``path``, opened in b'wb' mode."""
    with open(path, b'wb') as sink:
        sink.write(text)
2660
2663
2661
2664
def appendfile(path, text):
    # type: (bytes, bytes) -> None
    """Write ``text`` to the file at ``path``, opened in b'ab' mode."""
    with open(path, b'ab') as sink:
        sink.write(text)
2666
2669
2667
2670
class chunkbuffer:
    """Allow arbitrary sized chunks of data to be efficiently read from an
    iterator over chunks of arbitrary size."""

    def __init__(self, in_iter):
        """in_iter is the iterator that's iterating over the input chunks."""

        def splitbig(chunks):
            # chunks larger than 2 ** 20 bytes are re-cut into pieces of
            # at most 2 ** 18 bytes; smaller ones pass through untouched
            for chunk in chunks:
                if len(chunk) > 2 ** 20:
                    pos = 0
                    while pos < len(chunk):
                        end = pos + 2 ** 18
                        yield chunk[pos:end]
                        pos = end
                else:
                    yield chunk

        self.iter = splitbig(in_iter)
        # chunks pulled from the iterator but not fully consumed yet
        self._queue = collections.deque()
        # number of bytes already consumed from self._queue[0]
        self._chunkoffset = 0

    def read(self, l=None):
        """Read L bytes of data from the iterator of chunks of data.
        Returns less than L bytes if the iterator runs dry.

        If size parameter is omitted, read everything"""
        if l is None:
            queue = self._queue
            if not queue:
                return b''.join(self.iter)
            # An earlier sized read may have left data in the queue;
            # return it (minus the consumed prefix of the first chunk)
            # ahead of whatever the iterator still has to offer.
            pending = list(queue)
            pending[0] = pending[0][self._chunkoffset :]
            queue.clear()
            self._chunkoffset = 0
            pending.extend(self.iter)
            return b''.join(pending)

        left = l
        buf = []
        queue = self._queue
        while left > 0:
            # refill the queue
            if not queue:
                target = 2 ** 18
                for chunk in self.iter:
                    queue.append(chunk)
                    target -= len(chunk)
                    if target <= 0:
                        break
                if not queue:
                    break

            # The easy way to do this would be to queue.popleft(), modify the
            # chunk (if necessary), then queue.appendleft(). However, for cases
            # where we read partial chunk content, this incurs 2 dequeue
            # mutations and creates a new str for the remaining chunk in the
            # queue. Our code below avoids this overhead.

            chunk = queue[0]
            chunkl = len(chunk)
            offset = self._chunkoffset

            # Use full chunk.
            if offset == 0 and left >= chunkl:
                left -= chunkl
                queue.popleft()
                buf.append(chunk)
                # self._chunkoffset remains at 0.
                continue

            chunkremaining = chunkl - offset

            # Use all of unconsumed part of chunk.
            if left >= chunkremaining:
                left -= chunkremaining
                queue.popleft()
                # offset == 0 is enabled by block above, so this won't merely
                # copy via ``chunk[0:]``.
                buf.append(chunk[offset:])
                self._chunkoffset = 0

            # Partial chunk needed.
            else:
                buf.append(chunk[offset : offset + left])
                self._chunkoffset += left
                # drives ``left`` below zero, which ends the loop
                left -= chunkremaining

        return b''.join(buf)
2749
2752
2750
2753
def filechunkiter(f, size=131072, limit=None):
    """Yield the content of file object ``f`` in pieces.

    Each piece is requested with at most ``size`` bytes (default
    131072).  When ``limit`` is given, no more than ``limit`` bytes are
    read in total; the default is to read all data.  A piece may be
    shorter than ``size`` when it is the last one in the file, or when
    the file is a socket or some other type of file that sometimes
    reads less data than is requested.
    """
    assert size >= 0
    assert limit is None or limit >= 0
    remaining = limit
    while True:
        want = size if remaining is None else min(remaining, size)
        if not want:
            # nothing (more) may be requested
            return
        piece = f.read(want)
        if not piece:
            # end of data
            return
        if remaining:
            remaining -= len(piece)
        yield piece
2771
2774
2772
2775
class cappedreader:
    """A file object proxy that allows reading up to N bytes.

    Given a source file object, instances of this type allow reading up to
    N bytes from that source file object. Attempts to read past the allowed
    limit are treated as EOF.

    It is assumed that I/O is not performed on the original file object
    in addition to I/O that is performed by this instance. If there is,
    state tracking will get out of sync and unexpected results will ensue.
    """

    def __init__(self, fh, limit):
        """Allow reading up to <limit> bytes from <fh>."""
        self._fh = fh
        # number of bytes that may still be read through this proxy
        self._left = limit

    def read(self, n=-1):
        """Read up to ``n`` bytes, never going past the configured limit.

        A negative ``n`` or ``None`` means "everything that is still
        allowed".  Returns b'' once the limit has been reached.
        """
        if not self._left:
            return b''

        # None is accepted like a negative size, as file objects do
        if n is None or n < 0:
            n = self._left

        data = self._fh.read(min(n, self._left))
        self._left -= len(data)
        assert self._left >= 0

        return data

    def readinto(self, b):
        """Fill the writable buffer ``b`` and return the number of bytes read"""
        res = self.read(len(b))
        if res is None:
            return None

        b[0 : len(res)] = res
        return len(res)
2810
2813
2811
2814
def unitcountfn(*unittable):
    '''return a function that renders a readable count of some quantity

    Each entry of ``unittable`` is a ``(multiplier, divisor, format)``
    tuple.  The first entry for which ``abs(count) >= divisor *
    multiplier`` holds is used: ``count / divisor`` is rendered with
    ``format``.  When no entry matches, the last entry is used.
    '''

    def go(count):
        for multiplier, divisor, format in unittable:
            if abs(count) >= divisor * multiplier:
                return format % (count / float(divisor))
        # Below every threshold: still scale by the last unit's divisor,
        # so the value matches the unit named in its format.
        multiplier, divisor, format = unittable[-1]
        return format % (count / float(divisor))

    return go
2822
2825
2823
2826
def processlinerange(fromline, toline):
    # type: (int, int) -> Tuple[int, int]
    """Validate the line range <fromline>:<toline> and convert it to a
    0-based range.

    >>> processlinerange(10, 20)
    (9, 20)
    >>> processlinerange(2, 1)
    Traceback (most recent call last):
        ...
    ParseError: line range must be positive
    >>> processlinerange(0, 5)
    Traceback (most recent call last):
        ...
    ParseError: fromline must be strictly positive
    """
    # the range check comes first, so it wins when both checks fail
    if toline < fromline:
        raise error.ParseError(_(b"line range must be positive"))
    if fromline < 1:
        raise error.ParseError(_(b"fromline must be strictly positive"))
    start = fromline - 1
    return start, toline
2845
2848
2846
2849
# Renders a byte count with a unit chosen by magnitude.  Rows are
# (multiplier, divisor, format); see unitcountfn() for how they are used.
bytecount = unitcountfn(
    (100, 2 ** 30, _(b'%.0f GB')),
    (10, 2 ** 30, _(b'%.1f GB')),
    (1, 2 ** 30, _(b'%.2f GB')),
    (100, 2 ** 20, _(b'%.0f MB')),
    (10, 2 ** 20, _(b'%.1f MB')),
    (1, 2 ** 20, _(b'%.2f MB')),
    (100, 2 ** 10, _(b'%.0f KB')),
    (10, 2 ** 10, _(b'%.1f KB')),
    (1, 2 ** 10, _(b'%.2f KB')),
    (1, 1, _(b'%.0f bytes')),
)
2859
2862
2860
2863
class transformingwriter:
    """Writable file wrapper to transform data by function"""

    def __init__(self, fp, encode):
        # fp: the wrapped file object; encode: callable applied to the
        # data of every write() before it reaches fp
        self._fp = fp
        self._encode = encode

    def close(self):
        """Close the wrapped file object"""
        self._fp.close()

    def flush(self):
        """Flush the wrapped file object"""
        self._fp.flush()

    def write(self, data):
        """Write ``encode(data)`` and return what the wrapped write() returns"""
        transformed = self._encode(data)
        return self._fp.write(transformed)
2876
2879
2877
2880
# Matches a single EOL: either a LF, or a CRLF whose (possibly repeated)
# leading CRs are consumed together with the LF so that a substitution
# removes them.  We do not care about old Macintosh files, so a stray CR
# (one that is not followed by a LF) is never matched.
_eolre = remod.compile(br'\r*\n')
2882
2885
2883
2886
def tolf(s):
    # type: (bytes) -> bytes
    """Return ``s`` with every match of ``_eolre`` replaced by b'\\n'."""
    lf = b'\n'
    return _eolre.sub(lf, s)
2887
2890
2888
2891
def tocrlf(s):
    # type: (bytes) -> bytes
    """Return ``s`` with every match of ``_eolre`` replaced by b'\\r\\n'."""
    crlf = b'\r\n'
    return _eolre.sub(crlf, s)
2892
2895
2893
2896
def _crlfwriter(fp):
    """Wrap ``fp`` in a transformingwriter that applies tocrlf() on write."""
    return transformingwriter(fp, encode=tocrlf)
2896
2899
2897
2900
# Pick the EOL helpers once, at import time, from the platform line
# separator: identity functions everywhere except where it is CRLF.
if pycompat.oslinesep != b'\r\n':
    tonativeeol = pycompat.identity
    fromnativeeol = pycompat.identity
    nativeeolwriter = pycompat.identity
else:
    tonativeeol = tocrlf
    fromnativeeol = tolf
    nativeeolwriter = _crlfwriter
2906
2909
2907
2910
# TODO delete since workaround variant for Python 2 no longer needed.
def iterfile(fp):
    """Return ``fp`` itself (kept as a no-op for existing callers)."""
    return fp
2911
2914
2912
2915
def iterlines(iterator):
    # type: (Iterable[bytes]) -> Iterator[bytes]
    """Yield the lines of every chunk in ``iterator``, one at a time.

    Each chunk is split on its own with splitlines(), so line endings
    are dropped and a line spanning two chunks comes out as two lines.
    """
    for chunk in iterator:
        yield from chunk.splitlines()
2918
2921
2919
2922
def expandpath(path):
    # type: (bytes) -> bytes
    """Expand environment variables, then a user home prefix, in ``path``."""
    with_vars = os.path.expandvars(path)
    return os.path.expanduser(with_vars)
2923
2926
2924
2927
def interpolate(prefix, mapping, s, fn=None, escape_prefix=False):
    """Return the result of interpolating items in the mapping into string s.

    prefix is a single character string, or a two character string with
    a backslash as the first character if the prefix needs to be escaped in
    a regular expression.

    The keys of mapping are joined with ``|`` into the regular expression
    as they are, i.e. without any escaping.

    fn is an optional function that will be applied to the replacement text
    just before replacement.

    escape_prefix is an optional flag that allows using doubled prefix for
    its escaping.

    The mapping passed by the caller is never modified.
    """
    fn = fn or (lambda s: s)
    patterns = b'|'.join(mapping.keys())
    if escape_prefix:
        patterns += b'|' + prefix
        if len(prefix) > 1:
            # drop the regexp backslash to get the literal character
            prefix_char = prefix[1:]
        else:
            prefix_char = prefix
        # a doubled prefix maps to the prefix itself; use a copy so the
        # extra key does not leak into the caller's mapping
        mapping = dict(mapping)
        mapping[prefix_char] = prefix_char
    r = remod.compile(br'%s(%s)' % (prefix, patterns))
    # x.group() is the prefix character followed by the matched key
    return r.sub(lambda x: fn(mapping[x.group()[1:]]), s)
2949
2952
2950
2953
# Formatter for durations expressed in seconds. The rows are passed to
# unitcountfn (defined elsewhere in this file) in this order; presumably each
# row is (multiplier, divisor, format) and the first row that fits is used,
# so keep them sorted from the largest unit to the smallest -- confirm against
# unitcountfn before reordering.
timecount = unitcountfn(
    (1, 1e3, _(b'%.0f s')),
    (100, 1, _(b'%.1f s')),
    (10, 1, _(b'%.2f s')),
    (1, 1, _(b'%.3f s')),
    (100, 1e-3, _(b'%.1f ms')),
    (10, 1e-3, _(b'%.2f ms')),
    (1, 1e-3, _(b'%.3f ms')),
    (100, 1e-6, _(b'%.1f us')),
    (10, 1e-6, _(b'%.2f us')),
    (1, 1e-6, _(b'%.3f us')),
    (100, 1e-9, _(b'%.1f ns')),
    (10, 1e-9, _(b'%.2f ns')),
    (1, 1e-9, _(b'%.3f ns')),
)
2966
2969
2967
2970
@attr.s
class timedcmstats:
    """Stats information produced by the timedcm context manager on entering."""

    # the starting value of the timer as a float (meaning and resolution are
    # platform dependent, see util.timer)
    start = attr.ib(default=attr.Factory(lambda: timer()))
    # the number of seconds as a floating point value; starts at 0, updated when
    # the context is exited.
    elapsed = attr.ib(default=0)
    # the number of nested timedcm context managers.
    level = attr.ib(default=1)

    def __bytes__(self):
        # A falsy elapsed (still the initial 0) means there is no measurement
        # to format yet.
        if not self.elapsed:
            return b'<unknown>'
        return timecount(self.elapsed)

    __str__ = encoding.strmethod(__bytes__)
2985
2988
2986
2989
@contextlib.contextmanager
def timedcm(whencefmt, *whenceargs):
    """A context manager that produces timing information for a given context.

    On entering, a timedcmstats instance is produced; its ``elapsed`` field
    is filled in when the context exits, whether normally or through an
    exception.

    ``whencefmt`` and ``whenceargs`` are passed through to ``tracing.log``.

    This context manager is reentrant.

    """
    # track nested context managers
    depth = timedcm._nested + 1
    timedcm._nested = depth
    timing_stats = timedcmstats(level=depth)
    try:
        with tracing.log(whencefmt, *whenceargs):
            yield timing_stats
    finally:
        timing_stats.elapsed = timer() - timing_stats.start
        timedcm._nested -= 1


# Nesting depth of the currently active timedcm contexts.
timedcm._nested = 0
3008
3011
3009
3012
def timed(func):
    """Report the execution time of a function call to stderr.

    During development, use as a decorator when you need to measure
    the cost of a function, e.g. as follows:

    @util.timed
    def foo(a, b, c):
        pass

    The returned wrapper forwards all arguments and the return value of
    ``func`` unchanged and keeps its name and docstring. Nothing is reported
    when ``func`` raises.
    """
    # Local import: functools is not otherwise needed by this helper.
    import functools

    @functools.wraps(func)
    def wrapper(*args, **kwargs):
        name = pycompat.bytestr(func.__name__)
        with timedcm(name) as time_stats:
            result = func(*args, **kwargs)
        # Indent by nesting level so nested timed calls read as a tree.
        indent = b' ' * time_stats.level * 2
        procutil.stderr.write(b'%s%s: %s\n' % (indent, name, time_stats))
        return result

    return wrapper
3036
3039
3037
3040
# Suffix table for sizetoint(). Lookup is first-match on endswith(), so the
# bare b'b' entry must stay after b'kb'/b'mb'/b'gb', which also end in b'b'.
_sizeunits = (
    (b'm', 2 ** 20),
    (b'k', 2 ** 10),
    (b'g', 2 ** 30),
    (b'kb', 2 ** 10),
    (b'mb', 2 ** 20),
    (b'gb', 2 ** 30),
    (b'b', 1),
)


def sizetoint(s):
    # type: (bytes) -> int
    """Convert a space specifier to a byte count.

    The specifier is a number optionally followed by one of the suffixes in
    ``_sizeunits`` (case-insensitive). Raises error.ParseError when the
    value cannot be converted.

    >>> sizetoint(b'30')
    30
    >>> sizetoint(b'2.2kb')
    2252
    >>> sizetoint(b'6M')
    6291456
    """
    t = s.strip().lower()
    try:
        for k, u in _sizeunits:
            if t.endswith(k):
                return int(float(t[: -len(k)]) * u)
        return int(t)
    except (ValueError, OverflowError):
        # OverflowError comes from int() of an infinite float, e.g. for
        # b'infkb' or b'1e999mb'; report it like any other bad size.
        raise error.ParseError(_(b"couldn't parse size: %s") % s)
3068
3071
3069
3072
class hooks:
    """A collection of hook functions that can be used to extend a
    function's behavior. Hooks are called in lexicographic order,
    based on the names of their sources."""

    def __init__(self):
        # list of (source, hook) pairs; sorted lazily when called
        self._hooks = []

    def add(self, source, hook):
        """Register ``hook`` under the source name ``source``."""
        self._hooks.append((source, hook))

    def __call__(self, *args):
        """Call every hook with ``args`` and return the list of results."""
        self._hooks.sort(key=lambda entry: entry[0])
        return [hook(*args) for _source, hook in self._hooks]
3087
3090
3088
3091
def getstackframes(skip=0, line=b' %-*s in %s\n', fileline=b'%s:%d', depth=0):
    """Yields lines for a nicely formatted stacktrace.
    Skips the 'skip' last entries, then returns the last 'depth' entries
    (all remaining entries when 'depth' is 0).
    Each file+linenumber is formatted according to fileline.
    Each line is formatted according to line.
    If line is None, it yields:
      length of longest filepath+line number,
      filepath+linenumber,
      function

    Not to be used in production code but very convenient while developing.
    """
    # The "- 1" drops this function's own frame from the end of the stack.
    frames = traceback.extract_stack()[: -skip - 1]
    entries = []
    for fn, ln, func, _text in frames:
        location = fileline % (pycompat.sysbytes(fn), ln)
        entries.append((location, pycompat.sysbytes(func)))
    # With depth == 0 this is [-0:], i.e. the whole list.
    entries = entries[-depth:]
    if not entries:
        return
    fnmax = max(len(location) for location, _func in entries)
    for fnln, func in entries:
        if line is None:
            yield (fnmax, fnln, func)
        else:
            yield line % (fnmax, fnln, func)
3112
3115
3113
3116
def debugstacktrace(
    msg=b'stacktrace',
    skip=0,
    f=procutil.stderr,
    otherf=procutil.stdout,
    depth=0,
    prefix=b'',
):
    """Writes a message to f (stderr) with a nicely formatted stacktrace.
    Skips the 'skip' entries closest to the call, then shows 'depth' entries.
    By default it will flush stdout first.
    Every written line starts with 'prefix'.
    It can be used everywhere and intentionally does not require an ui object.
    Not to be used in production code but very convenient while developing.
    """
    if otherf:
        otherf.flush()
    header = b'%s%s at:\n' % (prefix, msg.rstrip())
    f.write(header)
    # skip + 1 additionally hides this function's own frame.
    for frameline in getstackframes(skip + 1, depth=depth):
        f.write(prefix + frameline)
    f.flush()


# convenient shortcut
dst = debugstacktrace
3138
3141
3139
3142
def safename(f, tag, ctx, others=None):
    """
    Generate a name that it is safe to rename f to in the given context.

    f:      filename to rename
    tag:    a string tag that will be included in the new name
    ctx:    a context, in which the new name must not exist
    others: a set of other filenames that the new name must not be in

    Returns a file name of the form oldname~tag[~number] which does not exist
    in the provided context and is not in the set of other names.
    """
    if others is None:
        others = set()

    fn = b'%s~%s' % (f, tag)
    if fn not in ctx and fn not in others:
        return fn
    for n in itertools.count(1):
        # n is an int: bytes %-formatting only accepts it through %d, while
        # %s demands a bytes-like object and raises TypeError.
        fn = b'%s~%s~%d' % (f, tag, n)
        if fn not in ctx and fn not in others:
            return fn
3162
3165
3163
3166
def readexactly(stream, n):
    '''read n bytes from stream.read and abort if less was available'''
    data = stream.read(n)
    got = len(data)
    if got >= n:
        return data
    raise error.Abort(
        _(b"stream ended unexpectedly (got %d bytes, expected %d)")
        % (got, n)
    )
3173
3176
3174
3177
def uvarintencode(value):
    """Encode an unsigned integer value to a varint.

    A varint is a variable length integer of 1 or more bytes. Each byte
    except the last has the most significant bit set. The lower 7 bits of
    each byte store the 2's complement representation, least significant group
    first.

    Raises error.ProgrammingError if value is negative.

    >>> uvarintencode(0)
    '\\x00'
    >>> uvarintencode(1)
    '\\x01'
    >>> uvarintencode(127)
    '\\x7f'
    >>> uvarintencode(1337)
    '\\xb9\\n'
    >>> uvarintencode(65536)
    '\\x80\\x80\\x04'
    >>> uvarintencode(-1)
    Traceback (most recent call last):
        ...
    ProgrammingError: negative value for uvarint: -1
    """
    if value < 0:
        raise error.ProgrammingError(b'negative value for uvarint: %d' % value)
    encoded = bytearray()
    # Emit 7-bit groups, least significant first, with the continuation bit
    # set while more groups remain.
    while value > 0x7F:
        encoded.append(0x80 | (value & 0x7F))
        value >>= 7
    # Final group: continuation bit clear.
    encoded.append(value)
    return bytes(encoded)
3210
3213
3211
3214
def uvarintdecodestream(fh):
    """Decode an unsigned variable length integer from a stream.

    The passed argument is anything that has a ``.read(N)`` method. Bytes
    are consumed one at a time up to and including the first byte whose
    most significant bit is clear.

    >>> from io import BytesIO
    >>> uvarintdecodestream(BytesIO(b'\\x00'))
    0
    >>> uvarintdecodestream(BytesIO(b'\\x01'))
    1
    >>> uvarintdecodestream(BytesIO(b'\\x7f'))
    127
    >>> uvarintdecodestream(BytesIO(b'\\xb9\\n'))
    1337
    >>> uvarintdecodestream(BytesIO(b'\\x80\\x80\\x04'))
    65536
    >>> uvarintdecodestream(BytesIO(b'\\x80'))
    Traceback (most recent call last):
        ...
    Abort: stream ended unexpectedly (got 0 bytes, expected 1)
    """
    result = 0
    # Each byte contributes 7 payload bits, least significant group first.
    for shift in itertools.count(0, 7):
        byte = ord(readexactly(fh, 1))
        result |= (byte & 0x7F) << shift
        if not byte & 0x80:
            return result
3241
3244
3242
3245
3243 # Passing the '' locale means that the locale should be set according to the
3246 # Passing the '' locale means that the locale should be set according to the
3244 # user settings (environment variables).
3247 # user settings (environment variables).
3245 # Python sometimes avoids setting the global locale settings. When interfacing
3248 # Python sometimes avoids setting the global locale settings. When interfacing
3246 # with C code (e.g. the curses module or the Subversion bindings), the global
3249 # with C code (e.g. the curses module or the Subversion bindings), the global
3247 # locale settings must be initialized correctly. Python 2 does not initialize
3250 # locale settings must be initialized correctly. Python 2 does not initialize
3248 # the global locale settings on interpreter startup. Python 3 sometimes
3251 # the global locale settings on interpreter startup. Python 3 sometimes
3249 # initializes LC_CTYPE, but not consistently at least on Windows. Therefore we
3252 # initializes LC_CTYPE, but not consistently at least on Windows. Therefore we
3250 # explicitly initialize it to get consistent behavior if it's not already
3253 # explicitly initialize it to get consistent behavior if it's not already
3251 # initialized. Since CPython commit 177d921c8c03d30daa32994362023f777624b10d,
3254 # initialized. Since CPython commit 177d921c8c03d30daa32994362023f777624b10d,
3252 # LC_CTYPE is always initialized. If we require Python 3.8+, we should re-check
3255 # LC_CTYPE is always initialized. If we require Python 3.8+, we should re-check
3253 # if we can remove this code.
3256 # if we can remove this code.
@contextlib.contextmanager
def with_lc_ctype():
    """Run the context with LC_CTYPE initialized from the environment.

    Only acts when the current LC_CTYPE is 'C': it is then set from the user
    settings for the duration of the context and restored to 'C' on exit.
    Any other current value is left untouched.
    """
    oldloc = locale.setlocale(locale.LC_CTYPE, None)
    if oldloc != 'C':
        yield
        return
    try:
        # The likely failure is that the locale from the environment
        # variables is unknown; carry on with 'C' in that case.
        with contextlib.suppress(locale.Error):
            locale.setlocale(locale.LC_CTYPE, '')
        yield
    finally:
        locale.setlocale(locale.LC_CTYPE, oldloc)
3270
3273
3271
3274
def _estimatememory():
    # type: () -> Optional[int]
    """Provide an estimate for the available system memory in Bytes.

    On Windows this is the available physical memory reported by
    GlobalMemoryStatusEx; elsewhere it is page size times the number of
    physical pages as reported by sysconf.

    If no estimate can be provided on the platform, returns None.
    """
    if pycompat.sysplatform.startswith(b'win'):
        # On Windows, use the GlobalMemoryStatusEx kernel function directly.
        # The helpers are imported from ctypes itself, which is where they
        # are defined; DWORD is an unsigned 32-bit value in the Win32 API.
        from ctypes import (  # pytype: disable=import-error
            Structure,
            byref,
            c_ulong as DWORD,
            c_ulonglong as DWORDLONG,
            sizeof,
            windll,
        )

        class MEMORYSTATUSEX(Structure):
            _fields_ = [
                ('dwLength', DWORD),
                ('dwMemoryLoad', DWORD),
                ('ullTotalPhys', DWORDLONG),
                ('ullAvailPhys', DWORDLONG),
                ('ullTotalPageFile', DWORDLONG),
                ('ullAvailPageFile', DWORDLONG),
                ('ullTotalVirtual', DWORDLONG),
                ('ullAvailVirtual', DWORDLONG),
                ('ullExtendedVirtual', DWORDLONG),
            ]

        x = MEMORYSTATUSEX()
        # The API requires dwLength to be set before the call.
        x.dwLength = sizeof(x)
        if not windll.kernel32.GlobalMemoryStatusEx(byref(x)):
            # The call failed, so the structure was not filled in; report
            # "no estimate" instead of a bogus 0 bytes.
            return None
        return x.ullAvailPhys

    # On newer Unix-like systems and Mac OSX, the sysconf interface
    # can be used. _SC_PAGE_SIZE is part of POSIX; _SC_PHYS_PAGES
    # seems to be implemented on most systems.
    try:
        pagesize = os.sysconf(os.sysconf_names['SC_PAGE_SIZE'])
        pages = os.sysconf(os.sysconf_names['SC_PHYS_PAGES'])
    except (OSError, KeyError):
        # OSError: sysconf can fail; KeyError: unknown parameter
        return None
    return pagesize * pages
General Comments 0
You need to be logged in to leave comments. Login now