Show More
util.py
1805 lines
| 56.2 KiB
| text/x-python
|
PythonLexer
/ mercurial / util.py
timeless@mozdev.org
|
r17515 | # util.py - Mercurial utility functions and platform specific implementations | ||
Martin Geisler
|
r8226 | # | ||
# Copyright 2005 K. Thananchayan <thananck@yahoo.com> | ||||
# Copyright 2005-2007 Matt Mackall <mpm@selenic.com> | ||||
# Copyright 2006 Vadim Gelfer <vadim.gelfer@gmail.com> | ||||
# | ||||
# This software may be used and distributed according to the terms of the | ||||
Matt Mackall
|
r10263 | # GNU General Public License version 2 or any later version. | ||
mpm@selenic.com
|
r1082 | |||
timeless@mozdev.org
|
r17515 | """Mercurial utility functions and platform specific implementations. | ||
mpm@selenic.com
|
r1082 | |||
Martin Geisler
|
r8227 | This contains helper routines that are independent of the SCM core and | ||
hide platform-specific details from the core. | ||||
mpm@selenic.com
|
r1082 | """ | ||
mpm@selenic.com
|
r419 | |||
Matt Mackall
|
r3891 | from i18n import _ | ||
Bryan O'Sullivan
|
r16803 | import error, osutil, encoding, collections | ||
Matt Mackall
|
r11758 | import errno, re, shutil, sys, tempfile, traceback | ||
Dmitry Panov
|
r15505 | import os, time, datetime, calendar, textwrap, signal | ||
Brodie Rao
|
r14076 | import imp, socket, urllib | ||
Matt Mackall
|
r3769 | |||
Adrian Buehlmann
|
r14912 | if os.name == 'nt': | ||
Adrian Buehlmann
|
r14926 | import windows as platform | ||
Adrian Buehlmann
|
r14912 | else: | ||
Adrian Buehlmann
|
r14926 | import posix as platform | ||
Idan Kamara
|
r14927 | cachestat = platform.cachestat | ||
Adrian Buehlmann
|
r14926 | checkexec = platform.checkexec | ||
checklink = platform.checklink | ||||
Adrian Buehlmann
|
r15011 | copymode = platform.copymode | ||
Adrian Buehlmann
|
r14926 | executablepath = platform.executablepath | ||
expandglobs = platform.expandglobs | ||||
explainexit = platform.explainexit | ||||
findexe = platform.findexe | ||||
gethgcmd = platform.gethgcmd | ||||
getuser = platform.getuser | ||||
groupmembers = platform.groupmembers | ||||
groupname = platform.groupname | ||||
hidewindow = platform.hidewindow | ||||
isexec = platform.isexec | ||||
isowner = platform.isowner | ||||
localpath = platform.localpath | ||||
lookupreg = platform.lookupreg | ||||
makedir = platform.makedir | ||||
nlinks = platform.nlinks | ||||
normpath = platform.normpath | ||||
Matt Mackall
|
r15488 | normcase = platform.normcase | ||
Adrian Buehlmann
|
r14926 | openhardlinks = platform.openhardlinks | ||
oslink = platform.oslink | ||||
parsepatchoutput = platform.parsepatchoutput | ||||
pconvert = platform.pconvert | ||||
popen = platform.popen | ||||
posixfile = platform.posixfile | ||||
quotecommand = platform.quotecommand | ||||
realpath = platform.realpath | ||||
rename = platform.rename | ||||
samedevice = platform.samedevice | ||||
samefile = platform.samefile | ||||
samestat = platform.samestat | ||||
setbinary = platform.setbinary | ||||
setflags = platform.setflags | ||||
setsignalhandler = platform.setsignalhandler | ||||
shellquote = platform.shellquote | ||||
spawndetached = platform.spawndetached | ||||
Bryan O'Sullivan
|
r17560 | split = platform.split | ||
Adrian Buehlmann
|
r14926 | sshargs = platform.sshargs | ||
statfiles = platform.statfiles | ||||
termwidth = platform.termwidth | ||||
testpid = platform.testpid | ||||
umask = platform.umask | ||||
unlink = platform.unlink | ||||
unlinkpath = platform.unlinkpath | ||||
username = platform.username | ||||
Adrian Buehlmann
|
r14912 | |||
Dirkjan Ochtman
|
r6470 | # Python compatibility | ||
Matt Mackall
|
r3769 | |||
Matt Mackall
|
r15656 | _notset = object() | ||
def safehasattr(thing, attr): | ||||
return getattr(thing, attr, _notset) is not _notset | ||||
Matt Mackall
|
r15390 | def sha1(s=''): | ||
Matt Mackall
|
r15392 | ''' | ||
Low-overhead wrapper around Python's SHA support | ||||
>>> f = _fastsha1 | ||||
>>> a = sha1() | ||||
>>> a = f() | ||||
>>> a.hexdigest() | ||||
'da39a3ee5e6b4b0d3255bfef95601890afd80709' | ||||
''' | ||||
Martin Geisler
|
r8297 | return _fastsha1(s) | ||
Matt Mackall
|
r15390 | def _fastsha1(s=''): | ||
Martin Geisler
|
r8297 | # This function will import sha1 from hashlib or sha (whichever is | ||
# available) and overwrite itself with it on the first call. | ||||
# Subsequent calls will go directly to the imported function. | ||||
Sol Jerome
|
r12051 | if sys.version_info >= (2, 5): | ||
Martin Geisler
|
r8297 | from hashlib import sha1 as _sha1 | ||
Sol Jerome
|
r12051 | else: | ||
Sune Foldager
|
r8295 | from sha import sha as _sha1 | ||
Simon Heimberg
|
r8309 | global _fastsha1, sha1 | ||
_fastsha1 = sha1 = _sha1 | ||||
Dirkjan Ochtman
|
r6470 | return _sha1(s) | ||
Renato Cunha
|
r11565 | try: | ||
Matt Mackall
|
r15657 | buffer = buffer | ||
Renato Cunha
|
r11565 | except NameError: | ||
Matt Mackall
|
r15657 | if sys.version_info[0] < 3: | ||
def buffer(sliceable, offset=0): | ||||
return sliceable[offset:] | ||||
else: | ||||
def buffer(sliceable, offset=0): | ||||
return memoryview(sliceable)[offset:] | ||||
Ronny Pfannschmidt
|
r10756 | |||
Martin Geisler
|
r8280 | import subprocess | ||
closefds = os.name == 'posix' | ||||
Patrick Mezard
|
r10197 | |||
Patrick Mezard
|
r10199 | def popen2(cmd, env=None, newlines=False): | ||
Martin Geisler
|
r9089 | # Setting bufsize to -1 lets the system decide the buffer size. | ||
# The default for bufsize is 0, meaning unbuffered. This leads to | ||||
# poor performance on Mac OS X: http://bugs.python.org/issue4194 | ||||
p = subprocess.Popen(cmd, shell=True, bufsize=-1, | ||||
Bryan O'Sullivan
|
r9083 | close_fds=closefds, | ||
Patrick Mezard
|
r10197 | stdin=subprocess.PIPE, stdout=subprocess.PIPE, | ||
Patrick Mezard
|
r10199 | universal_newlines=newlines, | ||
env=env) | ||||
Martin Geisler
|
r8280 | return p.stdin, p.stdout | ||
Patrick Mezard
|
r10197 | |||
Patrick Mezard
|
r10199 | def popen3(cmd, env=None, newlines=False): | ||
Martin Geisler
|
r9089 | p = subprocess.Popen(cmd, shell=True, bufsize=-1, | ||
Bryan O'Sullivan
|
r9083 | close_fds=closefds, | ||
Martin Geisler
|
r8280 | stdin=subprocess.PIPE, stdout=subprocess.PIPE, | ||
Patrick Mezard
|
r10197 | stderr=subprocess.PIPE, | ||
Patrick Mezard
|
r10199 | universal_newlines=newlines, | ||
env=env) | ||||
Martin Geisler
|
r8280 | return p.stdin, p.stdout, p.stderr | ||
Dirkjan Ochtman
|
r7106 | |||
Matt Mackall
|
r7632 | def version(): | ||
"""Return version information if available.""" | ||||
try: | ||||
import __version__ | ||||
return __version__.version | ||||
except ImportError: | ||||
return 'unknown' | ||||
Chris Mason
|
r2609 | # used by parsedate | ||
Matt Mackall
|
r3808 | defaultdateformats = ( | ||
'%Y-%m-%d %H:%M:%S', | ||||
'%Y-%m-%d %I:%M:%S%p', | ||||
'%Y-%m-%d %H:%M', | ||||
'%Y-%m-%d %I:%M%p', | ||||
'%Y-%m-%d', | ||||
'%m-%d', | ||||
'%m/%d', | ||||
'%m/%d/%y', | ||||
'%m/%d/%Y', | ||||
'%a %b %d %H:%M:%S %Y', | ||||
'%a %b %d %I:%M:%S%p %Y', | ||||
Markus F.X.J. Oberhumer
|
r4708 | '%a, %d %b %Y %H:%M:%S', # GNU coreutils "/bin/date --rfc-2822" | ||
Matt Mackall
|
r3808 | '%b %d %H:%M:%S %Y', | ||
Matt Mackall
|
r3812 | '%b %d %I:%M:%S%p %Y', | ||
'%b %d %H:%M:%S', | ||||
Matt Mackall
|
r3808 | '%b %d %I:%M:%S%p', | ||
'%b %d %H:%M', | ||||
'%b %d %I:%M%p', | ||||
'%b %d %Y', | ||||
'%b %d', | ||||
'%H:%M:%S', | ||||
Carey Evans
|
r9383 | '%I:%M:%S%p', | ||
Matt Mackall
|
r3808 | '%H:%M', | ||
'%I:%M%p', | ||||
) | ||||
Chris Mason
|
r2609 | |||
Matt Mackall
|
r3812 | extendeddateformats = defaultdateformats + ( | ||
"%Y", | ||||
"%Y-%m", | ||||
"%b", | ||||
"%b %Y", | ||||
) | ||||
Chris Mason
|
r2609 | |||
Brendan Cully
|
r3145 | def cachefunc(func): | ||
'''cache the result of function calls''' | ||||
Benoit Boissinot
|
r3147 | # XXX doesn't handle keywords args | ||
Brendan Cully
|
r3145 | cache = {} | ||
if func.func_code.co_argcount == 1: | ||||
Benoit Boissinot
|
r3147 | # we gain a small amount of time because | ||
# we don't need to pack/unpack the list | ||||
Brendan Cully
|
r3145 | def f(arg): | ||
if arg not in cache: | ||||
cache[arg] = func(arg) | ||||
return cache[arg] | ||||
else: | ||||
def f(*args): | ||||
if args not in cache: | ||||
cache[args] = func(*args) | ||||
return cache[args] | ||||
return f | ||||
Bryan O'Sullivan
|
r16834 | try: | ||
collections.deque.remove | ||||
deque = collections.deque | ||||
except AttributeError: | ||||
# python 2.4 lacks deque.remove | ||||
class deque(collections.deque): | ||||
def remove(self, val): | ||||
for i, v in enumerate(self): | ||||
if v == val: | ||||
del self[i] | ||||
break | ||||
Matt Mackall
|
r9097 | def lrucachefunc(func): | ||
'''cache most recent results of function calls''' | ||||
cache = {} | ||||
Bryan O'Sullivan
|
r16834 | order = deque() | ||
Matt Mackall
|
r9097 | if func.func_code.co_argcount == 1: | ||
def f(arg): | ||||
if arg not in cache: | ||||
if len(cache) > 20: | ||||
Bryan O'Sullivan
|
r16803 | del cache[order.popleft()] | ||
Matt Mackall
|
r9097 | cache[arg] = func(arg) | ||
else: | ||||
order.remove(arg) | ||||
order.append(arg) | ||||
return cache[arg] | ||||
else: | ||||
def f(*args): | ||||
if args not in cache: | ||||
if len(cache) > 20: | ||||
Bryan O'Sullivan
|
r16803 | del cache[order.popleft()] | ||
Matt Mackall
|
r9097 | cache[args] = func(*args) | ||
else: | ||||
order.remove(args) | ||||
order.append(args) | ||||
return cache[args] | ||||
return f | ||||
Matt Mackall
|
r8207 | class propertycache(object): | ||
def __init__(self, func): | ||||
self.func = func | ||||
self.name = func.__name__ | ||||
def __get__(self, obj, type=None): | ||||
result = self.func(obj) | ||||
setattr(obj, self.name, result) | ||||
return result | ||||
Bryan O'Sullivan
|
r1293 | def pipefilter(s, cmd): | ||
'''filter string S through command CMD, returning its output''' | ||||
Martin Geisler
|
r8302 | p = subprocess.Popen(cmd, shell=True, close_fds=closefds, | ||
stdin=subprocess.PIPE, stdout=subprocess.PIPE) | ||||
pout, perr = p.communicate(s) | ||||
return pout | ||||
mpm@selenic.com
|
r419 | |||
Bryan O'Sullivan
|
r1293 | def tempfilter(s, cmd): | ||
'''filter string S through a pair of temporary files with CMD. | ||||
CMD is used as a template to create the real command to be run, | ||||
with the strings INFILE and OUTFILE replaced by the real names of | ||||
the temporary files generated.''' | ||||
inname, outname = None, None | ||||
try: | ||||
Thomas Arendsen Hein
|
r2165 | infd, inname = tempfile.mkstemp(prefix='hg-filter-in-') | ||
Bryan O'Sullivan
|
r1293 | fp = os.fdopen(infd, 'wb') | ||
fp.write(s) | ||||
fp.close() | ||||
Thomas Arendsen Hein
|
r2165 | outfd, outname = tempfile.mkstemp(prefix='hg-filter-out-') | ||
Bryan O'Sullivan
|
r1293 | os.close(outfd) | ||
cmd = cmd.replace('INFILE', inname) | ||||
cmd = cmd.replace('OUTFILE', outname) | ||||
code = os.system(cmd) | ||||
Jean-Francois PIERONNE
|
r4720 | if sys.platform == 'OpenVMS' and code & 1: | ||
code = 0 | ||||
Matt Mackall
|
r10282 | if code: | ||
raise Abort(_("command '%s' failed: %s") % | ||||
Adrian Buehlmann
|
r14234 | (cmd, explainexit(code))) | ||
Dan Villiom Podlaski Christiansen
|
r13400 | fp = open(outname, 'rb') | ||
r = fp.read() | ||||
fp.close() | ||||
return r | ||||
Bryan O'Sullivan
|
r1293 | finally: | ||
try: | ||||
Matt Mackall
|
r10282 | if inname: | ||
os.unlink(inname) | ||||
Idan Kamara
|
r14004 | except OSError: | ||
Matt Mackall
|
r10282 | pass | ||
Bryan O'Sullivan
|
r1293 | try: | ||
Matt Mackall
|
r10282 | if outname: | ||
os.unlink(outname) | ||||
Idan Kamara
|
r14004 | except OSError: | ||
Matt Mackall
|
r10282 | pass | ||
Bryan O'Sullivan
|
r1293 | |||
filtertable = { | ||||
'tempfile:': tempfilter, | ||||
'pipe:': pipefilter, | ||||
} | ||||
def filter(s, cmd): | ||||
"filter a string through a command that transforms its input to its output" | ||||
for name, fn in filtertable.iteritems(): | ||||
if cmd.startswith(name): | ||||
return fn(s, cmd[len(name):].lstrip()) | ||||
return pipefilter(s, cmd) | ||||
mpm@selenic.com
|
r1015 | def binary(s): | ||
Christian Ebert
|
r6507 | """return true if a string is binary data""" | ||
Martin Geisler
|
r8118 | return bool(s and '\0' in s) | ||
Matt Mackall
|
r6762 | |||
Brendan Cully
|
r7396 | def increasingchunks(source, min=1024, max=65536): | ||
'''return no less than min bytes per chunk while data remains, | ||||
doubling min after each chunk until it reaches max''' | ||||
def log2(x): | ||||
if not x: | ||||
return 0 | ||||
i = 0 | ||||
while x: | ||||
x >>= 1 | ||||
i += 1 | ||||
return i - 1 | ||||
buf = [] | ||||
blen = 0 | ||||
for chunk in source: | ||||
buf.append(chunk) | ||||
blen += len(chunk) | ||||
if blen >= min: | ||||
if min < max: | ||||
min = min << 1 | ||||
nmin = 1 << log2(blen) | ||||
if nmin > min: | ||||
min = nmin | ||||
if min > max: | ||||
min = max | ||||
yield ''.join(buf) | ||||
blen = 0 | ||||
buf = [] | ||||
if buf: | ||||
yield ''.join(buf) | ||||
Matt Mackall
|
r7947 | Abort = error.Abort | ||
mpm@selenic.com
|
r508 | |||
Matt Mackall
|
r10282 | def always(fn): | ||
return True | ||||
def never(fn): | ||||
return False | ||||
Bryan O'Sullivan
|
r724 | |||
Alexis S. L. Carvalho
|
r4229 | def pathto(root, n1, n2): | ||
Bryan O'Sullivan
|
r886 | '''return the relative path from one place to another. | ||
Alexis S. L. Carvalho
|
r4229 | root should use os.sep to separate directories | ||
Alexis S. L. Carvalho
|
r3669 | n1 should use os.sep to separate directories | ||
n2 should use "/" to separate directories | ||||
returns an os.sep-separated path. | ||||
Alexis S. L. Carvalho
|
r4229 | |||
If n1 is a relative path, it's assumed it's | ||||
relative to root. | ||||
n2 should always be relative to root. | ||||
Alexis S. L. Carvalho
|
r3669 | ''' | ||
Matt Mackall
|
r10282 | if not n1: | ||
return localpath(n2) | ||||
Alexis S. L. Carvalho
|
r4230 | if os.path.isabs(n1): | ||
if os.path.splitdrive(root)[0] != os.path.splitdrive(n1)[0]: | ||||
return os.path.join(root, localpath(n2)) | ||||
n2 = '/'.join((pconvert(root), n2)) | ||||
Shun-ichi GOTO
|
r5844 | a, b = splitpath(n1), n2.split('/') | ||
twaldmann@thinkmo.de
|
r1541 | a.reverse() | ||
b.reverse() | ||||
Bryan O'Sullivan
|
r884 | while a and b and a[-1] == b[-1]: | ||
twaldmann@thinkmo.de
|
r1541 | a.pop() | ||
b.pop() | ||||
Bryan O'Sullivan
|
r884 | b.reverse() | ||
Alexis S. L. Carvalho
|
r6111 | return os.sep.join((['..'] * len(a)) + b) or '.' | ||
Bryan O'Sullivan
|
r884 | |||
Thomas Arendsen Hein
|
r5062 | _hgexecutable = None | ||
Adrian Buehlmann
|
r14228 | def mainfrozen(): | ||
"Paul Moore "
|
r6499 | """return True if we are a frozen executable. | ||
The code supports py2exe (most common, Windows only) and tools/freeze | ||||
(portable, not much used). | ||||
""" | ||||
Augie Fackler
|
r14968 | return (safehasattr(sys, "frozen") or # new py2exe | ||
safehasattr(sys, "importers") or # old py2exe | ||||
"Paul Moore "
|
r6499 | imp.is_frozen("__main__")) # tools/freeze | ||
Thomas Arendsen Hein
|
r5062 | def hgexecutable(): | ||
"""return location of the 'hg' executable. | ||||
Defaults to $HG or 'hg' in the search path. | ||||
""" | ||||
if _hgexecutable is None: | ||||
Bryan O'Sullivan
|
r6500 | hg = os.environ.get('HG') | ||
Simon Heimberg
|
r15106 | mainmod = sys.modules['__main__'] | ||
Bryan O'Sullivan
|
r6500 | if hg: | ||
Adrian Buehlmann
|
r14229 | _sethgexecutable(hg) | ||
Adrian Buehlmann
|
r14228 | elif mainfrozen(): | ||
Adrian Buehlmann
|
r14229 | _sethgexecutable(sys.executable) | ||
Simon Heimberg
|
r15106 | elif os.path.basename(getattr(mainmod, '__file__', '')) == 'hg': | ||
_sethgexecutable(mainmod.__file__) | ||||
"Paul Moore "
|
r6499 | else: | ||
Adrian Buehlmann
|
r14271 | exe = findexe('hg') or os.path.basename(sys.argv[0]) | ||
Adrian Buehlmann
|
r14229 | _sethgexecutable(exe) | ||
Thomas Arendsen Hein
|
r5062 | return _hgexecutable | ||
Thomas Arendsen Hein
|
r4686 | |||
Adrian Buehlmann
|
r14229 | def _sethgexecutable(path): | ||
Thomas Arendsen Hein
|
r5062 | """set location of the 'hg' executable""" | ||
Thomas Arendsen Hein
|
r4686 | global _hgexecutable | ||
Thomas Arendsen Hein
|
r5062 | _hgexecutable = path | ||
Thomas Arendsen Hein
|
r4686 | |||
Maxim Khitrov
|
r11469 | def system(cmd, environ={}, cwd=None, onerr=None, errprefix=None, out=None): | ||
Vadim Gelfer
|
r1882 | '''enhanced shell command execution. | ||
run with environment maybe modified, maybe in different dir. | ||||
mpm@selenic.com
|
r508 | |||
Vadim Gelfer
|
r1882 | if command fails and onerr is None, return status. if ui object, | ||
print error message and return status, else raise onerr object as | ||||
Maxim Khitrov
|
r11469 | exception. | ||
if out is specified, it is assumed to be a file-like object that has a | ||||
write() method. stdout and stderr will be redirected to out.''' | ||||
Mads Kiilerich
|
r13439 | try: | ||
sys.stdout.flush() | ||||
except Exception: | ||||
pass | ||||
Vadim Gelfer
|
r2601 | def py2shell(val): | ||
'convert python object into string that is useful to shell' | ||||
Martin Geisler
|
r8534 | if val is None or val is False: | ||
Vadim Gelfer
|
r2601 | return '0' | ||
Martin Geisler
|
r8534 | if val is True: | ||
Vadim Gelfer
|
r2601 | return '1' | ||
return str(val) | ||||
Alexis S. L. Carvalho
|
r3905 | origcmd = cmd | ||
Steve Borho
|
r13188 | cmd = quotecommand(cmd) | ||
Steven Stallion
|
r16383 | if sys.platform == 'plan9': | ||
# subprocess kludge to work around issues in half-baked Python | ||||
# ports, notably bichued/python: | ||||
if not cwd is None: | ||||
os.chdir(cwd) | ||||
rc = os.system(cmd) | ||||
Maxim Khitrov
|
r11469 | else: | ||
Steven Stallion
|
r16383 | env = dict(os.environ) | ||
env.update((k, py2shell(v)) for k, v in environ.iteritems()) | ||||
env['HG'] = hgexecutable() | ||||
if out is None or out == sys.__stdout__: | ||||
rc = subprocess.call(cmd, shell=True, close_fds=closefds, | ||||
env=env, cwd=cwd) | ||||
else: | ||||
proc = subprocess.Popen(cmd, shell=True, close_fds=closefds, | ||||
env=env, cwd=cwd, stdout=subprocess.PIPE, | ||||
stderr=subprocess.STDOUT) | ||||
for line in proc.stdout: | ||||
out.write(line) | ||||
proc.wait() | ||||
rc = proc.returncode | ||||
if sys.platform == 'OpenVMS' and rc & 1: | ||||
rc = 0 | ||||
Mads Kiilerich
|
r9517 | if rc and onerr: | ||
errmsg = '%s %s' % (os.path.basename(origcmd.split(None, 1)[0]), | ||||
Adrian Buehlmann
|
r14234 | explainexit(rc)[0]) | ||
Mads Kiilerich
|
r9517 | if errprefix: | ||
errmsg = '%s: %s' % (errprefix, errmsg) | ||||
try: | ||||
onerr.warn(errmsg + '\n') | ||||
except AttributeError: | ||||
raise onerr(errmsg) | ||||
return rc | ||||
Vadim Gelfer
|
r1880 | |||
Matt Mackall
|
r7388 | def checksignature(func): | ||
'''wrap a function with code to check for calling errors''' | ||||
def check(*args, **kwargs): | ||||
try: | ||||
return func(*args, **kwargs) | ||||
except TypeError: | ||||
if len(traceback.extract_tb(sys.exc_info()[2])) == 1: | ||||
Matt Mackall
|
r7646 | raise error.SignatureError | ||
Matt Mackall
|
r7388 | raise | ||
return check | ||||
Matt Mackall
|
r3629 | def copyfile(src, dest): | ||
Will Maier
|
r7767 | "copy a file, preserving mode and atime/mtime" | ||
Eric St-Jean
|
r4271 | if os.path.islink(src): | ||
try: | ||||
os.unlink(dest) | ||||
Idan Kamara
|
r14004 | except OSError: | ||
Eric St-Jean
|
r4271 | pass | ||
os.symlink(os.readlink(src), dest) | ||||
else: | ||||
try: | ||||
shutil.copyfile(src, dest) | ||||
Brodie Rao
|
r13099 | shutil.copymode(src, dest) | ||
Eric St-Jean
|
r4271 | except shutil.Error, inst: | ||
raise Abort(str(inst)) | ||||
Matt Mackall
|
r3629 | |||
Stephen Darnell
|
r1241 | def copyfiles(src, dst, hardlink=None): | ||
"""Copy a directory tree using hardlinks if possible""" | ||||
if hardlink is None: | ||||
hardlink = (os.stat(src).st_dev == | ||||
os.stat(os.path.dirname(dst)).st_dev) | ||||
Thomas Arendsen Hein
|
r698 | |||
Adrian Buehlmann
|
r11251 | num = 0 | ||
mpm@selenic.com
|
r1207 | if os.path.isdir(src): | ||
os.mkdir(dst) | ||||
Bryan O'Sullivan
|
r5396 | for name, kind in osutil.listdir(src): | ||
mpm@selenic.com
|
r1207 | srcname = os.path.join(src, name) | ||
dstname = os.path.join(dst, name) | ||||
Adrian Buehlmann
|
r11251 | hardlink, n = copyfiles(srcname, dstname, hardlink) | ||
num += n | ||||
mpm@selenic.com
|
r1207 | else: | ||
Stephen Darnell
|
r1241 | if hardlink: | ||
try: | ||||
Adrian Buehlmann
|
r14235 | oslink(src, dst) | ||
Vadim Gelfer
|
r2050 | except (IOError, OSError): | ||
Stephen Darnell
|
r1241 | hardlink = False | ||
Benoit Boissinot
|
r1591 | shutil.copy(src, dst) | ||
Stephen Darnell
|
r1241 | else: | ||
Benoit Boissinot
|
r1591 | shutil.copy(src, dst) | ||
Adrian Buehlmann
|
r11251 | num += 1 | ||
Thomas Arendsen Hein
|
r698 | |||
Adrian Buehlmann
|
r11251 | return hardlink, num | ||
Adrian Buehlmann
|
r11254 | |||
Adrian Buehlmann
|
r14262 | _winreservednames = '''con prn aux nul | ||
Adrian Buehlmann
|
r13916 | com1 com2 com3 com4 com5 com6 com7 com8 com9 | ||
lpt1 lpt2 lpt3 lpt4 lpt5 lpt6 lpt7 lpt8 lpt9'''.split() | ||||
Adrian Buehlmann
|
r14262 | _winreservedchars = ':*?"<>|' | ||
Adrian Buehlmann
|
r13916 | def checkwinfilename(path): | ||
'''Check that the base-relative path is a valid filename on Windows. | ||||
Returns None if the path is ok, or a UI string describing the problem. | ||||
>>> checkwinfilename("just/a/normal/path") | ||||
>>> checkwinfilename("foo/bar/con.xml") | ||||
"filename contains 'con', which is reserved on Windows" | ||||
>>> checkwinfilename("foo/con.xml/bar") | ||||
"filename contains 'con', which is reserved on Windows" | ||||
>>> checkwinfilename("foo/bar/xml.con") | ||||
>>> checkwinfilename("foo/bar/AUX/bla.txt") | ||||
"filename contains 'AUX', which is reserved on Windows" | ||||
>>> checkwinfilename("foo/bar/bla:.txt") | ||||
"filename contains ':', which is reserved on Windows" | ||||
>>> checkwinfilename("foo/bar/b\07la.txt") | ||||
Adrian Buehlmann
|
r13947 | "filename contains '\\\\x07', which is invalid on Windows" | ||
Adrian Buehlmann
|
r13916 | >>> checkwinfilename("foo/bar/bla ") | ||
"filename ends with ' ', which is not allowed on Windows" | ||||
Matt Mackall
|
r15358 | >>> checkwinfilename("../bar") | ||
Adrian Buehlmann
|
r13916 | ''' | ||
for n in path.replace('\\', '/').split('/'): | ||||
if not n: | ||||
continue | ||||
for c in n: | ||||
Adrian Buehlmann
|
r14262 | if c in _winreservedchars: | ||
Adrian Buehlmann
|
r13916 | return _("filename contains '%s', which is reserved " | ||
"on Windows") % c | ||||
if ord(c) <= 31: | ||||
Adrian Buehlmann
|
r13947 | return _("filename contains %r, which is invalid " | ||
Adrian Buehlmann
|
r13916 | "on Windows") % c | ||
base = n.split('.')[0] | ||||
Adrian Buehlmann
|
r14262 | if base and base.lower() in _winreservednames: | ||
Adrian Buehlmann
|
r13916 | return _("filename contains '%s', which is reserved " | ||
"on Windows") % base | ||||
t = n[-1] | ||||
Matt Mackall
|
r15358 | if t in '. ' and n not in '..': | ||
Adrian Buehlmann
|
r13916 | return _("filename ends with '%s', which is not allowed " | ||
"on Windows") % t | ||||
Matt Mackall
|
r7890 | if os.name == 'nt': | ||
Adrian Buehlmann
|
r13916 | checkosfilename = checkwinfilename | ||
Matt Mackall
|
r7890 | else: | ||
Adrian Buehlmann
|
r14926 | checkosfilename = platform.checkosfilename | ||
Matt Mackall
|
r7890 | |||
def makelock(info, pathname): | ||||
try: | ||||
return os.symlink(info, pathname) | ||||
except OSError, why: | ||||
if why.errno == errno.EEXIST: | ||||
raise | ||||
except AttributeError: # no symlink in os | ||||
pass | ||||
Thomas Arendsen Hein
|
r704 | ld = os.open(pathname, os.O_CREAT | os.O_WRONLY | os.O_EXCL) | ||
os.write(ld, info) | ||||
os.close(ld) | ||||
Matt Mackall
|
r7890 | def readlock(pathname): | ||
try: | ||||
return os.readlink(pathname) | ||||
except OSError, why: | ||||
if why.errno not in (errno.EINVAL, errno.ENOSYS): | ||||
raise | ||||
except AttributeError: # no symlink in os | ||||
pass | ||||
Dan Villiom Podlaski Christiansen
|
r13400 | fp = posixfile(pathname) | ||
r = fp.read() | ||||
fp.close() | ||||
return r | ||||
Thomas Arendsen Hein
|
r704 | |||
Vadim Gelfer
|
r2176 | def fstat(fp): | ||
'''stat file object that may not have fileno method.''' | ||||
try: | ||||
return os.fstat(fp.fileno()) | ||||
except AttributeError: | ||||
return os.stat(fp.name) | ||||
Matt Mackall
|
r3784 | # File system features | ||
Matt Mackall
|
r6746 | def checkcase(path): | ||
Matt Mackall
|
r3784 | """ | ||
Check whether the given path is on a case-sensitive filesystem | ||||
Requires a path (like /foo/.hg) ending with a foldable final | ||||
directory component. | ||||
""" | ||||
s1 = os.stat(path) | ||||
d, b = os.path.split(path) | ||||
FUJIWARA Katsunori
|
r15667 | b2 = b.upper() | ||
if b == b2: | ||||
b2 = b.lower() | ||||
if b == b2: | ||||
return True # no evidence against case sensitivity | ||||
p2 = os.path.join(d, b2) | ||||
Matt Mackall
|
r3784 | try: | ||
s2 = os.stat(p2) | ||||
if s2 == s1: | ||||
return False | ||||
return True | ||||
Idan Kamara
|
r14004 | except OSError: | ||
Matt Mackall
|
r3784 | return True | ||
Bryan O'Sullivan
|
r16943 | try: | ||
import re2 | ||||
_re2 = None | ||||
except ImportError: | ||||
_re2 = False | ||||
def compilere(pat): | ||||
'''Compile a regular expression, using re2 if possible | ||||
For best performance, use only re2-compatible regexp features.''' | ||||
global _re2 | ||||
if _re2 is None: | ||||
try: | ||||
re2.compile | ||||
_re2 = True | ||||
except ImportError: | ||||
_re2 = False | ||||
if _re2: | ||||
try: | ||||
return re2.compile(pat) | ||||
except re2.error: | ||||
pass | ||||
return re.compile(pat) | ||||
Paul Moore
|
r6676 | _fspathcache = {} | ||
def fspath(name, root): | ||||
'''Get name in the case stored in the filesystem | ||||
FUJIWARA Katsunori
|
r15710 | The name should be relative to root, and be normcase-ed for efficiency. | ||
Note that this function is unnecessary, and should not be | ||||
Paul Moore
|
r6676 | called, for case-sensitive filesystems (simply because it's expensive). | ||
FUJIWARA Katsunori
|
r15670 | |||
FUJIWARA Katsunori
|
r15710 | The root should be normcase-ed, too. | ||
Paul Moore
|
r6676 | ''' | ||
FUJIWARA Katsunori
|
r15709 | def find(p, contents): | ||
for n in contents: | ||||
FUJIWARA Katsunori
|
r15718 | if normcase(n) == p: | ||
FUJIWARA Katsunori
|
r15709 | return n | ||
return None | ||||
Paul Moore
|
r6676 | seps = os.sep | ||
if os.altsep: | ||||
seps = seps + os.altsep | ||||
# Protect backslashes. This gets silly very quickly. | ||||
seps.replace('\\','\\\\') | ||||
pattern = re.compile(r'([^%s]+)|([%s]+)' % (seps, seps)) | ||||
FUJIWARA Katsunori
|
r15669 | dir = os.path.normpath(root) | ||
Paul Moore
|
r6676 | result = [] | ||
for part, sep in pattern.findall(name): | ||||
if sep: | ||||
result.append(sep) | ||||
continue | ||||
FUJIWARA Katsunori
|
r15719 | if dir not in _fspathcache: | ||
_fspathcache[dir] = os.listdir(dir) | ||||
contents = _fspathcache[dir] | ||||
Paul Moore
|
r6676 | |||
FUJIWARA Katsunori
|
r15709 | found = find(part, contents) | ||
if not found: | ||||
FUJIWARA Katsunori
|
r15720 | # retry "once per directory" per "dirstate.walk" which | ||
# may take place for each patches of "hg qpush", for example | ||||
FUJIWARA Katsunori
|
r15709 | contents = os.listdir(dir) | ||
_fspathcache[dir] = contents | ||||
found = find(part, contents) | ||||
result.append(found or part) | ||||
FUJIWARA Katsunori
|
r15669 | dir = os.path.join(dir, part) | ||
Paul Moore
|
r6676 | |||
return ''.join(result) | ||||
Adrian Buehlmann
|
r12938 | def checknlink(testfile): | ||
'''check whether hardlink count reporting works properly''' | ||||
Adrian Buehlmann
|
r13204 | # testfile may be open, so we need a separate file for checking to | ||
# work around issue2543 (or testfile may get lost on Samba shares) | ||||
f1 = testfile + ".hgtmp1" | ||||
if os.path.lexists(f1): | ||||
return False | ||||
Adrian Buehlmann
|
r12938 | try: | ||
Adrian Buehlmann
|
r13204 | posixfile(f1, 'w').close() | ||
except IOError: | ||||
Adrian Buehlmann
|
r12938 | return False | ||
Adrian Buehlmann
|
r13204 | f2 = testfile + ".hgtmp2" | ||
fd = None | ||||
Adrian Buehlmann
|
r12938 | try: | ||
Adrian Buehlmann
|
r13204 | try: | ||
Adrian Buehlmann
|
r14235 | oslink(f1, f2) | ||
Adrian Buehlmann
|
r13204 | except OSError: | ||
return False | ||||
Adrian Buehlmann
|
r12938 | # nlinks() may behave differently for files on Windows shares if | ||
# the file is open. | ||||
Adrian Buehlmann
|
r13342 | fd = posixfile(f2) | ||
Adrian Buehlmann
|
r13204 | return nlinks(f2) > 1 | ||
Adrian Buehlmann
|
r12938 | finally: | ||
Adrian Buehlmann
|
r13204 | if fd is not None: | ||
fd.close() | ||||
for f in (f1, f2): | ||||
try: | ||||
os.unlink(f) | ||||
except OSError: | ||||
pass | ||||
Adrian Buehlmann
|
r12938 | |||
return False | ||||
Shun-ichi GOTO
|
r5843 | def endswithsep(path): | ||
'''Check path ends with os.sep or os.altsep.''' | ||||
return path.endswith(os.sep) or os.altsep and path.endswith(os.altsep) | ||||
Shun-ichi GOTO
|
r5844 | def splitpath(path): | ||
'''Split path by os.sep. | ||||
Note that this function does not use os.altsep because this is | ||||
an alternative of simple "xxx.split(os.sep)". | ||||
It is recommended to use os.path.normpath() before using this | ||||
function if need.''' | ||||
return path.split(os.sep) | ||||
Matt Mackall
|
r6007 | def gui(): | ||
'''Are we running in a GUI?''' | ||||
Dan Villiom Podlaski Christiansen
|
r13734 | if sys.platform == 'darwin': | ||
if 'SSH_CONNECTION' in os.environ: | ||||
# handle SSH access to a box where the user is logged in | ||||
return False | ||||
elif getattr(osutil, 'isgui', None): | ||||
# check if a CoreGraphics session is available | ||||
return osutil.isgui() | ||||
else: | ||||
# pure build; use a safe default | ||||
return True | ||||
else: | ||||
return os.name == "nt" or os.environ.get("DISPLAY") | ||||
Matt Mackall
|
r6007 | |||
Alexis S. L. Carvalho
|
r6062 | def mktempcopy(name, emptyok=False, createmode=None): | ||
Alexis S. L. Carvalho
|
r4827 | """Create a temporary file with the same contents from name | ||
The permission bits are copied from the original file. | ||||
If the temporary file is going to be truncated immediately, you | ||||
can use emptyok=True as an optimization. | ||||
Returns the name of the temporary file. | ||||
Vadim Gelfer
|
r2176 | """ | ||
Alexis S. L. Carvalho
|
r4827 | d, fn = os.path.split(name) | ||
fd, temp = tempfile.mkstemp(prefix='.%s-' % fn, dir=d) | ||||
os.close(fd) | ||||
# Temporary files are created with mode 0600, which is usually not | ||||
# what we want. If the original file already exists, just copy | ||||
# its mode. Otherwise, manually obey umask. | ||||
Adrian Buehlmann
|
r15010 | copymode(name, temp, createmode) | ||
Alexis S. L. Carvalho
|
r4827 | if emptyok: | ||
return temp | ||||
try: | ||||
try: | ||||
ifp = posixfile(name, "rb") | ||||
except IOError, inst: | ||||
if inst.errno == errno.ENOENT: | ||||
return temp | ||||
if not getattr(inst, 'filename', None): | ||||
inst.filename = name | ||||
raise | ||||
ofp = posixfile(temp, "wb") | ||||
for chunk in filechunkiter(ifp): | ||||
ofp.write(chunk) | ||||
ifp.close() | ||||
ofp.close() | ||||
Brodie Rao
|
r16705 | except: # re-raises | ||
Alexis S. L. Carvalho
|
r4827 | try: os.unlink(temp) | ||
Brodie Rao
|
r16703 | except OSError: pass | ||
Alexis S. L. Carvalho
|
r4827 | raise | ||
return temp | ||||
Vadim Gelfer
|
r2176 | |||
Benoit Boissinot
|
r8778 | class atomictempfile(object): | ||
Mads Kiilerich
|
r17424 | '''writable file object that atomically updates a file | ||
Alexis S. L. Carvalho
|
r4827 | |||
Greg Ward
|
r14008 | All writes will go to a temporary copy of the original file. Call | ||
Greg Ward
|
r15057 | close() when you are done writing, and atomictempfile will rename | ||
the temporary copy to the original name, making the changes | ||||
visible. If the object is destroyed without being closed, all your | ||||
writes are discarded. | ||||
Greg Ward
|
r14008 | ''' | ||
Yuya Nishihara
|
r11212 | def __init__(self, name, mode='w+b', createmode=None): | ||
Greg Ward
|
r14007 | self.__name = name # permanent name | ||
self._tempname = mktempcopy(name, emptyok=('w' in mode), | ||||
createmode=createmode) | ||||
self._fp = posixfile(self._tempname, mode) | ||||
Bryan O'Sullivan
|
r8327 | |||
Greg Ward
|
r14007 | # delegated methods | ||
self.write = self._fp.write | ||||
Bryan O'Sullivan
|
r17237 | self.seek = self._fp.seek | ||
self.tell = self._fp.tell | ||||
Greg Ward
|
r14007 | self.fileno = self._fp.fileno | ||
Alexis S. L. Carvalho
|
r4827 | |||
Greg Ward
|
r15057 | def close(self): | ||
Benoit Boissinot
|
r8785 | if not self._fp.closed: | ||
Bryan O'Sullivan
|
r8327 | self._fp.close() | ||
Greg Ward
|
r14007 | rename(self._tempname, localpath(self.__name)) | ||
Alexis S. L. Carvalho
|
r4827 | |||
Greg Ward
|
r15057 | def discard(self): | ||
Benoit Boissinot
|
r8785 | if not self._fp.closed: | ||
Alexis S. L. Carvalho
|
r4827 | try: | ||
Greg Ward
|
r14007 | os.unlink(self._tempname) | ||
except OSError: | ||||
pass | ||||
Bryan O'Sullivan
|
r8327 | self._fp.close() | ||
Alexis S. L. Carvalho
|
r4827 | |||
Dan Villiom Podlaski Christiansen
|
r13098 | def __del__(self): | ||
Augie Fackler
|
r14968 | if safehasattr(self, '_fp'): # constructor actually did something | ||
Greg Ward
|
r15057 | self.discard() | ||
Dan Villiom Podlaski Christiansen
|
r13098 | |||
Alexis S. L. Carvalho
|
r6062 | def makedirs(name, mode=None): | ||
"""recursive directory creation with parent mode inheritance""" | ||||
try: | ||||
os.mkdir(name) | ||||
except OSError, err: | ||||
if err.errno == errno.EEXIST: | ||||
return | ||||
Adrian Buehlmann
|
r15058 | if err.errno != errno.ENOENT or not name: | ||
raise | ||||
parent = os.path.dirname(os.path.abspath(name)) | ||||
if parent == name: | ||||
Alexis S. L. Carvalho
|
r6062 | raise | ||
Mads Kiilerich
|
r15049 | makedirs(parent, mode) | ||
Mads Kiilerich
|
r15050 | os.mkdir(name) | ||
Mads Kiilerich
|
r15049 | if mode is not None: | ||
os.chmod(name, mode) | ||||
Alexis S. L. Carvalho
|
r6062 | |||
Dan Villiom Podlaski Christiansen
|
r14099 | def readfile(path): | ||
Patrick Mezard
|
r14250 | fp = open(path, 'rb') | ||
Dan Villiom Podlaski Christiansen
|
r14099 | try: | ||
Matt Mackall
|
r14100 | return fp.read() | ||
Dan Villiom Podlaski Christiansen
|
r14099 | finally: | ||
fp.close() | ||||
Dan Villiom Podlaski Christiansen
|
r14167 | def writefile(path, text): | ||
fp = open(path, 'wb') | ||||
try: | ||||
fp.write(text) | ||||
finally: | ||||
fp.close() | ||||
def appendfile(path, text): | ||||
fp = open(path, 'ab') | ||||
Dan Villiom Podlaski Christiansen
|
r14099 | try: | ||
fp.write(text) | ||||
finally: | ||||
fp.close() | ||||
Eric Hopper
|
r1199 | class chunkbuffer(object): | ||
"""Allow arbitrary sized chunks of data to be efficiently read from an | ||||
iterator over chunks of arbitrary size.""" | ||||
Bryan O'Sullivan
|
r1200 | |||
Matt Mackall
|
r5446 | def __init__(self, in_iter): | ||
Eric Hopper
|
r1199 | """in_iter is the iterator that's iterating over the input chunks. | ||
targetsize is how big a buffer to try to maintain.""" | ||||
Benoit Boissinot
|
r11670 | def splitbig(chunks): | ||
for chunk in chunks: | ||||
if len(chunk) > 2**20: | ||||
pos = 0 | ||||
while pos < len(chunk): | ||||
end = pos + 2 ** 18 | ||||
yield chunk[pos:end] | ||||
pos = end | ||||
else: | ||||
yield chunk | ||||
self.iter = splitbig(in_iter) | ||||
Bryan O'Sullivan
|
r16873 | self._queue = deque() | ||
Bryan O'Sullivan
|
r1200 | |||
Eric Hopper
|
r1199 | def read(self, l): | ||
Bryan O'Sullivan
|
r1200 | """Read L bytes of data from the iterator of chunks of data. | ||
Thomas Arendsen Hein
|
r1308 | Returns less than L bytes if the iterator runs dry.""" | ||
Matt Mackall
|
r11758 | left = l | ||
buf = '' | ||||
Bryan O'Sullivan
|
r16873 | queue = self._queue | ||
Matt Mackall
|
r11758 | while left > 0: | ||
# refill the queue | ||||
if not queue: | ||||
target = 2**18 | ||||
for chunk in self.iter: | ||||
queue.append(chunk) | ||||
target -= len(chunk) | ||||
if target <= 0: | ||||
break | ||||
if not queue: | ||||
Eric Hopper
|
r1199 | break | ||
Matt Mackall
|
r11758 | |||
Bryan O'Sullivan
|
r16803 | chunk = queue.popleft() | ||
Matt Mackall
|
r11758 | left -= len(chunk) | ||
if left < 0: | ||||
Bryan O'Sullivan
|
r16803 | queue.appendleft(chunk[left:]) | ||
Matt Mackall
|
r11758 | buf += chunk[:left] | ||
else: | ||||
buf += chunk | ||||
return buf | ||||
Vadim Gelfer
|
r2462 | def filechunkiter(f, size=65536, limit=None): | ||
"""Create a generator that produces the data in the file size | ||||
(default 65536) bytes at a time, up to optional limit (default is | ||||
to read all data). Chunks may be less than size bytes if the | ||||
chunk is the last chunk in the file, or the file is a socket or | ||||
some other type of file that sometimes reads less data than is | ||||
requested.""" | ||||
assert size >= 0 | ||||
assert limit is None or limit >= 0 | ||||
while True: | ||||
Matt Mackall
|
r10282 | if limit is None: | ||
nbytes = size | ||||
else: | ||||
nbytes = min(limit, size) | ||||
Vadim Gelfer
|
r2462 | s = nbytes and f.read(nbytes) | ||
Matt Mackall
|
r10282 | if not s: | ||
break | ||||
if limit: | ||||
limit -= len(s) | ||||
Eric Hopper
|
r1199 | yield s | ||
Bryan O'Sullivan
|
r1320 | |||
Bryan O'Sullivan
|
r1321 | def makedate(): | ||
Dmitry Panov
|
r15505 | ct = time.time() | ||
if ct < 0: | ||||
Adrian Buehlmann
|
r13063 | hint = _("check your clock") | ||
Dmitry Panov
|
r15505 | raise Abort(_("negative timestamp: %d") % ct, hint=hint) | ||
delta = (datetime.datetime.utcfromtimestamp(ct) - | ||||
datetime.datetime.fromtimestamp(ct)) | ||||
tz = delta.days * 86400 + delta.seconds | ||||
return ct, tz | ||||
Bryan O'Sullivan
|
r1329 | |||
Matt Mackall
|
r6229 | def datestr(date=None, format='%a %b %d %H:%M:%S %Y %1%2'): | ||
Bryan O'Sullivan
|
r1321 | """represent a (unixtime, offset) tuple as a localized time. | ||
unixtime is seconds since the epoch, and offset is the time zone's | ||||
Vadim Gelfer
|
r1987 | number of seconds away from UTC. if timezone is false, do not | ||
append time zone to string.""" | ||||
Bryan O'Sullivan
|
r1321 | t, tz = date or makedate() | ||
Adrian Buehlmann
|
r13039 | if t < 0: | ||
t = 0 # time.gmtime(lt) fails on Windows for lt < -43200 | ||||
tz = 0 | ||||
Matt Mackall
|
r6229 | if "%1" in format or "%2" in format: | ||
sign = (tz > 0) and "-" or "+" | ||||
Alejandro Santos
|
r9029 | minutes = abs(tz) // 60 | ||
format = format.replace("%1", "%c%02d" % (sign, minutes // 60)) | ||||
Matt Mackall
|
r6229 | format = format.replace("%2", "%02d" % (minutes % 60)) | ||
Kevin Gessner
|
r15157 | try: | ||
t = time.gmtime(float(t) - tz) | ||||
except ValueError: | ||||
# time was out of range | ||||
t = time.gmtime(sys.maxint) | ||||
s = time.strftime(format, t) | ||||
Vadim Gelfer
|
r1987 | return s | ||
Vadim Gelfer
|
r1829 | |||
Thomas Arendsen Hein
|
r6134 | def shortdate(date=None): | ||
"""turn (timestamp, tzoff) tuple into iso 8631 date.""" | ||||
Matt Mackall
|
r6229 | return datestr(date, format='%Y-%m-%d') | ||
Thomas Arendsen Hein
|
r6134 | |||
Bryan O'Sullivan
|
r5357 | def strdate(string, format, defaults=[]): | ||
Jose M. Prieto
|
r2522 | """parse a localized time string and return a (unixtime, offset) tuple. | ||
if the string cannot be parsed, ValueError is raised.""" | ||||
Matt Mackall
|
r3809 | def timezone(string): | ||
tz = string.split()[-1] | ||||
if tz[0] in "+-" and len(tz) == 5 and tz[1:].isdigit(): | ||||
Matt Mackall
|
r6229 | sign = (tz[0] == "+") and 1 or -1 | ||
hours = int(tz[1:3]) | ||||
minutes = int(tz[3:5]) | ||||
return -sign * (hours * 60 + minutes) * 60 | ||||
Matt Mackall
|
r12401 | if tz == "GMT" or tz == "UTC": | ||
Matt Mackall
|
r3809 | return 0 | ||
return None | ||||
Jose M. Prieto
|
r2522 | |||
Jose M. Prieto
|
r3255 | # NOTE: unixtime = localunixtime + offset | ||
Matt Mackall
|
r3809 | offset, date = timezone(string), string | ||
Martin Geisler
|
r13031 | if offset is not None: | ||
Matt Mackall
|
r3809 | date = " ".join(string.split()[:-1]) | ||
Matt Mackall
|
r3808 | |||
Matt Mackall
|
r3812 | # add missing elements from defaults | ||
Matt Mackall
|
r13212 | usenow = False # default to using biased defaults | ||
for part in ("S", "M", "HI", "d", "mb", "yY"): # decreasing specificity | ||||
Matt Mackall
|
r3812 | found = [True for p in part if ("%"+p) in format] | ||
if not found: | ||||
Matt Mackall
|
r13212 | date += "@" + defaults[part][usenow] | ||
Matt Mackall
|
r3812 | format += "@%" + part[0] | ||
Matt Mackall
|
r13212 | else: | ||
# We've found a specific time element, less specific time | ||||
# elements are relative to today | ||||
usenow = True | ||||
Matt Mackall
|
r3808 | |||
Jose M. Prieto
|
r3256 | timetuple = time.strptime(date, format) | ||
localunixtime = int(calendar.timegm(timetuple)) | ||||
if offset is None: | ||||
# local timezone | ||||
unixtime = int(time.mktime(timetuple)) | ||||
offset = unixtime - localunixtime | ||||
else: | ||||
unixtime = localunixtime + offset | ||||
Jose M. Prieto
|
r3255 | return unixtime, offset | ||
Jose M. Prieto
|
r2522 | |||
Matt Mackall
|
r13212 | def parsedate(date, formats=None, bias={}): | ||
"""parse a localized date/time and return a (unixtime, offset) tuple. | ||||
Thomas Arendsen Hein
|
r6139 | |||
Jose M. Prieto
|
r2522 | The date may be a "unixtime offset" string or in one of the specified | ||
Thomas Arendsen Hein
|
r6139 | formats. If the date already is a (unixtime, offset) tuple, it is returned. | ||
""" | ||||
if not date: | ||||
Matt Mackall
|
r3807 | return 0, 0 | ||
Matt Mackall
|
r6230 | if isinstance(date, tuple) and len(date) == 2: | ||
Thomas Arendsen Hein
|
r6139 | return date | ||
Chris Mason
|
r2609 | if not formats: | ||
formats = defaultdateformats | ||||
Thomas Arendsen Hein
|
r6139 | date = date.strip() | ||
Jose M. Prieto
|
r2522 | try: | ||
Thomas Arendsen Hein
|
r6139 | when, offset = map(int, date.split(' ')) | ||
Benoit Boissinot
|
r2523 | except ValueError: | ||
Matt Mackall
|
r3812 | # fill out defaults | ||
now = makedate() | ||||
Matt Mackall
|
r13212 | defaults = {} | ||
David Soria Parra
|
r13200 | for part in ("d", "mb", "yY", "HI", "M", "S"): | ||
Matt Mackall
|
r13212 | # this piece is for rounding the specific end of unknowns | ||
b = bias.get(part) | ||||
if b is None: | ||||
Matt Mackall
|
r3812 | if part[0] in "HMS": | ||
Matt Mackall
|
r13212 | b = "00" | ||
Matt Mackall
|
r3812 | else: | ||
Matt Mackall
|
r13212 | b = "0" | ||
# this piece is for matching the generic end to today's date | ||||
n = datestr(now, "%" + part[0]) | ||||
defaults[part] = (b, n) | ||||
Matt Mackall
|
r3812 | |||
Benoit Boissinot
|
r2523 | for format in formats: | ||
try: | ||||
Thomas Arendsen Hein
|
r6139 | when, offset = strdate(date, format, defaults) | ||
Dirkjan Ochtman
|
r6087 | except (ValueError, OverflowError): | ||
Benoit Boissinot
|
r2523 | pass | ||
else: | ||||
break | ||||
else: | ||||
Nicolas Dumazet
|
r12105 | raise Abort(_('invalid date: %r') % date) | ||
Benoit Boissinot
|
r2523 | # validate explicit (probably user-specified) date and | ||
# time zone offset. values must fit in signed 32 bits for | ||||
# current 32-bit linux runtimes. timezones go from UTC-12 | ||||
# to UTC+14 | ||||
if abs(when) > 0x7fffffff: | ||||
Matt Mackall
|
r3806 | raise Abort(_('date exceeds 32 bits: %d') % when) | ||
Adrian Buehlmann
|
r13062 | if when < 0: | ||
raise Abort(_('negative date value: %d') % when) | ||||
Benoit Boissinot
|
r2523 | if offset < -50400 or offset > 43200: | ||
Matt Mackall
|
r3806 | raise Abort(_('impossible time zone offset: %d') % offset) | ||
Benoit Boissinot
|
r2523 | return when, offset | ||
Jose M. Prieto
|
r2522 | |||
Matt Mackall
|
r3812 | def matchdate(date): | ||
"""Return a function that matches a given date match specifier | ||||
Formats include: | ||||
'{date}' match a given date to the accuracy provided | ||||
'<{date}' on or before a given date | ||||
'>{date}' on or after a given date | ||||
Matt Mackall
|
r13212 | >>> p1 = parsedate("10:29:59") | ||
>>> p2 = parsedate("10:30:00") | ||||
>>> p3 = parsedate("10:30:59") | ||||
>>> p4 = parsedate("10:31:00") | ||||
>>> p5 = parsedate("Sep 15 10:30:00 1999") | ||||
>>> f = matchdate("10:30") | ||||
>>> f(p1[0]) | ||||
False | ||||
>>> f(p2[0]) | ||||
True | ||||
>>> f(p3[0]) | ||||
True | ||||
>>> f(p4[0]) | ||||
False | ||||
>>> f(p5[0]) | ||||
False | ||||
Matt Mackall
|
r3812 | """ | ||
def lower(date): | ||||
Matt Mackall
|
r6230 | d = dict(mb="1", d="1") | ||
return parsedate(date, extendeddateformats, d)[0] | ||||
Matt Mackall
|
r3812 | |||
def upper(date): | ||||
d = dict(mb="12", HI="23", M="59", S="59") | ||||
David Soria Parra
|
r13200 | for days in ("31", "30", "29"): | ||
Matt Mackall
|
r3812 | try: | ||
d["d"] = days | ||||
return parsedate(date, extendeddateformats, d)[0] | ||||
Brodie Rao
|
r16688 | except Abort: | ||
Matt Mackall
|
r3812 | pass | ||
d["d"] = "28" | ||||
return parsedate(date, extendeddateformats, d)[0] | ||||
Justin Peng
|
r7953 | date = date.strip() | ||
Idan Kamara
|
r13780 | |||
if not date: | ||||
raise Abort(_("dates cannot consist entirely of whitespace")) | ||||
elif date[0] == "<": | ||||
Matt Mackall
|
r13869 | if not date[1:]: | ||
Martin Geisler
|
r13886 | raise Abort(_("invalid day spec, use '<DATE'")) | ||
Matt Mackall
|
r3812 | when = upper(date[1:]) | ||
return lambda x: x <= when | ||||
elif date[0] == ">": | ||||
Matt Mackall
|
r13869 | if not date[1:]: | ||
Martin Geisler
|
r13886 | raise Abort(_("invalid day spec, use '>DATE'")) | ||
Matt Mackall
|
r3812 | when = lower(date[1:]) | ||
return lambda x: x >= when | ||||
elif date[0] == "-": | ||||
try: | ||||
days = int(date[1:]) | ||||
except ValueError: | ||||
raise Abort(_("invalid day spec: %s") % date[1:]) | ||||
Yun Lee
|
r13889 | if days < 0: | ||
raise Abort(_("%s must be nonnegative (see 'hg help dates')") | ||||
% date[1:]) | ||||
Matt Mackall
|
r3812 | when = makedate()[0] - days * 3600 * 24 | ||
Matt Mackall
|
r3813 | return lambda x: x >= when | ||
Matt Mackall
|
r3812 | elif " to " in date: | ||
a, b = date.split(" to ") | ||||
start, stop = lower(a), upper(b) | ||||
return lambda x: x >= start and x <= stop | ||||
else: | ||||
start, stop = lower(date), upper(date) | ||||
return lambda x: x >= start and x <= stop | ||||
Vadim Gelfer
|
r1903 | def shortuser(user): | ||
"""Return a short representation of a user name or email address.""" | ||||
f = user.find('@') | ||||
if f >= 0: | ||||
user = user[:f] | ||||
f = user.find('<') | ||||
if f >= 0: | ||||
Matt Mackall
|
r10282 | user = user[f + 1:] | ||
Thomas Arendsen Hein
|
r3176 | f = user.find(' ') | ||
if f >= 0: | ||||
user = user[:f] | ||||
Matt Mackall
|
r3533 | f = user.find('.') | ||
if f >= 0: | ||||
user = user[:f] | ||||
Vadim Gelfer
|
r1903 | return user | ||
Vadim Gelfer
|
r1920 | |||
Matteo Capobianco
|
r16360 | def emailuser(user): | ||
"""Return the user portion of an email address.""" | ||||
f = user.find('@') | ||||
if f >= 0: | ||||
user = user[:f] | ||||
f = user.find('<') | ||||
if f >= 0: | ||||
user = user[f + 1:] | ||||
return user | ||||
Matt Mackall
|
r5975 | def email(author): | ||
'''get email of author.''' | ||||
r = author.find('>') | ||||
Matt Mackall
|
r10282 | if r == -1: | ||
r = None | ||||
return author[author.find('<') + 1:r] | ||||
Matt Mackall
|
r5975 | |||
Yuya Nishihara
|
r13225 | def _ellipsis(text, maxlength): | ||
if len(text) <= maxlength: | ||||
return text, False | ||||
else: | ||||
return "%s..." % (text[:maxlength - 3]), True | ||||
Thomas Arendsen Hein
|
r3767 | def ellipsis(text, maxlength=400): | ||
"""Trim string to at most maxlength (default: 400) characters.""" | ||||
Yuya Nishihara
|
r13225 | try: | ||
# use unicode not to split at intermediate multi-byte sequence | ||||
utext, truncated = _ellipsis(text.decode(encoding.encoding), | ||||
maxlength) | ||||
if not truncated: | ||||
return text | ||||
return utext.encode(encoding.encoding) | ||||
except (UnicodeDecodeError, UnicodeEncodeError): | ||||
return _ellipsis(text, maxlength)[0] | ||||
Thomas Arendsen Hein
|
r3767 | |||
Matt Mackall
|
r16397 | _byteunits = ( | ||
(100, 1 << 30, _('%.0f GB')), | ||||
(10, 1 << 30, _('%.1f GB')), | ||||
(1, 1 << 30, _('%.2f GB')), | ||||
(100, 1 << 20, _('%.0f MB')), | ||||
(10, 1 << 20, _('%.1f MB')), | ||||
(1, 1 << 20, _('%.2f MB')), | ||||
(100, 1 << 10, _('%.0f KB')), | ||||
(10, 1 << 10, _('%.1f KB')), | ||||
(1, 1 << 10, _('%.2f KB')), | ||||
(1, 1, _('%.0f bytes')), | ||||
) | ||||
Vadim Gelfer
|
r2612 | def bytecount(nbytes): | ||
'''return byte count formatted as readable string, with units''' | ||||
Matt Mackall
|
r16397 | for multiplier, divisor, format in _byteunits: | ||
Vadim Gelfer
|
r2612 | if nbytes >= divisor * multiplier: | ||
return format % (nbytes / float(divisor)) | ||||
Augie Fackler
|
r16768 | return _byteunits[-1][2] % nbytes | ||
Vadim Gelfer
|
r2740 | |||
Patrick Mezard
|
r5291 | def uirepr(s): | ||
# Avoid double backslash in Windows path repr() | ||||
return repr(s).replace('\\\\', '\\') | ||||
Alexander Solovyov
|
r7547 | |||
Matt Mackall
|
r13316 | # delay import of textwrap | ||
def MBTextWrapper(**kwargs): | ||||
class tw(textwrap.TextWrapper): | ||||
""" | ||||
FUJIWARA Katsunori
|
r15066 | Extend TextWrapper for width-awareness. | ||
Neither number of 'bytes' in any encoding nor 'characters' is | ||||
appropriate to calculate terminal columns for specified string. | ||||
Nicolas Dumazet
|
r12957 | |||
FUJIWARA Katsunori
|
r15066 | Original TextWrapper implementation uses built-in 'len()' directly, | ||
so overriding is needed to use width information of each characters. | ||||
Nicolas Dumazet
|
r12957 | |||
FUJIWARA Katsunori
|
r15066 | In addition, characters classified into 'ambiguous' width are | ||
Mads Kiilerich
|
r17424 | treated as wide in East Asian area, but as narrow in other. | ||
FUJIWARA Katsunori
|
r15066 | |||
This requires use decision to determine width of such characters. | ||||
Matt Mackall
|
r13316 | """ | ||
def __init__(self, **kwargs): | ||||
textwrap.TextWrapper.__init__(self, **kwargs) | ||||
FUJIWARA Katsunori
|
r11297 | |||
FUJIWARA Katsunori
|
r15066 | # for compatibility between 2.4 and 2.6 | ||
if getattr(self, 'drop_whitespace', None) is None: | ||||
self.drop_whitespace = kwargs.get('drop_whitespace', True) | ||||
Mads Kiilerich
|
r15065 | def _cutdown(self, ucstr, space_left): | ||
Matt Mackall
|
r13316 | l = 0 | ||
FUJIWARA Katsunori
|
r15066 | colwidth = encoding.ucolwidth | ||
Matt Mackall
|
r13316 | for i in xrange(len(ucstr)): | ||
FUJIWARA Katsunori
|
r15066 | l += colwidth(ucstr[i]) | ||
Matt Mackall
|
r13316 | if space_left < l: | ||
Mads Kiilerich
|
r15065 | return (ucstr[:i], ucstr[i:]) | ||
return ucstr, '' | ||||
FUJIWARA Katsunori
|
r11297 | |||
Matt Mackall
|
r13316 | # overriding of base class | ||
def _handle_long_word(self, reversed_chunks, cur_line, cur_len, width): | ||||
space_left = max(width - cur_len, 1) | ||||
FUJIWARA Katsunori
|
r11297 | |||
Matt Mackall
|
r13316 | if self.break_long_words: | ||
cut, res = self._cutdown(reversed_chunks[-1], space_left) | ||||
cur_line.append(cut) | ||||
reversed_chunks[-1] = res | ||||
elif not cur_line: | ||||
cur_line.append(reversed_chunks.pop()) | ||||
FUJIWARA Katsunori
|
r11297 | |||
FUJIWARA Katsunori
|
r15066 | # this overriding code is imported from TextWrapper of python 2.6 | ||
# to calculate columns of string by 'encoding.ucolwidth()' | ||||
def _wrap_chunks(self, chunks): | ||||
colwidth = encoding.ucolwidth | ||||
lines = [] | ||||
if self.width <= 0: | ||||
raise ValueError("invalid width %r (must be > 0)" % self.width) | ||||
# Arrange in reverse order so items can be efficiently popped | ||||
# from a stack of chucks. | ||||
chunks.reverse() | ||||
while chunks: | ||||
# Start the list of chunks that will make up the current line. | ||||
# cur_len is just the length of all the chunks in cur_line. | ||||
cur_line = [] | ||||
cur_len = 0 | ||||
# Figure out which static string will prefix this line. | ||||
if lines: | ||||
indent = self.subsequent_indent | ||||
else: | ||||
indent = self.initial_indent | ||||
# Maximum width for this line. | ||||
width = self.width - len(indent) | ||||
# First chunk on line is whitespace -- drop it, unless this | ||||
Mads Kiilerich
|
r17424 | # is the very beginning of the text (i.e. no lines started yet). | ||
FUJIWARA Katsunori
|
r15066 | if self.drop_whitespace and chunks[-1].strip() == '' and lines: | ||
del chunks[-1] | ||||
while chunks: | ||||
l = colwidth(chunks[-1]) | ||||
# Can at least squeeze this chunk onto the current line. | ||||
if cur_len + l <= width: | ||||
cur_line.append(chunks.pop()) | ||||
cur_len += l | ||||
# Nope, this line is full. | ||||
else: | ||||
break | ||||
# The current line is full, and the next chunk is too big to | ||||
# fit on *any* line (not just this one). | ||||
if chunks and colwidth(chunks[-1]) > width: | ||||
self._handle_long_word(chunks, cur_line, cur_len, width) | ||||
# If the last chunk on this line is all whitespace, drop it. | ||||
if (self.drop_whitespace and | ||||
cur_line and cur_line[-1].strip() == ''): | ||||
del cur_line[-1] | ||||
# Convert current line back to a string and store it in list | ||||
# of all lines (return value). | ||||
if cur_line: | ||||
lines.append(indent + ''.join(cur_line)) | ||||
return lines | ||||
Matt Mackall
|
r13316 | global MBTextWrapper | ||
MBTextWrapper = tw | ||||
return tw(**kwargs) | ||||
FUJIWARA Katsunori
|
r11297 | |||
Matt Mackall
|
r12698 | def wrap(line, width, initindent='', hangindent=''): | ||
FUJIWARA Katsunori
|
r11297 | maxindent = max(len(hangindent), len(initindent)) | ||
if width <= maxindent: | ||||
Martin Geisler
|
r9417 | # adjust for weird terminal size | ||
FUJIWARA Katsunori
|
r11297 | width = max(78, maxindent + 1) | ||
Mads Kiilerich
|
r15065 | line = line.decode(encoding.encoding, encoding.encodingmode) | ||
initindent = initindent.decode(encoding.encoding, encoding.encodingmode) | ||||
hangindent = hangindent.decode(encoding.encoding, encoding.encodingmode) | ||||
FUJIWARA Katsunori
|
r11297 | wrapper = MBTextWrapper(width=width, | ||
initial_indent=initindent, | ||||
subsequent_indent=hangindent) | ||||
Mads Kiilerich
|
r15065 | return wrapper.fill(line).encode(encoding.encoding) | ||
Martin Geisler
|
r8938 | |||
Alexander Solovyov <piranha at piranha.org.ua>
|
r7879 | def iterlines(iterator): | ||
for chunk in iterator: | ||||
for line in chunk.splitlines(): | ||||
yield line | ||||
Alexander Solovyov
|
r9610 | |||
def expandpath(path): | ||||
return os.path.expanduser(os.path.expandvars(path)) | ||||
Patrick Mezard
|
r10239 | |||
def hgcmd(): | ||||
"""Return the command used to execute current hg | ||||
This is different from hgexecutable() because on Windows we want | ||||
to avoid things opening new shell windows like batch files, so we | ||||
get either the python call or current executable. | ||||
""" | ||||
Adrian Buehlmann
|
r14228 | if mainfrozen(): | ||
Patrick Mezard
|
r10239 | return [sys.executable] | ||
return gethgcmd() | ||||
Patrick Mezard
|
r10344 | |||
def rundetached(args, condfn): | ||||
"""Execute the argument list in a detached process. | ||||
Augie Fackler
|
r10422 | |||
Patrick Mezard
|
r10344 | condfn is a callable which is called repeatedly and should return | ||
True once the child process is known to have started successfully. | ||||
At this point, the child process PID is returned. If the child | ||||
process fails to start or finishes before condfn() evaluates to | ||||
True, return -1. | ||||
""" | ||||
# Windows case is easier because the child process is either | ||||
# successfully starting and validating the condition or exiting | ||||
# on failure. We just poll on its PID. On Unix, if the child | ||||
# process fails to start, it will be left in a zombie state until | ||||
# the parent wait on it, which we cannot do since we expect a long | ||||
# running process on success. Instead we listen for SIGCHLD telling | ||||
# us our child process terminated. | ||||
terminated = set() | ||||
def handler(signum, frame): | ||||
terminated.add(os.wait()) | ||||
prevhandler = None | ||||
Augie Fackler
|
r14968 | SIGCHLD = getattr(signal, 'SIGCHLD', None) | ||
if SIGCHLD is not None: | ||||
prevhandler = signal.signal(SIGCHLD, handler) | ||||
Patrick Mezard
|
r10344 | try: | ||
pid = spawndetached(args) | ||||
while not condfn(): | ||||
if ((pid in terminated or not testpid(pid)) | ||||
and not condfn()): | ||||
return -1 | ||||
time.sleep(0.1) | ||||
return pid | ||||
finally: | ||||
if prevhandler is not None: | ||||
signal.signal(signal.SIGCHLD, prevhandler) | ||||
Steve Losh
|
r10438 | |||
Steve Losh
|
r10487 | try: | ||
any, all = any, all | ||||
except NameError: | ||||
def any(iterable): | ||||
for i in iterable: | ||||
if i: | ||||
return True | ||||
return False | ||||
Steve Losh
|
r10438 | |||
Steve Losh
|
r10487 | def all(iterable): | ||
for i in iterable: | ||||
if not i: | ||||
return False | ||||
return True | ||||
Patrick Mezard
|
r11010 | |||
Roman Sokolov
|
r13392 | def interpolate(prefix, mapping, s, fn=None, escape_prefix=False): | ||
Steve Losh
|
r11988 | """Return the result of interpolating items in the mapping into string s. | ||
prefix is a single character string, or a two character string with | ||||
a backslash as the first character if the prefix needs to be escaped in | ||||
a regular expression. | ||||
fn is an optional function that will be applied to the replacement text | ||||
just before replacement. | ||||
Roman Sokolov
|
r13392 | |||
escape_prefix is an optional flag that allows using doubled prefix for | ||||
its escaping. | ||||
Steve Losh
|
r11988 | """ | ||
fn = fn or (lambda s: s) | ||||
Roman Sokolov
|
r13392 | patterns = '|'.join(mapping.keys()) | ||
if escape_prefix: | ||||
patterns += '|' + prefix | ||||
if len(prefix) > 1: | ||||
prefix_char = prefix[1:] | ||||
else: | ||||
prefix_char = prefix | ||||
mapping[prefix_char] = prefix_char | ||||
r = re.compile(r'%s(%s)' % (prefix, patterns)) | ||||
Steve Losh
|
r11988 | return r.sub(lambda x: fn(mapping[x.group()[1:]]), s) | ||
Brodie Rao
|
r12076 | def getport(port): | ||
"""Return the port for a given network service. | ||||
If port is an integer, it's returned as is. If it's a string, it's | ||||
looked up using socket.getservbyname(). If there's no matching | ||||
service, util.Abort is raised. | ||||
""" | ||||
try: | ||||
return int(port) | ||||
except ValueError: | ||||
pass | ||||
try: | ||||
return socket.getservbyname(port) | ||||
except socket.error: | ||||
raise Abort(_("no port number associated with service '%s'") % port) | ||||
Augie Fackler
|
r12087 | |||
Augie Fackler
|
r12088 | _booleans = {'1': True, 'yes': True, 'true': True, 'on': True, 'always': True, | ||
'0': False, 'no': False, 'false': False, 'off': False, | ||||
'never': False} | ||||
Augie Fackler
|
r12087 | |||
def parsebool(s): | ||||
"""Parse s into a boolean. | ||||
If s is not a valid boolean, returns None. | ||||
""" | ||||
return _booleans.get(s.lower(), None) | ||||
Brodie Rao
|
r14076 | |||
Brodie Rao
|
r14077 | _hexdig = '0123456789ABCDEFabcdef' | ||
_hextochr = dict((a + b, chr(int(a + b, 16))) | ||||
for a in _hexdig for b in _hexdig) | ||||
def _urlunquote(s): | ||||
Mads Kiilerich
|
r17425 | """Decode HTTP/HTML % encoding. | ||
>>> _urlunquote('abc%20def') | ||||
'abc def' | ||||
""" | ||||
Brodie Rao
|
r14077 | res = s.split('%') | ||
# fastpath | ||||
if len(res) == 1: | ||||
return s | ||||
s = res[0] | ||||
for item in res[1:]: | ||||
try: | ||||
s += _hextochr[item[:2]] + item[2:] | ||||
except KeyError: | ||||
s += '%' + item | ||||
except UnicodeDecodeError: | ||||
s += unichr(int(item[:2], 16)) + item[2:] | ||||
return s | ||||
Brodie Rao
|
r14076 | class url(object): | ||
Mads Kiilerich
|
r14146 | r"""Reliable URL parser. | ||
Brodie Rao
|
r14076 | |||
This parses URLs and provides attributes for the following | ||||
components: | ||||
<scheme>://<user>:<passwd>@<host>:<port>/<path>?<query>#<fragment> | ||||
Missing components are set to None. The only exception is | ||||
fragment, which is set to '' if present but empty. | ||||
If parsefragment is False, fragment is included in query. If | ||||
parsequery is False, query is included in path. If both are | ||||
False, both fragment and query are included in path. | ||||
See http://www.ietf.org/rfc/rfc2396.txt for more information. | ||||
Note that for backward compatibility reasons, bundle URLs do not | ||||
take host names. That means 'bundle://../' has a path of '../'. | ||||
Examples: | ||||
>>> url('http://www.ietf.org/rfc/rfc2396.txt') | ||||
<url scheme: 'http', host: 'www.ietf.org', path: 'rfc/rfc2396.txt'> | ||||
>>> url('ssh://[::1]:2200//home/joe/repo') | ||||
<url scheme: 'ssh', host: '[::1]', port: '2200', path: '/home/joe/repo'> | ||||
>>> url('file:///home/joe/repo') | ||||
<url scheme: 'file', path: '/home/joe/repo'> | ||||
Matt Mackall
|
r14915 | >>> url('file:///c:/temp/foo/') | ||
<url scheme: 'file', path: 'c:/temp/foo/'> | ||||
Brodie Rao
|
r14076 | >>> url('bundle:foo') | ||
<url scheme: 'bundle', path: 'foo'> | ||||
>>> url('bundle://../foo') | ||||
<url scheme: 'bundle', path: '../foo'> | ||||
Mads Kiilerich
|
r14146 | >>> url(r'c:\foo\bar') | ||
<url path: 'c:\\foo\\bar'> | ||||
Matt Mackall
|
r14699 | >>> url(r'\\blah\blah\blah') | ||
<url path: '\\\\blah\\blah\\blah'> | ||||
Matt Mackall
|
r15074 | >>> url(r'\\blah\blah\blah#baz') | ||
<url path: '\\\\blah\\blah\\blah', fragment: 'baz'> | ||||
Brodie Rao
|
r14076 | |||
Authentication credentials: | ||||
>>> url('ssh://joe:xyz@x/repo') | ||||
<url scheme: 'ssh', user: 'joe', passwd: 'xyz', host: 'x', path: 'repo'> | ||||
>>> url('ssh://joe@x/repo') | ||||
<url scheme: 'ssh', user: 'joe', host: 'x', path: 'repo'> | ||||
Query strings and fragments: | ||||
>>> url('http://host/a?b#c') | ||||
<url scheme: 'http', host: 'host', path: 'a', query: 'b', fragment: 'c'> | ||||
>>> url('http://host/a?b#c', parsequery=False, parsefragment=False) | ||||
<url scheme: 'http', host: 'host', path: 'a?b#c'> | ||||
""" | ||||
_safechars = "!~*'()+" | ||||
Mads Kiilerich
|
r15452 | _safepchars = "/!~*'()+:" | ||
Brodie Rao
|
r14076 | _matchscheme = re.compile(r'^[a-zA-Z0-9+.\-]+:').match | ||
def __init__(self, path, parsequery=True, parsefragment=True): | ||||
# We slowly chomp away at path until we have only the path left | ||||
self.scheme = self.user = self.passwd = self.host = None | ||||
self.port = self.path = self.query = self.fragment = None | ||||
self._localpath = True | ||||
self._hostport = '' | ||||
self._origpath = path | ||||
Matt Mackall
|
r15074 | if parsefragment and '#' in path: | ||
path, self.fragment = path.split('#', 1) | ||||
if not path: | ||||
path = None | ||||
Matt Mackall
|
r14699 | # special case for Windows drive letters and UNC paths | ||
if hasdriveletter(path) or path.startswith(r'\\'): | ||||
Brodie Rao
|
r14076 | self.path = path | ||
return | ||||
# For compatibility reasons, we can't handle bundle paths as | ||||
# normal URLS | ||||
if path.startswith('bundle:'): | ||||
self.scheme = 'bundle' | ||||
path = path[7:] | ||||
if path.startswith('//'): | ||||
path = path[2:] | ||||
self.path = path | ||||
return | ||||
if self._matchscheme(path): | ||||
parts = path.split(':', 1) | ||||
if parts[0]: | ||||
self.scheme, path = parts | ||||
self._localpath = False | ||||
if not path: | ||||
path = None | ||||
if self._localpath: | ||||
self.path = '' | ||||
return | ||||
else: | ||||
if self._localpath: | ||||
self.path = path | ||||
return | ||||
if parsequery and '?' in path: | ||||
path, self.query = path.split('?', 1) | ||||
if not path: | ||||
path = None | ||||
if not self.query: | ||||
self.query = None | ||||
# // is required to specify a host/authority | ||||
if path and path.startswith('//'): | ||||
parts = path[2:].split('/', 1) | ||||
if len(parts) > 1: | ||||
self.host, path = parts | ||||
path = path | ||||
else: | ||||
self.host = parts[0] | ||||
path = None | ||||
if not self.host: | ||||
self.host = None | ||||
Mads Kiilerich
|
r15018 | # path of file:///d is /d | ||
# path of file:///d:/ is d:/, not /d:/ | ||||
Matt Mackall
|
r14915 | if path and not hasdriveletter(path): | ||
Brodie Rao
|
r14076 | path = '/' + path | ||
if self.host and '@' in self.host: | ||||
self.user, self.host = self.host.rsplit('@', 1) | ||||
if ':' in self.user: | ||||
self.user, self.passwd = self.user.split(':', 1) | ||||
if not self.host: | ||||
self.host = None | ||||
# Don't split on colons in IPv6 addresses without ports | ||||
if (self.host and ':' in self.host and | ||||
not (self.host.startswith('[') and self.host.endswith(']'))): | ||||
self._hostport = self.host | ||||
self.host, self.port = self.host.rsplit(':', 1) | ||||
if not self.host: | ||||
self.host = None | ||||
if (self.host and self.scheme == 'file' and | ||||
self.host not in ('localhost', '127.0.0.1', '[::1]')): | ||||
raise Abort(_('file:// URLs can only refer to localhost')) | ||||
self.path = path | ||||
Benoit Boissinot
|
r14988 | # leave the query string escaped | ||
Brodie Rao
|
r14076 | for a in ('user', 'passwd', 'host', 'port', | ||
Benoit Boissinot
|
r14988 | 'path', 'fragment'): | ||
Brodie Rao
|
r14076 | v = getattr(self, a) | ||
if v is not None: | ||||
Brodie Rao
|
r14077 | setattr(self, a, _urlunquote(v)) | ||
Brodie Rao
|
r14076 | |||
def __repr__(self): | ||||
attrs = [] | ||||
for a in ('scheme', 'user', 'passwd', 'host', 'port', 'path', | ||||
'query', 'fragment'): | ||||
v = getattr(self, a) | ||||
if v is not None: | ||||
attrs.append('%s: %r' % (a, v)) | ||||
return '<url %s>' % ', '.join(attrs) | ||||
def __str__(self): | ||||
Mads Kiilerich
|
r14147 | r"""Join the URL's components back into a URL string. | ||
Brodie Rao
|
r14076 | |||
Examples: | ||||
Mads Kiilerich
|
r15452 | >>> str(url('http://user:pw@host:80/c:/bob?fo:oo#ba:ar')) | ||
'http://user:pw@host:80/c:/bob?fo:oo#ba:ar' | ||||
Benoit Boissinot
|
r14988 | >>> str(url('http://user:pw@host:80/?foo=bar&baz=42')) | ||
'http://user:pw@host:80/?foo=bar&baz=42' | ||||
>>> str(url('http://user:pw@host:80/?foo=bar%3dbaz')) | ||||
'http://user:pw@host:80/?foo=bar%3dbaz' | ||||
Brodie Rao
|
r14076 | >>> str(url('ssh://user:pw@[::1]:2200//home/joe#')) | ||
'ssh://user:pw@[::1]:2200//home/joe#' | ||||
>>> str(url('http://localhost:80//')) | ||||
'http://localhost:80//' | ||||
>>> str(url('http://localhost:80/')) | ||||
'http://localhost:80/' | ||||
>>> str(url('http://localhost:80')) | ||||
'http://localhost:80/' | ||||
>>> str(url('bundle:foo')) | ||||
'bundle:foo' | ||||
>>> str(url('bundle://../foo')) | ||||
'bundle:../foo' | ||||
>>> str(url('path')) | ||||
'path' | ||||
Peter Arrenbrecht
|
r14313 | >>> str(url('file:///tmp/foo/bar')) | ||
'file:///tmp/foo/bar' | ||||
Patrick Mezard
|
r15609 | >>> str(url('file:///c:/tmp/foo/bar')) | ||
Matt Mackall
|
r15611 | 'file:///c:/tmp/foo/bar' | ||
Mads Kiilerich
|
r14147 | >>> print url(r'bundle:foo\bar') | ||
bundle:foo\bar | ||||
Brodie Rao
|
r14076 | """ | ||
if self._localpath: | ||||
s = self.path | ||||
if self.scheme == 'bundle': | ||||
s = 'bundle:' + s | ||||
if self.fragment: | ||||
s += '#' + self.fragment | ||||
return s | ||||
s = self.scheme + ':' | ||||
Peter Arrenbrecht
|
r14313 | if self.user or self.passwd or self.host: | ||
s += '//' | ||||
Patrick Mezard
|
r15609 | elif self.scheme and (not self.path or self.path.startswith('/') | ||
or hasdriveletter(self.path)): | ||||
Brodie Rao
|
r14076 | s += '//' | ||
Patrick Mezard
|
r15609 | if hasdriveletter(self.path): | ||
s += '/' | ||||
Brodie Rao
|
r14076 | if self.user: | ||
s += urllib.quote(self.user, safe=self._safechars) | ||||
if self.passwd: | ||||
s += ':' + urllib.quote(self.passwd, safe=self._safechars) | ||||
if self.user or self.passwd: | ||||
s += '@' | ||||
if self.host: | ||||
if not (self.host.startswith('[') and self.host.endswith(']')): | ||||
s += urllib.quote(self.host) | ||||
else: | ||||
s += self.host | ||||
if self.port: | ||||
s += ':' + urllib.quote(self.port) | ||||
if self.host: | ||||
s += '/' | ||||
if self.path: | ||||
Benoit Boissinot
|
r14988 | # TODO: similar to the query string, we should not unescape the | ||
# path when we store it, the path might contain '%2f' = '/', | ||||
# which we should *not* escape. | ||||
Brodie Rao
|
r14076 | s += urllib.quote(self.path, safe=self._safepchars) | ||
if self.query: | ||||
Benoit Boissinot
|
r14988 | # we store the query in escaped form. | ||
s += '?' + self.query | ||||
Brodie Rao
|
r14076 | if self.fragment is not None: | ||
s += '#' + urllib.quote(self.fragment, safe=self._safepchars) | ||||
return s | ||||
def authinfo(self): | ||||
user, passwd = self.user, self.passwd | ||||
try: | ||||
self.user, self.passwd = None, None | ||||
s = str(self) | ||||
finally: | ||||
self.user, self.passwd = user, passwd | ||||
if not self.user: | ||||
return (s, None) | ||||
Patrick Mezard
|
r15028 | # authinfo[1] is passed to urllib2 password manager, and its | ||
# URIs must not contain credentials. The host is passed in the | ||||
# URIs list because Python < 2.4.3 uses only that to search for | ||||
# a password. | ||||
Patrick Mezard
|
r15024 | return (s, (None, (s, self.host), | ||
Brodie Rao
|
r14076 | self.user, self.passwd or '')) | ||
Matt Mackall
|
r14766 | def isabs(self): | ||
if self.scheme and self.scheme != 'file': | ||||
return True # remote URL | ||||
if hasdriveletter(self.path): | ||||
return True # absolute for our purposes - can't be joined() | ||||
if self.path.startswith(r'\\'): | ||||
return True # Windows UNC path | ||||
if self.path.startswith('/'): | ||||
return True # POSIX-style | ||||
return False | ||||
Brodie Rao
|
r14076 | def localpath(self): | ||
if self.scheme == 'file' or self.scheme == 'bundle': | ||||
path = self.path or '/' | ||||
# For Windows, we need to promote hosts containing drive | ||||
# letters to paths with drive letters. | ||||
if hasdriveletter(self._hostport): | ||||
path = self._hostport + '/' + self.path | ||||
Mads Kiilerich
|
r15496 | elif (self.host is not None and self.path | ||
and not hasdriveletter(path)): | ||||
Brodie Rao
|
r14076 | path = '/' + path | ||
return path | ||||
return self._origpath | ||||
def hasscheme(path): | ||||
return bool(url(path).scheme) | ||||
def hasdriveletter(path): | ||||
Patrick Mezard
|
r15609 | return path and path[1:2] == ':' and path[0:1].isalpha() | ||
Brodie Rao
|
r14076 | |||
Mads Kiilerich
|
r14825 | def urllocalpath(path): | ||
Brodie Rao
|
r14076 | return url(path, parsequery=False, parsefragment=False).localpath() | ||
def hidepassword(u): | ||||
'''hide user credential in a url string''' | ||||
u = url(u) | ||||
if u.passwd: | ||||
u.passwd = '***' | ||||
return str(u) | ||||
def removeauth(u): | ||||
'''remove all authentication information from a url string''' | ||||
u = url(u) | ||||
u.user = u.passwd = None | ||||
return str(u) | ||||
Idan Kamara
|
r14515 | |||
def isatty(fd): | ||||
try: | ||||
return fd.isatty() | ||||
except AttributeError: | ||||
return False | ||||