##// END OF EJS Templates
util._matcher: fix handling of relglob: patterns
util._matcher: fix handling of relglob: patterns

File last commit:

r4188:ce3ecf99 default
r4188:ce3ecf99 default
Show More
util.py
1377 lines | 42.4 KiB | text/x-python | PythonLexer
mpm@selenic.com
Update util.py docstrings, fix walk test
r1082 """
util.py - Mercurial utility functions and platform specific implementations
Copyright 2005 K. Thananchayan <thananck@yahoo.com>
Vadim Gelfer
update copyrights.
r2859 Copyright 2005, 2006 Matt Mackall <mpm@selenic.com>
Copyright 2006 Vadim Gelfer <vadim.gelfer@gmail.com>
mpm@selenic.com
Update util.py docstrings, fix walk test
r1082
This software may be used and distributed according to the terms
of the GNU General Public License, incorporated herein by reference.
This contains helper routines that are independent of the SCM core and hide
platform-specific details from the core.
"""
mpm@selenic.com
[PATCH] file seperator handling for the other 'OS'...
r419
Benoit Boissinot
i18n first part: make '_' available for files who need it
r1400 from i18n import gettext as _
Bryan O'Sullivan
Get add and locate to use new repo and dirstate walk code....
r724 from demandload import *
Vadim Gelfer
fix windows username problem.
r2652 demandload(globals(), "cStringIO errno getpass popen2 re shutil sys tempfile")
Alexis S. L. Carvalho
Explicitly expand globs on Windows
r4054 demandload(globals(), "os threading time calendar ConfigParser locale glob")
Matt Mackall
Add encoding detection
r3769
Alexis S. L. Carvalho
Fallback to ascii if getpreferredencoding raises an exception...
# Local character encoding: $HGENCODING wins, then the locale's preferred
# encoding, then plain ASCII when neither yields a value or the locale
# lookup itself fails.
try:
    _encoding = (os.environ.get("HGENCODING")
                 or locale.getpreferredencoding()
                 or "ascii")
except locale.Error:
    _encoding = 'ascii'

# Error-handling mode used when decoding local strings ($HGENCODINGMODE).
_encodingmode = os.environ.get("HGENCODINGMODE", "strict")

# Encoding tried after strict UTF-8 decoding of an internal string fails.
_fallbackencoding = 'ISO-8859-1'
Matt Mackall
Add functions for transcoding and manipulating multibyte strings
r3770
def tolocal(s):
"""
Convert a string from internal UTF-8 to local encoding
All internal strings should be UTF-8 but some repos before the
implementation of locale support may contain latin1 or possibly
other character sets. We attempt to decode everything strictly
using UTF-8, then Latin-1, and failing that, we use UTF-8 and
replace unknown characters.
"""
Alexis S. L. Carvalho
Allow the user to specify the fallback encoding for the changelog...
r3835 for e in ('UTF-8', _fallbackencoding):
Matt Mackall
Add functions for transcoding and manipulating multibyte strings
r3770 try:
u = s.decode(e) # attempt strict decoding
return u.encode(_encoding, "replace")
Matt Mackall
make transcoding more robust...
r3843 except LookupError, k:
raise Abort(_("%s, please check your locale settings") % k)
Matt Mackall
Add functions for transcoding and manipulating multibyte strings
r3770 except UnicodeDecodeError:
pass
u = s.decode("utf-8", "replace") # last ditch
return u.encode(_encoding, "replace")
def fromlocal(s):
"""
Convert a string from the local character encoding to UTF-8
We attempt to decode strings using the encoding mode set by
HG_ENCODINGMODE, which defaults to 'strict'. In this mode, unknown
characters will cause an error message. Other modes include
'replace', which replaces unknown characters with a special
Unicode character, and 'ignore', which drops the character.
"""
try:
return s.decode(_encoding, _encodingmode).encode("utf-8")
except UnicodeDecodeError, inst:
sub = s[max(0, inst.start-10):inst.start+10]
Matt Mackall
make transcoding more robust...
r3843 raise Abort("decoding near '%s': %s!" % (sub, inst))
except LookupError, k:
raise Abort(_("%s, please check your locale settings") % k)
Matt Mackall
Add functions for transcoding and manipulating multibyte strings
r3770
def locallen(s):
    """Return the number of characters (not bytes) in a local string"""
    # undecodable bytes are replaced rather than rejected
    chars = s.decode(_encoding, "replace")
    return len(chars)
def localsub(s, a, b=None):
try:
u = s.decode(_encoding, _encodingmode)
if b is not None:
u = u[a:b]
else:
u = u[:a]
return u.encode(_encoding, _encodingmode)
except UnicodeDecodeError, inst:
sub = s[max(0, inst.start-10), inst.start+10]
Matt Mackall
make transcoding more robust...
r3843 raise Abort(_("decoding near '%s': %s!\n") % (sub, inst))
mpm@selenic.com
Add file encoding/decoding support
r1258
Chris Mason
util.parsedate should understand dates from hg export
r2609 # used by parsedate
Matt Mackall
improve date parsing for numerous new date formats...
# strptime formats tried, in order, when parsing a date
defaultdateformats = (
    '%Y-%m-%d %H:%M:%S',
    '%Y-%m-%d %I:%M:%S%p',
    '%Y-%m-%d %H:%M',
    '%Y-%m-%d %I:%M%p',
    '%Y-%m-%d',
    '%m-%d',
    '%m/%d',
    '%m/%d/%y',
    '%m/%d/%Y',
    '%a %b %d %H:%M:%S %Y',
    '%a %b %d %I:%M:%S%p %Y',
    '%b %d %H:%M:%S %Y',
    '%b %d %I:%M:%S%p %Y',
    '%b %d %H:%M:%S',
    '%b %d %I:%M:%S%p',
    '%b %d %H:%M',
    '%b %d %I:%M%p',
    '%b %d %Y',
    '%b %d',
    '%H:%M:%S',
    # 12-hour clock with seconds needs the %p (AM/PM) directive; a
    # literal 'P' here would never match real input
    '%I:%M:%S%p',
    '%H:%M',
    '%I:%M%p',
    )

# the default formats plus coarser year/month-only forms
extendeddateformats = defaultdateformats + (
    "%Y",
    "%Y-%m",
    "%b",
    "%b %Y",
    )
Chris Mason
util.parsedate should understand dates from hg export
r2609
Vadim Gelfer
move SignalInterrupt class into util module.
class SignalInterrupt(Exception):
    """Exception raised when SIGTERM or SIGHUP is received."""
    pass
Alexis S. L. Carvalho
Use a case-sensitive version of SafeConfigParser everywhere...
class configparser(ConfigParser.SafeConfigParser):
    """SafeConfigParser variant whose option names keep their case"""

    def optionxform(self, optionstr):
        # identity transform: the option name is handed back untouched
        return optionstr
Brendan Cully
Add cachefunc to abstract function call cache
def cachefunc(func):
    '''cache the result of function calls

    Returns a wrapper around func that remembers results keyed by the
    positional arguments, which must therefore be hashable.  Callables
    that expose no code object (builtins, callable instances) are
    accepted and go through the generic varargs wrapper.'''
    # XXX doesn't handle keywords args
    cache = {}
    code = getattr(func, 'func_code', None)
    if code is not None and code.co_argcount == 1:
        # we gain a small amount of time because
        # we don't need to pack/unpack the list
        def f(arg):
            if arg not in cache:
                cache[arg] = func(arg)
            return cache[arg]
    else:
        def f(*args):
            if args not in cache:
                cache[args] = func(*args)
            return cache[args]

    return f
Bryan O'Sullivan
Enhance the file filtering capabilities....
r1293 def pipefilter(s, cmd):
'''filter string S through command CMD, returning its output'''
mpm@selenic.com
Add file encoding/decoding support
r1258 (pout, pin) = popen2.popen2(cmd, -1, 'b')
def writer():
Alexis S. L. Carvalho
Ignore EPIPE in pipefilter...
r2096 try:
pin.write(s)
pin.close()
except IOError, inst:
if inst.errno != errno.EPIPE:
raise
mpm@selenic.com
Add file encoding/decoding support
r1258
# we should use select instead on UNIX, but this will work on most
# systems, including Windows
w = threading.Thread(target=writer)
w.start()
f = pout.read()
pout.close()
w.join()
return f
mpm@selenic.com
[PATCH] file seperator handling for the other 'OS'...
r419
Bryan O'Sullivan
Enhance the file filtering capabilities....
def tempfilter(s, cmd):
    '''filter string S through a pair of temporary files with CMD.

    CMD is used as a template to create the real command to be run,
    with the strings INFILE and OUTFILE replaced by the real names of
    the temporary files generated.

    Returns the contents of the output file.  Raises Abort when the
    command exits with a non-zero status.  Both temporary files are
    removed afterwards on a best-effort basis.'''
    inname, outname = None, None
    try:
        infd, inname = tempfile.mkstemp(prefix='hg-filter-in-')
        fp = os.fdopen(infd, 'wb')
        try:
            fp.write(s)
        finally:
            fp.close()
        outfd, outname = tempfile.mkstemp(prefix='hg-filter-out-')
        # the command reopens the output file by name
        os.close(outfd)
        cmd = cmd.replace('INFILE', inname)
        cmd = cmd.replace('OUTFILE', outname)
        code = os.system(cmd)
        if code:
            raise Abort(_("command '%s' failed: %s") %
                        (cmd, explain_exit(code)))
        # close the result file explicitly so it is not still open when
        # the cleanup below unlinks it
        fp = open(outname, 'rb')
        try:
            return fp.read()
        finally:
            fp.close()
    finally:
        for name in (inname, outname):
            if name:
                try:
                    os.unlink(name)
                except OSError:
                    # best effort: a leftover temp file is not fatal
                    pass
# maps a command prefix to the function implementing that filter style
filtertable = {
    'tempfile:': tempfilter,
    'pipe:': pipefilter,
    }

def filter(s, cmd):
    "filter a string through a command that transforms its input to its output"
    for prefix in filtertable:
        if not cmd.startswith(prefix):
            continue
        # strip the prefix and any whitespace that follows it
        stripped = cmd[len(prefix):].lstrip()
        return filtertable[prefix](s, stripped)
    # no recognised prefix: treat the whole string as a pipe command
    return pipefilter(s, cmd)
Vadim Gelfer
import: use gpatch if present on system. patch is broken on solaris....
def find_in_path(name, path, default=None):
    '''look for name in a search path.

    path is either a string (split on os.pathsep) or any iterable of
    directory names.  The first existing directory/name combination
    is returned; default is returned when there is none.'''
    dirs = path
    if isinstance(dirs, str):
        dirs = dirs.split(os.pathsep)
    for d in dirs:
        candidate = os.path.join(d, name)
        if os.path.exists(candidate):
            return candidate
    return default
mpm@selenic.com
Add automatic binary file detection to diff and export...
def binary(s):
    """return true if a string is binary data using diff's heuristic

    The heuristic is a NUL byte within the first 4096 characters."""
    return bool(s and '\0' in s[:4096])
mpm@selenic.com
Move dirstate.uniq to util.unique...
def unique(g):
    """return the distinct elements of iterable g as a list

    Elements keep the order of their first appearance and must be
    hashable."""
    seen = {}
    result = []
    for item in g:
        if item in seen:
            continue
        seen[item] = 1
        result.append(item)
    return result
mpm@selenic.com
Move dirstate.uniq to util.unique...
r556
Bryan O'Sullivan
Teach walk code about absolute paths....
class Abort(Exception):
    """Raised when a command has to print an error and exit."""
    pass
mpm@selenic.com
[PATCH] Harden os.system...
r508
Thomas Arendsen Hein
New UnexpectedOutput exception to catch server errors in localrepo.stream_in...
class UnexpectedOutput(Abort):
    """Raised to print an error together with part of the output, then exit."""
    pass
Bryan O'Sullivan
Get add and locate to use new repo and dirstate walk code....
def always(fn):
    """match function that accepts every name"""
    return True
def never(fn):
    """match function that rejects every name"""
    return False
Alexis S. L. Carvalho
Explicitly expand globs on Windows
def expand_glob(pats):
    '''On Windows, expand the implicit globs in a list of patterns

    Elsewhere the patterns are returned unchanged, as a new list.
    Only patterns without an explicit kind prefix are expanded.'''
    if os.name != 'nt':
        return list(pats)
    expanded = []
    for pat in pats:
        kind, name = patkind(pat, None)
        found = []
        if kind is None:
            found = glob.glob(name)
        if found:
            expanded.extend(found)
        else:
            # if we couldn't expand the glob, just keep it around
            expanded.append(pat)
    return expanded
Robin Farine
export patkind() from util
def patkind(name, dflt_pat='glob'):
    """Split a string into an optional pattern kind prefix and the
    actual pattern.

    When name starts with a known '<kind>:' prefix the result is the
    two-element list [kind, pattern]; otherwise it is the tuple
    (dflt_pat, name)."""
    known = ('re', 'glob', 'path', 'relglob', 'relpath', 'relre')
    if ':' in name:
        kind, pattern = name.split(':', 1)
        if kind in known:
            return [kind, pattern]
    return dflt_pat, name
benoit.boissinot@ens-lyon.fr
pep-0008 cleanup...
def globre(pat, head='^', tail='$'):
    """convert a glob pattern into a regexp

    head and tail are placed before and after the translated pattern.
    Supported syntax: '*', '**', '?', '[...]' character classes,
    '{a,b}' alternation and backslash escapes."""
    pieces = []
    pos, end = 0, len(pat)
    ingroup = False
    while pos < end:
        ch = pat[pos]
        pos += 1
        if ch == '*':
            # '**' crosses directory separators, a single '*' does not
            if pos < end and pat[pos] == '*':
                pos += 1
                pieces.append('.*')
            else:
                pieces.append('[^/]*')
        elif ch == '?':
            pieces.append('.')
        elif ch == '[':
            # find the closing bracket; a leading '!' or ']' belongs to
            # the class itself
            close = pos
            if close < end and pat[close] in '!]':
                close += 1
            while close < end and pat[close] != ']':
                close += 1
            if close >= end:
                # unterminated class: a literal '['
                pieces.append('\\[')
            else:
                chars = pat[pos:close].replace('\\', '\\\\')
                pos = close + 1
                if chars[0] == '!':
                    chars = '^' + chars[1:]
                elif chars[0] == '^':
                    chars = '\\' + chars
                pieces.append('[%s]' % chars)
        elif ch == '{':
            ingroup = True
            pieces.append('(?:')
        elif ingroup and ch == '}':
            pieces.append(')')
            ingroup = False
        elif ingroup and ch == ',':
            pieces.append('|')
        elif ch == '\\' and pos < end:
            # escaped character: take the next one literally
            pieces.append(re.escape(pat[pos]))
            pos += 1
        else:
            pieces.append(re.escape(ch))
    return head + ''.join(pieces) + tail
Bryan O'Sullivan
Reduce the amount of stat traffic generated by a walk....
# characters whose presence makes a path component a glob
_globchars = dict.fromkeys('[{*?', 1)
Bryan O'Sullivan
Fix walk code for files that do not exist anywhere, and unhandled types....
def pathto(n1, n2):
    '''return the relative path from one place to another.

    n1 should use os.sep to separate directories
    n2 should use "/" to separate directories
    returns an os.sep-separated path.
    '''
    if not n1:
        return localpath(n2)
    src = n1.split(os.sep)
    dst = n2.split('/')
    # count the leading components both paths share
    common = 0
    limit = min(len(src), len(dst))
    while common < limit and src[common] == dst[common]:
        common += 1
    # climb out of what is left of n1, then descend into the rest of n2
    climb = ['..'] * (len(src) - common)
    return os.sep.join(climb + dst[common:])
mpm@selenic.com
Change canonpath to not know about repo objects...
def canonpath(root, cwd, myname):
    """return the canonical path of myname, given cwd and root

    The result is relative to root and has been through audit_path
    and pconvert; it is '' when myname names root itself.  Raises
    Abort when myname does not lie under root."""
    # root with exactly one trailing separator (covers root == os.sep)
    if root.endswith(os.sep):
        rootsep = root
    else:
        rootsep = root + os.sep
    name = myname
    if not os.path.isabs(name):
        name = os.path.join(root, cwd, name)
    name = os.path.normpath(name)
    if name != rootsep and name.startswith(rootsep):
        # plain textual containment: strip the root prefix
        relname = name[len(rootsep):]
        audit_path(relname)
        return pconvert(relname)
    if name == root:
        return ''
    # Determine whether `name' is in the hierarchy at or beneath `root',
    # by iterating name=dirname(name) until that causes no change (can't
    # check name == '/', because that doesn't work on windows).  For each
    # `name', compare dev/inode numbers.  If they match, the list `rel'
    # holds the reversed list of components making up the relative file
    # name we want.
    root_st = os.stat(root)
    rel = []
    while True:
        try:
            name_st = os.stat(name)
        except OSError:
            break
        if samestat(name_st, root_st):
            if not rel:
                # name was actually the same as root (maybe a symlink)
                return ''
            rel.reverse()
            relname = os.path.join(*rel)
            audit_path(relname)
            return pconvert(relname)
        parent, leaf = os.path.split(name)
        rel.append(leaf)
        if parent == name:
            # reached the top of the filesystem without meeting root
            break
        name = parent

    raise Abort('%s not under root' % myname)
mpm@selenic.com
Fix bug with empty inc and exc...
r897
Vadim Gelfer
if hgignore contains errors, print message that is not confusing.
def matcher(canonroot, cwd='', names=['.'], inc=[], exc=[], head='', src=None):
    """build a matcher in which names without a kind prefix are globs

    Arguments and return value are those of _matcher."""
    default_kind = 'glob'
    return _matcher(canonroot, cwd, names, inc, exc, head, default_kind, src)
Benoit Boissinot
Do not use 'glob' expansion by default on OS != 'nt'
r1413
Alexis S. L. Carvalho
docopy: deal with globs on windows in a better way
def cmdmatcher(canonroot, cwd='', names=['.'], inc=[], exc=[], head='',
               src=None, globbed=False):
    """build a matcher in which names without a kind prefix are
    paths relative to cwd

    Unless globbed is true, names first go through expand_glob.
    Remaining arguments and the return value are those of _matcher."""
    if globbed:
        patterns = names
    else:
        patterns = expand_glob(names)
    return _matcher(canonroot, cwd, patterns, inc, exc, head, 'relpath', src)
Benoit Boissinot
Do not use 'glob' expansion by default on OS != 'nt'
r1413
Vadim Gelfer
if hgignore contains errors, print message that is not confusing.
def _matcher(canonroot, cwd, names, inc, exc, head, dflt_pat, src):
    """build a function to match a set of file patterns

    arguments:
    canonroot - the canonical root of the tree you're matching against
    cwd - the current working directory, if relevant
    names - patterns to find
    inc - patterns to include
    exc - patterns to exclude
    head - a regex to prepend to patterns to control whether a match is rooted
    dflt_pat - if a pattern in names has no explicit type, assume this one
    src - where these patterns came from (e.g. .hgignore)

    a pattern is one of:
    'glob:<glob>' - a glob relative to cwd
    're:<regexp>' - a regular expression
    'path:<path>' - a path relative to canonroot
    'relglob:<glob>' - an unrooted glob (*.c matches C files in all dirs)
    'relpath:<path>' - a path relative to cwd
    'relre:<regexp>' - a regexp that doesn't have to match the start of a name
    '<something>' - one of the cases above, selected by the dflt_pat argument

    returns:
    a 3-tuple containing
    - list of roots (places where one should start a recursive walk of the fs);
      this often matches the explicit non-pattern names passed in, but also
      includes the initial part of glob: patterns that has no glob characters
    - a bool match(filename) function
    - a bool indicating if any patterns were passed in

    todo:
    make head regex a rooted bool
    """

    def contains_glob(name):
        '''true if name holds at least one glob metacharacter'''
        return bool([c for c in name if c in _globchars])

    def regex(kind, name, tail):
        '''convert a pattern into a regular expression'''
        if kind == 're':
            return name
        if kind == 'path':
            return '^' + re.escape(name) + '(?:/|$)'
        if kind == 'relglob':
            return head + globre(name, '(?:|.*/)', '(?:/|$)')
        if kind == 'relpath':
            return head + re.escape(name) + tail
        if kind == 'relre':
            if name.startswith('^'):
                return name
            return '.*' + name
        # anything else is treated as a rooted glob
        return head + globre(name, '', tail)

    def matchfn(pats, tail):
        """build a matching function from a set of patterns"""
        if not pats:
            return
        matchers = []
        for k, p in pats:
            try:
                compiled = re.compile('(?:%s)' % regex(k, p, tail))
            except re.error:
                if src:
                    raise Abort("%s: invalid pattern (%s): %s" % (src, k, p))
                raise Abort("invalid pattern (%s): %s" % (k, p))
            matchers.append(compiled.match)

        def buildfn(text):
            # first successful match object wins; None when nothing matches
            for m in matchers:
                r = m(text)
                if r:
                    return r

        return buildfn

    def globprefix(pat):
        '''return the non-glob prefix of a path, e.g. foo/* -> foo'''
        literal = []
        for part in pat.split('/'):
            if contains_glob(part):
                break
            literal.append(part)
        return '/'.join(literal) or '.'

    pats = []
    files = []
    roots = []
    for p in names:
        kind, name = patkind(p, dflt_pat)
        if kind in ('glob', 'relpath'):
            name = canonpath(canonroot, cwd, name)
            if name == '':
                # the tree root itself: match everything
                kind, name = 'glob', '**'
        elif kind == 'relglob':
            name = normpath(name)
        if kind in ('glob', 'path', 're', 'relglob'):
            pats.append((kind, name))
        if kind == 'glob':
            roots.append(globprefix(name))
        elif kind == 'relpath':
            files.append((kind, name))
            roots.append(name)
        elif kind == 'relglob':
            roots.append('.')

    patmatch = matchfn(pats, '$') or always
    filematch = matchfn(files, '(?:/|$)') or always
    if inc:
        inckinds = [patkind(canonpath(canonroot, cwd, i)) for i in inc]
        incmatch = matchfn(inckinds, '(?:/|$)')
    else:
        incmatch = always
    if exc:
        exckinds = [patkind(canonpath(canonroot, cwd, x)) for x in exc]
        excmatch = matchfn(exckinds, '(?:/|$)')
    else:
        excmatch = lambda fn: False

    def match(fn):
        return (incmatch(fn) and not excmatch(fn) and
                (fn.endswith('/') or
                 (not pats and not files) or
                 (pats and patmatch(fn)) or
                 (files and filematch(fn))))

    anypats = (inc or exc or (pats and pats != [('glob', '**')])) and True
    return (roots, match, anypats)
mpm@selenic.com
Refactor matchpats and walk...
r742
Vadim Gelfer
merge util.esystem and util.system.
def system(cmd, environ={}, cwd=None, onerr=None, errprefix=None):
    '''enhanced shell command execution.
    run with environment maybe modified, maybe in different dir.

    if command fails and onerr is None, return status.  if ui object,
    print error message and return status, else raise onerr object as
    exception.

    the environment and the working directory are restored before
    returning, whether or not the command succeeded.'''
    def py2shell(val):
        'convert python object into string that is useful to shell'
        if val in (None, False):
            return '0'
        if val == True:
            return '1'
        return str(val)

    # remember the current value (or absence) of every variable we touch
    saved = dict([(k, os.environ.get(k)) for k in environ])
    chdir = False
    if cwd is not None:
        oldcwd = os.getcwd()
        chdir = oldcwd != cwd
    origcmd = cmd
    if os.name == 'nt':
        cmd = '"%s"' % cmd
    try:
        for k in environ:
            os.environ[k] = py2shell(environ[k])
        if chdir:
            os.chdir(cwd)
        rc = os.system(cmd)
        if rc and onerr:
            progname = os.path.basename(origcmd.split(None, 1)[0])
            errmsg = '%s %s' % (progname, explain_exit(rc)[0])
            if errprefix:
                errmsg = '%s: %s' % (errprefix, errmsg)
            try:
                onerr.warn(errmsg + '\n')
            except AttributeError:
                # not a ui-like object: treat onerr as an exception class
                raise onerr(errmsg)
        return rc
    finally:
        for k in saved:
            if saved[k] is None:
                del os.environ[k]
            else:
                os.environ[k] = saved[k]
        if chdir:
            os.chdir(oldcwd)
mpm@selenic.com
[PATCH] rename under the other OS...
def rename(src, dst):
    """forcibly rename a file

    A plain os.rename is tried first; when that fails, dst is moved
    out of the way and deleted before renaming again."""
    try:
        os.rename(src, dst)
        return
    except OSError:
        pass
    # on windows, rename to existing file is not allowed, so we
    # must delete destination first. but if file is open, unlink
    # schedules it for delete but does not delete it. rename
    # happens immediately even for open files, so we create
    # temporary file, delete it, rename destination to that name,
    # then delete that. then rename is safe to do.
    fd, scratch = tempfile.mkstemp(dir=os.path.dirname(dst) or '.')
    os.close(fd)
    os.unlink(scratch)
    os.rename(dst, scratch)
    os.unlink(scratch)
    os.rename(src, dst)
Benoit Boissinot
refactor some unlink/remove code and make sure we prune empty dir
def unlink(f):
    """unlink and remove the directory if it is empty"""
    os.unlink(f)
    parent = os.path.dirname(f)
    # try removing directories that might now be empty
    try:
        os.removedirs(parent)
    except OSError:
        # not empty or not removable: leave it alone
        pass
Benoit Boissinot
refactor some unlink/remove code and make sure we prune empty dir
r1415
Matt Mackall
util: add copyfile function
r3629 def copyfile(src, dest):
"copy a file, preserving mode"
try:
shutil.copyfile(src, dest)
shutil.copymode(src, dest)
except shutil.Error, inst:
Andrei Vermel
Fix wrong module reference in copyfile exception
r4067 raise Abort(str(inst))
Matt Mackall
util: add copyfile function
r3629
Stephen Darnell
Add support for cloning with hardlinks on windows....
def copyfiles(src, dst, hardlink=None):
    """Copy a directory tree using hardlinks if possible

    When hardlink is None, linking is attempted only if src and the
    directory that will contain dst are on the same device.  A file
    that cannot be linked is copied instead."""
    if hardlink is None:
        src_dev = os.stat(src).st_dev
        dst_dev = os.stat(os.path.dirname(dst)).st_dev
        hardlink = (src_dev == dst_dev)

    if os.path.isdir(src):
        os.mkdir(dst)
        for entry in os.listdir(src):
            copyfiles(os.path.join(src, entry),
                      os.path.join(dst, entry),
                      hardlink)
        return

    if hardlink:
        try:
            os_link(src, dst)
            return
        except (IOError, OSError):
            # linking failed: fall through to a plain copy
            pass
    shutil.copy(src, dst)
Thomas Arendsen Hein
Use python function instead of external 'cp' command when cloning repos....
r698
Thomas Arendsen Hein
Validate paths before reading or writing files in repository or working dir....
def audit_path(path):
    """Abort if path contains dangerous components

    A path is rejected when it carries a drive prefix, when its first
    component is '.hg' or empty, or when any component is os.pardir."""
    parts = os.path.normcase(path).split(os.sep)
    has_drive = os.path.splitdrive(path)[0]
    bad_start = parts[0] in ('.hg', '')
    climbs = os.pardir in parts
    if has_drive or bad_start or climbs:
        raise Abort(_("path contains illegal component: %s\n") % path)
Thomas Arendsen Hein
Make makelock and readlock work on filesystems without symlink support....
def _makelock_file(info, pathname):
    """create pathname as a new file holding info

    os.O_EXCL makes the open fail when pathname already exists."""
    flags = os.O_CREAT | os.O_WRONLY | os.O_EXCL
    fd = os.open(pathname, flags)
    os.write(fd, info)
    os.close(fd)
def _readlock_file(pathname):
    """return the whole contents of the file pathname"""
    fp = posixfile(pathname)
    return fp.read()
Thomas Arendsen Hein
Make makelock and readlock work on filesystems without symlink support....
r704
Stephen Darnell
Add support for cloning with hardlinks on windows....
def nlinks(pathname):
    """Return number of hardlinks for the given file.

    The file is examined with lstat, so a symlink is not followed."""
    st = os.lstat(pathname)
    return st.st_nlink
Stephen Darnell
Add support for cloning with hardlinks on windows....
r1241
# hardlink primitive: the platform's os.link when it exists, otherwise a
# stand-in that always fails
try:
    os_link = os.link
except AttributeError:
    def os_link(src, dst):
        raise OSError(0, _("Hardlinks not supported"))
Stephen Darnell
Add support for cloning with hardlinks on windows....
r1241
Vadim Gelfer
fix file handling bugs on windows....
def fstat(fp):
    '''stat file object that may not have fileno method.

    Without a fileno method the object's name attribute is
    stat'ed instead.'''
    try:
        fd = fp.fileno()
        return os.fstat(fd)
    except AttributeError:
        return os.stat(fp.name)
# alias for the builtin file type; _readlock_file opens lock files through it
posixfile = file
Vadim Gelfer
windows: revlog.lazyparser not always safe to use....
def is_win_9x():
    '''return true if run on windows 95, 98 or me.'''
    try:
        platform_id = sys.getwindowsversion()[3]
    except AttributeError:
        # no sys.getwindowsversion here: look at the command interpreter
        comspec = os.environ.get('comspec', '')
        return os.name == 'nt' and 'command' in comspec
    return platform_id == 1
Benoit Boissinot
only print a warning when no username is specified...
# optional callable used by getuser() when getpass cannot do the job
getuser_fallback = None

def getuser():
    '''return name of current user

    Raises Abort when the name cannot be determined and no fallback
    is installed.'''
    try:
        return getpass.getuser()
    except ImportError:
        # import of pwd will fail on windows - try fallback
        if not getuser_fallback:
            # raised if win32api not available
            raise Abort(_('user name not available - set USERNAME '
                          'environment variable'))
        return getuser_fallback()
Alexis S. L. Carvalho
Only read .hg/hgrc files from trusted users/groups...
def username(uid=None):
    """Return the name of the user with the given uid.

    If uid is None, return the name of the current user.  A uid
    without a password database entry is returned as a string of
    digits; None is returned where the pwd module is unavailable."""
    try:
        import pwd
    except ImportError:
        return None
    if uid is None:
        uid = os.getuid()
    try:
        entry = pwd.getpwuid(uid)
    except KeyError:
        return str(uid)
    return entry[0]
def groupname(gid=None):
    """Return the name of the group with the given gid.

    If gid is None, return the name of the current group.  A gid with
    no group database entry is returned as a string; None is returned
    when the grp module is not available."""
    try:
        import grp
    except ImportError:
        return None
    if gid is None:
        gid = os.getgid()
    try:
        entry = grp.getgrgid(gid)
    except KeyError:
        return str(gid)
    return entry[0]
Matt Mackall
imported patch folding
r3784 # File system features
def checkfolding(path):
    """
    Check whether the given path is on a case-sensitive filesystem

    Requires a path (like /foo/.hg) ending with a foldable final
    directory component.

    Returns False when the final component with its case swapped stats
    to the same result as path, True otherwise.  An OSError from the
    initial stat of path itself propagates.
    """
    s1 = os.stat(path)
    d, b = os.path.split(path)
    p2 = os.path.join(d, b.upper())
    if path == p2:
        # already upper case: probe the lower case spelling instead
        p2 = os.path.join(d, b.lower())
    try:
        s2 = os.stat(p2)
    except OSError:
        # the other spelling cannot be stat'ed: treated as
        # case-sensitive.  Only OSError is caught so that
        # KeyboardInterrupt and programming errors are not swallowed.
        return True
    return not (s2 == s1)
mpm@selenic.com
Update util.py docstrings, fix walk test
r1082 # Platform specific variants
mpm@selenic.com
[PATCH] file seperator handling for the other 'OS'...
r419 if os.name == 'nt':
olivier.maquelin@intel.com
Avoid insertion/deletion of CRs on stdio during hg serve
r1420 demandload(globals(), "msvcrt")
mpm@selenic.com
[PATCH] /dev/null for other OS...
r461 nulldev = 'NUL:'
Vadim Gelfer
eliminate backtrace when piping output on windows....
r1609
class winstdout:
'''stdout on windows misbehaves if sent through a pipe'''
def __init__(self, fp):
self.fp = fp
def __getattr__(self, key):
return getattr(self.fp, key)
def close(self):
try:
self.fp.close()
except: pass
def write(self, s):
try:
return self.fp.write(s)
except IOError, inst:
if inst.errno != 0: raise
self.close()
raise IOError(errno.EPIPE, 'Broken pipe')
Patrick Mezard
stdout raises EINVAL when flush() is called on a closed pipe under win32....
r4129
def flush(self):
try:
return self.fp.flush()
except IOError, inst:
if inst.errno != errno.EINVAL: raise
self.close()
raise IOError(errno.EPIPE, 'Broken pipe')
Vadim Gelfer
eliminate backtrace when piping output on windows....
r1609
sys.stdout = winstdout(sys.stdout)
Vadim Gelfer
fix exception handling on windows....
def system_rcpath():
    '''return the system-wide hgrc search path as a list'''
    try:
        path = system_rcpath_win32()
    except:
        # win32 helper missing or failing: use the hard-coded location
        path = [r'c:\mercurial\mercurial.ini']
    return path
Vadim Gelfer
fix exception handling on windows....
r2054
Vadim Gelfer
add HGRCPATH env var, list of places to look for hgrc files....
def os_rcpath():
    '''return default os-specific hgrc search path

    the system path comes first, then the user's mercurial.ini and,
    if USERPROFILE is set, the mercurial.ini found there.'''
    rcs = system_rcpath()
    rcs.append(user_rcpath())
    profile = os.environ.get('USERPROFILE')
    if profile:
        rcs.append(os.path.join(profile, 'mercurial.ini'))
    return rcs
Bryan O'Sullivan
Use platform-appropriate rc file names.
r1292
Volker Kleinfeld
On win98 os.path.expanuser('~') does not result in a useable directory....
def user_rcpath():
    '''return the path of mercurial.ini in the user's home directory'''
    home = os.path.expanduser('~')
    return os.path.join(home, 'mercurial.ini')
Volker Kleinfeld
On win98 os.path.expanuser('~') does not result in a useable directory....
r2284
Volker Kleinfeld
Make 'hg import' platform independent....
def parse_patch_output(output_line):
    """parses the output produced by patch and returns the file name"""
    # skip the 14-character line prefix (presumably "patching file ")
    pf = output_line[14:]
    # startswith copes with a line that has nothing after the prefix;
    # indexing pf[0] would raise IndexError there
    if pf.startswith('`'):
        pf = pf[1:-1] # Remove the quotes
    return pf
Vadim Gelfer
fix exception handling on windows....
r2054 def testpid(pid):
'''return False if pid dead, True if running or not known'''
return True
Stephen Darnell
Add support for cloning with hardlinks on windows....
r1241
mpm@selenic.com
Permission handling for the other OS...
def is_exec(f, last):
    """return last unchanged: this variant does not look at the file"""
    return last
def set_exec(f, mode):
    """do nothing: this variant does not change the file"""
mpm@selenic.com
Whitespace cleanups...
r515
olivier.maquelin@intel.com
Avoid insertion/deletion of CRs on stdio during hg serve
def set_binary(fd):
    """switch the file object fd to binary mode"""
    fileno = fd.fileno()
    msvcrt.setmode(fileno, os.O_BINARY)
mpm@selenic.com
[PATCH] file seperator handling for the other 'OS'...
def pconvert(path):
    """return path with every backslash turned into a forward slash"""
    return "/".join(path.split("\\"))
mpm@selenic.com
[PATCH] Enables lock work under the other 'OS'...
r422
Bryan O'Sullivan
Fix walk path handling on Windows
def localpath(path):
    """return path with every forward slash turned into a backslash"""
    return '\\'.join(path.split('/'))
def normpath(path):
    """normalize path with os.path.normpath, then apply pconvert"""
    normalized = os.path.normpath(path)
    return pconvert(normalized)
Thomas Arendsen Hein
Make makelock and readlock work on filesystems without symlink support....
r704 makelock = _makelock_file
readlock = _readlock_file
mpm@selenic.com
[PATCH] /dev/null for other OS...
r461
Vadim Gelfer
add util.samestat function for windows....
def samestat(s1, s2):
    """always return False: this variant never reports two stat
    results as the same file"""
    return False
Alexis S. L. Carvalho
Fix util.shellquote on windows.
r4087 # A sequence of backslashes is special iff it precedes a double quote:
# - if there's an even number of backslashes, the double quote is not
# quoted (i.e. it ends the quoted region)
# - if there's an odd number of backslashes, the double quote is quoted
# - in both cases, every pair of backslashes is unquoted into a single
# backslash
# (See http://msdn2.microsoft.com/en-us/library/a1y7w461.aspx )
# So, to quote a string, we must surround it in double quotes, double
# the number of backslashes that precede double quotes and add another
# backslash before every double quote (being careful with the double
# quote we've appended to the end)
# compiled lazily by shellquote on first use
_quotere = None

def shellquote(s):
    """return s wrapped in double quotes, with the backslash runs that
    precede a double quote (or the end of the string) doubled and the
    quote itself backslash-escaped"""
    global _quotere
    quoter = _quotere
    if quoter is None:
        quoter = _quotere = re.compile(r'(\\*)("|\\$)')
    escaped = quoter.sub(r'\1\1\\\2', s)
    return '"%s"' % escaped
Brendan Cully
Add portable shell-quoting function; teach mq to use it.
r2791
thananck@yahoo.com
Provided platform dependent implementations for explain_exit...
def explain_exit(code):
    """return a 2-tuple (desc, code) describing a process's status"""
    desc = _("exited with status %d") % code
    return desc, code
thananck@yahoo.com
Provided platform dependent implementations for explain_exit...
r782
Alexis S. L. Carvalho
Avoid looking up usernames if the current user owns the .hgrc file...
r3677 # if you change this stub into a real check, please try to implement the
# username and groupname functions above, too.
def isowner(fp, st=None):
    """always return True: this stub performs no ownership check"""
    return True
Vadim Gelfer
fix exception handling on windows....
try:
    # override functions with win32 versions if possible
    from util_win32 import *
except ImportError:
    pass
else:
    # the replacement file class is not used on windows 95/98/me
    if not is_win_9x():
        posixfile = posixfile_nt
mpm@selenic.com
[PATCH] file seperator handling for the other 'OS'...
r419 else:
mpm@selenic.com
[PATCH] /dev/null for other OS...
r461 nulldev = '/dev/null'
Vadim Gelfer
make mercurial look in more places for config files....
def rcfiles(path):
    '''return the hgrc candidates below path: path/hgrc followed by
    every *.rc entry of path/hgrc.d (if that directory can be listed)'''
    rcs = [os.path.join(path, 'hgrc')]
    rcdir = os.path.join(path, 'hgrc.d')
    try:
        names = os.listdir(rcdir)
    except OSError:
        # no readable hgrc.d directory: only the plain hgrc is returned
        return rcs
    for name in names:
        if name.endswith(".rc"):
            rcs.append(os.path.join(rcdir, name))
    return rcs
Vadim Gelfer
add HGRCPATH env var, list of places to look for hgrc files....
r1951
def os_rcpath():
    '''return default os-specific hgrc search path

    searched in order: etc/mercurial next to the directory of the
    running script, /etc/mercurial, then ~/.hgrc.'''
    candidates = []
    # old mod_python does not set sys.argv
    argv = getattr(sys, 'argv', [])
    if len(argv) > 0:
        scriptdir = os.path.dirname(sys.argv[0])
        candidates.extend(rcfiles(scriptdir + '/../etc/mercurial'))
    candidates.extend(rcfiles('/etc/mercurial'))
    candidates.append(os.path.expanduser('~/.hgrc'))
    return [os.path.normpath(f) for f in candidates]
Bryan O'Sullivan
Use platform-appropriate rc file names.
r1292
Volker Kleinfeld
Make 'hg import' platform independent....
def parse_patch_output(output_line):
    """parses the output produced by patch and returns the file name"""
    pf = output_line[14:]
    # a name is only unquoted when it is wrapped in single quotes and
    # contains a space
    quoted = pf.startswith("'") and pf.endswith("'") and " " in pf
    if quoted:
        pf = pf[1:-1] # Remove the quotes
    return pf
Volker Kleinfeld
Make 'hg import' platform independent....
r1285
mpm@selenic.com
Permission handling for the other OS...
r441 def is_exec(f, last):
mpm@selenic.com
Update util.py docstrings, fix walk test
r1082 """check whether a file is executable"""
Vadim Gelfer
replace os.stat with os.lstat in some where.
r2448 return (os.lstat(f).st_mode & 0100 != 0)
mpm@selenic.com
Permission handling for the other OS...
r441
def set_exec(f, mode):
Vadim Gelfer
replace os.stat with os.lstat in some where.
r2448 s = os.lstat(f).st_mode
mpm@selenic.com
Permission handling for the other OS...
r441 if (s & 0100 != 0) == mode:
return
if mode:
# Turn on +x for every +r bit when making a file executable
# and obey umask.
umask = os.umask(0)
os.umask(umask)
os.chmod(f, s | (s & 0444) >> 2 & ~umask)
else:
os.chmod(f, s & 0666)
olivier.maquelin@intel.com
Avoid insertion/deletion of CRs on stdio during hg serve
def set_binary(fd):
    """do nothing: this variant leaves the file object untouched"""
mpm@selenic.com
[PATCH] file seperator handling for the other 'OS'...
def pconvert(path):
    """return path unchanged: no conversion is done by this variant"""
    return path
Bryan O'Sullivan
Fix walk path handling on Windows
def localpath(path):
    """return path unchanged: no conversion is done by this variant"""
    return path
normpath = os.path.normpath
Vadim Gelfer
add util.samestat function for windows....
r2193 samestat = os.path.samestat
Bryan O'Sullivan
Fix walk path handling on Windows
r886
mpm@selenic.com
[PATCH] Enables lock work under the other 'OS'...
r422 def makelock(info, pathname):
Thomas Arendsen Hein
Make makelock and readlock work on filesystems without symlink support....
r704 try:
os.symlink(info, pathname)
except OSError, why:
if why.errno == errno.EEXIST:
raise
else:
_makelock_file(info, pathname)
mpm@selenic.com
[PATCH] Enables lock work under the other 'OS'...
r422
def readlock(pathname):
Thomas Arendsen Hein
Make makelock and readlock work on filesystems without symlink support....
r704 try:
return os.readlink(pathname)
except OSError, why:
if why.errno == errno.EINVAL:
return _readlock_file(pathname)
else:
raise
thananck@yahoo.com
Provided platform dependent implementations for explain_exit...
r782
Brendan Cully
Add portable shell-quoting function; teach mq to use it.
def shellquote(s):
    """return s wrapped in single quotes, with each embedded single
    quote replaced by the sequence '\\''"""
    escaped = "'\\''".join(s.split("'"))
    return "'" + escaped + "'"
Vadim Gelfer
change lock format to let us detect and break stale locks....
r1877 def testpid(pid):
'''return False if pid dead, True if running or not sure'''
try:
os.kill(pid, 0)
return True
except OSError, inst:
return inst.errno != errno.ESRCH
thananck@yahoo.com
Provided platform dependent implementations for explain_exit...
def explain_exit(code):
    """return a 2-tuple (desc, code) describing a process's status

    code is a wait-style status word; ValueError is raised when it
    denotes neither an exit, a kill by signal nor a stop."""
    if os.WIFEXITED(code):
        status = os.WEXITSTATUS(code)
        return _("exited with status %d") % status, status
    if os.WIFSIGNALED(code):
        sig = os.WTERMSIG(code)
        return _("killed by signal %d") % sig, sig
    if os.WIFSTOPPED(code):
        sig = os.WSTOPSIG(code)
        return _("stopped by signal %d") % sig, sig
    raise ValueError(_("invalid exit code"))
Eric Hopper
Created a class in util called chunkbuffer that buffers reads from an...
r1199
Alexis S. L. Carvalho
Avoid looking up usernames if the current user owns the .hgrc file...
def isowner(fp, st=None):
    """Return True if the file object fp belongs to the current user.

    The return value of a util.fstat(fp) may be passed as the st
    argument to avoid a second stat.
    """
    if st is None:
        st = fstat(fp)
    return os.getuid() == st.st_uid
Benoit Boissinot
create the encode and decode functions for the store
def _buildencodefun():
    """build and return the (encode, decode) function pair for file names

    encoding works per character: upper case letters and '_' become
    '_' plus the lower case character, control characters, characters
    from 126 up and the windows reserved characters become '~' plus
    two hex digits, everything else is kept as is."""
    e = '_'
    win_reserved = [ord(x) for x in '\\:*?"<>|']
    cmap = {}
    for x in range(127):
        cmap[chr(x)] = chr(x)
    for x in list(range(32)) + list(range(126, 256)) + win_reserved:
        cmap[chr(x)] = "~%02x" % x
    for x in list(range(ord("A"), ord("Z") + 1)) + [ord(e)]:
        cmap[chr(x)] = e + chr(x).lower()
    # reverse table: encoded token (1 to 3 characters) -> original
    dmap = dict([(v, k) for k, v in cmap.items()])

    def decode(s):
        pos, end = 0, len(s)
        while pos < end:
            # try the shortest token first
            for width in (1, 2, 3):
                token = s[pos:pos + width]
                if token in dmap:
                    yield dmap[token]
                    pos += width
                    break
            else:
                # no token matches at this position
                raise KeyError

    return (lambda s: "".join([cmap[c] for c in s]),
            lambda s: "".join(list(decode(s))))

encodefilename, decodefilename = _buildencodefun()
Benoit Boissinot
switch to the .hg/store layout, fix the tests
def encodedopener(openerfn, fn):
    """return an opener that passes the path through fn before handing
    it, with all other arguments untouched, to openerfn"""
    def o(path, *args, **kw):
        encoded = fn(path)
        return openerfn(encoded, *args, **kw)
    return o
Alexis S. L. Carvalho
Avoid looking up usernames if the current user owns the .hgrc file...
r3677
Vadim Gelfer
fix file handling bugs on windows....
r2176 def opener(base, audit=True):
"""
return a function that opens files relative to base
this function is used to hide the details of COW semantics and
remote file access from higher level code.
"""
p = base
audit_p = audit
def mktempcopy(name):
d, fn = os.path.split(name)
Vadim Gelfer
merge with crew.
r2177 fd, temp = tempfile.mkstemp(prefix='.%s-' % fn, dir=d)
Vadim Gelfer
fix file handling bugs on windows....
r2176 os.close(fd)
Vadim Gelfer
reduce memory used by util.opener when making a temp copy of a file.
r2237 ofp = posixfile(temp, "wb")
Vadim Gelfer
fix file handling bugs on windows....
r2176 try:
Vadim Gelfer
add filename to IOError if read of file fails....
r2220 try:
Vadim Gelfer
reduce memory used by util.opener when making a temp copy of a file.
r2237 ifp = posixfile(name, "rb")
Vadim Gelfer
add filename to IOError if read of file fails....
r2220 except IOError, inst:
if not getattr(inst, 'filename', None):
inst.filename = name
raise
Vadim Gelfer
reduce memory used by util.opener when making a temp copy of a file.
r2237 for chunk in filechunkiter(ifp):
ofp.write(chunk)
ifp.close()
ofp.close()
Vadim Gelfer
fix file handling bugs on windows....
r2176 except:
try: os.unlink(temp)
except: pass
raise
st = os.lstat(name)
os.chmod(temp, st.st_mode)
return temp
class atomictempfile(posixfile):
"""the file will only be copied when rename is called"""
def __init__(self, name, mode):
self.__name = name
self.temp = mktempcopy(name)
posixfile.__init__(self, self.temp, mode)
def rename(self):
if not self.closed:
posixfile.close(self)
Thomas Arendsen Hein
Use platform path for renaming file in util.atomictempfile.rename()
r2308 rename(self.temp, localpath(self.__name))
Vadim Gelfer
fix file handling bugs on windows....
r2176 def __del__(self):
if not self.closed:
try:
os.unlink(self.temp)
except: pass
posixfile.close(self)
class atomicfile(atomictempfile):
"""the file will only be copied on close"""
def __init__(self, name, mode):
atomictempfile.__init__(self, name, mode)
def close(self):
self.rename()
def __del__(self):
self.rename()
def o(path, mode="r", text=False, atomic=False, atomictemp=False):
if audit_p:
audit_path(path)
f = os.path.join(p, path)
if not text:
mode += "b" # for that other OS
if mode[0] != "r":
try:
nlink = nlinks(f)
except OSError:
d = os.path.dirname(f)
if not os.path.isdir(d):
os.makedirs(d)
else:
if atomic:
return atomicfile(f, mode)
elif atomictemp:
return atomictempfile(f, mode)
if nlink > 1:
rename(mktempcopy(f), f)
return posixfile(f, mode)
return o
Eric Hopper
Created a class in util called chunkbuffer that buffers reads from an...
r1199 class chunkbuffer(object):
"""Allow arbitrary sized chunks of data to be efficiently read from an
iterator over chunks of arbitrary size."""
Bryan O'Sullivan
Minor cleanups.
r1200
Eric Hopper
Created a class in util called chunkbuffer that buffers reads from an...
r1199 def __init__(self, in_iter, targetsize = 2**16):
"""in_iter is the iterator that's iterating over the input chunks.
targetsize is how big a buffer to try to maintain."""
self.in_iter = iter(in_iter)
self.buf = ''
self.targetsize = int(targetsize)
Bryan O'Sullivan
Minor cleanups.
r1200 if self.targetsize <= 0:
Benoit Boissinot
i18n part2: use '_' for all strings who are part of the user interface
r1402 raise ValueError(_("targetsize must be greater than 0, was %d") %
Bryan O'Sullivan
Minor cleanups.
r1200 targetsize)
Eric Hopper
Created a class in util called chunkbuffer that buffers reads from an...
r1199 self.iterempty = False
Bryan O'Sullivan
Minor cleanups.
r1200
Eric Hopper
Created a class in util called chunkbuffer that buffers reads from an...
r1199 def fillbuf(self):
Bryan O'Sullivan
Minor cleanups.
r1200 """Ignore target size; read every chunk from iterator until empty."""
Eric Hopper
Created a class in util called chunkbuffer that buffers reads from an...
r1199 if not self.iterempty:
collector = cStringIO.StringIO()
collector.write(self.buf)
for ch in self.in_iter:
collector.write(ch)
self.buf = collector.getvalue()
self.iterempty = True
def read(self, l):
Bryan O'Sullivan
Minor cleanups.
r1200 """Read L bytes of data from the iterator of chunks of data.
Thomas Arendsen Hein
Cleanup of tabs and trailing spaces.
r1308 Returns less than L bytes if the iterator runs dry."""
Eric Hopper
Created a class in util called chunkbuffer that buffers reads from an...
r1199 if l > len(self.buf) and not self.iterempty:
# Clamp to a multiple of self.targetsize
targetsize = self.targetsize * ((l // self.targetsize) + 1)
collector = cStringIO.StringIO()
collector.write(self.buf)
collected = len(self.buf)
for chunk in self.in_iter:
collector.write(chunk)
collected += len(chunk)
if collected >= targetsize:
break
if collected < targetsize:
self.iterempty = True
self.buf = collector.getvalue()
Bryan O'Sullivan
Minor cleanups.
r1200 s, self.buf = self.buf[:l], buffer(self.buf, l)
Eric Hopper
Created a class in util called chunkbuffer that buffers reads from an...
r1199 return s
Vadim Gelfer
util: add limit to amount filechunkiter will read
def filechunkiter(f, size=65536, limit=None):
    """Create a generator that produces the data in the file size
    (default 65536) bytes at a time, up to optional limit (default is
    to read all data).  Chunks may be less than size bytes if the
    chunk is the last chunk in the file, or the file is a socket or
    some other type of file that sometimes reads less data than is
    requested."""
    assert size >= 0
    assert limit is None or limit >= 0
    while True:
        nbytes = size
        if limit is not None:
            nbytes = min(limit, size)
        if not nbytes:
            # nothing may be read any more (size or remaining limit is 0)
            break
        s = f.read(nbytes)
        if not s:
            break
        if limit:
            limit -= len(s)
        yield s
Bryan O'Sullivan
Fix up representation of dates in hgweb....
r1320
Bryan O'Sullivan
Clean up date and timezone handling....
def makedate():
    """return the current time as a (unixtime, offset) tuple, offset
    being time.altzone while daylight saving time is in effect and
    time.timezone otherwise"""
    lt = time.localtime()
    tz = time.timezone
    if lt[8] == 1 and time.daylight:
        tz = time.altzone
    return time.mktime(lt), tz
Bryan O'Sullivan
Allow files to be opened in text mode, even on Windows.
r1329
Vadim Gelfer
add changelog style to command line template....
def datestr(date=None, format='%a %b %d %H:%M:%S %Y', timezone=True):
    """represent a (unixtime, offset) tuple as a localized time.
    unixtime is seconds since the epoch, and offset is the time zone's
    number of seconds away from UTC. if timezone is false, do not
    append time zone to string.

    if date is not given, the current time (makedate) is used."""
    t, tz = date or makedate()
    s = time.strftime(format, time.gmtime(float(t) - tz))
    if timezone:
        # format sign, hours and minutes from the absolute offset:
        # floor division of a negative offset rounds the hours the
        # wrong way (UTC-03:30 used to be shown as "-0430")
        if tz > 0:
            sign = "-"
        else:
            sign = "+"
        minutes = abs(tz) // 60
        s += " %s%02d%02d" % (sign, minutes // 60, minutes % 60)
    return s
Vadim Gelfer
hgwebdir: export collections of repos...
r1829
Matt Mackall
Add date matching support...
def strdate(string, format, defaults):
    """parse a localized time string and return a (unixtime, offset) tuple.
    if the string cannot be parsed, ValueError is raised.

    string may end with a "+HHMM" or "-HHMM" zone, "GMT" or "UTC";
    without one the local timezone is assumed.  defaults maps groups
    of strptime directive letters (such as "mb" or "HI") to the value
    to use when format contains none of the directives of the group."""
    def timezone(string):
        """return the offset given by the last word of string, or None
        if that word is not a time zone"""
        words = string.split()
        if not words:
            # nothing to look at: let strptime reject the string
            return None
        tz = words[-1]
        if tz[0] in "+-" and len(tz) == 5 and tz[1:].isdigit():
            # take sign, hours and minutes apart: floor division and
            # modulo on a negative HHMM number give wrong results
            # ("-0330" used to yield 10200 instead of 12600)
            minutes = int(tz[1:3]) * 60 + int(tz[3:5])
            if tz[0] == "+":
                return -60 * minutes
            return 60 * minutes
        if tz == "GMT" or tz == "UTC":
            return 0
        return None

    # NOTE: unixtime = localunixtime + offset
    offset, date = timezone(string), string
    if offset is not None:
        # strip the zone word that was just consumed
        date = " ".join(string.split()[:-1])

    # add missing elements from defaults
    for part in defaults:
        found = [True for p in part if ("%"+p) in format]
        if not found:
            date += "@" + defaults[part]
            format += "@%" + part[0]

    timetuple = time.strptime(date, format)
    localunixtime = int(calendar.timegm(timetuple))
    if offset is None:
        # local timezone
        unixtime = int(time.mktime(timetuple))
        offset = unixtime - localunixtime
    else:
        unixtime = localunixtime + offset
    return unixtime, offset
Jose M. Prieto
Allow the use of human readable dates (issue 251)
r2522
Matt Mackall
Add date matching support...
def parsedate(string, formats=None, defaults=None):
    """parse a localized time string and return a (unixtime, offset) tuple.
    The date may be a "unixtime offset" string or in one of the specified
    formats.

    An empty string yields (0, 0).  formats defaults to
    defaultdateformats; defaults supplies values for date elements
    missing from a format and is completed in place.  Abort is raised
    for dates that cannot be parsed or are out of range."""
    if not string:
        return 0, 0
    if not formats:
        formats = defaultdateformats
    string = string.strip()
    try:
        when, offset = map(int, string.split(' '))
    except ValueError:
        # not "unixtime offset": try the formats, after filling out
        # the defaults
        if not defaults:
            defaults = {}
        now = makedate()
        for part in "d mb yY HI M S".split():
            if part in defaults:
                continue
            lead = part[0]
            if lead in "HMS":
                defaults[part] = "00"
            elif lead in "dm":
                defaults[part] = "1"
            else:
                defaults[part] = datestr(now, "%" + lead, False)

        for format in formats:
            try:
                when, offset = strdate(string, format, defaults)
            except ValueError:
                continue
            break
        else:
            raise Abort(_('invalid date: %r ') % string)
    # validate explicit (probably user-specified) date and
    # time zone offset. values must fit in signed 32 bits for
    # current 32-bit linux runtimes. timezones go from UTC-12
    # to UTC+14
    if abs(when) > 0x7fffffff:
        raise Abort(_('date exceeds 32 bits: %d') % when)
    if offset < -50400 or offset > 43200:
        raise Abort(_('impossible time zone offset: %d') % offset)
    return when, offset
Jose M. Prieto
Allow the use of human readable dates (issue 251)
r2522
Matt Mackall
Add date matching support...
def matchdate(date):
    """Return a function that matches a given date match specifier

    Formats include:

    '{date}' match a given date to the accuracy provided

    '<{date}' on or before a given date

    '>{date}' on or after a given date

    '-{days}' on or after the moment {days} days before now

    '{date} to {date}' from the first date to the second, inclusive

    The returned function takes a unixtime and returns a boolean.
    Abort is raised for a specifier that cannot be parsed.
    """

    def lower(date):
        # earliest moment matching date
        return parsedate(date, extendeddateformats)[0]

    def upper(date):
        # latest moment matching date: missing elements default to
        # their largest value, trying the possible month lengths
        d = dict(mb="12", HI="23", M="59", S="59")
        for days in "31 30 29".split():
            try:
                d["d"] = days
                return parsedate(date, extendeddateformats, d)[0]
            except Abort:
                # parsedate rejects the date with this day of month.
                # Only Abort is caught, so that KeyboardInterrupt and
                # programming errors are not swallowed.
                pass
        d["d"] = "28"
        return parsedate(date, extendeddateformats, d)[0]

    if date[0] == "<":
        when = upper(date[1:])
        return lambda x: x <= when
    elif date[0] == ">":
        when = lower(date[1:])
        return lambda x: x >= when
    elif date[0] == "-":
        try:
            days = int(date[1:])
        except ValueError:
            raise Abort(_("invalid day spec: %s") % date[1:])
        when = makedate()[0] - days * 3600 * 24
        return lambda x: x >= when
    elif " to " in date:
        a, b = date.split(" to ")
        start, stop = lower(a), upper(b)
        return lambda x: x >= start and x <= stop
    else:
        start, stop = lower(date), upper(date)
        return lambda x: x >= start and x <= stop
Vadim Gelfer
move shortuser into util module.
def shortuser(user):
    """Return a short representation of a user name or email address.

    Everything from the first '@' on is dropped, then everything up to
    and including the first '<', and finally everything from the first
    space and from the first '.' on."""
    user = user.split('@', 1)[0]
    user = user.split('<', 1)[-1]
    user = user.split(' ', 1)[0]
    user = user.split('.', 1)[0]
    return user
Vadim Gelfer
merge with crew.
r1920
Thomas Arendsen Hein
Move ellipsis code to util.ellipsis() and improve maxlength handling.
def ellipsis(text, maxlength=400):
    """Trim string to at most maxlength (default: 400) characters.

    A trimmed string ends in "...".  When maxlength is smaller than
    the three dots themselves, only as many dots as fit are returned."""
    if len(text) <= maxlength:
        return text
    if maxlength < 3:
        # text[:maxlength-3] would be a negative slice here and give a
        # result longer than maxlength
        return "..."[:max(maxlength, 0)]
    return "%s..." % (text[:maxlength-3])
Vadim Gelfer
hgwebdir: export collections of repos...
def walkrepos(path):
    '''yield every hg repository under path, recursively.

    a directory counts as a repository when it contains a .hg entry;
    the walk does not descend into a repository that was found.'''
    def errhandler(err):
        # only a failure on the top directory itself is fatal
        if err.filename == path:
            raise err

    for root, dirs, files in os.walk(path, onerror=errhandler):
        if '.hg' in dirs:
            yield root
            dirs[:] = []
Vadim Gelfer
add HGRCPATH env var, list of places to look for hgrc files....
r1951
# search path computed by rcpath() on its first call
_rcpath = None

def rcpath():
    '''return hgrc search path. if env var HGRCPATH is set, use it.
    for each item in path, if directory, use files ending in .rc,
    else use item.
    make HGRCPATH empty to only look in .hg/hgrc of current repo.
    if no HGRCPATH, use default os-specific path.

    the result is computed once and then reused.'''
    global _rcpath
    if _rcpath is not None:
        return _rcpath
    if 'HGRCPATH' not in os.environ:
        _rcpath = os_rcpath()
        return _rcpath
    _rcpath = []
    for p in os.environ['HGRCPATH'].split(os.pathsep):
        if not p:
            continue
        if not os.path.isdir(p):
            _rcpath.append(p)
            continue
        for f in os.listdir(p):
            if f.endswith('.rc'):
                _rcpath.append(os.path.join(p, f))
    return _rcpath
Vadim Gelfer
add support for streaming clone....
r2612
def bytecount(nbytes):
    '''return byte count formatted as readable string, with units'''
    # (multiplier, divisor, format): a row applies when nbytes is at
    # least multiplier * divisor; rows are tried from top to bottom
    units = (
        (100, 1<<30, _('%.0f GB')),
        (10, 1<<30, _('%.1f GB')),
        (1, 1<<30, _('%.2f GB')),
        (100, 1<<20, _('%.0f MB')),
        (10, 1<<20, _('%.1f MB')),
        (1, 1<<20, _('%.2f MB')),
        (100, 1<<10, _('%.0f KB')),
        (10, 1<<10, _('%.1f KB')),
        (1, 1<<10, _('%.2f KB')),
        (1, 1, _('%.0f bytes')),
        )

    for multiplier, divisor, template in units:
        threshold = divisor * multiplier
        if nbytes >= threshold:
            return template % (nbytes / float(divisor))
    # smaller than one byte: use the last row as is
    smallest = units[-1][2]
    return smallest % nbytes
Vadim Gelfer
clean up hg.py: move repo constructor code into each repo module
r2740
def drop_scheme(scheme, path):
    """return path without its leading "scheme:" and, if one follows
    directly, without the "//" after it; a path that does not start
    with "scheme:" is returned unchanged"""
    prefix = scheme + ':'
    if not path.startswith(prefix):
        return path
    rest = path[len(prefix):]
    if rest.startswith('//'):
        rest = rest[2:]
    return rest