##// END OF EJS Templates
util: wrap lines with multi-byte characters correctly (issue2943)...
Mads Kiilerich -
r15065:24a6c3f9 stable
parent child Browse files
Show More
@@ -1,1622 +1,1623
1 1 # util.py - Mercurial utility functions and platform specific implementations
2 2 #
3 3 # Copyright 2005 K. Thananchayan <thananck@yahoo.com>
4 4 # Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
5 5 # Copyright 2006 Vadim Gelfer <vadim.gelfer@gmail.com>
6 6 #
7 7 # This software may be used and distributed according to the terms of the
8 8 # GNU General Public License version 2 or any later version.
9 9
10 10 """Mercurial utility functions and platform specific implementations.
11 11
12 12 This contains helper routines that are independent of the SCM core and
13 13 hide platform-specific details from the core.
14 14 """
15 15
16 16 from i18n import _
17 17 import error, osutil, encoding
18 18 import errno, re, shutil, sys, tempfile, traceback
19 19 import os, time, calendar, textwrap, unicodedata, signal
20 20 import imp, socket, urllib
21 21
22 22 # Python compatibility
23 23
def sha1(s):
    """Return a SHA-1 hash object initialised with the string s.

    The call is forwarded to _fastsha1, which on its first invocation
    rebinds the module-level name sha1 to the real constructor.
    """
    hasher = _fastsha1(s)
    return hasher
26 26
def _fastsha1(s):
    # Self-replacing loader: pick the SHA-1 constructor from hashlib
    # (Python 2.5 and later) or from the older sha module, then rebind
    # both _fastsha1 and sha1 to it so that later calls skip this
    # function entirely.
    global _fastsha1, sha1
    if sys.version_info < (2, 5):
        from sha import sha as _sha1
    else:
        from hashlib import sha1 as _sha1
    sha1 = _sha1
    _fastsha1 = _sha1
    return _sha1(s)
38 38
39 39 import __builtin__
40 40
# Stand-in for the buffer() builtin on interpreters that do not have it.
if sys.version_info[0] < 3:
    def fakebuffer(sliceable, offset=0):
        # return the tail of sliceable starting at offset, by slicing
        return sliceable[offset:]
else:
    def fakebuffer(sliceable, offset=0):
        # same contract, but slice through a memoryview
        return memoryview(sliceable)[offset:]
try:
    # bare name lookup: only checks whether a buffer builtin exists
    buffer
except NameError:
    # no such builtin: publish fakebuffer under that name
    __builtin__.buffer = fakebuffer
51 51
52 52 import subprocess
# value handed to subprocess as close_fds by the helpers below: True only
# when os.name is 'posix'
closefds = os.name == 'posix'
54 54
def popen2(cmd, env=None, newlines=False):
    """Run cmd through the shell and return its (stdin, stdout) pipes.

    env is passed to the child as its environment and newlines is passed
    on as subprocess's universal_newlines flag.
    """
    # Setting bufsize to -1 lets the system decide the buffer size.
    # The default for bufsize is 0, meaning unbuffered. This leads to
    # poor performance on Mac OS X: http://bugs.python.org/issue4194
    popenargs = dict(shell=True, bufsize=-1, close_fds=closefds,
                     stdin=subprocess.PIPE, stdout=subprocess.PIPE,
                     universal_newlines=newlines, env=env)
    proc = subprocess.Popen(cmd, **popenargs)
    return proc.stdin, proc.stdout
65 65
def popen3(cmd, env=None, newlines=False):
    """Run cmd through the shell and return its (stdin, stdout, stderr)
    pipes.

    env is passed to the child as its environment and newlines is passed
    on as subprocess's universal_newlines flag.
    """
    pipe = subprocess.PIPE
    popenargs = dict(shell=True, bufsize=-1, close_fds=closefds,
                     stdin=pipe, stdout=pipe, stderr=pipe,
                     universal_newlines=newlines, env=env)
    proc = subprocess.Popen(cmd, **popenargs)
    return proc.stdin, proc.stdout, proc.stderr
74 74
def version():
    """Return the version string from the __version__ module, or
    'unknown' when that module cannot be imported."""
    try:
        import __version__
    except ImportError:
        return 'unknown'
    return __version__.version
82 82
# used by parsedate
# strptime-style formats; parsedate tries its format list in order and
# keeps the first one that parses
defaultdateformats = (
    '%Y-%m-%d %H:%M:%S',
    '%Y-%m-%d %I:%M:%S%p',
    '%Y-%m-%d %H:%M',
    '%Y-%m-%d %I:%M%p',
    '%Y-%m-%d',
    '%m-%d',
    '%m/%d',
    '%m/%d/%y',
    '%m/%d/%Y',
    '%a %b %d %H:%M:%S %Y',
    '%a %b %d %I:%M:%S%p %Y',
    '%a, %d %b %Y %H:%M:%S', # GNU coreutils "/bin/date --rfc-2822"
    '%b %d %H:%M:%S %Y',
    '%b %d %I:%M:%S%p %Y',
    '%b %d %H:%M:%S',
    '%b %d %I:%M:%S%p',
    '%b %d %H:%M',
    '%b %d %I:%M%p',
    '%b %d %Y',
    '%b %d',
    '%H:%M:%S',
    '%I:%M:%S%p',
    '%H:%M',
    '%I:%M%p',
    )

# the default formats plus coarser year/month-only forms; passed to
# parsedate by matchdate
extendeddateformats = defaultdateformats + (
    "%Y",
    "%Y-%m",
    "%b",
    "%b %Y",
    )
117 117
def cachefunc(func):
    '''return a wrapper around func that remembers every result

    Results are keyed on the positional arguments and kept for as long as
    the wrapper lives.'''
    # XXX doesn't handle keywords args
    memo = {}
    if func.func_code.co_argcount != 1:
        def f(*args):
            if args in memo:
                return memo[args]
            memo[args] = func(*args)
            return memo[args]
    else:
        # we gain a small amount of time because
        # we don't need to pack/unpack the list
        def f(arg):
            if arg in memo:
                return memo[arg]
            memo[arg] = func(arg)
            return memo[arg]

    return f
136 136
def lrucachefunc(func):
    '''return a wrapper around func that remembers recent results

    order lists the cached keys from least to most recently used; when a
    new key arrives and the cache already holds more than 20 entries, the
    least recently used one is dropped first.'''
    cache = {}
    order = []
    if func.func_code.co_argcount != 1:
        def f(*args):
            if args in cache:
                # hit: take the key out so it can be re-added as newest
                order.remove(args)
            else:
                if len(cache) > 20:
                    del cache[order.pop(0)]
                cache[args] = func(*args)
            order.append(args)
            return cache[args]
    else:
        def f(arg):
            if arg in cache:
                # hit: take the key out so it can be re-added as newest
                order.remove(arg)
            else:
                if len(cache) > 20:
                    del cache[order.pop(0)]
                cache[arg] = func(arg)
            order.append(arg)
            return cache[arg]

    return f
163 163
class propertycache(object):
    """Descriptor that computes an attribute once per instance.

    On access it calls the wrapped function with the instance and stores
    the result on the instance under the function's name.
    """
    def __init__(self, func):
        self.func = func
        self.name = func.__name__

    def __get__(self, obj, type=None):
        value = self.func(obj)
        # store on the instance under the same name as the wrapped function
        setattr(obj, self.name, value)
        return value
172 172
def pipefilter(s, cmd):
    '''feed string S to the shell command CMD on stdin and return what
    the command writes to stdout'''
    proc = subprocess.Popen(cmd, shell=True, close_fds=closefds,
                            stdin=subprocess.PIPE, stdout=subprocess.PIPE)
    # communicate() returns (stdout, stderr); only stdout is wanted
    return proc.communicate(s)[0]
179 179
def tempfilter(s, cmd):
    '''filter string S through CMD using two temporary files.

    S is written to one temporary file and a second, empty one is
    created; every INFILE and OUTFILE in CMD is replaced by the
    respective file name before the command is run with os.system.  The
    contents of the output file are returned.  Abort is raised when the
    command reports failure.  Both files are removed afterwards.'''
    inname = None
    outname = None
    try:
        infd, inname = tempfile.mkstemp(prefix='hg-filter-in-')
        infp = os.fdopen(infd, 'wb')
        infp.write(s)
        infp.close()
        outfd, outname = tempfile.mkstemp(prefix='hg-filter-out-')
        os.close(outfd)
        cmd = cmd.replace('INFILE', inname).replace('OUTFILE', outname)
        code = os.system(cmd)
        # on OpenVMS a status with the low bit set is treated as success
        if sys.platform == 'OpenVMS' and code & 1:
            code = 0
        if code:
            raise Abort(_("command '%s' failed: %s") %
                        (cmd, explainexit(code)))
        outfp = open(outname, 'rb')
        data = outfp.read()
        outfp.close()
        return data
    finally:
        # best-effort removal of whichever temporary files were created
        for tmpname in (inname, outname):
            try:
                if tmpname:
                    os.unlink(tmpname)
            except OSError:
                pass
216 216
# command prefixes recognised by filter(), mapped to the function that
# runs the remainder of the command
filtertable = {
    'tempfile:': tempfilter,
    'pipe:': pipefilter,
    }
221 221
def filter(s, cmd):
    """Run string s through the filter command cmd and return the result.

    When cmd starts with one of the prefixes in filtertable, the prefix
    and any whitespace following it are removed and the matching function
    is used; otherwise cmd is passed to pipefilter unchanged.
    """
    for prefix in filtertable:
        if cmd.startswith(prefix):
            handler = filtertable[prefix]
            return handler(s, cmd[len(prefix):].lstrip())
    return pipefilter(s, cmd)
228 228
def binary(s):
    """Return True if s is non-empty and contains a NUL character,
    False otherwise."""
    if not s:
        return False
    return '\0' in s
232 232
def increasingchunks(source, min=1024, max=65536):
    '''regroup the chunks of source into progressively larger chunks

    Input chunks are accumulated until at least min bytes are pending and
    are then yielded joined together.  After each yield min is doubled,
    or raised to the largest power of two not above the size just
    yielded if that is bigger, but never beyond max.  Whatever is left
    when source runs out is yielded as a final, possibly shorter,
    chunk.'''
    def log2(x):
        # position of the highest set bit of x; 0 when x is 0
        bits = 0
        while x:
            x >>= 1
            bits += 1
        if not bits:
            return 0
        return bits - 1

    pending = []
    pendinglen = 0
    for chunk in source:
        pending.append(chunk)
        pendinglen += len(chunk)
        if pendinglen < min:
            continue
        if min < max:
            min <<= 1
            floor = 1 << log2(pendinglen)
            if floor > min:
                min = floor
            if min > max:
                min = max
        yield ''.join(pending)
        pending = []
        pendinglen = 0
    if pending:
        yield ''.join(pending)
263 263
# local alias so code in this module can simply raise Abort
Abort = error.Abort
265 265
def always(fn):
    """Return True regardless of fn."""
    return True
268 268
def never(fn):
    """Return False regardless of fn."""
    return False
271 271
def pathto(root, n1, n2):
    '''return the relative path leading from n1 to n2.

    root and n1 use os.sep to separate directories, n2 uses "/".  The
    result is os.sep-separated.

    A relative n1 is taken to be relative to root, and n2 must always be
    relative to root.  An empty n1 yields n2 converted with localpath.
    When n1 is absolute and on a different drive than root, n2 is
    returned joined onto root instead of a relative path.
    '''
    if not n1:
        return localpath(n2)
    if os.path.isabs(n1):
        rootdrive = os.path.splitdrive(root)[0]
        if rootdrive != os.path.splitdrive(n1)[0]:
            return os.path.join(root, localpath(n2))
        n2 = '/'.join((pconvert(root), n2))
    src = splitpath(n1)
    dst = n2.split('/')
    # skip over the leading components both paths have in common
    common = 0
    limit = min(len(src), len(dst))
    while common < limit and src[common] == dst[common]:
        common += 1
    # climb out of what is left of n1, then descend into the rest of n2
    climb = ['..'] * (len(src) - common)
    return os.sep.join(climb + dst[common:]) or '.'
297 297
# location of the 'hg' executable; None until hgexecutable() works it out
# or _sethgexecutable() is called
_hgexecutable = None
299 299
def mainfrozen():
    """return True if we are a frozen executable.

    The code supports py2exe (most common, Windows only) and tools/freeze
    (portable, not much used).
    """
    # sys.frozen is set by new py2exe, sys.importers by old py2exe
    if hasattr(sys, "frozen") or hasattr(sys, "importers"):
        return True
    # tools/freeze
    return imp.is_frozen("__main__")
309 309
def hgexecutable():
    """return location of the 'hg' executable.

    The answer is worked out once and remembered.  $HG wins if set; a
    frozen executable uses sys.executable; otherwise 'hg' is looked up
    with findexe, falling back to the base name of sys.argv[0].
    """
    if _hgexecutable is not None:
        return _hgexecutable
    fromenv = os.environ.get('HG')
    if fromenv:
        _sethgexecutable(fromenv)
    elif mainfrozen():
        _sethgexecutable(sys.executable)
    else:
        _sethgexecutable(findexe('hg') or os.path.basename(sys.argv[0]))
    return _hgexecutable
325 325
def _sethgexecutable(path):
    """set location of the 'hg' executable"""
    # rebinds the module-level value that hgexecutable() returns
    global _hgexecutable
    _hgexecutable = path
330 330
def system(cmd, environ={}, cwd=None, onerr=None, errprefix=None, out=None):
    '''run a shell command with an adjusted environment and directory.

    The child gets a copy of os.environ updated with the entries of
    environ (values converted for the shell) and with HG set to the hg
    executable; cwd, if given, is its working directory.

    The exit status is returned.  When the command fails and onerr is
    given, an error message is passed to onerr.warn() if onerr has such
    a method (a ui object); otherwise onerr is called with the message
    and the result is raised as an exception.

    if out is specified, it is assumed to be a file-like object that has a
    write() method. stdout and stderr will be redirected to out.'''
    try:
        sys.stdout.flush()
    except Exception:
        pass

    def py2shell(val):
        'convert python object into string that is useful to shell'
        if val is True:
            return '1'
        if val is None or val is False:
            return '0'
        return str(val)

    origcmd = cmd
    cmd = quotecommand(cmd)
    env = dict(os.environ)
    for key, val in environ.iteritems():
        env[key] = py2shell(val)
    env['HG'] = hgexecutable()
    if out is None or out == sys.__stdout__:
        rc = subprocess.call(cmd, shell=True, close_fds=closefds,
                             env=env, cwd=cwd)
    else:
        # relay the child's combined stdout/stderr to out line by line
        proc = subprocess.Popen(cmd, shell=True, close_fds=closefds,
                                env=env, cwd=cwd, stdout=subprocess.PIPE,
                                stderr=subprocess.STDOUT)
        for line in proc.stdout:
            out.write(line)
        proc.wait()
        rc = proc.returncode
    # on OpenVMS a status with the low bit set is treated as success
    if sys.platform == 'OpenVMS' and rc & 1:
        rc = 0
    if not (rc and onerr):
        return rc
    progname = os.path.basename(origcmd.split(None, 1)[0])
    errmsg = '%s %s' % (progname, explainexit(rc)[0])
    if errprefix:
        errmsg = '%s: %s' % (errprefix, errmsg)
    try:
        onerr.warn(errmsg + '\n')
    except AttributeError:
        raise onerr(errmsg)
    return rc
380 380
def checksignature(func):
    '''wrap func so that calling it with wrong arguments is reported as
    error.SignatureError instead of a plain TypeError'''
    def check(*args, **kwargs):
        try:
            return func(*args, **kwargs)
        except TypeError:
            # a traceback with a single entry means the TypeError came
            # from the call made here, not from code inside func
            depth = len(traceback.extract_tb(sys.exc_info()[2]))
            if depth != 1:
                raise
            raise error.SignatureError

    return check
392 392
def makedir(path, notindexed):
    """Create the directory path with os.mkdir.

    notindexed is accepted but not used by this implementation.
    """
    os.mkdir(path)
395 395
def unlinkpath(f):
    """Remove the file f, then prune any parent directories that this
    left empty."""
    parent = os.path.dirname(f)
    os.unlink(f)
    # removedirs stops with OSError at the first directory it cannot
    # remove, which is the expected way for the pruning to end
    try:
        os.removedirs(parent)
    except OSError:
        pass
404 404
def copyfile(src, dest):
    """Copy the file src to dest, preserving its permission bits.

    A symlink is recreated at dest with the same target, replacing
    whatever was at dest, rather than having its target copied.
    shutil.Error raised during a regular copy is turned into Abort.
    """
    if not os.path.islink(src):
        try:
            shutil.copyfile(src, dest)
            shutil.copymode(src, dest)
        except shutil.Error:
            raise Abort(str(sys.exc_info()[1]))
        return
    # make room for the new link; a missing dest is fine
    try:
        os.unlink(dest)
    except OSError:
        pass
    os.symlink(os.readlink(src), dest)
419 419
def copyfiles(src, dst, hardlink=None):
    """Copy a file or directory tree, using hardlinks if possible.

    When hardlink is None, linking is attempted if src and the directory
    that will hold dst are on the same device.  Once a link attempt
    fails, the remaining files are copied.

    Returns (hardlink, num): whether hardlinking was still in effect at
    the end, and the number of files handled.
    """
    if hardlink is None:
        hardlink = (os.stat(src).st_dev ==
                    os.stat(os.path.dirname(dst)).st_dev)

    if not os.path.isdir(src):
        if hardlink:
            try:
                oslink(src, dst)
            except (IOError, OSError):
                hardlink = False
                shutil.copy(src, dst)
        else:
            shutil.copy(src, dst)
        return hardlink, 1

    os.mkdir(dst)
    total = 0
    for name, kind in osutil.listdir(src):
        hardlink, copied = copyfiles(os.path.join(src, name),
                                     os.path.join(dst, name), hardlink)
        total += copied
    return hardlink, total
447 447
_winreservednames = '''con prn aux nul
    com1 com2 com3 com4 com5 com6 com7 com8 com9
    lpt1 lpt2 lpt3 lpt4 lpt5 lpt6 lpt7 lpt8 lpt9'''.split()
_winreservedchars = ':*?"<>|'
def checkwinfilename(path):
    '''Check that the base-relative path is a valid filename on Windows.
    Returns None if the path is ok, or a UI string describing the problem.

    >>> checkwinfilename("just/a/normal/path")
    >>> checkwinfilename("foo/bar/con.xml")
    "filename contains 'con', which is reserved on Windows"
    >>> checkwinfilename("foo/con.xml/bar")
    "filename contains 'con', which is reserved on Windows"
    >>> checkwinfilename("foo/bar/xml.con")
    >>> checkwinfilename("foo/bar/AUX/bla.txt")
    "filename contains 'AUX', which is reserved on Windows"
    >>> checkwinfilename("foo/bar/bla:.txt")
    "filename contains ':', which is reserved on Windows"
    >>> checkwinfilename("foo/bar/b\07la.txt")
    "filename contains '\\\\x07', which is invalid on Windows"
    >>> checkwinfilename("foo/bar/bla ")
    "filename ends with ' ', which is not allowed on Windows"
    '''
    # both kinds of slash separate components; empty components are skipped
    for name in path.replace('\\', '/').split('/'):
        if not name:
            continue
        for char in name:
            if char in _winreservedchars:
                return _("filename contains '%s', which is reserved "
                         "on Windows") % char
            # control characters
            if ord(char) < 32:
                return _("filename contains %r, which is invalid "
                         "on Windows") % char
        # only the part before the first dot is compared with the
        # reserved names
        stem = name.split('.', 1)[0]
        if stem and stem.lower() in _winreservednames:
            return _("filename contains '%s', which is reserved "
                     "on Windows") % stem
        last = name[-1]
        if last == '.' or last == ' ':
            return _("filename ends with '%s', which is not allowed "
                     "on Windows") % last
489 489
def lookupreg(key, name=None, scope=None):
    """Default implementation: ignore all arguments and return None.

    NOTE(review): presumably replaced by the 'from windows import *'
    further down on Windows -- confirm.
    """
    return None
492 492
def hidewindow():
    """Hide current shell window.

    Used to hide the window opened when starting asynchronous
    child process under Windows, unneeded on other systems.
    """
    # this implementation does nothing
    pass
500 500
# Pull in the platform-specific module.  A star import can rebind names
# that were defined above this point.
if os.name == 'nt':
    # on Windows the OS filename check is the Windows filename check
    checkosfilename = checkwinfilename
    from windows import *
else:
    from posix import *
506 506
def makelock(info, pathname):
    """Create the lock pathname carrying the string info.

    The lock is a symlink whose target is info.  If symlinks are not
    available, or creating one fails for a reason other than the lock
    already existing, a regular file containing info is created
    exclusively instead.

    Raises OSError if the lock already exists.
    """
    try:
        return os.symlink(info, pathname)
    except OSError:
        # an existing lock is the caller's problem; anything else falls
        # through to the regular-file fallback
        if sys.exc_info()[1].errno == errno.EEXIST:
            raise
    except AttributeError: # no symlink in os
        pass

    ld = os.open(pathname, os.O_CREAT | os.O_WRONLY | os.O_EXCL)
    try:
        os.write(ld, info)
    finally:
        # do not leak the descriptor when the write fails
        os.close(ld)
519 519
def readlock(pathname):
    """Return the info string stored in the lock pathname.

    The lock is read as a symlink target first.  If symlinks are not
    available, or readlink fails with EINVAL or ENOSYS, the lock is read
    as a regular file instead.  Any other OSError is propagated.
    """
    try:
        return os.readlink(pathname)
    except OSError:
        if sys.exc_info()[1].errno not in (errno.EINVAL, errno.ENOSYS):
            raise
    except AttributeError: # no symlink in os
        pass
    fp = posixfile(pathname)
    try:
        return fp.read()
    finally:
        # close the file even when reading fails
        fp.close()
532 532
def fstat(fp):
    '''return stat information for a file object, going through its name
    when it has no usable fileno method.'''
    try:
        fd = fp.fileno()
    except AttributeError:
        return os.stat(fp.name)
    return os.fstat(fd)
539 539
540 540 # File system features
541 541
def checkcase(path):
    """
    Return True if path is on a case-sensitive filesystem, else False

    The final component of path is case-flipped and stat'ed again; only
    when that yields the same stat result as path itself is the
    filesystem reported as case-insensitive.  path must therefore exist
    and end in a component that changes under case folding (like
    /foo/.hg).
    """
    original = os.stat(path)
    parent, base = os.path.split(path)
    flipped = os.path.join(parent, base.upper())
    if flipped == path:
        flipped = os.path.join(parent, base.lower())
    try:
        other = os.stat(flipped)
    except OSError:
        # the other spelling does not exist
        return True
    return not (other == original)
561 561
# directory path -> os.listdir() result, filled in by fspath
_fspathcache = {}
def fspath(name, root):
    '''Get name in the case stored in the filesystem

    The name is either relative to root, or it is an absolute path starting
    with root. Note that this function is unnecessary, and should not be
    called, for case-sensitive filesystems (simply because it's expensive).

    Returns None if name does not exist below root.  Otherwise returns
    name, relative to root, with every component spelled the way the
    directory listing reports it and the separators kept as given.  A
    name equal to root yields the empty string.
    '''
    # If name is absolute, make it relative
    if name.lower().startswith(root.lower()):
        l = len(root)
        # name may be exactly root, in which case there is no name[l]
        if l < len(name) and name[l] in (os.sep, os.altsep):
            l = l + 1
        name = name[l:]

    if not os.path.lexists(os.path.join(root, name)):
        return None

    seps = os.sep
    if os.altsep:
        seps = seps + os.altsep
    # Protect backslashes. This gets silly very quickly.
    # str.replace returns a new string; without keeping the result the
    # backslash ends up unescaped inside the character class below
    seps = seps.replace('\\', '\\\\')
    pattern = re.compile(r'([^%s]+)|([%s]+)' % (seps, seps))
    dir = os.path.normcase(os.path.normpath(root))
    result = []
    for part, sep in pattern.findall(name):
        if sep:
            result.append(sep)
            continue

        if dir not in _fspathcache:
            _fspathcache[dir] = os.listdir(dir)
        contents = _fspathcache[dir]

        lpart = part.lower()
        lenp = len(part)
        for n in contents:
            if lenp == len(n) and n.lower() == lpart:
                result.append(n)
                break
        else:
            # Cannot happen, as the file exists!
            result.append(part)
        dir = os.path.join(dir, lpart)

    return ''.join(result)
609 609
def checknlink(testfile):
    '''check whether hardlink count reporting works properly

    Two scratch files named after testfile are created, the second as a
    hardlink to the first, and the link count reported for it is
    checked.  Returns False when the scratch files cannot be set up.'''

    # testfile may be open, so we need a separate file for checking to
    # work around issue2543 (or testfile may get lost on Samba shares)
    probe = testfile + ".hgtmp1"
    if os.path.lexists(probe):
        return False
    try:
        posixfile(probe, 'w').close()
    except IOError:
        return False

    link = testfile + ".hgtmp2"
    opened = None
    try:
        try:
            oslink(probe, link)
        except OSError:
            return False

        # nlinks() may behave differently for files on Windows shares if
        # the file is open.
        opened = posixfile(link)
        counted = nlinks(link)
        return counted > 1
    finally:
        if opened is not None:
            opened.close()
        # best-effort removal of both scratch files
        for scratch in (probe, link):
            try:
                os.unlink(scratch)
            except OSError:
                pass
645 645
def endswithsep(path):
    '''Tell whether path ends with os.sep or, where the platform defines
    one, with os.altsep.'''
    if path.endswith(os.sep):
        return True
    return os.altsep and path.endswith(os.altsep)
649 649
def splitpath(path):
    '''Return the list of components of path, split at os.sep.

    os.altsep is deliberately not considered: this is meant as a plain
    replacement for "xxx.split(os.sep)".  Run the path through
    os.path.normpath() first if that matters.'''
    separator = os.sep
    return path.split(separator)
657 657
def gui():
    '''Are we running in a GUI?

    Outside Mac OS X the answer is true on Windows and otherwise the
    value of $DISPLAY (None when unset).'''
    if sys.platform != 'darwin':
        return os.name == "nt" or os.environ.get("DISPLAY")
    if 'SSH_CONNECTION' in os.environ:
        # handle SSH access to a box where the user is logged in
        return False
    if getattr(osutil, 'isgui', None):
        # check if a CoreGraphics session is available
        return osutil.isgui()
    # pure build; use a safe default
    return True
672 672
def mktempcopy(name, emptyok=False, createmode=None):
    """Create a temporary file with the same contents from name

    The temporary file is created in the same directory as name.

    The permission bits are copied from the original file.  If name does
    not exist, createmode (or the complement of umask when createmode is
    None) is used instead, restricted to the read/write bits.

    If the temporary file is going to be truncated immediately, you
    can use emptyok=True as an optimization.

    Returns the name of the temporary file.
    """
    d, fn = os.path.split(name)
    fd, temp = tempfile.mkstemp(prefix='.%s-' % fn, dir=d)
    os.close(fd)
    # Temporary files are created with mode 0600, which is usually not
    # what we want.  If the original file already exists, just copy
    # its mode.  Otherwise, manually obey umask.
    try:
        st_mode = os.lstat(name).st_mode & 0777
    except OSError, inst:
        # only a missing original is acceptable here
        if inst.errno != errno.ENOENT:
            raise
        st_mode = createmode
        if st_mode is None:
            st_mode = ~umask
        st_mode &= 0666
    os.chmod(temp, st_mode)
    if emptyok:
        # caller does not need the contents
        return temp
    try:
        try:
            ifp = posixfile(name, "rb")
        except IOError, inst:
            # nothing to copy: the empty temporary file is the result
            if inst.errno == errno.ENOENT:
                return temp
            # make sure the error names the file that could not be read
            if not getattr(inst, 'filename', None):
                inst.filename = name
            raise
        ofp = posixfile(temp, "wb")
        for chunk in filechunkiter(ifp):
            ofp.write(chunk)
        ifp.close()
        ofp.close()
    except:
        # whatever went wrong, do not leave the temporary file behind;
        # the original exception is re-raised
        try: os.unlink(temp)
        except: pass
        raise
    return temp
720 720
class atomictempfile(object):
    '''writeable file object whose contents replace a file atomically

    Everything is written to a temporary copy of the original file made
    with mktempcopy.  Calling rename() closes the copy and renames it
    over the original name, which is what makes the writes visible.

    Unlike other file-like objects, close() discards your writes by
    simply deleting the temporary file.
    '''
    def __init__(self, name, mode='w+b', createmode=None):
        self.__name = name # permanent name
        # with 'w' in the mode the old contents need not be copied
        truncating = 'w' in mode
        self._tempname = mktempcopy(name, emptyok=truncating,
                                    createmode=createmode)
        self._fp = posixfile(self._tempname, mode)

        # delegated methods
        self.write = self._fp.write
        self.fileno = self._fp.fileno

    def rename(self):
        fp = self._fp
        if not fp.closed:
            fp.close()
        rename(self._tempname, localpath(self.__name))

    def close(self):
        if self._fp.closed:
            return
        # drop the temporary file; failing to remove it is not an error
        try:
            os.unlink(self._tempname)
        except OSError:
            pass
        self._fp.close()

    def __del__(self):
        if hasattr(self, '_fp'): # constructor actually did something
            self.close()
757 757
def makedirs(name, mode=None):
    """Create the directory name along with any missing parents.

    Each directory that gets created is chmod'ed to mode when mode is
    not None.  An already existing name is not an error.
    """
    parent = os.path.abspath(os.path.dirname(name))
    try:
        os.mkdir(name)
        if mode is not None:
            os.chmod(name, mode)
    except OSError:
        code = sys.exc_info()[1].errno
        if code == errno.EEXIST:
            return
        # only a missing parent can be cured by recursing, and only if
        # there is a parent left to create
        if not name or parent == name or code != errno.ENOENT:
            raise
    else:
        return
    makedirs(parent, mode)
    makedirs(name, mode)
773 773
def readfile(path):
    """Return the entire contents of the file at path, read in binary
    mode."""
    handle = open(path, 'rb')
    try:
        data = handle.read()
    finally:
        handle.close()
    return data
780 780
def writefile(path, text):
    """Write text to the file at path in binary mode, replacing any
    previous contents."""
    handle = open(path, 'wb')
    try:
        handle.write(text)
    finally:
        handle.close()
787 787
def appendfile(path, text):
    """Append text to the file at path in binary mode."""
    handle = open(path, 'ab')
    try:
        handle.write(text)
    finally:
        handle.close()
794 794
class chunkbuffer(object):
    """Read arbitrarily sized pieces of data from an iterator that
    produces chunks of arbitrary size."""

    def __init__(self, in_iter):
        """in_iter is the iterator over the input chunks.

        Chunks longer than 2**20 are handed on in slices of 2**18."""
        def splitbig(chunks):
            for chunk in chunks:
                if len(chunk) > 2**20:
                    for pos in range(0, len(chunk), 2**18):
                        yield chunk[pos:pos + 2**18]
                else:
                    yield chunk
        self.iter = splitbig(in_iter)
        self._queue = []

    def read(self, l):
        """Read L bytes of data from the iterator of chunks of data.
        Returns less than L bytes if the iterator runs dry."""
        pending = self._queue
        data = ''
        remaining = l
        while remaining > 0:
            if not pending:
                # refill the queue with about 2**18 bytes worth of chunks
                target = 2**18
                for chunk in self.iter:
                    pending.append(chunk)
                    target -= len(chunk)
                    if target <= 0:
                        break
                if not pending:
                    # the iterator ran dry
                    break

            piece = pending.pop(0)
            if len(piece) > remaining:
                # take what is needed, put the rest back at the front
                pending.insert(0, piece[remaining:])
                piece = piece[:remaining]
            data += piece
            remaining -= len(piece)

        return data
842 842
def filechunkiter(f, size=65536, limit=None):
    """Generate the data of file f in pieces of at most size bytes
    (default 65536).

    With limit given, no more than limit bytes are produced in total;
    otherwise everything is read.  A piece may be shorter than size when
    it is the last one, or when f is a socket or some other kind of file
    that sometimes returns less data than requested."""
    assert size >= 0
    assert limit is None or limit >= 0
    while True:
        nbytes = size
        if limit is not None:
            nbytes = min(limit, size)
        if not nbytes:
            # nothing left to ask for
            break
        s = f.read(nbytes)
        if not s:
            break
        if limit:
            limit -= len(s)
        yield s
863 863
def makedate():
    """Return the current time as a (unixtime, offset) tuple.

    offset is time.altzone while daylight saving time is in effect and
    time.timezone otherwise.  Abort is raised if the clock yields a
    negative timestamp.
    """
    now = time.localtime()
    if now.tm_isdst == 1 and time.daylight:
        tz = time.altzone
    else:
        tz = time.timezone
    t = time.mktime(now)
    if t < 0:
        hint = _("check your clock")
        raise Abort(_("negative timestamp: %d") % t, hint=hint)
    return t, tz
875 875
def datestr(date=None, format='%a %b %d %H:%M:%S %Y %1%2'):
    """represent a (unixtime, offset) tuple as a localized time.
    unixtime is seconds since the epoch, and offset is the time zone's
    number of seconds away from UTC.  The current time is used when date
    is not given.

    format is a strftime format with two extra placeholders: %1 expands
    to the sign and hours of the time zone, %2 to its minutes.  A
    negative unixtime is rendered as the epoch in UTC."""
    t, tz = date or makedate()
    if t < 0:
        # time.gmtime(lt) fails on Windows for lt < -43200
        t, tz = 0, 0
    if "%1" in format or "%2" in format:
        # offset is seconds west of UTC, so a positive value prints as "-"
        if tz > 0:
            sign = "-"
        else:
            sign = "+"
        hours, minutes = divmod(abs(tz) // 60, 60)
        format = format.replace("%1", "%c%02d" % (sign, hours))
        format = format.replace("%2", "%02d" % minutes)
    return time.strftime(format, time.gmtime(float(t) - tz))
892 892
def shortdate(date=None):
    """turn (timestamp, tzoff) tuple into an ISO 8601 date (YYYY-MM-DD)."""
    return datestr(date, format='%Y-%m-%d')
896 896
def strdate(string, format, defaults=[]):
    """parse a localized time string and return a (unixtime, offset) tuple.
    if the string cannot be parsed, ValueError is raised.

    A trailing "+HHMM"/"-HHMM", "GMT" or "UTC" is taken as the time zone;
    without one the local time zone is used.  For every kind of field
    missing from format, a value is taken from defaults, which maps each
    field group ("S", "M", "HI", "d", "mb", "yY") to a pair: the first
    entry is used while no more specific field has been found in format,
    the second one afterwards."""
    def parsetz(text):
        # offset in seconds for the last word of text, None if that word
        # is not a time zone
        tz = text.split()[-1]
        if tz[0] in "+-" and len(tz) == 5 and tz[1:].isdigit():
            if tz[0] == "+":
                sign = 1
            else:
                sign = -1
            hours = int(tz[1:3])
            minutes = int(tz[3:5])
            return -sign * (hours * 60 + minutes) * 60
        if tz in ("GMT", "UTC"):
            return 0
        return None

    # NOTE: unixtime = localunixtime + offset
    offset = parsetz(string)
    date = string
    if offset is not None:
        # drop the time zone word
        date = " ".join(string.split()[:-1])

    # add missing elements from defaults
    usenow = False # default to using biased defaults
    for part in ("S", "M", "HI", "d", "mb", "yY"): # decreasing specificity
        present = False
        for code in part:
            if ("%" + code) in format:
                present = True
                break
        if present:
            # We've found a specific time element, less specific time
            # elements are relative to today
            usenow = True
        else:
            date += "@" + defaults[part][usenow]
            format += "@%" + part[0]

    timetuple = time.strptime(date, format)
    localunixtime = int(calendar.timegm(timetuple))
    if offset is not None:
        return localunixtime + offset, offset
    # local timezone
    unixtime = int(time.mktime(timetuple))
    return unixtime, unixtime - localunixtime
937 937
def parsedate(date, formats=None, bias={}):
    """parse a localized date/time and return a (unixtime, offset) tuple.

    The date may be a "unixtime offset" string or in one of the specified
    formats (defaultdateformats when none are given).  If the date already
    is a (unixtime, offset) tuple, it is returned unchanged, and an empty
    date yields (0, 0).

    bias maps field groups ("d", "mb", "yY", "HI", "M", "S") to the value
    to assume for a field missing from the date.  Abort is raised when
    the date cannot be parsed or the result is out of range.
    """
    if not date:
        return 0, 0
    if isinstance(date, tuple) and len(date) == 2:
        return date
    if not formats:
        formats = defaultdateformats
    date = date.strip()
    try:
        when, offset = [int(field) for field in date.split(' ')]
    except ValueError:
        # fill out defaults
        now = makedate()
        defaults = {}
        for part in ("d", "mb", "yY", "HI", "M", "S"):
            # this piece is for rounding the specific end of unknowns
            biased = bias.get(part)
            if biased is None:
                if part[0] in "HMS":
                    biased = "00"
                else:
                    biased = "0"

            # this piece is for matching the generic end to today's date
            today = datestr(now, "%" + part[0])

            defaults[part] = (biased, today)

        for format in formats:
            try:
                when, offset = strdate(date, format, defaults)
            except (ValueError, OverflowError):
                continue
            break
        else:
            raise Abort(_('invalid date: %r') % date)
    # validate explicit (probably user-specified) date and
    # time zone offset. values must fit in signed 32 bits for
    # current 32-bit linux runtimes. timezones go from UTC-12
    # to UTC+14
    if abs(when) > 0x7fffffff:
        raise Abort(_('date exceeds 32 bits: %d') % when)
    if when < 0:
        raise Abort(_('negative date value: %d') % when)
    if offset < -50400 or offset > 43200:
        raise Abort(_('impossible time zone offset: %d') % offset)
    return when, offset
991 991
def matchdate(date):
    """Return a function that matches a given date match specifier

    Formats include:

    '{date}' match a given date to the accuracy provided

    '<{date}' on or before a given date

    '>{date}' on or after a given date

    '-{days}' on or after the moment {days} days before now

    '{date} to {date}' a date range, inclusive

    The returned function takes a unixtime and returns a boolean.
    Abort is raised for an empty specifier, a bare '<' or '>', or an
    invalid day count after '-'.

    >>> p1 = parsedate("10:29:59")
    >>> p2 = parsedate("10:30:00")
    >>> p3 = parsedate("10:30:59")
    >>> p4 = parsedate("10:31:00")
    >>> p5 = parsedate("Sep 15 10:30:00 1999")
    >>> f = matchdate("10:30")
    >>> f(p1[0])
    False
    >>> f(p2[0])
    True
    >>> f(p3[0])
    True
    >>> f(p4[0])
    False
    >>> f(p5[0])
    False
    """

    def lower(date):
        # earliest instant of a partial date: missing month/day become 1
        d = dict(mb="1", d="1")
        return parsedate(date, extendeddateformats, d)[0]

    def upper(date):
        # latest instant of a partial date: missing fields take their
        # maximum; the day is probed downwards because months differ in
        # length
        d = dict(mb="12", HI="23", M="59", S="59")
        for days in ("31", "30", "29"):
            try:
                d["d"] = days
                return parsedate(date, extendeddateformats, d)[0]
            except Abort:
                # parsedate reports an unparsable date with Abort; do
                # not swallow unrelated errors such as KeyboardInterrupt
                pass
        d["d"] = "28"
        return parsedate(date, extendeddateformats, d)[0]

    date = date.strip()

    if not date:
        raise Abort(_("dates cannot consist entirely of whitespace"))
    elif date[0] == "<":
        if not date[1:]:
            raise Abort(_("invalid day spec, use '<DATE'"))
        when = upper(date[1:])
        return lambda x: x <= when
    elif date[0] == ">":
        if not date[1:]:
            raise Abort(_("invalid day spec, use '>DATE'"))
        when = lower(date[1:])
        return lambda x: x >= when
    elif date[0] == "-":
        try:
            days = int(date[1:])
        except ValueError:
            raise Abort(_("invalid day spec: %s") % date[1:])
        if days < 0:
            raise Abort(_("%s must be nonnegative (see 'hg help dates')")
                % date[1:])
        when = makedate()[0] - days * 3600 * 24
        return lambda x: x >= when
    elif " to " in date:
        a, b = date.split(" to ")
        start, stop = lower(a), upper(b)
        return lambda x: x >= start and x <= stop
    else:
        start, stop = lower(date), upper(date)
        return lambda x: x >= start and x <= stop
1067 1067
def shortuser(user):
    """Return a short representation of a user name or email address.

    The text before the first '@' is kept, then whatever follows the
    first '<', and finally the result is cut at the first space and at
    the first dot.
    """
    # drop the domain part
    user = user.split('@', 1)[0]
    # drop a leading "Real Name <"
    user = user.split('<', 1)[-1]
    # keep only the first word, and of it only the part before a dot
    for separator in (' ', '.'):
        user = user.split(separator, 1)[0]
    return user
1083 1083
def email(author):
    '''Return the email part of an author string.

    This is the text between the first '<' and the first '>'.  A missing
    '<' means "from the start", a missing '>' means "to the end".
    '''
    begin = author.find('<') + 1
    end = author.find('>')
    if end == -1:
        return author[begin:]
    return author[begin:end]
1090 1090
1091 1091 def _ellipsis(text, maxlength):
1092 1092 if len(text) <= maxlength:
1093 1093 return text, False
1094 1094 else:
1095 1095 return "%s..." % (text[:maxlength - 3]), True
1096 1096
def ellipsis(text, maxlength=400):
    """Trim string to at most maxlength (default: 400) characters."""
    try:
        # work on unicode so that a multi-byte sequence is never split
        decoded = text.decode(encoding.encoding)
        shortened, truncated = _ellipsis(decoded, maxlength)
        if truncated:
            return shortened.encode(encoding.encoding)
        # nothing was cut: hand back the caller's original string
        return text
    except (UnicodeDecodeError, UnicodeEncodeError):
        # text is not valid in the local encoding: trim it as-is
        return _ellipsis(text, maxlength)[0]
1108 1108
def bytecount(nbytes):
    '''return byte count formatted as readable string, with units'''

    # (multiplier, divisor, format) rows, largest unit first; a row
    # applies as soon as nbytes >= multiplier * divisor, so bigger
    # values within a unit are shown with fewer decimals
    units = (
        (100, 1 << 30, _('%.0f GB')),
        (10, 1 << 30, _('%.1f GB')),
        (1, 1 << 30, _('%.2f GB')),
        (100, 1 << 20, _('%.0f MB')),
        (10, 1 << 20, _('%.1f MB')),
        (1, 1 << 20, _('%.2f MB')),
        (100, 1 << 10, _('%.0f KB')),
        (10, 1 << 10, _('%.1f KB')),
        (1, 1 << 10, _('%.2f KB')),
        (1, 1, _('%.0f bytes')),
        )

    for factor, unit, template in units:
        threshold = unit * factor
        if nbytes >= threshold:
            return template % (nbytes / float(unit))
    # nothing matched (nbytes below 1): fall back to the plain byte format
    return units[-1][2] % nbytes
1129 1129
def uirepr(s):
    """Return repr(s) with every doubled backslash collapsed to one."""
    # Avoid double backslash in Windows path repr()
    quoted = repr(s)
    return quoted.replace('\\\\', '\\')
1133 1133
# delay import of textwrap
def MBTextWrapper(**kwargs):
    """Create a TextWrapper that accounts for double-width characters.

    The wrapper class is built on the first call; this module-level name
    is then rebound to that class, so later calls instantiate it
    directly.
    """
    class tw(textwrap.TextWrapper):
        """
        Extend TextWrapper for double-width characters.

        Some Asian characters use two terminal columns instead of one.
        A good example of this behavior can be seen with u'\u65e5\u672c',
        the two Japanese characters for "Japan":
        len() returns 2, but when printed to a terminal, they eat 4 columns.

        (Note that this has nothing to do whatsoever with unicode
        representation, or encoding of the underlying string)
        """
        def __init__(self, **kwargs):
            textwrap.TextWrapper.__init__(self, **kwargs)

        def _cutdown(self, ucstr, space_left):
            """Split ucstr so that the head fits in space_left columns."""
            used = 0
            eawidth = unicodedata.east_asian_width
            for pos, char in enumerate(ucstr):
                # wide, fullwidth and ambiguous characters take 2 columns
                if eawidth(char) in 'WFA':
                    used += 2
                else:
                    used += 1
                if space_left < used:
                    return (ucstr[:pos], ucstr[pos:])
            return ucstr, ''

        # overriding of base class
        def _handle_long_word(self, reversed_chunks, cur_line, cur_len, width):
            space_left = max(width - cur_len, 1)

            if self.break_long_words:
                head, rest = self._cutdown(reversed_chunks[-1], space_left)
                cur_line.append(head)
                reversed_chunks[-1] = rest
            elif not cur_line:
                cur_line.append(reversed_chunks.pop())

    global MBTextWrapper
    MBTextWrapper = tw
    return tw(**kwargs)
1176 1174
def wrap(line, width, initindent='', hangindent=''):
    """Wrap line to width columns and return it in the local encoding.

    initindent prefixes the first output line and hangindent the
    following ones.  All three strings are decoded from the local
    encoding before wrapping so that multi-byte characters are not
    split, and the filled text is encoded again on the way out.
    """
    widest = max(len(initindent), len(hangindent))
    if width <= widest:
        # adjust for weird terminal size
        width = max(78, widest + 1)
    enc, mode = encoding.encoding, encoding.encodingmode
    uline = line.decode(enc, mode)
    uinit = initindent.decode(enc, mode)
    uhang = hangindent.decode(enc, mode)
    wrapper = MBTextWrapper(width=width,
                            initial_indent=uinit,
                            subsequent_indent=uhang)
    filled = wrapper.fill(uline)
    return filled.encode(enc)
1186 1187
def iterlines(iterator):
    """Yield every line of every chunk in iterator, without line ends."""
    for block in iterator:
        pieces = block.splitlines()
        for piece in pieces:
            yield piece
1191 1192
def expandpath(path):
    """Expand environment variables, then a leading '~', in path."""
    withvars = os.path.expandvars(path)
    return os.path.expanduser(withvars)
1194 1195
def hgcmd():
    """Return the command used to execute current hg

    This is different from hgexecutable() because on Windows we want
    to avoid things opening new shell windows like batch files, so we
    get either the python call or current executable.
    """
    if not mainfrozen():
        return gethgcmd()
    # frozen build: the running executable is hg itself
    return [sys.executable]
1205 1206
def rundetached(args, condfn):
    """Execute the argument list in a detached process.

    condfn is a callable which is called repeatedly and should return
    True once the child process is known to have started successfully.
    At this point, the child process PID is returned. If the child
    process fails to start or finishes before condfn() evaluates to
    True, return -1.
    """
    # Windows case is easier because the child process is either
    # successfully starting and validating the condition or exiting
    # on failure. We just poll on its PID. On Unix, if the child
    # process fails to start, it will be left in a zombie state until
    # the parent wait on it, which we cannot do since we expect a long
    # running process on success. Instead we listen for SIGCHLD telling
    # us our child process terminated.
    terminated = set()
    def handler(signum, frame):
        # os.wait() returns a (pid, status) pair; keep only the pid so
        # that the "pid in terminated" test below can actually match
        terminated.add(os.wait()[0])
    prevhandler = None
    if hasattr(signal, 'SIGCHLD'):
        prevhandler = signal.signal(signal.SIGCHLD, handler)
    try:
        pid = spawndetached(args)
        while not condfn():
            # condfn() is checked once more so that a child which became
            # ready just before exiting is not reported as failed
            if ((pid in terminated or not testpid(pid))
                and not condfn()):
                return -1
            time.sleep(0.1)
        return pid
    finally:
        # put back whatever SIGCHLD handler was installed before
        if prevhandler is not None:
            signal.signal(signal.SIGCHLD, prevhandler)
1239 1240
# use the any()/all() builtins when this Python has them, otherwise
# define equivalents
try:
    any, all = any, all
except NameError:
    def any(iterable):
        """Return True if at least one item of iterable is true."""
        for item in iterable:
            if item:
                break
        else:
            return False
        return True

    def all(iterable):
        """Return True if no item of iterable is false."""
        for item in iterable:
            if not item:
                break
        else:
            return True
        return False
1254 1255
def interpolate(prefix, mapping, s, fn=None, escape_prefix=False):
    """Return the result of interpolating items in the mapping into string s.

    prefix is a single character string, or a two character string with
    a backslash as the first character if the prefix needs to be escaped in
    a regular expression.

    fn is an optional function that will be applied to the replacement text
    just before replacement.

    escape_prefix is an optional flag that allows using doubled prefix for
    its escaping.

    The mapping passed in is never modified.
    """
    fn = fn or (lambda s: s)
    patterns = '|'.join(mapping.keys())
    prefix_char = None
    if escape_prefix:
        patterns += '|' + prefix
        # strip the regex-escaping backslash to get the literal character
        if len(prefix) > 1:
            prefix_char = prefix[1:]
        else:
            prefix_char = prefix
    r = re.compile(r'%s(%s)' % (prefix, patterns))

    def replace(match):
        # the match is the one-character prefix followed by the key
        key = match.group()[1:]
        if escape_prefix and key == prefix_char:
            # a doubled prefix stands for the prefix itself; resolve it
            # here instead of inserting a key into the caller's mapping
            return fn(prefix_char)
        return fn(mapping[key])

    return r.sub(replace, s)
1279 1280
def getport(port):
    """Return the port for a given network service.

    If port is an integer, it's returned as is. If it's a string, it's
    looked up using socket.getservbyname(). If there's no matching
    service, util.Abort is raised.
    """
    try:
        number = int(port)
    except ValueError:
        # not numeric: fall through to the service name lookup
        pass
    else:
        return number

    try:
        return socket.getservbyname(port)
    except socket.error:
        raise Abort(_("no port number associated with service '%s'") % port)
1296 1297
1297 1298 _booleans = {'1': True, 'yes': True, 'true': True, 'on': True, 'always': True,
1298 1299 '0': False, 'no': False, 'false': False, 'off': False,
1299 1300 'never': False}
1300 1301
1301 1302 def parsebool(s):
1302 1303 """Parse s into a boolean.
1303 1304
1304 1305 If s is not a valid boolean, returns None.
1305 1306 """
1306 1307 return _booleans.get(s.lower(), None)
1307 1308
1308 1309 _hexdig = '0123456789ABCDEFabcdef'
1309 1310 _hextochr = dict((a + b, chr(int(a + b, 16)))
1310 1311 for a in _hexdig for b in _hexdig)
1311 1312
1312 1313 def _urlunquote(s):
1313 1314 """unquote('abc%20def') -> 'abc def'."""
1314 1315 res = s.split('%')
1315 1316 # fastpath
1316 1317 if len(res) == 1:
1317 1318 return s
1318 1319 s = res[0]
1319 1320 for item in res[1:]:
1320 1321 try:
1321 1322 s += _hextochr[item[:2]] + item[2:]
1322 1323 except KeyError:
1323 1324 s += '%' + item
1324 1325 except UnicodeDecodeError:
1325 1326 s += unichr(int(item[:2], 16)) + item[2:]
1326 1327 return s
1327 1328
class url(object):
    r"""Reliable URL parser.

    This parses URLs and provides attributes for the following
    components:

    <scheme>://<user>:<passwd>@<host>:<port>/<path>?<query>#<fragment>

    Missing components are set to None. The only exception is
    fragment, which is set to '' if present but empty.

    If parsefragment is False, fragment is included in query. If
    parsequery is False, query is included in path. If both are
    False, both fragment and query are included in path.

    See http://www.ietf.org/rfc/rfc2396.txt for more information.

    Note that for backward compatibility reasons, bundle URLs do not
    take host names. That means 'bundle://../' has a path of '../'.

    Examples:

    >>> url('http://www.ietf.org/rfc/rfc2396.txt')
    <url scheme: 'http', host: 'www.ietf.org', path: 'rfc/rfc2396.txt'>
    >>> url('ssh://[::1]:2200//home/joe/repo')
    <url scheme: 'ssh', host: '[::1]', port: '2200', path: '/home/joe/repo'>
    >>> url('file:///home/joe/repo')
    <url scheme: 'file', path: '/home/joe/repo'>
    >>> url('file:///c:/temp/foo/')
    <url scheme: 'file', path: 'c:/temp/foo/'>
    >>> url('bundle:foo')
    <url scheme: 'bundle', path: 'foo'>
    >>> url('bundle://../foo')
    <url scheme: 'bundle', path: '../foo'>
    >>> url(r'c:\foo\bar')
    <url path: 'c:\\foo\\bar'>
    >>> url(r'\\blah\blah\blah')
    <url path: '\\\\blah\\blah\\blah'>

    Authentication credentials:

    >>> url('ssh://joe:xyz@x/repo')
    <url scheme: 'ssh', user: 'joe', passwd: 'xyz', host: 'x', path: 'repo'>
    >>> url('ssh://joe@x/repo')
    <url scheme: 'ssh', user: 'joe', host: 'x', path: 'repo'>

    Query strings and fragments:

    >>> url('http://host/a?b#c')
    <url scheme: 'http', host: 'host', path: 'a', query: 'b', fragment: 'c'>
    >>> url('http://host/a?b#c', parsequery=False, parsefragment=False)
    <url scheme: 'http', host: 'host', path: 'a?b#c'>
    """

    # characters left unquoted by __str__ in user/passwd, and in
    # path/fragment respectively
    _safechars = "!~*'()+"
    _safepchars = "/!~*'()+"
    _matchscheme = re.compile(r'^[a-zA-Z0-9+.\-]+:').match

    def __init__(self, path, parsequery=True, parsefragment=True):
        """Parse path into its URL components.

        Raises Abort for a file:// URL whose host is not a local one.
        """
        # We slowly chomp away at path until we have only the path left
        self.scheme = self.user = self.passwd = self.host = None
        self.port = self.path = self.query = self.fragment = None
        self._localpath = True
        self._hostport = ''
        self._origpath = path

        # special case for Windows drive letters and UNC paths
        if hasdriveletter(path) or path.startswith(r'\\'):
            self.path = path
            return

        # For compatibility reasons, we can't handle bundle paths as
        # normal URLS
        if path.startswith('bundle:'):
            self.scheme = 'bundle'
            path = path[7:]
            if path.startswith('//'):
                path = path[2:]
            self.path = path
            return

        if self._matchscheme(path):
            parts = path.split(':', 1)
            if parts[0]:
                self.scheme, path = parts
                self._localpath = False

        if not path:
            path = None
            if self._localpath:
                self.path = ''
                return
        else:
            if parsefragment and '#' in path:
                path, self.fragment = path.split('#', 1)
                if not path:
                    path = None
            if self._localpath:
                self.path = path
                return

            if parsequery and '?' in path:
                path, self.query = path.split('?', 1)
                if not path:
                    path = None
                if not self.query:
                    self.query = None

            # // is required to specify a host/authority
            if path and path.startswith('//'):
                parts = path[2:].split('/', 1)
                if len(parts) > 1:
                    self.host, path = parts
                else:
                    self.host = parts[0]
                    path = None
                if not self.host:
                    self.host = None
                    # path of file:///d is /d
                    # path of file:///d:/ is d:/, not /d:/
                    if path and not hasdriveletter(path):
                        path = '/' + path

            if self.host and '@' in self.host:
                self.user, self.host = self.host.rsplit('@', 1)
                if ':' in self.user:
                    self.user, self.passwd = self.user.split(':', 1)
                if not self.host:
                    self.host = None

            # Don't split on colons in IPv6 addresses without ports
            if (self.host and ':' in self.host and
                not (self.host.startswith('[') and self.host.endswith(']'))):
                self._hostport = self.host
                self.host, self.port = self.host.rsplit(':', 1)
                if not self.host:
                    self.host = None

            if (self.host and self.scheme == 'file' and
                self.host not in ('localhost', '127.0.0.1', '[::1]')):
                raise Abort(_('file:// URLs can only refer to localhost'))

        self.path = path

        # leave the query string escaped
        for a in ('user', 'passwd', 'host', 'port',
                  'path', 'fragment'):
            v = getattr(self, a)
            if v is not None:
                setattr(self, a, _urlunquote(v))

    def __repr__(self):
        """Return '<url ...>' listing every component that is not None."""
        attrs = []
        for a in ('scheme', 'user', 'passwd', 'host', 'port', 'path',
                  'query', 'fragment'):
            v = getattr(self, a)
            if v is not None:
                attrs.append('%s: %r' % (a, v))
        return '<url %s>' % ', '.join(attrs)

    def __str__(self):
        r"""Join the URL's components back into a URL string.

        Examples:

        >>> str(url('http://user:pw@host:80/?foo#bar'))
        'http://user:pw@host:80/?foo#bar'
        >>> str(url('http://user:pw@host:80/?foo=bar&baz=42'))
        'http://user:pw@host:80/?foo=bar&baz=42'
        >>> str(url('http://user:pw@host:80/?foo=bar%3dbaz'))
        'http://user:pw@host:80/?foo=bar%3dbaz'
        >>> str(url('ssh://user:pw@[::1]:2200//home/joe#'))
        'ssh://user:pw@[::1]:2200//home/joe#'
        >>> str(url('http://localhost:80//'))
        'http://localhost:80//'
        >>> str(url('http://localhost:80/'))
        'http://localhost:80/'
        >>> str(url('http://localhost:80'))
        'http://localhost:80/'
        >>> str(url('bundle:foo'))
        'bundle:foo'
        >>> str(url('bundle://../foo'))
        'bundle:../foo'
        >>> str(url('path'))
        'path'
        >>> str(url('file:///tmp/foo/bar'))
        'file:///tmp/foo/bar'
        >>> print url(r'bundle:foo\bar')
        bundle:foo\bar
        """
        if self._localpath:
            # local paths (and bundle: paths) are emitted unquoted
            s = self.path
            if self.scheme == 'bundle':
                s = 'bundle:' + s
            if self.fragment:
                s += '#' + self.fragment
            return s

        s = self.scheme + ':'
        if self.user or self.passwd or self.host:
            s += '//'
        elif self.scheme and (not self.path or self.path.startswith('/')):
            s += '//'
        if self.user:
            s += urllib.quote(self.user, safe=self._safechars)
        if self.passwd:
            s += ':' + urllib.quote(self.passwd, safe=self._safechars)
        if self.user or self.passwd:
            s += '@'
        if self.host:
            # bracketed IPv6 literals are emitted as-is
            if not (self.host.startswith('[') and self.host.endswith(']')):
                s += urllib.quote(self.host)
            else:
                s += self.host
        if self.port:
            s += ':' + urllib.quote(self.port)
        if self.host:
            s += '/'
        if self.path:
            # TODO: similar to the query string, we should not unescape the
            # path when we store it, the path might contain '%2f' = '/',
            # which we should *not* escape.
            s += urllib.quote(self.path, safe=self._safepchars)
        if self.query:
            # we store the query in escaped form.
            s += '?' + self.query
        if self.fragment is not None:
            s += '#' + urllib.quote(self.fragment, safe=self._safepchars)
        return s

    def authinfo(self):
        """Return (url without credentials, auth data or None).

        The second item is None when no user is set; otherwise it is
        (None, (url, host), user, passwd-or-'').
        """
        user, passwd = self.user, self.passwd
        try:
            # render the URL with the credentials temporarily removed
            self.user, self.passwd = None, None
            s = str(self)
        finally:
            self.user, self.passwd = user, passwd
        if not self.user:
            return (s, None)
        # authinfo[1] is passed to urllib2 password manager, and its URIs
        # must not contain credentials.
        return (s, (None, (s, self.host),
                    self.user, self.passwd or ''))

    def isabs(self):
        """Return True for a remote URL or an absolute local path."""
        if self.scheme and self.scheme != 'file':
            return True # remote URL
        if hasdriveletter(self.path):
            return True # absolute for our purposes - can't be joined()
        if self.path.startswith(r'\\'):
            return True # Windows UNC path
        if self.path.startswith('/'):
            return True # POSIX-style
        return False

    def localpath(self):
        """Return a path for file: and bundle: URLs, else the original."""
        if self.scheme == 'file' or self.scheme == 'bundle':
            path = self.path or '/'
            # For Windows, we need to promote hosts containing drive
            # letters to paths with drive letters.
            if hasdriveletter(self._hostport):
                path = self._hostport + '/' + self.path
            elif self.host is not None and self.path:
                path = '/' + path
            return path
        return self._origpath
1595 1596
def hasscheme(path):
    """Return True if path, parsed as a url, has a non-empty scheme."""
    parsed = url(path)
    return bool(parsed.scheme)
1598 1599
def hasdriveletter(path):
    """Return True if path starts with a letter followed by ':'.

    An empty or None path has no drive letter, so False is returned
    for it instead of failing on the slice.
    """
    return bool(path) and path[1:2] == ':' and path[0:1].isalpha()
1601 1602
def urllocalpath(path):
    """Return localpath() of path, parsed with query and fragment kept."""
    parsed = url(path, parsequery=False, parsefragment=False)
    return parsed.localpath()
1604 1605
def hidepassword(u):
    '''hide user credential in a url string'''
    parsed = url(u)
    # replace only a password that is actually present
    if parsed.passwd:
        parsed.passwd = '***'
    return str(parsed)
1611 1612
def removeauth(u):
    '''remove all authentication information from a url string'''
    parsed = url(u)
    parsed.user = None
    parsed.passwd = None
    return str(parsed)
1617 1618
def isatty(fd):
    """Return fd.isatty(), or False if that raises AttributeError."""
    try:
        result = fd.isatty()
    except AttributeError:
        result = False
    return result
@@ -1,137 +1,139
1 1 Test alignment of multibyte characters
2 2
3 3 $ HGENCODING=utf-8
4 4 $ export HGENCODING
5 5 $ hg init t
6 6 $ cd t
7 7 $ python << EOF
8 8 > # (byte, width) = (6, 4)
9 9 > s = "\xe7\x9f\xad\xe5\x90\x8d"
10 10 > # (byte, width) = (7, 7): odd width is good for alignment test
11 11 > m = "MIDDLE_"
12 12 > # (byte, width) = (18, 12)
13 13 > l = "\xe9\x95\xb7\xe3\x81\x84\xe9\x95\xb7\xe3\x81\x84\xe5\x90\x8d\xe5\x89\x8d"
14 14 > f = file('s', 'w'); f.write(s); f.close()
15 15 > f = file('m', 'w'); f.write(m); f.close()
16 16 > f = file('l', 'w'); f.write(l); f.close()
17 17 > # instant extension to show list of options
18 18 > f = file('showoptlist.py', 'w'); f.write("""# encoding: utf-8
19 19 > def showoptlist(ui, repo, *pats, **opts):
20 20 > '''dummy command to show option descriptions'''
21 21 > return 0
22 22 > cmdtable = {
23 23 > 'showoptlist':
24 24 > (showoptlist,
25 > [('s', 'opt1', '', 'short width', '""" + s + """'),
26 > ('m', 'opt2', '', 'middle width', '""" + m + """'),
27 > ('l', 'opt3', '', 'long width', '""" + l + """')
25 > [('s', 'opt1', '', 'short width' + ' %(s)s' * 8, '%(s)s'),
26 > ('m', 'opt2', '', 'middle width' + ' %(m)s' * 8, '%(m)s'),
27 > ('l', 'opt3', '', 'long width' + ' %(l)s' * 8, '%(l)s')
28 28 > ],
29 29 > ""
30 30 > )
31 31 > }
32 > """)
32 > """ % globals())
33 33 > f.close()
34 34 > EOF
35 35 $ S=`cat s`
36 36 $ M=`cat m`
37 37 $ L=`cat l`
38 38
39 39 alignment of option descriptions in help
40 40
41 41 $ cat <<EOF > .hg/hgrc
42 42 > [extensions]
43 43 > ja_ext = `pwd`/showoptlist.py
44 44 > EOF
45 45
46 46 check alignment of option descriptions in help
47 47
48 48 $ hg help showoptlist
49 49 hg showoptlist
50 50
51 51 dummy command to show option descriptions
52 52
53 53 options:
54 54
55 -s --opt1 \xe7\x9f\xad\xe5\x90\x8d short width (esc)
56 -m --opt2 MIDDLE_ middle width
57 -l --opt3 \xe9\x95\xb7\xe3\x81\x84\xe9\x95\xb7\xe3\x81\x84\xe5\x90\x8d\xe5\x89\x8d long width (esc)
55 -s --opt1 \xe7\x9f\xad\xe5\x90\x8d short width \xe7\x9f\xad\xe5\x90\x8d \xe7\x9f\xad\xe5\x90\x8d \xe7\x9f\xad\xe5\x90\x8d \xe7\x9f\xad\xe5\x90\x8d \xe7\x9f\xad\xe5\x90\x8d \xe7\x9f\xad\xe5\x90\x8d \xe7\x9f\xad\xe5\x90\x8d \xe7\x9f\xad\xe5\x90\x8d (esc)
56 -m --opt2 MIDDLE_ middle width MIDDLE_ MIDDLE_ MIDDLE_ MIDDLE_ MIDDLE_
57 MIDDLE_ MIDDLE_ MIDDLE_
58 -l --opt3 \xe9\x95\xb7\xe3\x81\x84\xe9\x95\xb7\xe3\x81\x84\xe5\x90\x8d\xe5\x89\x8d long width \xe9\x95\xb7\xe3\x81\x84\xe9\x95\xb7\xe3\x81\x84\xe5\x90\x8d\xe5\x89\x8d \xe9\x95\xb7\xe3\x81\x84\xe9\x95\xb7\xe3\x81\x84\xe5\x90\x8d\xe5\x89\x8d \xe9\x95\xb7\xe3\x81\x84\xe9\x95\xb7\xe3\x81\x84\xe5\x90\x8d\xe5\x89\x8d \xe9\x95\xb7\xe3\x81\x84\xe9\x95\xb7\xe3\x81\x84\xe5\x90\x8d\xe5\x89\x8d \xe9\x95\xb7\xe3\x81\x84\xe9\x95\xb7\xe3\x81\x84\xe5\x90\x8d\xe5\x89\x8d \xe9\x95\xb7\xe3\x81\x84\xe9\x95\xb7\xe3\x81\x84\xe5\x90\x8d\xe5\x89\x8d \xe9\x95\xb7\xe3\x81\x84\xe9\x95\xb7\xe3\x81\x84\xe5\x90\x8d\xe5\x89\x8d (esc)
59 \xe9\x95\xb7\xe3\x81\x84\xe9\x95\xb7\xe3\x81\x84\xe5\x90\x8d\xe5\x89\x8d (esc)
58 60
59 61 use "hg -v help showoptlist" to show global options
60 62
61 63
62 64 $ rm -f s; touch s
63 65 $ rm -f m; touch m
64 66 $ rm -f l; touch l
65 67
66 68 add files
67 69
68 70 $ cp s $S
69 71 $ hg add $S
70 72 $ cp m $M
71 73 $ hg add $M
72 74 $ cp l $L
73 75 $ hg add $L
74 76
75 77 commit(1)
76 78
77 79 $ echo 'first line(1)' >> s; cp s $S
78 80 $ echo 'first line(2)' >> m; cp m $M
79 81 $ echo 'first line(3)' >> l; cp l $L
80 82 $ hg commit -m 'first commit' -u $S
81 83
82 84 commit(2)
83 85
84 86 $ echo 'second line(1)' >> s; cp s $S
85 87 $ echo 'second line(2)' >> m; cp m $M
86 88 $ echo 'second line(3)' >> l; cp l $L
87 89 $ hg commit -m 'second commit' -u $M
88 90
89 91 commit(3)
90 92
91 93 $ echo 'third line(1)' >> s; cp s $S
92 94 $ echo 'third line(2)' >> m; cp m $M
93 95 $ echo 'third line(3)' >> l; cp l $L
94 96 $ hg commit -m 'third commit' -u $L
95 97
96 98 check alignment of user names in annotate
97 99
98 100 $ hg annotate -u $M
99 101 \xe7\x9f\xad\xe5\x90\x8d: first line(2) (esc)
100 102 MIDDLE_: second line(2)
101 103 \xe9\x95\xb7\xe3\x81\x84\xe9\x95\xb7\xe3\x81\x84\xe5\x90\x8d\xe5\x89\x8d: third line(2) (esc)
102 104
103 105 check alignment of filenames in diffstat
104 106
105 107 $ hg diff -c tip --stat
106 108 MIDDLE_ | 1 +
107 109 \xe7\x9f\xad\xe5\x90\x8d | 1 + (esc)
108 110 \xe9\x95\xb7\xe3\x81\x84\xe9\x95\xb7\xe3\x81\x84\xe5\x90\x8d\xe5\x89\x8d | 1 + (esc)
109 111 3 files changed, 3 insertions(+), 0 deletions(-)
110 112
111 113 add branches/tags
112 114
113 115 $ hg branch $S
114 116 marked working directory as branch \xe7\x9f\xad\xe5\x90\x8d (esc)
115 117 $ hg tag $S
116 118 $ hg branch $M
117 119 marked working directory as branch MIDDLE_
118 120 $ hg tag $M
119 121 $ hg branch $L
120 122 marked working directory as branch \xe9\x95\xb7\xe3\x81\x84\xe9\x95\xb7\xe3\x81\x84\xe5\x90\x8d\xe5\x89\x8d (esc)
121 123 $ hg tag $L
122 124
123 125 check alignment of branches
124 126
125 127 $ hg tags
126 128 tip 5:d745ff46155b
127 129 \xe9\x95\xb7\xe3\x81\x84\xe9\x95\xb7\xe3\x81\x84\xe5\x90\x8d\xe5\x89\x8d 4:9259be597f19 (esc)
128 130 MIDDLE_ 3:b06c5b6def9e
129 131 \xe7\x9f\xad\xe5\x90\x8d 2:64a70663cee8 (esc)
130 132
131 133 check alignment of tags
132 134
133 135 $ hg tags
134 136 tip 5:d745ff46155b
135 137 \xe9\x95\xb7\xe3\x81\x84\xe9\x95\xb7\xe3\x81\x84\xe5\x90\x8d\xe5\x89\x8d 4:9259be597f19 (esc)
136 138 MIDDLE_ 3:b06c5b6def9e
137 139 \xe7\x9f\xad\xe5\x90\x8d 2:64a70663cee8 (esc)
General Comments 0
You need to be logged in to leave comments. Login now