upstream/mercurial-mirror Commit - r30820:6a70cf94

py3: replace pycompat.getenv with encoding.environ.get...

Pulkit Goyal -

r30820:6a70cf94 default

parent child

contrib/check-code.py

0 +2 -1

             #!/usr/bin/env python
             #
             # check-code - a style and portability checker for Mercurial
             #
             # Copyright 2010 Matt Mackall <mpm@selenic.com>
             #
             # This software may be used and distributed according to the terms of the
             # GNU General Public License version 2 or any later version.
             """style and portability checker for Mercurial
             when a rule triggers wrong, do one of the following (prefer one from top):
              * do the work-around the rule suggests
              * doublecheck that it is a false match
              * improve the rule pattern
              * add an ignore pattern to the rule (3rd arg) which matches your good line
                (you can append a short comment and match this, like: #re-raises)
              * change the pattern to a warning and list the exception in test-check-code-hg
              * ONLY use no--check-code for skipping entire files from external sources
             """
             from __future__ import absolute_import, print_function
             import glob
             import keyword
             import optparse
             import os
             import re
             import sys
             # Python 2/3 compatibility shims used by the rest of this script.
             if sys.version_info[0] >= 3:
                 def opentext(f):
                     """Open ``f`` for reading as ASCII-encoded text."""
                     return open(f, encoding='ascii')
             else:
                 # On Python 2 the builtin open() is used unchanged.
                 opentext = open
             try:
                 xrange
             except NameError:
                 # No xrange builtin available: fall back to range.
                 xrange = range
             # re2 is optional; when it cannot be imported only the stdlib
             # re module is used.
             try:
                 import re2
             except ImportError:
                 re2 = None

             def compilere(pat, multiline=False):
                 """Compile ``pat``, trying re2 first when it is available.

                 When ``multiline`` is true the pattern is prefixed with ``(?m)``.
                 If re2 is present but rejects the pattern (``re2.error``), the
                 pattern is compiled with the stdlib ``re`` module instead.
                 """
                 source = '(?m)' + pat if multiline else pat
                 if re2:
                     try:
                         return re2.compile(source)
                     except re2.error:
                         # fall through to the stdlib engine
                         pass
                 return re.compile(source)
             # check "rules depending on implementation of repquote()" in each
             # patterns (especially pypats), before changing around repquote()
             _repquotefixedmap = {' ': ' ', '\n': '\n', '.': 'p', ':': 'q',
                                  '%': '%', '\\': 'b', '*': 'A', '+': 'P', '-': 'M'}

             def _repquoteencodechr(i):
                 """Return the one-character class code for character ordinal ``i``.

                 Ordinals above 255 map to 'u'. Characters listed in
                 ``_repquotefixedmap`` map to their fixed code; other alphabetic
                 characters map to 'x', digits to 'n' and everything else to 'o'.
                 """
                 if i > 255:
                     return 'u'
                 c = chr(i)
                 fixed = _repquotefixedmap.get(c)
                 if fixed is not None:
                     return fixed
                 if c.isalpha():
                     return 'x'
                 return 'n' if c.isdigit() else 'o'
             # 256-entry translation table: position i holds the class code of chr(i)
             _repquotett = ''.join(map(_repquoteencodechr, xrange(256)))

             def repquote(m):
                 """Return the matched string literal with its text masked.

                 The 'text' group is translated through ``_repquotett`` and wrapped
                 again in the original 'quote' group on both sides.
                 """
                 masked = m.group('text').translate(_repquotett)
                 quote = m.group('quote')
                 return quote + masked + quote
             def reppython(m):
                 """Mask a Python comment or string literal match.

                 A comment is replaced by '#' characters up to its last
                 non-whitespace character, keeping any trailing whitespace as is.
                 Anything else is handed to repquote().
                 """
                 comment = m.group('comment')
                 if not comment:
                     return repquote(m)
                 visible = len(comment.rstrip())
                 return "#" * visible + comment[visible:]
             def repcomment(m):
                 """Return group 1 followed by one '#' per character of group 2."""
                 prefix, comment = m.group(1), m.group(2)
                 return prefix + "#" * len(comment)
             def repccomment(m):
                 """Mask the body of a C comment match.

                 In group 2 every non-whitespace character, and every space that
                 directly follows a newline, becomes 'x'. The result is group 1,
                 the masked body and a closing "*/".
                 """
                 opener, body = m.group(1), m.group(2)
                 masked = re.sub(r"((?<=\n) )|\S", "x", body)
                 return "".join([opener, masked, "*/"])
             def repcallspaces(m):
                 """Return group 1 plus group 2 with post-newline whitespace removed.

                 Every newline followed by a run of whitespace in group 2 is
                 collapsed to a bare newline.
                 """
                 head, rest = m.group(1), m.group(2)
                 return head + re.sub(r"\n\s+", "\n", rest)
             def repinclude(m):
                 """Return group 1 of the match followed by the literal "<foo>"."""
                 return "%s%s" % (m.group(1), "<foo>")
             def rephere(m):
                 """Return group 1 plus group 2 with non-whitespace turned into 'x'."""
                 tag, body = m.group(1), m.group(2)
                 return tag + re.sub(r"\S", "x", body)
             # Patterns applied to shell test scripts. The outer list has two
             # elements: the error-level patterns first, the warning-level patterns
             # second. Each entry is (regex, message) optionally followed by an
             # ignore regex.
             testpats = [
               # errors
               [
                 (r'pushd|popd', "don't use 'pushd' or 'popd', use 'cd'"),
                 (r'\W\$?\(\([^\)\n]*\)\)', "don't use (()) or $(()), use 'expr'"),
                 (r'grep.*-q', "don't use 'grep -q', redirect to /dev/null"),
                 (r'(?<!hg )grep.* -a', "don't use 'grep -a', use in-line python"),
                 (r'sed.*-i', "don't use 'sed -i', use a temporary file"),
                 (r'\becho\b.*\\n', "don't use 'echo \\n', use printf"),
                 (r'echo -n', "don't use 'echo -n', use printf"),
                 (r'(^|\|\s*)\bwc\b[^|]*$\n(?!.*\(re\))', "filter wc output"),
                 (r'head -c', "don't use 'head -c', use 'dd'"),
                 (r'tail -n', "don't use the '-n' option to tail, just use '-<num>'"),
                 (r'sha1sum', "don't use sha1sum, use $TESTDIR/md5sum.py"),
                 (r'ls.*-\w*R', "don't use 'ls -R', use 'find'"),
                 (r'printf.*[^\\]\\([1-9]|0\d)', r"don't use 'printf \NNN', use Python"),
                 (r'printf.*[^\\]\\x', "don't use printf \\x, use Python"),
                 (r'\$\(.*\)', "don't use $(expr), use `expr`"),
                 (r'rm -rf \*', "don't use naked rm -rf, target a directory"),
                 (r'(^|\|\s*)grep (-\w\s+)*[^|]*[(|]\w',
                  "use egrep for extended grep syntax"),
                 (r'/bin/', "don't use explicit paths for tools"),
                 (r'[^\n]\Z', "no trailing newline"),
                 (r'export .*=', "don't export and assign at once"),
                 (r'^source\b', "don't use 'source', use '.'"),
                 (r'touch -d', "don't use 'touch -d', use 'touch -t' instead"),
                 (r'\bls +[^|\n-]+ +-', "options to 'ls' must come before filenames"),
                 (r'[^>\n]>\s*\$HGRCPATH', "don't overwrite $HGRCPATH, append to it"),
                 (r'^stop\(\)', "don't use 'stop' as a shell function name"),
                 (r'(\[|\btest\b).*-e ', "don't use 'test -e', use 'test -f'"),
                 (r'\[\[\s+[^\]]*\]\]', "don't use '[[ ]]', use '[ ]'"),
                 (r'^alias\b.*=', "don't use alias, use a function"),
                 (r'if\s*!', "don't use '!' to negate exit status"),
                 (r'/dev/u?random', "don't use entropy, use /dev/zero"),
                 (r'do\s*true;\s*done', "don't use true as loop body, use sleep 0"),
                 (r'^( *)\t', "don't use tabs to indent"),
                 (r'sed (-e )?\'(\d+|/[^/]*/)i(?!\\\n)',
                  "put a backslash-escaped newline after sed 'i' command"),
                 (r'^diff *-\w*[uU].*$\n(^  \$ |^$)', "prefix diff -u/-U with cmp"),
                 (r'^\s+(if)? diff *-\w*[uU]', "prefix diff -u/-U with cmp"),
                 (r'seq ', "don't use 'seq', use $TESTDIR/seq.py"),
                 (r'\butil\.Abort\b', "directly use error.Abort"),
                 (r'\|&', "don't use |&, use 2>&1"),
                 (r'\w =  +\w', "only one space after = allowed"),
                 (r'\bsed\b.*[^\\]\\n', "don't use 'sed ... \\n', use a \\ and a newline"),
                 (r'env.*-u', "don't use 'env -u VAR', use 'unset VAR'"),
                 (r'cp.* -r ', "don't use 'cp -r', use 'cp -R'"),
               ],
               # warnings
               [
                 (r'^function', "don't use 'function', use old style"),
                 (r'^diff.*-\w*N', "don't use 'diff -N'"),
                 (r'\$PWD|\${PWD}', "don't use $PWD, use `pwd`"),
                 (r'^([^"\'\n]|("[^"\n]*")|(\'[^\'\n]*\'))*\^', "^ must be quoted"),
                 (r'kill (`|\$\()', "don't use kill, use killdaemons.py")
               ]
             ]
             # (regex, replacement function) pairs paired with testpats in the
             # 'test script' check: comments are masked by repcomment and
             # here-documents by rephere.
             testfilters = [
                 (r"( *)(#([^\n]*\S)?)", repcomment),
                 (r"<<(\S+)((.|\n)*?\n\1)", rephere),
             ]
             # Message shared by every rule below that asks for a (glob) marker.
             winglobmsg = "use (glob) to match Windows paths too"
             # Regex prefix matching the start of a command line ("  $ ").
             uprefix = r"^  \$ "
             # Patterns applied to unified tests (.t files). The outer list has two
             # elements: the error-level patterns first, the warning-level patterns
             # second. Each entry is (regex, message) optionally followed by an
             # ignore regex.
             utestpats = [
               # errors
               [
                 (r'^(\S.*||  [$>] \S.*)[ \t]\n', "trailing whitespace on non-output"),
                 (uprefix + r'.*\|\s*sed[^|>\n]*\n',
                  "use regex test output patterns instead of sed"),
                 (uprefix + r'(true|exit 0)', "explicit zero exit unnecessary"),
                 (uprefix + r'.*(?<!\[)\$\?', "explicit exit code checks unnecessary"),
                 (uprefix + r'.*\|\| echo.*(fail|error)',
                  "explicit exit code checks unnecessary"),
                 (uprefix + r'set -e', "don't use set -e"),
                 (uprefix + r'(\s|fi\b|done\b)', "use > for continued lines"),
                 (uprefix + r'.*:\.\S*/', "x:.y in a path does not work on msys, rewrite "
                  "as x://.y, or see `hg log -k msys` for alternatives", r'-\S+:\.|' #-Rxxx
                  '# no-msys'), # in test-pull.t which is skipped on windows
                 (r'^  saved backup bundle to \$TESTTMP.*\.hg$', winglobmsg),
                 (r'^  changeset .* references (corrupted|missing) \$TESTTMP/.*[^)]$',
                  winglobmsg),
                 # the ignore pattern is a raw string so that "\$" is not an
                 # invalid string escape; its value is unchanged
                 (r'^  pulling from \$TESTTMP/.*[^)]$', winglobmsg,
                  r'\$TESTTMP/unix-repo$'), # in test-issue1802.t which skipped on windows
                 (r'^  reverting (?!subrepo ).*/.*[^)]$', winglobmsg),
                 (r'^  cloning subrepo \S+/.*[^)]$', winglobmsg),
                 (r'^  pushing to \$TESTTMP/.*[^)]$', winglobmsg),
                 (r'^  pushing subrepo \S+/\S+ to.*[^)]$', winglobmsg),
                 (r'^  moving \S+/.*[^)]$', winglobmsg),
                 (r'^  no changes made to subrepo since.*/.*[^)]$', winglobmsg),
                 (r'^  .*: largefile \S+ not available from file:.*/.*[^)]$', winglobmsg),
                 (r'^  .*file://\$TESTTMP',
                  'write "file:/*/$TESTTMP" + (glob) to match on windows too'),
                 (r'^  [^$>].*27\.0\.0\.1.*[^)]$',
                  'use (glob) to match localhost IP on hosts without 127.0.0.1 too'),
                 (r'^  (cat|find): .*: No such file or directory',
                  'use test -f to test for file existence'),
                 (r'^  diff -[^ -]*p',
                  "don't use (external) diff with -p for portability"),
                 (r'^  [-+][-+][-+] .* [-+]0000 \(glob\)',
                  "glob timezone field in diff output for portability"),
                 (r'^  @@ -[0-9]+ [+][0-9]+,[0-9]+ @@',
                  "use '@@ -N* +N,n @@ (glob)' style chunk header for portability"),
                 (r'^  @@ -[0-9]+,[0-9]+ [+][0-9]+ @@',
                  "use '@@ -N,n +N* @@ (glob)' style chunk header for portability"),
                 (r'^  @@ -[0-9]+ [+][0-9]+ @@',
                  "use '@@ -N* +N* @@ (glob)' style chunk header for portability"),
                 (uprefix + r'hg( +-[^ ]+( +[^ ]+)?)* +extdiff'
                  r'( +(-[^ po-]+|--(?!program|option)[^ ]+|[^-][^ ]*))*$',
                  "use $RUNTESTDIR/pdiff via extdiff (or -o/-p for false-positives)"),
               ],
               # warnings
               [
                 (r'^  (?!.*127\.0\.0\.1)[^*?/\n]* \(glob\)$',
                  "glob match with no glob string (?, *, /, and 127.0.0.1)"),
               ]
             ]
             # Re-use every shell test pattern for unified tests: each one is
             # re-anchored so that it only matches on command ("  $ ") and
             # continuation ("  > ") lines. Index 0 holds errors, index 1 warnings.
             for i in (0, 1):
                 for tp in testpats[i]:
                     p, m = tp[0], tp[1]
                     if p.startswith(r'^'):
                         # the pattern's own line anchor is replaced by the prefix
                         p = r"^  [$>] (%s)" % p[1:]
                     else:
                         p = r"^  [$>] .*(%s)" % p
                     utestpats[i].append((p, m) + tp[2:])
             # (regex, replacement function) pairs paired with utestpats in the
             # 'unified test' check: here-documents are masked by rephere and
             # comments by repcomment.
             utestfilters = [
                 (r"<<(\S+)((.|\n)*?\n  > \1)", rephere),
                 (r"( +)(#([^\n]*\S)?)", repcomment),
             ]
             # Patterns applied to Python sources. The outer list has two elements:
             # the error-level patterns first, the warning-level patterns second.
             # Each entry is (regex, message) optionally followed by an ignore regex.
             pypats = [
               # errors
               [
                 (r'^\s*def\s*\w+\s*\(.*,\s*\(',
                  "tuple parameter unpacking not available in Python 3+"),
                 (r'lambda\s*\(.*,.*\)',
                  "tuple parameter unpacking not available in Python 3+"),
                 (r'(?<!def)\s+(cmp)\(', "cmp is not available in Python 3+"),
                 (r'\breduce\s*\(.*', "reduce is not available in Python 3+"),
                 (r'\bdict\(.*=', 'dict() is different in Py2 and 3 and is slower than {}',
                  'dict-from-generator'),
                 (r'\.has_key\b', "dict.has_key is not available in Python 3+"),
                 (r'\s<>\s', '<> operator is not available in Python 3+, use !='),
                 (r'^\s*\t', "don't use tabs"),
                 (r'\S;\s*\n', "semicolon"),
                 (r'[^_]_\([ \t\n]*(?:"[^"]+"[ \t\n+]*)+%', "don't use % inside _()"),
                 (r"[^_]_\([ \t\n]*(?:'[^']+'[ \t\n+]*)+%", "don't use % inside _()"),
                 (r'(\w|\)),\w', "missing whitespace after ,"),
                 (r'(\w|\))[+/*\-<>]\w', "missing whitespace in expression"),
                 (r'^\s+(\w|\.)+=\w[^,()\n]*$', "missing whitespace in assignment"),
                 (r'\w\s=\s\s+\w', "gratuitous whitespace after ="),
                 (r'.{81}', "line too long"),
                 (r'[^\n]\Z', "no trailing newline"),
                 (r'(\S[ \t]+|^[ \t]+)\n', "trailing whitespace"),
             #    (r'^\s+[^_ \n][^_. \n]+_[^_\n]+\s*=',
             #     "don't use underbars in identifiers"),
                 # The first character class used to be [A-za-z], a range typo that
                 # also spans "[", "\", "]", "^", "_" and "`". It is now spelled out
                 # as letters plus "_", so that names with a leading underscore are
                 # still checked.
                 (r'^\s+(self\.)?[A-Za-z_][a-z0-9]+[A-Z]\w* = ',
                  "don't use camelcase in identifiers"),
                 (r'^\s*(if|while|def|class|except|try)\s[^[\n]*:\s*[^\\n]#\s]+',
                  "linebreak after :"),
                 (r'class\s[^( \n]+:', "old-style class, use class foo(object)",
                  r'#.*old-style'),
                 (r'class\s[^( \n]+\(\):',
                  "class foo() creates old style object, use class foo(object)",
                  r'#.*old-style'),
                 (r'\b(%s)\(' % '|'.join(k for k in keyword.kwlist
                                         if k not in ('print', 'exec')),
                  "Python keyword is not a function"),
                 (r',]', "unneeded trailing ',' in list"),
             #    (r'class\s[A-Z][^\(]*\((?!Exception)',
             #     "don't capitalize non-exception classes"),
             #    (r'in range\(', "use xrange"),
             #    (r'^\s*print\s+', "avoid using print in core and extensions"),
                 (r'[\x80-\xff]', "non-ASCII character literal"),
                 (r'("\')\.format\(', "str.format() has no bytes counterpart, use %"),
                 (r'^\s*(%s)\s\s' % '|'.join(keyword.kwlist),
                  "gratuitous whitespace after Python keyword"),
                 (r'([\(\[][ \t]\S)|(\S[ \t][\)\]])', "gratuitous whitespace in () or []"),
             #    (r'\s\s=', "gratuitous whitespace before ="),
                 (r'[^>< ](\+=|-=|!=|<>|<=|>=|<<=|>>=|%=)\S',
                  "missing whitespace around operator"),
                 (r'[^>< ](\+=|-=|!=|<>|<=|>=|<<=|>>=|%=)\s',
                  "missing whitespace around operator"),
                 (r'\s(\+=|-=|!=|<>|<=|>=|<<=|>>=|%=)\S',
                  "missing whitespace around operator"),
                 (r'[^^+=*/!<>&| %-](\s=|=\s)[^= ]',
                  "wrong whitespace around ="),
                 (r'\([^()]*( =[^=]|[^<>!=]= )',
                  "no whitespace around = for named parameters"),
                 (r'raise Exception', "don't raise generic exceptions"),
                 (r'raise [^,(]+, (\([^\)]+\)|[^,\(\)]+)$',
                  "don't use old-style two-argument raise, use Exception(message)"),
                 (r' is\s+(not\s+)?["\'0-9-]', "object comparison with literal"),
                 (r' [=!]=\s+(True|False|None)',
                  "comparison with singleton, use 'is' or 'is not' instead"),
                 (r'^\s*(while|if) [01]:',
                  "use True/False for constant Boolean expression"),
                 (r'(?:(?<!def)\s+|\()hasattr\(',
                  'hasattr(foo, bar) is broken, use util.safehasattr(foo, bar) instead'),
                 (r'opener\([^)]*\).read\(',
                  "use opener.read() instead"),
                 (r'opener\([^)]*\).write\(',
                  "use opener.write() instead"),
                 (r'[\s\(](open|file)\([^)]*\)\.read\(',
                  "use util.readfile() instead"),
                 (r'[\s\(](open|file)\([^)]*\)\.write\(',
                  "use util.writefile() instead"),
                 (r'^[\s\(]*(open(er)?|file)\([^)]*\)',
                  "always assign an opened file to a variable, and close it afterwards"),
                 (r'[\s\(](open|file)\([^)]*\)\.',
                  "always assign an opened file to a variable, and close it afterwards"),
                 (r'(?i)descend[e]nt', "the proper spelling is descendAnt"),
                 (r'\.debug\(\_', "don't mark debug messages for translation"),
                 (r'\.strip\(\)\.split\(\)', "no need to strip before splitting"),
                 (r'^\s*except\s*:', "naked except clause", r'#.*re-raises'),
                 (r'^\s*except\s([^\(,]+|\([^\)]+\))\s*,',
                  'legacy exception syntax; use "as" instead of ","'),
                 (r':\n(    )*( ){1,3}[^ ]', "must indent 4 spaces"),
                 (r'release\(.*wlock, .*lock\)', "wrong lock release order"),
                 (r'\b__bool__\b', "__bool__ should be __nonzero__ in Python 2"),
                 (r'os\.path\.join\(.*, *(""|\'\')\)',
                  "use pathutil.normasprefix(path) instead of os.path.join(path, '')"),
                 (r'\s0[0-7]+\b', 'legacy octal syntax; use "0o" prefix instead of "0"'),
                 # XXX only catch mutable arguments on the first line of the definition
                 (r'def.*[( ]\w+=\{\}', "don't use mutable default arguments"),
                 (r'\butil\.Abort\b', "directly use error.Abort"),
                 (r'^@(\w*\.)?cachefunc', "module-level @cachefunc is risky, please avoid"),
                 (r'^import Queue', "don't use Queue, use util.queue + util.empty"),
                 (r'^import cStringIO', "don't use cStringIO.StringIO, use util.stringio"),
                 (r'^import urllib', "don't use urllib, use util.urlreq/util.urlerr"),
                 (r'^import SocketServer', "don't use SocketServer, use util.socketserver"),
                 (r'^import urlparse', "don't use urlparse, use util.urlparse"),
                 (r'^import xmlrpclib', "don't use xmlrpclib, use util.xmlrpclib"),
                 (r'^import cPickle', "don't use cPickle, use util.pickle"),
                 (r'^import pickle', "don't use pickle, use util.pickle"),
                 (r'^import httplib', "don't use httplib, use util.httplib"),
                 (r'^import BaseHTTPServer', "use util.httpserver instead"),
                 (r'\.next\(\)', "don't use .next(), use next(...)"),
                 # rules depending on implementation of repquote()
                 (r' x+[xpqo%APM][\'"]\n\s+[\'"]x',
                  'string join across lines with no space'),
                 (r'''(?x)ui\.(status|progress|write|note|warn)\(
                      [ \t\n#]*
                      (?# any strings/comments might precede a string, which
                        # contains translatable message)
                      ((['"]|\'\'\'|""")[ \npq%bAPMxno]*(['"]|\'\'\'|""")[ \t\n#]+)*
                      (?# sequence consisting of below might precede translatable message
                        # - formatting string: "% 10s", "%05d", "% -3.2f", "%*s", "%%" ...
                        # - escaped character: "\\", "\n", "\0" ...
                        # - character other than '%', 'b' as '\', and 'x' as alphabet)
                      (['"]|\'\'\'|""")
                      ((%([ n]?[PM]?([np]+|A))?x)|%%|b[bnx]|[ \nnpqAPMo])*x
                      (?# this regexp can't use [^...] style,
                        # because _preparepats forcibly adds "\n" into [^...],
                        # even though this regexp wants match it against "\n")''',
                  "missing _() in ui message (use () to hide false-positives)"),
               ],
               # warnings
               [
                 # rules depending on implementation of repquote()
                 (r'(^| )pp +xxxxqq[ \n][^\n]', "add two newlines after '.. note::'"),
               ]
             ]
             # Filter for Python sources: a single verbose, multi-line regex that
             # matches either a '#' comment (group 'comment') or a string literal
             # (groups 'quote' and 'text'); every match is rewritten by reppython.
             pyfilters = [
                 (r"""(?msx)(?P<comment>\#.*?$)|
                      ((?P<quote>('''|\"\"\"|(?<!')'(?!')|(?<!")"(?!")))
                       (?P<text>(([^\\]|\\.)*?))
                       (?P=quote))""", reppython),
             ]
             # Plain text files are checked without any filtering.
             txtfilters = []
             # Patterns applied to .txt files: error-level patterns first,
             # warning-level patterns (none) second.
             txtpats = [
               [
                 # raw string so that "\s" is not an invalid string escape; the
                 # resulting pattern text is unchanged
                 (r'\s$', 'trailing whitespace'),
                 ('.. note::[ \n][^\n]', 'add two newlines after note::')
               ],
               []
             ]
             # Patterns applied to C sources and headers. The outer list has two
             # elements: the error-level patterns first, the warning-level patterns
             # (currently none) second. Each entry is (regex, message).
             cpats = [
               # errors
               [
                 (r'//', "don't use //-style comments"),
                 (r'^  ', "don't use spaces to indent"),
                 (r'\S\t', "don't use tabs except for indent"),
                 (r'(\S[ \t]+|^[ \t]+)\n', "trailing whitespace"),
                 (r'.{81}', "line too long"),
                 (r'(while|if|do|for)\(', "use space after while/if/do/for"),
                 (r'return\(', "return is not a function"),
                 (r' ;', "no space before ;"),
                 (r'[^;] \)', "no space before )"),
                 (r'[)][{]', "space between ) and {"),
                 (r'\w+\* \w+', "use int *foo, not int* foo"),
                 (r'\W\([^\)]+\) \w+', "use (int)foo, not (int) foo"),
                 (r'\w+ (\+\+|--)', "use foo++, not foo ++"),
                 (r'\w,\w', "missing whitespace after ,"),
                 (r'^[^#]\w[+/*]\w', "missing whitespace in expression"),
                 (r'\w\s=\s\s+\w', "gratuitous whitespace after ="),
                 (r'^#\s+\w', "use #foo, not # foo"),
                 (r'[^\n]\Z', "no trailing newline"),
                 (r'^\s*#import\b', "use only #include in standard C code"),
                 (r'strcpy\(', "don't use strcpy, use strlcpy or memcpy"),
                 (r'strcat\(', "don't use strcat"),
                 # rules depending on implementation of repquote()
               ],
               # warnings
               [
                 # rules depending on implementation of repquote()
               ]
             ]
             # (regex, replacement function) pairs paired with cpats in the 'c'
             # check. In list order they rewrite: /* */ comments (repccomment),
             # double-quoted string literals (repquote), #include <...> targets
             # (repinclude) and parenthesized text (repcallspaces).
             cfilters = [
                 (r'(/\*)(((\*(?!/))|[^*])*)\*/', repccomment),
                 (r'''(?P<quote>(?<!")")(?P<text>([^"]|\\")+)"(?!")''', repquote),
                 (r'''(#\s*include\s+<)([^>]+)>''', repinclude),
                 (r'(\()([^)]+\))', repcallspaces),
             ]
             # Each table below follows the same layout: a two-element list with
             # the error-level patterns first and the warning-level patterns second.

             # Layering rule: flag any use of "ui." (paired with mercurial/util.py
             # in the checks table).
             inutilpats = [
               [
                 (r'\bui\.', "don't use ui in util"),
               ],
               # warnings
               []
             ]
             # Layering rule: flag any use of "repo." (paired with
             # mercurial/revlog.py in the checks table).
             inrevlogpats = [
               [
                 (r'\brepo\.', "don't use repo in revlog"),
               ],
               # warnings
               []
             ]
             # Web templates are checked without any filtering.
             webtemplatefilters = []
             # Web template rules: no errors, one warning-level pattern.
             webtemplatepats = [
               [],
               [
                 (r'{desc(\|(?!websub|firstline)[^\|]*)+}',
                  'follow desc keyword with either firstline or websub'),
               ]
             ]
             # No filtering is applied before the all-files patterns.
             allfilesfilters = []
             # Patterns paired with the 'all except for .po' check: error-level
             # patterns first, warning-level patterns (none) second.
             allfilespats = [
               [
                 # the dot before "com" is escaped so that only the literal
                 # selenic.com domain is flagged, not e.g. "selenicxcom"
                 (r'(http|https)://[a-zA-Z0-9./]*selenic\.com/',
                  'use mercurial-scm.org domain URL'),
               ],
               # warnings
               [],
             ]
             # Python 3 portability rules: error-level patterns first,
             # warning-level patterns (none) second. Each entry is (regex, message).
             py3pats = [
               [
                 (r'os\.environ', "use encoding.environ instead (py3)"),
                 (r'os\.name', "use pycompat.osname instead (py3)"),
                 (r'os\.getcwd', "use pycompat.getcwd instead (py3)"),
                 (r'os\.sep', "use pycompat.ossep instead (py3)"),
                 (r'os\.pathsep', "use pycompat.ospathsep instead (py3)"),
                 (r'os\.altsep', "use pycompat.osaltsep instead (py3)"),
                 (r'sys\.platform', "use pycompat.sysplatform instead (py3)"),
                 (r'getopt\.getopt', "use pycompat.getoptb instead (py3)"),
                 (r'os\.getenv', "use encoding.environ.get instead"),
                 (r'os\.setenv', "modifying the environ dict is not preferred"),
               ],
               # warnings
               [],
             ]
             # Table of all checks. Each entry is a 5-tuple:
             #   (name, filename regex, magic regex, filters, patterns)
             # checkfile() applies an entry when the filename regex matches the
             # path (re.match) or when the magic regex is non-empty and is found in
             # the file content. The filters are then applied to the content and
             # the patterns searched in the filtered result.
             checks = [
                 ('python', r'.*\.(py|cgi)$', r'^#!.*python', pyfilters, pypats),
                 ('python 3', r'.*(hgext|mercurial).*(?<!pycompat)\.py', '',
                         pyfilters, py3pats),
                 ('test script', r'(.*/)?test-[^.~]*$', '', testfilters, testpats),
                 ('c', r'.*\.[ch]$', '', cfilters, cpats),
                 ('unified test', r'.*\.t$', '', utestfilters, utestpats),
                 ('layering violation repo in revlog', r'mercurial/revlog\.py', '',
                  pyfilters, inrevlogpats),
                 ('layering violation ui in util', r'mercurial/util\.py', '', pyfilters,
                  inutilpats),
                 ('txt', r'.*\.txt$', '', txtfilters, txtpats),
                 ('web template', r'mercurial/templates/.*\.tmpl', '',
                  webtemplatefilters, webtemplatepats),
                 ('all except for .po', r'.*(?<!\.po)$', '',
                  allfilesfilters, allfilespats),
             ]
             def _preparepats():
                 """Compile, in place, every pattern and filter listed in ``checks``.

                 Pattern sources are adjusted for multi-line searching before being
                 compiled with re.MULTILINE; filter regexes are compiled unchanged.
                 """
                 def fixup(source):
                     # \s doesn't match \n
                     source = re.sub(r'(?<!\\)\\s', r'[ \\t]', source)
                     # [^...] doesn't match newline
                     return re.sub(r'(?<!\\)\[\^', r'[^\\n', source)

                 for check in checks:
                     # the last element holds the [errors, warnings] pattern lists
                     for group in check[-1]:
                         group[:] = [
                             (re.compile(fixup(entry[0]), re.MULTILINE),) + entry[1:]
                             for entry in group]
                     filters = check[3]
                     filters[:] = [(re.compile(flt[0]), flt[1]) for flt in filters]
             class norepeatlogger(object):
                 """Logger that prints the location header of a line only once."""

                 def __init__(self):
                     # (fname, lineno, line) of the most recently printed header
                     self._lastseen = None

                 def log(self, fname, lineno, line, msg, blame):
                     """print an error related to a given line of a given file.

                     The location and the faulty line are printed only when they
                     differ from those of the previous call; the message is always
                     printed.

                     :fname: filename
                     :lineno: line number
                     :line: actual content of the line
                     :msg: error message
                     :blame: blame information added to the location when not empty
                     """
                     key = (fname, lineno, line)
                     if self._lastseen != key:
                         if not blame:
                             header = "%s:%d:" % (fname, lineno)
                         else:
                             header = "%s:%d (%s):" % (fname, lineno, blame)
                         print(header)
                         print(" > %s" % line)
                         self._lastseen = key
                     print(" " + msg)

             # logger used by default when reporting errors
             _defaultlogger = norepeatlogger()
             def getblame(f):
                 """Return annotate information for each line of file ``f``.

                 Runs ``hg annotate -un`` on ``f`` and returns a list with one
                 ``(line, user, rev)`` tuple per output line, where ``line`` is the
                 content without its trailing newline and ``user``/``rev`` are
                 strings. An empty list is returned when hg cannot be started.

                 The command is run from an argument list rather than through a
                 shell, so a file name containing spaces or shell metacharacters is
                 passed to hg unchanged instead of being interpreted.
                 """
                 import subprocess
                 try:
                     # '--' keeps a file name that starts with '-' from being
                     # parsed as an option
                     proc = subprocess.Popen(['hg', 'annotate', '-un', '--', f],
                                             stdout=subprocess.PIPE,
                                             universal_newlines=True)
                 except OSError:
                     # hg could not be started: report no blame information
                     return []
                 lines = []
                 try:
                     for l in proc.stdout:
                         start, line = l.split(':', 1)
                         user, rev = start.split()
                         # drop the space after ':' and the trailing newline
                         lines.append((line[1:-1], user, rev))
                 finally:
                     # always release the pipe and reap the child process
                     proc.stdout.close()
                     proc.wait()
                 return lines
             def checkfile(f, logfunc=_defaultlogger.log, maxerr=None, warnings=False,
                           blame=False, debug=False, lineno=True):
                 """checks style and portability of a given file

                 :f: filepath
                 :logfunc: function used to report error
                           logfunc(filename, linenumber, linecontent, errormessage,
                                   blame)
                 :maxerr: number of errors to display, for each check applied to
                          the file, before giving up on that check.
                          Set to a false value (default) to report all errors
                 :warnings: also apply the warning-level patterns of each check
                 :blame: look up who last changed each reported line (getblame())
                 :debug: print which checks are considered, skipped and applied
                 :lineno: pass the 1-based line number to logfunc; when false, the
                          false value itself is passed instead

                 return True if no error is found, False otherwise. True is also
                 returned when the file cannot be read or decoded. The string "Skip"
                 is returned when a check applies to a file carrying the skip
                 marker (see the comment in the body).
                 """
                 blamecache = None
                 result = True
                 try:
                     with opentext(f) as fp:
                         try:
                             # pre: pristine content; post: content after filtering
                             pre = post = fp.read()
                         except UnicodeDecodeError as e:
                             print("%s while reading %s" % (e, f))
                             return result
                 except IOError as e:
                     print("Skipping %s, %s" % (f, str(e).split(':', 1)[0]))
                     return result
                 for name, match, magic, filters, pats in checks:
                     post = pre # discard filtering result of previous check
                     if debug:
                         print(name, f)
                     # number of errors reported so far for this check
                     fc = 0
                     # a check applies when its filename regex matches the path or
                     # when its (non-empty) magic regex is found in the content
                     if not (re.match(match, f) or (magic and re.search(magic, pre))):
                         if debug:
                             print("Skipping %s for %s it doesn't match %s" % (
                                    name, match, f))
                         continue
                     if "no-" "check-code" in pre:
                         # If you're looking at this line, it's because a file has:
                         # no- check- code
                         # but the reason to output skipping is to make life for
                         # tests easier. So, instead of writing it with a normal
                         # spelling, we write it with the expected spelling from
                         # tests/test-check-code.t
                         print("Skipping %s it has no-che?k-code (glob)" % f)
                         return "Skip" # skip checking this file
                     for p, r in filters:
                         post = re.sub(p, r, post)
                     nerrs = len(pats[0]) # nerr elements are errors
                     if warnings:
                         pats = pats[0] + pats[1]
                     else:
                         pats = pats[0]
                     # print post # uncomment to show filtered version
                     if debug:
                         print("Checking %s for %s" % (name, f))
                     # line lists are only built once the first match is found
                     prelines = None
                     errors = []
                     for i, pat in enumerate(pats):
                         if len(pat) == 3:
                             p, msg, ignore = pat
                         else:
                             p, msg = pat
                             ignore = None
                         # patterns at index nerrs and above are the warnings
                         if i >= nerrs:
                             msg = "warning: " + msg
                         # pos: offset in post of the start of line n
                         # n: 0-based index of the line holding the current match
                         pos = 0
                         n = 0
                         for m in p.finditer(post):
                             if prelines is None:
                                 prelines = pre.splitlines()
                                 postlines = post.splitlines(True)
                             start = m.start()
                             # advance (pos, n) to the line containing the match start
                             while n < len(postlines):
                                 step = len(postlines[n])
                                 if pos + step > start:
                                     break
                                 pos += step
                                 n += 1
                             # report the unfiltered text of the matching line
                             l = prelines[n]
                             if ignore and re.search(ignore, l, re.MULTILINE):
                                 if debug:
                                     print("Skipping %s for %s:%s (ignore pattern)" % (
                                         name, f, n))
                                 continue
                             bd = ""
                             if blame:
                                 bd = 'working directory'
                                 # NOTE(review): an empty getblame() result is falsy,
                                 # so it is looked up again for every reported match
                                 if not blamecache:
                                     blamecache = getblame(f)
                                 if n < len(blamecache):
                                     bl, bu, br = blamecache[n]
                                     # only trust the annotation when the annotated
                                     # line equals the current line content
                                     if bl == l:
                                         bd = '%s@%s' % (bu, br)
                             errors.append((f, lineno and n + 1, l, msg, bd))
                             result = False
                     errors.sort()
                     for e in errors:
                         logfunc(*e)
                         fc += 1
                         if maxerr and fc >= maxerr:
                             print(" (too many errors, giving up)")
                             # only stops reporting for the current check
                             break
                 return result
             def main():
                 """Parse the command line, check every requested file and return
                 the process exit status.
                 With no file arguments, everything matched by ``*`` in the current
                 directory is checked. Returns 1 if checkfile() returned a false
                 value for any file, 0 otherwise.
                 """
                 parser = optparse.OptionParser("%prog [options] [files]")
                 parser.add_option("-w", "--warnings", action="store_true",
                                   help="include warning-level checks")
                 parser.add_option("-p", "--per-file", type="int",
                                   help="max warnings per file")
                 parser.add_option("-b", "--blame", action="store_true",
                                   help="use annotate to generate blame info")
                 parser.add_option("", "--debug", action="store_true",
                                   help="show debug information")
                 parser.add_option("", "--nolineno", action="store_false",
                                   dest='lineno', help="don't show line numbers")
                 parser.set_defaults(per_file=15, warnings=False, blame=False, debug=False,
                                     lineno=True)
                 options, args = parser.parse_args()
                 # an empty argument list means "check everything in this directory"
                 check = args or glob.glob("*")
                 _preparepats()
                 ret = 0
                 for f in check:
                     passed = checkfile(f, maxerr=options.per_file,
                                        warnings=options.warnings,
                                        blame=options.blame, debug=options.debug,
                                        lineno=options.lineno)
                     if not passed:
                         # keep going so every file gets reported
                         ret = 1
                 return ret
             # Script entry point: the value returned by main() becomes the exit status.
             if __name__ == "__main__":
                 sys.exit(main())

hgext/largefiles/lfutil.py

0 +6 -5

             # Copyright 2009-2010 Gregory P. Ward
             # Copyright 2009-2010 Intelerad Medical Systems Incorporated
             # Copyright 2010-2011 Fog Creek Software
             # Copyright 2010-2011 Unity Technologies
             #
             # This software may be used and distributed according to the terms of the
             # GNU General Public License version 2 or any later version.
             '''largefiles utility code: must not import other modules in this package.'''
             from __future__ import absolute_import
             import copy
             import hashlib
             import os
             import platform
             import stat
             from mercurial.i18n import _
             from mercurial import (
                 dirstate,
+                encoding,
                 error,
                 httpconnection,
                 match as matchmod,
                 node,
                 pycompat,
                 scmutil,
                 util,
             )
             # Name of the directory that holds standins; standin() and splitstandin()
             # add/strip it as the first path component.
             shortname = '.hglf'
             # Same name with a trailing '/', used as the standin path prefix.
             shortnameslash = shortname + '/'
             # Used as the config section name and as the store/cache directory name.
             longname = 'largefiles'
             # -- Private worker functions ------------------------------------------
             def getminsize(ui, assumelfiles, opt, default=10):
                 '''Return the minimum largefile size to use.
                 ``opt`` is used when it is truthy. Otherwise, if ``assumelfiles``
                 is set, the ``minsize`` setting of the ``largefiles`` config
                 section is consulted, with ``default`` as its fallback.
                 A truthy value is converted to float; a falsy value other than
                 None is returned unchanged. Aborts when the value is not a number
                 or when no value is available at all.
                 '''
                 size = opt
                 if assumelfiles and not size:
                     size = ui.config(longname, 'minsize', default=default)
                 if size is None:
                     raise error.Abort(_('minimum size for largefiles must be specified'))
                 if not size:
                     # falsy but not None (e.g. 0 or ''): handed back unconverted
                     return size
                 try:
                     return float(size)
                 except ValueError:
                     raise error.Abort(_('largefiles: size must be number (not %s)\n')
                                       % size)
             def link(src, dest):
                 """Hardlink src to dest; if hardlinking fails, copy the data instead."""
                 destdir = os.path.dirname(dest)
                 util.makedirs(destdir)
                 try:
                     util.oslink(src, dest)
                 except OSError:
                     # no hardlink possible: stream the content through an atomic
                     # temp file, then mirror the source's mode bits
                     with open(src, 'rb') as source:
                         with util.atomictempfile(dest) as target:
                             for block in util.filechunkiter(source):
                                 target.write(block)
                     srcmode = os.stat(src).st_mode
                     os.chmod(dest, srcmode)
             def usercachepath(ui, hash):
                 '''Return the path, inside the "global" largefiles cache, of the
                 file with the given hash.
                 The cache is shared between repositories to save both download
                 bandwidth and storage space.'''
                 cachedir = _usercachedir(ui)
                 return os.path.join(cachedir, hash)
             def _usercachedir(ui):
                 '''Return the location of the "global" largefiles cache.
                 The ``usercache`` setting of the largefiles config section wins
                 when set. Otherwise a per-platform default is derived from
                 environment variables. Aborts when the platform is not recognized
                 or when none of the consulted variables yields a value.'''
                 path = ui.configpath(longname, 'usercache', None)
                 if path:
                     return path
                 if pycompat.osname == 'nt':
                     # Windows: LOCALAPPDATA, falling back to APPDATA
-                    appdata = pycompat.osgetenv('LOCALAPPDATA',\
+                    appdata = encoding.environ.get('LOCALAPPDATA',\
-                                    pycompat.osgetenv('APPDATA'))
+                                    encoding.environ.get('APPDATA'))
                     if appdata:
                         return os.path.join(appdata, longname)
                 elif platform.system() == 'Darwin':
                     # macOS: $HOME/Library/Caches/<longname>
-                    home = pycompat.osgetenv('HOME')
+                    home = encoding.environ.get('HOME')
                     if home:
                         return os.path.join(home, 'Library', 'Caches', longname)
                 elif pycompat.osname == 'posix':
                     # other POSIX: XDG_CACHE_HOME first, then $HOME/.cache
-                    path = pycompat.osgetenv('XDG_CACHE_HOME')
+                    path = encoding.environ.get('XDG_CACHE_HOME')
                     if path:
                         return os.path.join(path, longname)
-                    home = pycompat.osgetenv('HOME')
+                    home = encoding.environ.get('HOME')
                     if home:
                         return os.path.join(home, '.cache', longname)
                 else:
                     raise error.Abort(_('unknown operating system: %s\n')
                                       % pycompat.osname)
                 # known platform, but none of its environment variables was usable
                 raise error.Abort(_('unknown %s usercache location') % longname)
             def inusercache(ui, hash):
                 '''Return True if the user cache path for the given hash exists.'''
                 return os.path.exists(usercachepath(ui, hash))
             def findfile(repo, hash):
                 '''Return the store path of the largefile with the given hash, or
                 None if it is available neither in the store nor in the user cache.
                 When the file is only in the user cache, it is linked into the
                 store as a side effect.'''
                 storefile, found = findstorepath(repo, hash)
                 if found:
                     repo.ui.note(_('found %s in store\n') % hash)
                     return storefile
                 if not inusercache(repo.ui, hash):
                     return None
                 repo.ui.note(_('found %s in system cache\n') % hash)
                 storefile = storepath(repo, hash)
                 link(usercachepath(repo.ui, hash), storefile)
                 return storefile
             class largefilesdirstate(dirstate.dirstate):
                 '''dirstate subclass used for tracking largefiles.
                 Every path-taking method below passes its argument through
                 unixpath() before delegating to the base class.'''
                 def __getitem__(self, key):
                     return super(largefilesdirstate, self).__getitem__(unixpath(key))
                 def normal(self, f):
                     return super(largefilesdirstate, self).normal(unixpath(f))
                 def remove(self, f):
                     return super(largefilesdirstate, self).remove(unixpath(f))
                 def add(self, f):
                     return super(largefilesdirstate, self).add(unixpath(f))
                 def drop(self, f):
                     return super(largefilesdirstate, self).drop(unixpath(f))
                 def forget(self, f):
                     return super(largefilesdirstate, self).forget(unixpath(f))
                 def normallookup(self, f):
                     return super(largefilesdirstate, self).normallookup(unixpath(f))
                 def _ignore(self, f):
                     # nothing is ever treated as ignored by this dirstate
                     return False
                 def write(self, tr=False):
                     # ``tr`` is accepted but not used: None is always passed on.
                     # (1) disable PENDING mode always
                     #     (lfdirstate isn't yet managed as a part of the transaction)
                     # (2) avoid develwarn 'use dirstate.write with ....'
                     super(largefilesdirstate, self).write(None)
             def openlfdirstate(ui, repo, create=True):
                 '''
                 Return the dirstate object that tracks largefiles. Its root is the
                 repo root, but it is stored in .hg/largefiles/dirstate.
                 With ``create`` set, a missing largefiles dirstate is populated
                 from the standins known to the regular dirstate.
                 '''
                 vfs = repo.vfs
                 lfstoredir = longname
                 opener = scmutil.opener(vfs.join(lfstoredir))
                 lfdirstate = largefilesdirstate(opener, ui, repo.root,
                                                  repo.dirstate._validate)
                 if not create or vfs.exists(vfs.join(lfstoredir, 'dirstate')):
                     return lfdirstate
                 # First meaningful largefiles operation in a new clone: seed the
                 # largefiles dirstate from the existing standins.
                 matcher = getstandinmatcher(repo)
                 standins = repo.dirstate.walk(matcher, [], False, False)
                 if standins:
                     vfs.makedirs(lfstoredir)
                 for fstandin in standins:
                     lfdirstate.normallookup(splitstandin(fstandin))
                 return lfdirstate
             def lfdirstatestatus(lfdirstate, repo):
                 '''Return the status of lfdirstate with every "unsure" file resolved.
                 An unsure largefile is clean when the stripped content of its
                 standin in ``repo['.']`` equals the hash of the file in the working
                 directory; otherwise it is added to the modified list.'''
                 wctx = repo['.']
                 match = matchmod.always(repo.root, repo.getcwd())
                 unsure, s = lfdirstate.status(match, [], False, False, False)
                 modified, clean = s.modified, s.clean
                 for lfile in unsure:
                     try:
                         fctx = wctx[standin(lfile)]
                     except LookupError:
                         fctx = None
                     if fctx and fctx.data().strip() == hashfile(repo.wjoin(lfile)):
                         clean.append(lfile)
                         lfdirstate.normal(lfile)
                     else:
                         modified.append(lfile)
                 return s
             def listlfiles(repo, rev=None, matcher=None):
                 '''Return the list of largefiles in the working copy (rev is None)
                 or in the given changeset.'''
                 if matcher is None:
                     matcher = getstandinmatcher(repo)
                 lfiles = []
                 for f in repo[rev].walk(matcher):
                     # in the working directory, skip files unknown to the dirstate
                     if rev is None and repo.dirstate[f] == '?':
                         continue
                     lfiles.append(splitstandin(f))
                 return lfiles
             def instore(repo, hash, forcelocal=False):
                 '''Return true if the store path for the given hash exists.'''
                 location = storepath(repo, hash, forcelocal)
                 return os.path.exists(location)
             def storepath(repo, hash, forcelocal=False):
                 '''Return the location, in the repository largefiles store, of the
                 file with the given hash.
                 For a shared repo the share source's store is used unless
                 ``forcelocal`` is set.'''
                 if forcelocal or not repo.shared():
                     return repo.join(longname, hash)
                 return repo.vfs.reljoin(repo.sharedpath, longname, hash)
             def findstorepath(repo, hash):
                 '''Look for the file with the given hash in the local store path(s).
                 Returns a (path, exists) tuple. When the file is not found, the
                 path is its location in the primary store.
                 '''
                 # For shared repos the primary store lives in the share source; for
                 # backward compatibility the local store is tried as a fallback.
                 primary = storepath(repo, hash, False)
                 if instore(repo, hash):
                     return (primary, True)
                 if repo.shared() and instore(repo, hash, True):
                     return (storepath(repo, hash, True), True)
                 return (primary, False)
             def copyfromcache(repo, hash, filename):
                 '''Copy the largefile with the given hash from the repo store or
                 the system cache to filename in the working directory.
                 Return true on success. Return false if the file was found in
                 neither place (which should not happen: callers are expected to
                 ensure the largefile is available first) or if the copied data
                 does not hash to ``hash``; in the latter case the written file is
                 removed again.'''
                 wvfs = repo.wvfs
                 path = findfile(repo, hash)
                 if path is None:
                     return False
                 wvfs.makedirs(wvfs.dirname(wvfs.join(filename)))
                 # Writes into the working copy are not atomic, so a failure may
                 # leave a partially written file behind.
                 with open(path, 'rb') as srcfd:
                     with wvfs(filename, 'wb') as destfd:
                         chunks = util.filechunkiter(srcfd)
                         gothash = copyandhash(chunks, destfd)
                 if gothash == hash:
                     return True
                 repo.ui.warn(_('%s: data corruption in %s with hash %s\n')
                              % (filename, path, gothash))
                 wvfs.unlink(filename)
                 return False
             def copytostore(repo, rev, file, uploaded=False):
                 '''Copy the working-directory largefile ``file`` into the store,
                 under the hash recorded in its standin at ``rev``.
                 Does nothing if the store already has that hash; warns if the file
                 does not exist in the working directory.'''
                 wvfs = repo.wvfs
                 hash = readstandin(repo, file, rev)
                 if instore(repo, hash):
                     return
                 if not wvfs.exists(file):
                     repo.ui.warn(_("%s: largefile %s not available from local store\n") %
                                  (file, hash))
                     return
                 copytostoreabsolute(repo, wvfs.join(file), hash)
             def copyalltostore(repo, node):
                 '''Copy to the store every largefile whose standin is both listed
                 in the files of the given revision and present in its manifest.'''
                 ctx = repo[node]
                 for filename in ctx.files():
                     if not isstandin(filename):
                         continue
                     if filename not in ctx.manifest():
                         continue
                     realfile = splitstandin(filename)
                     copytostore(repo, ctx.node(), realfile)
             def copytostoreabsolute(repo, file, hash):
                 '''Put the content of ``file`` into the store under ``hash``.
                 If the user cache already has the hash, it is linked from there;
                 otherwise the file is copied and then linked into the user cache.'''
                 if inusercache(repo.ui, hash):
                     link(usercachepath(repo.ui, hash), storepath(repo, hash))
                     return
                 target = storepath(repo, hash)
                 util.makedirs(os.path.dirname(target))
                 with open(file, 'rb') as srcf:
                     with util.atomictempfile(target,
                                              createmode=repo.store.createmode) as dstf:
                         for chunk in util.filechunkiter(srcf):
                             dstf.write(chunk)
                 linktousercache(repo, hash)
             def linktousercache(repo, hash):
                 '''Link (or copy) the largefile with the given hash from the store
                 into the user cache.'''
                 cachefile = usercachepath(repo.ui, hash)
                 link(storepath(repo, hash), cachefile)
             def getstandinmatcher(repo, rmatcher=None):
                 '''Return a match object that applies rmatcher to the standin
                 directory. Without a restricting rmatcher, the whole standin
                 directory is matched.'''
                 wvfs = repo.wvfs
                 standindir = shortname
                 def badfn(f, msg):
                     # no warnings about missing files or directories
                     return None
                 if not rmatcher or rmatcher.always():
                     # no patterns: relative to repo root
                     return scmutil.match(repo[None], [wvfs.join(standindir)],
                                          badfn=badfn)
                 pats = [wvfs.join(standindir, pat) for pat in rmatcher.files()]
                 if not pats:
                     pats = [wvfs.join(standindir)]
                 match = scmutil.match(repo[None], pats, badfn=badfn)
                 # if pats is empty, it would incorrectly always match, so clear _always
                 match._always = False
                 return match
             def composestandinmatcher(repo, rmatcher):
                 '''Return a matcher accepting the standins of the files accepted by
                 rmatcher. The files listed in rmatcher are passed on as the paths
                 specified by the user.'''
                 smatcher = getstandinmatcher(repo, rmatcher)
                 standinfn = smatcher.matchfn
                 def composedmatchfn(f):
                     accepted = standinfn(f)
                     if accepted:
                         # a standin: let rmatcher decide on the real file name
                         accepted = rmatcher.matchfn(splitstandin(f))
                     return accepted
                 smatcher.matchfn = composedmatchfn
                 return smatcher
             def standin(filename):
                 '''Return the repo-relative path of the standin for the given big
                 file.'''
                 # The result is deliberately repo-relative: callers that need an
                 # absolute path can apply repo.wjoin() themselves, while others
                 # (e.g. addlargefiles) pass it straight to repo[None].add().
                 # Separators are converted to '/' first, since that is what
                 # dirstate uses even on Windows and the name may come from an
                 # external source such as the command line.
                 converted = util.pconvert(filename)
                 return shortnameslash + converted
             def isstandin(filename):
                 '''Return true if filename, given in Mercurial's internal
                 (slash-separated) form, names a big file standin.'''
                 prefix = shortnameslash
                 return filename.startswith(prefix)
             def splitstandin(filename):
                 '''Return the largefile name for the given standin path, or None if
                 the path is not below the standin directory.'''
                 # dirstate always uses '/', even on Windows; convert first in case
                 # the name came from an external source (like the command line).
                 parts = util.pconvert(filename).split('/', 1)
                 if len(parts) != 2 or parts[0] != shortname:
                     return None
                 return parts[1]
             def updatestandin(repo, standin):
                 '''Rewrite the given standin from the current hash and executable
                 state of its largefile. Aborts if the largefile does not exist in
                 the working directory.'''
                 lfile = splitstandin(standin)
                 file = repo.wjoin(lfile)
                 if not repo.wvfs.exists(lfile):
                     raise error.Abort(_('%s: file not found!') % lfile)
                 hash = hashfile(file)
                 executable = getexecutable(file)
                 writestandin(repo, standin, hash, executable)
             def readstandin(repo, filename, node=None):
                 '''Return the hex hash stored in the standin for filename at the
                 given node (the working directory when no node is given).'''
                 fctx = repo[node][standin(filename)]
                 return fctx.data().strip()
             def writestandin(repo, standin, hash, executable):
                 '''Write hash, followed by a newline, to <repo.root>/<standin>.'''
                 flags = 'x' if executable else ''
                 repo.wwrite(standin, hash + '\n', flags)
             def copyandhash(instream, outfile):
                 '''Read bytes from instream (iterable) and write them to outfile,
                 computing the SHA-1 hash of the data along the way. Return the hash
                 as a hex digest string.'''
                 # Start from an empty hasher: passing '' is a TypeError on Python 3,
                 # where hashlib only accepts bytes-like input.
                 hasher = hashlib.sha1()
                 for data in instream:
                     hasher.update(data)
                     outfile.write(data)
                 return hasher.hexdigest()
             def hashrepofile(repo, file):
                 '''Return hashfile() of ``file`` resolved through repo.wjoin().'''
                 fullpath = repo.wjoin(file)
                 return hashfile(fullpath)
             def hashfile(file):
                 '''Return the hex SHA-1 digest of the content of ``file``, or ''
                 if the path does not exist.'''
                 if not os.path.exists(file):
                     return ''
                 # Start from an empty hasher: passing '' is a TypeError on Python 3,
                 # where hashlib only accepts bytes-like input.
                 hasher = hashlib.sha1()
                 with open(file, 'rb') as fd:
                     for data in util.filechunkiter(fd):
                         hasher.update(data)
                 return hasher.hexdigest()
             def getexecutable(filename):
                 '''Return a true value only if filename has the execute bit set for
                 user, group and others alike.'''
                 mode = os.stat(filename).st_mode
                 for bit in (stat.S_IXUSR, stat.S_IXGRP, stat.S_IXOTH):
                     masked = mode & bit
                     if not masked:
                         # first missing execute bit decides the result
                         return masked
                 return masked
             def urljoin(first, second, *arg):
                 '''Join the given URL pieces from left to right.
                 At each step a '/' is appended to the left part unless it already
                 ends with one, and a single leading '/' is dropped from the right
                 part.'''
                 url = first
                 for piece in (second,) + arg:
                     if not url.endswith('/'):
                         url += '/'
                     if piece.startswith('/'):
                         piece = piece[1:]
                     url += piece
                 return url
             def hexsha1(data):
                 """Return the hex-encoded SHA-1 sum of the content of the file-like
                 object data."""
                 digest = hashlib.sha1()
                 for block in util.filechunkiter(data):
                     digest.update(block)
                 return digest.hexdigest()
             def httpsendfile(ui, filename):
                 '''Return an httpconnection.httpsendfile for filename, opened with
                 mode 'rb'.'''
                 mode = 'rb'
                 return httpconnection.httpsendfile(ui, filename, mode)
             def unixpath(path):
                 '''Return path in the normalized form used with the lfdirstate.'''
                 normalized = os.path.normpath(path)
                 return util.pconvert(normalized)
             def islfilesrepo(repo):
                 '''Return true if the repo is a largefile repo.'''
                 if 'largefiles' in repo.requirements:
                     # any store data file below the standin directory is enough
                     for f in repo.store.datafiles():
                         if shortnameslash in f[0]:
                             return True
                 # otherwise: does the existing largefiles dirstate track anything?
                 return any(openlfdirstate(repo.ui, repo, False))
             class storeprotonotcapable(Exception):
                 '''Exception carrying a ``storetypes`` attribute.'''
                 def __init__(self, storetypes):
                     # only the attribute is recorded; Exception.__init__ is not called
                     self.storetypes = storetypes
             def getstandinsstate(repo):
                 '''Return a list of (largefile, hash) pairs for the standins known
                 to the dirstate. The hash is None when reading the standin raises
                 IOError.'''
                 state = []
                 walked = repo.dirstate.walk(getstandinmatcher(repo), [], False, False)
                 for fstandin in walked:
                     lfile = splitstandin(fstandin)
                     try:
                         hash = readstandin(repo, lfile)
                     except IOError:
                         hash = None
                     state.append((lfile, hash))
                 return state
             def synclfdirstate(repo, lfdirstate, lfile, normallookup):
                 '''Make the lfdirstate entry of lfile mirror the state of its
                 standin in the repo dirstate.'''
                 lfstandin = standin(lfile)
                 state, mtime = '?', -1
                 if lfstandin in repo.dirstate:
                     entry = repo.dirstate._map[lfstandin]
                     state, mtime = entry[0], entry[3]
                 if state == 'n':
                     # state 'n' doesn't ensure 'clean' when a lookup was requested,
                     # the mtime is unset or the largefile is missing
                     needslookup = (normallookup or mtime < 0 or
                                    not repo.wvfs.exists(lfile))
                     if needslookup:
                         lfdirstate.normallookup(lfile)
                     else:
                         lfdirstate.normal(lfile)
                 elif state == 'm':
                     lfdirstate.normallookup(lfile)
                 elif state == 'r':
                     lfdirstate.remove(lfile)
                 elif state == 'a':
                     lfdirstate.add(lfile)
                 elif state == '?':
                     lfdirstate.drop(lfile)
             def markcommitted(orig, ctx, node):
                 '''Call orig(node), then sync the lfdirstate for every standin in
                 ctx.files() and copy the committed largefiles into the store.'''
                 repo = ctx.repo()
                 orig(node)
                 # ATTENTION: "ctx.files()" may differ from "repo[node].files()"
                 # because files coming from the 2nd parent are omitted in the latter.
                 #
                 # The former should be used to get targets of "synclfdirstate",
                 # because such files:
                 # - are marked as "a" by "patch.patch()" (e.g. via transplant), and
                 # - have to be marked as "n" after commit, but
                 # - aren't listed in "repo[node].files()"
                 lfdirstate = openlfdirstate(repo.ui, repo)
                 for f in ctx.files():
                     if not isstandin(f):
                         continue
                     synclfdirstate(repo, lfdirstate, splitstandin(f), False)
                 lfdirstate.write()
                 # As part of committing, copy all of the largefiles into the cache.
                 copyalltostore(repo, node)
             def getlfilestoupdate(oldstandins, newstandins):
                 '''Return the distinct first elements of the entries that appear in
                 exactly one of oldstandins and newstandins.
                 Each name is listed once, even when it occurs in both inputs with
                 different remaining fields.'''
                 changedstandins = set(oldstandins).symmetric_difference(set(newstandins))
                 filelist = []
                 # set-based duplicate check: avoids rescanning filelist per entry
                 seen = set()
                 for f in changedstandins:
                     lfile = f[0]
                     if lfile not in seen:
                         seen.add(lfile)
                         filelist.append(lfile)
                 return filelist
             def getlfilestoupload(repo, missing, addfunc):
                 '''Call addfunc(standin, content) for the standins touched by the
                 revisions in ``missing``.
                 ``content`` is the stripped data of the standin in that revision
                 (presumably the largefile hash, as in readstandin()). Progress is
                 reported through repo.ui.progress().'''
                 for i, n in enumerate(missing):
                     repo.ui.progress(_('finding outgoing largefiles'), i,
                         unit=_('revisions'), total=len(missing))
                     parents = [p for p in repo[n].parents() if p != node.nullid]
                     # look the changeset up with repo.lfstatus switched off, and
                     # restore the previous value whatever happens
                     oldlfstatus = repo.lfstatus
                     repo.lfstatus = False
                     try:
                         ctx = repo[n]
                     finally:
                         repo.lfstatus = oldlfstatus
                     files = set(ctx.files())
                     if len(parents) == 2:
                         # two parents: also consider files missing from this
                         # manifest and files that differ from either parent
                         mc = ctx.manifest()
                         mp1 = ctx.parents()[0].manifest()
                         mp2 = ctx.parents()[1].manifest()
                         for f in mp1:
                             if f not in mc:
                                 files.add(f)
                         for f in mp2:
                             if f not in mc:
                                 files.add(f)
                         for f in mc:
                             if mc[f] != mp1.get(f, None) or mc[f] != mp2.get(f, None):
                                 files.add(f)
                     for fn in files:
                         # only standins that actually exist in this changeset
                         if isstandin(fn) and fn in ctx:
                             addfunc(fn, ctx[fn].data().strip())
                 # a position of None ends the progress output
                 repo.ui.progress(_('finding outgoing largefiles'), None)
             def updatestandinsbymatch(repo, match):
                 '''Update standins in the working directory according to specified match
                 This returns (possibly modified) ``match`` object to be used for
                 subsequent commit process.
                 When ``match`` is None or matches everything, only the standins of
                 largefiles reported as dirty by the lfdirstate are refreshed and
                 ``match`` is returned as is. Otherwise the standins selected by
                 ``match`` are refreshed and a copy of ``match`` with adjusted file
                 list and match function is returned.
                 '''
                 ui = repo.ui
                 # Case 1: user calls commit with no specific files or
                 # include/exclude patterns: refresh and commit all files that
                 # are "dirty".
                 if match is None or match.always():
                     # Spend a bit of time here to get a list of files we know
                     # are modified so we can compare only against those.
                     # It can cost a lot of time (several seconds)
                     # otherwise to update all standins if the largefiles are
                     # large.
                     lfdirstate = openlfdirstate(ui, repo)
                     dirtymatch = matchmod.always(repo.root, repo.getcwd())
                     unsure, s = lfdirstate.status(dirtymatch, [], False, False,
                                                   False)
                     modifiedfiles = unsure + s.modified + s.added + s.removed
                     lfiles = listlfiles(repo)
                     # this only loops through largefiles that exist (not
                     # removed/renamed)
                     for lfile in lfiles:
                         if lfile in modifiedfiles:
                             if repo.wvfs.exists(standin(lfile)):
                                 # this handles the case where a rebase is being
                                 # performed and the working copy is not updated
                                 # yet.
                                 if repo.wvfs.exists(lfile):
                                     updatestandin(repo,
                                         standin(lfile))
                     return match
                 lfiles = listlfiles(repo)
                 # NOTE: this assigns to the caller's match object, before the
                 # copy.copy() further down
                 match._files = repo._subdirlfs(match.files(), lfiles)
                 # Case 2: user calls commit with specified patterns: refresh
                 # any matching big files.
                 smatcher = composestandinmatcher(repo, match)
                 standins = repo.dirstate.walk(smatcher, [], False, False)
                 # No matching big files: get out of the way and pass control to
                 # the usual commit() method.
                 if not standins:
                     return match
                 # Refresh all matching big files.  It's possible that the
                 # commit will end up failing, in which case the big files will
                 # stay refreshed.  No harm done: the user modified them and
                 # asked to commit them, so sooner or later we're going to
                 # refresh the standins.  Might as well leave them refreshed.
                 lfdirstate = openlfdirstate(ui, repo)
                 for fstandin in standins:
                     lfile = splitstandin(fstandin)
                     if lfdirstate[lfile] != 'r':
                         updatestandin(repo, fstandin)
                 # Cook up a new matcher that only matches regular files or
                 # standins corresponding to the big files requested by the
                 # user.  Have to modify _files to prevent commit() from
                 # complaining "not tracked" for big files.
                 match = copy.copy(match)
                 origmatchfn = match.matchfn
                 # Check both the list of largefiles and the list of
                 # standins because if a largefile was removed, it
                 # won't be in the list of largefiles at this point
                 match._files += sorted(standins)
                 actualfiles = []
                 for f in match._files:
                     fstandin = standin(f)
                     # For largefiles, only one of the normal and standin should be
                     # committed (except if one of them is a remove).  In the case of a
                     # standin removal, drop the normal file if it is unknown to dirstate.
                     # Thus, skip plain largefile names but keep the standin.
                     if f in lfiles or fstandin in standins:
                         if repo.dirstate[fstandin] != 'r':
                             if repo.dirstate[f] != 'r':
                                 continue
                         elif repo.dirstate[f] == '?':
                             continue
                     actualfiles.append(f)
                 match._files = actualfiles
                 def matchfn(f):
                     # files accepted by the original matcher pass unless they are
                     # largefiles; everything else passes only if it is a standin
                     if origmatchfn(f):
                         return f not in lfiles
                     else:
                         return f in standins
                 match.matchfn = matchfn
                 return match
             class automatedcommithook(object):
                 '''Commit hook that refreshes standins once after resuming

                 While an automated operation (rebase, transplant and so on) is
                 creating commits, standins should already be updated before each
                 commit, so rewriting them in the working directory is avoided for
                 efficiency.  The first commit after resuming such an operation
                 (e.g. ``rebase --continue``) is the exception: largefiles may
                 have been modified manually, so standins are updated exactly once.
                 '''

                 def __init__(self, resuming):
                     # stays true until the first commit after resuming is handled
                     self.resuming = resuming

                 def __call__(self, repo, match):
                     if not self.resuming:
                         return match
                     # one-shot: subsequent commits must not update standins again
                     self.resuming = False
                     return updatestandinsbymatch(repo, match)
             def getstatuswriter(ui, repo, forcibly=None):
                 '''Pick the function used to report largefiles specific status

                 With ``forcibly`` left as ``None`` on a repo that has the
                 ``_largefilesenabled`` attribute, the last element of
                 ``repo._lfstatuswriters`` is returned as the "default" writer.

                 In every other case the choice is forced: a true ``forcibly``
                 yields ``ui.status`` and anything else yields a writer that
                 discards its arguments.
                 '''
                 if forcibly is None and util.safehasattr(repo, '_largefilesenabled'):
                     return repo._lfstatuswriters[-1]
                 if forcibly:
                     return ui.status # forcibly WRITE OUT

                 def ignorestatus(*msg, **opts):
                     # forcibly IGNORE
                     return None
                 return ignorestatus

mercurial/profiling.py

0 +2 -2

             # profiling.py - profiling functions
             #
             # Copyright 2016 Gregory Szorc <gregory.szorc@gmail.com>
             #
             # This software may be used and distributed according to the terms of the
             # GNU General Public License version 2 or any later version.
             from __future__ import absolute_import, print_function
             import contextlib
             import time
             from .i18n import _
             from . import (
+                encoding,
                 error,
-                pycompat,
                 util,
             )
             @contextlib.contextmanager
             def lsprofile(ui, fp):
                 """Profile the wrapped block with lsprof and write a report to fp.

                 The report format, sort field and limits are read from the
                 ``profiling`` config section. An unknown format triggers a warning
                 and falls back to 'text'. Aborts if lsprof cannot be imported.
                 """
                 outformat = ui.config('profiling', 'format', default='text')
                 sortfield = ui.config('profiling', 'sort', default='inlinetime')
                 limit = ui.configint('profiling', 'limit', default=30)
                 climit = ui.configint('profiling', 'nested', default=0)
                 if outformat not in ('text', 'kcachegrind'):
                     ui.warn(_("unrecognized profiling format '%s'"
                                 " - Ignored\n") % outformat)
                     outformat = 'text'
                 try:
                     from . import lsprof
                 except ImportError:
                     raise error.Abort(_(
                         'lsprof not available - install from '
                         'http://codespeak.net/svn/user/arigo/hack/misc/lsprof/'))
                 profiler = lsprof.Profiler()
                 profiler.enable(subcalls=True)
                 try:
                     yield
                 finally:
                     # always stop and report, even if the profiled code raised
                     profiler.disable()
                     if outformat != 'kcachegrind':
                         # only 'text' is left at this point
                         report = lsprof.Stats(profiler.getstats())
                         report.sort(sortfield)
                         report.pprint(limit=limit, file=fp, climit=climit)
                     else:
                         from . import lsprofcalltree
                         lsprofcalltree.KCacheGrind(profiler).output(fp)
             @contextlib.contextmanager
             def flameprofile(ui, fp):
                 """Sample the wrapped block with flamegraph, writing stacks to fp.

                 The sampling frequency is read from the developer config
                 ``profiling.freq`` (default 1000). A one-line summary of the
                 collected frames is printed when the block exits. Aborts if the
                 flamegraph package cannot be imported.
                 """
                 try:
                     from flamegraph import flamegraph
                 except ImportError:
                     raise error.Abort(_(
                         'flamegraph not available - install from '
                         'https://github.com/evanhempel/python-flamegraph'))
                 # developer config: profiling.freq
                 freq = ui.configint('profiling', 'freq', default=1000)
                 filter_ = None
                 collapse_recursion = True
                 thread = flamegraph.ProfileThread(fp, 1.0 / freq,
                                                   filter_, collapse_recursion)
                 # NOTE(review): time.clock() no longer exists on Python >= 3.8;
                 # kept as-is here so the measured quantity is unchanged.
                 start_time = time.clock()
                 try:
                     thread.start()
                     yield
                 finally:
                     thread.stop()
                     thread.join()
                     elapsed = time.clock() - start_time
                     # argument order must follow the placeholders: total frames,
                     # unique frames, then elapsed seconds
                     print('Collected %d stack frames (%d unique) in %2.2f seconds.' % (
                         thread.num_frames(), thread.num_frames(unique=True),
                         elapsed))
             @contextlib.contextmanager
             def statprofile(ui, fp):
                 """Profile the wrapped block with statprof and display results on fp.

                 ``profiling.freq`` sets the sampling frequency and
                 ``profiling.statformat`` selects the display format; an unknown
                 format is reported and replaced by the hotpath display.
                 """
                 from . import statprof
                 freq = ui.configint('profiling', 'freq', default=1000)
                 if not freq > 0:
                     ui.warn(_("invalid sampling frequency '%s' - ignoring\n") % freq)
                 elif statprof.state.profile_level == 0:
                     # Cannot reset when profiler is already active. So silently no-op.
                     statprof.reset(freq)
                 statprof.start(mechanism='thread')
                 try:
                     yield
                 finally:
                     data = statprof.stop()
                     profformat = ui.config('profiling', 'statformat', 'hotpath')
                     formats = {
                         'byline': statprof.DisplayFormats.ByLine,
                         'bymethod': statprof.DisplayFormats.ByMethod,
                         'hotpath': statprof.DisplayFormats.Hotpath,
                         'json': statprof.DisplayFormats.Json,
                     }
                     if profformat not in formats:
                         ui.warn(_('unknown profiler output format: %s\n') % profformat)
                         displayformat = statprof.DisplayFormats.Hotpath
                     else:
                         displayformat = formats[profformat]
                     statprof.display(fp, data=data, format=displayformat)
             @contextlib.contextmanager
             def profile(ui):
                 """Start profiling.
                 Profiling is active when the context manager is active. When the context
                 manager exits, profiling results will be written to the configured output.

                 The profiler is taken from the HGPROF environment variable, falling
                 back to the ``profiling.type`` config; unrecognized names are
                 reported and replaced by 'stat'. ``profiling.output`` selects the
                 destination: 'blackbox' sends the report through ui.log, any other
                 non-empty value is expanded and opened as a file, and an empty
                 value writes to ui.ferr.
                 """
                 # the environment variable takes precedence over the config
-                profiler = pycompat.osgetenv('HGPROF')
+                profiler = encoding.environ.get('HGPROF')
                 if profiler is None:
                     profiler = ui.config('profiling', 'type', default='stat')
                 if profiler not in ('ls', 'stat', 'flame'):
                     ui.warn(_("unrecognized profiler '%s' - ignored\n") % profiler)
                     profiler = 'stat'
                 output = ui.config('profiling', 'output')
                 if output == 'blackbox':
                     # buffer the report in memory; it is logged on exit
                     fp = util.stringio()
                 elif output:
                     path = ui.expandpath(output)
                     fp = open(path, 'wb')
                 else:
                     fp = ui.ferr
                 try:
                     if profiler == 'ls':
                         proffn = lsprofile
                     elif profiler == 'flame':
                         proffn = flameprofile
                     else:
                         proffn = statprofile
                     with proffn(ui, fp):
                         yield
                 finally:
                     # only streams created above are closed; when no output is
                     # configured fp is ui.ferr and is left open
                     if output:
                         if output == 'blackbox':
                             val = 'Profile:\n%s' % fp.getvalue()
                             # ui.log treats the input as a format string,
                             # so we need to escape any % signs.
                             val = val.replace('%', '%%')
                             ui.log('profile', val)
                         fp.close()
             @contextlib.contextmanager
             def maybeprofile(ui):
                 """Profile the wrapped block only when profiling is enabled.

                 Callers can wrap code unconditionally in this context manager:
                 when the ``profiling.enabled`` config is false the block simply
                 runs, otherwise it runs inside ``profile(ui)``. This keeps a
                 single code path at the call site.
                 """
                 if not ui.configbool('profiling', 'enabled'):
                     yield
                     return
                 with profile(ui):
                     yield

mercurial/pycompat.py

0 0 -2

             # pycompat.py - portability shim for python 3
             #
             # This software may be used and distributed according to the terms of the
             # GNU General Public License version 2 or any later version.
             """Mercurial portability shim for python 3.
             This contains aliases to hide python version-specific details from the core.
             """
             from __future__ import absolute_import
             import getopt
             import os
             import shlex
             import sys
             ispy3 = (sys.version_info[0] >= 3)
             if not ispy3:
                 import cPickle as pickle
                 import cStringIO as io
                 import httplib
                 import Queue as _queue
                 import SocketServer as socketserver
                 import urlparse
                 urlunquote = urlparse.unquote
                 import xmlrpclib
             else:
                 import http.client as httplib
                 import io
                 import pickle
                 import queue as _queue
                 import socketserver
                 import urllib.parse as urlparse
                 urlunquote = urlparse.unquote_to_bytes
                 import xmlrpc.client as xmlrpclib
             if ispy3:
                 import builtins
                 import functools
                 fsencode = os.fsencode
                 fsdecode = os.fsdecode
                 # A bytes version of os.name.
                 osname = os.name.encode('ascii')
                 ospathsep = os.pathsep.encode('ascii')
                 ossep = os.sep.encode('ascii')
                 osaltsep = os.altsep
-                osgetenv = os.getenvb
                 if osaltsep:
                     osaltsep = osaltsep.encode('ascii')
                 # os.getcwd() on Python 3 returns string, but it has os.getcwdb() which
                 # returns bytes.
                 getcwd = os.getcwdb
                 sysplatform = sys.platform.encode('ascii')
                 sysexecutable = sys.executable
                 if sysexecutable:
                     sysexecutable = os.fsencode(sysexecutable)
                 # TODO: .buffer might not exist if std streams were replaced; we'll need
                 # a silly wrapper to make a bytes stream backed by a unicode one.
                 stdin = sys.stdin.buffer
                 stdout = sys.stdout.buffer
                 stderr = sys.stderr.buffer
                 # Since Python 3 converts argv to wchar_t type by Py_DecodeLocale() on Unix,
                 # we can use os.fsencode() to get back bytes argv.
                 #
                 # https://hg.python.org/cpython/file/v3.5.1/Programs/python.c#l55
                 #
                 # TODO: On Windows, the native argv is wchar_t, so we'll need a different
                 # workaround to simulate the Python 2 (i.e. ANSI Win32 API) behavior.
                 sysargv = list(map(os.fsencode, sys.argv))
                 def sysstr(s):
                     """Convert ``s`` to the native str expected by Python functions
                     such as getattr() and str.encode()

                     Native strings are returned unchanged; anything else is decoded
                     as latin-1. That decoding never raises UnicodeDecodeError:
                     non-ascii bytes are treated as invalid and mapped to arbitrary
                     but unique code points, so 'sysstr(a) != sysstr(b)' holds for
                     all 'a != b'.
                     """
                     return s if isinstance(s, builtins.str) else s.decode(u'latin-1')
                 def _wrapattrfunc(f):
                     """Wrap an attribute builtin so its name argument goes through
                     sysstr() before ``f`` is called
                     """
                     def bytesnamewrapper(object, name, *args):
                         return f(object, sysstr(name), *args)
                     # copy f's metadata (name, docstring, ...) onto the wrapper
                     return functools.wraps(f)(bytesnamewrapper)
                 # these wrappers are automagically imported by hgloader
                 delattr = _wrapattrfunc(builtins.delattr)
                 getattr = _wrapattrfunc(builtins.getattr)
                 hasattr = _wrapattrfunc(builtins.hasattr)
                 setattr = _wrapattrfunc(builtins.setattr)
                 xrange = builtins.range
                 # getopt.getopt() on Python 3 deals with unicodes internally so we cannot
                 # pass bytes there. Passing unicodes will result in unicodes as return
                 # values which we need to convert again to bytes.
                 def getoptb(args, shortlist, namelist):
                     """bytes-in, bytes-out wrapper around getopt.getopt()

                     All inputs are decoded as latin-1 before the call, and the
                     parsed options and remaining arguments are encoded back the
                     same way.
                     """
                     uargs = [a.decode('latin-1') for a in args]
                     ushort = shortlist.decode('latin-1')
                     ulong = [n.decode('latin-1') for n in namelist]
                     uopts, urest = getopt.getopt(uargs, ushort, ulong)
                     opts = [(name.encode('latin-1'), value.encode('latin-1'))
                             for name, value in uopts]
                     rest = [a.encode('latin-1') for a in urest]
                     return opts, rest
                 # keys of keyword arguments in Python need to be strings which are unicodes
                 # in Python 3. This function takes keyword arguments and converts the keys
                 # to str.
                 def strkwargs(dic):
                     """Return a copy of ``dic`` with its bytes keys decoded to str

                     Keys are decoded as latin-1 so the result can be passed as
                     ``**kwargs`` on Python 3; values are left untouched.
                     """
                     # dict.iteritems() does not exist on Python 3, and this
                     # definition lives in the Python 3 only branch
                     dic = dict((k.decode('latin-1'), v) for k, v in dic.items())
                     return dic
                 # keys of keyword arguments need to be unicode while passing into
                 # a function. This function helps us to convert those keys back to bytes
                 # again as we need to deal with bytes.
                 def byteskwargs(dic):
                     """Return a copy of ``dic`` with its str keys encoded to bytes

                     Keys are encoded as latin-1, turning keyword-argument names
                     received by a function back into bytes; values are left
                     untouched.
                     """
                     # dict.iteritems() does not exist on Python 3, and this
                     # definition lives in the Python 3 only branch
                     dic = dict((k.encode('latin-1'), v) for k, v in dic.items())
                     return dic
                 # shlex.split() accepts unicodes on Python 3. This function takes bytes
                 # argument, convert it into unicodes, pass into shlex.split(), convert the
                 # returned value to bytes and return that.
                 # TODO: handle shlex.shlex().
                 def shlexsplit(s):
                     """Split the bytes string ``s`` with shlex.split(), returning bytes

                     The input is decoded as latin-1 for shlex and every resulting
                     token is encoded back as latin-1.
                     """
                     return [token.encode('latin-1')
                             for token in shlex.split(s.decode('latin-1'))]
             else:
                 def sysstr(s):
                     """Return ``s`` unchanged (variant used when not on Python 3)"""
                     return s
                 # Partial backport from os.py in Python 3, which only accepts bytes.
                 # In Python 2, our paths should only ever be bytes, a unicode path
                 # indicates a bug.
                 def fsencode(filename):
                     """Return ``filename`` unchanged if it is a str

                     Raises TypeError naming the offending type otherwise.
                     """
                     if not isinstance(filename, str):
                         raise TypeError(
                             "expect str, not %s" % type(filename).__name__)
                     return filename
                 # In Python 2, fsdecode() is very likely to receive bytes. So it's
                 # better not to touch the Python 2 part as it's already working fine.
                 def fsdecode(filename):
                     """Return ``filename`` unchanged; no decoding is performed here"""
                     return filename
                 def getoptb(args, shortlist, namelist):
                     """Call getopt.getopt() directly; no conversion is done here"""
                     return getopt.getopt(args, shortlist, namelist)
                 def strkwargs(dic):
                     """Return ``dic`` itself (not a copy); keys are not converted"""
                     return dic
                 def byteskwargs(dic):
                     """Return ``dic`` itself (not a copy); keys are not converted"""
                     return dic
                 osname = os.name
                 ospathsep = os.pathsep
                 ossep = os.sep
                 osaltsep = os.altsep
                 stdin = sys.stdin
                 stdout = sys.stdout
                 stderr = sys.stderr
                 sysargv = sys.argv
                 sysplatform = sys.platform
                 getcwd = os.getcwd
-                osgetenv = os.getenv
                 sysexecutable = sys.executable
                 shlexsplit = shlex.split
             stringio = io.StringIO
             empty = _queue.Empty
             queue = _queue.Queue
             class _pycompatstub(object):
                 """Namespace whose attributes are resolved lazily from other objects

                 Names are registered together with the object providing them and
                 are only looked up, then cached on the instance, the first time
                 they are accessed.
                 """

                 def __init__(self):
                     # alias name -> (origin object, attribute name on origin)
                     self._aliases = {}

                 def _registeraliases(self, origin, items):
                     """Add items that will be populated at the first access

                     Each item is exposed under its lower-cased name with
                     underscores removed.
                     """
                     for item in map(sysstr, items):
                         alias = item.replace(sysstr('_'), sysstr('')).lower()
                         self._aliases[alias] = (origin, item)

                 def __getattr__(self, name):
                     try:
                         origin, item = self._aliases[name]
                     except KeyError:
                         raise AttributeError(name)
                     # store the result in __dict__ so later accesses bypass
                     # __getattr__ entirely
                     resolved = getattr(origin, item)
                     self.__dict__[name] = resolved
                     return resolved
             httpserver = _pycompatstub()
             urlreq = _pycompatstub()
             urlerr = _pycompatstub()
             # Populate the lazy urlreq/urlerr/httpserver stubs with the names each
             # Python major version provides, so callers can use one spelling
             # (lower-cased, underscores removed) on both.
             if not ispy3:
                 import BaseHTTPServer
                 import CGIHTTPServer
                 import SimpleHTTPServer
                 import urllib2
                 import urllib
                 urlreq._registeraliases(urllib, (
                     "addclosehook",
                     "addinfourl",
                     "ftpwrapper",
                     "pathname2url",
                     "quote",
                     "splitattr",
                     "splitpasswd",
                     "splitport",
                     "splituser",
                     "unquote",
                     "url2pathname",
                     "urlencode",
                 ))
                 urlreq._registeraliases(urllib2, (
                     "AbstractHTTPHandler",
                     "BaseHandler",
                     "build_opener",
                     "FileHandler",
                     "FTPHandler",
                     "HTTPBasicAuthHandler",
                     "HTTPDigestAuthHandler",
                     "HTTPHandler",
                     "HTTPPasswordMgrWithDefaultRealm",
                     "HTTPSHandler",
                     "install_opener",
                     "ProxyHandler",
                     "Request",
                     "urlopen",
                 ))
                 urlerr._registeraliases(urllib2, (
                     "HTTPError",
                     "URLError",
                 ))
                 httpserver._registeraliases(BaseHTTPServer, (
                     "HTTPServer",
                     "BaseHTTPRequestHandler",
                 ))
                 httpserver._registeraliases(SimpleHTTPServer, (
                     "SimpleHTTPRequestHandler",
                 ))
                 httpserver._registeraliases(CGIHTTPServer, (
                     "CGIHTTPRequestHandler",
                 ))
             else:
                 import urllib.request
                 urlreq._registeraliases(urllib.request, (
                     "AbstractHTTPHandler",
                     "addclosehook",
                     "addinfourl",
                     "BaseHandler",
                     "build_opener",
                     "FileHandler",
                     "FTPHandler",
                     "ftpwrapper",
                     "HTTPHandler",
                     "HTTPSHandler",
                     "install_opener",
                     "pathname2url",
                     "HTTPBasicAuthHandler",
                     "HTTPDigestAuthHandler",
                     "HTTPPasswordMgrWithDefaultRealm",
                     "ProxyHandler",
                     "quote",
                     "Request",
                     "splitattr",
                     "splitpasswd",
                     "splitport",
                     "splituser",
                     "unquote",
                     "url2pathname",
                     "urlopen",
                 ))
                 import urllib.parse
                 # urlencode is registered in the Python 2 branch above but is not
                 # an attribute of urllib.request, so alias it from urllib.parse to
                 # keep urlreq.urlencode available on both versions.
                 urlreq._registeraliases(urllib.parse, (
                     "urlencode",
                 ))
                 import urllib.error
                 urlerr._registeraliases(urllib.error, (
                     "HTTPError",
                     "URLError",
                 ))
                 import http.server
                 httpserver._registeraliases(http.server, (
                     "HTTPServer",
                     "BaseHTTPRequestHandler",
                     "SimpleHTTPRequestHandler",
                     "CGIHTTPRequestHandler",
                 ))

mercurial/url.py

0 +3 -3

             # url.py - HTTP handling for mercurial
             #
             # Copyright 2005, 2006, 2007, 2008 Matt Mackall <mpm@selenic.com>
             # Copyright 2006, 2007 Alexis S. L. Carvalho <alexis@cecm.usp.br>
             # Copyright 2006 Vadim Gelfer <vadim.gelfer@gmail.com>
             #
             # This software may be used and distributed according to the terms of the
             # GNU General Public License version 2 or any later version.
             from __future__ import absolute_import
             import base64
             import os
             import socket
             from .i18n import _
             from . import (
+                encoding,
                 error,
                 httpconnection as httpconnectionmod,
                 keepalive,
-                pycompat,
                 sslutil,
                 util,
             )
             httplib = util.httplib
             stringio = util.stringio
             urlerr = util.urlerr
             urlreq = util.urlreq
             class passwordmgr(object):
                 """Password manager that falls back to auth config and prompting

                 Lookups are first delegated to ``passwddb``. When that does not
                 yield both a user and a password, ``readauthforuri`` is consulted
                 and, if credentials are still incomplete, the user is prompted.
                 """

                 def __init__(self, ui, passwddb):
                     self.ui = ui
                     self.passwddb = passwddb

                 def add_password(self, realm, uri, user, passwd):
                     return self.passwddb.add_password(realm, uri, user, passwd)

                 def find_user_password(self, realm, authuri):
                     """Return a (user, passwd) pair for ``authuri``

                     Aborts when credentials are missing and the ui is not
                     interactive. The resolved pair is stored back in passwddb.
                     """
                     user, passwd = self.passwddb.find_user_password(realm, authuri)
                     if user and passwd:
                         self._writedebug(user, passwd)
                         return (user, passwd)

                     # credentials are incomplete: look for a matching auth entry
                     res = httpconnectionmod.readauthforuri(self.ui, authuri, user)
                     if res:
                         group, auth = res
                         user, passwd = auth.get('username'), auth.get('password')
                         self.ui.debug("using auth.%s.* for authentication\n" % group)

                     if not (user and passwd):
                         # still incomplete: ask the user for the missing parts
                         authurl = util.url(authuri)
                         authurl.query = None
                         if not self.ui.interactive():
                             raise error.Abort(_('http authorization required for %s') %
                                              util.hidepassword(str(authurl)))
                         self.ui.write(_("http authorization required for %s\n") %
                                       util.hidepassword(str(authurl)))
                         self.ui.write(_("realm: %s\n") % realm)
                         if user:
                             self.ui.write(_("user: %s\n") % user)
                         else:
                             user = self.ui.prompt(_("user:"), default=None)
                         if not passwd:
                             passwd = self.ui.getpass()

                     self.passwddb.add_password(realm, authuri, user, passwd)
                     self._writedebug(user, passwd)
                     return (user, passwd)

                 def _writedebug(self, user, passwd):
                     msg = _('http auth: user %s, password %s\n')
                     # never log the password itself, only a mask of equal length
                     masked = '*' * len(passwd) if passwd else 'not set'
                     self.ui.debug(msg % (user, masked))

                 def find_stored_password(self, authuri):
                     return self.passwddb.find_user_password(None, authuri)
             class proxyhandler(urlreq.proxyhandler):
                 """Proxy handler configured from the ``http_proxy`` config section

                 The proxy URL comes from ``http_proxy.host`` or, failing that, the
                 ``http_proxy`` environment variable. Hosts listed in
                 ``http_proxy.no`` or the ``no_proxy`` environment variable (plus
                 localhost and 127.0.0.1) bypass the proxy unless
                 ``http_proxy.always`` is set.
                 """
                 def __init__(self, ui):
                     proxyurl = (ui.config("http_proxy", "host") or
-                                    pycompat.osgetenv('http_proxy'))
+                                    encoding.environ.get('http_proxy'))
                     # XXX proxyauthinfo = None
                     if proxyurl:
                         # proxy can be proper url or host[:port]
                         if not (proxyurl.startswith('http:') or
                                 proxyurl.startswith('https:')):
                             proxyurl = 'http://' + proxyurl + '/'
                         proxy = util.url(proxyurl)
                         # credentials embedded in the URL win over the config
                         if not proxy.user:
                             proxy.user = ui.config("http_proxy", "user")
                             proxy.passwd = ui.config("http_proxy", "passwd")
                         # see if we should use a proxy for this url
                         no_list = ["localhost", "127.0.0.1"]
                         no_list.extend([p.lower() for
                                         p in ui.configlist("http_proxy", "no")])
                         no_list.extend([p.strip().lower() for
-                                        p in pycompat.osgetenv("no_proxy", '').split(',')
+                                        p in encoding.environ.get("no_proxy", '').split(',')
                                         if p.strip()])
                         # "http_proxy.always" config is for running tests on localhost
                         if ui.configbool("http_proxy", "always"):
                             self.no_list = []
                         else:
                             self.no_list = no_list
                         proxyurl = str(proxy)
                         # the same proxy is used for both schemes
                         proxies = {'http': proxyurl, 'https': proxyurl}
                         ui.debug('proxying through http://%s:%s\n' %
                                   (proxy.host, proxy.port))
                     else:
                         # NOTE(review): self.no_list is only assigned in the branch
                         # above, while proxy_open() reads it unconditionally --
                         # presumably proxy_open() is never reached when proxies is
                         # empty; confirm.
                         proxies = {}
                     urlreq.proxyhandler.__init__(self, proxies)
                     self.ui = ui
                 def proxy_open(self, req, proxy, type_):
                     # compare on the host name only, without any ':port' suffix
                     host = req.get_host().split(':')[0]
                     for e in self.no_list:
                         # None is returned for excluded hosts instead of
                         # delegating to the base class
                         if host == e:
                             return None
                         # NOTE(review): these are plain suffix checks, so an entry
                         # such as '*.example.com' or '.example.com' also matches
                         # 'badexample.com' -- confirm this is intended.
                         if e.startswith('*.') and host.endswith(e[2:]):
                             return None
                         if e.startswith('.') and host.endswith(e[1:]):
                             return None
                     return urlreq.proxyhandler.proxy_open(self, req, proxy, type_)
             def _gen_sendfile(orgsend):
                 """Build a send() replacement that streams httpsendfile objects

                 Anything that is not an httpsendfile is handed to ``orgsend``
                 unchanged; an httpsendfile is rewound and sent chunk by chunk.
                 """
                 def _sendfile(self, data):
                     if not isinstance(data, httpconnectionmod.httpsendfile):
                         orgsend(self, data)
                         return
                     # send a file
                     # if auth required, some data sent twice, so rewind here
                     data.seek(0)
                     for chunk in util.filechunkiter(data):
                         orgsend(self, chunk)
                 return _sendfile
             has_https = util.safehasattr(urlreq, 'httpshandler')
             class httpconnection(keepalive.HTTPConnection):
                 """keepalive HTTP connection that can stream files and replay a
                 response stored in its ``proxyres`` attribute
                 """
                 # must be able to send big bundle as stream.
                 send = _gen_sendfile(keepalive.HTTPConnection.send)

                 def getresponse(self):
                     pending = getattr(self, 'proxyres', None)
                     if not pending:
                         return keepalive.HTTPConnection.getresponse(self)
                     # a stored response exists: hand it out once, then forget it
                     if pending.will_close:
                         self.close()
                     self.proxyres = None
                     return pending
             # general transaction handler to support different ways to handle
             # HTTPS proxying before and after Python 2.6.3.
             def _generic_start_transaction(handler, h, req):
                 """Set ``h.realhostport`` and ``h.headers`` for request ``req``

                 Both are filled in when the request carries a ``_tunnel_host``,
                 or when its selector equals its full URL and the scheme is https.
                 Otherwise both are set to None.
                 """
                 target = getattr(req, '_tunnel_host', None)
                 tunneling = bool(target)
                 if tunneling:
                     if target[:7] not in ('http://', 'https:/'):
                         target = 'https://' + target
                 else:
                     target = req.get_selector()
                 if tunneling or target == req.get_full_url(): # has proxy
                     parsed = util.url(target)
                     if tunneling or parsed.scheme == 'https': # only use CONNECT for HTTPS
                         h.realhostport = ':'.join([parsed.host, (parsed.port or '443')])
                         h.headers = req.headers.copy()
                         h.headers.update(handler.parent.addheaders)
                         return
                 h.realhostport = None
                 h.headers = None
             def _generic_proxytunnel(self):
                 '''Open a CONNECT tunnel to self.realhostport over self.sock.

                 Sends a CONNECT request followed by every header of self.headers
                 whose name starts with "proxy-" (case-insensitively), then parses
                 the proxy's reply by hand.

                 Returns True when the proxy answers 200; the rest of the reply
                 headers is consumed first so that the socket is positioned at the
                 start of the tunnelled stream.

                 Returns False otherwise.  For anything but an HTTP/0.9 reply the
                 parsed response object is also stored in self.proxyres.

                 Raises httplib.UnknownProtocol when the status line carries an
                 unrecognised HTTP version.
                 '''
                 proxyheaders = dict(
                         [(x, self.headers[x]) for x in self.headers
                          if x.lower().startswith('proxy-')])
                 self.send('CONNECT %s HTTP/1.0\r\n' % self.realhostport)
                 # items() rather than iteritems(): same pairs, and it also exists
                 # on Python 3 dictionaries
                 for header in proxyheaders.items():
                     self.send('%s: %s\r\n' % header)
                 self.send('\r\n')
                 # majority of the following code is duplicated from
                 # httplib.HTTPConnection as there are no adequate places to
                 # override functions to provide the needed functionality
                 res = self.response_class(self.sock,
                                           strict=self.strict,
                                           method=self._method)
                 while True:
                     version, status, reason = res._read_status()
                     if status != httplib.CONTINUE:
                         break
                     # discard the rest of the interim "100 Continue" reply, up to
                     # and including its terminating blank line
                     list(iter(lambda: res.fp.readline().strip(), ''))
                 res.status = status
                 res.reason = reason.strip()
                 if res.status == 200:
                     # skip lines until we find a blank line
                     list(iter(res.fp.readline, '\r\n'))
                     return True
                 # the tunnel was refused: finish parsing the reply
                 if version == 'HTTP/1.0':
                     res.version = 10
                 elif version.startswith('HTTP/1.'):
                     res.version = 11
                 elif version == 'HTTP/0.9':
                     res.version = 9
                 else:
                     raise httplib.UnknownProtocol(version)
                 if res.version == 9:
                     # HTTP/0.9 replies have no headers at all
                     res.length = None
                     res.chunked = 0
                     res.will_close = 1
                     res.msg = httplib.HTTPMessage(stringio())
                     return False
                 res.msg = httplib.HTTPMessage(res.fp)
                 res.msg.fp = None
                 # are we using the chunked-style of transfer encoding?
                 trenc = res.msg.getheader('transfer-encoding')
                 if trenc and trenc.lower() == "chunked":
                     res.chunked = 1
                     res.chunk_left = None
                 else:
                     res.chunked = 0
                 # will the connection close at the end of the response?
                 res.will_close = res._check_close()
                 # do we have a Content-Length?
                 # NOTE: RFC 2616, section 4.4, #3 says we ignore this if
                 # transfer-encoding is "chunked"
                 length = res.msg.getheader('content-length')
                 if length and not res.chunked:
                     try:
                         res.length = int(length)
                     except ValueError:
                         res.length = None
                     else:
                         if res.length < 0:  # ignore nonsensical negative lengths
                             res.length = None
                 else:
                     res.length = None
                 # does the body have a fixed length? (of zero)
                 if (status == httplib.NO_CONTENT or status == httplib.NOT_MODIFIED or
                     100 <= status < 200 or # 1xx codes
                     res._method == 'HEAD'):
                     res.length = 0
                 # if the connection remains open, and we aren't using chunked, and
                 # a content-length was not provided, then assume that the connection
                 # WILL close.
                 if (not res.will_close and
                    not res.chunked and
                    res.length is None):
                     res.will_close = 1
                 self.proxyres = res
                 return False
             class httphandler(keepalive.HTTPHandler):
                 '''keepalive HTTP handler that opens requests with httpconnection.'''

                 def _start_transaction(self, h, req):
                     # run the shared per-request setup on the connection before
                     # delegating to the keepalive implementation
                     _generic_start_transaction(self, h, req)
                     base = keepalive.HTTPHandler
                     return base._start_transaction(self, h, req)

                 def http_open(self, req):
                     return self.do_open(httpconnection, req)
             if has_https:
                 class httpsconnection(httplib.HTTPConnection):
                     '''HTTPS connection whose socket is wrapped through sslutil.

                     connect() reads self.realhostport and self.ui, neither of which
                     is set by __init__; they are expected to be assigned on the
                     instance before connecting.
                     '''
                     response_class = keepalive.HTTPResponse
                     default_port = httplib.HTTPS_PORT
                     # must be able to send big bundle as stream.
                     send = _gen_sendfile(keepalive.safesend)
                     getresponse = keepalive.wrapgetresponse(httplib.HTTPConnection)

                     def __init__(self, host, port=None, key_file=None, cert_file=None,
                                  *args, **kwargs):
                         httplib.HTTPConnection.__init__(self, host, port, *args, **kwargs)
                         self.key_file, self.cert_file = key_file, cert_file

                     def connect(self):
                         self.sock = socket.create_connection((self.host, self.port))
                         if self.realhostport:
                             # use CONNECT proxy; the certificate must then match
                             # the real target host, not the proxy we dialled
                             _generic_proxytunnel(self)
                             servername = self.realhostport.rsplit(':', 1)[0]
                         else:
                             servername = self.host
                         self.sock = sslutil.wrapsocket(
                             self.sock, self.key_file, self.cert_file, ui=self.ui,
                             serverhostname=servername)
                         sslutil.validatesocket(self.sock)
                 class httpshandler(keepalive.KeepAliveHandler, urlreq.httpshandler):
                     '''keepalive HTTPS handler that builds httpsconnection objects,
                     preferring key/cert files from a matching auth entry.'''

                     def __init__(self, ui):
                         keepalive.KeepAliveHandler.__init__(self)
                         urlreq.httpshandler.__init__(self)
                         self.ui = ui
                         self.pwmgr = passwordmgr(ui, ui.httppasswordmgrdb)

                     def _start_transaction(self, h, req):
                         _generic_start_transaction(self, h, req)
                         base = keepalive.KeepAliveHandler
                         return base._start_transaction(self, h, req)

                     def https_open(self, req):
                         # req.get_full_url() does not contain credentials and we may
                         # need them to match the certificates.
                         url = req.get_full_url()
                         user, _password = self.pwmgr.find_stored_password(url)
                         found = httpconnectionmod.readauthforuri(self.ui, url, user)
                         if not found:
                             self.auth = None
                         else:
                             group, self.auth = found
                             self.ui.debug("using auth.%s.* for authentication\n" % group)
                         return self.do_open(self._makeconnection, req)

                     def _makeconnection(self, host, port=None, *args, **kwargs):
                         # the first two extra positional arguments, when present,
                         # are key_file and cert_file
                         keyfile = args[0] if len(args) >= 1 else None
                         certfile = args[1] if len(args) >= 2 else None
                         remaining = args[2:]
                         # if the user has specified different key/cert files in
                         # hgrc, we prefer these
                         auth = self.auth
                         if auth and 'key' in auth and 'cert' in auth:
                             keyfile, certfile = auth['key'], auth['cert']
                         conn = httpsconnection(host, port, keyfile, certfile,
                                                *remaining, **kwargs)
                         conn.ui = self.ui
                         return conn
             class httpdigestauthhandler(urlreq.httpdigestauthhandler):
                 '''Digest auth handler that resets its retry counter once per
                 request rather than through reset_retry_count().'''

                 def __init__(self, *args, **kwargs):
                     urlreq.httpdigestauthhandler.__init__(self, *args, **kwargs)
                     # request for which self.retried was last reset
                     self.retried_req = None

                 def reset_retry_count(self):
                     # Python 2.6.5 will call this on 401 or 407 errors and thus loop
                     # forever. We disable reset_retry_count completely and reset in
                     # http_error_auth_reqed instead.
                     pass

                 def http_error_auth_reqed(self, auth_header, host, req, headers):
                     # Reset the retry counter once for each request.
                     newrequest = req is not self.retried_req
                     if newrequest:
                         self.retried_req = req
                         self.retried = 0
                     base = urlreq.httpdigestauthhandler
                     return base.http_error_auth_reqed(
                         self, auth_header, host, req, headers)
             class httpbasicauthhandler(urlreq.httpbasicauthhandler):
                 '''Basic auth handler that remembers the last Authorization value
                 it sent and attaches it to later requests.'''

                 def __init__(self, *args, **kwargs):
                     # last 'Basic ...' header value that was sent, if any
                     self.auth = None
                     urlreq.httpbasicauthhandler.__init__(self, *args, **kwargs)
                     self.retried_req = None

                 def http_request(self, request):
                     if self.auth:
                         request.add_unredirected_header(self.auth_header, self.auth)
                     return request

                 # https requests get exactly the same treatment
                 https_request = http_request

                 def reset_retry_count(self):
                     # Python 2.6.5 will call this on 401 or 407 errors and thus loop
                     # forever. We disable reset_retry_count completely and reset in
                     # http_error_auth_reqed instead.
                     pass

                 def http_error_auth_reqed(self, auth_header, host, req, headers):
                     # Reset the retry counter once for each request.
                     newrequest = req is not self.retried_req
                     if newrequest:
                         self.retried_req = req
                         self.retried = 0
                     base = urlreq.httpbasicauthhandler
                     return base.http_error_auth_reqed(
                         self, auth_header, host, req, headers)

                 def retry_http_basic_auth(self, host, req, realm):
                     user, pw = self.passwd.find_user_password(realm, req.get_full_url())
                     if pw is None:
                         return None
                     raw = "%s:%s" % (user, pw)
                     auth = 'Basic %s' % base64.b64encode(raw).strip()
                     if req.get_header(self.auth_header, None) == auth:
                         # these exact credentials were already sent with this
                         # request; do not retry with them
                         return None
                     self.auth = auth
                     req.add_unredirected_header(self.auth_header, auth)
                     return self.parent.open(req)
             # Extra handler factories. opener() calls every entry as
             # h(ui, passmgr) and adds the returned handler to the ones it builds.
             handlerfuncs = []
             def opener(ui, authinfo=None):
                 '''
                 construct an opener suitable for urllib2

                 authinfo, when given, is a (realm, uris, user, passwd) tuple; it is
                 added to the password manager unless it names the already stored
                 user without supplying a password
                 '''
                 # experimental config: ui.usehttp2
                 usehttp2 = ui.configbool('ui', 'usehttp2', False)
                 if usehttp2:
                     h2passmgr = passwordmgr(ui, ui.httppasswordmgrdb)
                     chain = [httpconnectionmod.http2handler(ui, h2passmgr)]
                 else:
                     chain = [httphandler()]
                     if has_https:
                         chain.append(httpshandler(ui))
                 chain.append(proxyhandler(ui))

                 pwmgr = passwordmgr(ui, ui.httppasswordmgrdb)
                 if authinfo is not None:
                     realm, uris, user, passwd = authinfo
                     saveduser, savedpass = pwmgr.find_stored_password(uris[0])
                     if user != saveduser or passwd:
                         pwmgr.add_password(realm, uris, user, passwd)
                     # never write the password itself to the debug output
                     masked = '*' * len(passwd) if passwd else 'not set'
                     ui.debug('http auth: user %s, password %s\n' % (user, masked))

                 chain.append(httpbasicauthhandler(pwmgr))
                 chain.append(httpdigestauthhandler(pwmgr))
                 for makehandler in handlerfuncs:
                     chain.append(makehandler(ui, pwmgr))
                 director = urlreq.buildopener(*chain)

                 # The user agent should *NOT* be used by servers for e.g.
                 # protocol detection or feature negotiation: there are other
                 # facilities for that.
                 #
                 # "mercurial/proto-1.0" was the original user agent string and
                 # exists for backwards compatibility reasons.
                 #
                 # The "(Mercurial %s)" string contains the distribution
                 # name and version. Other client implementations should choose their
                 # own distribution name. Since servers should not be using the user
                 # agent string for anything, clients should be able to define whatever
                 # user agent they deem appropriate.
                 agent = 'mercurial/proto-1.0 (Mercurial %s)' % util.version()
                 director.addheaders = [
                     ('User-agent', agent),
                     # This header should only be needed by wire protocol requests.
                     # But it has been sent on all requests since forever. We keep
                     # sending it for backwards compatibility reasons. Modern
                     # versions of the wire protocol use X-HgProto-<N> for
                     # advertising client support.
                     ('Accept', 'application/mercurial-0.1'),
                 ]
                 return director
             def open(ui, url_, data=None):
                 '''open url_ (a URL, or a local path when it has no scheme) through
                 opener() and return the result of the opener's open() call

                 data is passed through unchanged to that open() call.
                 '''
                 parsed = util.url(url_)
                 if not parsed.scheme:
                     # no scheme: treat url_ as a filesystem path
                     localpath = util.normpath(os.path.abspath(url_))
                     target = 'file://' + urlreq.pathname2url(localpath)
                     authinfo = None
                 else:
                     parsed.scheme = parsed.scheme.lower()
                     target, authinfo = parsed.authinfo()
                 return opener(ui, authinfo).open(target, data)

General Comments 0

Write
Preview

You need to be logged in to leave comments. Login now

No TODOs yet

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages