##// END OF EJS Templates
narrow: don't hexify paths and double-hexify known nodes on wire (BC)...
narrow: don't hexify paths and double-hexify known nodes on wire (BC) It isn't obvious, but wireprototypes.encodelist() is meant only for binary nodeids. So when we used it for encoding hex nodeids and paths, the encoded result was surprising and hard to read. This patch changes the encoding to make the list of paths a comma-separated list and the list of common nodes to be an encodelist()-encoded list of binary nodeids (so the result is just singly-hexified nodeids). This is clearly a breaking change, but the feature is experimental and we're not aware of anyone running a server using this command yet. Differential Revision: https://phab.mercurial-scm.org/D6851

File last commit:

r42583:c2deb251 default
r43214:c2676b5a default
Show More
testparseutil.py
620 lines | 19.5 KiB | text/x-python | PythonLexer
FUJIWARA Katsunori
contrib: add an utility module to parse test scripts...
r40129 # testparseutil.py - utilities to parse test script for check tools
#
# Copyright 2018 FUJIWARA Katsunori <foozy@lares.dti.ne.jp> and others
#
# This software may be used and distributed according to the terms of the
# GNU General Public License version 2 or any later version.
from __future__ import absolute_import, print_function
import abc
import re
import sys
####################
# for Python3 compatibility (almost comes from mercurial/pycompat.py)
# True when running under Python 3 or later
ispy3 = sys.version_info[0] >= 3


def identity(a):
    """Return ``a`` itself, untouched (a no-op conversion function)"""
    return a
def _rapply(f, xs):
    """Apply ``f`` to each leaf value of ``xs``, recursing into containers

    ``None`` is returned as is.  A list, set or tuple is rebuilt as the
    same type from its converted elements.  A dict is rebuilt as the same
    type with both keys and values converted.  Any other value is passed
    to ``f`` directly and the result is returned.
    """
    if xs is None:
        # assume None means non-value of optional data
        return xs
    container = type(xs)
    if isinstance(xs, (list, set, tuple)):
        return container(_rapply(f, item) for item in xs)
    if isinstance(xs, dict):
        return container((_rapply(f, key), _rapply(f, value))
                         for key, value in xs.items())
    return f(xs)
def rapply(f, xs):
    """Convert ``xs`` recursively with ``f`` (see ``_rapply``)

    When ``f`` is the ``identity`` function, ``xs`` is returned as is
    without being traversed.
    """
    # fast path mainly for py2: converting with identity changes nothing
    return xs if f is identity else _rapply(f, xs)
if ispy3:
    import builtins

    def bytestr(s):
        """Encode ``s`` as latin-1 (tiny version of pycompat.bytestr)"""
        return s.encode('latin1')

    def sysstr(s):
        """Return ``s`` as a native str, decoding it as latin-1 if needed"""
        return s if isinstance(s, builtins.str) else s.decode(u'latin-1')

    def opentext(f):
        """Open the file ``f`` for reading in text mode"""
        return open(f, mode='r')
else:
    # on py2, native str is already the type to be handled
    bytestr = str
    sysstr = identity
    opentext = open
def b2s(x):
    """Convert BYTES elements in ``x`` to SYSSTR recursively"""
    converted = rapply(sysstr, x)
    return converted
def writeout(data):
    """Write ``data`` into stdout"""
    stream = sys.stdout
    stream.write(data)
FUJIWARA Katsunori
contrib: add an utility module to parse test scripts...
r40129
def writeerr(data):
    """Write ``data`` into stderr"""
    stream = sys.stderr
    stream.write(data)
FUJIWARA Katsunori
contrib: add an utility module to parse test scripts...
r40129
####################
class embeddedmatcher(object):
    """Interface of objects detecting embedded code fragments in *.t files

    "embedded()" drives objects of this type line by line: "startsat()"
    decides whether a fragment begins, and the value it returns is handed
    back as 'ctx' to all other methods while that fragment is examined.
    """
    # NOTE: a "__metaclass__" class attribute is honored only by Python 2
    __metaclass__ = abc.ABCMeta

    def __init__(self, desc):
        # description of this matcher, shown in error messages
        self.desc = desc

    @abc.abstractmethod
    def startsat(self, line):
        """Tell whether embedded code begins at line

        Any object may be returned. A true value means "starts here",
        and it is passed as 'ctx' to subsequent method invocations.
        """

    @abc.abstractmethod
    def endsat(self, ctx, line):
        """Tell whether embedded code is terminated at line"""

    @abc.abstractmethod
    def isinside(self, ctx, line):
        """Tell whether line belongs to embedded code

        This is asked only for a line, at which endsat() was false.
        """

    @abc.abstractmethod
    def ignores(self, ctx):
        """Tell whether detected embedded code should be skipped"""

    @abc.abstractmethod
    def filename(self, ctx):
        """Return the name of the file, into which embedded code goes

        None is returned, if embedded code has no explicit filename.
        """

    @abc.abstractmethod
    def codeatstart(self, ctx, line):
        """Return the code put on the start line of embedded code

        None is returned, if the start line carries no actual code.
        """

    @abc.abstractmethod
    def codeatend(self, ctx, line):
        """Return the code put on the end line of embedded code

        None is returned, if the end line carries no actual code.
        """

    @abc.abstractmethod
    def codeinside(self, ctx, line):
        """Return the code put on a line inside embedded code"""
def embedded(basefile, lines, errors, matchers):
    """Extract embedded code fragments from given lines

    This is the parsing logic shared by all kinds of embedded code. Each
    line is offered to the given matchers; once exactly one of them
    reports a start, following lines are collected by that matcher until
    it reports the end.

    :basefile: a name of a file, from which lines to be parsed come.
    :lines: to be parsed (might be a value returned by "open(basefile)")
    :errors: an array, into which messages for detected error are stored
    :matchers: an array of embeddedmatcher objects

    This function yields '(filename, starts, ends, code)' tuple.

    :filename: a name of embedded code, if it is explicitly specified
               (e.g. "foobar" of "cat >> foobar <<EOF").
               Otherwise, this is None
    :starts: line number (1-origin), at which embedded code starts (inclusive)
    :ends: line number (1-origin), at which embedded code ends (exclusive)
    :code: extracted embedded code, which is single-stringified

    >>> class ambigmatcher(object):
    ...     # mock matcher class to examine implementation of
    ...     # "ambiguous matching" corner case
    ...     def __init__(self, desc, matchfunc):
    ...         self.desc = desc
    ...         self.matchfunc = matchfunc
    ...     def startsat(self, line):
    ...         return self.matchfunc(line)
    >>> ambig1 = ambigmatcher('ambiguous #1',
    ...                       lambda l: l.startswith(' $ cat '))
    >>> ambig2 = ambigmatcher('ambiguous #2',
    ...                       lambda l: l.endswith('<< EOF\\n'))
    >>> lines = [' $ cat > foo.py << EOF\\n']
    >>> errors = []
    >>> matchers = [ambig1, ambig2]
    >>> list(t for t in embedded('<dummy>', lines, errors, matchers))
    []
    >>> b2s(errors)
    ['<dummy>:1: ambiguous line for "ambiguous #1", "ambiguous #2"']
    """
    active = None  # matcher collecting the current fragment, if any
    ctx = filename = chunks = startline = None  # for pyflakes

    for lineno, line in enumerate(lines, 1):
        if not line.endswith('\n'):
            line += '\n'  # to normalize EOF line

        if active:  # now, inside embedded code
            if active.endsat(ctx, line):
                tail = active.codeatend(ctx, line)
                if tail is not None:
                    chunks.append(tail)
                if not active.ignores(ctx):
                    yield (filename, startline, lineno, ''.join(chunks))
                active = None
                # fall through, because line might start next fragment
            elif active.isinside(ctx, line):
                chunks.append(active.codeinside(ctx, line))
                continue
            else:
                # this is an error of basefile
                # (if matchers are implemented correctly)
                message = ('%s:%d: unexpected line for "%s"'
                           % (basefile, lineno, active.desc))
                errors.append(message)
                # give up the current fragment, because an unexpected
                # line might mean that the expected end-of-embedded-code
                # line never appears
                active = None
                # fall through, because line might start next fragment

        # from here, examine whether current line starts embedded code
        assert not active

        candidates = []
        for m in matchers:
            found = m.startsat(line)
            if found:
                candidates.append((m, found))

        if not candidates:
            continue

        if len(candidates) > 1:
            # this is an error of matchers, maybe
            descs = ', '.join(['"%s"' % m.desc for m, _c in candidates])
            errors.append('%s:%d: ambiguous line for %s'
                          % (basefile, lineno, descs))
            # omit extracting embedded code, because choosing
            # arbitrary matcher from matched ones might fail to
            # detect the end of embedded code as expected.
            continue

        active, ctx = candidates[0]
        filename = active.filename(ctx)
        chunks = []
        head = active.codeatstart(ctx, line)
        if head is None:
            # the start line carries no code: code begins at the next line
            startline = lineno + 1
        else:
            chunks.append(head)
            startline = lineno

    if not active:
        return

    # embedded code isn't yet ended explicitly, so examine whether EOF
    # ends it
    if active.endsat(ctx, '\n'):
        tail = active.codeatend(ctx, '\n')
        if tail is not None:
            chunks.append(tail)
        if not active.ignores(ctx):
            yield (filename, startline, lineno + 1, ''.join(chunks))
    else:
        # this is an error of basefile
        # (if matchers are implemented correctly)
        errors.append('%s:%d: unexpected end of file for "%s"'
                      % (basefile, lineno, active.desc))
# heredoc limit mark to ignore embedded code at check-code.py or so
heredocignorelimit = 'NO_CHECK_EOF'

# the pattern to match against cases below, and to return a limit mark
# string as 'limit' group (the optional quote around it is captured as
# 'lquote' group, and the same quote is required after the mark)
#
# - << LIMITMARK
# - << "LIMITMARK"
# - << 'LIMITMARK'
heredoclimitpat = r'\s*<<\s*(?P<lquote>["\']?)(?P<limit>\w+)(?P=lquote)'
FUJIWARA Katsunori
contrib: add an utility module to parse test scripts...
r40129
class fileheredocmatcher(embeddedmatcher):
    """Detect "cat > FILE << LIMIT" style embedded code

    The 'ctx' of this matcher is a (filename, END-LINE-OF-EMBEDDED-CODE)
    tuple.

    >>> matcher = fileheredocmatcher('heredoc .py file', r'[^<]+\\.py')
    >>> b2s(matcher.startsat(' $ cat > file.py << EOF\\n'))
    ('file.py', ' > EOF\\n')
    >>> b2s(matcher.startsat(' $ cat >>file.py <<EOF\\n'))
    ('file.py', ' > EOF\\n')
    >>> b2s(matcher.startsat(' $ cat> \\x27any file.py\\x27<< "EOF"\\n'))
    ('any file.py', ' > EOF\\n')
    >>> b2s(matcher.startsat(" $ cat > file.py << 'ANYLIMIT'\\n"))
    ('file.py', ' > ANYLIMIT\\n')
    >>> b2s(matcher.startsat(' $ cat<<ANYLIMIT>"file.py"\\n'))
    ('file.py', ' > ANYLIMIT\\n')
    >>> start = ' $ cat > file.py << EOF\\n'
    >>> ctx = matcher.startsat(start)
    >>> matcher.codeatstart(ctx, start)
    >>> b2s(matcher.filename(ctx))
    'file.py'
    >>> matcher.ignores(ctx)
    False
    >>> inside = ' > foo = 1\\n'
    >>> matcher.endsat(ctx, inside)
    False
    >>> matcher.isinside(ctx, inside)
    True
    >>> b2s(matcher.codeinside(ctx, inside))
    'foo = 1\\n'
    >>> end = ' > EOF\\n'
    >>> matcher.endsat(ctx, end)
    True
    >>> matcher.codeatend(ctx, end)
    >>> matcher.endsat(ctx, ' > EOFEOF\\n')
    False
    >>> ctx = matcher.startsat(' $ cat > file.py << NO_CHECK_EOF\\n')
    >>> matcher.ignores(ctx)
    True
    """
    # leading text of every line belonging to the heredoc
    _prefix = ' > '

    def __init__(self, desc, namepat):
        """Set up patterns detecting a heredoc into a file matching namepat

        :desc: description of this matcher
        :namepat: regexp (as a string) matching against the target filename
        """
        super(fileheredocmatcher, self).__init__(desc)

        # build the pattern to match against cases below (and ">>"
        # variants), and to return a target filename string as 'name'
        # group
        #
        # - > NAMEPAT
        # - > "NAMEPAT"
        # - > 'NAMEPAT'
        namepat = (r'\s*>>?\s*(?P<nquote>["\']?)(?P<name>%s)(?P=nquote)'
                   % namepat)
        # "cat > NAME << LIMIT" case
        namefirst = re.compile(r' \$ \s*cat' + namepat + heredoclimitpat)
        # "cat << LIMIT > NAME" case
        limitfirst = re.compile(r' \$ \s*cat' + heredoclimitpat + namepat)
        self._fileres = [namefirst, limitfirst]

    def startsat(self, line):
        """Return ctx if line starts a heredoc into a file, or None"""
        for pattern in self._fileres:
            hit = pattern.match(line)
            if hit is None:
                continue
            return (hit.group('name'),
                    ' > %s\n' % hit.group('limit'))
        return None

    def endsat(self, ctx, line):
        """Tell whether line is exactly the end line held in ctx"""
        return line == ctx[1]

    def isinside(self, ctx, line):
        """Tell whether line has the prefix of a heredoc line"""
        return line.startswith(self._prefix)

    def ignores(self, ctx):
        """Tell whether the limit mark is the one meaning "do not check\""""
        return ctx[1] == ' > %s\n' % heredocignorelimit

    def filename(self, ctx):
        """Return the filename held in ctx"""
        return ctx[0]

    def codeatstart(self, ctx, line):
        """Return None, because there is no embedded code at start line"""
        return None

    def codeatend(self, ctx, line):
        """Return None, because there is no embedded code at end line"""
        return None

    def codeinside(self, ctx, line):
        """Return line without the heredoc prefix"""
        skip = len(self._prefix)
        return line[skip:]
####
# for embedded python script
class pydoctestmatcher(embeddedmatcher):
    """Detect ">>> code" style embedded python code

    The 'ctx' of this matcher is just True.

    >>> matcher = pydoctestmatcher()
    >>> startline = ' >>> foo = 1\\n'
    >>> matcher.startsat(startline)
    True
    >>> matcher.startsat(' ... foo = 1\\n')
    False
    >>> ctx = matcher.startsat(startline)
    >>> matcher.filename(ctx)
    >>> matcher.ignores(ctx)
    False
    >>> b2s(matcher.codeatstart(ctx, startline))
    'foo = 1\\n'
    >>> inside = ' >>> foo = 1\\n'
    >>> matcher.endsat(ctx, inside)
    False
    >>> matcher.isinside(ctx, inside)
    True
    >>> b2s(matcher.codeinside(ctx, inside))
    'foo = 1\\n'
    >>> inside = ' ... foo = 1\\n'
    >>> matcher.endsat(ctx, inside)
    False
    >>> matcher.isinside(ctx, inside)
    True
    >>> b2s(matcher.codeinside(ctx, inside))
    'foo = 1\\n'
    >>> inside = ' expected output\\n'
    >>> matcher.endsat(ctx, inside)
    False
    >>> matcher.isinside(ctx, inside)
    True
    >>> b2s(matcher.codeinside(ctx, inside))
    '\\n'
    >>> inside = ' \\n'
    >>> matcher.endsat(ctx, inside)
    False
    >>> matcher.isinside(ctx, inside)
    True
    >>> b2s(matcher.codeinside(ctx, inside))
    '\\n'
    >>> end = ' $ foo bar\\n'
    >>> matcher.endsat(ctx, end)
    True
    >>> matcher.codeatend(ctx, end)
    >>> end = '\\n'
    >>> matcher.endsat(ctx, end)
    True
    >>> matcher.codeatend(ctx, end)
    """
    # a fragment begins only at a line with this prefix
    _prefix = ' >>> '
    # a code line inside a fragment has either of these prefixes
    _prefixre = re.compile(r' (>>>|\.\.\.) ')

    # If a line matches against not _prefixre but _outputre, that line
    # is "an expected output line" (= not a part of code fragment).
    #
    # Strictly speaking, a line matching against "(#if|#else|#endif)"
    # is also treated similarly in "inline python code" semantics by
    # run-tests.py. But "directive line inside inline python code"
    # should be rejected by Mercurial reviewers. Therefore, this
    # regexp does not match against such directive lines.
    _outputre = re.compile(r' $| [^$]')

    def __init__(self):
        super(pydoctestmatcher, self).__init__("doctest style python code")

    def startsat(self, line):
        """Tell whether line begins with the doctest prompt (ctx is True)"""
        return line.startswith(self._prefix)

    def endsat(self, ctx, line):
        """Tell whether line is neither a code line nor an output line"""
        return not self._prefixre.match(line) and not self._outputre.match(line)

    def isinside(self, ctx, line):
        """Return True always, because this is asked only if not yet ended"""
        return True

    def ignores(self, ctx):
        """Return False, because this kind of code should be checked always"""
        return False

    def filename(self, ctx):
        """Return None, because there is no filename for this kind of code"""
        return None

    def codeatstart(self, ctx, line):
        """Return line without its prefix (' >>> '/' ... ')"""
        skip = len(self._prefix)
        return line[skip:]

    def codeatend(self, ctx, line):
        """Return None, because there is no embedded code at end line"""
        return None

    def codeinside(self, ctx, line):
        """Return the code on line, or an empty line for an output line"""
        if not self._prefixre.match(line):
            # an expected output line is treated as an empty line
            return '\n'
        # strip prefix ' >>> '/' ... '
        return line[len(self._prefix):]
FUJIWARA Katsunori
contrib: add an utility module to parse test scripts...
r40129
class pyheredocmatcher(embeddedmatcher):
    """Detect "python << LIMIT" style embedded python code

    The 'ctx' of this matcher is END-LINE-OF-EMBEDDED-CODE.

    >>> matcher = pyheredocmatcher()
    >>> b2s(matcher.startsat(' $ python << EOF\\n'))
    ' > EOF\\n'
    >>> b2s(matcher.startsat(' $ $PYTHON <<EOF\\n'))
    ' > EOF\\n'
    >>> b2s(matcher.startsat(' $ "$PYTHON"<< "EOF"\\n'))
    ' > EOF\\n'
    >>> b2s(matcher.startsat(" $ $PYTHON << 'ANYLIMIT'\\n"))
    ' > ANYLIMIT\\n'
    >>> matcher.startsat(' $ "$PYTHON" < EOF\\n')
    >>> start = ' $ python << EOF\\n'
    >>> ctx = matcher.startsat(start)
    >>> matcher.codeatstart(ctx, start)
    >>> matcher.filename(ctx)
    >>> matcher.ignores(ctx)
    False
    >>> inside = ' > foo = 1\\n'
    >>> matcher.endsat(ctx, inside)
    False
    >>> matcher.isinside(ctx, inside)
    True
    >>> b2s(matcher.codeinside(ctx, inside))
    'foo = 1\\n'
    >>> end = ' > EOF\\n'
    >>> matcher.endsat(ctx, end)
    True
    >>> matcher.codeatend(ctx, end)
    >>> matcher.endsat(ctx, ' > EOFEOF\\n')
    False
    >>> ctx = matcher.startsat(' $ python << NO_CHECK_EOF\\n')
    >>> matcher.ignores(ctx)
    True
    """
    # leading text of every line belonging to the heredoc
    _prefix = ' > '

    # python invocation followed (not necessarily immediately) by a
    # heredoc limit mark
    _startre = re.compile(r' \$ (\$PYTHON|"\$PYTHON"|python).*' +
                          heredoclimitpat)

    def __init__(self):
        super(pyheredocmatcher, self).__init__("heredoc python invocation")

    def startsat(self, line):
        """Return ctx if line invokes python with a heredoc, or None"""
        hit = self._startre.match(line)
        if hit is None:
            return None
        return ' > %s\n' % hit.group('limit')

    def endsat(self, ctx, line):
        """Tell whether line is exactly the end line held as ctx"""
        return line == ctx

    def isinside(self, ctx, line):
        """Tell whether line has the prefix of a heredoc line"""
        return line.startswith(self._prefix)

    def ignores(self, ctx):
        """Tell whether the limit mark is the one meaning "do not check\""""
        return ctx == ' > %s\n' % heredocignorelimit

    def filename(self, ctx):
        """Return None, because there is no filename for this kind of code"""
        return None

    def codeatstart(self, ctx, line):
        """Return None, because there is no embedded code at start line"""
        return None

    def codeatend(self, ctx, line):
        """Return None, because there is no embedded code at end line"""
        return None

    def codeinside(self, ctx, line):
        """Return line without the heredoc prefix"""
        skip = len(self._prefix)
        return line[skip:]
# matchers detecting each kind of embedded python code
_pymatchers = [
    pydoctestmatcher(),
    pyheredocmatcher(),
    # use '[^<]+' instead of '\S+', in order to match against
    # paths including whitespaces
    fileheredocmatcher('heredoc .py file', r'[^<]+\.py'),
]


def pyembedded(basefile, lines, errors):
    """Pick embedded python code up from lines (see "embedded()")"""
    return embedded(basefile, lines, errors, matchers=_pymatchers)
####
# for embedded shell script
# matchers detecting each kind of embedded shell script
_shmatchers = [
    # use '[^<]+' instead of '\S+', in order to match against
    # paths including whitespaces
    fileheredocmatcher('heredoc .sh file', r'[^<]+\.sh'),
]


def shembedded(basefile, lines, errors):
    """Pick embedded shell script up from lines (see "embedded()")"""
    return embedded(basefile, lines, errors, matchers=_shmatchers)
####
# for embedded hgrc configuration
# matchers detecting each kind of embedded hgrc configuration
_hgrcmatchers = [
    # use '[^<]+' instead of '\S+', in order to match against
    # paths including whitespaces
    fileheredocmatcher('heredoc hgrc file',
                       r'(([^/<]+/)+hgrc|\$HGRCPATH|\${HGRCPATH})'),
]


def hgrcembedded(basefile, lines, errors):
    """Pick embedded hgrc configuration up from lines (see "embedded()")"""
    return embedded(basefile, lines, errors, matchers=_hgrcmatchers)
####
if __name__ == "__main__":
    # command line interface: "testparseutil.py COMMAND [file ...]"
    import optparse

    def showembedded(basefile, lines, embeddedfunc, opts):
        """List embedded code fragments in lines, and return error count

        Start/end of each fragment are written into stdout in
        "FILENAME:LINENO:" format (with extracted code between them, if
        opts.verbose), and detected errors are written into stderr.
        """
        errors = []
        for name, starts, ends, code in embeddedfunc(basefile, lines, errors):
            if not name:
                name = '<anonymous>'
            writeout("%s:%d: %s starts\n" % (basefile, starts, name))
            if opts.verbose and code:
                writeout(" |%s\n" % "\n |".join(code.splitlines()))
            writeout("%s:%d: %s ends\n" % (basefile, ends, name))
        for e in errors:
            writeerr("%s\n" % e)
        return len(errors)

    def applyembedded(args, embeddedfunc, opts):
        """Apply embeddedfunc on each file in args (or on stdin, if empty)

        This returns 1 if any error is detected. Otherwise, 0.
        """
        ret = 0
        if args:
            for f in args:
                with opentext(f) as fp:
                    if showembedded(f, fp, embeddedfunc, opts):
                        ret = 1
        else:
            lines = sys.stdin.readlines()
            if showembedded('<stdin>', lines, embeddedfunc, opts):
                ret = 1
        return ret

    # table of sub commands: name => (description, function)
    commands = {}

    def command(name, desc):
        """Return a decorator registering a function as sub command name"""
        def wrap(func):
            commands[name] = (desc, func)
            # hand the function back, in order to keep the decorated
            # name bound to it (not to None)
            return func
        return wrap

    @command("pyembedded", "detect embedded python script")
    def pyembeddedcmd(args, opts):
        return applyembedded(args, pyembedded, opts)

    @command("shembedded", "detect embedded shell script")
    def shembeddedcmd(args, opts):
        return applyembedded(args, shembedded, opts)

    @command("hgrcembedded", "detect embedded hgrc configuration")
    def hgrcembeddedcmd(args, opts):
        return applyembedded(args, hgrcembedded, opts)

    availablecommands = "\n".join([" - %s: %s" % (key, value[0])
                                   for key, value in commands.items()])

    parser = optparse.OptionParser("""%prog COMMAND [file ...]
Pick up embedded code fragments from given file(s) or stdin, and list
up start/end lines of them in standard compiler format
("FILENAME:LINENO:").
Available commands are:
""" + availablecommands + """
""")
    parser.add_option("-v", "--verbose",
                      help="enable additional output (e.g. actual code)",
                      action="store_true")
    (opts, args) = parser.parse_args()

    # an unknown (or missing) command is a usage error
    if not args or args[0] not in commands:
        parser.print_help()
        sys.exit(255)

    # exit with the value returned by the chosen command
    sys.exit(commands[args[0]][1](args[1:], opts))