upstream/mercurial-mirror Commit - r26843:f580c78e

uescape: also encode non-printable char under 128...

Pierre-Yves David -

r26843:f580c78e default

parent child

mercurial/templatefilters.py

0 +1 -1

              # template-filters.py - common template expansion filters
              #
              # Copyright 2005-2008 Matt Mackall <mpm@selenic.com>
              #
              # This software may be used and distributed according to the terms of the
              # GNU General Public License version 2 or any later version.
              from __future__ import absolute_import
              import cgi
              import os
              import re
              import time
              import urllib
              from . import (
                  encoding,
                  hbisect,
                  node,
                  templatekw,
                  util,
              )
              def addbreaks(text):
                  """:addbreaks: Any text. Add an XHTML "<br />" tag before the end of
                  every line except the last.
                  """
                  return text.replace('\n', '<br/>\n')
              agescales = [("year", 3600 * 24 * 365, 'Y'),
                           ("month", 3600 * 24 * 30, 'M'),
                           ("week", 3600 * 24 * 7, 'W'),
                           ("day", 3600 * 24, 'd'),
                           ("hour", 3600, 'h'),
                           ("minute", 60, 'm'),
                           ("second", 1, 's')]
              def age(date, abbrev=False):
                  """:age: Date. Returns a human-readable date/time difference between the
                  given date/time and the current date/time.
                  """
                  def plural(t, c):
                      if c == 1:
                          return t
                      return t + "s"
                  def fmt(t, c, a):
                      if abbrev:
                          return "%d%s" % (c, a)
                      return "%d %s" % (c, plural(t, c))
                  now = time.time()
                  then = date[0]
                  future = False
                  if then > now:
                      future = True
                      delta = max(1, int(then - now))
                      if delta > agescales[0][1] * 30:
                          return 'in the distant future'
                  else:
                      delta = max(1, int(now - then))
                      if delta > agescales[0][1] * 2:
                          return util.shortdate(date)
                  for t, s, a in agescales:
                      n = delta // s
                      if n >= 2 or s == 1:
                          if future:
                              return '%s from now' % fmt(t, n, a)
                          return '%s ago' % fmt(t, n, a)
              def basename(path):
                  """:basename: Any text. Treats the text as a path, and returns the last
                  component of the path after splitting by the path separator
                  (ignoring trailing separators). For example, "foo/bar/baz" becomes
                  "baz" and "foo/bar//" becomes "bar".
                  """
                  return os.path.basename(path)
              def count(i):
                  """:count: List or text. Returns the length as an integer."""
                  return len(i)
              def domain(author):
                  """:domain: Any text. Finds the first string that looks like an email
                  address, and extracts just the domain component. Example: ``User
                  <user@example.com>`` becomes ``example.com``.
                  """
                  f = author.find('@')
                  if f == -1:
                      return ''
                  author = author[f + 1:]
                  f = author.find('>')
                  if f >= 0:
                      author = author[:f]
                  return author
              def email(text):
                  """:email: Any text. Extracts the first string that looks like an email
                  address. Example: ``User <user@example.com>`` becomes
                  ``user@example.com``.
                  """
                  return util.email(text)
              def escape(text):
                  """:escape: Any text. Replaces the special XML/XHTML characters "&", "<"
                  and ">" with XML entities, and filters out NUL characters.
                  """
                  return cgi.escape(text.replace('\0', ''), True)
              para_re = None
              space_re = None
              def fill(text, width, initindent='', hangindent=''):
                  '''fill many paragraphs with optional indentation.'''
                  global para_re, space_re
                  if para_re is None:
                      para_re = re.compile('(\n\n|\n\\s*[-*]\\s*)', re.M)
                      space_re = re.compile(r'  +')
                  def findparas():
                      start = 0
                      while True:
                          m = para_re.search(text, start)
                          if not m:
                              uctext = unicode(text[start:], encoding.encoding)
                              w = len(uctext)
                              while 0 < w and uctext[w - 1].isspace():
                                  w -= 1
                              yield (uctext[:w].encode(encoding.encoding),
                                     uctext[w:].encode(encoding.encoding))
                              break
                          yield text[start:m.start(0)], m.group(1)
                          start = m.end(1)
                  return "".join([util.wrap(space_re.sub(' ', util.wrap(para, width)),
                                            width, initindent, hangindent) + rest
                                  for para, rest in findparas()])
              def fill68(text):
                  """:fill68: Any text. Wraps the text to fit in 68 columns."""
                  return fill(text, 68)
              def fill76(text):
                  """:fill76: Any text. Wraps the text to fit in 76 columns."""
                  return fill(text, 76)
              def firstline(text):
                  """:firstline: Any text. Returns the first line of text."""
                  try:
                      return text.splitlines(True)[0].rstrip('\r\n')
                  except IndexError:
                      return ''
              def hexfilter(text):
                  """:hex: Any text. Convert a binary Mercurial node identifier into
                  its long hexadecimal representation.
                  """
                  return node.hex(text)
              def hgdate(text):
                  """:hgdate: Date. Returns the date as a pair of numbers: "1157407993
 " (Unix timestamp, timezone offset).
                  """
                  return "%d %d" % text
              def isodate(text):
                  """:isodate: Date. Returns the date in ISO 8601 format: "2009-08-18 13:00
                  +0200".
                  """
                  return util.datestr(text, '%Y-%m-%d %H:%M %1%2')
              def isodatesec(text):
                  """:isodatesec: Date. Returns the date in ISO 8601 format, including
                  seconds: "2009-08-18 13:00:13 +0200". See also the rfc3339date
                  filter.
                  """
                  return util.datestr(text, '%Y-%m-%d %H:%M:%S %1%2')
              def indent(text, prefix):
                  '''indent each non-empty line of text after first with prefix.'''
                  lines = text.splitlines()
                  num_lines = len(lines)
                  endswithnewline = text[-1:] == '\n'
                  def indenter():
                      for i in xrange(num_lines):
                          l = lines[i]
                          if i and l.strip():
                              yield prefix
                          yield l
                          if i < num_lines - 1 or endswithnewline:
                              yield '\n'
                  return "".join(indenter())
              def json(obj):
                  if obj is None or obj is False or obj is True:
                      return {None: 'null', False: 'false', True: 'true'}[obj]
                  elif isinstance(obj, int) or isinstance(obj, float):
                      return str(obj)
                  elif isinstance(obj, str):
                      u = unicode(obj, encoding.encoding, 'replace')
                      return '"%s"' % jsonescape(u)
                  elif isinstance(obj, unicode):
                      return '"%s"' % jsonescape(obj)
                  elif util.safehasattr(obj, 'keys'):
                      out = []
                      for k, v in sorted(obj.iteritems()):
                          s = '%s: %s' % (json(k), json(v))
                          out.append(s)
                      return '{' + ', '.join(out) + '}'
                  elif util.safehasattr(obj, '__iter__'):
                      out = []
                      for i in obj:
                          out.append(json(i))
                      return '[' + ', '.join(out) + ']'
                  elif util.safehasattr(obj, '__call__'):
                      return json(obj())
                  else:
                      raise TypeError('cannot encode type %s' % obj.__class__.__name__)
              def _uescape(c):
-                 if ord(c) < 0x80:
+                 if 0x20 <= ord(c) < 0x80:
                      return c
                  else:
                      return '\\u%04x' % ord(c)
              _escapes = [
                  ('\\', '\\\\'), ('"', '\\"'), ('\t', '\\t'), ('\n', '\\n'),
                  ('\r', '\\r'), ('\f', '\\f'), ('\b', '\\b'),
                  ('<', '\\u003c'), ('>', '\\u003e'), ('\0', '\\u0000')
              ]
              def jsonescape(s):
                  for k, v in _escapes:
                      s = s.replace(k, v)
                  return ''.join(_uescape(c) for c in s)
              def lower(text):
                  """:lower: Any text. Converts the text to lowercase."""
                  return encoding.lower(text)
              def nonempty(str):
                  """:nonempty: Any text. Returns '(none)' if the string is empty."""
                  return str or "(none)"
              def obfuscate(text):
                  """:obfuscate: Any text. Returns the input text rendered as a sequence of
                  XML entities.
                  """
                  text = unicode(text, encoding.encoding, 'replace')
                  return ''.join(['&#%d;' % ord(c) for c in text])
              def permissions(flags):
                  if "l" in flags:
                      return "lrwxrwxrwx"
                  if "x" in flags:
                      return "-rwxr-xr-x"
                  return "-rw-r--r--"
              def person(author):
                  """:person: Any text. Returns the name before an email address,
                  interpreting it as per RFC 5322.
                  >>> person('foo@bar')
                  'foo'
                  >>> person('Foo Bar <foo@bar>')
                  'Foo Bar'
                  >>> person('"Foo Bar" <foo@bar>')
                  'Foo Bar'
                  >>> person('"Foo \"buz\" Bar" <foo@bar>')
                  'Foo "buz" Bar'
                  >>> # The following are invalid, but do exist in real-life
                  ...
                  >>> person('Foo "buz" Bar <foo@bar>')
                  'Foo "buz" Bar'
                  >>> person('"Foo Bar <foo@bar>')
                  'Foo Bar'
                  """
                  if '@' not in author:
                      return author
                  f = author.find('<')
                  if f != -1:
                      return author[:f].strip(' "').replace('\\"', '"')
                  f = author.find('@')
                  return author[:f].replace('.', ' ')
              def revescape(text):
                  """:revescape: Any text. Escapes all "special" characters, except @.
                  Forward slashes are escaped twice to prevent web servers from prematurely
                  unescaping them. For example, "@foo bar/baz" becomes "@foo%20bar%252Fbaz".
                  """
                  return urllib.quote(text, safe='/@').replace('/', '%252F')
              def rfc3339date(text):
                  """:rfc3339date: Date. Returns a date using the Internet date format
                  specified in RFC 3339: "2009-08-18T13:00:13+02:00".
                  """
                  return util.datestr(text, "%Y-%m-%dT%H:%M:%S%1:%2")
              def rfc822date(text):
                  """:rfc822date: Date. Returns a date using the same format used in email
                  headers: "Tue, 18 Aug 2009 13:00:13 +0200".
                  """
                  return util.datestr(text, "%a, %d %b %Y %H:%M:%S %1%2")
              def short(text):
                  """:short: Changeset hash. Returns the short form of a changeset hash,
                  i.e. a 12 hexadecimal digit string.
                  """
                  return text[:12]
              def shortbisect(text):
                  """:shortbisect: Any text. Treats `text` as a bisection status, and
                  returns a single-character representing the status (G: good, B: bad,
                  S: skipped, U: untested, I: ignored). Returns single space if `text`
                  is not a valid bisection status.
                  """
                  return hbisect.shortlabel(text) or ' '
              def shortdate(text):
                  """:shortdate: Date. Returns a date like "2006-09-18"."""
                  return util.shortdate(text)
              def splitlines(text):
                  """:splitlines: Any text. Split text into a list of lines."""
                  return templatekw.showlist('line', text.splitlines(), 'lines')
              def stringescape(text):
                  return text.encode('string_escape')
              def stringify(thing):
                  """:stringify: Any type. Turns the value into text by converting values into
                  text and concatenating them.
                  """
                  if util.safehasattr(thing, '__iter__') and not isinstance(thing, str):
                      return "".join([stringify(t) for t in thing if t is not None])
                  if thing is None:
                      return ""
                  return str(thing)
              def stripdir(text):
                  """:stripdir: Treat the text as path and strip a directory level, if
                  possible. For example, "foo" and "foo/bar" becomes "foo".
                  """
                  dir = os.path.dirname(text)
                  if dir == "":
                      return os.path.basename(text)
                  else:
                      return dir
              def tabindent(text):
                  """:tabindent: Any text. Returns the text, with every non-empty line
                  except the first starting with a tab character.
                  """
                  return indent(text, '\t')
              def upper(text):
                  """:upper: Any text. Converts the text to uppercase."""
                  return encoding.upper(text)
              def urlescape(text):
                  """:urlescape: Any text. Escapes all "special" characters. For example,
                  "foo bar" becomes "foo%20bar".
                  """
                  return urllib.quote(text)
              def userfilter(text):
                  """:user: Any text. Returns a short representation of a user name or email
                  address."""
                  return util.shortuser(text)
              def emailuser(text):
                  """:emailuser: Any text. Returns the user portion of an email address."""
                  return util.emailuser(text)
              def xmlescape(text):
                  text = (text
                          .replace('&', '&amp;')
                          .replace('<', '&lt;')
                          .replace('>', '&gt;')
                          .replace('"', '&quot;')
                          .replace("'", '&#39;')) # &apos; invalid in HTML
                  return re.sub('[\x00-\x08\x0B\x0C\x0E-\x1F]', ' ', text)
              filters = {
                  "addbreaks": addbreaks,
                  "age": age,
                  "basename": basename,
                  "count": count,
                  "domain": domain,
                  "email": email,
                  "escape": escape,
                  "fill68": fill68,
                  "fill76": fill76,
                  "firstline": firstline,
                  "hex": hexfilter,
                  "hgdate": hgdate,
                  "isodate": isodate,
                  "isodatesec": isodatesec,
                  "json": json,
                  "jsonescape": jsonescape,
                  "lower": lower,
                  "nonempty": nonempty,
                  "obfuscate": obfuscate,
                  "permissions": permissions,
                  "person": person,
                  "revescape": revescape,
                  "rfc3339date": rfc3339date,
                  "rfc822date": rfc822date,
                  "short": short,
                  "shortbisect": shortbisect,
                  "shortdate": shortdate,
                  "splitlines": splitlines,
                  "stringescape": stringescape,
                  "stringify": stringify,
                  "stripdir": stripdir,
                  "tabindent": tabindent,
                  "upper": upper,
                  "urlescape": urlescape,
                  "user": userfilter,
                  "emailuser": emailuser,
                  "xmlescape": xmlescape,
              }
              def websub(text, websubtable):
                  """:websub: Any text. Only applies to hgweb. Applies the regular
                  expression replacements defined in the websub section.
                  """
                  if websubtable:
                      for regexp, format in websubtable:
                          text = regexp.sub(format, text)
                  return text
              # tell hggettext to extract docstrings from these functions:
              i18nfunctions = filters.values()

tests/test-template-engine.t

0 +13 0

                $ cat > engine.py << EOF
                >
                > from mercurial import templater
                >
                > class mytemplater(object):
                >     def __init__(self, loader, filters, defaults):
                >         self.loader = loader
                >
                >     def process(self, t, map):
                >         tmpl = self.loader(t)
                >         for k, v in map.iteritems():
                >             if k in ('templ', 'ctx', 'repo', 'revcache', 'cache'):
                >                 continue
                >             if hasattr(v, '__call__'):
                >                 v = v(**map)
                >             v = templater.stringify(v)
                >             tmpl = tmpl.replace('{{%s}}' % k, v)
                >         yield tmpl
                >
                > templater.engines['my'] = mytemplater
                > EOF
                $ hg init test
                $ echo '[extensions]' > test/.hg/hgrc
                $ echo "engine = `pwd`/engine.py" >> test/.hg/hgrc
                $ cd test
                $ cat > mymap << EOF
                > changeset = my:changeset.txt
                > EOF
                $ cat > changeset.txt << EOF
                > {{rev}} {{node}} {{author}}
                > EOF
                $ hg ci -Ama
                adding changeset.txt
                adding mymap
                $ hg log --style=./mymap
 97e5f848f0936960273bbf75be6388cd0350a32b test
                $ cat > changeset.txt << EOF
                > {{p1rev}} {{p1node}} {{p2rev}} {{p2node}}
                > EOF
                $ hg ci -Ama
                $ hg log --style=./mymap
 97e5f848f0936960273bbf75be6388cd0350a32b -1 0000000000000000000000000000000000000000
                -1 0000000000000000000000000000000000000000 -1 0000000000000000000000000000000000000000
+             Fuzzing the unicode escaper to ensure it produces valid data
+             #if hypothesis
+               >>> from hypothesishelpers import *
+               >>> import mercurial.templatefilters as tf
+               >>> import json
+               >>> @check(st.text().map(lambda s: s.encode('utf-8')))
+               ... def testtfescapeproducesvalidjson(text):
+               ...     json.loads('"' + tf.jsonescape(text) + '"')
+             #endif
-               $ cd ..

General Comments 0

Write
Preview

You need to be logged in to leave comments. Login now

No TODOs yet

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages