##// END OF EJS Templates
Merge pull request #11250 from Carreau/invalid-escape-sequence...
Min RK -
r24469:eed56ba3 merge
parent child Browse files
Show More
@@ -1,2060 +1,2060 b''
1 1 """Completion for IPython.
2 2
3 3 This module started as fork of the rlcompleter module in the Python standard
4 4 library. The original enhancements made to rlcompleter have been sent
5 5 upstream and were accepted as of Python 2.3,
6 6
7 7 This module now supports a wide variety of completion mechanisms, both available
8 8 for normal classic Python code, as well as completers for IPython-specific
9 9 syntax like magics.
10 10
11 11 Latex and Unicode completion
12 12 ============================
13 13
14 14 IPython and compatible frontends not only can complete your code, but can help
15 15 you to input a wide range of characters. In particular we allow you to insert
16 16 a unicode character using the tab completion mechanism.
17 17
18 18 Forward latex/unicode completion
19 19 --------------------------------
20 20
21 21 Forward completion allows you to easily type a unicode character using its latex
22 22 name, or unicode long description. To do so type a backslash follow by the
23 23 relevant name and press tab:
24 24
25 25
26 26 Using latex completion:
27 27
28 28 .. code::
29 29
30 30 \\alpha<tab>
31 31 Ξ±
32 32
33 33 or using unicode completion:
34 34
35 35
36 36 .. code::
37 37
38 38 \\greek small letter alpha<tab>
39 39 Ξ±
40 40
41 41
42 42 Only valid Python identifiers will complete. Combining characters (like arrow or
43 43 dots) are also available; unlike latex, they need to be put after their
44 44 counterpart that is to say, `F\\\\vec<tab>` is correct, not `\\\\vec<tab>F`.
45 45
46 46 Some browsers are known to display combining characters incorrectly.
47 47
48 48 Backward latex completion
49 49 -------------------------
50 50
51 51 It is sometime challenging to know how to type a character, if you are using
52 52 IPython, or any compatible frontend you can prepend backslash to the character
53 53 and press `<tab>` to expand it to its latex form.
54 54
55 55 .. code::
56 56
57 57 \\Ξ±<tab>
58 58 \\alpha
59 59
60 60
61 61 Both forward and backward completions can be deactivated by setting the
62 62 ``Completer.backslash_combining_completions`` option to ``False``.
63 63
64 64
65 65 Experimental
66 66 ============
67 67
68 68 Starting with IPython 6.0, this module can make use of the Jedi library to
69 69 generate completions both using static analysis of the code, and dynamically
70 70 inspecting multiple namespaces. The APIs attached to this new mechanism are
71 71 unstable and will raise unless used in a :any:`provisionalcompleter` context
72 72 manager.
73 73
74 74 You will find that the following are experimental:
75 75
76 76 - :any:`provisionalcompleter`
77 77 - :any:`IPCompleter.completions`
78 78 - :any:`Completion`
79 79 - :any:`rectify_completions`
80 80
81 81 .. note::
82 82
83 83 better name for :any:`rectify_completions` ?
84 84
85 85 We welcome any feedback on these new API, and we also encourage you to try this
86 86 module in debug mode (start IPython with ``--Completer.debug=True``) in order
87 87 to have extra logging information if :any:`jedi` is crashing, or if current
88 88 IPython completer pending deprecations are returning results not yet handled
89 89 by :any:`jedi`
90 90
91 91 Using Jedi for tab completion allow snippets like the following to work without
92 92 having to execute any code:
93 93
94 94 >>> myvar = ['hello', 42]
95 95 ... myvar[1].bi<tab>
96 96
97 97 Tab completion will be able to infer that ``myvar[1]`` is a real number without
98 98 executing any code unlike the previously available ``IPCompleter.greedy``
99 99 option.
100 100
101 101 Be sure to update :any:`jedi` to the latest stable version or to try the
102 102 current development version to get better completions.
103 103 """
104 104
105 105
106 106 # Copyright (c) IPython Development Team.
107 107 # Distributed under the terms of the Modified BSD License.
108 108 #
109 109 # Some of this code originated from rlcompleter in the Python standard library
110 110 # Copyright (C) 2001 Python Software Foundation, www.python.org
111 111
112 112
113 113 import __main__
114 114 import builtins as builtin_mod
115 115 import glob
116 116 import time
117 117 import inspect
118 118 import itertools
119 119 import keyword
120 120 import os
121 121 import re
122 122 import sys
123 123 import unicodedata
124 124 import string
125 125 import warnings
126 126
127 127 from contextlib import contextmanager
128 128 from importlib import import_module
129 129 from typing import Iterator, List, Tuple, Iterable, Union
130 130 from types import SimpleNamespace
131 131
132 132 from traitlets.config.configurable import Configurable
133 133 from IPython.core.error import TryNext
134 134 from IPython.core.inputsplitter import ESC_MAGIC
135 135 from IPython.core.latex_symbols import latex_symbols, reverse_latex_symbol
136 136 from IPython.core.oinspect import InspectColors
137 137 from IPython.utils import generics
138 138 from IPython.utils.dir2 import dir2, get_real_method
139 139 from IPython.utils.process import arg_split
140 140 from traitlets import Bool, Enum, observe, Int
141 141
# Tell the doctest machinery to skip this module's docstrings (the examples
# in them are illustrative, not executable).
skip_doctest = True

# Jedi is an optional dependency: record whether it is importable so callers
# can fall back on the legacy completion machinery when it is missing.
try:
    import jedi
    jedi.settings.case_insensitive_completion = False
    import jedi.api.helpers
    import jedi.api.classes
    JEDI_INSTALLED = True
except ImportError:
    JEDI_INSTALLED = False
#-----------------------------------------------------------------------------
# Globals
#-----------------------------------------------------------------------------

# Public API
__all__ = ['Completer','IPCompleter']

# Characters that need escaping when they appear inside a file name.
if sys.platform == 'win32':
    PROTECTABLES = ' '
else:
    PROTECTABLES = ' ()[]{}?=\\|;:\'#*"^&'

# Protect against returning an enormous number of completions which the frontend
# may have trouble processing.
MATCHES_LIMIT = 500

# Sentinel used to detect whether a deprecated readline-related argument was
# explicitly supplied by the caller.
_deprecation_readline_sentinel = object()
171 171
class ProvisionalCompleterWarning(FutureWarning):
    """
    Exception raised by an experimental feature in this module.

    Wrap code in the :any:`provisionalcompleter` context manager if you
    are certain you want to use an unstable feature.
    """
    pass
180 180
# Turn uses of provisional APIs into hard errors unless explicitly allowed
# via the :any:`provisionalcompleter` context manager below.
warnings.filterwarnings('error', category=ProvisionalCompleterWarning)
182 182
@contextmanager
def provisionalcompleter(action='ignore'):
    """
    Context manager that allows access to the unstable completer APIs.

    This context manager has to be used in any place where unstable completer
    behavior and API may be called.

    >>> with provisionalcompleter():
    ...     completer.do_experimental_things() # works

    >>> completer.do_experimental_things() # raises.

    .. note:: Unstable

        By using this context manager you agree that the API in use may change
        without warning, and that you won't complain if they do so.

        You also understand that if the API is not to your liking you should report
        a bug to explain your use case upstream, improving the API, and will lose
        credibility if you complain after the API is made stable.

        We'll be happy to get your feedback, feature requests and improvements on
        any of the unstable APIs!
    """
    with warnings.catch_warnings():
        # Temporarily relax the module-level 'error' filter so that the
        # provisional APIs can be exercised without raising.
        warnings.filterwarnings(action, category=ProvisionalCompleterWarning)
        yield
211 211
212 212
def has_open_quotes(s):
    """Return the quote character left open in *s*, or ``False``.

    An odd number of occurrences of a quote character means that quote type
    is still open.  Double quotes are checked before single quotes so nested
    cases resolve in favour of ``"``.
    """
    for quote in ('"', "'"):
        if s.count(quote) % 2:
            return quote
    return False
232 232
233 233
def protect_filename(s, protectables=PROTECTABLES):
    """Escape a string to protect certain characters."""
    if not (set(s) & set(protectables)):
        # Nothing needs protecting; hand the string back untouched.
        return s
    if sys.platform == "win32":
        # On Windows the conventional escape is to quote the whole path.
        return '"' + s + '"'
    # Elsewhere, backslash-escape each protectable character individually.
    escaped = []
    for ch in s:
        escaped.append("\\" + ch if ch in protectables else ch)
    return "".join(escaped)
243 243
244 244
def expand_user(path:str) -> Tuple[str, bool, str]:
    """Expand ``~``-style usernames in strings.

    This is similar to :func:`os.path.expanduser`, but it computes and returns
    extra information that will be useful if the input was being used in
    computing completions, and you wish to return the completions with the
    original '~' instead of its expanded value.

    Parameters
    ----------
    path : str
        String to be expanded. If no ~ is present, the output is the same as the
        input.

    Returns
    -------
    newpath : str
        Result of ~ expansion in the input path.
    tilde_expand : bool
        Whether any expansion was performed or not.
    tilde_val : str
        The value that ~ was replaced with.
    """
    if not path.startswith('~'):
        # No tilde: nothing was expanded.
        return path, False, ''

    expanded = os.path.expanduser(path)
    tail_len = len(path) - 1
    # Everything except the trailing ``tail_len`` characters of the result is
    # what the leading '~...' expanded to; for a bare '~' it is the whole thing.
    tilde_val = expanded[:-tail_len] if tail_len else expanded
    return expanded, True, tilde_val
283 283
284 284
def compress_user(path:str, tilde_expand:bool, tilde_val:str) -> str:
    """Invert :func:`expand_user`, using its outputs."""
    if not tilde_expand:
        return path
    # Substitute the expanded home prefix back with '~'.
    return path.replace(tilde_val, '~')
292 292
293 293
def completions_sorting_key(word):
    """key for sorting completions

    This does several things:

    - Demote any completions starting with underscores to the end
    - Insert any %magic and %%cellmagic completions in the alphabetical order
      by their name
    """
    # First priority: dunders sort last, single-underscore names next-to-last,
    # and 'name=' keyword-argument completions first of all.
    if word.startswith('__'):
        prio1 = 2
    elif word.startswith('_'):
        prio1 = 1
    else:
        prio1 = 0
    if word.endswith('='):
        prio1 = -1

    # Second priority: strip magic prefixes so magics interleave by bare name;
    # at equal names, cell magics (%%) sort after line magics (%).
    prio2 = 0
    if word.startswith('%%'):
        # Another % further in means this is something else; leave it alone.
        if "%" not in word[2:]:
            word, prio2 = word[2:], 2
    elif word.startswith('%'):
        if "%" not in word[1:]:
            word, prio2 = word[1:], 1

    return prio1, word, prio2
324 324
325 325
326 326 class _FakeJediCompletion:
327 327 """
328 328 This is a workaround to communicate to the UI that Jedi has crashed and to
329 329 report a bug. Will be used only id :any:`IPCompleter.debug` is set to true.
330 330
331 331 Added in IPython 6.0 so should likely be removed for 7.0
332 332
333 333 """
334 334
335 335 def __init__(self, name):
336 336
337 337 self.name = name
338 338 self.complete = name
339 339 self.type = 'crashed'
340 340 self.name_with_symbols = name
341 341 self.signature = ''
342 342 self._origin = 'fake'
343 343
344 344 def __repr__(self):
345 345 return '<Fake completion object jedi has crashed>'
346 346
347 347
class Completion:
    """
    Completion object used and returned by IPython completers.

    .. warning:: Unstable

        This function is unstable, API may change without warning.
        It will also raise unless used in a proper context manager.

    This acts as a middle ground :any:`Completion` object between the
    :any:`jedi.api.classes.Completion` object and the Prompt Toolkit completion
    object. While Jedi needs a lot of information about the evaluator and how
    the code should be run/inspected, PromptToolkit (and other frontends) mostly
    need user facing information.

    - Which range should be replaced by what.
    - Some metadata (like completion type), or meta information to display to
      the user.

    For debugging purpose we can also store the origin of the completion (``jedi``,
    ``IPython.python_matches``, ``IPython.magics_matches``...).
    """

    __slots__ = ['start', 'end', 'text', 'type', 'signature', '_origin']

    def __init__(self, start: int, end: int, text: str, *, type: str=None, _origin='', signature='') -> None:
        # Warn on every construction: under the module-level 'error' filter
        # this raises unless wrapped in :any:`provisionalcompleter`.
        warnings.warn("``Completion`` is a provisional API (as of IPython 6.0). "
                      "It may change without warnings. "
                      "Use in corresponding context manager.",
                      category=ProvisionalCompleterWarning, stacklevel=2)

        self.start = start
        self.end = end
        self.text = text
        self.type = type
        self.signature = signature
        self._origin = _origin

    def __repr__(self):
        return '<Completion start=%s end=%s text=%r type=%r, signature=%r,>' % \
                (self.start, self.end, self.text, self.type or '?', self.signature or '?')

    # BUG FIX: the return annotation used to be the traitlets trait class
    # ``Bool`` (imported at the top of this file), not the builtin ``bool``
    # that a dunder comparison actually returns.
    def __eq__(self, other) -> bool:
        """
        Equality and hash do not hash the type (as some completer may not be
        able to infer the type), but are used to (partially) de-duplicate
        completion.

        Completely de-duplicating completions is a bit trickier than just
        comparing, as it depends on surrounding text, which Completions are not
        aware of.
        """
        return self.start == other.start and \
            self.end == other.end and \
            self.text == other.text

    def __hash__(self):
        return hash((self.start, self.end, self.text))
406 406
407 407
# Type alias: an iterable of Completion objects, used by the de-duplication
# and rectification helpers below.
_IC = Iterable[Completion]
410 410
def _deduplicate_completions(text: str, completions: _IC)-> _IC:
    """
    Deduplicate a set of completions.

    .. warning:: Unstable

        This function is unstable, API may change without warning.

    Parameters
    ----------
    text: str
        text that should be completed.
    completions: Iterator[Completion]
        iterator over the completions to deduplicate

    Yields
    ------
    `Completions` objects


    Completions coming from multiple sources may differ textually yet have the
    same effect once applied to ``text``; such completions are considered equal
    and only the first one encountered is emitted.

    Not folded in `completions()` yet for debugging purpose, and to detect when
    the IPython completer does return things that Jedi does not, but should be
    at some point.
    """
    pool = list(completions)
    if not pool:
        return

    # Normalise every candidate to one common replacement range so the
    # resulting texts can be compared directly.
    lo = min(c.start for c in pool)
    hi = max(c.end for c in pool)

    emitted = set()
    for candidate in pool:
        effective = text[lo:candidate.start] + candidate.text + text[candidate.end:hi]
        if effective in emitted:
            continue
        emitted.add(effective)
        yield candidate
452 452
453 453
def rectify_completions(text: str, completions: _IC, *, _debug=False)->_IC:
    """
    Rectify a set of completions to all have the same ``start`` and ``end``

    .. warning:: Unstable

        This function is unstable, API may change without warning.
        It will also raise unless used in a proper context manager.

    Parameters
    ----------
    text: str
        text that should be completed.
    completions: Iterator[Completion]
        iterator over the completions to rectify


    :any:`jedi.api.classes.Completion` s returned by Jedi may not have the same
    start and end, though the Jupyter Protocol requires them to behave like so.
    Every completion is therefore padded on both sides with the surrounding
    text so that all share one common ``start``/``end`` pair.

    During stabilisation should support a ``_debug`` option to log which
    completions are returned by the IPython completer and not found in Jedi in
    order to make upstream bug reports.
    """
    warnings.warn("`rectify_completions` is a provisional API (as of IPython 6.0). "
                 "It may change without warnings. "
                 "Use in corresponding context manager.",
                  category=ProvisionalCompleterWarning, stacklevel=2)

    pool = list(completions)
    if not pool:
        return

    # Common replacement range covering every candidate.
    new_start = min(c.start for c in pool)
    new_end = max(c.end for c in pool)

    # Track what each origin produced so extras can be reported in debug mode.
    from_jedi = set()
    from_python_matches = set()
    for comp in pool:
        padded = text[new_start:comp.start] + comp.text + text[comp.end:new_end]
        if comp._origin == 'jedi':
            from_jedi.add(padded)
        elif comp._origin == 'IPCompleter.python_matches':
            from_python_matches.add(padded)
        yield Completion(new_start, new_end, padded, type=comp.type,
                         _origin=comp._origin, signature=comp.signature)

    extras = from_python_matches.difference(from_jedi)
    if extras and _debug:
        print('IPython.python matches have extras:', extras)
506 506
507 507
# Delimiters used to split a line into completable 'words'.  On Windows,
# ':', '/' and '\\' are kept out of the set so drive letters and paths
# survive the split.
if sys.platform == 'win32':
    DELIMS = ' \t\n`!@#$^&*()=+[{]}|;\'",<>?'
else:
    DELIMS = ' \t\n`!@#$^&*()=+[{]}\\|;:\'",<>?'

# Extra delimiters applied when greedy completion is active.
GREEDY_DELIMS = ' =\r\n'
515 515
class CompletionSplitter(object):
    """An object to split an input line in a manner similar to readline.

    By having our own implementation, we can expose readline-like completion in
    a uniform manner to all frontends.  This object only needs to be given the
    line of text to be split and the cursor position on said line, and it
    returns the 'word' to be completed on at the cursor after splitting the
    entire line.

    What characters are used as splitting delimiters can be controlled by
    setting the ``delims`` attribute (this is a property that internally
    automatically builds the necessary regular expression)"""

    # Private interface

    # A string of delimiter characters. The default value makes sense for
    # IPython's most typical usage patterns.
    _delims = DELIMS

    # The expression (a normal string) to be compiled into a regular expression
    # for actual splitting.  Kept as an attribute mostly for ease of debugging.
    _delim_expr = None

    # The regular expression that does the actual splitting
    _delim_re = None

    def __init__(self, delims=None):
        self.delims = CompletionSplitter._delims if delims is None else delims

    @property
    def delims(self):
        """Return the string of delimiter characters."""
        return self._delims

    @delims.setter
    def delims(self, delims):
        """Set the delimiters for line splitting."""
        # Build a character class with every delimiter backslash-escaped.
        expr = '[{}]'.format(''.join('\\' + ch for ch in delims))
        self._delim_re = re.compile(expr)
        self._delims = delims
        self._delim_expr = expr

    def split_line(self, line, cursor_pos=None):
        """Split a line of text with a cursor at the given position.
        """
        fragment = line if cursor_pos is None else line[:cursor_pos]
        return self._delim_re.split(fragment)[-1]
565 565
566 566
567 567
class Completer(Configurable):
    """Base completer.

    Matches plain names against the local/global namespaces and, when the
    text contains a dot, attribute names of the evaluated prefix.  The
    IPython-specific matchers live in the ``IPCompleter`` subclass.
    """

    greedy = Bool(False,
        help="""Activate greedy completion
        PENDING DEPRECATION. this is now mostly taken care of with Jedi.

        This will enable completion on elements of lists, results of function calls, etc.,
        but can be unsafe because the code is actually evaluated on TAB.
        """
    ).tag(config=True)

    use_jedi = Bool(default_value=False,
        help="Experimental: Use Jedi to generate autocompletions. "
        "Off by default.").tag(config=True)

    jedi_compute_type_timeout = Int(default_value=400,
        help="""Experimental: restrict time (in milliseconds) during which Jedi can compute types.
        Set to 0 to stop computing types. Non-zero value lower than 100ms may hurt
        performance by preventing jedi to build its cache.
        """).tag(config=True)

    debug = Bool(default_value=False,
                 help='Enable debug for the Completer. Mostly print extra '
                      'information for experimental jedi integration.')\
                      .tag(config=True)

    backslash_combining_completions = Bool(True,
        help="Enable unicode completions, e.g. \\alpha<tab> . "
             "Includes completion of latex commands, unicode names, and expanding "
             "unicode characters back to latex commands.").tag(config=True)



    def __init__(self, namespace=None, global_namespace=None, **kwargs):
        """Create a new completer for the command line.

        Completer(namespace=ns, global_namespace=ns2) -> completer instance.

        If unspecified, the default namespace where completions are performed
        is __main__ (technically, __main__.__dict__). Namespaces should be
        given as dictionaries.

        An optional second namespace can be given. This allows the completer
        to handle cases where both the local and global scopes need to be
        distinguished.
        """

        # Don't bind to namespace quite yet, but flag whether the user wants a
        # specific namespace or to use __main__.__dict__. This will allow us
        # to bind to __main__.__dict__ at completion time, not now.
        if namespace is None:
            self.use_main_ns = True
        else:
            self.use_main_ns = False
            self.namespace = namespace

        # The global namespace, if given, can be bound directly
        if global_namespace is None:
            self.global_namespace = {}
        else:
            self.global_namespace = global_namespace

        super(Completer, self).__init__(**kwargs)

    def complete(self, text, state):
        """Return the next possible completion for 'text'.

        This is called successively with state == 0, 1, 2, ... until it
        returns None. The completion should begin with 'text'.

        """
        if self.use_main_ns:
            # Late binding: pick up whatever __main__ holds *now*.
            self.namespace = __main__.__dict__

        if state == 0:
            # First call: compute and cache the full match list.
            if "." in text:
                self.matches = self.attr_matches(text)
            else:
                self.matches = self.global_matches(text)
        try:
            return self.matches[state]
        except IndexError:
            # Past the end of the cached matches: signal exhaustion.
            return None

    def global_matches(self, text):
        """Compute matches when text is a simple name.

        Return a list of all keywords, built-in functions and names currently
        defined in self.namespace or self.global_namespace that match.

        """
        matches = []
        match_append = matches.append
        n = len(text)
        for lst in [keyword.kwlist,
                    builtin_mod.__dict__.keys(),
                    self.namespace.keys(),
                    self.global_namespace.keys()]:
            for word in lst:
                if word[:n] == text and word != "__builtins__":
                    match_append(word)

        # Also match snake_case names by the initials of their components:
        # e.g. 'fb' completes to 'foo_bar'.
        snake_case_re = re.compile(r"[^_]+(_[^_]+)+?\Z")
        for lst in [self.namespace.keys(),
                    self.global_namespace.keys()]:
            shortened = {"_".join([sub[0] for sub in word.split('_')]) : word
                         for word in lst if snake_case_re.match(word)}
            for word in shortened.keys():
                if word[:n] == text and word != "__builtins__":
                    match_append(shortened[word])
        return matches

    def attr_matches(self, text):
        """Compute matches when text contains a dot.

        Assuming the text is of the form NAME.NAME....[NAME], and is
        evaluatable in self.namespace or self.global_namespace, it will be
        evaluated and its attributes (as revealed by dir()) are used as
        possible completions. (For class instances, class members are
        also considered.)

        WARNING: this can still invoke arbitrary C code, if an object
        with a __getattr__ hook is evaluated.

        """

        # Another option, seems to work great. Catches things like ''.<tab>
        m = re.match(r"(\S+(\.\w+)*)\.(\w*)$", text)

        if m:
            expr, attr = m.group(1, 3)
        elif self.greedy:
            # Greedy mode: re-match against the whole line buffer so that
            # subscripts/calls before the final dot are included.
            # NOTE(review): ``self.line_buffer`` is not set in this class —
            # presumably provided by a subclass; verify before relying on it.
            m2 = re.match(r"(.+)\.(\w*)$", self.line_buffer)
            if not m2:
                return []
            expr, attr = m2.group(1,2)
        else:
            return []

        # Evaluating arbitrary user text is inherently best-effort: any
        # exception (including SystemExit from __getattr__ hooks) simply
        # means "no matches", hence the deliberate bare excepts.
        try:
            obj = eval(expr, self.namespace)
        except:
            try:
                obj = eval(expr, self.global_namespace)
            except:
                return []

        # NOTE(review): ``limit_to__all__`` is not defined on this class —
        # presumably a trait of a subclass; confirm.
        if self.limit_to__all__ and hasattr(obj, '__all__'):
            words = get__all__entries(obj)
        else:
            words = dir2(obj)

        try:
            # Let extensions customise the candidate list.
            words = generics.complete_object(obj, words)
        except TryNext:
            pass
        except AssertionError:
            raise
        except Exception:
            # Silence errors from completion function
            #raise # dbg
            pass
        # Build match list to return
        n = len(attr)
        return [u"%s.%s" % (expr, w) for w in words if w[:n] == attr ]
733 733
734 734
def get__all__entries(obj):
    """Return the strings listed in the ``__all__`` attribute of *obj*.

    Non-string entries are skipped.  Objects without ``__all__`` (or whose
    ``__all__`` access raises) yield an empty list.
    """
    try:
        words = getattr(obj, '__all__')
    except Exception:
        # BUG FIX: was a bare ``except:`` — narrowed so KeyboardInterrupt and
        # SystemExit propagate instead of being silently swallowed.
        return []

    return [w for w in words if isinstance(w, str)]
743 743
744 744
def match_dict_keys(keys: List[str], prefix: str, delims: str):
    """Used by dict_key_matches, matching the prefix to a list of keys

    Parameters
    ==========
    keys:
        list of keys in dictionary currently being completed.
    prefix:
        Part of the text already typed by the user. e.g. `mydict[b'fo`
    delims:
        String of delimiters to consider when finding the current key.

    Returns
    =======

    A tuple of three elements: ``quote``, ``token_start``, ``matched``, with
    ``quote`` being the quote that need to be used to close current string.
    ``token_start`` the position where the replacement should start occurring,
    ``matches`` a list of replacement/completion

    """
    if not prefix:
        return None, 0, [repr(k) for k in keys
                      if isinstance(k, (str, bytes))]
    quote_match = re.search('["\']', prefix)
    if quote_match is None:
        # BUG FIX: a non-empty prefix with no opening quote (e.g. ``mydict[foo``)
        # used to crash with AttributeError on ``None.group()``; there is
        # nothing to string-complete, so report no matches instead.
        return None, 0, []
    quote = quote_match.group()
    try:
        # Close the quote and evaluate to recover the typed key fragment.
        prefix_str = eval(prefix + quote, {})
    except Exception:
        return None, 0, []

    # Locate the token being completed: the longest delimiter-free suffix.
    pattern = '[^' + ''.join('\\' + c for c in delims) + ']*$'
    token_match = re.search(pattern, prefix, re.UNICODE)
    token_start = token_match.start()
    token_prefix = token_match.group()

    matched = []
    for key in keys:
        try:
            if not key.startswith(prefix_str):
                continue
        except (AttributeError, TypeError, UnicodeError):
            # Python 3+ TypeError on b'a'.startswith('a') or vice-versa
            continue

        # reformat remainder of key to begin with prefix
        rem = key[len(prefix_str):]
        # force repr wrapped in '
        rem_repr = repr(rem + '"') if isinstance(rem, str) else repr(rem + b'"')
        if rem_repr.startswith('u') and prefix[0] not in 'uU':
            # Found key is unicode, but prefix is Py2 string.
            # Therefore attempt to interpret key as string.
            try:
                rem_repr = repr(rem.encode('ascii') + '"')
            except UnicodeEncodeError:
                continue

        rem_repr = rem_repr[1 + rem_repr.index("'"):-2]
        if quote == '"':
            # The entered prefix is quoted with ",
            # but the match is quoted with '.
            # A contained " hence needs escaping for comparison:
            rem_repr = rem_repr.replace('"', '\\"')

        # then reinsert prefix from start of token
        matched.append('%s%s' % (token_prefix, rem_repr))
    return quote, token_start, matched
812 812
813 813
def cursor_to_position(text:str, line:int, column:int)->int:
    """
    Convert the (line, column) position of the cursor in ``text`` to a flat
    string offset.

    Parameters
    ----------

    text : str
        The text in which to calculate the cursor offset
    line : int
        Line of the cursor; 0-indexed
    column : int
        Column of the cursor 0-indexed

    Return
    ------
    Position of the cursor in ``text``, 0-indexed.

    See Also
    --------
    position_to_cursor: reciprocal of this function

    """
    lines = text.split('\n')
    assert line <= len(lines), '{} <= {}'.format(str(line), str(len(lines)))

    # Each preceding line contributes its own length plus the '\n' separator.
    offset = column
    for preceding in lines[:line]:
        offset += len(preceding) + 1
    return offset
843 843
def position_to_cursor(text:str, offset:int)->Tuple[int, int]:
    """
    Convert the position of the cursor in text (0 indexed) to a line
    number(0-indexed) and a column number (0-indexed) pair

    Position should be a valid position in ``text``.

    Parameters
    ----------

    text : str
        The text in which to calculate the cursor offset
    offset : int
        Position of the cursor in ``text``, 0-indexed.

    Return
    ------
    (line, column) : (int, int)
        Line of the cursor; 0-indexed, column of the cursor 0-indexed


    See Also
    --------
    cursor_to_position : reciprocal of this function


    """

    assert 0 <= offset <= len(text) , "0 <= %s <= %s" % (offset , len(text))

    head = text[:offset]
    row = head.count('\n')
    # Column is the distance from the character just after the last newline
    # (rfind returns -1 when there is none, which yields column == offset).
    col = offset - (head.rfind('\n') + 1)
    return row, col
879 879
880 880
881 881 def _safe_isinstance(obj, module, class_name):
882 882 """Checks if obj is an instance of module.class_name if loaded
883 883 """
884 884 return (module in sys.modules and
885 885 isinstance(obj, getattr(import_module(module), class_name)))
886 886
887 887
def back_unicode_name_matches(text):
    u"""Match unicode characters back to unicode name

    This does ``β˜ƒ`` -> ``\\snowman``

    Note that snowman is not a valid python3 combining character but will be expanded.
    Though it will not recombine back to the snowman character by the completion machinery.

    This will not either back-complete standard sequences like \\n, \\b ...

    Returns
    -------
    A ``(text_to_replace, matches)`` pair; ``('', ())`` when there is nothing
    to complete.
    """
    if len(text)<2:
        return u'', ()
    maybe_slash = text[-2]
    if maybe_slash != '\\':
        return u'', ()

    char = text[-1]
    # no expand on quote for completion in strings.
    # nor backcomplete standard ascii keys
    if char in string.ascii_letters or char in ['"',"'"]:
        return u'', ()
    try :
        unic = unicodedata.name(char)
        return '\\'+char,['\\'+unic]
    except (KeyError, ValueError):
        # BUG FIX: ``unicodedata.name`` raises ValueError (not KeyError) for
        # characters without a name; previously this crashed the completer.
        pass
    return u'', ()
917 917
def back_latex_name_matches(text:str):
    """Match latex characters back to unicode name

    This does ``\\β„΅`` -> ``\\aleph``

    Used on Python 3 only.
    """
    if len(text) < 2 or text[-2] != '\\':
        return u'', ()

    char = text[-1]
    # Never expand quotes (we may be completing inside a string literal)
    # nor plain ASCII letters (those would shadow escapes such as \n).
    if char in string.ascii_letters or char in ('"', "'"):
        return u'', ()

    latex = reverse_latex_symbol.get(char)
    if latex is None:
        return u'', ()
    # Return '\\' + char as the matched text so the backslash is replaced
    # along with the character.
    return u'\\' + char, [latex]
944 944
945 945
946 946 def _formatparamchildren(parameter) -> str:
947 947 """
948 948 Get parameter name and value from Jedi Private API
949 949
950 950 Jedi does not expose a simple way to get `param=value` from its API.
951 951
952 952 Parameter
953 953 =========
954 954
955 955 parameter:
956 956 Jedi's function `Param`
957 957
958 958 Returns
959 959 =======
960 960
961 961 A string like 'a', 'b=1', '*args', '**kwargs'
962 962
963 963
964 964 """
965 965 description = parameter.description
966 966 if not description.startswith('param '):
967 967 raise ValueError('Jedi function parameter description have change format.'
968 968 'Expected "param ...", found %r".' % description)
969 969 return description[6:]
970 970
def _make_signature(completion)-> str:
    """
    Make the signature from a jedi completion

    Parameter
    =========

    completion: jedi.Completion
        object does not complete a function type

    Returns
    =======

    a string consisting of the function signature, with the parenthesis but
    without the function name. example:
    `(a, *args, b=1, **kwargs)`

    """
    parts = []
    for param in completion.params:
        formatted = _formatparamchildren(param)
        # Skip parameters that format to an empty string.
        if formatted:
            parts.append(formatted)
    return '(%s)' % ', '.join(parts)
991 991
992 992 class IPCompleter(Completer):
993 993 """Extension of the completer class with IPython-specific features"""
994 994
995 995 @observe('greedy')
996 996 def _greedy_changed(self, change):
997 997 """update the splitter and readline delims when greedy is changed"""
998 998 if change['new']:
999 999 self.splitter.delims = GREEDY_DELIMS
1000 1000 else:
1001 1001 self.splitter.delims = DELIMS
1002 1002
    # When several matchers return results, either concatenate them all
    # (True) or stop at the first matcher that produced anything (False).
    merge_completions = Bool(True,
        help="""Whether to merge completion results into a single list

        If False, only the completion results from the first non-empty
        completer will be returned.
        """
    ).tag(config=True)
    # Filtering of underscore-prefixed attributes on ``obj.<tab>``:
    # 2 hides everything starting with '_', 1 hides only dunders, 0 hides nothing.
    omit__names = Enum((0,1,2), default_value=2,
        help="""Instruct the completer to omit private method names

        Specifically, when completing on ``object.<tab>``.

        When 2 [default]: all names that start with '_' will be excluded.

        When 1: all 'magic' names (``__foo__``) will be excluded.

        When 0: nothing will be excluded.
        """
    ).tag(config=True)
    # Deprecated since 5.0; changing it triggers a deprecation warning
    # through its observer.
    limit_to__all__ = Bool(False,
        help="""
        DEPRECATED as of version 5.0.

        Instruct the completer to use __all__ for the completion

        Specifically, when completing on ``object.<tab>``.

        When True: only those names in obj.__all__ will be included.

        When False [default]: the __all__ attribute is ignored
        """,
    ).tag(config=True)
1035 1035
1036 1036 @observe('limit_to__all__')
1037 1037 def _limit_to_all_changed(self, change):
1038 1038 warnings.warn('`IPython.core.IPCompleter.limit_to__all__` configuration '
1039 1039 'value has been deprecated since IPython 5.0, will be made to have '
1040 1040 'no effects and then removed in future version of IPython.',
1041 1041 UserWarning)
1042 1042
    def __init__(self, shell=None, namespace=None, global_namespace=None,
                 use_readline=_deprecation_readline_sentinel, config=None, **kwargs):
        """IPCompleter() -> completer

        Return a completer object.

        Parameters
        ----------

        shell
            a pointer to the ipython shell itself. This is needed
            because this completer knows about magic functions, and those can
            only be accessed via the ipython instance.

        namespace : dict, optional
            an optional dict where completions are performed.

        global_namespace : dict, optional
            secondary optional dict for completions, to
            handle cases (such as IPython embedded inside functions) where
            both Python scopes are visible.

        use_readline : bool, optional
            DEPRECATED, ignored since IPython 6.0, will have no effects
        """

        self.magic_escape = ESC_MAGIC
        self.splitter = CompletionSplitter()

        if use_readline is not _deprecation_readline_sentinel:
            warnings.warn('The `use_readline` parameter is deprecated and ignored since IPython 6.0.',
                          DeprecationWarning, stacklevel=2)

        # _greedy_changed() depends on splitter and readline being defined:
        Completer.__init__(self, namespace=namespace, global_namespace=global_namespace,
                           config=config, **kwargs)

        # List where completion matches will be stored
        self.matches = []
        self.shell = shell
        # Regexp to split filenames with spaces in them
        self.space_name_re = re.compile(r'([^\\] )')
        # Hold a local ref. to glob.glob for speed
        self.glob = glob.glob

        # Determine if we are running on 'dumb' terminals, like (X)Emacs
        # buffers, to avoid completion problems.
        term = os.environ.get('TERM','xterm')
        self.dumb_terminal = term in ['dumb','emacs']

        # Special handling of backslashes needed in win32 platforms
        if sys.platform == "win32":
            self.clean_glob = self._clean_glob_win32
        else:
            self.clean_glob = self._clean_glob

        #regexp to parse docstring for function signature
        self.docstring_sig_re = re.compile(r'^[\w|\s.]+\(([^)]*)\).*')
        self.docstring_kwd_re = re.compile(r'[\s|\[]*(\w+)(?:\s*=\s*.*)')
        #use this if positional argument name is also needed
        #= re.compile(r'[\s|\[]*(\w+)(?:\s*=?\s*.*)')

        # Matchers that only apply to arguments of magic commands
        # (%config and %colors).
        self.magic_arg_matchers = [
            self.magic_config_matches,
            self.magic_color_matches,
        ]

        # This is set externally by InteractiveShell
        self.custom_completers = None
1112 1112
1113 1113 @property
1114 1114 def matchers(self):
1115 1115 """All active matcher routines for completion"""
1116 1116 if self.use_jedi:
1117 1117 return [
1118 1118 self.file_matches,
1119 1119 self.magic_matches,
1120 1120 self.dict_key_matches,
1121 1121 ]
1122 1122 else:
1123 1123 return [
1124 1124 self.python_matches,
1125 1125 self.file_matches,
1126 1126 self.magic_matches,
1127 1127 self.python_func_kw_matches,
1128 1128 self.dict_key_matches,
1129 1129 ]
1130 1130
1131 1131 def all_completions(self, text):
1132 1132 """
1133 1133 Wrapper around the complete method for the benefit of emacs.
1134 1134 """
1135 1135 return self.complete(text)[1]
1136 1136
1137 1137 def _clean_glob(self, text):
1138 1138 return self.glob("%s*" % text)
1139 1139
1140 1140 def _clean_glob_win32(self,text):
1141 1141 return [f.replace("\\","/")
1142 1142 for f in self.glob("%s*" % text)]
1143 1143
    def file_matches(self, text):
        """Match filenames, expanding ~USER type strings.

        Most of the seemingly convoluted logic in this completer is an
        attempt to handle filenames with spaces in them. And yet it's not
        quite perfect, because Python's readline doesn't expose all of the
        GNU readline details needed for this to be done correctly.

        For a filename with a space in it, the printed completions will be
        only the parts after what's already been typed (instead of the
        full completions, as is normally done). I don't think with the
        current (as of Python 2.3) Python readline it's possible to do
        better.

        Returns a list of candidate path strings, with directories marked
        by a trailing '/'."""

        # chars that require escaping with backslash - i.e. chars
        # that readline treats incorrectly as delimiters, but we
        # don't want to treat as delimiters in filename matching
        # when escaped with backslash
        if text.startswith('!'):
            text = text[1:]
            text_prefix = u'!'
        else:
            text_prefix = u''

        text_until_cursor = self.text_until_cursor
        # track strings with open quotes
        open_quotes = has_open_quotes(text_until_cursor)

        if '(' in text_until_cursor or '[' in text_until_cursor:
            # inside a call or subscript, complete only the current token
            lsplit = text
        else:
            try:
                # arg_split ~ shlex.split, but with unicode bugs fixed by us
                lsplit = arg_split(text_until_cursor)[-1]
            except ValueError:
                # typically an unmatched ", or backslash without escaped char.
                if open_quotes:
                    lsplit = text_until_cursor.split(open_quotes)[-1]
                else:
                    return []
            except IndexError:
                # tab pressed on empty line
                lsplit = ""

        if not open_quotes and lsplit != protect_filename(lsplit):
            # if protectables are found, do matching on the whole escaped name
            has_protectables = True
            text0,text = text,lsplit
        else:
            has_protectables = False
            text = os.path.expanduser(text)

        if text == "":
            # nothing typed yet: offer everything in the current directory
            return [text_prefix + protect_filename(f) for f in self.glob("*")]

        # Compute the matches from the filesystem
        if sys.platform == 'win32':
            m0 = self.clean_glob(text)
        else:
            # on POSIX, drop escaping backslashes before hitting the filesystem
            m0 = self.clean_glob(text.replace('\\', ''))

        if has_protectables:
            # If we had protectables, we need to revert our changes to the
            # beginning of filename so that we don't double-write the part
            # of the filename we have so far
            len_lsplit = len(lsplit)
            matches = [text_prefix + text0 +
                       protect_filename(f[len_lsplit:]) for f in m0]
        else:
            if open_quotes:
                # if we have a string with an open quote, we don't need to
                # protect the names beyond the quote (and we _shouldn't_, as
                # it would cause bugs when the filesystem call is made).
                matches = m0 if sys.platform == "win32" else\
                    [protect_filename(f, open_quotes) for f in m0]
            else:
                matches = [text_prefix +
                           protect_filename(f) for f in m0]

        # Mark directories in input list by appending '/' to their names.
        return [x+'/' if os.path.isdir(x) else x for x in matches]
1225 1225
    def magic_matches(self, text):
        """Match magics.

        Returns a list of matching magic names, prefixed with the magic
        escape character(s) (``%`` for line magics, ``%%`` for cell magics).
        """
        # Get all shell magics now rather than statically, so magics loaded at
        # runtime show up too.
        lsm = self.shell.magics_manager.lsmagic()
        line_magics = lsm['line']
        cell_magics = lsm['cell']
        pre = self.magic_escape
        pre2 = pre+pre

        explicit_magic = text.startswith(pre)

        # Completion logic:
        # - user gives %%: only do cell magics
        # - user gives %: do both line and cell magics
        # - no prefix: do both
        # In other words, line magics are skipped if the user gives %% explicitly
        #
        # We also exclude magics that match any currently visible names:
        # https://github.com/ipython/ipython/issues/4877, unless the user has
        # typed a %:
        # https://github.com/ipython/ipython/issues/10754
        # NOTE: str.lstrip(pre) strips *all* leading escape characters, so
        # both '%foo' and '%%foo' reduce to 'foo' here.
        bare_text = text.lstrip(pre)
        global_matches = self.global_matches(bare_text)
        if not explicit_magic:
            def matches(magic):
                """
                Filter magics, in particular remove magics that match
                a name present in global namespace.
                """
                return ( magic.startswith(bare_text) and
                         magic not in global_matches )
        else:
            def matches(magic):
                return magic.startswith(bare_text)

        comp = [ pre2+m for m in cell_magics if matches(m)]
        if not text.startswith(pre2):
            comp += [ pre+m for m in line_magics if matches(m)]

        return comp
1267 1267
1268 1268 def magic_config_matches(self, text:str) -> List[str]:
1269 1269 """ Match class names and attributes for %config magic """
1270 1270 texts = text.strip().split()
1271 1271
1272 1272 if len(texts) > 0 and (texts[0] == 'config' or texts[0] == '%config'):
1273 1273 # get all configuration classes
1274 1274 classes = sorted(set([ c for c in self.shell.configurables
1275 1275 if c.__class__.class_traits(config=True)
1276 1276 ]), key=lambda x: x.__class__.__name__)
1277 1277 classnames = [ c.__class__.__name__ for c in classes ]
1278 1278
1279 1279 # return all classnames if config or %config is given
1280 1280 if len(texts) == 1:
1281 1281 return classnames
1282 1282
1283 1283 # match classname
1284 1284 classname_texts = texts[1].split('.')
1285 1285 classname = classname_texts[0]
1286 1286 classname_matches = [ c for c in classnames
1287 1287 if c.startswith(classname) ]
1288 1288
1289 1289 # return matched classes or the matched class with attributes
1290 1290 if texts[1].find('.') < 0:
1291 1291 return classname_matches
1292 1292 elif len(classname_matches) == 1 and \
1293 1293 classname_matches[0] == classname:
1294 1294 cls = classes[classnames.index(classname)].__class__
1295 1295 help = cls.class_get_help()
1296 1296 # strip leading '--' from cl-args:
1297 1297 help = re.sub(re.compile(r'^--', re.MULTILINE), '', help)
1298 1298 return [ attr.split('=')[0]
1299 1299 for attr in help.strip().splitlines()
1300 1300 if attr.startswith(texts[1]) ]
1301 1301 return []
1302 1302
1303 1303 def magic_color_matches(self, text:str) -> List[str] :
1304 1304 """ Match color schemes for %colors magic"""
1305 1305 texts = text.split()
1306 1306 if text.endswith(' '):
1307 1307 # .split() strips off the trailing whitespace. Add '' back
1308 1308 # so that: '%colors ' -> ['%colors', '']
1309 1309 texts.append('')
1310 1310
1311 1311 if len(texts) == 2 and (texts[0] == 'colors' or texts[0] == '%colors'):
1312 1312 prefix = texts[1]
1313 1313 return [ color for color in InspectColors.keys()
1314 1314 if color.startswith(prefix) ]
1315 1315 return []
1316 1316
    def _jedi_matches(self, cursor_column:int, cursor_line:int, text:str):
        """

        Return a list of :any:`jedi.api.Completions` object from a ``text`` and
        cursor position.

        Parameters
        ----------
        cursor_column : int
            column position of the cursor in ``text``, 0-indexed.
        cursor_line : int
            line position of the cursor in ``text``, 0-indexed
        text : str
            text to complete

        Debugging
        ---------

        If ``IPCompleter.debug`` is ``True`` may return a :any:`_FakeJediCompletion`
        object containing a string with the Jedi debug information attached.
        """
        namespaces = [self.namespace]
        if self.global_namespace is not None:
            namespaces.append(self.global_namespace)

        completion_filter = lambda x:x
        offset = cursor_to_position(text, cursor_line, cursor_column)
        # filter output if we are completing for object members
        if offset:
            pre = text[offset-1]
            if pre == '.':
                if self.omit__names == 2:
                    # hide every name starting with '_'
                    completion_filter = lambda c:not c.name.startswith('_')
                elif self.omit__names == 1:
                    # hide only dunder names (``__foo__``)
                    completion_filter = lambda c:not (c.name.startswith('__') and c.name.endswith('__'))
                elif self.omit__names == 0:
                    completion_filter = lambda x:x
                else:
                    raise ValueError("Don't understand self.omit__names == {}".format(self.omit__names))

        # jedi's ``line`` argument is 1-based, hence the + 1
        interpreter = jedi.Interpreter(
            text[:offset], namespaces, column=cursor_column, line=cursor_line + 1)
        try_jedi = True

        try:
            # should we check the type of the node is Error ?
            try:
                # jedi < 0.11
                from jedi.parser.tree import ErrorLeaf
            except ImportError:
                # jedi >= 0.11
                from parso.tree import ErrorLeaf

            # NOTE(review): this peeks at jedi/parso private parse-tree API to
            # detect an unterminated string literal at the cursor.
            next_to_last_tree = interpreter._get_module().tree_node.children[-2]
            completing_string = False
            if isinstance(next_to_last_tree, ErrorLeaf):
                completing_string = next_to_last_tree.value.lstrip()[0] in {'"', "'"}
            # if we are in a string jedi is likely not the right candidate for
            # now. Skip it.
            try_jedi = not completing_string
        except Exception as e:
            # many of things can go wrong, we are using private API just don't crash.
            if self.debug:
                print("Error detecting if completing a non-finished string :", e, '|')

        if not try_jedi:
            return []
        try:
            return filter(completion_filter, interpreter.completions())
        except Exception as e:
            if self.debug:
                return [_FakeJediCompletion('Oops Jedi has crashed, please report a bug with the following:\n"""\n%s\ns"""' % (e))]
            else:
                return []
1391 1391
1392 1392 def python_matches(self, text):
1393 1393 """Match attributes or global python names"""
1394 1394 if "." in text:
1395 1395 try:
1396 1396 matches = self.attr_matches(text)
1397 1397 if text.endswith('.') and self.omit__names:
1398 1398 if self.omit__names == 1:
1399 1399 # true if txt is _not_ a __ name, false otherwise:
1400 1400 no__name = (lambda txt:
1401 1401 re.match(r'.*\.__.*?__',txt) is None)
1402 1402 else:
1403 1403 # true if txt is _not_ a _ name, false otherwise:
1404 1404 no__name = (lambda txt:
1405 1405 re.match(r'\._.*?',txt[txt.rindex('.'):]) is None)
1406 1406 matches = filter(no__name, matches)
1407 1407 except NameError:
1408 1408 # catches <undefined attributes>.<tab>
1409 1409 matches = []
1410 1410 else:
1411 1411 matches = self.global_matches(text)
1412 1412 return matches
1413 1413
1414 1414 def _default_arguments_from_docstring(self, doc):
1415 1415 """Parse the first line of docstring for call signature.
1416 1416
1417 1417 Docstring should be of the form 'min(iterable[, key=func])\n'.
1418 1418 It can also parse cython docstring of the form
1419 1419 'Minuit.migrad(self, int ncall=10000, resume=True, int nsplit=1)'.
1420 1420 """
1421 1421 if doc is None:
1422 1422 return []
1423 1423
1424 1424 #care only the firstline
1425 1425 line = doc.lstrip().splitlines()[0]
1426 1426
1427 1427 #p = re.compile(r'^[\w|\s.]+\(([^)]*)\).*')
1428 1428 #'min(iterable[, key=func])\n' -> 'iterable[, key=func]'
1429 1429 sig = self.docstring_sig_re.search(line)
1430 1430 if sig is None:
1431 1431 return []
1432 1432 # iterable[, key=func]' -> ['iterable[' ,' key=func]']
1433 1433 sig = sig.groups()[0].split(',')
1434 1434 ret = []
1435 1435 for s in sig:
1436 1436 #re.compile(r'[\s|\[]*(\w+)(?:\s*=\s*.*)')
1437 1437 ret += self.docstring_kwd_re.findall(s)
1438 1438 return ret
1439 1439
    def _default_arguments(self, obj):
        """Return the list of default arguments of obj if it is callable,
        or empty list otherwise.

        Argument names are collected both from docstring parsing (useful
        for builtins/cython where introspection fails) and from
        :func:`inspect.signature`, then deduplicated.
        """
        call_obj = obj
        ret = []
        if inspect.isbuiltin(obj):
            # builtins: skip the class/__call__ resolution below and fall
            # through to the docstring + signature attempts on obj itself
            pass
        elif not (inspect.isfunction(obj) or inspect.ismethod(obj)):
            if inspect.isclass(obj):
                #for cython embedsignature=True the constructor docstring
                #belongs to the object itself not __init__
                ret += self._default_arguments_from_docstring(
                         getattr(obj, '__doc__', ''))
                # for classes, check for __init__,__new__
                call_obj = (getattr(obj, '__init__', None) or
                       getattr(obj, '__new__', None))
            # for all others, check if they are __call__able
            elif hasattr(obj, '__call__'):
                call_obj = obj.__call__
        ret += self._default_arguments_from_docstring(
                 getattr(call_obj, '__doc__', ''))

        # only keyword-capable parameter kinds are completion candidates
        _keeps = (inspect.Parameter.KEYWORD_ONLY,
                  inspect.Parameter.POSITIONAL_OR_KEYWORD)

        try:
            sig = inspect.signature(call_obj)
            ret.extend(k for k, v in sig.parameters.items() if
                       v.kind in _keeps)
        except ValueError:
            # inspect.signature raises ValueError for objects with no
            # retrievable signature (many C builtins)
            pass

        return list(set(ret))
1473 1473
    def python_func_kw_matches(self,text):
        """Match named parameters (kwargs) of the last open function.

        Returns completions of the form ``'name='`` for the keyword
        arguments of the callable whose parenthesis is still open at the
        cursor, excluding keywords that have already been used.
        """

        if "." in text: # a parameter cannot be dotted
            return []
        try: regexp = self.__funcParamsRegex
        except AttributeError:
            # lazily build (and cache) the tokenizing regexp
            regexp = self.__funcParamsRegex = re.compile(r'''
                '.*?(?<!\\)' |    # single quoted strings or
                ".*?(?<!\\)" |    # double quoted strings or
                \w+          |    # identifier
                \S                # other characters
                ''', re.VERBOSE | re.DOTALL)
        # 1. find the nearest identifier that comes before an unclosed
        # parenthesis before the cursor
        # e.g. for "foo (1+bar(x), pa<cursor>,a=1)", the candidate is "foo"
        tokens = regexp.findall(self.text_until_cursor)
        iterTokens = reversed(tokens); openPar = 0

        for token in iterTokens:
            if token == ')':
                openPar -= 1
            elif token == '(':
                openPar += 1
                if openPar > 0:
                    # found the last unclosed parenthesis
                    break
        else:
            # for-else: no unclosed parenthesis was found at all
            return []
        # 2. Concatenate dotted names ("foo.bar" for "foo.bar(x, pa" )
        ids = []
        isId = re.compile(r'\w+$').match

        # walk backwards collecting 'name', '.', 'name', ... tokens
        while True:
            try:
                ids.append(next(iterTokens))
                if not isId(ids[-1]):
                    ids.pop(); break
                if not next(iterTokens) == '.':
                    break
            except StopIteration:
                break

        # Find all named arguments already assigned to, as to avoid suggesting
        # them again
        usedNamedArgs = set()
        par_level = -1
        for token, next_token in zip(tokens, tokens[1:]):
            if token == '(':
                par_level += 1
            elif token == ')':
                par_level -= 1

            if par_level != 0:
                continue

            if next_token != '=':
                continue

            usedNamedArgs.add(token)

        # lookup the candidate callable matches either using global_matches
        # or attr_matches for dotted names
        if len(ids) == 1:
            callableMatches = self.global_matches(ids[0])
        else:
            callableMatches = self.attr_matches('.'.join(ids[::-1]))
        argMatches = []
        for callableMatch in callableMatches:
            try:
                # NOTE: eval of a completion candidate in the user namespace;
                # this is how the interactive completer resolves objects.
                namedArgs = self._default_arguments(eval(callableMatch,
                                                         self.namespace))
            except:
                continue

            # Remove used named arguments from the list, no need to show twice
            for namedArg in set(namedArgs) - usedNamedArgs:
                if namedArg.startswith(text):
                    argMatches.append(u"%s=" %namedArg)
        return argMatches
1554 1554
1555 1555 def dict_key_matches(self, text):
1556 1556 "Match string keys in a dictionary, after e.g. 'foo[' "
1557 1557 def get_keys(obj):
1558 1558 # Objects can define their own completions by defining an
1559 1559 # _ipy_key_completions_() method.
1560 1560 method = get_real_method(obj, '_ipython_key_completions_')
1561 1561 if method is not None:
1562 1562 return method()
1563 1563
1564 1564 # Special case some common in-memory dict-like types
1565 1565 if isinstance(obj, dict) or\
1566 1566 _safe_isinstance(obj, 'pandas', 'DataFrame'):
1567 1567 try:
1568 1568 return list(obj.keys())
1569 1569 except Exception:
1570 1570 return []
1571 1571 elif _safe_isinstance(obj, 'numpy', 'ndarray') or\
1572 1572 _safe_isinstance(obj, 'numpy', 'void'):
1573 1573 return obj.dtype.names or []
1574 1574 return []
1575 1575
1576 1576 try:
1577 1577 regexps = self.__dict_key_regexps
1578 1578 except AttributeError:
1579 1579 dict_key_re_fmt = r'''(?x)
1580 1580 ( # match dict-referring expression wrt greedy setting
1581 1581 %s
1582 1582 )
1583 1583 \[ # open bracket
1584 1584 \s* # and optional whitespace
1585 1585 ([uUbB]? # string prefix (r not handled)
1586 1586 (?: # unclosed string
1587 1587 '(?:[^']|(?<!\\)\\')*
1588 1588 |
1589 1589 "(?:[^"]|(?<!\\)\\")*
1590 1590 )
1591 1591 )?
1592 1592 $
1593 1593 '''
1594 1594 regexps = self.__dict_key_regexps = {
1595 False: re.compile(dict_key_re_fmt % '''
1595 False: re.compile(dict_key_re_fmt % r'''
1596 1596 # identifiers separated by .
1597 1597 (?!\d)\w+
1598 1598 (?:\.(?!\d)\w+)*
1599 1599 '''),
1600 1600 True: re.compile(dict_key_re_fmt % '''
1601 1601 .+
1602 1602 ''')
1603 1603 }
1604 1604
1605 1605 match = regexps[self.greedy].search(self.text_until_cursor)
1606 1606 if match is None:
1607 1607 return []
1608 1608
1609 1609 expr, prefix = match.groups()
1610 1610 try:
1611 1611 obj = eval(expr, self.namespace)
1612 1612 except Exception:
1613 1613 try:
1614 1614 obj = eval(expr, self.global_namespace)
1615 1615 except Exception:
1616 1616 return []
1617 1617
1618 1618 keys = get_keys(obj)
1619 1619 if not keys:
1620 1620 return keys
1621 1621 closing_quote, token_offset, matches = match_dict_keys(keys, prefix, self.splitter.delims)
1622 1622 if not matches:
1623 1623 return matches
1624 1624
1625 1625 # get the cursor position of
1626 1626 # - the text being completed
1627 1627 # - the start of the key text
1628 1628 # - the start of the completion
1629 1629 text_start = len(self.text_until_cursor) - len(text)
1630 1630 if prefix:
1631 1631 key_start = match.start(2)
1632 1632 completion_start = key_start + token_offset
1633 1633 else:
1634 1634 key_start = completion_start = match.end()
1635 1635
1636 1636 # grab the leading prefix, to make sure all completions start with `text`
1637 1637 if text_start > key_start:
1638 1638 leading = ''
1639 1639 else:
1640 1640 leading = text[text_start:completion_start]
1641 1641
1642 1642 # the index of the `[` character
1643 1643 bracket_idx = match.end(1)
1644 1644
1645 1645 # append closing quote and bracket as appropriate
1646 1646 # this is *not* appropriate if the opening quote or bracket is outside
1647 1647 # the text given to this method
1648 1648 suf = ''
1649 1649 continuation = self.line_buffer[len(self.text_until_cursor):]
1650 1650 if key_start > text_start and closing_quote:
1651 1651 # quotes were opened inside text, maybe close them
1652 1652 if continuation.startswith(closing_quote):
1653 1653 continuation = continuation[len(closing_quote):]
1654 1654 else:
1655 1655 suf += closing_quote
1656 1656 if bracket_idx > text_start:
1657 1657 # brackets were opened inside text, maybe close them
1658 1658 if not continuation.startswith(']'):
1659 1659 suf += ']'
1660 1660
1661 1661 return [leading + k + suf for k in matches]
1662 1662
1663 1663 def unicode_name_matches(self, text):
1664 1664 u"""Match Latex-like syntax for unicode characters base
1665 1665 on the name of the character.
1666 1666
1667 1667 This does ``\\GREEK SMALL LETTER ETA`` -> ``Ξ·``
1668 1668
1669 1669 Works only on valid python 3 identifier, or on combining characters that
1670 1670 will combine to form a valid identifier.
1671 1671
1672 1672 Used on Python 3 only.
1673 1673 """
1674 1674 slashpos = text.rfind('\\')
1675 1675 if slashpos > -1:
1676 1676 s = text[slashpos+1:]
1677 1677 try :
1678 1678 unic = unicodedata.lookup(s)
1679 1679 # allow combining chars
1680 1680 if ('a'+unic).isidentifier():
1681 1681 return '\\'+s,[unic]
1682 1682 except KeyError:
1683 1683 pass
1684 1684 return u'', []
1685 1685
1686 1686
1687 1687 def latex_matches(self, text):
1688 1688 u"""Match Latex syntax for unicode characters.
1689 1689
1690 1690 This does both ``\\alp`` -> ``\\alpha`` and ``\\alpha`` -> ``Ξ±``
1691 1691
1692 1692 Used on Python 3 only.
1693 1693 """
1694 1694 slashpos = text.rfind('\\')
1695 1695 if slashpos > -1:
1696 1696 s = text[slashpos:]
1697 1697 if s in latex_symbols:
1698 1698 # Try to complete a full latex symbol to unicode
1699 1699 # \\alpha -> Ξ±
1700 1700 return s, [latex_symbols[s]]
1701 1701 else:
1702 1702 # If a user has partially typed a latex symbol, give them
1703 1703 # a full list of options \al -> [\aleph, \alpha]
1704 1704 matches = [k for k in latex_symbols if k.startswith(s)]
1705 1705 return s, matches
1706 1706 return u'', []
1707 1707
    def dispatch_custom_completer(self, text):
        """Dispatch completion to user-registered custom completers.

        Returns the first non-empty list of matches produced by a custom
        completer (case-sensitive matches preferred), or None when no
        custom completer handled ``text``.
        """
        if not self.custom_completers:
            return

        line = self.line_buffer
        if not line.strip():
            return None

        # Create a little structure to pass all the relevant information about
        # the current completion to any custom completer.
        event = SimpleNamespace()
        event.line = line
        event.symbol = text
        cmd = line.split(None,1)[0]
        event.command = cmd
        event.text_until_cursor = self.text_until_cursor

        # for foo etc, try also to find completer for %foo
        if not cmd.startswith(self.magic_escape):
            try_magic = self.custom_completers.s_matches(
                self.magic_escape + cmd)
        else:
            try_magic = []

        # try command-specific completers first, then magic-prefixed ones,
        # then the flat (pattern-based) completers
        for c in itertools.chain(self.custom_completers.s_matches(cmd),
                 try_magic,
                 self.custom_completers.flat_matches(self.text_until_cursor)):
            try:
                res = c(event)
                if res:
                    # first, try case sensitive match
                    withcase = [r for r in res if r.startswith(text)]
                    if withcase:
                        return withcase
                    # if none, then case insensitive ones are ok too
                    text_low = text.lower()
                    return [r for r in res if r.lower().startswith(text_low)]
            except TryNext:
                pass
            except KeyboardInterrupt:
                """
                If custom completer take too long,
                let keyboard interrupt abort and return nothing.
                """
                break

        return None
1755 1755
1756 1756 def completions(self, text: str, offset: int)->Iterator[Completion]:
1757 1757 """
1758 1758 Returns an iterator over the possible completions
1759 1759
1760 1760 .. warning:: Unstable
1761 1761
1762 1762 This function is unstable, API may change without warning.
1763 1763 It will also raise unless use in proper context manager.
1764 1764
1765 1765 Parameters
1766 1766 ----------
1767 1767
1768 1768 text:str
1769 1769 Full text of the current input, multi line string.
1770 1770 offset:int
1771 1771 Integer representing the position of the cursor in ``text``. Offset
1772 1772 is 0-based indexed.
1773 1773
1774 1774 Yields
1775 1775 ------
1776 1776 :any:`Completion` object
1777 1777
1778 1778
1779 1779 The cursor on a text can either be seen as being "in between"
1780 1780 characters or "On" a character depending on the interface visible to
1781 1781 the user. For consistency the cursor being on "in between" characters X
1782 1782 and Y is equivalent to the cursor being "on" character Y, that is to say
1783 1783 the character the cursor is on is considered as being after the cursor.
1784 1784
1785 1785 Combining characters may span more that one position in the
1786 1786 text.
1787 1787
1788 1788
1789 1789 .. note::
1790 1790
1791 1791 If ``IPCompleter.debug`` is :any:`True` will yield a ``--jedi/ipython--``
1792 1792 fake Completion token to distinguish completion returned by Jedi
1793 1793 and usual IPython completion.
1794 1794
1795 1795 .. note::
1796 1796
1797 1797 Completions are not completely deduplicated yet. If identical
1798 1798 completions are coming from different sources this function does not
1799 1799 ensure that each completion object will only be present once.
1800 1800 """
1801 1801 warnings.warn("_complete is a provisional API (as of IPython 6.0). "
1802 1802 "It may change without warnings. "
1803 1803 "Use in corresponding context manager.",
1804 1804 category=ProvisionalCompleterWarning, stacklevel=2)
1805 1805
1806 1806 seen = set()
1807 1807 try:
1808 1808 for c in self._completions(text, offset, _timeout=self.jedi_compute_type_timeout/1000):
1809 1809 if c and (c in seen):
1810 1810 continue
1811 1811 yield c
1812 1812 seen.add(c)
1813 1813 except KeyboardInterrupt:
1814 1814 """if completions take too long and users send keyboard interrupt,
1815 1815 do not crash and return ASAP. """
1816 1816 pass
1817 1817
    def _completions(self, full_text: str, offset: int, *, _timeout)->Iterator[Completion]:
        """
        Core completion module. Same signature as :any:`completions`, with the
        extra `timeout` parameter (in seconds).


        Computing jedi's completion ``.type`` can be quite expensive (it is a
        lazy property) and can require some warm-up, more warm up than just
        computing the ``name`` of a completion. The warm-up can be :

        - Long warm-up the first time a module is encountered after
        install/update: actually build parse/inference tree.

        - first time the module is encountered in a session: load tree from
        disk.

        We don't want to block completions for tens of seconds so we give the
        completer a "budget" of ``_timeout`` seconds per invocation to compute
        completions types, the completions that have not yet been computed will
        be marked as "unknown" and will have a chance to be computed next round
        as things get cached.

        Keep in mind that Jedi is not the only thing treating the completion so
        keep the timeout short-ish as if we take more than 0.3 second we still
        have lots of processing to do.

        """
        deadline = time.monotonic() + _timeout


        before = full_text[:offset]
        cursor_line, cursor_column = position_to_cursor(full_text, offset)

        matched_text, matches, matches_origin, jedi_matches = self._complete(
            full_text=full_text, cursor_line=cursor_line, cursor_pos=cursor_column)

        # Phase 1: yield jedi completions WITH their (expensive, lazy) .type,
        # until the time budget runs out.
        iter_jm = iter(jedi_matches)
        if _timeout:
            for jm in iter_jm:
                try:
                    type_ = jm.type
                except Exception:
                    if self.debug:
                        print("Error in Jedi getting type of ", jm)
                    type_ = None
                # start offset of the replacement: the completion text may
                # re-state characters already typed before the cursor.
                delta = len(jm.name_with_symbols) - len(jm.complete)
                if type_ == 'function':
                    signature = _make_signature(jm)
                else:
                    signature = ''
                yield Completion(start=offset - delta,
                                 end=offset,
                                 text=jm.name_with_symbols,
                                 type=type_,
                                 signature=signature,
                                 _origin='jedi')

                if time.monotonic() > deadline:
                    break

        # Phase 2: budget exhausted — flush the remaining jedi completions
        # without computing their type.
        for jm in iter_jm:
            delta = len(jm.name_with_symbols) - len(jm.complete)
            yield Completion(start=offset - delta,
                             end=offset,
                             text=jm.name_with_symbols,
                             type='<unknown>',  # don't compute type for speed
                             _origin='jedi',
                             signature='')


        start_offset = before.rfind(matched_text)

        # TODO:
        # Suppress this, right now just for debug.
        if jedi_matches and matches and self.debug:
            yield Completion(start=start_offset, end=offset, text='--jedi/ipython--',
                             _origin='debug', type='none', signature='')

        # I'm unsure if this is always true, so let's assert and see if it
        # crash
        assert before.endswith(matched_text)
        # Finally, the non-jedi (classic IPython) matches, tagged with the
        # matcher that produced each of them.
        for m, t in zip(matches, matches_origin):
            yield Completion(start=start_offset, end=offset, text=m, _origin=t, signature='', type='<unknown>')
1901 1901
1902 1902
1903 1903 def complete(self, text=None, line_buffer=None, cursor_pos=None):
1904 1904 """Find completions for the given text and line context.
1905 1905
1906 1906 Note that both the text and the line_buffer are optional, but at least
1907 1907 one of them must be given.
1908 1908
1909 1909 Parameters
1910 1910 ----------
1911 1911 text : string, optional
1912 1912 Text to perform the completion on. If not given, the line buffer
1913 1913 is split using the instance's CompletionSplitter object.
1914 1914
1915 1915 line_buffer : string, optional
1916 1916 If not given, the completer attempts to obtain the current line
1917 1917 buffer via readline. This keyword allows clients which are
1918 1918 requesting for text completions in non-readline contexts to inform
1919 1919 the completer of the entire text.
1920 1920
1921 1921 cursor_pos : int, optional
1922 1922 Index of the cursor in the full line buffer. Should be provided by
1923 1923 remote frontends where kernel has no access to frontend state.
1924 1924
1925 1925 Returns
1926 1926 -------
1927 1927 text : str
1928 1928 Text that was actually used in the completion.
1929 1929
1930 1930 matches : list
1931 1931 A list of completion matches.
1932 1932
1933 1933
1934 1934 .. note::
1935 1935
1936 1936 This API is likely to be deprecated and replaced by
1937 1937 :any:`IPCompleter.completions` in the future.
1938 1938
1939 1939
1940 1940 """
1941 1941 warnings.warn('`Completer.complete` is pending deprecation since '
1942 1942 'IPython 6.0 and will be replaced by `Completer.completions`.',
1943 1943 PendingDeprecationWarning)
1944 1944 # potential todo, FOLD the 3rd throw away argument of _complete
1945 1945 # into the first 2 one.
1946 1946 return self._complete(line_buffer=line_buffer, cursor_pos=cursor_pos, text=text, cursor_line=0)[:2]
1947 1947
    def _complete(self, *, cursor_line, cursor_pos, line_buffer=None, text=None,
                  full_text=None) -> Tuple[str, List[str], List[str], Iterable[_FakeJediCompletion]]:
        """

        Like complete but can also returns raw jedi completions as well as the
        origin of the completion text. This could (and should) be made much
        cleaner but that will be simpler once we drop the old (and stateful)
        :any:`complete` API.


        With current provisional API, cursor_pos act both (depending on the
        caller) as the offset in the ``text`` or ``line_buffer``, or as the
        ``column`` when passing multiline strings this could/should be renamed
        but would add extra noise.

        Returns
        -------
        A 4-tuple ``(matched_text, matches, matches_origin, jedi_matches)``.
        """

        # if the cursor position isn't given, the only sane assumption we can
        # make is that it's at the end of the line (the common case)
        if cursor_pos is None:
            cursor_pos = len(line_buffer) if text is None else len(text)

        if self.use_main_ns:
            self.namespace = __main__.__dict__

        # if text is either None or an empty string, rely on the line buffer
        if (not line_buffer) and full_text:
            line_buffer = full_text.split('\n')[cursor_line]
        if not text:
            text = self.splitter.split_line(line_buffer, cursor_pos)

        # Latex/unicode completions short-circuit everything else: they
        # return as soon as one of them matches.
        if self.backslash_combining_completions:
            # allow deactivation of these on windows.
            base_text = text if not line_buffer else line_buffer[:cursor_pos]
            latex_text, latex_matches = self.latex_matches(base_text)
            if latex_matches:
                return latex_text, latex_matches, ['latex_matches']*len(latex_matches), ()
            name_text = ''
            name_matches = []
            for meth in (self.unicode_name_matches, back_latex_name_matches, back_unicode_name_matches):
                name_text, name_matches = meth(base_text)
                if name_text:
                    return name_text, name_matches[:MATCHES_LIMIT], \
                           [meth.__qualname__]*min(len(name_matches), MATCHES_LIMIT), ()


        # If no line buffer is given, assume the input text is all there was
        if line_buffer is None:
            line_buffer = text

        self.line_buffer = line_buffer
        self.text_until_cursor = self.line_buffer[:cursor_pos]

        # Do magic arg matches
        for matcher in self.magic_arg_matchers:
            matches = list(matcher(line_buffer))[:MATCHES_LIMIT]
            if matches:
                origins = [matcher.__qualname__] * len(matches)
                return text, matches, origins, ()

        # Start with a clean slate of completions
        matches = []
        custom_res = self.dispatch_custom_completer(text)
        # FIXME: we should extend our api to return a dict with completions for
        # different types of objects. The rlcomplete() method could then
        # simply collapse the dict into a list for readline, but we'd have
        # richer completion semantics in other environments.
        completions = ()
        if self.use_jedi:
            if not full_text:
                full_text = line_buffer
            completions = self._jedi_matches(
                cursor_pos, cursor_line, full_text)
        if custom_res is not None:
            # did custom completers produce something?
            matches = [(m, 'custom') for m in custom_res]
        else:
            # Extend the list of completions with the results of each
            # matcher, so we return results to the user from all
            # namespaces.
            if self.merge_completions:
                matches = []
                for matcher in self.matchers:
                    try:
                        matches.extend([(m, matcher.__qualname__)
                                        for m in matcher(text)])
                    except:
                        # Show the ugly traceback if the matcher causes an
                        # exception, but do NOT crash the kernel!
                        sys.excepthook(*sys.exc_info())
            else:
                for matcher in self.matchers:
                    matches = [(m, matcher.__qualname__)
                               for m in matcher(text)]
                    if matches:
                        break
        # Deduplicate on the completion text, first occurrence wins, then
        # sort and cap the result list.
        seen = set()
        filtered_matches = set()
        for m in matches:
            t, c = m
            if t not in seen:
                filtered_matches.add(m)
                seen.add(t)

        _filtered_matches = sorted(
            set(filtered_matches), key=lambda x: completions_sorting_key(x[0]))\
            [:MATCHES_LIMIT]

        _matches = [m[0] for m in _filtered_matches]
        origins = [m[1] for m in _filtered_matches]

        self.matches = _matches

        return text, _matches, origins, completions
@@ -1,645 +1,645 b''
1 1 # -*- coding: utf-8 -*-
2 2 """
3 3 Pdb debugger class.
4 4
5 5 Modified from the standard pdb.Pdb class to avoid including readline, so that
6 6 the command line completion of other programs which include this isn't
7 7 damaged.
8 8
9 9 In the future, this class will be expanded with improvements over the standard
10 10 pdb.
11 11
12 12 The code in this file is mainly lifted out of cmd.py in Python 2.2, with minor
13 13 changes. Licensing should therefore be under the standard Python terms. For
14 14 details on the PSF (Python Software Foundation) standard license, see:
15 15
16 16 https://docs.python.org/2/license.html
17 17 """
18 18
19 19 #*****************************************************************************
20 20 #
21 21 # This file is licensed under the PSF license.
22 22 #
23 23 # Copyright (C) 2001 Python Software Foundation, www.python.org
24 24 # Copyright (C) 2005-2006 Fernando Perez. <fperez@colorado.edu>
25 25 #
26 26 #
27 27 #*****************************************************************************
28 28
29 29 import bdb
30 30 import functools
31 31 import inspect
32 32 import linecache
33 33 import sys
34 34 import warnings
35 35 import re
36 36
37 37 from IPython import get_ipython
38 38 from IPython.utils import PyColorize
39 39 from IPython.utils import coloransi, py3compat
40 40 from IPython.core.excolors import exception_colors
41 41 from IPython.testing.skipdoctest import skip_doctest
42 42
43 43
44 44 prompt = 'ipdb> '
45 45
46 46 #We have to check this directly from sys.argv, config struct not yet available
47 47 from pdb import Pdb as OldPdb
48 48
49 49 # Allow the set_trace code to operate outside of an ipython instance, even if
50 50 # it does so with some limitations. The rest of this support is implemented in
51 51 # the Tracer constructor.
52 52
def make_arrow(pad):
    """generate the leading arrow in front of traceback or debugger"""
    if pad >= 2:
        # Fill the width with dashes, reserving two columns for '> '.
        return '{}> '.format('-' * (pad - 2))
    if pad == 1:
        return '>'
    return ''
60 60
61 61
def BdbQuit_excepthook(et, ev, tb, excepthook=None):
    """Exception hook which handles `BdbQuit` exceptions.

    All other exceptions are processed using the `excepthook`
    parameter.
    """
    warnings.warn("`BdbQuit_excepthook` is deprecated since version 5.1",
                  DeprecationWarning, stacklevel=2)
    # Guard-clause form: BdbQuit just announces the debugger exit.
    if et == bdb.BdbQuit:
        print('Exiting Debugger.')
        return
    if excepthook is not None:
        excepthook(et, ev, tb)
        return
    # Backwards compatibility. Raise deprecation warning?
    BdbQuit_excepthook.excepthook_ori(et, ev, tb)
77 77
78 78
def BdbQuit_IPython_excepthook(self, et, ev, tb, tb_offset=None):
    """Deprecated IPython custom-exception handler for `BdbQuit`."""
    warnings.warn(
        "`BdbQuit_IPython_excepthook` is deprecated since version 5.1",
        DeprecationWarning, stacklevel=2)
    print('Exiting Debugger.')
84 84
85 85
class Tracer(object):
    """
    DEPRECATED

    Class for local debugging, similar to pdb.set_trace.

    Instances of this class, when called, behave like pdb.set_trace, but
    providing IPython's enhanced capabilities.

    This is implemented as a class which must be initialized in your own code
    and not as a standalone function because we need to detect at runtime
    whether IPython is already active or not. That detection is done in the
    constructor, ensuring that this code plays nicely with a running IPython,
    while functioning acceptably (though with limitations) if outside of it.
    """

    @skip_doctest
    def __init__(self, colors=None):
        """
        DEPRECATED

        Create a local debugger instance.

        Parameters
        ----------

        colors : str, optional
            The name of the color scheme to use, it must be one of IPython's
            valid color schemes. If not given, the function will default to
            the current IPython scheme when running inside IPython, and to
            'NoColor' otherwise.

        Examples
        --------
        ::

            from IPython.core.debugger import Tracer; debug_here = Tracer()

        Later in your code::

            debug_here() # -> will open up the debugger at that point.

        Once the debugger activates, you can use all of its regular commands to
        step through code, set breakpoints, etc.  See the pdb documentation
        from the Python standard library for usage details.
        """
        warnings.warn("`Tracer` is deprecated since version 5.1, directly use "
                      "`IPython.core.debugger.Pdb.set_trace()`",
                      DeprecationWarning, stacklevel=2)

        ip = get_ipython()
        if ip is None:
            # Outside of ipython, we set our own exception hook manually
            sys.excepthook = functools.partial(BdbQuit_excepthook,
                                               excepthook=sys.excepthook)
            def_colors = 'NoColor'
        else:
            # In ipython, we use its custom exception handler mechanism
            def_colors = ip.colors
            ip.set_custom_exc((bdb.BdbQuit,), BdbQuit_IPython_excepthook)

        if colors is None:
            colors = def_colors

        # The stdlib debugger internally uses a modified repr from the `repr`
        # module, that limits the length of printed strings to a hardcoded
        # limit of 30 characters. That much trimming is too aggressive, let's
        # at least raise that limit to 80 chars, which should be enough for
        # most interactive uses.
        try:
            try:
                from reprlib import aRepr  # Py 3
            except ImportError:
                from repr import aRepr  # Py 2
            aRepr.maxstring = 80
        except:
            # This is only a user-facing convenience, so any error we encounter
            # here can be warned about but can be otherwise ignored.  These
            # printouts will tell us about problems if this API changes
            import traceback
            traceback.print_exc()

        # The actual debugger the instance delegates to when called.
        self.debugger = Pdb(colors)

    def __call__(self):
        """Starts an interactive debugger at the point where called.

        This is similar to the pdb.set_trace() function from the std lib, but
        using IPython's enhanced debugger."""

        # f_back: start debugging in the caller's frame, not in __call__.
        self.debugger.set_trace(sys._getframe().f_back)
177 177
178 178
# Whitespace that immediately follows a newline; raw string so `\n`/`\s`
# are regex escapes, not Python string escapes.
RGX_EXTRA_INDENT = re.compile(r'(?<=\n)\s+')


def strip_indentation(multiline_string):
    """Return *multiline_string* with all post-newline indentation removed."""
    return RGX_EXTRA_INDENT.sub('', multiline_string)
184 184
185 185
def decorate_fn_with_doc(new_fn, old_fn, additional_text=""):
    """Make new_fn have old_fn's doc string. This is particularly useful
    for the ``do_...`` commands that hook into the help system.
    Adapted from from a comp.lang.python posting
    by Duncan Booth."""
    def wrapper(*args, **kw):
        return new_fn(*args, **kw)
    doc = old_fn.__doc__
    if doc:
        # De-indent the borrowed docstring before appending the extra text.
        wrapper.__doc__ = strip_indentation(doc) + additional_text
    return wrapper
196 196
197 197
198 198 def _file_lines(fname):
199 199 """Return the contents of a named file as a list of lines.
200 200
201 201 This function never raises an IOError exception: if the file can't be
202 202 read, it simply returns an empty list."""
203 203
204 204 try:
205 205 outfile = open(fname)
206 206 except IOError:
207 207 return []
208 208 else:
209 209 out = outfile.readlines()
210 210 outfile.close()
211 211 return out
212 212
213 213
214 214 class Pdb(OldPdb):
215 215 """Modified Pdb class, does not load readline.
216 216
217 217 for a standalone version that uses prompt_toolkit, see
218 218 `IPython.terminal.debugger.TerminalPdb` and
219 219 `IPython.terminal.debugger.set_trace()`
220 220 """
221 221
    def __init__(self, color_scheme=None, completekey=None,
                 stdin=None, stdout=None, context=5):
        """Create an IPython-flavoured Pdb.

        Parameters
        ----------
        color_scheme : str, optional
            Deprecated; the shell's current color scheme is used instead.
        completekey, stdin, stdout
            Passed straight through to the stdlib ``pdb.Pdb`` constructor.
        context : int, optional
            Number of source lines to show around the current line; must
            coerce to a positive integer.
        """

        # Parent constructor:
        try:
            self.context = int(context)
            if self.context <= 0:
                raise ValueError("Context must be a positive integer")
        except (TypeError, ValueError):
            # Normalize any bad `context` (non-numeric, <= 0) to one error.
            raise ValueError("Context must be a positive integer")

        OldPdb.__init__(self, completekey, stdin, stdout)

        # IPython changes...
        self.shell = get_ipython()

        if self.shell is None:
            save_main = sys.modules['__main__']
            # No IPython instance running, we must create one
            from IPython.terminal.interactiveshell import \
                TerminalInteractiveShell
            self.shell = TerminalInteractiveShell.instance()
            # needed by any code which calls __import__("__main__") after
            # the debugger was entered. See also #9941.
            sys.modules['__main__'] = save_main

        if color_scheme is not None:
            warnings.warn(
                "The `color_scheme` argument is deprecated since version 5.1",
                DeprecationWarning, stacklevel=2)
        else:
            color_scheme = self.shell.colors

        self.aliases = {}

        # Create color table: we copy the default one from the traceback
        # module and add a few attributes needed for debugging
        self.color_scheme_table = exception_colors()

        # shorthands
        C = coloransi.TermColors
        cst = self.color_scheme_table

        cst['NoColor'].colors.prompt = C.NoColor
        cst['NoColor'].colors.breakpoint_enabled = C.NoColor
        cst['NoColor'].colors.breakpoint_disabled = C.NoColor

        cst['Linux'].colors.prompt = C.Green
        cst['Linux'].colors.breakpoint_enabled = C.LightRed
        cst['Linux'].colors.breakpoint_disabled = C.Red

        cst['LightBG'].colors.prompt = C.Blue
        cst['LightBG'].colors.breakpoint_enabled = C.LightRed
        cst['LightBG'].colors.breakpoint_disabled = C.Red

        cst['Neutral'].colors.prompt = C.Blue
        cst['Neutral'].colors.breakpoint_enabled = C.LightRed
        cst['Neutral'].colors.breakpoint_disabled = C.Red


        # Add a python parser so we can syntax highlight source while
        # debugging.
        self.parser = PyColorize.Parser(style=color_scheme)
        self.set_colors(color_scheme)

        # Set the prompt - the default prompt is '(Pdb)'
        self.prompt = prompt
289 289
    def set_colors(self, scheme):
        """Shorthand access to the color table scheme selector method."""
        self.color_scheme_table.set_active_scheme(scheme)
        self.parser.style = scheme

    def interaction(self, frame, traceback):
        # Wrap the stdlib interaction loop so Ctrl-C prints the exception
        # summary instead of propagating out of the debugger.
        try:
            OldPdb.interaction(self, frame, traceback)
        except KeyboardInterrupt:
            sys.stdout.write('\n' + self.shell.get_exception_only())

    def new_do_up(self, arg):
        # Delegate to stdlib `up`; the docstring is copied onto the alias
        # below via decorate_fn_with_doc so `help u` still works.
        OldPdb.do_up(self, arg)
    do_u = do_up = decorate_fn_with_doc(new_do_up, OldPdb.do_up)

    def new_do_down(self, arg):
        # Delegate to stdlib `down` (see note on new_do_up).
        OldPdb.do_down(self, arg)

    do_d = do_down = decorate_fn_with_doc(new_do_down, OldPdb.do_down)

    def new_do_frame(self, arg):
        # Delegate to stdlib `frame`.
        OldPdb.do_frame(self, arg)

    def new_do_quit(self, arg):

        # Restore the completer state saved before entering the debugger,
        # if any, so quitting does not leave the shell's completions broken.
        if hasattr(self, 'old_all_completions'):
            self.shell.Completer.all_completions=self.old_all_completions

        return OldPdb.do_quit(self, arg)

    do_q = do_quit = decorate_fn_with_doc(new_do_quit, OldPdb.do_quit)

    def new_do_restart(self, arg):
        """Restart command. In the context of ipython this is exactly the same
        thing as 'quit'."""
        self.msg("Restart doesn't make sense here. Using 'quit' instead.")
        return self.do_quit(arg)

    def print_stack_trace(self, context=None):
        # Print every frame of the current stack, `context` lines each.
        if context is None:
            context = self.context
        try:
            context=int(context)
            if context <= 0:
                raise ValueError("Context must be a positive integer")
        except (TypeError, ValueError):
            raise ValueError("Context must be a positive integer")
        try:
            for frame_lineno in self.stack:
                self.print_stack_entry(frame_lineno, context=context)
        except KeyboardInterrupt:
            pass

    def print_stack_entry(self,frame_lineno, prompt_prefix='\n-> ',
                          context=None):
        if context is None:
            context = self.context
        try:
            context=int(context)
            if context <= 0:
                raise ValueError("Context must be a positive integer")
        except (TypeError, ValueError):
            raise ValueError("Context must be a positive integer")
        print(self.format_stack_entry(frame_lineno, '', context))

        # vds: >>
        # Let an attached editor (if any) follow the debugger's position.
        frame, lineno = frame_lineno
        filename = frame.f_code.co_filename
        self.shell.hooks.synchronize_with_editor(filename, lineno, 0)
        # vds: <<
360 360
    def format_stack_entry(self, frame_lineno, lprefix=': ', context=None):
        """Return a colorized, multi-line description of one stack entry.

        ``frame_lineno`` is a ``(frame, lineno)`` pair; ``context`` is the
        number of source lines to include around ``lineno``.
        """
        if context is None:
            context = self.context
        try:
            context=int(context)
            if context <= 0:
                print("Context must be a positive integer")
        except (TypeError, ValueError):
            # NOTE(review): unlike print_stack_trace/print_stack_entry this
            # only *prints* and keeps going, so a non-numeric `context` will
            # fail later at `context//2` — confirm whether this should raise.
            print("Context must be a positive integer")
        try:
            import reprlib  # Py 3
        except ImportError:
            import repr as reprlib  # Py 2

        ret = []

        Colors = self.color_scheme_table.active_colors
        ColorsNormal = Colors.Normal
        tpl_link = u'%s%%s%s' % (Colors.filenameEm, ColorsNormal)
        tpl_call = u'%s%%s%s%%s%s' % (Colors.vName, Colors.valEm, ColorsNormal)
        tpl_line = u'%%s%s%%s %s%%s' % (Colors.lineno, ColorsNormal)
        tpl_line_em = u'%%s%s%%s %s%%s%s' % (Colors.linenoEm, Colors.line,
                                             ColorsNormal)

        frame, lineno = frame_lineno

        return_value = ''
        if '__return__' in frame.f_locals:
            rv = frame.f_locals['__return__']
            #return_value += '->'
            return_value += reprlib.repr(rv) + '\n'
        ret.append(return_value)

        #s = filename + '(' + `lineno` + ')'
        filename = self.canonic(frame.f_code.co_filename)
        link = tpl_link % py3compat.cast_unicode(filename)

        if frame.f_code.co_name:
            func = frame.f_code.co_name
        else:
            func = "<lambda>"

        call = ''
        if func != '?':
            if '__args__' in frame.f_locals:
                args = reprlib.repr(frame.f_locals['__args__'])
            else:
                args = '()'
            call = tpl_call % (func, args)

        # The level info should be generated in the same format pdb uses, to
        # avoid breaking the pdbtrack functionality of python-mode in *emacs.
        if frame is self.curframe:
            ret.append('> ')
        else:
            ret.append('  ')
        ret.append(u'%s(%s)%s\n' % (link,lineno,call))

        # Window of `context` lines centered (roughly) on `lineno`, clamped
        # to the file boundaries.
        start = lineno - 1 - context//2
        lines = linecache.getlines(filename)
        start = min(start, len(lines) - context)
        start = max(start, 0)
        lines = lines[start : start + context]

        for i,line in enumerate(lines):
            show_arrow = (start + 1 + i == lineno)
            linetpl = (frame is self.curframe or show_arrow) \
                      and tpl_line_em \
                      or tpl_line
            ret.append(self.__format_line(linetpl, filename,
                                          start + 1 + i, line,
                                          arrow = show_arrow) )
        return ''.join(ret)

    def __format_line(self, tpl_line, filename, lineno, line, arrow = False):
        """Render one source line: syntax highlighting, breakpoint marker,
        right-aligned line number, and (optionally) the leading arrow."""
        bp_mark = ""
        bp_mark_color = ""

        new_line, err = self.parser.format2(line, 'str')
        if not err:
            line = new_line

        bp = None
        if lineno in self.get_file_breaks(filename):
            bps = self.get_breaks(filename, lineno)
            bp = bps[-1]

        if bp:
            Colors = self.color_scheme_table.active_colors
            bp_mark = str(bp.number)
            bp_mark_color = Colors.breakpoint_enabled
            if not bp.enabled:
                bp_mark_color = Colors.breakpoint_disabled

        numbers_width = 7
        if arrow:
            # This is the line with the error
            pad = numbers_width - len(str(lineno)) - len(bp_mark)
            num = '%s%s' % (make_arrow(pad), str(lineno))
        else:
            num = '%*s' % (numbers_width - len(bp_mark), str(lineno))

        return tpl_line % (bp_mark_color + bp_mark, num, line)
464 464
465 465
    def print_list_lines(self, filename, first, last):
        """The printing (as opposed to the parsing part of a 'list'
        command."""
        try:
            Colors = self.color_scheme_table.active_colors
            ColorsNormal = Colors.Normal
            tpl_line = '%%s%s%%s %s%%s' % (Colors.lineno, ColorsNormal)
            tpl_line_em = '%%s%s%%s %s%%s%s' % (Colors.linenoEm, Colors.line, ColorsNormal)
            src = []
            if filename == "<string>" and hasattr(self, "_exec_filename"):
                filename = self._exec_filename

            for lineno in range(first, last+1):
                line = linecache.getline(filename, lineno)
                if not line:
                    break

                if lineno == self.curframe.f_lineno:
                    # Current line gets the emphasized template + arrow.
                    line = self.__format_line(tpl_line_em, filename, lineno, line, arrow = True)
                else:
                    line = self.__format_line(tpl_line, filename, lineno, line, arrow = False)

                src.append(line)
                # Remember where listing stopped so a bare `list` continues.
                self.lineno = lineno

            print(''.join(src))

        except KeyboardInterrupt:
            pass

    def do_list(self, arg):
        """Print lines of code from the current stack frame
        """
        self.lastcmd = 'list'
        last = None
        if arg:
            try:
                # `arg` may be "first,last" (tuple) or a single line number.
                x = eval(arg, {}, {})
                if type(x) == type(()):
                    first, last = x
                    first = int(first)
                    last = int(last)
                    if last < first:
                        # Assume it's a count
                        last = first + last
                else:
                    first = max(1, int(x) - 5)
            except:
                # NOTE(review): bare except — any bad argument (including a
                # typo that raises NameError in eval) is reported the same way.
                print('*** Error in argument:', repr(arg))
                return
        elif self.lineno is None:
            first = max(1, self.curframe.f_lineno - 5)
        else:
            # Continue listing from where the previous `list` stopped.
            first = self.lineno + 1
        if last is None:
            last = first + 10
        self.print_list_lines(self.curframe.f_code.co_filename, first, last)

        # vds: >>
        # Keep an attached editor in sync with the listed region.
        lineno = first
        filename = self.curframe.f_code.co_filename
        self.shell.hooks.synchronize_with_editor(filename, lineno, 0)
        # vds: <<

    do_l = do_list

    def getsourcelines(self, obj):
        """Return (lines, first_lineno) of the source block for *obj*."""
        lines, lineno = inspect.findsource(obj)
        if inspect.isframe(obj) and obj.f_globals is obj.f_locals:
            # must be a module frame: do not try to cut a block out of it
            return lines, 1
        elif inspect.ismodule(obj):
            return lines, 1
        return inspect.getblock(lines[lineno:]), lineno+1

    def do_longlist(self, arg):
        """Print lines of code from the current stack frame.

        Shows more lines than 'list' does.
        """
        self.lastcmd = 'longlist'
        try:
            lines, lineno = self.getsourcelines(self.curframe)
        except OSError as err:
            self.error(err)
            return
        last = lineno + len(lines)
        self.print_list_lines(self.curframe.f_code.co_filename, lineno, last)
    do_ll = do_longlist
555 555
    def do_debug(self, arg):
        """debug code
        Enter a recursive debugger that steps through the code
        argument (which is an arbitrary expression or statement to be
        executed in the current environment).
        """
        # Suspend tracing while the nested debugger is constructed, then
        # run `arg` under a fresh debugger of the same class.
        sys.settrace(None)
        globals = self.curframe.f_globals
        locals = self.curframe_locals
        p = self.__class__(completekey=self.completekey,
                           stdin=self.stdin, stdout=self.stdout)
        p.use_rawinput = self.use_rawinput
        p.prompt = "(%s) " % self.prompt.strip()
        self.message("ENTERING RECURSIVE DEBUGGER")
        sys.call_tracing(p.run, (arg, globals, locals))
        self.message("LEAVING RECURSIVE DEBUGGER")
        # Restore this debugger's tracing once the nested one returns.
        sys.settrace(self.trace_dispatch)
        self.lastcmd = p.lastcmd

    def do_pdef(self, arg):
        """Print the call signature for any callable object.

        The debugger interface to %pdef"""
        namespaces = [('Locals', self.curframe.f_locals),
                      ('Globals', self.curframe.f_globals)]
        self.shell.find_line_magic('pdef')(arg, namespaces=namespaces)

    def do_pdoc(self, arg):
        """Print the docstring for an object.

        The debugger interface to %pdoc."""
        namespaces = [('Locals', self.curframe.f_locals),
                      ('Globals', self.curframe.f_globals)]
        self.shell.find_line_magic('pdoc')(arg, namespaces=namespaces)

    def do_pfile(self, arg):
        """Print (or run through pager) the file where an object is defined.

        The debugger interface to %pfile.
        """
        namespaces = [('Locals', self.curframe.f_locals),
                      ('Globals', self.curframe.f_globals)]
        self.shell.find_line_magic('pfile')(arg, namespaces=namespaces)

    def do_pinfo(self, arg):
        """Provide detailed information about an object.

        The debugger interface to %pinfo, i.e., obj?."""
        namespaces = [('Locals', self.curframe.f_locals),
                      ('Globals', self.curframe.f_globals)]
        self.shell.find_line_magic('pinfo')(arg, namespaces=namespaces)

    def do_pinfo2(self, arg):
        """Provide extra detailed information about an object.

        The debugger interface to %pinfo2, i.e., obj??."""
        namespaces = [('Locals', self.curframe.f_locals),
                      ('Globals', self.curframe.f_globals)]
        self.shell.find_line_magic('pinfo2')(arg, namespaces=namespaces)

    def do_psource(self, arg):
        """Print (or run through pager) the source code for an object."""
        namespaces = [('Locals', self.curframe.f_locals),
                      ('Globals', self.curframe.f_globals)]
        self.shell.find_line_magic('psource')(arg, namespaces=namespaces)

    def do_where(self, arg):
        """w(here)
        Print a stack trace, with the most recent frame at the bottom.
        An arrow indicates the "current frame", which determines the
        context of most commands. 'bt' is an alias for this command.

        Take a number as argument as an (optional) number of context line to
        print"""
        # NOTE(review): int(arg) will raise ValueError on a non-numeric
        # argument — confirm whether that should be reported like do_list.
        if arg:
            context = int(arg)
            self.print_stack_trace(context)
        else:
            self.print_stack_trace()

    do_w = do_where
637 637
638 638
def set_trace(frame=None):
    """
    Start debugging from `frame`.

    If frame is not specified, debugging starts from caller's frame.
    """
    # Default to the caller's frame, one level above this helper.
    target = frame if frame is not None else sys._getframe().f_back
    Pdb().set_trace(target)
@@ -1,766 +1,766 b''
1 1 """Input handling and transformation machinery.
2 2
3 3 The first class in this module, :class:`InputSplitter`, is designed to tell when
4 4 input from a line-oriented frontend is complete and should be executed, and when
5 5 the user should be prompted for another line of code instead. The name 'input
6 6 splitter' is largely for historical reasons.
7 7
8 8 A companion, :class:`IPythonInputSplitter`, provides the same functionality but
9 9 with full support for the extended IPython syntax (magics, system calls, etc).
10 10 The code to actually do these transformations is in :mod:`IPython.core.inputtransformer`.
11 11 :class:`IPythonInputSplitter` feeds the raw code to the transformers in order
12 12 and stores the results.
13 13
14 14 For more details, see the class docstrings below.
15 15 """
16 16
17 17 # Copyright (c) IPython Development Team.
18 18 # Distributed under the terms of the Modified BSD License.
19 19 import ast
20 20 import codeop
21 21 import io
22 22 import re
23 23 import sys
24 24 import tokenize
25 25 import warnings
26 26
27 27 from IPython.utils.py3compat import cast_unicode
28 28 from IPython.core.inputtransformer import (leading_indent,
29 29 classic_prompt,
30 30 ipy_prompt,
31 31 cellmagic,
32 32 assemble_logical_lines,
33 33 help_end,
34 34 escaped_commands,
35 35 assign_from_magic,
36 36 assign_from_system,
37 37 assemble_python_lines,
38 38 )
39 39
40 40 # These are available in this module for backwards compatibility.
41 41 from IPython.core.inputtransformer import (ESC_SHELL, ESC_SH_CAP, ESC_HELP,
42 42 ESC_HELP2, ESC_MAGIC, ESC_MAGIC2,
43 43 ESC_QUOTE, ESC_QUOTE2, ESC_PAREN, ESC_SEQUENCES)
44 44
45 45 #-----------------------------------------------------------------------------
46 46 # Utilities
47 47 #-----------------------------------------------------------------------------
48 48
49 49 # FIXME: These are general-purpose utilities that later can be moved to the
50 50 # general ward. Kept here for now because we're being very strict about test
51 51 # coverage with this code, and this lets us ensure that we keep 100% coverage
52 52 # while developing.
53 53
# compiled regexps for autoindent management
# Matches a line whose statement (raise/return/pass/break/continue) normally
# ends a block, so the autoindenter should dedent the next line.
dedent_re = re.compile('|'.join([
    r'^\s+raise(\s.*)?$', # raise statement (+ space + other stuff, maybe)
    r'^\s+raise\([^\)]*\).*$', # wacky raise with immediate open paren
    r'^\s+return(\s.*)?$', # normal return (+ space + other stuff, maybe)
    r'^\s+return\([^\)]*\).*$', # wacky return with immediate open paren
    r'^\s+pass\s*$', # pass (optionally followed by trailing spaces)
    r'^\s+break\s*$', # break (optionally followed by trailing spaces)
    r'^\s+continue\s*$', # continue (optionally followed by trailing spaces)
    ]))
# Leading whitespace on a line; newline is deliberately excluded.
ini_spaces_re = re.compile(r'^([ \t\r\f\v]+)')
65 65
# regexp to match pure comment lines so we don't accidentally insert 'if 1:'
# before pure comments
# Raw string avoids the invalid escape sequence '\#' that is deprecated in
# ordinary string literals (DeprecationWarning, future SyntaxError).
comment_line_re = re.compile(r'^\s*\#')
69 69
70 70
def num_ini_spaces(s):
    """Return the number of initial spaces in a string.

    Note that tabs are counted as a single space. For now, we do *not* support
    mixing of tabs and spaces in the user's input.

    Parameters
    ----------
    s : string

    Returns
    -------
    n : int
    """
    # Scan leading characters directly; the accepted set mirrors the
    # module-level pattern [ \t\r\f\v] (newline intentionally excluded).
    n = 0
    for ch in s:
        if ch not in ' \t\r\f\v':
            break
        n += 1
    return n
91 91
# Fake token types for partial_tokenize:
# These extend tokenize's own numbering (N_TOKENS upward) so they can never
# collide with a real token type.
INCOMPLETE_STRING = tokenize.N_TOKENS
IN_MULTILINE_STATEMENT = tokenize.N_TOKENS + 1
95 95
96 96 # The 2 classes below have the same API as TokenInfo, but don't try to look up
97 97 # a token type name that they won't find.
class IncompleteString:
    """Stand-in token for a string literal left unterminated at end of input."""
    type = exact_type = INCOMPLETE_STRING

    def __init__(self, s, start, end, line):
        # Mirror the TokenInfo attribute names so callers can treat this
        # like an ordinary token.
        self.s, self.start, self.end, self.line = s, start, end, line
105 105
class InMultilineStatement:
    """Stand-in token marking input that ends inside a multiline statement."""
    type = exact_type = IN_MULTILINE_STATEMENT

    def __init__(self, pos, line):
        # There is no token text; start and end both point at the cut-off.
        self.s = ''
        self.start = self.end = pos
        self.line = line
112 112
def partial_tokens(s):
    """Iterate over tokens from a possibly-incomplete string of code.

    This adds two special token types: INCOMPLETE_STRING and
    IN_MULTILINE_STATEMENT. These can only occur as the last token yielded, and
    represent the two main ways for code to be incomplete.
    """
    readline = io.StringIO(s).readline
    # Seed with a dummy token so token.end is valid even if the generator
    # raises before yielding anything.
    token = tokenize.TokenInfo(tokenize.NEWLINE, '', (1, 0), (1, 0), '')
    try:
        for token in tokenize.generate_tokens(readline):
            yield token
    except tokenize.TokenError as e:
        # catch EOF error
        # tokenize gives no structured error info, so we classify the failure
        # by sniffing the message text in e.args[0].
        lines = s.splitlines(keepends=True)
        end = len(lines), len(lines[-1])
        if 'multi-line string' in e.args[0]:
            # Unterminated string: synthesize a token covering everything
            # from where the last real token ended to the end of the input.
            l, c = start = token.end
            s = lines[l-1][c:] + ''.join(lines[l:])
            yield IncompleteString(s, start, end, lines[-1])
        elif 'multi-line statement' in e.args[0]:
            # Open bracket/paren/brace: mark where the statement was cut off.
            yield InMultilineStatement(end, lines[-1])
        else:
            raise
137 137
def find_next_indent(code):
    """Find the number of spaces for the next line of indentation

    Parameters
    ----------
    code : str
        A (possibly incomplete) block of Python source.

    Returns
    -------
    int
        The number of spaces the next line should be indented by.
    """
    tokens = list(partial_tokens(code))
    if tokens[-1].type == tokenize.ENDMARKER:
        tokens.pop()
    if not tokens:
        return 0
    # Strip trailing trivia so tokens[-1] is the last meaningful token.
    while (tokens[-1].type in {tokenize.DEDENT, tokenize.NEWLINE, tokenize.COMMENT}):
        tokens.pop()

    if tokens[-1].type == INCOMPLETE_STRING:
        # Inside a multiline string
        return 0

    # Find the indents used before
    prev_indents = [0]
    def _add_indent(n):
        # Record only changes of indentation level.
        if n != prev_indents[-1]:
            prev_indents.append(n)

    tokiter = iter(tokens)
    for tok in tokiter:
        if tok.type in {tokenize.INDENT, tokenize.DEDENT}:
            _add_indent(tok.end[1])
        elif (tok.type == tokenize.NL):
            try:
                _add_indent(next(tokiter).start[1])
            except StopIteration:
                break

    last_indent = prev_indents.pop()

    # If we've just opened a multiline statement (e.g. 'a = ['), indent more
    if tokens[-1].type == IN_MULTILINE_STATEMENT:
        # tokens[-2] is the last real token before the synthetic marker.
        if tokens[-2].exact_type in {tokenize.LPAR, tokenize.LSQB, tokenize.LBRACE}:
            return last_indent + 4
        return last_indent

    if tokens[-1].exact_type == tokenize.COLON:
        # Line ends with colon - indent
        return last_indent + 4

    if last_indent:
        # Examine the last line for dedent cues - statements like return or
        # raise which normally end a block of code.
        last_line_starts = 0
        for i, tok in enumerate(tokens):
            if tok.type == tokenize.NEWLINE:
                last_line_starts = i + 1

        last_line_tokens = tokens[last_line_starts:]
        names = [t.string for t in last_line_tokens if t.type == tokenize.NAME]
        if names and names[0] in {'raise', 'return', 'pass', 'break', 'continue'}:
            # Find the most recent indentation less than the current level
            for indent in reversed(prev_indents):
                if indent < last_indent:
                    return indent

    return last_indent
197 197
198 198
def last_blank(src):
    """Determine if the input source ends in a blank.

    A blank is either a newline or a line consisting of whitespace.

    Parameters
    ----------
    src : string
        A single or multiline string.
    """
    # Empty input has no final line at all.
    if not src:
        return False
    final = src.splitlines()[-1]
    return final == '' or final.isspace()
212 212
213 213
last_two_blanks_re = re.compile(r'\n\s*\n\s*$', re.MULTILINE)
last_two_blanks_re2 = re.compile(r'.+\n\s*\n\s+$', re.MULTILINE)

def last_two_blanks(src):
    """Determine if the input source ends in two blanks.

    A blank is either a newline or a line consisting of whitespace.

    Parameters
    ----------
    src : string
        A single or multiline string.
    """
    if not src:
        return False
    # The logic here is tricky: I couldn't get a regexp to work and pass all
    # the tests, so I took a different approach: split the source by lines,
    # grab the last two and prepend '###\n' as a stand-in for whatever was in
    # the body before the last two lines. Then, with that structure, it's
    # possible to analyze with two regexps. Not the most elegant solution, but
    # it works. If anyone tries to change this logic, make sure to validate
    # the whole test suite first!
    tail = src.splitlines()[-2:]
    probe = '\n'.join(['###\n'] + tail)
    return bool(last_two_blanks_re.match(probe) or
                last_two_blanks_re2.match(probe))
238 238
239 239
def remove_comments(src):
    """Remove all comments from input source.

    Note: comments are NOT recognized inside of strings!

    Parameters
    ----------
    src : string
        A single or multiline input string.

    Returns
    -------
    String with all Python comments removed.
    """
    # Purely textual: drop everything from each '#' to the end of its line.
    # A '#' inside a string literal is removed too (see the note above).
    comment = re.compile('#.*')
    return comment.sub('', src)
256 256
257 257
def get_input_encoding():
    """Return the default standard input encoding.

    If sys.stdin has no encoding, 'ascii' is returned."""
    # Some environments (pipes, frozen apps, replaced stdin objects) leave
    # sys.stdin.encoding unset or None; fall back to a safe default then.
    encoding = getattr(sys.stdin, 'encoding', None)
    return 'ascii' if encoding is None else encoding
268 268
269 269 #-----------------------------------------------------------------------------
270 270 # Classes and functions for normal Python syntax handling
271 271 #-----------------------------------------------------------------------------
272 272
class InputSplitter(object):
    r"""An object that can accumulate lines of Python source before execution.

    This object is designed to be fed python source line-by-line, using
    :meth:`push`. It will return on each push whether the currently pushed
    code could be executed already. In addition, it provides a method called
    :meth:`push_accepts_more` that can be used to query whether more input
    can be pushed into a single interactive block.

    This is a simple example of how an interactive terminal-based client can use
    this tool::

        isp = InputSplitter()
        while isp.push_accepts_more():
            indent = ' '*isp.indent_spaces
            prompt = '>>> ' + indent
            line = indent + raw_input(prompt)
            isp.push(line)
        print 'Input source was:\n', isp.source_reset(),
    """
    # A cache for storing the current indentation
    # The first value stores the most recently processed source input
    # The second value is the number of spaces for the current indentation
    # If self.source matches the first value, the second value is a valid
    # current indentation. Otherwise, the cache is invalid and the indentation
    # must be recalculated.
    _indent_spaces_cache = None, None
    # String, indicating the default input encoding. It is computed by default
    # at initialization time via get_input_encoding(), but it can be reset by a
    # client with specific knowledge of the encoding.
    encoding = ''
    # String where the current full source input is stored, properly encoded.
    # Reading this attribute is the normal way of querying the currently pushed
    # source code, that has been properly encoded.
    source = ''
    # Code object corresponding to the current source. It is automatically
    # synced to the source, so it can be queried at any time to obtain the code
    # object; it will be None if the source doesn't compile to valid Python.
    code = None

    # Private attributes

    # List with lines of input accumulated so far
    _buffer = None
    # Command compiler
    _compile = None
    # Boolean indicating whether the current block is complete
    _is_complete = None
    # Boolean indicating whether the current block has an unrecoverable syntax error
    _is_invalid = False

    def __init__(self):
        """Create a new InputSplitter instance.
        """
        self._buffer = []
        self._compile = codeop.CommandCompiler()
        self.encoding = get_input_encoding()

    def reset(self):
        """Reset the input buffer and associated state."""
        self._buffer[:] = []
        self.source = ''
        self.code = None
        self._is_complete = False
        self._is_invalid = False

    def source_reset(self):
        """Return the input source and perform a full reset.
        """
        out = self.source
        self.reset()
        return out

    def check_complete(self, source):
        """Return whether a block of code is ready to execute, or should be continued

        This is a non-stateful API, and will reset the state of this InputSplitter.

        Parameters
        ----------
        source : string
          Python input code, which can be multiline.

        Returns
        -------
        status : str
          One of 'complete', 'incomplete', or 'invalid' if source is not a
          prefix of valid code.
        indent_spaces : int or None
          The number of spaces by which to indent the next line of code. If
          status is not 'incomplete', this is None.
        """
        self.reset()
        try:
            self.push(source)
        except SyntaxError:
            # Transformers in IPythonInputSplitter can raise SyntaxError,
            # which push() will not catch.
            return 'invalid', None
        else:
            if self._is_invalid:
                return 'invalid', None
            elif self.push_accepts_more():
                return 'incomplete', self.get_indent_spaces()
            else:
                return 'complete', None
        finally:
            # This API is stateless: always leave the splitter pristine for
            # the next caller, whichever branch returned above.
            self.reset()

    def push(self, lines):
        """Push one or more lines of input.

        This stores the given lines and returns a status code indicating
        whether the code forms a complete Python block or not.

        Any exceptions generated in compilation are swallowed, but if an
        exception was produced, the method returns True.

        Parameters
        ----------
        lines : string
          One or more lines of Python input.

        Returns
        -------
        is_complete : boolean
          True if the current input source (the result of the current input
          plus prior inputs) forms a complete Python execution block. Note that
          this value is also stored as a private attribute (``_is_complete``), so it
          can be queried at any time.
        """
        self._store(lines)
        source = self.source

        # Before calling _compile(), reset the code object to None so that if an
        # exception is raised in compilation, we don't mislead by having
        # inconsistent code/source attributes.
        self.code, self._is_complete = None, None
        self._is_invalid = False

        # Honor termination lines properly
        # An explicit trailing backslash continuation always means more input
        # is expected, so short-circuit before compiling.
        if source.endswith('\\\n'):
            return False

        try:
            with warnings.catch_warnings():
                # Treat SyntaxWarning as an error so suspicious-but-compilable
                # input is flagged invalid rather than silently accepted.
                warnings.simplefilter('error', SyntaxWarning)
                self.code = self._compile(source, symbol="exec")
        # Invalid syntax can produce any of a number of different errors from
        # inside the compiler, so we have to catch them all. Syntax errors
        # immediately produce a 'ready' block, so the invalid Python can be
        # sent to the kernel for evaluation with possible ipython
        # special-syntax conversion.
        except (SyntaxError, OverflowError, ValueError, TypeError,
                MemoryError, SyntaxWarning):
            self._is_complete = True
            self._is_invalid = True
        else:
            # Compilation didn't produce any exceptions (though it may not have
            # given a complete code object)
            self._is_complete = self.code is not None

        return self._is_complete

    def push_accepts_more(self):
        """Return whether a block of interactive input can accept more input.

        This method is meant to be used by line-oriented frontends, who need to
        guess whether a block is complete or not based solely on prior and
        current input lines. The InputSplitter considers it has a complete
        interactive block and will not accept more input when either:

        * A SyntaxError is raised

        * The code is complete and consists of a single line or a single
          non-compound statement

        * The code is complete and has a blank line at the end

        If the current input produces a syntax error, this method immediately
        returns False but does *not* raise the syntax error exception, as
        typically clients will want to send invalid syntax to an execution
        backend which might convert the invalid syntax into valid Python via
        one of the dynamic IPython mechanisms.
        """

        # With incomplete input, unconditionally accept more
        # A syntax error also sets _is_complete to True - see push()
        if not self._is_complete:
            #print("Not complete") # debug
            return True

        # The user can make any (complete) input execute by leaving a blank line
        last_line = self.source.splitlines()[-1]
        if (not last_line) or last_line.isspace():
            #print("Blank line") # debug
            return False

        # If there's just a single line or AST node, and we're flush left, as is
        # the case after a simple statement such as 'a=1', we want to execute it
        # straight away.
        if self.get_indent_spaces() == 0:
            if len(self.source.splitlines()) <= 1:
                return False

            try:
                code_ast = ast.parse(u''.join(self._buffer))
            except Exception:
                #print("Can't parse AST") # debug
                return False
            else:
                if len(code_ast.body) == 1 and \
                                    not hasattr(code_ast.body[0], 'body'):
                    #print("Simple statement") # debug
                    return False

        # General fallback - accept more code
        return True

    def get_indent_spaces(self):
        """Return the indentation (in spaces) for the next line of input.

        The result is cached per source string (see _indent_spaces_cache)."""
        sourcefor, n = self._indent_spaces_cache
        if sourcefor == self.source:
            return n

        # self.source always has a trailing newline
        n = find_next_indent(self.source[:-1])
        self._indent_spaces_cache = (self.source, n)
        return n

    # Backwards compatibility. I think all code that used .indent_spaces was
    # inside IPython, but we can leave this here until IPython 7 in case any
    # other modules are using it. -TK, November 2017
    indent_spaces = property(get_indent_spaces)

    def _store(self, lines, buffer=None, store='source'):
        """Store one or more lines of input.

        If input lines are not newline-terminated, a newline is automatically
        appended."""

        if buffer is None:
            buffer = self._buffer

        if lines.endswith('\n'):
            buffer.append(lines)
        else:
            buffer.append(lines+'\n')
        # Keep the named attribute (by default self.source) in sync with the
        # buffer contents.
        setattr(self, store, self._set_source(buffer))

    def _set_source(self, buffer):
        """Join the buffered lines into a single source string."""
        return u''.join(buffer)
524 524
525 525
class IPythonInputSplitter(InputSplitter):
    """An input splitter that recognizes all of IPython's special syntax."""

    # String with raw, untransformed input.
    source_raw = ''

    # Flag to track when a transformer has stored input that it hasn't given
    # back yet.
    transformer_accumulating = False

    # Flag to track when assemble_python_lines has stored input that it hasn't
    # given back yet.
    within_python_line = False

    # Private attributes

    # List with lines of raw input accumulated so far.
    _buffer_raw = None

    def __init__(self, line_input_checker=True, physical_line_transforms=None,
                 logical_line_transforms=None, python_line_transforms=None):
        super(IPythonInputSplitter, self).__init__()
        self._buffer_raw = []
        self._validate = True

        # Each group of transformers may be overridden by the caller; the
        # defaults below implement IPython's standard syntax handling.
        if physical_line_transforms is not None:
            self.physical_line_transforms = physical_line_transforms
        else:
            self.physical_line_transforms = [
                                             leading_indent(),
                                             classic_prompt(),
                                             ipy_prompt(),
                                             cellmagic(end_on_blank_line=line_input_checker),
                                            ]

        self.assemble_logical_lines = assemble_logical_lines()
        if logical_line_transforms is not None:
            self.logical_line_transforms = logical_line_transforms
        else:
            self.logical_line_transforms = [
                                            help_end(),
                                            escaped_commands(),
                                            assign_from_magic(),
                                            assign_from_system(),
                                           ]

        self.assemble_python_lines = assemble_python_lines()
        if python_line_transforms is not None:
            self.python_line_transforms = python_line_transforms
        else:
            # We don't use any of these at present
            self.python_line_transforms = []

    @property
    def transforms(self):
        "Quick access to all transformers."
        return self.physical_line_transforms + \
            [self.assemble_logical_lines] + self.logical_line_transforms + \
            [self.assemble_python_lines] + self.python_line_transforms

    @property
    def transforms_in_use(self):
        """Transformers, excluding logical line transformers if we're in a
        Python line."""
        t = self.physical_line_transforms[:]
        if not self.within_python_line:
            t += [self.assemble_logical_lines] + self.logical_line_transforms
        return t + [self.assemble_python_lines] + self.python_line_transforms

    def reset(self):
        """Reset the input buffer and associated state."""
        super(IPythonInputSplitter, self).reset()
        self._buffer_raw[:] = []
        self.source_raw = ''
        self.transformer_accumulating = False
        self.within_python_line = False

        for t in self.transforms:
            try:
                t.reset()
            except SyntaxError:
                # Nothing that calls reset() expects to handle transformer
                # errors
                pass

    def flush_transformers(self):
        """Flush pending input out of every transformer into self.source."""
        def _flush(transform, outs):
            """yield transformed lines

            always strings, never None

            transform: the current transform
            outs: an iterable of previously transformed inputs.
                Each may be multiline, which will be passed
                one line at a time to transform.
            """
            for out in outs:
                for line in out.splitlines():
                    # push one line at a time
                    tmp = transform.push(line)
                    if tmp is not None:
                        yield tmp

            # reset the transform
            tmp = transform.reset()
            if tmp is not None:
                yield tmp

        # Chain the generators so each transformer consumes the previous
        # one's output; nothing runs until the list() below drains them.
        out = []
        for t in self.transforms_in_use:
            out = _flush(t, out)

        out = list(out)
        if out:
            self._store('\n'.join(out))

    def raw_reset(self):
        """Return raw input only and perform a full reset.
        """
        out = self.source_raw
        self.reset()
        return out

    def source_reset(self):
        """Return the transformed source and perform a full reset."""
        try:
            self.flush_transformers()
            return self.source
        finally:
            self.reset()

    def push_accepts_more(self):
        """Return whether more input can be pushed (see InputSplitter).

        Also True while any transformer is still accumulating lines."""
        if self.transformer_accumulating:
            return True
        else:
            return super(IPythonInputSplitter, self).push_accepts_more()

    def transform_cell(self, cell):
        """Process and translate a cell of input.
        """
        self.reset()
        try:
            self.push(cell)
            self.flush_transformers()
            return self.source
        finally:
            self.reset()

    def push(self, lines):
        """Push one or more lines of IPython input.

        This stores the given lines and returns a status code indicating
        whether the code forms a complete Python block or not, after processing
        all input lines for special IPython syntax.

        Any exceptions generated in compilation are swallowed, but if an
        exception was produced, the method returns True.

        Parameters
        ----------
        lines : string
          One or more lines of Python input.

        Returns
        -------
        is_complete : boolean
          True if the current input source (the result of the current input
          plus prior inputs) forms a complete Python execution block. Note that
          this value is also stored as a private attribute (_is_complete), so it
          can be queried at any time.
        """

        # We must ensure all input is pure unicode
        lines = cast_unicode(lines, self.encoding)
        # ''.splitlines() --> [], but we need to push the empty line to transformers
        lines_list = lines.splitlines()
        if not lines_list:
            lines_list = ['']

        # Store raw source before applying any transformations to it. Note
        # that this must be done *after* the reset() call that would otherwise
        # flush the buffer.
        self._store(lines, self._buffer_raw, 'source_raw')

        # Transform line by line; a transformer that is accumulating returns
        # None for a line, which is simply skipped here.
        transformed_lines_list = []
        for line in lines_list:
            transformed = self._transform_line(line)
            if transformed is not None:
                transformed_lines_list.append(transformed)

        if transformed_lines_list:
            transformed_lines = '\n'.join(transformed_lines_list)
            return super(IPythonInputSplitter, self).push(transformed_lines)
        else:
            # Got nothing back from transformers - they must be waiting for
            # more input.
            return False

    def _transform_line(self, line):
        """Push a line of input code through the various transformers.

        Returns any output from the transformers, or None if a transformer
        is accumulating lines.

        Sets self.transformer_accumulating as a side effect.
        """
        def _accumulating(dbg):
            #print(dbg)
            self.transformer_accumulating = True
            return None

        for transformer in self.physical_line_transforms:
            line = transformer.push(line)
            if line is None:
                return _accumulating(transformer)

        if not self.within_python_line:
            line = self.assemble_logical_lines.push(line)
            if line is None:
                return _accumulating('acc logical line')

            for transformer in self.logical_line_transforms:
                line = transformer.push(line)
                if line is None:
                    return _accumulating(transformer)

        line = self.assemble_python_lines.push(line)
        if line is None:
            self.within_python_line = True
            return _accumulating('acc python line')
        else:
            self.within_python_line = False

        for transformer in self.python_line_transforms:
            line = transformer.push(line)
            if line is None:
                return _accumulating(transformer)

        #print("transformers clear") #debug
        self.transformer_accumulating = False
        return line
766 766
@@ -1,534 +1,534 b''
1 1 """Input transformer classes to support IPython special syntax.
2 2
3 3 This includes the machinery to recognise and transform ``%magic`` commands,
4 4 ``!system`` commands, ``help?`` querying, prompt stripping, and so forth.
5 5 """
6 6 import abc
7 7 import functools
8 8 import re
9 9 from io import StringIO
10 10
11 11 from IPython.core.splitinput import LineInfo
12 12 from IPython.utils import tokenize2
13 13 from IPython.utils.tokenize2 import generate_tokens, untokenize, TokenError
14 14
15 15 #-----------------------------------------------------------------------------
16 16 # Globals
17 17 #-----------------------------------------------------------------------------
18 18
# The escape sequences that define the syntax transformations IPython will
# apply to user input. These can NOT be just changed here: many regular
# expressions and other parts of the code may use their hardcoded values, and
# for all intents and purposes they constitute the 'IPython syntax', so they
# should be considered fixed.

ESC_SHELL = '!' # Send line to underlying system shell
ESC_SH_CAP = '!!' # Send line to system shell and capture output
ESC_HELP = '?' # Find information about object
ESC_HELP2 = '??' # Find extra-detailed information about object
ESC_MAGIC = '%' # Call magic function
ESC_MAGIC2 = '%%' # Call cell-magic function
ESC_QUOTE = ',' # Split args on whitespace, quote each as string and call
ESC_QUOTE2 = ';' # Quote all args as a single string, call
ESC_PAREN = '/' # Call first argument with rest of line as arguments

# All escapes recognised by the dispatch machinery further below.
ESC_SEQUENCES = [ESC_SHELL, ESC_SH_CAP, ESC_HELP ,\
                 ESC_HELP2, ESC_MAGIC, ESC_MAGIC2,\
                 ESC_QUOTE, ESC_QUOTE2, ESC_PAREN ]
38 38
39 39
class InputTransformer(metaclass=abc.ABCMeta):
    """Abstract base class for line-based input transformers."""

    @abc.abstractmethod
    def push(self, line):
        """Feed one line of input to the transformer.

        Returns the transformed input, or None while the transformer is
        waiting for more input.  Must be overridden by subclasses.

        Implementations may raise ``SyntaxError`` if the input is invalid;
        no other exceptions may be raised.
        """

    @abc.abstractmethod
    def reset(self):
        """Return any lines the transformer has accumulated (transformed),
        and reset its internal state.  Must be overridden by subclasses.
        """

    @classmethod
    def wrap(cls, func):
        """Decorator helper: return a factory that builds instances of *cls*
        wrapping the decorated object.
        """
        @functools.wraps(func)
        def transformer_factory(**kwargs):
            return cls(func, **kwargs)

        return transformer_factory
74 74
class StatelessInputTransformer(InputTransformer):
    """Adapt a plain ``line -> line`` function to the InputTransformer API."""

    def __init__(self, func):
        self.func = func

    def __repr__(self):
        return "StatelessInputTransformer(func={0!r})".format(self.func)

    def push(self, line):
        """Transform *line* immediately; this transformer never accumulates."""
        return self.func(line)

    def reset(self):
        """No-op - exists for compatibility."""
        return None
91 91
class CoroutineInputTransformer(InputTransformer):
    """Adapt a generator-based coroutine to the InputTransformer API."""

    def __init__(self, coro, **kwargs):
        self.coro = coro(**kwargs)
        # Advance to the first yield so .send() can be used immediately.
        next(self.coro)

    def __repr__(self):
        return "CoroutineInputTransformer(coro={0!r})".format(self.coro)

    def push(self, line):
        """Send *line* into the coroutine, returning the transformed input
        or None if the coroutine is waiting for more input.
        """
        return self.coro.send(line)

    def reset(self):
        """Flush accumulated input by sending None; returns whatever the
        coroutine hands back, and resets its internal state.
        """
        return self.coro.send(None)
114 114
class TokenInputTransformer(InputTransformer):
    """Wrapper for a token-based input transformer.

    func should accept a list of tokens (5-tuples, see tokenize docs), and
    return an iterable which can be passed to tokenize.untokenize().
    """
    def __init__(self, func):
        self.func = func
        # Pending input lines (each with trailing '\n') not yet consumed.
        self.buf = []
        self.reset_tokenizer()

    def reset_tokenizer(self):
        # Rebuild the tokenizer so it reads from the *current* buffer
        # contents; generate_tokens pulls lines via the iterator's __next__.
        it = iter(self.buf)
        self.tokenizer = generate_tokens(it.__next__)

    def push(self, line):
        """Buffer *line* and attempt to tokenize everything accumulated.

        Returns the transformed source when a complete statement is seen,
        or None while more input is required.
        """
        self.buf.append(line + '\n')
        if all(l.isspace() for l in self.buf):
            # Whitespace-only input: nothing to tokenize, just flush.
            return self.reset()

        tokens = []
        stop_at_NL = False
        try:
            for intok in self.tokenizer:
                tokens.append(intok)
                t = intok[0]
                if t == tokenize2.NEWLINE or (stop_at_NL and t == tokenize2.NL):
                    # Stop before we try to pull a line we don't have yet
                    break
                elif t == tokenize2.ERRORTOKEN:
                    # After a tokenize error, bail out at the next NL too.
                    stop_at_NL = True
        except TokenError:
            # Multi-line statement - stop and try again with the next line
            self.reset_tokenizer()
            return None

        return self.output(tokens)

    def output(self, tokens):
        # Apply func to the token stream and re-serialize; clears state.
        self.buf.clear()
        self.reset_tokenizer()
        return untokenize(self.func(tokens)).rstrip('\n')

    def reset(self):
        """Return any buffered raw input (untransformed) and clear state.

        Returns None implicitly when the buffer was empty.
        """
        l = ''.join(self.buf)
        self.buf.clear()
        self.reset_tokenizer()
        if l:
            return l.rstrip('\n')
164 164
class assemble_python_lines(TokenInputTransformer):
    """Accumulate input until it forms a complete Python statement."""

    def __init__(self):
        # No token-transforming callback is needed; only the buffering
        # behaviour of the base class is used.
        super().__init__(None)

    def output(self, tokens):
        # Hand back the raw buffered text instead of untokenizing.
        return self.reset()
171 171
@CoroutineInputTransformer.wrap
def assemble_logical_lines():
    r"""Join lines that end in explicit line continuations (\)"""
    line = ''
    while True:
        line = (yield line)
        if not line or line.isspace():
            continue

        pieces = []
        while line is not None:
            if line.endswith('\\') and not has_comment(line):
                # Trailing backslash outside a comment: keep collecting.
                pieces.append(line[:-1])
                line = (yield None)  # Get another line
            else:
                pieces.append(line)
                break

        # Emit the joined logical line on the next iteration.
        line = ''.join(pieces)
192 192
# Utilities
def _make_help_call(target, esc, lspace, next_input=None):
    """Prepares a pinfo(2)/psearch call from a target name and the escape
    (i.e. ? or ??)"""
    if esc == '??':
        method = 'pinfo2'
    elif '*' in target:
        method = 'psearch'
    else:
        method = 'pinfo'
    arg = " ".join([method, target])
    # run_line_magic wants the magic name and its argument string separately.
    t_magic_name, _, t_magic_arg_s = arg.partition(' ')
    t_magic_name = t_magic_name.lstrip(ESC_MAGIC)
    if next_input is None:
        return '%sget_ipython().run_line_magic(%r, %r)' % (lspace, t_magic_name, t_magic_arg_s)
    return '%sget_ipython().set_next_input(%r);get_ipython().run_line_magic(%r, %r)' % \
        (lspace, next_input, t_magic_name, t_magic_arg_s)
209 209
# These define the transformations for the different escape characters.
def _tr_system(line_info):
    """Rewrite a ``!cmd`` line as a call to get_ipython().system."""
    cmd = line_info.line.lstrip().lstrip(ESC_SHELL)
    return '%sget_ipython().system(%r)' % (line_info.pre, cmd)
215 215
216 216 def _tr_system2(line_info):
217 217 "Translate lines escaped with: !!"
218 218 cmd = line_info.line.lstrip()[2:]
219 219 return '%sget_ipython().getoutput(%r)' % (line_info.pre, cmd)
220 220
def _tr_help(line_info):
    """Rewrite ``?obj``/``??obj`` lines as pinfo/pinfo2/psearch calls."""
    if not line_info.line[1:]:
        # A naked help line should just fire the intro help screen
        return 'get_ipython().show_usage()'
    return _make_help_call(line_info.ifun, line_info.esc, line_info.pre)
228 228
def _tr_magic(line_info):
    """Rewrite a ``%magic`` line as a run_line_magic call."""
    tpl = '%sget_ipython().run_line_magic(%r, %r)'
    if line_info.line.startswith(ESC_MAGIC2):
        # Cell magics (%%) are handled elsewhere; pass through unchanged.
        return line_info.line
    cmd = ' '.join([line_info.ifun, line_info.the_rest]).strip()
    # run_line_magic wants the magic name and its argument string separately.
    t_magic_name, _, t_magic_arg_s = cmd.partition(' ')
    t_magic_name = t_magic_name.lstrip(ESC_MAGIC)
    return tpl % (line_info.pre, t_magic_name, t_magic_arg_s)
239 239
240 240 def _tr_quote(line_info):
241 241 "Translate lines escaped with: ,"
242 242 return '%s%s("%s")' % (line_info.pre, line_info.ifun,
243 243 '", "'.join(line_info.the_rest.split()) )
244 244
245 245 def _tr_quote2(line_info):
246 246 "Translate lines escaped with: ;"
247 247 return '%s%s("%s")' % (line_info.pre, line_info.ifun,
248 248 line_info.the_rest)
249 249
250 250 def _tr_paren(line_info):
251 251 "Translate lines escaped with: /"
252 252 return '%s%s(%s)' % (line_info.pre, line_info.ifun,
253 253 ", ".join(line_info.the_rest.split()))
254 254
# Dispatch table: escape sequence -> translator for that kind of line.
# Note both help escapes share one handler, which inspects the escape itself.
tr = { ESC_SHELL : _tr_system,
       ESC_SH_CAP : _tr_system2,
       ESC_HELP : _tr_help,
       ESC_HELP2 : _tr_help,
       ESC_MAGIC : _tr_magic,
       ESC_QUOTE : _tr_quote,
       ESC_QUOTE2 : _tr_quote2,
       ESC_PAREN : _tr_paren }
263 263
@StatelessInputTransformer.wrap
def escaped_commands(line):
    """Transform escaped commands - %magic, !system, ?help + various autocalls.
    """
    if not line or line.isspace():
        return line
    info = LineInfo(line)
    # Dispatch on the escape character(s) found at the start of the line.
    handler = tr.get(info.esc)
    if handler is None:
        return line
    return handler(info)
275 275
# Matches (possibly empty) leading whitespace; used to preserve indentation.
_initial_space_re = re.compile(r'\s*')

# Matches e.g. "name.attr?", "%magic??" at the end of a line: an optionally
# %-prefixed dotted identifier followed by one or two question marks.
_help_end_re = re.compile(r"""(%{0,2}
                          [a-zA-Z_*][\w*]* # Variable name
                          (\.[a-zA-Z_*][\w*]*)* # .etc.etc
                          )
                          (\?\??)$ # ? or ??
                          """,
                          re.VERBOSE)

# Extra pseudotokens for multiline strings and data structures
# (sentinels added to the token-type set by _line_tokens below).
_MULTILINE_STRING = object()
_MULTILINE_STRUCTURE = object()
289 289
def _line_tokens(line):
    """Helper for has_comment and ends_in_comment_or_string."""
    readline = StringIO(line).readline
    toktypes = set()
    try:
        for tok in generate_tokens(readline):
            toktypes.add(tok[0])
    except TokenError as e:
        # TokenError is raised in exactly two cases: an unterminated
        # multi-line string, or an unclosed bracketed structure.
        if 'multi-line string' in e.args[0]:
            toktypes.add(_MULTILINE_STRING)
        else:
            toktypes.add(_MULTILINE_STRUCTURE)
    return toktypes
304 304
def has_comment(src):
    """Indicate whether an input line has (i.e. ends in, or is) a comment.

    This uses tokenize, so it can distinguish comments from # inside strings.

    Parameters
    ----------
    src : string
        A single line input string.

    Returns
    -------
    comment : bool
        True if source has a comment.
    """
    return tokenize2.COMMENT in _line_tokens(src)
321 321
def ends_in_comment_or_string(src):
    """Indicates whether or not an input line ends in a comment or within
    a multiline string.

    Parameters
    ----------
    src : string
        A single line input string.

    Returns
    -------
    comment : bool
        True if source ends in a comment or multiline string.
    """
    toktypes = _line_tokens(src)
    return tokenize2.COMMENT in toktypes or _MULTILINE_STRING in toktypes
338 338
339 339
@StatelessInputTransformer.wrap
def help_end(line):
    """Translate lines with ?/?? at the end"""
    match = _help_end_re.search(line)
    if match is None or ends_in_comment_or_string(line):
        return line
    target = match.group(1)
    esc = match.group(3)
    leading = _initial_space_re.match(line).group(0)

    # If we're mid-command, put it back on the next prompt for the user.
    if line.strip() != match.group(0):
        next_input = line.rstrip('?')
    else:
        next_input = None

    return _make_help_call(target, esc, leading, next_input)
354 354
355 355
@CoroutineInputTransformer.wrap
def cellmagic(end_on_blank_line=False):
    """Captures & transforms cell magics.

    After a cell magic is started, this stores up any lines it gets until it is
    reset (sent None).
    """
    tpl = 'get_ipython().run_cell_magic(%r, %r, %r)'
    cellmagic_help_re = re.compile(r'%%\w+\?')
    line = ''
    while True:
        line = (yield line)
        # consume leading empty lines
        while not line:
            line = (yield line)

        if not line.startswith(ESC_MAGIC2):
            # This isn't a cell magic, idle waiting for reset then start over
            while line is not None:
                line = (yield line)
            continue

        if cellmagic_help_re.match(line):
            # This case will be handled by help_end
            continue

        # First line holds "%%name args"; collect the body until reset
        # (or, optionally, until a blank line).
        first = line
        body = []
        line = (yield None)
        while (line is not None) and \
              ((line.strip() != '') or not end_on_blank_line):
            body.append(line)
            line = (yield None)

        # Output
        magic_name, _, first = first.partition(' ')
        magic_name = magic_name.lstrip(ESC_MAGIC2)
        line = tpl % (magic_name, first, u'\n'.join(body))
394 394
395 395
def _strip_prompts(prompt_re, initial_re=None, turnoff_re=None):
    """Remove matching input prompts from a block of input.

    Parameters
    ----------
    prompt_re : regular expression
        A regular expression matching any input prompt (including continuation)
    initial_re : regular expression, optional
        A regular expression matching only the initial prompt, but not continuation.
        If no initial expression is given, prompt_re will be used everywhere.
        Used mainly for plain Python prompts, where the continuation prompt
        ``...`` is a valid Python expression in Python 3, so shouldn't be stripped.
    turnoff_re : regular expression, optional
        If this matches an unprompted first line, prompt stripping is disabled
        for the rest of the cell (e.g. inside a cell magic).

    If initial_re and prompt_re differ,
    only initial_re will be tested against the first line.
    If any prompt is found on the first two lines,
    prompts will be stripped from the rest of the block.
    """
    if initial_re is None:
        initial_re = prompt_re
    line = ''
    while True:
        line = (yield line)

        # First line of cell
        if line is None:
            continue
        # n1 records whether the initial prompt matched on line one.
        out, n1 = initial_re.subn('', line, count=1)
        if turnoff_re and not n1:
            if turnoff_re.match(line):
                # We're in e.g. a cell magic; disable this transformer for
                # the rest of the cell.
                while line is not None:
                    line = (yield line)
                continue

        line = (yield out)

        if line is None:
            continue
        # check for any prompt on the second line of the cell,
        # because people often copy from just after the first prompt,
        # so we might not see it in the first line.
        out, n2 = prompt_re.subn('', line, count=1)
        line = (yield out)

        if n1 or n2:
            # Found a prompt in the first two lines - check for it in
            # the rest of the cell as well.
            while line is not None:
                line = (yield prompt_re.sub('', line, count=1))

        else:
            # Prompts not in input - wait for reset
            while line is not None:
                line = (yield line)
452 452
@CoroutineInputTransformer.wrap
def classic_prompt():
    """Strip the >>>/... prompts of the Python interactive shell."""
    # FIXME: non-capturing version (?:...) usable?
    prompt_re = re.compile(r'^(>>>|\.\.\.)( |$)')
    initial_re = re.compile(r'^>>>( |$)')
    # Any %magic/!system is IPython syntax, so we needn't look for >>> prompts
    turnoff_re = re.compile(r'^[%!]')
    return _strip_prompts(prompt_re, initial_re=initial_re,
                          turnoff_re=turnoff_re)
462 462
@CoroutineInputTransformer.wrap
def ipy_prompt():
    """Strip IPython's In [1]:/...: prompts."""
    # FIXME: non-capturing version (?:...) usable?
    prompt_re = re.compile(r'^(In \[\d+\]: |\s*\.{3,}: ?)')
    # Disable prompt stripping inside cell magics
    turnoff_re = re.compile(r'^%%')
    return _strip_prompts(prompt_re, turnoff_re=turnoff_re)
471 471
472 472
@CoroutineInputTransformer.wrap
def leading_indent():
    """Remove leading indentation.

    If the first line starts with a spaces or tabs, the same whitespace will be
    removed from each following line until it is reset.
    """
    space_re = re.compile(r'^[ \t]+')
    line = ''
    while True:
        line = (yield line)

        if line is None:
            continue

        m = space_re.match(line)
        if m:
            # Remember the exact leading whitespace of the first line and
            # strip that same prefix from every subsequent line of the cell.
            space = m.group(0)
            while line is not None:
                if line.startswith(space):
                    line = line[len(space):]
                line = (yield line)
        else:
            # No leading spaces - wait for reset
            while line is not None:
                line = (yield line)
499 499
500 500
# Common left-hand-side pattern for "<targets> = <rhs>" assignments: one or
# more dotted identifiers (optionally *-unpacked), separated by commas.
_assign_pat = \
r'''(?P<lhs>(\s*)
    ([\w\.]+)                # Initial identifier
    (\s*,\s*
    \*?[\w\.]+)*             # Further identifiers for unpacking
    \s*?,?                   # Trailing comma
    )
    \s*=\s*
    '''

# Matches "files = !ls"-style lines; template builds the replacement call.
assign_system_re = re.compile(r'{}!\s*(?P<cmd>.*)'.format(_assign_pat), re.VERBOSE)
assign_system_template = '%s = get_ipython().getoutput(%r)'
@StatelessInputTransformer.wrap
def assign_from_system(line):
    """Transform assignment from system commands (e.g. files = !ls)"""
    match = assign_system_re.match(line)
    if match is None:
        return line
    # Replace the whole line with an assignment capturing the command output.
    return assign_system_template % match.group('lhs', 'cmd')
521 521
# Matches "a = %who_ls"-style lines; template builds the replacement call.
assign_magic_re = re.compile(r'{}%\s*(?P<cmd>.*)'.format(_assign_pat), re.VERBOSE)
assign_magic_template = '%s = get_ipython().run_line_magic(%r, %r)'
@StatelessInputTransformer.wrap
def assign_from_magic(line):
    """Transform assignment from magic commands (e.g. a = %who_ls)"""
    match = assign_magic_re.match(line)
    if match is None:
        return line
    lhs, cmd = match.group('lhs', 'cmd')
    # run_line_magic wants the magic name and its argument string separately.
    name, _, args = cmd.partition(' ')
    return assign_magic_template % (lhs, name.lstrip(ESC_MAGIC), args)
@@ -1,158 +1,158 b''
1 1 """Implementation of configuration-related magic functions.
2 2 """
3 3 #-----------------------------------------------------------------------------
4 4 # Copyright (c) 2012 The IPython Development Team.
5 5 #
6 6 # Distributed under the terms of the Modified BSD License.
7 7 #
8 8 # The full license is in the file COPYING.txt, distributed with this software.
9 9 #-----------------------------------------------------------------------------
10 10
11 11 #-----------------------------------------------------------------------------
12 12 # Imports
13 13 #-----------------------------------------------------------------------------
14 14
15 15 # Stdlib
16 16 import re
17 17
18 18 # Our own packages
19 19 from IPython.core.error import UsageError
20 20 from IPython.core.magic import Magics, magics_class, line_magic
21 21 from logging import error
22 22
23 23 #-----------------------------------------------------------------------------
24 24 # Magic implementation classes
25 25 #-----------------------------------------------------------------------------
26 26
# Matches "Class.trait"-style access to a single configurable attribute.
reg = re.compile(r'^\w+\.\w+$')
@magics_class
class ConfigMagics(Magics):

    def __init__(self, shell):
        super(ConfigMagics, self).__init__(shell)
        # Configurable instances registered with this magic (currently unused
        # beyond initialisation here).
        self.configurables = []

    @line_magic
    def config(self, s):
        """configure IPython

            %config Class[.trait=value]

        This magic exposes most of the IPython config system. Any
        Configurable class should be able to be configured with the simple
        line::

            %config Class.trait=value

        Where `value` will be resolved in the user's namespace, if it is an
        expression or variable name.

        Examples
        --------

        To see what classes are available for config, pass no arguments::

            In [1]: %config
            Available objects for config:
                TerminalInteractiveShell
                HistoryManager
                PrefilterManager
                AliasManager
                IPCompleter
                DisplayFormatter

        To view what is configurable on a given class, just pass the class
        name::

            In [2]: %config IPCompleter
            IPCompleter options
            -----------------
            IPCompleter.omit__names=<Enum>
                Current: 2
                Choices: (0, 1, 2)
                Instruct the completer to omit private method names
                Specifically, when completing on ``object.<tab>``.
                When 2 [default]: all names that start with '_' will be excluded.
                When 1: all 'magic' names (``__foo__``) will be excluded.
                When 0: nothing will be excluded.
            IPCompleter.merge_completions=<CBool>
                Current: True
                Whether to merge completion results into a single list
                If False, only the completion results from the first non-empty
                completer will be returned.
            IPCompleter.limit_to__all__=<CBool>
                Current: False
                Instruct the completer to use __all__ for the completion
                Specifically, when completing on ``object.<tab>``.
                When True: only those names in obj.__all__ will be included.
                When False [default]: the __all__ attribute is ignored
            IPCompleter.greedy=<CBool>
                Current: False
                Activate greedy completion
                This will enable completion on elements of lists, results of
                function calls, etc., but can be unsafe because the code is
                actually evaluated on TAB.

        but the real use is in setting values::

            In [3]: %config IPCompleter.greedy = True

        and these values are read from the user_ns if they are variables::

            In [4]: feeling_greedy=False

            In [5]: %config IPCompleter.greedy = feeling_greedy

        """
        from traitlets.config.loader import Config
        # some IPython objects are Configurable, but do not yet have
        # any configurable traits. Exclude them from the effects of
        # this magic, as their presence is just noise:
        configurables = sorted(set([ c for c in self.shell.configurables
                                     if c.__class__.class_traits(config=True)
                                     ]), key=lambda x: x.__class__.__name__)
        classnames = [ c.__class__.__name__ for c in configurables ]

        line = s.strip()
        if not line:
            # print available configurable names
            print("Available objects for config:")
            for name in classnames:
                print(" ", name)
            return
        elif line in classnames:
            # `%config TerminalInteractiveShell` will print trait info for
            # TerminalInteractiveShell
            c = configurables[classnames.index(line)]
            cls = c.__class__
            help = cls.class_get_help(c)
            # strip leading '--' from cl-args:
            help = re.sub(re.compile(r'^--', re.MULTILINE), '', help)
            print(help)
            return
        elif reg.match(line):
            # `%config Class.trait`: return the current value of that trait.
            cls, attr = line.split('.')
            return getattr(configurables[classnames.index(cls)],attr)
        elif '=' not in line:
            msg = "Invalid config statement: %r, "\
                  "should be `Class.trait = value`."

            # Suggest the correctly-cased class name if only the case differs.
            ll = line.lower()
            for classname in classnames:
                if ll == classname.lower():
                    msg = msg + '\nDid you mean %s (note the case)?' % classname
                    break

            raise UsageError( msg % line)

        # otherwise, assume we are setting configurables.
        # leave quotes on args when splitting, because we want
        # unquoted args to eval in user_ns
        cfg = Config()
        # NOTE: exec of user-supplied text is deliberate here - the magic's
        # contract is that the RHS is evaluated in the user's namespace.
        exec("cfg."+line, locals(), self.shell.user_ns)

        for configurable in configurables:
            try:
                configurable.update_config(cfg)
            except Exception as e:
                error(e)
@@ -1,137 +1,137 b''
1 1 # encoding: utf-8
2 2 """
3 3 Simple utility for splitting user input. This is used by both inputsplitter and
4 4 prefilter.
5 5
6 6 Authors:
7 7
8 8 * Brian Granger
9 9 * Fernando Perez
10 10 """
11 11
12 12 #-----------------------------------------------------------------------------
13 13 # Copyright (C) 2008-2011 The IPython Development Team
14 14 #
15 15 # Distributed under the terms of the BSD License. The full license is in
16 16 # the file COPYING, distributed as part of this software.
17 17 #-----------------------------------------------------------------------------
18 18
19 19 #-----------------------------------------------------------------------------
20 20 # Imports
21 21 #-----------------------------------------------------------------------------
22 22
23 23 import re
24 24 import sys
25 25
26 26 from IPython.utils import py3compat
27 27 from IPython.utils.encoding import get_stream_enc
28 28
29 29 #-----------------------------------------------------------------------------
30 30 # Main function
31 31 #-----------------------------------------------------------------------------
32 32
# RegExp for splitting line contents into pre-char//first word-method//rest.
# For clarity, each group in on one line.

# WARNING: update the regexp if the escapes in interactiveshell are changed, as
# they are hardwired in.

# Although it's not solely driven by the regex, note that:
# ,;/% only trigger if they are the first character on the line
# ! and !! trigger if they are first char(s) *or* follow an indent
# ? triggers as first or last char.

line_split = re.compile(r"""
             ^(\s*)               # any leading space
             ([,;/%]|!!?|\?\??)?  # escape character or characters
             \s*(%{0,2}[\w\.\*]*) # function/method, possibly with leading %
                                  # to correctly treat things like '?%magic'
             (.*?$|$)             # rest of line
             """, re.VERBOSE)
51 51
52 52
def split_user_input(line, pattern=None):
    """Split user input into initial whitespace, escape character, function part
    and the rest.
    """
    # We need to ensure that the rest of this routine deals only with unicode
    encoding = get_stream_enc(sys.stdin, 'utf-8')
    line = py3compat.cast_unicode(line, encoding)

    if pattern is None:
        pattern = line_split
    match = pattern.match(line)
    if match:
        pre, esc, ifun, the_rest = match.groups()
    else:
        # Regex failed: fall back to a crude whitespace split.
        try:
            ifun, the_rest = line.split(None, 1)
        except ValueError:
            ifun, the_rest = line, u''
        pre = re.match(r'^(\s*)(.*)', line).groups()[0]
        esc = ""

    return pre, esc or '', ifun.strip(), the_rest.lstrip()
79 79
80 80
class LineInfo(object):
    """A single line of input and associated info.

    Includes the following as properties:

    line
      The original, raw line

    continue_prompt
      Is this line a continuation in a sequence of multiline input?

    pre
      Any leading whitespace.

    esc
      The escape character(s) in pre or the empty string if there isn't one.
      Note that '!!' and '??' are possible values for esc. Otherwise it will
      always be a single character.

    ifun
      The 'function part', which is basically the maximal initial sequence
      of valid python identifiers and the '.' character. This is what is
      checked for alias and magic transformations, used for auto-calling,
      etc. In contrast to Python identifiers, it may start with "%" and contain
      "*".

    the_rest
      Everything else on the line.
    """
    def __init__(self, line, continue_prompt=False):
        self.line = line
        self.continue_prompt = continue_prompt
        # Decompose the raw line into its four syntactic parts.
        self.pre, self.esc, self.ifun, self.the_rest = split_user_input(line)

        self.pre_char = self.pre.strip()
        if self.pre_char:
            self.pre_whitespace = '' # No whitespace allowed before esc chars
        else:
            self.pre_whitespace = self.pre

    def ofind(self, ip):
        """Do a full, attribute-walking lookup of the ifun in the various
        namespaces for the given IPython InteractiveShell instance.

        Return a dict with keys: {found, obj, ospace, ismagic}

        Note: can cause state changes because of calling getattr, but should
        only be run if autocall is on and if the line hasn't matched any
        other, less dangerous handlers.

        Does cache the results of the call, so can be called multiple times
        without worrying about *further* damaging state.
        """
        return ip._ofind(self.ifun)

    def __str__(self):
        return "LineInfo [%s|%s|%s|%s]" %(self.pre, self.esc, self.ifun, self.the_rest)
@@ -1,438 +1,438 b''
1 1 # encoding: utf-8
2 2 """
3 3 Utilities for path handling.
4 4 """
5 5
6 6 # Copyright (c) IPython Development Team.
7 7 # Distributed under the terms of the Modified BSD License.
8 8
9 9 import os
10 10 import sys
11 11 import errno
12 12 import shutil
13 13 import random
14 14 import glob
15 15 from warnings import warn
16 16
17 17 from IPython.utils.process import system
18 18 from IPython.utils import py3compat
19 19 from IPython.utils.decorators import undoc
20 20
21 21 #-----------------------------------------------------------------------------
22 22 # Code
23 23 #-----------------------------------------------------------------------------
24 24
25 25 fs_encoding = sys.getfilesystemencoding()
26 26
def _writable_dir(path):
    """Return True when `path` is an existing directory writable by the user."""
    if not os.path.isdir(path):
        return False
    return os.access(path, os.W_OK)
30 30
if sys.platform == 'win32':
    def _get_long_path_name(path):
        """Get a long path name (expand ~) on Windows using ctypes.

        Examples
        --------

        >>> get_long_path_name('c:\\docume~1')
        'c:\\\\Documents and Settings'

        """
        try:
            import ctypes
        except ImportError:
            raise ImportError('you need to have ctypes installed for this to work')
        # GetLongPathNameW(lpszShortPath, lpszLongPath, cchBuffer)
        _GetLongPathName = ctypes.windll.kernel32.GetLongPathNameW
        _GetLongPathName.argtypes = [ctypes.c_wchar_p, ctypes.c_wchar_p,
            ctypes.c_uint ]

        # 260 == MAX_PATH on Windows; longer results are not handled here.
        buf = ctypes.create_unicode_buffer(260)
        rv = _GetLongPathName(path, buf, 260)
        if rv == 0 or rv > 260:
            # 0 means the call failed; > 260 means the buffer was too small.
            # In either case fall back to the original path untouched.
            return path
        else:
            return buf.value
else:
    def _get_long_path_name(path):
        """Dummy no-op."""
        return path
60 60
61 61
62 62
def get_long_path_name(path):
    """Expand a path into its long form.

    On Windows this expands any ~ in the paths. On other platforms, it is
    a null operation.
    """
    # Dispatches to the platform-specific implementation selected at import time.
    return _get_long_path_name(path)
70 70
71 71
def unquote_filename(name, win32=(sys.platform=='win32')):
    """On Windows, remove leading and trailing quotes from filenames.

    This function has been deprecated and should not be used any more:
    unquoting is now taken care of by :func:`IPython.utils.process.arg_split`.
    """
    warn("'unquote_filename' is deprecated since IPython 5.0 and should not "
         "be used anymore", DeprecationWarning, stacklevel=2)
    if win32:
        quotes = ("'", '"')
        # Note: the quotes need not match each other; this mirrors the
        # historical behavior of this helper.
        if name.startswith(quotes) and name.endswith(quotes):
            name = name[1:-1]
    return name
84 84
85 85
def compress_user(path):
    """Reverse of :func:`os.path.expanduser`

    Replace the user's home directory prefix of ``path`` with ``~``.

    The prefix is only replaced when it ends exactly at a path-component
    boundary, so a sibling directory such as ``/home/userX`` is left
    untouched when the home directory is ``/home/user`` (the previous
    plain ``startswith`` test mangled such paths).
    """
    home = os.path.expanduser('~')
    if path == home:
        return '~'
    # Require a separator right after the home prefix: this avoids
    # compressing paths that merely share a string prefix with $HOME.
    if path.startswith(home + os.sep):
        return '~' + path[len(home):]
    return path
93 93
def get_py_filename(name, force_win32=None):
    """Return a valid python filename in the current directory.

    If the given name is not a file, it adds '.py' and searches again.
    Raises IOError with an informative message if the file isn't found.
    """
    name = os.path.expanduser(name)
    if force_win32 is not None:
        warn("The 'force_win32' argument to 'get_py_filename' is deprecated "
             "since IPython 5.0 and should not be used anymore",
             DeprecationWarning, stacklevel=2)
    # Retry with a '.py' suffix before giving up.
    if not os.path.isfile(name) and not name.endswith('.py'):
        name += '.py'
    if not os.path.isfile(name):
        raise IOError('File `%r` not found.' % name)
    return name
112 112
113 113
def filefind(filename, path_dirs=None):
    """Find a file by looking through a sequence of paths.

    This iterates through a sequence of paths looking for a file and returns
    the full, absolute path of the first occurrence of the file. If no set of
    path dirs is given, the filename is tested as is, after running through
    :func:`expandvars` and :func:`expanduser`. Thus a simple call::

        filefind('myfile.txt')

    will find the file in the current working dir, but::

        filefind('~/myfile.txt')

    Will find the file in the users home directory. This function does not
    automatically try any paths, such as the cwd or the user's home directory.

    Parameters
    ----------
    filename : str
        The filename to look for.
    path_dirs : str, None or sequence of str
        The sequence of paths to look for the file in. If None, the filename
        need to be absolute or be in the cwd. If a string, the string is
        put into a sequence and the searched. If a sequence, walk through
        each element and join with ``filename``, calling :func:`expandvars`
        and :func:`expanduser` before testing for existence.

    Returns
    -------
    Raises :exc:`IOError` or returns absolute path to file.
    """
    # Quoted paths confuse abspath; strip surrounding quotes first.
    filename = filename.strip('"').strip("'")
    if os.path.isabs(filename) and os.path.isfile(filename):
        # Absolute and existing: no search necessary.
        return filename

    if path_dirs is None:
        search = ("",)
    elif isinstance(path_dirs, str):
        search = (path_dirs,)
    else:
        search = path_dirs

    for directory in search:
        if directory == '.':
            directory = os.getcwd()
        candidate = expand_path(os.path.join(directory, filename))
        if os.path.isfile(candidate):
            return os.path.abspath(candidate)

    raise IOError("File %r does not exist in any of the search paths: %r" %
                  (filename, path_dirs) )
166 166
167 167
class HomeDirError(Exception):
    """Raised when a usable home directory cannot be determined."""
170 170
171 171
def get_home_dir(require_writable=False):
    """Return the 'home' directory, as a unicode string.

    Uses os.path.expanduser('~'), and checks for writability.

    See stdlib docs for how this is determined.
    $HOME is first priority on *ALL* platforms.

    Parameters
    ----------

    require_writable : bool [default: False]
        if True:
            guarantees the return value is a writable directory, otherwise
            raises HomeDirError
        if False:
            The path is resolved, but it is not guaranteed to exist or be writable.
    """
    homedir = os.path.expanduser('~')
    # Next line will make things work even when /home/ is a symlink to
    # /usr/home as it is on FreeBSD, for example
    homedir = os.path.realpath(homedir)

    if not _writable_dir(homedir) and os.name == 'nt':
        # expanduser failed, use the registry to get the 'My Documents' folder.
        try:
            try:
                import winreg as wreg  # Py 3
            except ImportError:
                import _winreg as wreg  # Py 2
            key = wreg.OpenKey(
                wreg.HKEY_CURRENT_USER,
                # Raw string: the key contains "\W", "\C", etc., which must
                # not be interpreted as string escape sequences.
                r"Software\Microsoft\Windows\CurrentVersion\Explorer\Shell Folders"
            )
            homedir = wreg.QueryValueEx(key, 'Personal')[0]
            key.Close()
        except Exception:
            # Best-effort only: fall back to whatever expanduser produced.
            pass

    if (not require_writable) or _writable_dir(homedir):
        return py3compat.cast_unicode(homedir, fs_encoding)
    else:
        raise HomeDirError('%s is not a writable dir, '
                           'set $HOME environment variable to override' % homedir)
217 217
def get_xdg_dir():
    """Return the XDG_CONFIG_HOME, if it is defined and exists, else None.

    This is only for non-OS X posix (Linux,Unix,etc.) systems.
    """
    # Only meaningful on non-darwin posix platforms.
    if os.name != 'posix' or sys.platform == 'darwin':
        return None
    # Fall back to ~/.config when the variable is unset *or* empty.
    xdg = os.environ.get("XDG_CONFIG_HOME", None) or os.path.join(get_home_dir(), '.config')
    if xdg and _writable_dir(xdg):
        return py3compat.cast_unicode(xdg, fs_encoding)
    return None
234 234
235 235
def get_xdg_cache_dir():
    """Return the XDG_CACHE_HOME, if it is defined and exists, else None.

    This is only for non-OS X posix (Linux,Unix,etc.) systems.
    """
    # Only meaningful on non-darwin posix platforms.
    if os.name != 'posix' or sys.platform == 'darwin':
        return None
    # Fall back to ~/.cache when the variable is unset *or* empty.
    xdg = os.environ.get("XDG_CACHE_HOME", None) or os.path.join(get_home_dir(), '.cache')
    if xdg and _writable_dir(xdg):
        return py3compat.cast_unicode(xdg, fs_encoding)
    return None
252 252
253 253
@undoc
def get_ipython_dir():
    # Deprecated shim kept only for backward compatibility.
    warn("get_ipython_dir has moved to the IPython.paths module since IPython 4.0.", stacklevel=2)
    from IPython.paths import get_ipython_dir as _impl
    return _impl()
259 259
@undoc
def get_ipython_cache_dir():
    # Deprecated shim kept only for backward compatibility.
    warn("get_ipython_cache_dir has moved to the IPython.paths module since IPython 4.0.", stacklevel=2)
    from IPython.paths import get_ipython_cache_dir as _impl
    return _impl()
265 265
@undoc
def get_ipython_package_dir():
    # Deprecated shim kept only for backward compatibility.
    warn("get_ipython_package_dir has moved to the IPython.paths module since IPython 4.0.", stacklevel=2)
    from IPython.paths import get_ipython_package_dir as _impl
    return _impl()
271 271
@undoc
def get_ipython_module_path(module_str):
    # Deprecated shim kept only for backward compatibility.
    warn("get_ipython_module_path has moved to the IPython.paths module since IPython 4.0.", stacklevel=2)
    from IPython.paths import get_ipython_module_path as _impl
    return _impl(module_str)
277 277
@undoc
def locate_profile(profile='default'):
    # Deprecated shim kept only for backward compatibility.
    warn("locate_profile has moved to the IPython.paths module since IPython 4.0.", stacklevel=2)
    from IPython.paths import locate_profile as _impl
    return _impl(profile=profile)
283 283
def expand_path(s):
    """Expand $VARS and ~names in a string, like a shell

    :Examples:

       In [2]: os.environ['FOO']='test'

       In [3]: expand_path('variable FOO is $FOO')
       Out[3]: 'variable FOO is test'
    """
    # Subtle Windows hack: in a UNC path such as \\server\share$\%username%,
    # os.path.expandvars would eat the lone "$" (treating it as an empty
    # variable), but that "$" marks a hidden share and must survive.  Shield
    # it behind a placeholder around the expansion.
    windows = os.name == 'nt'
    if windows:
        s = s.replace('$\\', 'IPYTHON_TEMP')
    s = os.path.expanduser(s)
    s = os.path.expandvars(s)
    if windows:
        s = s.replace('IPYTHON_TEMP', '$\\')
    return s
305 305
306 306
def unescape_glob(string):
    """Unescape glob pattern in `string`."""
    specials = '*[]!?'

    def _unescape(part):
        # Drop the backslash in front of each escaped glob metacharacter.
        for ch in specials:
            part = part.replace('\\' + ch, ch)
        return part

    # Literal double backslashes are preserved as single backslashes:
    # split on them, unescape each piece, then rejoin.
    pieces = string.split('\\\\')
    return '\\'.join(_unescape(p) for p in pieces)
314 314
315 315
def shellglob(args):
    """
    Do glob expansion for each element in `args` and return a flattened list.

    Unmatched glob pattern will remain as-is in the returned list.

    """
    # On Windows the backslash is the path separator, so it must not be
    # interpreted as a glob escape; everywhere else, strip escapes from
    # patterns that did not match anything.
    if sys.platform == 'win32':
        unescape = lambda x: x
    else:
        unescape = unescape_glob
    expanded = []
    for pattern in args:
        matches = glob.glob(pattern)
        expanded.extend(matches if matches else [unescape(pattern)])
    return expanded
330 330
331 331
def target_outdated(target, deps):
    """Determine whether a target is out of date.

    target_outdated(target,deps) -> 1/0

    deps: list of filenames which MUST exist.
    target: single filename which may or may not exist.

    If target doesn't exist or is older than any file listed in deps, return
    true, otherwise return false.
    """
    try:
        target_time = os.path.getmtime(target)
    except os.error:
        # Missing target is always outdated.
        return 1
    # Outdated as soon as any dependency is strictly newer.
    newer = any(os.path.getmtime(dep) > target_time for dep in deps)
    return 1 if newer else 0
354 354
355 355
def target_update(target, deps, cmd):
    """Update a target with a given command given a list of dependencies.

    target_update(target,deps,cmd) -> runs cmd if target is outdated.

    This is just a wrapper around target_outdated() which calls the given
    command if target is outdated."""
    outdated = target_outdated(target, deps)
    if outdated:
        system(cmd)
366 366
367 367
# Sentinel errno returned when the platform provides no ``os.link`` at all.
ENOLINK = 1998

def link(src, dst):
    """Hard links ``src`` to ``dst``, returning 0 or errno.

    Note that the special errno ``ENOLINK`` will be returned if ``os.link`` isn't
    supported by the operating system.
    """
    if not hasattr(os, "link"):
        return ENOLINK
    try:
        os.link(src, dst)
    except OSError as e:
        return e.errno
    return 0
385 385
386 386
def link_or_copy(src, dst):
    """Attempts to hardlink ``src`` to ``dst``, copying if the link fails.

    Attempts to maintain the semantics of ``shutil.copy``.

    Because ``os.link`` does not overwrite files, a unique temporary file
    will be used if the target already exists, then that file will be moved
    into place.
    """

    if os.path.isdir(dst):
        # Mirror shutil.copy semantics: a directory target means "copy into it".
        dst = os.path.join(dst, os.path.basename(src))

    link_errno = link(src, dst)
    if link_errno == errno.EEXIST:
        if os.stat(src).st_ino == os.stat(dst).st_ino:
            # dst is already a hard link to the correct file, so we don't need
            # to do anything else. If we try to link and rename the file
            # anyway, we get duplicate files - see http://bugs.python.org/issue21876
            return

        # Link (or copy, recursively) to a unique temporary name first ...
        new_dst = dst + "-temp-%04X" %(random.randint(1, 16**4), )
        try:
            link_or_copy(src, new_dst)
        except:
            # Clean up the temp file before re-raising, best effort.
            try:
                os.remove(new_dst)
            except OSError:
                pass
            raise
        # ... then move it over the existing destination in one step.
        os.rename(new_dst, dst)
    elif link_errno != 0:
        # Either link isn't supported, or the filesystem doesn't support
        # linking, or 'src' and 'dst' are on different filesystems.
        shutil.copy(src, dst)
422 422
def ensure_dir_exists(path, mode=0o755):
    """ensure that a directory exists

    If it doesn't exist, try to create it and protect against a race condition
    if another process is doing the same.

    The default permissions are 755, which differ from os.makedirs default of 777.
    """
    if os.path.exists(path):
        # Something is already there; it must actually be a directory.
        if not os.path.isdir(path):
            raise IOError("%r exists but is not a directory" % path)
        return
    try:
        os.makedirs(path, mode=mode)
    except OSError as e:
        # Another process may have created it between our check and makedirs.
        if e.errno != errno.EEXIST:
            raise
@@ -1,772 +1,772 b''
1 1 # encoding: utf-8
2 2 """
3 3 Utilities for working with strings and text.
4 4
5 5 Inheritance diagram:
6 6
7 7 .. inheritance-diagram:: IPython.utils.text
8 8 :parts: 3
9 9 """
10 10
11 11 import os
12 12 import re
13 13 import sys
14 14 import textwrap
15 15 from string import Formatter
16 16 from pathlib import Path
17 17
18 18 from IPython.utils import py3compat
19 19
# datetime.strftime date format for ipython
if sys.platform == 'win32':
    # Windows strftime does not support the "%-d" (non-padded day) flag,
    # so the day of month may appear zero-padded there.
    date_format = "%B %d, %Y"
else:
    date_format = "%B %-d, %Y"
25 25
class LSString(str):
    """String derivative with a special access attributes.

    These are normal strings, but with the special attributes:

        .l (or .list) : value as list (split on newlines).
        .n (or .nlstr): original value (the string itself).
        .s (or .spstr): value as whitespace-separated string.
        .p (or .paths): list of path objects (requires path.py package)

    Any values which require transformations are computed only once and
    cached.

    Such strings are very useful to efficiently interact with the shell, which
    typically only understands whitespace-separated options for commands."""

    def get_list(self):
        # Cache the newline-split form on first access.
        try:
            cached = self.__list
        except AttributeError:
            cached = self.__list = self.split('\n')
        return cached

    l = list = property(get_list)

    def get_spstr(self):
        # Cache the single-line, space-joined form on first access.
        try:
            cached = self.__spstr
        except AttributeError:
            cached = self.__spstr = self.replace('\n', ' ')
        return cached

    s = spstr = property(get_spstr)

    def get_nlstr(self):
        # The string itself is already the newline-joined representation.
        return self

    n = nlstr = property(get_nlstr)

    def get_paths(self):
        # Cache Path objects for lines naming existing filesystem entries.
        try:
            cached = self.__paths
        except AttributeError:
            cached = self.__paths = [Path(p) for p in self.split('\n')
                                     if os.path.exists(p)]
        return cached

    p = paths = property(get_paths)
73 73
74 74 # FIXME: We need to reimplement type specific displayhook and then add this
75 75 # back as a custom printer. This should also be moved outside utils into the
76 76 # core.
77 77
78 78 # def print_lsstring(arg):
79 79 # """ Prettier (non-repr-like) and more informative printer for LSString """
80 80 # print "LSString (.p, .n, .l, .s available). Value:"
81 81 # print arg
82 82 #
83 83 #
84 84 # print_lsstring = result_display.when_type(LSString)(print_lsstring)
85 85
86 86
class SList(list):
    """List derivative with a special access attributes.

    These are normal lists, but with the special attributes:

    * .l (or .list) : value as list (the list itself).
    * .n (or .nlstr): value as a string, joined on newlines.
    * .s (or .spstr): value as a string, joined on spaces.
    * .p (or .paths): list of path objects (requires path.py package)

    Any values which require transformations are computed only once and
    cached."""

    def get_list(self):
        # The list form is the object itself; no caching needed.
        return self

    l = list = property(get_list)

    def get_spstr(self):
        # Space-joined form, computed once and cached.
        try:
            return self.__spstr
        except AttributeError:
            self.__spstr = ' '.join(self)
            return self.__spstr

    s = spstr = property(get_spstr)

    def get_nlstr(self):
        # Newline-joined form, computed once and cached.
        try:
            return self.__nlstr
        except AttributeError:
            self.__nlstr = '\n'.join(self)
            return self.__nlstr

    n = nlstr = property(get_nlstr)

    def get_paths(self):
        # Path objects for the elements that name existing files, cached.
        try:
            return self.__paths
        except AttributeError:
            self.__paths = [Path(p) for p in self if os.path.exists(p)]
            return self.__paths

    p = paths = property(get_paths)

    def grep(self, pattern, prune = False, field = None):
        """ Return all strings matching 'pattern' (a regex or callable)

        This is case-insensitive. If prune is true, return all items
        NOT matching the pattern.

        If field is specified, the match must occur in the specified
        whitespace-separated field.

        Examples::

            a.grep( lambda x: x.startswith('C') )
            a.grep('Cha.*log', prune=1)
            a.grep('chm', field=-1)
        """

        def match_target(s):
            # Select the whole line, or just one whitespace-separated field.
            if field is None:
                return s
            parts = s.split()
            try:
                tgt = parts[field]
                return tgt
            except IndexError:
                # Lines too short to have the requested field never match.
                return ""

        # A string pattern becomes a case-insensitive regex search;
        # anything else is assumed to be a callable predicate.
        if isinstance(pattern, str):
            pred = lambda x : re.search(pattern, x, re.IGNORECASE)
        else:
            pred = pattern
        if not prune:
            return SList([el for el in self if pred(match_target(el))])
        else:
            return SList([el for el in self if not pred(match_target(el))])

    def fields(self, *fields):
        """ Collect whitespace-separated fields from string list

        Allows quick awk-like usage of string lists.

        Example data (in var a, created by 'a = !ls -l')::

            -rwxrwxrwx  1 ville None      18 Dec 14  2006 ChangeLog
            drwxrwxrwx+ 6 ville None       0 Oct 24 18:05 IPython

        * ``a.fields(0)`` is ``['-rwxrwxrwx', 'drwxrwxrwx+']``
        * ``a.fields(1,0)`` is ``['1 -rwxrwxrwx', '6 drwxrwxrwx+']``
          (note the joining by space).
        * ``a.fields(-1)`` is ``['ChangeLog', 'IPython']``

        IndexErrors are ignored.

        Without args, fields() just split()'s the strings.
        """
        if len(fields) == 0:
            # No field selection: return each line split into all its fields.
            return [el.split() for el in self]

        res = SList()
        for el in [f.split() for f in self]:
            lineparts = []

            for fd in fields:
                try:
                    lineparts.append(el[fd])
                except IndexError:
                    # Requested field missing on this line: silently skip it.
                    pass
            if lineparts:
                res.append(" ".join(lineparts))

        return res

    def sort(self,field= None, nums = False):
        """ sort by specified fields (see fields())

        Example::

            a.sort(1, nums = True)

        Sorts a by second field, in numerical order (so that 21 > 3)

        """

        #decorate, sort, undecorate
        if field is not None:
            # Decoration is the selected field(s) of each line.
            dsu = [[SList([line]).fields(field), line] for line in self]
        else:
            # Decoration is the whole line itself.
            dsu = [[line, line] for line in self]
        if nums:
            # Replace each decoration with the integer formed by its digits
            # (0 when there are none), so "21" sorts after "3".
            for i in range(len(dsu)):
                numstr = "".join([ch for ch in dsu[i][0] if ch.isdigit()])
                try:
                    n = int(numstr)
                except ValueError:
                    n = 0
                dsu[i][0] = n


        dsu.sort()
        return SList([t[1] for t in dsu])
231 231
232 232
233 233 # FIXME: We need to reimplement type specific displayhook and then add this
234 234 # back as a custom printer. This should also be moved outside utils into the
235 235 # core.
236 236
237 237 # def print_slist(arg):
238 238 # """ Prettier (non-repr-like) and more informative printer for SList """
239 239 # print "SList (.p, .n, .l, .s, .grep(), .fields(), sort() available):"
240 240 # if hasattr(arg, 'hideonce') and arg.hideonce:
241 241 # arg.hideonce = False
242 242 # return
243 243 #
244 244 # nlprint(arg) # This was a nested list printer, now removed.
245 245 #
246 246 # print_slist = result_display.when_type(SList)(print_slist)
247 247
248 248
def indent(instr, nspaces=4, ntabs=0, flatten=False):
    """Indent a string a given number of spaces or tabstops.

    indent(str,nspaces=4,ntabs=0) -> indent str by ntabs+nspaces.

    Parameters
    ----------

    instr : basestring
        The string to be indented.
    nspaces : int (default: 4)
        The number of spaces to be indented.
    ntabs : int (default: 0)
        The number of tabs to be indented.
    flatten : bool (default: False)
        Whether to scrub existing indentation.  If True, all lines will be
        aligned to the same indentation.  If False, existing indentation will
        be strictly increased.

    Returns
    -------

    str|unicode : string indented by ntabs and nspaces.

    """
    if instr is None:
        return
    ind = '\t' * ntabs + ' ' * nspaces
    # flatten replaces any existing leading whitespace; otherwise the new
    # indent is simply prepended at each line start.
    pattern = r'^\s*' if flatten else r'^'
    outstr = re.sub(re.compile(pattern, re.MULTILINE), ind, instr)
    # A trailing newline would otherwise gain a dangling indent; trim it.
    if outstr.endswith(os.linesep + ind):
        outstr = outstr[:-len(ind)]
    return outstr
286 286
287 287
def list_strings(arg):
    """Always return a list of strings, given a string or list of strings
    as input.

    Examples
    --------
    ::

        In [7]: list_strings('A single string')
        Out[7]: ['A single string']

        In [8]: list_strings(['A single string in a list'])
        Out[8]: ['A single string in a list']

        In [9]: list_strings(['A','list','of','strings'])
        Out[9]: ['A', 'list', 'of', 'strings']
    """
    # A bare string is wrapped; anything else is passed through untouched.
    return [arg] if isinstance(arg, str) else arg
310 310
311 311
def marquee(txt='', width=78, mark='*'):
    """Return the input string centered in a 'marquee'.

    Examples
    --------
    ::

        In [16]: marquee('A test',40)
        Out[16]: '**************** A test ****************'

        In [17]: marquee('A test',40,'-')
        Out[17]: '---------------- A test ----------------'

        In [18]: marquee('A test',40,' ')
        Out[18]: '                 A test                 '

    """
    if not txt:
        # No text: fill the whole width with the marker pattern.
        return (mark * width)[:width]
    # Marker repetitions on each side, accounting for the two spaces.
    nmark = max((width - len(txt) - 2) // len(mark) // 2, 0)
    border = mark * nmark
    return '{0} {1} {2}'.format(border, txt, border)
335 335
336 336
# Leading-whitespace matcher shared by num_ini_spaces.
ini_spaces_re = re.compile(r'^(\s+)')

def num_ini_spaces(strng):
    """Return the number of initial spaces in a string"""
    m = ini_spaces_re.match(strng)
    # match.end() is exactly the count of leading whitespace characters.
    return m.end() if m else 0
347 347
348 348
def format_screen(strng):
    """Format a string for screen printing.

    This removes some latex-type format codes."""
    # Strip latex-style line continuations: a backslash at end of line.
    return re.sub(r'\\$', '', strng, flags=re.MULTILINE)
357 357
358 358
def dedent(text):
    """Equivalent of textwrap.dedent that ignores unindented first line.

    This means it will still dedent strings like:
    '''foo
    is a bar
    '''

    For use in wrap_paragraphs.
    """
    if text.startswith('\n'):
        # Leading blank line: plain dedent already does the right thing.
        return textwrap.dedent(text)

    head, sep, tail = text.partition('\n')
    if not sep:
        # Single line, nothing special to preserve.
        return textwrap.dedent(text)

    # Keep the first line as-is; dedent only the remainder.
    return head + '\n' + textwrap.dedent(tail)
384 384
385 385
def wrap_paragraphs(text, ncols=80):
    """Wrap multiple paragraphs to fit a specified width.

    This is equivalent to textwrap.wrap, but with support for multiple
    paragraphs, as separated by empty lines.

    Returns
    -------

    list of complete paragraphs, wrapped to fill `ncols` columns.
    """
    paragraph_re = re.compile(r'\n(\s*\n)+', re.MULTILINE)
    indent_re = re.compile(r'\n\s+', re.MULTILINE)
    cleaned = dedent(text).strip()
    # split() alternates paragraphs with the blank-line separators that
    # matched; keep every other entry to get just the paragraphs.
    paragraphs = paragraph_re.split(cleaned)[::2]
    wrapped = []
    for para in paragraphs:
        # Indentation that survived dedent is presumed to be deliberate
        # formatting, so only flush paragraphs get re-filled.
        if indent_re.search(para) is None:
            para = textwrap.fill(para, ncols)
        wrapped.append(para)
    return wrapped
410 410
411 411
def long_substr(data):
    """Return the longest common substring in a list of strings.

    Credit: http://stackoverflow.com/questions/2892931/longest-common-substring-from-more-than-two-strings-python
    """
    if len(data) == 1:
        # A single string is trivially its own longest common substring.
        return data[0]
    best = ''
    if len(data) > 1 and data[0]:
        reference = data[0]
        for start in range(len(reference)):
            for size in range(len(reference) - start + 1):
                if size <= len(best):
                    # Only candidates longer than the current best matter.
                    continue
                candidate = reference[start:start + size]
                if all(candidate in item for item in data):
                    best = candidate
    return best
426 426
427 427
def strip_email_quotes(text):
    """Strip leading email quotation characters ('>').

    Removes any combination of leading '>' interspersed with whitespace that
    appears *identically* in all lines of the input text.

    Parameters
    ----------
    text : str

    Examples
    --------

    Simple uses::

        In [2]: strip_email_quotes('> > text')
        Out[2]: 'text'

        In [3]: strip_email_quotes('> > text\\n> > more')
        Out[3]: 'text\\nmore'

    Note how only the common prefix that appears in all lines is stripped::

        In [4]: strip_email_quotes('> > text\\n> > more\\n> more...')
        Out[4]: '> text\\n> more\\nmore...'

    So if any line has no quote marks ('>') , then none are stripped from any
    of them ::

        In [5]: strip_email_quotes('> > text\\n> > more\\nlast different')
        Out[5]: '> > text\\n> > more\\nlast different'
    """
    lines = text.splitlines()
    matches = set()
    # Collect the quote prefix of every line; bail out (break) as soon as a
    # line without a prefix is found, which skips the for/else 'else' below
    # and leaves the text unmodified.
    for line in lines:
        prefix = re.match(r'^(\s*>[ >]*)', line)
        if prefix:
            matches.add(prefix.group(1))
        else:
            break
    else:
        # Every line is quoted: strip only the prefix common to all lines,
        # found as the longest common substring of the collected prefixes.
        prefix = long_substr(list(matches))
        if prefix:
            strip = len(prefix)
            text = '\n'.join([ ln[strip:] for ln in lines])
    return text
474 474
def strip_ansi(source):
    """
    Remove ansi escape codes from text.

    Parameters
    ----------
    source : str
        Source to remove the ansi from
    """
    # "[0-9;]*" (rather than the previous "(\d|;)+?") also matches the bare
    # reset sequence "\x1b[m", which has no parameters at all; it still only
    # strips SGR ("m"-terminated) sequences, a superset of the old behavior.
    return re.sub(r'\033\[[0-9;]*m', '', source)
485 485
486 486
class EvalFormatter(Formatter):
    """A String Formatter that allows evaluation of simple expressions.

    Note that this version interprets a : as specifying a format string (as per
    standard string formatting), so if slicing is required, you must explicitly
    create a slice.

    This is to be used in templating cases, such as the parallel batch
    script templates, where simple arithmetic on arguments is useful.

    Examples
    --------
    ::

        In [1]: f = EvalFormatter()
        In [2]: f.format('{n//4}', n=8)
        Out[2]: '2'

        In [3]: f.format("{greeting[slice(2,4)]}", greeting="Hello")
        Out[3]: 'll'
    """

    def get_field(self, name, args, kwargs):
        # Evaluate the field as a Python expression in the kwargs namespace.
        value = eval(name, kwargs)
        return value, name
511 511
512 512 #XXX: As of Python 3.4, the format string parsing no longer splits on a colon
513 513 # inside [], so EvalFormatter can handle slicing. Once we only support 3.4 and
514 514 # above, it should be possible to remove FullEvalFormatter.
515 515
class FullEvalFormatter(Formatter):
    """A String Formatter that allows evaluation of simple expressions.

    Any time a format key is not found in the kwargs,
    it will be tried as an expression in the kwargs namespace.

    Note that this version allows slicing using [1:2], so you cannot specify
    a format string. Use :class:`EvalFormatter` to permit format strings.

    Examples
    --------
    ::

        In [1]: f = FullEvalFormatter()
        In [2]: f.format('{n//4}', n=8)
        Out[2]: '2'

        In [3]: f.format('{list(range(5))[2:4]}')
        Out[3]: '[2, 3]'

        In [4]: f.format('{3*2}')
        Out[4]: '6'
    """
    # copied from Formatter._vformat with minor changes to allow eval
    # and replace the format_spec code with slicing
    def vformat(self, format_string, args, kwargs):
        """Assemble the output, eval()-ing each replacement field in kwargs."""
        result = []
        for literal_text, field_name, format_spec, conversion in \
                self.parse(format_string):

            # output the literal text
            if literal_text:
                result.append(literal_text)

            # if there's a field, output it
            if field_name is not None:
                # this is some markup, find the object and do
                # the formatting

                if format_spec:
                    # override format spec, to allow slicing:
                    # "{a:b}" is rejoined into the expression "a:b" so that
                    # slice syntax like [1:2] survives the Formatter parse.
                    field_name = ':'.join([field_name, format_spec])

                # eval the contents of the field for the object
                # to be formatted
                obj = eval(field_name, kwargs)

                # do any conversion on the resulting object
                obj = self.convert_field(obj, conversion)

                # format the object and append to the result
                result.append(self.format_field(obj, ''))

        # cast_unicode normalizes each piece to text before joining.
        return ''.join(py3compat.cast_unicode(s) for s in result)
570 570
571 571
class DollarFormatter(FullEvalFormatter):
    """Formatter allowing Itpl style $foo replacement, for names and attribute
    access only. Standard {foo} replacement also works, and allows full
    evaluation of its arguments.

    Examples
    --------
    ::

        In [1]: f = DollarFormatter()
        In [2]: f.format('{n//4}', n=8)
        Out[2]: '2'

        In [3]: f.format('23 * 76 is $result', result=23*76)
        Out[3]: '23 * 76 is 1748'

        In [4]: f.format('$a or {b}', a=1, b=2)
        Out[4]: '1 or 2'
    """
    # Raw string so \$, \w and \. reach the regex engine as regex escapes
    # (non-raw they are invalid string escapes -> DeprecationWarning).
    # The lookahead skips $names that appear inside single-quoted spans.
    _dollar_pattern_ignore_single_quote = re.compile(r"(.*?)\$(\$?[\w\.]+)(?=([^']*'[^']*')*[^']*$)")

    def parse(self, fmt_string):
        """Yield ``(literal, field, spec, conversion)`` tuples, additionally
        turning ``$name`` markers found in the literal text into fields."""
        for literal_txt, field_name, format_spec, conversion \
                in Formatter.parse(self, fmt_string):

            # Find $foo patterns in the literal text.
            continue_from = 0
            txt = ""
            for m in self._dollar_pattern_ignore_single_quote.finditer(literal_txt):
                new_txt, new_field = m.group(1, 2)
                # $$foo is an escape: keep it as literal text "$foo".
                if new_field.startswith("$"):
                    txt += new_txt + new_field
                else:
                    yield (txt + new_txt, new_field, "", None)
                    txt = ""
                continue_from = m.end()

            # Re-yield the {foo} style pattern
            yield (txt + literal_txt[continue_from:], field_name, format_spec, conversion)
611 611
612 612 #-----------------------------------------------------------------------------
613 613 # Utils to columnize a list of string
614 614 #-----------------------------------------------------------------------------
615 615
616 616 def _col_chunks(l, max_rows, row_first=False):
617 617 """Yield successive max_rows-sized column chunks from l."""
618 618 if row_first:
619 619 ncols = (len(l) // max_rows) + (len(l) % max_rows > 0)
620 620 for i in range(ncols):
621 621 yield [l[j] for j in range(i, len(l), ncols)]
622 622 else:
623 623 for i in range(0, len(l), max_rows):
624 624 yield l[i:(i + max_rows)]
625 625
626 626
627 627 def _find_optimal(rlist, row_first=False, separator_size=2, displaywidth=80):
628 628 """Calculate optimal info to columnize a list of string"""
629 629 for max_rows in range(1, len(rlist) + 1):
630 630 col_widths = list(map(max, _col_chunks(rlist, max_rows, row_first)))
631 631 sumlength = sum(col_widths)
632 632 ncols = len(col_widths)
633 633 if sumlength + separator_size * (ncols - 1) <= displaywidth:
634 634 break
635 635 return {'num_columns': ncols,
636 636 'optimal_separator_width': (displaywidth - sumlength) // (ncols - 1) if (ncols - 1) else 0,
637 637 'max_rows': max_rows,
638 638 'column_widths': col_widths
639 639 }
640 640
641 641
642 642 def _get_or_default(mylist, i, default=None):
643 643 """return list item number, or default if don't exist"""
644 644 if i >= len(mylist):
645 645 return default
646 646 else :
647 647 return mylist[i]
648 648
649 649
def compute_item_matrix(items, row_first=False, empty=None, *args, **kwargs):
    """Returns a nested list, and info to columnize items

    Parameters
    ----------
    items
        list of strings to columnize
    row_first : (default False)
        Whether to compute columns for a row-first matrix instead of
        column-first (default).
    empty : (default None)
        default value to fill list if needed
    separator_size : int (default=2)
        How many characters will be used as a separation between each column.
    displaywidth : int (default=80)
        The width of the area onto which the columns should enter

    Returns
    -------
    strings_matrix
        nested list of strings; the outer list holds the rows, each inner
        list holds one entry per column.  Positions past the end of
        ``items`` are filled with ``empty``.
    dict_info
        layout dict as produced by ``_find_optimal``: ``num_columns``,
        ``max_rows``, ``column_widths`` and ``optimal_separator_width``.

    Examples
    --------
    ::

        In [1]: l = ['aaa','b','cc','d','eeeee','f','g','h','i','j','k','l']
        In [2]: list, info = compute_item_matrix(l, displaywidth=12)
        In [3]: list
        Out[3]: [['aaa', 'f', 'k'], ['b', 'g', 'l'], ['cc', 'h', None], ['d', 'i', None], ['eeeee', 'j', None]]
        In [4]: ideal = {'num_columns': 3, 'column_widths': [5, 1, 1], 'optimal_separator_width': 2, 'max_rows': 5}
        In [5]: all((info[k] == ideal[k] for k in ideal.keys()))
        Out[5]: True
    """
    info = _find_optimal(list(map(len, items)), row_first, *args, **kwargs)
    nrow, ncol = info['max_rows'], info['num_columns']
    # Map a (row, col) cell to its index in the flat ``items`` list; the two
    # layouts differ only in which axis varies fastest.
    if row_first:
        flat_index = lambda r, c: r * ncol + c
    else:
        flat_index = lambda r, c: c * nrow + r
    matrix = [[_get_or_default(items, flat_index(r, c), default=empty)
               for c in range(ncol)]
              for r in range(nrow)]
    return (matrix, info)
708 708
709 709
def columnize(items, row_first=False, separator='  ', displaywidth=80, spread=False):
    """ Transform a list of strings into a single string with columns.

    Parameters
    ----------
    items : sequence of strings
        The strings to process.

    row_first : (default False)
        Whether to compute columns for a row-first matrix instead of
        column-first (default).

    separator : str, optional [default is two spaces]
        The string that separates columns.

    displaywidth : int, optional [default is 80]
        Width of the display in number of characters.

    spread : bool, optional [default is False]
        If True, pad the separator so the columns spread out to fill
        ``displaywidth``.

    Returns
    -------
    The formatted string.
    """
    if not items:
        return '\n'
    matrix, info = compute_item_matrix(items, row_first=row_first,
                                       separator_size=len(separator),
                                       displaywidth=displaywidth)
    if spread:
        separator = separator.ljust(int(info['optimal_separator_width']))
    widths = info['column_widths']
    lines = []
    for row in matrix:
        # Drop empty/None fill cells (same effect as filter(None, row)).
        cells = [cell for cell in row if cell]
        lines.append(separator.join(
            cell.ljust(w, ' ') for cell, w in zip(cells, widths)))
    return '\n'.join(lines) + '\n'
740 740
741 741
def get_text_list(list_, last_sep=' and ', sep=", ", wrap_item_with=""):
    """
    Return a string with a natural enumeration of items

    >>> get_text_list(['a', 'b', 'c', 'd'])
    'a, b, c and d'
    >>> get_text_list(['a', 'b', 'c'], ' or ')
    'a, b or c'
    >>> get_text_list(['a', 'b', 'c'], ', ')
    'a, b, c'
    >>> get_text_list(['a', 'b'], ' or ')
    'a or b'
    >>> get_text_list(['a'])
    'a'
    >>> get_text_list([])
    ''
    >>> get_text_list(['a', 'b'], wrap_item_with="`")
    '`a` and `b`'
    >>> get_text_list(['a', 'b', 'c', 'd'], " = ", sep=" + ")
    'a + b + c = d'
    """
    if not list_:
        return ''
    if wrap_item_with:
        # Surround every item with the wrapper string, e.g. `a`.
        list_ = ['%s%s%s' % (wrap_item_with, item, wrap_item_with)
                 for item in list_]
    if len(list_) == 1:
        return list_[0]
    # Join all but the last item with ``sep``, then attach the final item
    # with the (usually different) ``last_sep``.
    head = sep.join(i for i in list_[:-1])
    return '%s%s%s' % (head, last_sep, list_[-1])
@@ -1,590 +1,590 b''
1 1 """Patched version of standard library tokenize, to deal with various bugs.
2 2
3 3 Based on Python 3.2 code.
4 4
5 5 Patches:
6 6
7 7 - Gareth Rees' patch for Python issue #12691 (untokenizing)
8 8 - Except we don't encode the output of untokenize
9 9 - Python 2 compatible syntax, so that it can be byte-compiled at installation
10 10 - Newlines in comments and blank lines should be either NL or NEWLINE, depending
11 11 on whether they are in a multi-line statement. Filed as Python issue #17061.
12 12 - Export generate_tokens & TokenError
13 13 - u and rb literals are allowed under Python 3.3 and above.
14 14
15 15 ------------------------------------------------------------------------------
16 16
17 17 Tokenization help for Python programs.
18 18
19 19 tokenize(readline) is a generator that breaks a stream of bytes into
20 20 Python tokens. It decodes the bytes according to PEP-0263 for
21 21 determining source file encoding.
22 22
23 23 It accepts a readline-like method which is called repeatedly to get the
24 24 next line of input (or b"" for EOF). It generates 5-tuples with these
25 25 members:
26 26
27 27 the token type (see token.py)
28 28 the token (a string)
29 29 the starting (row, column) indices of the token (a 2-tuple of ints)
30 30 the ending (row, column) indices of the token (a 2-tuple of ints)
31 31 the original line (string)
32 32
33 33 It is designed to match the working of the Python tokenizer exactly, except
34 34 that it produces COMMENT tokens for comments and gives type OP for all
35 35 operators. Additionally, all token lists start with an ENCODING token
36 36 which tells you which encoding was used to decode the bytes stream.
37 37 """
38 38
39 39 __author__ = 'Ka-Ping Yee <ping@lfw.org>'
40 40 __credits__ = ('GvR, ESR, Tim Peters, Thomas Wouters, Fred Drake, '
41 41 'Skip Montanaro, Raymond Hettinger, Trent Nelson, '
42 42 'Michael Foord')
43 43 import builtins
44 44 import re
45 45 import sys
46 46 from token import *
47 47 from codecs import lookup, BOM_UTF8
48 48 import collections
49 49 from io import TextIOWrapper
# PEP-263 coding-cookie matcher.  Raw string so "\s" and "\w" reach the
# regex engine intact instead of being (invalid) string escapes.
cookie_re = re.compile(r"coding[:=]\s*([-\w.]+)")
51 51
52 52 import token
53 53 __all__ = token.__all__ + ["COMMENT", "tokenize", "detect_encoding",
54 54 "NL", "untokenize", "ENCODING", "TokenInfo"]
55 55 del token
56 56
57 57 __all__ += ["generate_tokens", "TokenError"]
58 58
59 59 COMMENT = N_TOKENS
60 60 tok_name[COMMENT] = 'COMMENT'
61 61 NL = N_TOKENS + 1
62 62 tok_name[NL] = 'NL'
63 63 ENCODING = N_TOKENS + 2
64 64 tok_name[ENCODING] = 'ENCODING'
65 65 N_TOKENS += 3
66 66
class TokenInfo(collections.namedtuple('TokenInfo', 'type string start end line')):
    """A 5-tuple ``(type, string, start, end, line)`` describing one token."""

    def __repr__(self):
        # Show the numeric token type together with its symbolic name,
        # e.g. ``1 (NAME)``.
        labelled_type = '%d (%s)' % (self.type, tok_name[self.type])
        return ('TokenInfo(type=%s, string=%r, start=%r, end=%r, line=%r)'
                % self._replace(type=labelled_type))
72 72
def group(*choices):
    """Join the alternatives into one parenthesised regex group: (a|b|c)."""
    return '(' + '|'.join(choices) + ')'

def any(*choices):
    """A group repeated zero or more times.  (Shadows builtins.any here.)"""
    return group(*choices) + '*'

def maybe(*choices):
    """An optional group (zero or one occurrence)."""
    return group(*choices) + '?'
76 76
# Note: we use unicode matching for names ("\w") but ascii matching for
# number literals.
Whitespace = r'[ \f\t]*'
Comment = r'#[^\r\n]*'
Ignore = Whitespace + any(r'\\\r?\n' + Whitespace) + maybe(Comment)
Name = r'\w+'

# Integer literal fragments (ASCII digits only, per the note above).
Hexnumber = r'0[xX][0-9a-fA-F]+'
Binnumber = r'0[bB][01]+'
Octnumber = r'0[oO][0-7]+'
Decnumber = r'(?:0+|[1-9][0-9]*)'
Intnumber = group(Hexnumber, Binnumber, Octnumber, Decnumber)
Exponent = r'[eE][-+]?[0-9]+'
Pointfloat = group(r'[0-9]+\.[0-9]*', r'\.[0-9]+') + maybe(Exponent)
Expfloat = r'[0-9]+' + Exponent
Floatnumber = group(Pointfloat, Expfloat)
Imagnumber = group(r'[0-9]+[jJ]', Floatnumber + r'[jJ]')
Number = group(Imagnumber, Floatnumber, Intnumber)
# Optional b/r/u string prefixes (and their rb combinations/cases).
StringPrefix = r'(?:[bB][rR]?|[rR][bB]?|[uU])?'

# Tail end of ' string.
Single = r"[^'\\]*(?:\\.[^'\\]*)*'"
# Tail end of " string.
Double = r'[^"\\]*(?:\\.[^"\\]*)*"'
# Tail end of ''' string.
Single3 = r"[^'\\]*(?:(?:\\.|'(?!''))[^'\\]*)*'''"
# Tail end of """ string.
Double3 = r'[^"\\]*(?:(?:\\.|"(?!""))[^"\\]*)*"""'
Triple = group(StringPrefix + "'''", StringPrefix + '"""')
# Single-line ' or " string.
String = group(StringPrefix + r"'[^\n'\\]*(?:\\.[^\n'\\]*)*'",
               StringPrefix + r'"[^\n"\\]*(?:\\.[^\n"\\]*)*"')

# Because of leftmost-then-longest match semantics, be sure to put the
# longest operators first (e.g., if = came before ==, == would get
# recognized as two instances of =).
Operator = group(r"\*\*=?", r">>=?", r"<<=?", r"!=",
                 r"//=?", r"->",
                 r"[+\-*/%&|^=<>]=?",
                 r"~")

Bracket = '[][(){}]'
Special = group(r'\r?\n', r'\.\.\.', r'[:;.,@]')
Funny = group(Operator, Bracket, Special)

PlainToken = group(Number, Funny, String, Name)
Token = Ignore + PlainToken

# First (or only) line of ' or " string.
ContStr = group(StringPrefix + r"'[^\n'\\]*(?:\\.[^\n'\\]*)*" +
                group("'", r'\\\r?\n'),
                StringPrefix + r'"[^\n"\\]*(?:\\.[^\n"\\]*)*' +
                group('"', r'\\\r?\n'))
PseudoExtras = group(r'\\\r?\n', Comment, Triple)
PseudoToken = Whitespace + group(PseudoExtras, Number, Funny, ContStr, Name)
132 132
133 133 def _compile(expr):
134 134 return re.compile(expr, re.UNICODE)
135 135
# Pre-compiled matchers for whole tokens and for string tails.
tokenprog, pseudoprog, single3prog, double3prog = map(
    _compile, (Token, PseudoToken, Single3, Double3))
# Maps an opening quote (with optional prefix) to the matcher for the rest
# of the string; prefix-only keys map to None (resolved via token[1]/[2]).
endprogs = {"'": _compile(Single), '"': _compile(Double),
            "'''": single3prog, '"""': double3prog,
            "r'''": single3prog, 'r"""': double3prog,
            "b'''": single3prog, 'b"""': double3prog,
            "R'''": single3prog, 'R"""': double3prog,
            "B'''": single3prog, 'B"""': double3prog,
            "br'''": single3prog, 'br"""': double3prog,
            "bR'''": single3prog, 'bR"""': double3prog,
            "Br'''": single3prog, 'Br"""': double3prog,
            "BR'''": single3prog, 'BR"""': double3prog,
            'r': None, 'R': None, 'b': None, 'B': None}

# Recognized opening sequences for triple-quoted strings.
triple_quoted = {}
for t in ("'''", '"""',
          "r'''", 'r"""', "R'''", 'R"""',
          "b'''", 'b"""', "B'''", 'B"""',
          "br'''", 'br"""', "Br'''", 'Br"""',
          "bR'''", 'bR"""', "BR'''", 'BR"""'):
    triple_quoted[t] = t
# Recognized opening sequences for single-quoted strings.
single_quoted = {}
for t in ("'", '"',
          "r'", 'r"', "R'", 'R"',
          "b'", 'b"', "B'", 'B"',
          "br'", 'br"', "Br'", 'Br"',
          "bR'", 'bR"', "BR'", 'BR"' ):
    single_quoted[t] = t

# Also accept u/U and rb-style prefixes (Python 3.3+ literal syntax).
for _prefix in ['rb', 'rB', 'Rb', 'RB', 'u', 'U']:
    _t2 = _prefix+'"""'
    endprogs[_t2] = double3prog
    triple_quoted[_t2] = _t2
    _t1 = _prefix + "'''"
    endprogs[_t1] = single3prog
    triple_quoted[_t1] = _t1
    single_quoted[_prefix+'"'] = _prefix+'"'
    single_quoted[_prefix+"'"] = _prefix+"'"
del _prefix, _t2, _t1
endprogs['u'] = None
endprogs['U'] = None

# Drop the helper so it does not leak into the module namespace.
del _compile
179 179
# Tab stop width used when measuring indentation columns.
tabsize = 8

# Raised for unterminated constructs, e.g. EOF inside a multi-line string
# or multi-line statement.
class TokenError(Exception): pass

# NOTE(review): not raised anywhere in this module; apparently kept for
# compatibility with the stdlib tokenize API -- verify before removing.
class StopTokenizing(Exception): pass
185 185
186 186
class Untokenizer:
    """Rebuild source text from a token stream.

    Accumulates output fragments in ``self.tokens`` while tracking the
    position (``prev_row``/``prev_col``) of the last emitted token so that
    whitespace can be reconstructed.
    """

    def __init__(self):
        self.tokens = []         # output fragments, joined at the end
        self.prev_row = 1        # row of the end of the last emitted token
        self.prev_col = 0        # column of the end of the last emitted token
        self.encoding = 'utf-8'  # updated when an ENCODING token is seen

    def add_whitespace(self, tok_type, start):
        # Pad with spaces so the next token lands at *start* (row, col).
        row, col = start
        assert row >= self.prev_row
        col_offset = col - self.prev_col
        if col_offset > 0:
            self.tokens.append(" " * col_offset)
        elif row > self.prev_row and tok_type not in (NEWLINE, NL, ENDMARKER):
            # Line was backslash-continued.
            self.tokens.append(" ")

    def untokenize(self, tokens):
        # Full 5-tuple mode; falls back to compat() when the stream only
        # carries (type, string) 2-tuples.
        iterable = iter(tokens)
        for t in iterable:
            if len(t) == 2:
                self.compat(t, iterable)
                break
            tok_type, token, start, end = t[:4]
            if tok_type == ENCODING:
                self.encoding = token
                continue
            self.add_whitespace(tok_type, start)
            self.tokens.append(token)
            self.prev_row, self.prev_col = end
            if tok_type in (NEWLINE, NL):
                self.prev_row += 1
                self.prev_col = 0
        return "".join(self.tokens)

    def compat(self, token, iterable):
        # Positionless mode: re-insert spacing heuristically (after names
        # and numbers, between adjacent strings) and replay INDENT/DEDENT.
        # This import is here to avoid problems when the itertools
        # module is not built yet and tokenize is imported.
        from itertools import chain
        startline = False
        prevstring = False
        indents = []
        toks_append = self.tokens.append

        for tok in chain([token], iterable):
            toknum, tokval = tok[:2]
            if toknum == ENCODING:
                self.encoding = tokval
                continue

            if toknum in (NAME, NUMBER):
                tokval += ' '

            # Insert a space between two consecutive strings
            if toknum == STRING:
                if prevstring:
                    tokval = ' ' + tokval
                prevstring = True
            else:
                prevstring = False

            if toknum == INDENT:
                indents.append(tokval)
                continue
            elif toknum == DEDENT:
                indents.pop()
                continue
            elif toknum in (NEWLINE, NL):
                startline = True
            elif startline and indents:
                toks_append(indents[-1])
                startline = False
            toks_append(tokval)
261 261
262 262
def untokenize(tokens):
    """
    Convert ``tokens`` (an iterable) back into Python source code. Return
    a bytes object, encoded using the encoding specified by the last
    ENCODING token in ``tokens``, or UTF-8 if no ENCODING token is found.

    The result is guaranteed to tokenize back to match the input so that
    the conversion is lossless and round-trips are assured.  The
    guarantee applies only to the token type and token string as the
    spacing between tokens (column positions) may change.

    :func:`untokenize` has two modes. If the input tokens are sequences
    of length 2 (``type``, ``string``) then spaces are added as necessary to
    preserve the round-trip property.

    If the input tokens are sequences of length 4 or more (``type``,
    ``string``, ``start``, ``end``), as returned by :func:`tokenize`, then
    spaces are added so that each token appears in the result at the
    position indicated by ``start`` and ``end``, if possible.
    """
    # Delegate to a fresh Untokenizer so repeated calls share no state.
    converter = Untokenizer()
    return converter.untokenize(tokens)
284 284
285 285
286 286 def _get_normal_name(orig_enc):
287 287 """Imitates get_normal_name in tokenizer.c."""
288 288 # Only care about the first 12 characters.
289 289 enc = orig_enc[:12].lower().replace("_", "-")
290 290 if enc == "utf-8" or enc.startswith("utf-8-"):
291 291 return "utf-8"
292 292 if enc in ("latin-1", "iso-8859-1", "iso-latin-1") or \
293 293 enc.startswith(("latin-1-", "iso-8859-1-", "iso-latin-1-")):
294 294 return "iso-8859-1"
295 295 return orig_enc
296 296
def detect_encoding(readline):
    """
    The detect_encoding() function is used to detect the encoding that should
    be used to decode a Python source file. It requires one argument, readline,
    in the same way as the tokenize() generator.

    It will call readline a maximum of twice, and return the encoding used
    (as a string) and a list of any lines (left as bytes) it has read in.

    It detects the encoding from the presence of a utf-8 bom or an encoding
    cookie as specified in pep-0263. If both a bom and a cookie are present,
    but disagree, a SyntaxError will be raised. If the encoding cookie is an
    invalid charset, raise a SyntaxError. Note that if a utf-8 bom is found,
    'utf-8-sig' is returned.

    If no encoding is specified, then the default of 'utf-8' will be returned.
    """
    bom_found = False
    encoding = None
    default = 'utf-8'
    def read_or_stop():
        # Treat StopIteration from the readline callable as EOF.
        try:
            return readline()
        except StopIteration:
            return b''

    def find_cookie(line):
        # Return the normalised encoding named in a PEP-263 cookie on
        # *line*, or None if the line carries no cookie.
        try:
            # Decode as UTF-8. Either the line is an encoding declaration,
            # in which case it should be pure ASCII, or it must be UTF-8
            # per default encoding.
            line_string = line.decode('utf-8')
        except UnicodeDecodeError:
            raise SyntaxError("invalid or missing encoding declaration")

        matches = cookie_re.findall(line_string)
        if not matches:
            return None
        encoding = _get_normal_name(matches[0])
        try:
            codec = lookup(encoding)
        except LookupError:
            # This behaviour mimics the Python interpreter
            raise SyntaxError("unknown encoding: " + encoding)

        if bom_found:
            # A BOM constrains the cookie: only utf-8 is consistent.
            if encoding != 'utf-8':
                # This behaviour mimics the Python interpreter
                raise SyntaxError('encoding problem: utf-8')
            encoding += '-sig'
        return encoding

    first = read_or_stop()
    if first.startswith(BOM_UTF8):
        bom_found = True
        first = first[3:]
        default = 'utf-8-sig'
    if not first:
        return default, []

    encoding = find_cookie(first)
    if encoding:
        return encoding, [first]

    # PEP 263 allows the cookie on line 1 or 2 only.
    second = read_or_stop()
    if not second:
        return default, [first]

    encoding = find_cookie(second)
    if encoding:
        return encoding, [first, second]

    return default, [first, second]
370 370
371 371
def open(filename):
    """Open a file in read only mode using the encoding detected by
    detect_encoding().
    """
    # This function shadows the builtin, hence the explicit builtins.open.
    raw = builtins.open(filename, 'rb')
    encoding, _consumed = detect_encoding(raw.readline)
    # Rewind: detect_encoding consumed up to two lines of the raw stream.
    raw.seek(0)
    stream = TextIOWrapper(raw, encoding, line_buffering=True)
    # Present a text-mode file object to callers that inspect .mode.
    stream.mode = 'r'
    return stream
382 382
383 383
def tokenize(readline):
    """
    The tokenize() generator requires one argument, readline, which
    must be a callable object which provides the same interface as the
    readline() method of built-in file objects. Each call to the function
    should return one line of input as bytes. Alternately, readline
    can be a callable function terminating with :class:`StopIteration`::

        readline = open(myfile, 'rb').__next__  # Example of alternate readline

    The generator produces 5-tuples with these members: the token type; the
    token string; a 2-tuple (srow, scol) of ints specifying the row and
    column where the token begins in the source; a 2-tuple (erow, ecol) of
    ints specifying the row and column where the token ends in the source;
    and the line on which the token was found. The line passed is the
    logical line; continuation lines are included.

    The first token sequence will always be an ENCODING token
    which tells you which encoding was used to decode the bytes stream.
    """
    # This import is here to avoid problems when the itertools module is not
    # built yet and tokenize is imported.
    from itertools import chain, repeat
    encoding, buffered = detect_encoding(readline)
    # Replay the lines detect_encoding consumed, then the rest of the
    # stream, then an endless tail of b"" so _tokenize sees a clean EOF.
    remaining = iter(readline, b"")
    padding = repeat(b"")
    lines = chain(buffered, remaining, padding)
    return _tokenize(lines.__next__, encoding)
411 411
412 412
def _tokenize(readline, encoding):
    """Core tokenizer loop shared by tokenize() and generate_tokens().

    Yields TokenInfo 5-tuples.  If *encoding* is not None, lines returned
    by *readline* are bytes and are decoded with it (and an ENCODING token
    is emitted first); otherwise lines are assumed to be str already.
    """
    lnum = parenlev = continued = 0
    numchars = '0123456789'
    contstr, needcont = '', 0        # state for a string spanning lines
    contline = None
    indents = [0]                    # stack of indentation columns

    if encoding is not None:
        if encoding == "utf-8-sig":
            # BOM will already have been stripped.
            encoding = "utf-8"
        yield TokenInfo(ENCODING, encoding, (0, 0), (0, 0), '')
    while True:             # loop over lines in stream
        try:
            line = readline()
        except StopIteration:
            line = b''

        if encoding is not None:
            line = line.decode(encoding)
        lnum += 1
        pos, max = 0, len(line)

        if contstr:                            # continued string
            if not line:
                raise TokenError("EOF in multi-line string", strstart)
            endmatch = endprog.match(line)
            if endmatch:
                pos = end = endmatch.end(0)
                yield TokenInfo(STRING, contstr + line[:end],
                                strstart, (lnum, end), contline + line)
                contstr, needcont = '', 0
                contline = None
            elif needcont and line[-2:] != '\\\n' and line[-3:] != '\\\r\n':
                # Single-quoted string not continued with a backslash.
                yield TokenInfo(ERRORTOKEN, contstr + line,
                                strstart, (lnum, len(line)), contline)
                contstr = ''
                contline = None
                continue
            else:
                contstr = contstr + line
                contline = contline + line
                continue

        elif parenlev == 0 and not continued:  # new statement
            if not line: break
            column = 0
            while pos < max:                   # measure leading whitespace
                if line[pos] == ' ':
                    column += 1
                elif line[pos] == '\t':
                    column = (column//tabsize + 1)*tabsize
                elif line[pos] == '\f':
                    column = 0
                else:
                    break
                pos += 1
            if pos == max:
                break

            if line[pos] in '#\r\n':           # skip comments or blank lines
                if line[pos] == '#':
                    comment_token = line[pos:].rstrip('\r\n')
                    nl_pos = pos + len(comment_token)
                    yield TokenInfo(COMMENT, comment_token,
                                    (lnum, pos), (lnum, pos + len(comment_token)), line)
                    yield TokenInfo(NEWLINE, line[nl_pos:],
                                    (lnum, nl_pos), (lnum, len(line)), line)
                else:
                    yield TokenInfo(NEWLINE, line[pos:],
                                    (lnum, pos), (lnum, len(line)), line)
                continue

            if column > indents[-1]:           # count indents or dedents
                indents.append(column)
                yield TokenInfo(INDENT, line[:pos], (lnum, 0), (lnum, pos), line)
            while column < indents[-1]:
                if column not in indents:
                    raise IndentationError(
                        "unindent does not match any outer indentation level",
                        ("<tokenize>", lnum, pos, line))
                indents = indents[:-1]
                yield TokenInfo(DEDENT, '', (lnum, pos), (lnum, pos), line)

        else:                                  # continued statement
            if not line:
                raise TokenError("EOF in multi-line statement", (lnum, 0))
            continued = 0

        while pos < max:
            pseudomatch = pseudoprog.match(line, pos)
            if pseudomatch:                                # scan for tokens
                start, end = pseudomatch.span(1)
                spos, epos, pos = (lnum, start), (lnum, end), end
                token, initial = line[start:end], line[start]

                if (initial in numchars or                 # ordinary number
                    (initial == '.' and token != '.' and token != '...')):
                    yield TokenInfo(NUMBER, token, spos, epos, line)
                elif initial in '\r\n':
                    # Inside brackets a newline is non-logical (NL).
                    yield TokenInfo(NL if parenlev > 0 else NEWLINE,
                                    token, spos, epos, line)
                elif initial == '#':
                    assert not token.endswith("\n")
                    yield TokenInfo(COMMENT, token, spos, epos, line)
                elif token in triple_quoted:
                    endprog = endprogs[token]
                    endmatch = endprog.match(line, pos)
                    if endmatch:                           # all on one line
                        pos = endmatch.end(0)
                        token = line[start:pos]
                        yield TokenInfo(STRING, token, spos, (lnum, pos), line)
                    else:
                        strstart = (lnum, start)           # multiple lines
                        contstr = line[start:]
                        contline = line
                        break
                elif initial in single_quoted or \
                    token[:2] in single_quoted or \
                    token[:3] in single_quoted:
                    if token[-1] == '\n':                  # continued string
                        strstart = (lnum, start)
                        # Resolve the tail matcher from the quote character
                        # (the prefix-only endprogs entries are None).
                        endprog = (endprogs[initial] or endprogs[token[1]] or
                                   endprogs[token[2]])
                        contstr, needcont = line[start:], 1
                        contline = line
                        break
                    else:                                  # ordinary string
                        yield TokenInfo(STRING, token, spos, epos, line)
                elif initial.isidentifier():               # ordinary name
                    yield TokenInfo(NAME, token, spos, epos, line)
                elif initial == '\\':                      # continued stmt
                    continued = 1
                else:
                    if initial in '([{':
                        parenlev += 1
                    elif initial in ')]}':
                        parenlev -= 1
                    yield TokenInfo(OP, token, spos, epos, line)
            else:
                yield TokenInfo(ERRORTOKEN, line[pos],
                                (lnum, pos), (lnum, pos+1), line)
                pos += 1

    for indent in indents[1:]:                 # pop remaining indent levels
        yield TokenInfo(DEDENT, '', (lnum, 0), (lnum, 0), '')
    yield TokenInfo(ENDMARKER, '', (lnum, 0), (lnum, 0), '')
560 560
561 561
562 562 # An undocumented, backwards compatible, API for all the places in the standard
563 563 # library that expect to be able to use tokenize with strings
def generate_tokens(readline):
    """Tokenize already-decoded text.

    *readline* should return str lines; no ENCODING token is produced
    because the encoding passed to _tokenize is None.
    """
    return _tokenize(readline, None)
566 566
if __name__ == "__main__":
    # Quick sanity check
    s = b'''def parseline(self, line):
        """Parse the line into a command name and a string containing
        the arguments. Returns a tuple containing (command, args, line).
        'command' and 'args' may be None if the line couldn't be parsed.
        """
        line = line.strip()
        if not line:
            return None, None, line
        elif line[0] == '?':
            line = 'help ' + line[1:]
        elif line[0] == '!':
            if hasattr(self, 'do_shell'):
                line = 'shell ' + line[1:]
            else:
                return None, None, line
        i, n = 0, len(line)
        while i < n and line[i] in self.identchars: i = i+1
        cmd, arg = line[:i], line[i:].strip()
        return cmd, arg, line
    '''
    # Tokens print with symbolic type names via TokenInfo.__repr__.
    for tok in tokenize(iter(s.splitlines()).__next__):
        print(tok)
General Comments 0
You need to be logged in to leave comments. Login now