rhodecode-enterprise-ce Commit - r5083:875cd526

diffs: python3 port

super-admin -

r5083:875cd526 default

parent child

rhodecode/lib/diff_match_patch.py

0 +6 -4

              import re
              import sys
              import time
-             import urllib.request, urllib.parse, urllib.error
+             import urllib.request
+             import urllib.parse
+             import urllib.error
              class diff_match_patch:
                          diffs = [
                              (self.DIFF_INSERT, longtext[:i]),
                              (self.DIFF_EQUAL, shorttext),
-                             (self.DIFF_INSERT, longtext[i + len(shorttext) :]),
+                             (self.DIFF_INSERT, longtext[i + len(shorttext):]),
                          ]
                          # Swap insertions for deletions if diff is reversed.
                          if len(text1) > len(text2):
                              if count_delete >= 1 and count_insert >= 1:
                                  # Delete the offending records and add the merged ones.
                                  a = self.diff_main(text_delete, text_insert, False, deadline)
-                                 diffs[pointer - count_delete - count_insert : pointer] = a
+                                 diffs[pointer - count_delete - count_insert: pointer] = a
                                  pointer = pointer - count_delete - count_insert + len(a)
                              count_insert = 0
                              count_delete = 0
                          return patches
                      text = textline.split("\n")
                      while len(text) != 0:
-                         m = re.match("^@@ -(\d+),?(\d*) \+(\d+),?(\d*) @@$", text[0])
+                         m = re.match(r"^@@ -(\d+),?(\d*) \+(\d+),?(\d*) @@$", text[0])
                          if not m:
                              raise ValueError("Invalid patch string: " + text[0])
                          patch = patch_obj()

rhodecode/lib/diffs.py

0 +161 -286

              """
              Set of diffing helpers, previously part of vcs
              """
+             import dataclasses
              import os
              import re
              import bz2
              import gzip
              import time
-             import collections
              import difflib
              import logging
              import pickle
              from rhodecode.lib.vcs.exceptions import VCSError
              from rhodecode.lib.vcs.nodes import FileNode, SubModuleNode
-             from rhodecode.lib.utils2 import safe_unicode, safe_str
+             from rhodecode.lib.vcs.backends import base
+             from rhodecode.lib.str_utils import safe_str
              log = logging.getLogger(__name__)
                  return request.GET.get('ignorews', '') == '1'
-             class OPS(object):
-                 ADD = 'A'
-                 MOD = 'M'
-                 DEL = 'D'
+             @dataclasses.dataclass
+             class OPS:
+                 ADD: str = 'A'
+                 MOD: str = 'M'
+                 DEL: str = 'D'
+             @dataclasses.dataclass
+             class DiffLineNumber:
+                 old: int | None
+                 new: int | None
+                 def __iter__(self):
+                     yield self.old
+                     yield self.new
              def get_gitdiff(filenode_old, filenode_new, ignore_whitespace=True, context=3):
                  for filenode in (filenode_old, filenode_new):
                      if not isinstance(filenode, FileNode):
-                         raise VCSError(
-                             "Given object should be FileNode object, not %s"
-                             % filenode.__class__)
+                         raise VCSError(f"Given object should be FileNode object, not {filenode.__class__}")
                  repo = filenode_new.commit.repository
                  old_commit = filenode_old.commit or repo.EMPTY_COMMIT
              class LimitedDiffContainer(object):
-                 def __init__(self, diff_limit, cur_diff_size, diff):
+                 def __init__(self, diff_limit: int, cur_diff_size, diff):
                      self.diff = diff
                      self.diff_limit = diff_limit
                      self.cur_diff_size = cur_diff_size
              class DiffProcessor(object):
                  """
-                 Give it a unified or git diff and it returns a list of the files that were
+                 Give it a unified or git diff, and it returns a list of the files that were
                  mentioned in the diff together with a dict of meta information that
-                 can be used to render it in a HTML template.
+                 can be used to render it in an HTML template.
                  .. note:: Unicode handling
                     since the result is intended for presentation to the user.
                  """
-                 _chunk_re = re.compile(r'^@@ -(\d+)(?:,(\d+))? \+(\d+)(?:,(\d+))? @@(.*)')
-                 _newline_marker = re.compile(r'^\\ No newline at end of file')
+                 _chunk_re = re.compile(br'^@@ -(\d+)(?:,(\d+))? \+(\d+)(?:,(\d+))? @@(.*)')
+                 _newline_marker = re.compile(br'^\\ No newline at end of file')
                  # used for inline highlighter word split
-                 _token_re = re.compile(r'()(&gt;|&lt;|&amp;|\W+?)')
+                 _token_re = re.compile(br'()(&gt;|&lt;|&amp;|\W+?)')
                  # collapse ranges of commits over given number
                  _collapse_commits_over = 5
-                 def __init__(self, diff, format='gitdiff', diff_limit=None,
-                              file_limit=None, show_full_diff=True):
+                 def __init__(self, diff: base.Diff, diff_format='gitdiff', diff_limit: int = 0,
+                              file_limit: int = 0, show_full_diff=True):
                      """
                      :param diff: A `Diff` object representing a diff from a vcs backend
-                     :param format: format of diff passed, `udiff` or `gitdiff`
+                     :param diff_format: format of diff passed, `udiff` or `gitdiff`
                      :param diff_limit: define the size of diff that is considered "big"
                          based on that parameter cut off will be triggered, set to None
                          to show full diff
                      """
                      self._diff = diff
-                     self._format = format
+                     self._format = diff_format
                      self.adds = 0
                      self.removes = 0
                      # calculate diff size
                      self.parsed = False
                      self.parsed_diff = []
-                     log.debug('Initialized DiffProcessor with %s mode', format)
-                     if format == 'gitdiff':
+                     log.debug('Initialized DiffProcessor with %s mode', diff_format)
+                     self.differ = self._highlight_line_udiff
+                     self._parser = self._new_parse_gitdiff
+                     if diff_format == 'gitdiff':
                          self.differ = self._highlight_line_difflib
                          self._parser = self._parse_gitdiff
-                     else:
-                         self.differ = self._highlight_line_udiff
-                         self._parser = self._new_parse_gitdiff
+                         raise DeprecationWarning('gitdiff usage is deprecated')
                  def _copy_iterator(self):
                      """
                      self.__udiff, iterator_copy = tee(self.__udiff)
                      return iterator_copy
-                 def _escaper(self, string):
+                 def _escaper(self, diff_string):
                      """
                      Escaper for diff escapes special chars and checks the diff limit
                      :param string:
                      """
-                     self.cur_diff_size += len(string)
+                     self.cur_diff_size += len(diff_string)
                      if not self.show_full_diff and (self.cur_diff_size > self.diff_limit):
                          raise DiffLimitExceeded('Diff Limit Exceeded')
-                     return string \
-                         .replace('&', '&amp;')\
-                         .replace('<', '&lt;')\
-                         .replace('>', '&gt;')
+                     return diff_string \
+                         .replace(b'&', b'&amp;')\
+                         .replace(b'<', b'&lt;')\
+                         .replace(b'>', b'&gt;')
-                 def _line_counter(self, l):
+                 def _line_counter(self, diff_line):
                      """
                      Checks each line and bumps total adds/removes for this diff
-                     :param l:
+                     :param diff_line:
                      """
-                     if l.startswith('+') and not l.startswith('+++'):
+                     if diff_line.startswith(b'+') and not diff_line.startswith(b'+++'):
                          self.adds += 1
-                     elif l.startswith('-') and not l.startswith('---'):
+                     elif diff_line.startswith(b'-') and not diff_line.startswith(b'---'):
                          self.removes += 1
-                     return safe_unicode(l)
+                     return diff_line
                  def _highlight_line_difflib(self, line, next_):
                      """
                          newfrag = ''.join(newwords[j1:j2])
                          if tag != 'equal':
                              if oldfrag:
-                                 oldfrag = '<del>%s</del>' % oldfrag
+                                 oldfrag = f'<del>{oldfrag}</del>'
                              if newfrag:
-                                 newfrag = '<ins>%s</ins>' % newfrag
+                                 newfrag = f'<ins>{newfrag}</ins>'
                          oldfragments.append(oldfrag)
                          newfragments.append(newfrag)
                                  tag = 'ins'
                              else:
                                  tag = 'del'
-                             l['line'] = '%s<%s>%s</%s>%s' % (
-                                 l['line'][:start],
-                                 tag,
-                                 l['line'][start:last],
-                                 tag,
-                                 l['line'][last:]
-                             )
+                             l['line'] = f"{l['line'][:start]}<{tag}>{l['line'][start:last]}</{tag}>{l['line'][last:]}"
                          do(line)
                          do(next_)
-                 def _clean_line(self, line, command):
+                 def _clean_line(self, line, command: str):
                      if command in ['+', '-', ' ']:
                          # only modify the line if it's actually a diff thing
                          line = line[1:]
                  def _parse_gitdiff(self, inline_diff=True):
                      _files = []
-                     diff_container = lambda arg: arg
+                     def diff_container(arg):
+                         return arg
                      for chunk in self._diff.chunks():
                          head = chunk.header
                          elif head['new_file_mode']:
                              op = OPS.ADD
                              stats['binary'] = True
-                             stats['ops'][NEW_FILENODE] = 'new file %s' % head['new_file_mode']
-                         else:  # modify operation, can be copy, rename or chmod
+                             stats['ops'][NEW_FILENODE] = f"new file {safe_str(head['new_file_mode'])}"
+                         else:  # modify operation, can be: copy, rename or chmod
                              # CHMOD
                              if head['new_mode'] and head['old_mode']:
                                  op = OPS.MOD
                                  stats['binary'] = True
-                                 stats['ops'][CHMOD_FILENODE] = (
-                                     'modified file chmod %s => %s' % (
-                                         head['old_mode'], head['new_mode']))
+                                 stats['ops'][CHMOD_FILENODE] = f"modified file chmod {safe_str(head['old_mode'])} => {safe_str(head['new_mode'])}"
                              # RENAME
                              if head['rename_from'] != head['rename_to']:
                                  op = OPS.MOD
                                  stats['binary'] = True
-                                 stats['ops'][RENAMED_FILENODE] = (
-                                     'file renamed from %s to %s' % (
-                                         head['rename_from'], head['rename_to']))
+                                 stats['ops'][RENAMED_FILENODE] = f"file renamed from {safe_str(head['rename_from'])} to {safe_str(head['rename_to'])}"
                              # COPY
                              if head.get('copy_from') and head.get('copy_to'):
                                  op = OPS.MOD
                                  stats['binary'] = True
-                                 stats['ops'][COPIED_FILENODE] = (
-                                     'file copied from %s to %s' % (
-                                         head['copy_from'], head['copy_to']))
+                                 stats['ops'][COPIED_FILENODE] = f"file copied from {safe_str(head['copy_from'])} to {safe_str(head['copy_to'])}"
                              # If our new parsed headers didn't match anything fallback to
                              # old style detection
                                      raise DiffLimitExceeded('File Limit Exceeded')
                              except DiffLimitExceeded:
-                                 diff_container = lambda _diff: \
-                                     LimitedDiffContainer(
-                                         self.diff_limit, self.cur_diff_size, _diff)
+                                 def diff_container(_diff):
+                                     return LimitedDiffContainer(self.diff_limit, self.cur_diff_size, _diff)
                                  exceeds_limit = len(raw_diff) > self.file_limit
                                  limited_diff = True
                          else:  # GIT format binary patch, or possibly empty diff
                              if head['bin_patch']:
                                  # we have operation already extracted, but we mark simply
-                                 # it's a diff we wont show for binary files
+                                 # it's a diff we won't show for binary files
                                  stats['ops'][BIN_FILENODE] = 'binary diff hidden'
                              chunks = []
                              # to see the content of the file
                              chunks = []
-                         chunks.insert(0, [{
-                                               'old_lineno': '',
-                                               'new_lineno': '',
-                                               'action': Action.CONTEXT,
-                                               'line': msg,
-                                           } for _op, msg in stats['ops'].items()
-                                           if _op not in [MOD_FILENODE]])
+                         frag = [{
+                             'old_lineno': '',
+                             'new_lineno': '',
+                             'action': Action.CONTEXT,
+                             'line': msg,
+                         } for _op, msg in list(stats['ops'].items())
+                             if _op not in [MOD_FILENODE]]
+                         chunks.insert(0, frag)
                          _files.append({
-                             'filename': safe_unicode(head['b_path']),
+                             'filename': safe_str(head['b_path']),
                              'old_revision': head['a_blob_id'],
                              'new_revision': head['b_blob_id'],
                              'chunks': chunks,
-                             'raw_diff': safe_unicode(raw_diff),
+                             'raw_diff': safe_str(raw_diff),
                              'operation': op,
                              'stats': stats,
                              'exceeds_limit': exceeds_limit,
                              'is_limited_diff': limited_diff,
                          })
-                     sorter = lambda info: {OPS.ADD: 0, OPS.MOD: 1,
-                                            OPS.DEL: 2}.get(info['operation'])
+                     def operation_sorter(info):
+                         return {OPS.ADD: 0, OPS.MOD: 1, OPS.DEL: 2}.get(info['operation'])
                      if not inline_diff:
-                         return diff_container(sorted(_files, key=sorter))
+                         return diff_container(sorted(_files, key=operation_sorter))
                      # highlight inline changes
                      for diff_data in _files:
                              except StopIteration:
                                  pass
-                     return diff_container(sorted(_files, key=sorter))
+                     return diff_container(sorted(_files, key=operation_sorter))
                  def _check_large_diff(self):
                      if self.diff_limit:
                          log.debug('Checking if diff exceeds current diff_limit of %s', self.diff_limit)
                      if not self.show_full_diff and (self.cur_diff_size > self.diff_limit):
-                         raise DiffLimitExceeded('Diff Limit `%s` Exceeded', self.diff_limit)
+                         raise DiffLimitExceeded(f'Diff Limit `{self.diff_limit}` Exceeded')
                  # FIXME: NEWDIFFS: dan: this replaces _parse_gitdiff
                  def _new_parse_gitdiff(self, inline_diff=True):
                      _files = []
-                     # this can be overriden later to a LimitedDiffContainer type
-                     diff_container = lambda arg: arg
+                     # this can be overridden later to a LimitedDiffContainer type
+                     def diff_container(arg):
+                         return arg
                      for chunk in self._diff.chunks():
-                         head = chunk.header
-                         log.debug('parsing diff %r', head)
+                         head = chunk.header_as_str
+                         log.debug('parsing diff chunk %r', chunk)
                          raw_diff = chunk.raw
                          limited_diff = False
                              'added': 0,
                              'deleted': 0,
                              'binary': False,
-                             'old_mode': None,
-                             'new_mode': None,
+                             'old_mode': '',
+                             'new_mode': '',
                              'ops': {},
                          }
                          if head['old_mode']:
                          elif head['new_file_mode']:
                              op = OPS.ADD
                              stats['binary'] = True
-                             stats['old_mode'] = None
+                             stats['old_mode'] = ''
                              stats['new_mode'] = head['new_file_mode']
-                             stats['ops'][NEW_FILENODE] = 'new file %s' % head['new_file_mode']
+                             stats['ops'][NEW_FILENODE] = f"new file {head['new_file_mode']}"
-                         # modify operation, can be copy, rename or chmod
+                         # modify operation, can be: copy, rename or chmod
                          else:
                              # CHMOD
                              if head['new_mode'] and head['old_mode']:
                                  op = OPS.MOD
                                  stats['binary'] = True
-                                 stats['ops'][CHMOD_FILENODE] = (
-                                     'modified file chmod %s => %s' % (
-                                         head['old_mode'], head['new_mode']))
+                                 stats['ops'][CHMOD_FILENODE] = f"modified file chmod {head['old_mode']} => {head['new_mode']}"
                              # RENAME
                              if head['rename_from'] != head['rename_to']:
                                  op = OPS.MOD
                                  stats['binary'] = True
                                  stats['renamed'] = (head['rename_from'], head['rename_to'])
-                                 stats['ops'][RENAMED_FILENODE] = (
-                                     'file renamed from %s to %s' % (
-                                         head['rename_from'], head['rename_to']))
+                                 stats['ops'][RENAMED_FILENODE] = f"file renamed from {head['rename_from']} to {head['rename_to']}"
                              # COPY
                              if head.get('copy_from') and head.get('copy_to'):
                                  op = OPS.MOD
                                  stats['binary'] = True
                                  stats['copied'] = (head['copy_from'], head['copy_to'])
-                                 stats['ops'][COPIED_FILENODE] = (
-                                     'file copied from %s to %s' % (
-                                         head['copy_from'], head['copy_to']))
+                                 stats['ops'][COPIED_FILENODE] = f"file copied from {head['copy_from']} to {head['copy_to']}"
                              # If our new parsed headers didn't match anything fallback to
                              # old style detection
                                  # but the browser is the bottleneck.
                                  if not self.show_full_diff and exceeds_limit:
                                      log.debug('File `%s` exceeds current file_limit of %s',
-                                               safe_unicode(head['b_path']), self.file_limit)
-                                     raise DiffLimitExceeded(
-                                         'File Limit %s Exceeded', self.file_limit)
+                                               head['b_path'], self.file_limit)
+                                     raise DiffLimitExceeded(f'File Limit {self.file_limit} Exceeded')
                                  self._check_large_diff()
                                      stats['ops'][MOD_FILENODE] = 'modified file'
                              except DiffLimitExceeded:
-                                 diff_container = lambda _diff: \
-                                     LimitedDiffContainer(
-                                         self.diff_limit, self.cur_diff_size, _diff)
+                                 def limited_diff_container(_diff):
+                                     return LimitedDiffContainer(self.diff_limit, self.cur_diff_size, _diff)
+                                 # re-definition of our container wrapper
+                                 diff_container = limited_diff_container
                                  limited_diff = True
                                  chunks = []
                          else:  # GIT format binary patch, or possibly empty diff
                              if head['bin_patch']:
                                  # we have operation already extracted, but we mark simply
-                                 # it's a diff we wont show for binary files
+                                 # it's a diff we won't show for binary files
                                  stats['ops'][BIN_FILENODE] = 'binary diff hidden'
                              chunks = []
                              # to see the content of the file
                              chunks = []
-                         chunks.insert(
-                             0, [{'old_lineno': '',
-                                  'new_lineno': '',
-                                  'action': Action.CONTEXT,
-                                  'line': msg,
-                                  } for _op, msg in stats['ops'].items()
-                                 if _op not in [MOD_FILENODE]])
+                         frag = [
+                             {'old_lineno': '',
+                              'new_lineno': '',
+                              'action': Action.CONTEXT,
+                              'line': msg,
+                              } for _op, msg in list(stats['ops'].items())
+                             if _op not in [MOD_FILENODE]]
-                         original_filename = safe_unicode(head['a_path'])
+                         chunks.insert(0, frag)
+                         original_filename = safe_str(head['a_path'])
                          _files.append({
                              'original_filename': original_filename,
-                             'filename': safe_unicode(head['b_path']),
+                             'filename': safe_str(head['b_path']),
                              'old_revision': head['a_blob_id'],
                              'new_revision': head['b_blob_id'],
                              'chunks': chunks,
-                             'raw_diff': safe_unicode(raw_diff),
+                             'raw_diff': safe_str(raw_diff),
                              'operation': op,
                              'stats': stats,
                              'exceeds_limit': exceeds_limit,
                              'is_limited_diff': limited_diff,
                          })
-                     sorter = lambda info: {OPS.ADD: 0, OPS.MOD: 1,
-                                            OPS.DEL: 2}.get(info['operation'])
+                     def sorter(info):
+                         return {OPS.ADD: 0, OPS.MOD: 1, OPS.DEL: 2}.get(info['operation'])
                      return diff_container(sorted(_files, key=sorter))
                  # FIXME: NEWDIFFS: dan: this gets replaced by _new_parse_lines
                              line = next(diff_iter)
                              while old_line < old_end or new_line < new_end:
-                                 command = ' '
+                                 command = b' '
                                  if line:
                                      command = line[0]
                                  affects_old = affects_new = False
                                  # ignore those if we don't expect them
-                                 if command in '#@':
+                                 if command in b'#@':
                                      continue
-                                 elif command == '+':
+                                 elif command == b'+':
                                      affects_new = True
                                      action = Action.ADD
                                      stats[0] += 1
-                                 elif command == '-':
+                                 elif command == b'-':
                                      affects_old = True
                                      action = Action.DELETE
                                      stats[1] += 1
                                      old_line += affects_old
                                      new_line += affects_new
                                      lines.append({
-                                         'old_lineno':   affects_old and old_line or '',
-                                         'new_lineno':   affects_new and new_line or '',
+                                         'old_lineno':   affects_old and old_line or b'',
+                                         'new_lineno':   affects_new and new_line or b'',
                                          'action':       action,
                                          'line':         self._clean_line(line, command)
                                      })
                      try:
                          line = next(diff_iter)
+                         assert isinstance(line, bytes)
                          while line:
                              raw_diff.append(line)
                                  break
                              gr = match.groups()
                              (old_line, old_end,
                               new_line, new_end) = [int(x or 1) for x in gr[:-1]]
                              old_line -= 1
                              new_line -= 1
-                             context = len(gr) == 5
+                             len(gr) == 5
                              old_end += old_line
                              new_end += new_line
                              while old_line < old_end or new_line < new_end:
                                  command = ' '
                                  if line:
-                                     command = line[0]
+                                     # This is bytes, so we need to convert it to a str
+                                     command: str = chr(line[0])
                                  affects_old = affects_new = False
                                      old_line += affects_old
                                      new_line += affects_new
                                      lines.append({
-                                         'old_lineno':   affects_old and old_line or '',
-                                         'new_lineno':   affects_new and new_line or '',
+                                         'old_lineno':   affects_old and old_line or None,
+                                         'new_lineno':   affects_new and new_line or None,
                                          'action':       action,
                                          'line':         self._clean_line(line, command)
                                      })
                      except StopIteration:
                          pass
-                     return ''.join(raw_diff), chunks, stats
+                     return b''.join(raw_diff), chunks, stats
                  def _safe_id(self, idstring):
                      """Make a string safe for including in an id attribute.
                      """
                      # Transform all whitespace to underscore
-                     idstring = re.sub(r'\s', "_", '%s' % idstring)
+                     idstring = re.sub(r'\s', "_", f'{idstring}')
                      # Remove everything that is not a hyphen or a member of \w
                      idstring = re.sub(r'(?!-)\W', "", idstring).lower()
                      return idstring
                  @classmethod
-                 def diff_splitter(cls, string):
+                 def diff_splitter(cls, diff_string: bytes):
                      """
                      Diff split that emulates .splitlines() but works only on \n
                      """
-                     if not string:
+                     if not diff_string:
                          return
-                     elif string == '\n':
-                         yield '\n'
+                     elif diff_string == b'\n':
+                         yield b'\n'
                      else:
-                         has_newline = string.endswith('\n')
-                         elements = string.split('\n')
+                         has_newline = diff_string.endswith(b'\n')
+                         elements = diff_string.split(b'\n')
                          if has_newline:
                              # skip last element as it's empty string from newlines
                              elements = elements[:-1]
                          for cnt, line in enumerate(elements, start=1):
                              last_line = cnt == len_elements
                              if last_line and not has_newline:
-                                 yield safe_unicode(line)
+                                 yield line
                              else:
-                                 yield safe_unicode(line) + '\n'
+                                 yield line + b'\n'
                  def prepare(self, inline_diff=True):
                      """
                      """
                      Returns raw diff as a byte string
                      """
-                     return self._diff.raw
-                 def as_html(self, table_class='code-difftable', line_class='line',
-                             old_lineno_class='lineno old', new_lineno_class='lineno new',
-                             code_class='code', enable_comments=False, parsed_lines=None):
-                     """
-                     Return given diff as html table with customized css classes
-                     """
-                     # TODO(marcink): not sure how to pass in translator
-                     # here in an efficient way, leave the _ for proper gettext extraction
-                     _ = lambda s: s
-                     def _link_to_if(condition, label, url):
-                         """
-                         Generates a link if condition is meet or just the label if not.
-                         """
-                         if condition:
-                             return '''<a href="%(url)s" class="tooltip"
-                             title="%(title)s">%(label)s</a>''' % {
-                                 'title': _('Click to select line'),
-                                 'url': url,
-                                 'label': label
+                             }
-                         else:
-                             return label
-                     if not self.parsed:
-                         self.prepare()
-                     diff_lines = self.parsed_diff
-                     if parsed_lines:
-                         diff_lines = parsed_lines
-                     _html_empty = True
-                     _html = []
-                     _html.append('''<table class="%(table_class)s">\n''' % {
-                         'table_class': table_class
-                     })
-                     for diff in diff_lines:
-                         for line in diff['chunks']:
-                             _html_empty = False
-                             for change in line:
-                                 _html.append('''<tr class="%(lc)s %(action)s">\n''' % {
-                                     'lc': line_class,
-                                     'action': change['action']
-                                 })
-                                 anchor_old_id = ''
-                                 anchor_new_id = ''
-                                 anchor_old = "%(filename)s_o%(oldline_no)s" % {
-                                     'filename': self._safe_id(diff['filename']),
-                                     'oldline_no': change['old_lineno']
+                                 }
-                                 anchor_new = "%(filename)s_n%(oldline_no)s" % {
-                                     'filename': self._safe_id(diff['filename']),
-                                     'oldline_no': change['new_lineno']
+                                 }
-                                 cond_old = (change['old_lineno'] != '...' and
-                                             change['old_lineno'])
-                                 cond_new = (change['new_lineno'] != '...' and
-                                             change['new_lineno'])
-                                 if cond_old:
-                                     anchor_old_id = 'id="%s"' % anchor_old
-                                 if cond_new:
-                                     anchor_new_id = 'id="%s"' % anchor_new
-                                 if change['action'] != Action.CONTEXT:
-                                     anchor_link = True
-                                 else:
-                                     anchor_link = False
-                                 ###########################################################
-                                 # COMMENT ICONS
-                                 ###########################################################
-                                 _html.append('''\t<td class="add-comment-line"><span class="add-comment-content">''')
-                                 if enable_comments and change['action'] != Action.CONTEXT:
-                                     _html.append('''<a href="#"><span class="icon-comment-add"></span></a>''')
-                                 _html.append('''</span></td><td class="comment-toggle tooltip" title="Toggle Comment Thread"><i class="icon-comment"></i></td>\n''')
-                                 ###########################################################
-                                 # OLD LINE NUMBER
-                                 ###########################################################
-                                 _html.append('''\t<td %(a_id)s class="%(olc)s">''' % {
-                                     'a_id': anchor_old_id,
-                                     'olc': old_lineno_class
-                                 })
-                                 _html.append('''%(link)s''' % {
-                                     'link': _link_to_if(anchor_link, change['old_lineno'],
-                                                         '#%s' % anchor_old)
-                                 })
-                                 _html.append('''</td>\n''')
-                                 ###########################################################
-                                 # NEW LINE NUMBER
-                                 ###########################################################
-                                 _html.append('''\t<td %(a_id)s class="%(nlc)s">''' % {
-                                     'a_id': anchor_new_id,
-                                     'nlc': new_lineno_class
-                                 })
-                                 _html.append('''%(link)s''' % {
-                                     'link': _link_to_if(anchor_link, change['new_lineno'],
-                                                         '#%s' % anchor_new)
-                                 })
-                                 _html.append('''</td>\n''')
-                                 ###########################################################
-                                 # CODE
-                                 ###########################################################
-                                 code_classes = [code_class]
-                                 if (not enable_comments or
-                                         change['action'] == Action.CONTEXT):
-                                     code_classes.append('no-comment')
-                                 _html.append('\t<td class="%s">' % ' '.join(code_classes))
-                                 _html.append('''\n\t\t<pre>%(code)s</pre>\n''' % {
-                                     'code': change['line']
-                                 })
-                                 _html.append('''\t</td>''')
-                                 _html.append('''\n</tr>\n''')
-                     _html.append('''</table>''')
-                     if _html_empty:
-                         return None
-                     return ''.join(_html)
+                     return self._diff.raw.tobytes()
                  def stat(self):
                      """
                      return self.adds, self.removes
                  def get_context_of_line(
-                         self, path, diff_line=None, context_before=3, context_after=3):
+                         self, path, diff_line: DiffLineNumber = None, context_before: int = 3, context_after: int = 3):
                      """
                      Returns the context lines for the specified diff line.
-                     :type diff_line: :class:`DiffLineNumber`
                      """
                      assert self.parsed, "DiffProcessor is not initialized."
                      if None not in diff_line:
-                         raise ValueError(
-                             "Cannot specify both line numbers: {}".format(diff_line))
+                         raise ValueError(f"Cannot specify both line numbers in diff_line: {diff_line}")
                      file_diff = self._get_file_diff(path)
                      chunk, idx = self._find_chunk_line_index(file_diff, diff_line)
                      first_line_to_include = max(idx - context_before, 0)
                      first_line_after_context = idx + context_after + 1
-                     context_lines = chunk[first_line_to_include:first_line_after_context]
+                     context_lines = chunk['lines'][first_line_to_include:first_line_after_context]
                      line_contents = [
                          _context_line(line) for line in context_lines
-                         if _is_diff_content(line)]
+                         if _is_diff_content(line)
+                     ]
                      # TODO: johbo: Interim fixup, the diff chunks drop the final newline.
                      # Once they are fixed, we can drop this line here.
                      if line_contents:
                          line_contents[-1] = (
-                             line_contents[-1][0], line_contents[-1][1].rstrip('\n') + '\n')
+                             line_contents[-1][0], line_contents[-1][1].rstrip(b'\n') + b'\n')
                      return line_contents
                  def find_context(self, path, context, offset=0):
                      file_diff = self._get_file_diff(path)
                      for chunk in file_diff['chunks']:
+                         if not isinstance(chunk, dict):
+                             continue
                          context_iter = iter(context)
-                         for line_idx, line in enumerate(chunk):
+                         for line_idx, line in enumerate(chunk['lines']):
                              try:
                                  if _context_line(line) == next(context_iter):
                                      continue
                      effective_offset = len(context) - offset
                      found_at_diff_lines = [
-                         _line_to_diff_line_number(chunk[idx - effective_offset])
+                         _line_to_diff_line_number(chunk['lines'][idx - effective_offset])
                          for idx, chunk in matches]
                      return found_at_diff_lines
                          if file_diff['filename'] == path:
                              break
                      else:
-                         raise FileNotInDiffException("File {} not in diff".format(path))
+                         raise FileNotInDiffException(f"File {path} not in diff")
                      return file_diff
                  def _find_chunk_line_index(self, file_diff, diff_line):
                      for chunk in file_diff['chunks']:
-                         for idx, line in enumerate(chunk):
-                             if line['old_lineno'] == diff_line.old:
-                                 return chunk, idx
-                             if line['new_lineno'] == diff_line.new:
-                                 return chunk, idx
-                     raise LineNotInDiffException(
-                         "The line {} is not part of the diff.".format(diff_line))
+                         if not isinstance(chunk, dict):
+                             continue
+                         for line_idx, line in enumerate(chunk['lines']):
+                             if diff_line.old and line['old_lineno'] == diff_line.old:
+                                 return chunk, line_idx
+                             if diff_line.new and line['new_lineno'] == diff_line.new:
+                                 return chunk, line_idx
+                     raise LineNotInDiffException(f"The line {diff_line} is not part of the diff.")
              def _is_diff_content(line):
              def _context_line(line):
-                 return (line['action'], line['line'])
-             DiffLineNumber = collections.namedtuple('DiffLineNumber', ['old', 'new'])
+                 return line['action'], line['line']
              def _line_to_diff_line_number(line):
                          with bz2.BZ2File(cached_diff_file, 'wb') as f:
                              pickle.dump(struct, f)
                  except Exception:
-                     log.warn('Failed to save cache', exc_info=True)
+                     log.warning('Failed to save cache', exc_info=True)
                      _cleanup_cache_file(cached_diff_file)
                  log.debug('Saved diff cache under %s in %.4fs', cached_diff_file, time.time() - start)
                          with bz2.BZ2File(cached_diff_file, 'rb') as f:
                              data = pickle.load(f)
                  except Exception:
-                     log.warn('Failed to read diff cache file', exc_info=True)
+                     log.warning('Failed to read diff cache file', exc_info=True)
                  if not data:
                      data = default_struct
                      return input_param or None  # prevent empty string arguments
                  return '_'.join([
-                     '{}' for i in range(len(args))]).format(*map(arg_mapper, args))
+                     '{}' for _i in range(len(args))]).format(*list(map(arg_mapper, args)))
              def diff_cache_exist(cache_storage, *args):
                  cache_file_path = os.path.join(cache_storage, cache_key)
                  # prevent path traversal attacks using some param that have e.g '../../'
                  if not os.path.abspath(cache_file_path).startswith(cache_storage):
-                     raise ValueError('Final path must be within {}'.format(cache_storage))
+                     raise ValueError(f'Final path must be within {cache_storage}')
                  return cache_file_path

General Comments 0

Write
Preview

You need to be logged in to leave comments. Log in now

No TODOs yet

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages