rhodecode-enterprise-ce Commit - r5083:875cd526

diffs: python3 port

super-admin -

r5083:875cd526 default

parent child

rhodecode/lib/diff_match_patch.py

0 +6 -4

             import re
             import sys
             import time
-            import urllib.request, urllib.parse, urllib.error
+            import urllib.request
+            import urllib.parse
+            import urllib.error
             class diff_match_patch:
                         diffs = [
                             (self.DIFF_INSERT, longtext[:i]),
                             (self.DIFF_EQUAL, shorttext),
-                            (self.DIFF_INSERT, longtext[i + len(shorttext) :]),
+                            (self.DIFF_INSERT, longtext[i + len(shorttext):]),
                         ]
                         # Swap insertions for deletions if diff is reversed.
                         if len(text1) > len(text2):
                             if count_delete >= 1 and count_insert >= 1:
                                 # Delete the offending records and add the merged ones.
                                 a = self.diff_main(text_delete, text_insert, False, deadline)
-                                diffs[pointer - count_delete - count_insert : pointer] = a
+                                diffs[pointer - count_delete - count_insert: pointer] = a
                                 pointer = pointer - count_delete - count_insert + len(a)
                             count_insert = 0
                             count_delete = 0
                         return patches
                     text = textline.split("\n")
                     while len(text) != 0:
-                        m = re.match("^@@ -(\d+),?(\d*) \+(\d+),?(\d*) @@$", text[0])
+                        m = re.match(r"^@@ -(\d+),?(\d*) \+(\d+),?(\d*) @@$", text[0])
                         if not m:
                             raise ValueError("Invalid patch string: " + text[0])
                         patch = patch_obj()

rhodecode/lib/diffs.py

0 +161 -286

             """
             Set of diffing helpers, previously part of vcs
             """
+            import dataclasses
             import os
             import re
             import bz2
             import gzip
             import time
-            import collections
             import difflib
             import logging
             import pickle
             from rhodecode.lib.vcs.exceptions import VCSError
             from rhodecode.lib.vcs.nodes import FileNode, SubModuleNode
-            from rhodecode.lib.utils2 import safe_unicode, safe_str
+            from rhodecode.lib.vcs.backends import base
+            from rhodecode.lib.str_utils import safe_str
             log = logging.getLogger(__name__)
                 return request.GET.get('ignorews', '') == '1'
-            class OPS(object):
+            @dataclasses.dataclass
-                ADD = 'A'
+            class OPS:
-                MOD = 'M'
+                ADD: str = 'A'
-                DEL = 'D'
+                MOD: str = 'M'
+                DEL: str = 'D'
+            @dataclasses.dataclass
+            class DiffLineNumber:
+                old: int | None
+                new: int | None
+                def __iter__(self):
+                    yield self.old
+                    yield self.new
             def get_gitdiff(filenode_old, filenode_new, ignore_whitespace=True, context=3):
                 for filenode in (filenode_old, filenode_new):
                     if not isinstance(filenode, FileNode):
-                        raise VCSError(
+                        raise VCSError(f"Given object should be FileNode object, not {filenode.__class__}")
-                            "Given object should be FileNode object, not %s"
-                            % filenode.__class__)
                 repo = filenode_new.commit.repository
                 old_commit = filenode_old.commit or repo.EMPTY_COMMIT
             class LimitedDiffContainer(object):
-                def __init__(self, diff_limit, cur_diff_size, diff):
+                def __init__(self, diff_limit: int, cur_diff_size, diff):
                     self.diff = diff
                     self.diff_limit = diff_limit
                     self.cur_diff_size = cur_diff_size
             class DiffProcessor(object):
                 """
-                Give it a unified or git diff and it returns a list of the files that were
+                Give it a unified or git diff, and it returns a list of the files that were
                 mentioned in the diff together with a dict of meta information that
-                can be used to render it in a HTML template.
+                can be used to render it in an HTML template.
                 .. note:: Unicode handling
                    since the result is intended for presentation to the user.
                 """
-                _chunk_re = re.compile(r'^@@ -(\d+)(?:,(\d+))? \+(\d+)(?:,(\d+))? @@(.*)')
+                _chunk_re = re.compile(br'^@@ -(\d+)(?:,(\d+))? \+(\d+)(?:,(\d+))? @@(.*)')
-                _newline_marker = re.compile(r'^\\ No newline at end of file')
+                _newline_marker = re.compile(br'^\\ No newline at end of file')
                 # used for inline highlighter word split
-                _token_re = re.compile(r'()(&gt;|&lt;|&amp;|\W+?)')
+                _token_re = re.compile(br'()(&gt;|&lt;|&amp;|\W+?)')
                 # collapse ranges of commits over given number
                 _collapse_commits_over = 5
-                def __init__(self, diff, format='gitdiff', diff_limit=None,
+                def __init__(self, diff: base.Diff, diff_format='gitdiff', diff_limit: int = 0,
-                             file_limit=None, show_full_diff=True):
+                             file_limit: int = 0, show_full_diff=True):
                     """
                     :param diff: A `Diff` object representing a diff from a vcs backend
-                    :param format: format of diff passed, `udiff` or `gitdiff`
+                    :param diff_format: format of diff passed, `udiff` or `gitdiff`
                     :param diff_limit: define the size of diff that is considered "big"
                         based on that parameter cut off will be triggered, set to None
                         to show full diff
                     """
                     self._diff = diff
-                    self._format = format
+                    self._format = diff_format
                     self.adds = 0
                     self.removes = 0
                     # calculate diff size
                     self.parsed = False
                     self.parsed_diff = []
-                    log.debug('Initialized DiffProcessor with %s mode', format)
+                    log.debug('Initialized DiffProcessor with %s mode', diff_format)
-                    if format == 'gitdiff':
+                    self.differ = self._highlight_line_udiff
+                    self._parser = self._new_parse_gitdiff
+                    if diff_format == 'gitdiff':
                         self.differ = self._highlight_line_difflib
                         self._parser = self._parse_gitdiff
-                    else:
+                        raise DeprecationWarning('gitdiff usage is deprecated')
-                        self.differ = self._highlight_line_udiff
-                        self._parser = self._new_parse_gitdiff
                 def _copy_iterator(self):
                     """
                     self.__udiff, iterator_copy = tee(self.__udiff)
                     return iterator_copy
-                def _escaper(self, string):
+                def _escaper(self, diff_string):
                     """
                     Escaper for diff escapes special chars and checks the diff limit
                     :param string:
                     """
-                    self.cur_diff_size += len(string)
+                    self.cur_diff_size += len(diff_string)
                     if not self.show_full_diff and (self.cur_diff_size > self.diff_limit):
                         raise DiffLimitExceeded('Diff Limit Exceeded')
-                    return string \
+                    return diff_string \
-                        .replace('&', '&amp;')\
+                        .replace(b'&', b'&amp;')\
-                        .replace('<', '&lt;')\
+                        .replace(b'<', b'&lt;')\
-                        .replace('>', '&gt;')
+                        .replace(b'>', b'&gt;')
-                def _line_counter(self, l):
+                def _line_counter(self, diff_line):
                     """
                     Checks each line and bumps total adds/removes for this diff
-                    :param l:
+                    :param diff_line:
                     """
-                    if l.startswith('+') and not l.startswith('+++'):
+                    if diff_line.startswith(b'+') and not diff_line.startswith(b'+++'):
                         self.adds += 1
-                    elif l.startswith('-') and not l.startswith('---'):
+                    elif diff_line.startswith(b'-') and not diff_line.startswith(b'---'):
                         self.removes += 1
-                    return safe_unicode(l)
+                    return diff_line
                 def _highlight_line_difflib(self, line, next_):
                     """
                         newfrag = ''.join(newwords[j1:j2])
                         if tag != 'equal':
                             if oldfrag:
-                                oldfrag = '<del>%s</del>' % oldfrag
+                                oldfrag = f'<del>{oldfrag}</del>'
                             if newfrag:
-                                newfrag = '<ins>%s</ins>' % newfrag
+                                newfrag = f'<ins>{newfrag}</ins>'
                         oldfragments.append(oldfrag)
                         newfragments.append(newfrag)
                                 tag = 'ins'
                             else:
                                 tag = 'del'
-                            l['line'] = '%s<%s>%s</%s>%s' % (
+                            l['line'] = f"{l['line'][:start]}<{tag}>{l['line'][start:last]}</{tag}>{l['line'][last:]}"
-                                l['line'][:start],
-                                tag,
-                                l['line'][start:last],
-                                tag,
-                                l['line'][last:]
                         do(line)
                         do(next_)
-                def _clean_line(self, line, command):
+                def _clean_line(self, line, command: str):
                     if command in ['+', '-', ' ']:
                         # only modify the line if it's actually a diff thing
                         line = line[1:]
                 def _parse_gitdiff(self, inline_diff=True):
                     _files = []
-                    diff_container = lambda arg: arg
+                    def diff_container(arg):
+                        return arg
                     for chunk in self._diff.chunks():
                         head = chunk.header
                         elif head['new_file_mode']:
                             op = OPS.ADD
                             stats['binary'] = True
-                            stats['ops'][NEW_FILENODE] = 'new file %s' % head['new_file_mode']
+                            stats['ops'][NEW_FILENODE] = f"new file {safe_str(head['new_file_mode'])}"
-                        else:  # modify operation, can be copy, rename or chmod
+                        else:  # modify operation, can be: copy, rename or chmod
                             # CHMOD
                             if head['new_mode'] and head['old_mode']:
                                 op = OPS.MOD
                                 stats['binary'] = True
-                                stats['ops'][CHMOD_FILENODE] = (
+                                stats['ops'][CHMOD_FILENODE] = f"modified file chmod {safe_str(head['old_mode'])} => {safe_str(head['new_mode'])}"
-                                    'modified file chmod %s => %s' % (
-                                        head['old_mode'], head['new_mode']))
                             # RENAME
                             if head['rename_from'] != head['rename_to']:
                                 op = OPS.MOD
                                 stats['binary'] = True
-                                stats['ops'][RENAMED_FILENODE] = (
+                                stats['ops'][RENAMED_FILENODE] = f"file renamed from {safe_str(head['rename_from'])} to {safe_str(head['rename_to'])}"
-                                    'file renamed from %s to %s' % (
-                                        head['rename_from'], head['rename_to']))
                             # COPY
                             if head.get('copy_from') and head.get('copy_to'):
                                 op = OPS.MOD
                                 stats['binary'] = True
-                                stats['ops'][COPIED_FILENODE] = (
+                                stats['ops'][COPIED_FILENODE] = f"file copied from {safe_str(head['copy_from'])} to {safe_str(head['copy_to'])}"
-                                    'file copied from %s to %s' % (
-                                        head['copy_from'], head['copy_to']))
                             # If our new parsed headers didn't match anything fallback to
                             # old style detection
                                     raise DiffLimitExceeded('File Limit Exceeded')
                             except DiffLimitExceeded:
-                                diff_container = lambda _diff: \
+                                def diff_container(_diff):
-                                    LimitedDiffContainer(
+                                    return LimitedDiffContainer(self.diff_limit, self.cur_diff_size, _diff)
-                                        self.diff_limit, self.cur_diff_size, _diff)
                                 exceeds_limit = len(raw_diff) > self.file_limit
                                 limited_diff = True
                         else:  # GIT format binary patch, or possibly empty diff
                             if head['bin_patch']:
                                 # we have operation already extracted, but we mark simply
-                                # it's a diff we wont show for binary files
+                                # it's a diff we won't show for binary files
                                 stats['ops'][BIN_FILENODE] = 'binary diff hidden'
                             chunks = []
                             # to see the content of the file
                             chunks = []
-                        chunks.insert(0, [{
+                        frag = [{
-                                              'old_lineno': '',
+                            'old_lineno': '',
-                                              'new_lineno': '',
+                            'new_lineno': '',
-                                              'action': Action.CONTEXT,
+                            'action': Action.CONTEXT,
-                                              'line': msg,
+                            'line': msg,
-                                          } for _op, msg in stats['ops'].items()
+                        } for _op, msg in list(stats['ops'].items())
-                                          if _op not in [MOD_FILENODE]])
+                            if _op not in [MOD_FILENODE]]
+                        chunks.insert(0, frag)
                         _files.append({
-                            'filename': safe_unicode(head['b_path']),
+                            'filename': safe_str(head['b_path']),
                             'old_revision': head['a_blob_id'],
                             'new_revision': head['b_blob_id'],
                             'chunks': chunks,
-                            'raw_diff': safe_unicode(raw_diff),
+                            'raw_diff': safe_str(raw_diff),
                             'operation': op,
                             'stats': stats,
                             'exceeds_limit': exceeds_limit,
                             'is_limited_diff': limited_diff,
                         })
-                    sorter = lambda info: {OPS.ADD: 0, OPS.MOD: 1,
+                    def operation_sorter(info):
-                                           OPS.DEL: 2}.get(info['operation'])
+                        return {OPS.ADD: 0, OPS.MOD: 1, OPS.DEL: 2}.get(info['operation'])
                     if not inline_diff:
-                        return diff_container(sorted(_files, key=sorter))
+                        return diff_container(sorted(_files, key=operation_sorter))
                     # highlight inline changes
                     for diff_data in _files:
                             except StopIteration:
                                 pass
-                    return diff_container(sorted(_files, key=sorter))
+                    return diff_container(sorted(_files, key=operation_sorter))
                 def _check_large_diff(self):
                     if self.diff_limit:
                         log.debug('Checking if diff exceeds current diff_limit of %s', self.diff_limit)
                     if not self.show_full_diff and (self.cur_diff_size > self.diff_limit):
-                        raise DiffLimitExceeded('Diff Limit `%s` Exceeded', self.diff_limit)
+                        raise DiffLimitExceeded(f'Diff Limit `{self.diff_limit}` Exceeded')
                 # FIXME: NEWDIFFS: dan: this replaces _parse_gitdiff
                 def _new_parse_gitdiff(self, inline_diff=True):
                     _files = []
-                    # this can be overriden later to a LimitedDiffContainer type
+                    # this can be overridden later to a LimitedDiffContainer type
-                    diff_container = lambda arg: arg
+                    def diff_container(arg):
+                        return arg
                     for chunk in self._diff.chunks():
-                        head = chunk.header
+                        head = chunk.header_as_str
-                        log.debug('parsing diff %r', head)
+                        log.debug('parsing diff chunk %r', chunk)
                         raw_diff = chunk.raw
                         limited_diff = False
                             'added': 0,
                             'deleted': 0,
                             'binary': False,
-                            'old_mode': None,
+                            'old_mode': '',
-                            'new_mode': None,
+                            'new_mode': '',
                             'ops': {},
                         }
                         if head['old_mode']:
                         elif head['new_file_mode']:
                             op = OPS.ADD
                             stats['binary'] = True
-                            stats['old_mode'] = None
+                            stats['old_mode'] = ''
                             stats['new_mode'] = head['new_file_mode']
-                            stats['ops'][NEW_FILENODE] = 'new file %s' % head['new_file_mode']
+                            stats['ops'][NEW_FILENODE] = f"new file {head['new_file_mode']}"
-                        # modify operation, can be copy, rename or chmod
+                        # modify operation, can be: copy, rename or chmod
                         else:
                             # CHMOD
                             if head['new_mode'] and head['old_mode']:
                                 op = OPS.MOD
                                 stats['binary'] = True
-                                stats['ops'][CHMOD_FILENODE] = (
+                                stats['ops'][CHMOD_FILENODE] = f"modified file chmod {head['old_mode']} => {head['new_mode']}"
-                                    'modified file chmod %s => %s' % (
-                                        head['old_mode'], head['new_mode']))
                             # RENAME
                             if head['rename_from'] != head['rename_to']:
                                 op = OPS.MOD
                                 stats['binary'] = True
                                 stats['renamed'] = (head['rename_from'], head['rename_to'])
-                                stats['ops'][RENAMED_FILENODE] = (
+                                stats['ops'][RENAMED_FILENODE] = f"file renamed from {head['rename_from']} to {head['rename_to']}"
-                                    'file renamed from %s to %s' % (
-                                        head['rename_from'], head['rename_to']))
                             # COPY
                             if head.get('copy_from') and head.get('copy_to'):
                                 op = OPS.MOD
                                 stats['binary'] = True
                                 stats['copied'] = (head['copy_from'], head['copy_to'])
-                                stats['ops'][COPIED_FILENODE] = (
+                                stats['ops'][COPIED_FILENODE] = f"file copied from {head['copy_from']} to {head['copy_to']}"
-                                    'file copied from %s to %s' % (
-                                        head['copy_from'], head['copy_to']))
                             # If our new parsed headers didn't match anything fallback to
                             # old style detection
                                 # but the browser is the bottleneck.
                                 if not self.show_full_diff and exceeds_limit:
                                     log.debug('File `%s` exceeds current file_limit of %s',
-                                              safe_unicode(head['b_path']), self.file_limit)
+                                              head['b_path'], self.file_limit)
-                                    raise DiffLimitExceeded(
+                                    raise DiffLimitExceeded(f'File Limit {self.file_limit} Exceeded')
-                                        'File Limit %s Exceeded', self.file_limit)
                                 self._check_large_diff()
                                     stats['ops'][MOD_FILENODE] = 'modified file'
                             except DiffLimitExceeded:
-                                diff_container = lambda _diff: \
+                                def limited_diff_container(_diff):
-                                    LimitedDiffContainer(
+                                    return LimitedDiffContainer(self.diff_limit, self.cur_diff_size, _diff)
-                                        self.diff_limit, self.cur_diff_size, _diff)
+                                # re-definition of our container wrapper
+                                diff_container = limited_diff_container
                                 limited_diff = True
                                 chunks = []
                         else:  # GIT format binary patch, or possibly empty diff
                             if head['bin_patch']:
                                 # we have operation already extracted, but we mark simply
-                                # it's a diff we wont show for binary files
+                                # it's a diff we won't show for binary files
                                 stats['ops'][BIN_FILENODE] = 'binary diff hidden'
                             chunks = []
                             # to see the content of the file
                             chunks = []
-                        chunks.insert(
+                        frag = [
-                            0, [{'old_lineno': '',
+                            {'old_lineno': '',
-                                 'new_lineno': '',
+                             'new_lineno': '',
-                                 'action': Action.CONTEXT,
+                             'action': Action.CONTEXT,
-                                 'line': msg,
+                             'line': msg,
-                                 } for _op, msg in stats['ops'].items()
+                             } for _op, msg in list(stats['ops'].items())
-                                if _op not in [MOD_FILENODE]])
+                            if _op not in [MOD_FILENODE]]
-                        original_filename = safe_unicode(head['a_path'])
+                        chunks.insert(0, frag)
+                        original_filename = safe_str(head['a_path'])
                         _files.append({
                             'original_filename': original_filename,
-                            'filename': safe_unicode(head['b_path']),
+                            'filename': safe_str(head['b_path']),
                             'old_revision': head['a_blob_id'],
                             'new_revision': head['b_blob_id'],
                             'chunks': chunks,
-                            'raw_diff': safe_unicode(raw_diff),
+                            'raw_diff': safe_str(raw_diff),
                             'operation': op,
                             'stats': stats,
                             'exceeds_limit': exceeds_limit,
                             'is_limited_diff': limited_diff,
                         })
-                    sorter = lambda info: {OPS.ADD: 0, OPS.MOD: 1,
+                    def sorter(info):
-                                           OPS.DEL: 2}.get(info['operation'])
+                        return {OPS.ADD: 0, OPS.MOD: 1, OPS.DEL: 2}.get(info['operation'])
                     return diff_container(sorted(_files, key=sorter))
                 # FIXME: NEWDIFFS: dan: this gets replaced by _new_parse_lines
                             line = next(diff_iter)
                             while old_line < old_end or new_line < new_end:
-                                command = ' '
+                                command = b' '
                                 if line:
                                     command = line[0]
                                 affects_old = affects_new = False
                                 # ignore those if we don't expect them
-                                if command in '#@':
+                                if command in b'#@':
                                     continue
-                                elif command == '+':
+                                elif command == b'+':
                                     affects_new = True
                                     action = Action.ADD
                                     stats[0] += 1
-                                elif command == '-':
+                                elif command == b'-':
                                     affects_old = True
                                     action = Action.DELETE
                                     stats[1] += 1
                                     old_line += affects_old
                                     new_line += affects_new
                                     lines.append({
-                                        'old_lineno':   affects_old and old_line or '',
+                                        'old_lineno':   affects_old and old_line or b'',
-                                        'new_lineno':   affects_new and new_line or '',
+                                        'new_lineno':   affects_new and new_line or b'',
                                         'action':       action,
                                         'line':         self._clean_line(line, command)
                                     })
                     try:
                         line = next(diff_iter)
+                        assert isinstance(line, bytes)
                         while line:
                             raw_diff.append(line)
                                 break
                             gr = match.groups()
                             (old_line, old_end,
                              new_line, new_end) = [int(x or 1) for x in gr[:-1]]
                             old_line -= 1
                             new_line -= 1
-                            context = len(gr) == 5
+                            len(gr) == 5
                             old_end += old_line
                             new_end += new_line
                             while old_line < old_end or new_line < new_end:
                                 command = ' '
                                 if line:
-                                    command = line[0]
+                                    # This is bytes, so we need to convert it to a str
+                                    command: str = chr(line[0])
                                 affects_old = affects_new = False
                                     old_line += affects_old
                                     new_line += affects_new
                                     lines.append({
-                                        'old_lineno':   affects_old and old_line or '',
+                                        'old_lineno':   affects_old and old_line or None,
-                                        'new_lineno':   affects_new and new_line or '',
+                                        'new_lineno':   affects_new and new_line or None,
                                         'action':       action,
                                         'line':         self._clean_line(line, command)
                                     })
                     except StopIteration:
                         pass
-                    return ''.join(raw_diff), chunks, stats
+                    return b''.join(raw_diff), chunks, stats
                 def _safe_id(self, idstring):
                     """Make a string safe for including in an id attribute.
                     """
                     # Transform all whitespace to underscore
-                    idstring = re.sub(r'\s', "_", '%s' % idstring)
+                    idstring = re.sub(r'\s', "_", f'{idstring}')
                     # Remove everything that is not a hyphen or a member of \w
                     idstring = re.sub(r'(?!-)\W', "", idstring).lower()
                     return idstring
                 @classmethod
-                def diff_splitter(cls, string):
+                def diff_splitter(cls, diff_string: bytes):
                     """
                     Diff split that emulates .splitlines() but works only on \n
                     """
-                    if not string:
+                    if not diff_string:
                         return
-                    elif string == '\n':
+                    elif diff_string == b'\n':
-                        yield '\n'
+                        yield b'\n'
                     else:
-                        has_newline = string.endswith('\n')
+                        has_newline = diff_string.endswith(b'\n')
-                        elements = string.split('\n')
+                        elements = diff_string.split(b'\n')
                         if has_newline:
                             # skip last element as it's empty string from newlines
                             elements = elements[:-1]
                         for cnt, line in enumerate(elements, start=1):
                             last_line = cnt == len_elements
                             if last_line and not has_newline:
-                                yield safe_unicode(line)
+                                yield line
                             else:
-                                yield safe_unicode(line) + '\n'
+                                yield line + b'\n'
                 def prepare(self, inline_diff=True):
                     """
                     """
                     Returns raw diff as a byte string
                     """
-                    return self._diff.raw
+                    return self._diff.raw.tobytes()
-                def as_html(self, table_class='code-difftable', line_class='line',
-                            old_lineno_class='lineno old', new_lineno_class='lineno new',
-                            code_class='code', enable_comments=False, parsed_lines=None):
-                    """
-                    Return given diff as html table with customized css classes
-                    """
-                    # TODO(marcink): not sure how to pass in translator
-                    # here in an efficient way, leave the _ for proper gettext extraction
-                    _ = lambda s: s
-                    def _link_to_if(condition, label, url):
-                        """
-                        Generates a link if condition is meet or just the label if not.
-                        """
-                        if condition:
-                            return '''<a href="%(url)s" class="tooltip"
-                            title="%(title)s">%(label)s</a>''' % {
-                                'title': _('Click to select line'),
-                                'url': url,
-                                'label': label
-                        else:
-                            return label
-                    if not self.parsed:
-                        self.prepare()
-                    diff_lines = self.parsed_diff
-                    if parsed_lines:
-                        diff_lines = parsed_lines
-                    _html_empty = True
-                    _html = []
-                    _html.append('''<table class="%(table_class)s">\n''' % {
-                        'table_class': table_class
-                    })
-                    for diff in diff_lines:
-                        for line in diff['chunks']:
-                            _html_empty = False
-                            for change in line:
-                                _html.append('''<tr class="%(lc)s %(action)s">\n''' % {
-                                    'lc': line_class,
-                                    'action': change['action']
-                                })
-                                anchor_old_id = ''
-                                anchor_new_id = ''
-                                anchor_old = "%(filename)s_o%(oldline_no)s" % {
-                                    'filename': self._safe_id(diff['filename']),
-                                    'oldline_no': change['old_lineno']
-                                anchor_new = "%(filename)s_n%(oldline_no)s" % {
-                                    'filename': self._safe_id(diff['filename']),
-                                    'oldline_no': change['new_lineno']
-                                cond_old = (change['old_lineno'] != '...' and
-                                            change['old_lineno'])
-                                cond_new = (change['new_lineno'] != '...' and
-                                            change['new_lineno'])
-                                if cond_old:
-                                    anchor_old_id = 'id="%s"' % anchor_old
-                                if cond_new:
-                                    anchor_new_id = 'id="%s"' % anchor_new
-                                if change['action'] != Action.CONTEXT:
-                                    anchor_link = True
-                                else:
-                                    anchor_link = False
-                                ###########################################################
-                                # COMMENT ICONS
-                                ###########################################################
-                                _html.append('''\t<td class="add-comment-line"><span class="add-comment-content">''')
-                                if enable_comments and change['action'] != Action.CONTEXT:
-                                    _html.append('''<a href="#"><span class="icon-comment-add"></span></a>''')
-                                _html.append('''</span></td><td class="comment-toggle tooltip" title="Toggle Comment Thread"><i class="icon-comment"></i></td>\n''')
-                                ###########################################################
-                                # OLD LINE NUMBER
-                                ###########################################################
-                                _html.append('''\t<td %(a_id)s class="%(olc)s">''' % {
-                                    'a_id': anchor_old_id,
-                                    'olc': old_lineno_class
-                                })
-                                _html.append('''%(link)s''' % {
-                                    'link': _link_to_if(anchor_link, change['old_lineno'],
-                                                        '#%s' % anchor_old)
-                                })
-                                _html.append('''</td>\n''')
-                                ###########################################################
-                                # NEW LINE NUMBER
-                                ###########################################################
-                                _html.append('''\t<td %(a_id)s class="%(nlc)s">''' % {
-                                    'a_id': anchor_new_id,
-                                    'nlc': new_lineno_class
-                                })
-                                _html.append('''%(link)s''' % {
-                                    'link': _link_to_if(anchor_link, change['new_lineno'],
-                                                        '#%s' % anchor_new)
-                                })
-                                _html.append('''</td>\n''')
-                                ###########################################################
-                                # CODE
-                                ###########################################################
-                                code_classes = [code_class]
-                                if (not enable_comments or
-                                        change['action'] == Action.CONTEXT):
-                                    code_classes.append('no-comment')
-                                _html.append('\t<td class="%s">' % ' '.join(code_classes))
-                                _html.append('''\n\t\t<pre>%(code)s</pre>\n''' % {
-                                    'code': change['line']
-                                })
-                                _html.append('''\t</td>''')
-                                _html.append('''\n</tr>\n''')
-                    _html.append('''</table>''')
-                    if _html_empty:
-                        return None
-                    return ''.join(_html)
                 def stat(self):
                     """
                     return self.adds, self.removes
                 def get_context_of_line(
-                        self, path, diff_line=None, context_before=3, context_after=3):
+                        self, path, diff_line: DiffLineNumber = None, context_before: int = 3, context_after: int = 3):
                     """
                     Returns the context lines for the specified diff line.
-                    :type diff_line: :class:`DiffLineNumber`
                     """
                     assert self.parsed, "DiffProcessor is not initialized."
                     if None not in diff_line:
-                        raise ValueError(
+                        raise ValueError(f"Cannot specify both line numbers in diff_line: {diff_line}")
-                            "Cannot specify both line numbers: {}".format(diff_line))
                     file_diff = self._get_file_diff(path)
                     chunk, idx = self._find_chunk_line_index(file_diff, diff_line)
                     first_line_to_include = max(idx - context_before, 0)
                     first_line_after_context = idx + context_after + 1
-                    context_lines = chunk[first_line_to_include:first_line_after_context]
+                    context_lines = chunk['lines'][first_line_to_include:first_line_after_context]
                     line_contents = [
                         _context_line(line) for line in context_lines
-                        if _is_diff_content(line)]
+                        if _is_diff_content(line)
+                    ]
                     # TODO: johbo: Interim fixup, the diff chunks drop the final newline.
                     # Once they are fixed, we can drop this line here.
                     if line_contents:
                         line_contents[-1] = (
-                            line_contents[-1][0], line_contents[-1][1].rstrip('\n') + '\n')
+                            line_contents[-1][0], line_contents[-1][1].rstrip(b'\n') + b'\n')
                     return line_contents
                 def find_context(self, path, context, offset=0):
                     file_diff = self._get_file_diff(path)
                     for chunk in file_diff['chunks']:
+                        if not isinstance(chunk, dict):
+                            continue
                         context_iter = iter(context)
-                        for line_idx, line in enumerate(chunk):
+                        for line_idx, line in enumerate(chunk['lines']):
                             try:
                                 if _context_line(line) == next(context_iter):
                                     continue
                     effective_offset = len(context) - offset
                     found_at_diff_lines = [
-                        _line_to_diff_line_number(chunk[idx - effective_offset])
+                        _line_to_diff_line_number(chunk['lines'][idx - effective_offset])
                         for idx, chunk in matches]
                     return found_at_diff_lines
                         if file_diff['filename'] == path:
                             break
                     else:
-                        raise FileNotInDiffException("File {} not in diff".format(path))
+                        raise FileNotInDiffException(f"File {path} not in diff")
                     return file_diff
                 def _find_chunk_line_index(self, file_diff, diff_line):
                     for chunk in file_diff['chunks']:
-                        for idx, line in enumerate(chunk):
+                        if not isinstance(chunk, dict):
-                            if line['old_lineno'] == diff_line.old:
+                            continue
-                                return chunk, idx
+                        for line_idx, line in enumerate(chunk['lines']):
-                            if line['new_lineno'] == diff_line.new:
+                            if diff_line.old and line['old_lineno'] == diff_line.old:
-                                return chunk, idx
+                                return chunk, line_idx
-                    raise LineNotInDiffException(
+                            if diff_line.new and line['new_lineno'] == diff_line.new:
-                        "The line {} is not part of the diff.".format(diff_line))
+                                return chunk, line_idx
+                    raise LineNotInDiffException(f"The line {diff_line} is not part of the diff.")
             def _is_diff_content(line):
             def _context_line(line):
-                return (line['action'], line['line'])
+                return line['action'], line['line']
-            DiffLineNumber = collections.namedtuple('DiffLineNumber', ['old', 'new'])
             def _line_to_diff_line_number(line):
                         with bz2.BZ2File(cached_diff_file, 'wb') as f:
                             pickle.dump(struct, f)
                 except Exception:
-                    log.warn('Failed to save cache', exc_info=True)
+                    log.warning('Failed to save cache', exc_info=True)
                     _cleanup_cache_file(cached_diff_file)
                 log.debug('Saved diff cache under %s in %.4fs', cached_diff_file, time.time() - start)
                         with bz2.BZ2File(cached_diff_file, 'rb') as f:
                             data = pickle.load(f)
                 except Exception:
-                    log.warn('Failed to read diff cache file', exc_info=True)
+                    log.warning('Failed to read diff cache file', exc_info=True)
                 if not data:
                     data = default_struct
                     return input_param or None  # prevent empty string arguments
                 return '_'.join([
-                    '{}' for i in range(len(args))]).format(*map(arg_mapper, args))
+                    '{}' for _i in range(len(args))]).format(*list(map(arg_mapper, args)))
             def diff_cache_exist(cache_storage, *args):
                 cache_file_path = os.path.join(cache_storage, cache_key)
                 # prevent path traversal attacks using some param that have e.g '../../'
                 if not os.path.abspath(cache_file_path).startswith(cache_storage):
-                    raise ValueError('Final path must be within {}'.format(cache_storage))
+                    raise ValueError(f'Final path must be within {cache_storage}')
                 return cache_file_path

General Comments 0

Write
Preview

You need to be logged in to leave comments. Log in now

No TODOs yet

	Site-wide shortcuts
/	Use quick search box
g h	Go to home page
g g	Go to my private gists page
g G	Go to my public gists page
g 0-9	Go to bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Go to summary page
g c	Go to changelog page
g f	Go to files page
g F	Go to files page with file search activated
g p	Go to pull requests page
g o	Go to repository settings
g O	Go to repository access permissions settings
t s	Toggle sidebar on some pages