##// END OF EJS Templates
nodes: expose line counts in node information. This would be used in full text search
marcink -
r3962:605faead default
parent child Browse files
Show More
@@ -1,870 +1,875 b''
1 # -*- coding: utf-8 -*-
1 # -*- coding: utf-8 -*-
2
2
3 # Copyright (C) 2014-2019 RhodeCode GmbH
3 # Copyright (C) 2014-2019 RhodeCode GmbH
4 #
4 #
5 # This program is free software: you can redistribute it and/or modify
5 # This program is free software: you can redistribute it and/or modify
6 # it under the terms of the GNU Affero General Public License, version 3
6 # it under the terms of the GNU Affero General Public License, version 3
7 # (only), as published by the Free Software Foundation.
7 # (only), as published by the Free Software Foundation.
8 #
8 #
9 # This program is distributed in the hope that it will be useful,
9 # This program is distributed in the hope that it will be useful,
10 # but WITHOUT ANY WARRANTY; without even the implied warranty of
10 # but WITHOUT ANY WARRANTY; without even the implied warranty of
11 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
11 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 # GNU General Public License for more details.
12 # GNU General Public License for more details.
13 #
13 #
14 # You should have received a copy of the GNU Affero General Public License
14 # You should have received a copy of the GNU Affero General Public License
15 # along with this program. If not, see <http://www.gnu.org/licenses/>.
15 # along with this program. If not, see <http://www.gnu.org/licenses/>.
16 #
16 #
17 # This program is dual-licensed. If you wish to learn more about the
17 # This program is dual-licensed. If you wish to learn more about the
18 # RhodeCode Enterprise Edition, including its added features, Support services,
18 # RhodeCode Enterprise Edition, including its added features, Support services,
19 # and proprietary license terms, please see https://rhodecode.com/licenses/
19 # and proprietary license terms, please see https://rhodecode.com/licenses/
20
20
21 """
21 """
22 Module holding everything related to vcs nodes, with vcs2 architecture.
22 Module holding everything related to vcs nodes, with vcs2 architecture.
23 """
23 """
24
24
25 import os
25 import os
26 import stat
26 import stat
27
27
28 from zope.cachedescriptors.property import Lazy as LazyProperty
28 from zope.cachedescriptors.property import Lazy as LazyProperty
29
29
30 import rhodecode
30 import rhodecode
31 from rhodecode.config.conf import LANGUAGES_EXTENSIONS_MAP
31 from rhodecode.config.conf import LANGUAGES_EXTENSIONS_MAP
32 from rhodecode.lib.utils import safe_unicode, safe_str
32 from rhodecode.lib.utils import safe_unicode, safe_str
33 from rhodecode.lib.utils2 import md5
33 from rhodecode.lib.utils2 import md5
34 from rhodecode.lib.vcs import path as vcspath
34 from rhodecode.lib.vcs import path as vcspath
35 from rhodecode.lib.vcs.backends.base import EmptyCommit, FILEMODE_DEFAULT
35 from rhodecode.lib.vcs.backends.base import EmptyCommit, FILEMODE_DEFAULT
36 from rhodecode.lib.vcs.conf.mtypes import get_mimetypes_db
36 from rhodecode.lib.vcs.conf.mtypes import get_mimetypes_db
37 from rhodecode.lib.vcs.exceptions import NodeError, RemovedFileNodeError
37 from rhodecode.lib.vcs.exceptions import NodeError, RemovedFileNodeError
38
38
39 LARGEFILE_PREFIX = '.hglf'
39 LARGEFILE_PREFIX = '.hglf'
40
40
41
41
class NodeKind:
    """Enumeration of node types a repository tree can contain."""
    SUBMODULE = -1  # pointer to another repository
    DIR = 1         # directory / tree
    FILE = 2        # regular file
    LARGEFILE = 3   # file stored in a largefile store (e.g. .hglf)
47
47
48
48
class NodeState:
    """Possible states of a node relative to its commit's changeset."""
    ADDED = u'added'
    CHANGED = u'changed'
    NOT_CHANGED = u'not changed'
    REMOVED = u'removed'
54
54
55
55
class NodeGeneratorBase(object):
    """
    Lazy generator base for added/changed/removed filenodes.

    Filenodes are materialized only on iteration, slicing or call;
    ``len()`` is answered from the path list without building any node.
    """

    def __init__(self, current_paths, cs):
        self.cs = cs
        self.current_paths = current_paths

    def __call__(self):
        # materialize all nodes at once
        return list(self)

    def __getslice__(self, i, j):
        for node_path in self.current_paths[i:j]:
            yield self.cs.get_node(node_path)

    def __len__(self):
        return len(self.current_paths)

    def __iter__(self):
        for node_path in self.current_paths:
            yield self.cs.get_node(node_path)
81
81
82
82
class AddedFileNodesGenerator(NodeGeneratorBase):
    """
    Lazy generator over the files added in the current commit.
    """
87
87
88
88
class ChangedFileNodesGenerator(NodeGeneratorBase):
    """
    Lazy generator over the files changed in the current commit.
    """
93
93
94
94
class RemovedFileNodesGenerator(NodeGeneratorBase):
    """
    Lazy generator over the files removed in the current commit.

    Removed paths no longer exist in the commit, so placeholder
    ``RemovedFileNode`` objects are yielded instead of real filenodes.
    """

    def __iter__(self):
        for node_path in self.current_paths:
            yield RemovedFileNode(path=node_path)

    def __getslice__(self, i, j):
        for node_path in self.current_paths[i:j]:
            yield RemovedFileNode(path=node_path)
106
106
107
107
class Node(object):
    """
    Simplest class representing file or directory on repository. SCM backends
    should use ``FileNode`` and ``DirNode`` subclasses rather than ``Node``
    directly.

    Node's ``path`` cannot start with slash as we operate on *relative* paths
    only. Moreover, every single node is identified by the ``path`` attribute,
    so it cannot end with slash, too. Otherwise, path could lead to mistakes.
    """
    # RTLO marker allows swapping text, and certain security attacks could
    # be used with this
    RTLO_MARKER = u"\u202E"
    commit = None

    def __init__(self, path, kind):
        """
        :param path: relative path of the node inside the repository
        :param kind: one of the ``NodeKind`` constants
        :raises NodeError: on absolute path, empty non-dir path, or a
            file-kind root node
        """
        self._validate_path(path)  # can throw exception if path is invalid
        self.path = safe_str(path.rstrip('/'))  # we store paths as str
        if path == '' and kind != NodeKind.DIR:
            raise NodeError("Only DirNode and its subclasses may be "
                            "initialized with empty path")
        self.kind = kind

        if self.is_root() and not self.is_dir():
            raise NodeError("Root node cannot be FILE kind")

    def _validate_path(self, path):
        # only relative paths are supported; leading slash is a hard error
        if path.startswith('/'):
            raise NodeError(
                "Cannot initialize Node objects with slash at "
                "the beginning as only relative paths are supported. "
                "Got %s" % (path,))

    @LazyProperty
    def parent(self):
        """Parent node, bound to the same commit when one is attached."""
        parent_path = self.get_parent_path()
        if parent_path:
            if self.commit:
                return self.commit.get_node(parent_path)
            return DirNode(parent_path)
        return None

    @LazyProperty
    def unicode_path(self):
        return safe_unicode(self.path)

    @LazyProperty
    def has_rtlo(self):
        """Detects if a path has right-to-left-override marker"""
        return self.RTLO_MARKER in self.unicode_path

    @LazyProperty
    def unicode_path_safe(self):
        """
        Special SAFE representation of path without the right-to-left-override.
        This should be only used for "showing" the file, cannot be used for any
        urls etc.
        """
        return safe_unicode(self.path).replace(self.RTLO_MARKER, '')

    @LazyProperty
    def dir_path(self):
        """
        Returns name of the directory from full path of this vcs node. Empty
        string is returned if there's no directory in the path
        """
        _parts = self.path.rstrip('/').rsplit('/', 1)
        if len(_parts) == 2:
            return safe_unicode(_parts[0])
        return u''

    @LazyProperty
    def name(self):
        """
        Returns name of the node so if its path
        then only last part is returned.
        """
        return safe_unicode(self.path.rstrip('/').split('/')[-1])

    @property
    def kind(self):
        return self._kind

    @kind.setter
    def kind(self, kind):
        # kind is write-once; changing it would break path invariants
        if hasattr(self, '_kind'):
            raise NodeError("Cannot change node's kind")
        else:
            self._kind = kind
            # Post setter check (path's trailing slash)
            if self.path.endswith('/'):
                raise NodeError("Node's path cannot end with slash")

    def __cmp__(self, other):
        """
        Comparator using name of the node, needed for quick list sorting.
        """
        kind_cmp = cmp(self.kind, other.kind)
        if kind_cmp:
            if isinstance(self, SubModuleNode):
                # we make submodules equal to dirnode for "sorting" purposes
                return NodeKind.DIR
            return kind_cmp
        return cmp(self.name, other.name)

    def __eq__(self, other):
        for attr in ['name', 'path', 'kind']:
            if getattr(self, attr) != getattr(other, attr):
                return False
        if self.is_file():
            if self.content != other.content:
                return False
        else:
            # For DirNode's check without entering each dir
            self_nodes_paths = list(sorted(n.path for n in self.nodes))
            # bugfix: this previously iterated ``self.nodes`` for both
            # sides, so any two DirNodes with equal name/path/kind compared
            # equal regardless of their children
            other_nodes_paths = list(sorted(n.path for n in other.nodes))
            if self_nodes_paths != other_nodes_paths:
                return False
        return True

    def __ne__(self, other):
        return not self.__eq__(other)

    def __repr__(self):
        return '<%s %r>' % (self.__class__.__name__, self.path)

    def __str__(self):
        return self.__repr__()

    def __unicode__(self):
        return self.name

    def get_parent_path(self):
        """
        Returns node's parent path or empty string if node is root.
        """
        if self.is_root():
            return ''
        return vcspath.dirname(self.path.rstrip('/')) + '/'

    def is_file(self):
        """
        Returns ``True`` if node's kind is ``NodeKind.FILE``, ``False``
        otherwise.
        """
        return self.kind == NodeKind.FILE

    def is_dir(self):
        """
        Returns ``True`` if node's kind is ``NodeKind.DIR``, ``False``
        otherwise.
        """
        return self.kind == NodeKind.DIR

    def is_root(self):
        """
        Returns ``True`` if node is a root node and ``False`` otherwise.
        """
        return self.kind == NodeKind.DIR and self.path == ''

    def is_submodule(self):
        """
        Returns ``True`` if node's kind is ``NodeKind.SUBMODULE``, ``False``
        otherwise.
        """
        return self.kind == NodeKind.SUBMODULE

    def is_largefile(self):
        """
        Returns ``True`` if node's kind is ``NodeKind.LARGEFILE``, ``False``
        otherwise
        """
        return self.kind == NodeKind.LARGEFILE

    def is_link(self):
        if self.commit:
            return self.commit.is_link(self.path)
        return False

    @LazyProperty
    def added(self):
        return self.state is NodeState.ADDED

    @LazyProperty
    def changed(self):
        return self.state is NodeState.CHANGED

    @LazyProperty
    def not_changed(self):
        return self.state is NodeState.NOT_CHANGED

    @LazyProperty
    def removed(self):
        return self.state is NodeState.REMOVED
302
302
303
303
class FileNode(Node):
    """
    Class representing file nodes.

    :attribute: path: path to the node, relative to repository's root
    :attribute: content: if given arbitrary sets content of the file
    :attribute: commit: if given, first time content is accessed, callback
    :attribute: mode: stat mode for a node. Default is `FILEMODE_DEFAULT`.
    """
    # attribute names that must never be eagerly computed via ``pre_load``
    _filter_pre_load = []

    def __init__(self, path, content=None, commit=None, mode=None, pre_load=None):
        """
        Only one of ``content`` and ``commit`` may be given. Passing both
        would raise ``NodeError`` exception.

        :param path: relative path to the node
        :param content: content may be passed to constructor
        :param commit: if given, will use it to lazily fetch content
        :param mode: ST_MODE (i.e. 0100644)
        """
        if content and commit:
            raise NodeError("Cannot use both content and commit")
        super(FileNode, self).__init__(path, kind=NodeKind.FILE)
        self.commit = commit
        self._content = content
        self._mode = mode or FILEMODE_DEFAULT
        self._set_bulk_properties(pre_load)
333
333
334 def _set_bulk_properties(self, pre_load):
334 def _set_bulk_properties(self, pre_load):
335 if not pre_load:
335 if not pre_load:
336 return
336 return
337 pre_load = [entry for entry in pre_load
337 pre_load = [entry for entry in pre_load
338 if entry not in self._filter_pre_load]
338 if entry not in self._filter_pre_load]
339 if not pre_load:
339 if not pre_load:
340 return
340 return
341
341
342 for attr_name in pre_load:
342 for attr_name in pre_load:
343 result = getattr(self, attr_name)
343 result = getattr(self, attr_name)
344 if callable(result):
344 if callable(result):
345 result = result()
345 result = result()
346 self.__dict__[attr_name] = result
346 self.__dict__[attr_name] = result
347
347
348 @LazyProperty
348 @LazyProperty
349 def mode(self):
349 def mode(self):
350 """
350 """
351 Returns lazily mode of the FileNode. If `commit` is not set, would
351 Returns lazily mode of the FileNode. If `commit` is not set, would
352 use value given at initialization or `FILEMODE_DEFAULT` (default).
352 use value given at initialization or `FILEMODE_DEFAULT` (default).
353 """
353 """
354 if self.commit:
354 if self.commit:
355 mode = self.commit.get_file_mode(self.path)
355 mode = self.commit.get_file_mode(self.path)
356 else:
356 else:
357 mode = self._mode
357 mode = self._mode
358 return mode
358 return mode
359
359
360 @LazyProperty
360 @LazyProperty
361 def raw_bytes(self):
361 def raw_bytes(self):
362 """
362 """
363 Returns lazily the raw bytes of the FileNode.
363 Returns lazily the raw bytes of the FileNode.
364 """
364 """
365 if self.commit:
365 if self.commit:
366 if self._content is None:
366 if self._content is None:
367 self._content = self.commit.get_file_content(self.path)
367 self._content = self.commit.get_file_content(self.path)
368 content = self._content
368 content = self._content
369 else:
369 else:
370 content = self._content
370 content = self._content
371 return content
371 return content
372
372
373 def stream_bytes(self):
373 def stream_bytes(self):
374 """
374 """
375 Returns an iterator that will stream the content of the file directly from
375 Returns an iterator that will stream the content of the file directly from
376 vcsserver without loading it to memory.
376 vcsserver without loading it to memory.
377 """
377 """
378 if self.commit:
378 if self.commit:
379 return self.commit.get_file_content_streamed(self.path)
379 return self.commit.get_file_content_streamed(self.path)
380 raise NodeError("Cannot retrieve stream_bytes without related commit attribute")
380 raise NodeError("Cannot retrieve stream_bytes without related commit attribute")
381
381
382 @LazyProperty
382 @LazyProperty
383 def md5(self):
383 def md5(self):
384 """
384 """
385 Returns md5 of the file node.
385 Returns md5 of the file node.
386 """
386 """
387 return md5(self.raw_bytes)
387 return md5(self.raw_bytes)
388
388
389 def metadata_uncached(self):
389 def metadata_uncached(self):
390 """
390 """
391 Returns md5, binary flag of the file node, without any cache usage.
391 Returns md5, binary flag of the file node, without any cache usage.
392 """
392 """
393
393
394 content = self.content_uncached()
394 content = self.content_uncached()
395
395
396 is_binary = content and '\0' in content
396 is_binary = content and '\0' in content
397 size = 0
397 size = 0
398 if content:
398 if content:
399 size = len(content)
399 size = len(content)
400
400
401 return is_binary, md5(content), size, content
401 return is_binary, md5(content), size, content
402
402
403 def content_uncached(self):
403 def content_uncached(self):
404 """
404 """
405 Returns lazily content of the FileNode. If possible, would try to
405 Returns lazily content of the FileNode. If possible, would try to
406 decode content from UTF-8.
406 decode content from UTF-8.
407 """
407 """
408 if self.commit:
408 if self.commit:
409 content = self.commit.get_file_content(self.path)
409 content = self.commit.get_file_content(self.path)
410 else:
410 else:
411 content = self._content
411 content = self._content
412 return content
412 return content
413
413
414 @LazyProperty
414 @LazyProperty
415 def content(self):
415 def content(self):
416 """
416 """
417 Returns lazily content of the FileNode. If possible, would try to
417 Returns lazily content of the FileNode. If possible, would try to
418 decode content from UTF-8.
418 decode content from UTF-8.
419 """
419 """
420 content = self.raw_bytes
420 content = self.raw_bytes
421
421
422 if self.is_binary:
422 if self.is_binary:
423 return content
423 return content
424 return safe_unicode(content)
424 return safe_unicode(content)
425
425
426 @LazyProperty
426 @LazyProperty
427 def size(self):
427 def size(self):
428 if self.commit:
428 if self.commit:
429 return self.commit.get_file_size(self.path)
429 return self.commit.get_file_size(self.path)
430 raise NodeError(
430 raise NodeError(
431 "Cannot retrieve size of the file without related "
431 "Cannot retrieve size of the file without related "
432 "commit attribute")
432 "commit attribute")
433
433
434 @LazyProperty
434 @LazyProperty
435 def message(self):
435 def message(self):
436 if self.commit:
436 if self.commit:
437 return self.last_commit.message
437 return self.last_commit.message
438 raise NodeError(
438 raise NodeError(
439 "Cannot retrieve message of the file without related "
439 "Cannot retrieve message of the file without related "
440 "commit attribute")
440 "commit attribute")
441
441
442 @LazyProperty
442 @LazyProperty
443 def last_commit(self):
443 def last_commit(self):
444 if self.commit:
444 if self.commit:
445 pre_load = ["author", "date", "message", "parents"]
445 pre_load = ["author", "date", "message", "parents"]
446 return self.commit.get_path_commit(self.path, pre_load=pre_load)
446 return self.commit.get_path_commit(self.path, pre_load=pre_load)
447 raise NodeError(
447 raise NodeError(
448 "Cannot retrieve last commit of the file without "
448 "Cannot retrieve last commit of the file without "
449 "related commit attribute")
449 "related commit attribute")
450
450
451 def get_mimetype(self):
451 def get_mimetype(self):
452 """
452 """
453 Mimetype is calculated based on the file's content. If ``_mimetype``
453 Mimetype is calculated based on the file's content. If ``_mimetype``
454 attribute is available, it will be returned (backends which store
454 attribute is available, it will be returned (backends which store
455 mimetypes or can easily recognize them, should set this private
455 mimetypes or can easily recognize them, should set this private
456 attribute to indicate that type should *NOT* be calculated).
456 attribute to indicate that type should *NOT* be calculated).
457 """
457 """
458
458
459 if hasattr(self, '_mimetype'):
459 if hasattr(self, '_mimetype'):
460 if (isinstance(self._mimetype, (tuple, list,)) and
460 if (isinstance(self._mimetype, (tuple, list,)) and
461 len(self._mimetype) == 2):
461 len(self._mimetype) == 2):
462 return self._mimetype
462 return self._mimetype
463 else:
463 else:
464 raise NodeError('given _mimetype attribute must be an 2 '
464 raise NodeError('given _mimetype attribute must be an 2 '
465 'element list or tuple')
465 'element list or tuple')
466
466
467 db = get_mimetypes_db()
467 db = get_mimetypes_db()
468 mtype, encoding = db.guess_type(self.name)
468 mtype, encoding = db.guess_type(self.name)
469
469
470 if mtype is None:
470 if mtype is None:
471 if self.is_binary:
471 if self.is_binary:
472 mtype = 'application/octet-stream'
472 mtype = 'application/octet-stream'
473 encoding = None
473 encoding = None
474 else:
474 else:
475 mtype = 'text/plain'
475 mtype = 'text/plain'
476 encoding = None
476 encoding = None
477
477
478 # try with pygments
478 # try with pygments
479 try:
479 try:
480 from pygments.lexers import get_lexer_for_filename
480 from pygments.lexers import get_lexer_for_filename
481 mt = get_lexer_for_filename(self.name).mimetypes
481 mt = get_lexer_for_filename(self.name).mimetypes
482 except Exception:
482 except Exception:
483 mt = None
483 mt = None
484
484
485 if mt:
485 if mt:
486 mtype = mt[0]
486 mtype = mt[0]
487
487
488 return mtype, encoding
488 return mtype, encoding
489
489
490 @LazyProperty
490 @LazyProperty
491 def mimetype(self):
491 def mimetype(self):
492 """
492 """
493 Wrapper around full mimetype info. It returns only type of fetched
493 Wrapper around full mimetype info. It returns only type of fetched
494 mimetype without the encoding part. use get_mimetype function to fetch
494 mimetype without the encoding part. use get_mimetype function to fetch
495 full set of (type,encoding)
495 full set of (type,encoding)
496 """
496 """
497 return self.get_mimetype()[0]
497 return self.get_mimetype()[0]
498
498
499 @LazyProperty
499 @LazyProperty
500 def mimetype_main(self):
500 def mimetype_main(self):
501 return self.mimetype.split('/')[0]
501 return self.mimetype.split('/')[0]
502
502
503 @classmethod
503 @classmethod
504 def get_lexer(cls, filename, content=None):
504 def get_lexer(cls, filename, content=None):
505 from pygments import lexers
505 from pygments import lexers
506
506
507 extension = filename.split('.')[-1]
507 extension = filename.split('.')[-1]
508 lexer = None
508 lexer = None
509
509
510 try:
510 try:
511 lexer = lexers.guess_lexer_for_filename(
511 lexer = lexers.guess_lexer_for_filename(
512 filename, content, stripnl=False)
512 filename, content, stripnl=False)
513 except lexers.ClassNotFound:
513 except lexers.ClassNotFound:
514 lexer = None
514 lexer = None
515
515
516 # try our EXTENSION_MAP
516 # try our EXTENSION_MAP
517 if not lexer:
517 if not lexer:
518 try:
518 try:
519 lexer_class = LANGUAGES_EXTENSIONS_MAP.get(extension)
519 lexer_class = LANGUAGES_EXTENSIONS_MAP.get(extension)
520 if lexer_class:
520 if lexer_class:
521 lexer = lexers.get_lexer_by_name(lexer_class[0])
521 lexer = lexers.get_lexer_by_name(lexer_class[0])
522 except lexers.ClassNotFound:
522 except lexers.ClassNotFound:
523 lexer = None
523 lexer = None
524
524
525 if not lexer:
525 if not lexer:
526 lexer = lexers.TextLexer(stripnl=False)
526 lexer = lexers.TextLexer(stripnl=False)
527
527
528 return lexer
528 return lexer
529
529
530 @LazyProperty
530 @LazyProperty
531 def lexer(self):
531 def lexer(self):
532 """
532 """
533 Returns pygment's lexer class. Would try to guess lexer taking file's
533 Returns pygment's lexer class. Would try to guess lexer taking file's
534 content, name and mimetype.
534 content, name and mimetype.
535 """
535 """
536 return self.get_lexer(self.name, self.content)
536 return self.get_lexer(self.name, self.content)
537
537
538 @LazyProperty
538 @LazyProperty
539 def lexer_alias(self):
539 def lexer_alias(self):
540 """
540 """
541 Returns first alias of the lexer guessed for this file.
541 Returns first alias of the lexer guessed for this file.
542 """
542 """
543 return self.lexer.aliases[0]
543 return self.lexer.aliases[0]
544
544
545 @LazyProperty
545 @LazyProperty
546 def history(self):
546 def history(self):
547 """
547 """
548 Returns a list of commit for this file in which the file was changed
548 Returns a list of commit for this file in which the file was changed
549 """
549 """
550 if self.commit is None:
550 if self.commit is None:
551 raise NodeError('Unable to get commit for this FileNode')
551 raise NodeError('Unable to get commit for this FileNode')
552 return self.commit.get_path_history(self.path)
552 return self.commit.get_path_history(self.path)
553
553
554 @LazyProperty
554 @LazyProperty
555 def annotate(self):
555 def annotate(self):
556 """
556 """
557 Returns a list of three element tuples with lineno, commit and line
557 Returns a list of three element tuples with lineno, commit and line
558 """
558 """
559 if self.commit is None:
559 if self.commit is None:
560 raise NodeError('Unable to get commit for this FileNode')
560 raise NodeError('Unable to get commit for this FileNode')
561 pre_load = ["author", "date", "message", "parents"]
561 pre_load = ["author", "date", "message", "parents"]
562 return self.commit.get_file_annotate(self.path, pre_load=pre_load)
562 return self.commit.get_file_annotate(self.path, pre_load=pre_load)
563
563
564 @LazyProperty
564 @LazyProperty
565 def state(self):
565 def state(self):
566 if not self.commit:
566 if not self.commit:
567 raise NodeError(
567 raise NodeError(
568 "Cannot check state of the node if it's not "
568 "Cannot check state of the node if it's not "
569 "linked with commit")
569 "linked with commit")
570 elif self.path in (node.path for node in self.commit.added):
570 elif self.path in (node.path for node in self.commit.added):
571 return NodeState.ADDED
571 return NodeState.ADDED
572 elif self.path in (node.path for node in self.commit.changed):
572 elif self.path in (node.path for node in self.commit.changed):
573 return NodeState.CHANGED
573 return NodeState.CHANGED
574 else:
574 else:
575 return NodeState.NOT_CHANGED
575 return NodeState.NOT_CHANGED
576
576
577 @LazyProperty
577 @LazyProperty
578 def is_binary(self):
578 def is_binary(self):
579 """
579 """
580 Returns True if file has binary content.
580 Returns True if file has binary content.
581 """
581 """
582 if self.commit:
582 if self.commit:
583 return self.commit.is_node_binary(self.path)
583 return self.commit.is_node_binary(self.path)
584 else:
584 else:
585 raw_bytes = self._content
585 raw_bytes = self._content
586 return raw_bytes and '\0' in raw_bytes
586 return raw_bytes and '\0' in raw_bytes
587
587
588 @LazyProperty
588 @LazyProperty
589 def extension(self):
589 def extension(self):
590 """Returns filenode extension"""
590 """Returns filenode extension"""
591 return self.name.split('.')[-1]
591 return self.name.split('.')[-1]
592
592
593 @property
593 @property
594 def is_executable(self):
594 def is_executable(self):
595 """
595 """
596 Returns ``True`` if file has executable flag turned on.
596 Returns ``True`` if file has executable flag turned on.
597 """
597 """
598 return bool(self.mode & stat.S_IXUSR)
598 return bool(self.mode & stat.S_IXUSR)
599
599
600 def get_largefile_node(self):
600 def get_largefile_node(self):
601 """
601 """
602 Try to return a Mercurial FileNode from this node. It does internal
602 Try to return a Mercurial FileNode from this node. It does internal
603 checks inside largefile store, if that file exist there it will
603 checks inside largefile store, if that file exist there it will
604 create special instance of LargeFileNode which can get content from
604 create special instance of LargeFileNode which can get content from
605 LF store.
605 LF store.
606 """
606 """
607 if self.commit:
607 if self.commit:
608 return self.commit.get_largefile_node(self.path)
608 return self.commit.get_largefile_node(self.path)
609
609
610 def count_lines(self, content, count_empty=False):
611
612 if count_empty:
613 all_lines = 0
614 empty_lines = 0
615 for line in content.splitlines(True):
616 if line == '\n':
617 empty_lines += 1
618 all_lines += 1
619
620 return all_lines, all_lines - empty_lines
621 else:
622 # fast method
623 empty_lines = all_lines = content.count('\n')
624 if all_lines == 0 and content:
625 # one-line without a newline
626 empty_lines = all_lines = 1
627
628 return all_lines, empty_lines
629
610 def lines(self, count_empty=False):
630 def lines(self, count_empty=False):
611 all_lines, empty_lines = 0, 0
631 all_lines, empty_lines = 0, 0
612
632
613 if not self.is_binary:
633 if not self.is_binary:
614 content = self.content
634 content = self.content
615 if count_empty:
635 all_lines, empty_lines = self.count_lines(content, count_empty=count_empty)
616 all_lines = 0
617 empty_lines = 0
618 for line in content.splitlines(True):
619 if line == '\n':
620 empty_lines += 1
621 all_lines += 1
622
623 return all_lines, all_lines - empty_lines
624 else:
625 # fast method
626 empty_lines = all_lines = content.count('\n')
627 if all_lines == 0 and content:
628 # one-line without a newline
629 empty_lines = all_lines = 1
630
631 return all_lines, empty_lines
636 return all_lines, empty_lines
632
637
633 def __repr__(self):
638 def __repr__(self):
634 return '<%s %r @ %s>' % (self.__class__.__name__, self.path,
639 return '<%s %r @ %s>' % (self.__class__.__name__, self.path,
635 getattr(self.commit, 'short_id', ''))
640 getattr(self.commit, 'short_id', ''))
636
641
637
642
638 class RemovedFileNode(FileNode):
643 class RemovedFileNode(FileNode):
639 """
644 """
640 Dummy FileNode class - trying to access any public attribute except path,
645 Dummy FileNode class - trying to access any public attribute except path,
641 name, kind or state (or methods/attributes checking those two) would raise
646 name, kind or state (or methods/attributes checking those two) would raise
642 RemovedFileNodeError.
647 RemovedFileNodeError.
643 """
648 """
644 ALLOWED_ATTRIBUTES = [
649 ALLOWED_ATTRIBUTES = [
645 'name', 'path', 'state', 'is_root', 'is_file', 'is_dir', 'kind',
650 'name', 'path', 'state', 'is_root', 'is_file', 'is_dir', 'kind',
646 'added', 'changed', 'not_changed', 'removed'
651 'added', 'changed', 'not_changed', 'removed'
647 ]
652 ]
648
653
649 def __init__(self, path):
654 def __init__(self, path):
650 """
655 """
651 :param path: relative path to the node
656 :param path: relative path to the node
652 """
657 """
653 super(RemovedFileNode, self).__init__(path=path)
658 super(RemovedFileNode, self).__init__(path=path)
654
659
655 def __getattribute__(self, attr):
660 def __getattribute__(self, attr):
656 if attr.startswith('_') or attr in RemovedFileNode.ALLOWED_ATTRIBUTES:
661 if attr.startswith('_') or attr in RemovedFileNode.ALLOWED_ATTRIBUTES:
657 return super(RemovedFileNode, self).__getattribute__(attr)
662 return super(RemovedFileNode, self).__getattribute__(attr)
658 raise RemovedFileNodeError(
663 raise RemovedFileNodeError(
659 "Cannot access attribute %s on RemovedFileNode" % attr)
664 "Cannot access attribute %s on RemovedFileNode" % attr)
660
665
661 @LazyProperty
666 @LazyProperty
662 def state(self):
667 def state(self):
663 return NodeState.REMOVED
668 return NodeState.REMOVED
664
669
665
670
666 class DirNode(Node):
671 class DirNode(Node):
667 """
672 """
668 DirNode stores list of files and directories within this node.
673 DirNode stores list of files and directories within this node.
669 Nodes may be used standalone but within repository context they
674 Nodes may be used standalone but within repository context they
670 lazily fetch data within same repository's commit.
675 lazily fetch data within same repository's commit.
671 """
676 """
672
677
673 def __init__(self, path, nodes=(), commit=None):
678 def __init__(self, path, nodes=(), commit=None):
674 """
679 """
675 Only one of ``nodes`` and ``commit`` may be given. Passing both
680 Only one of ``nodes`` and ``commit`` may be given. Passing both
676 would raise ``NodeError`` exception.
681 would raise ``NodeError`` exception.
677
682
678 :param path: relative path to the node
683 :param path: relative path to the node
679 :param nodes: content may be passed to constructor
684 :param nodes: content may be passed to constructor
680 :param commit: if given, will use it to lazily fetch content
685 :param commit: if given, will use it to lazily fetch content
681 """
686 """
682 if nodes and commit:
687 if nodes and commit:
683 raise NodeError("Cannot use both nodes and commit")
688 raise NodeError("Cannot use both nodes and commit")
684 super(DirNode, self).__init__(path, NodeKind.DIR)
689 super(DirNode, self).__init__(path, NodeKind.DIR)
685 self.commit = commit
690 self.commit = commit
686 self._nodes = nodes
691 self._nodes = nodes
687
692
688 @LazyProperty
693 @LazyProperty
689 def content(self):
694 def content(self):
690 raise NodeError(
695 raise NodeError(
691 "%s represents a dir and has no `content` attribute" % self)
696 "%s represents a dir and has no `content` attribute" % self)
692
697
693 @LazyProperty
698 @LazyProperty
694 def nodes(self):
699 def nodes(self):
695 if self.commit:
700 if self.commit:
696 nodes = self.commit.get_nodes(self.path)
701 nodes = self.commit.get_nodes(self.path)
697 else:
702 else:
698 nodes = self._nodes
703 nodes = self._nodes
699 self._nodes_dict = dict((node.path, node) for node in nodes)
704 self._nodes_dict = dict((node.path, node) for node in nodes)
700 return sorted(nodes)
705 return sorted(nodes)
701
706
702 @LazyProperty
707 @LazyProperty
703 def files(self):
708 def files(self):
704 return sorted((node for node in self.nodes if node.is_file()))
709 return sorted((node for node in self.nodes if node.is_file()))
705
710
706 @LazyProperty
711 @LazyProperty
707 def dirs(self):
712 def dirs(self):
708 return sorted((node for node in self.nodes if node.is_dir()))
713 return sorted((node for node in self.nodes if node.is_dir()))
709
714
710 def __iter__(self):
715 def __iter__(self):
711 for node in self.nodes:
716 for node in self.nodes:
712 yield node
717 yield node
713
718
714 def get_node(self, path):
719 def get_node(self, path):
715 """
720 """
716 Returns node from within this particular ``DirNode``, so it is now
721 Returns node from within this particular ``DirNode``, so it is now
717 allowed to fetch, i.e. node located at 'docs/api/index.rst' from node
722 allowed to fetch, i.e. node located at 'docs/api/index.rst' from node
718 'docs'. In order to access deeper nodes one must fetch nodes between
723 'docs'. In order to access deeper nodes one must fetch nodes between
719 them first - this would work::
724 them first - this would work::
720
725
721 docs = root.get_node('docs')
726 docs = root.get_node('docs')
722 docs.get_node('api').get_node('index.rst')
727 docs.get_node('api').get_node('index.rst')
723
728
724 :param: path - relative to the current node
729 :param: path - relative to the current node
725
730
726 .. note::
731 .. note::
727 To access lazily (as in example above) node have to be initialized
732 To access lazily (as in example above) node have to be initialized
728 with related commit object - without it node is out of
733 with related commit object - without it node is out of
729 context and may know nothing about anything else than nearest
734 context and may know nothing about anything else than nearest
730 (located at same level) nodes.
735 (located at same level) nodes.
731 """
736 """
732 try:
737 try:
733 path = path.rstrip('/')
738 path = path.rstrip('/')
734 if path == '':
739 if path == '':
735 raise NodeError("Cannot retrieve node without path")
740 raise NodeError("Cannot retrieve node without path")
736 self.nodes # access nodes first in order to set _nodes_dict
741 self.nodes # access nodes first in order to set _nodes_dict
737 paths = path.split('/')
742 paths = path.split('/')
738 if len(paths) == 1:
743 if len(paths) == 1:
739 if not self.is_root():
744 if not self.is_root():
740 path = '/'.join((self.path, paths[0]))
745 path = '/'.join((self.path, paths[0]))
741 else:
746 else:
742 path = paths[0]
747 path = paths[0]
743 return self._nodes_dict[path]
748 return self._nodes_dict[path]
744 elif len(paths) > 1:
749 elif len(paths) > 1:
745 if self.commit is None:
750 if self.commit is None:
746 raise NodeError("Cannot access deeper nodes without commit")
751 raise NodeError("Cannot access deeper nodes without commit")
747 else:
752 else:
748 path1, path2 = paths[0], '/'.join(paths[1:])
753 path1, path2 = paths[0], '/'.join(paths[1:])
749 return self.get_node(path1).get_node(path2)
754 return self.get_node(path1).get_node(path2)
750 else:
755 else:
751 raise KeyError
756 raise KeyError
752 except KeyError:
757 except KeyError:
753 raise NodeError("Node does not exist at %s" % path)
758 raise NodeError("Node does not exist at %s" % path)
754
759
755 @LazyProperty
760 @LazyProperty
756 def state(self):
761 def state(self):
757 raise NodeError("Cannot access state of DirNode")
762 raise NodeError("Cannot access state of DirNode")
758
763
759 @LazyProperty
764 @LazyProperty
760 def size(self):
765 def size(self):
761 size = 0
766 size = 0
762 for root, dirs, files in self.commit.walk(self.path):
767 for root, dirs, files in self.commit.walk(self.path):
763 for f in files:
768 for f in files:
764 size += f.size
769 size += f.size
765
770
766 return size
771 return size
767
772
768 @LazyProperty
773 @LazyProperty
769 def last_commit(self):
774 def last_commit(self):
770 if self.commit:
775 if self.commit:
771 pre_load = ["author", "date", "message", "parents"]
776 pre_load = ["author", "date", "message", "parents"]
772 return self.commit.get_path_commit(self.path, pre_load=pre_load)
777 return self.commit.get_path_commit(self.path, pre_load=pre_load)
773 raise NodeError(
778 raise NodeError(
774 "Cannot retrieve last commit of the file without "
779 "Cannot retrieve last commit of the file without "
775 "related commit attribute")
780 "related commit attribute")
776
781
777 def __repr__(self):
782 def __repr__(self):
778 return '<%s %r @ %s>' % (self.__class__.__name__, self.path,
783 return '<%s %r @ %s>' % (self.__class__.__name__, self.path,
779 getattr(self.commit, 'short_id', ''))
784 getattr(self.commit, 'short_id', ''))
780
785
781
786
782 class RootNode(DirNode):
787 class RootNode(DirNode):
783 """
788 """
784 DirNode being the root node of the repository.
789 DirNode being the root node of the repository.
785 """
790 """
786
791
787 def __init__(self, nodes=(), commit=None):
792 def __init__(self, nodes=(), commit=None):
788 super(RootNode, self).__init__(path='', nodes=nodes, commit=commit)
793 super(RootNode, self).__init__(path='', nodes=nodes, commit=commit)
789
794
790 def __repr__(self):
795 def __repr__(self):
791 return '<%s>' % self.__class__.__name__
796 return '<%s>' % self.__class__.__name__
792
797
793
798
794 class SubModuleNode(Node):
799 class SubModuleNode(Node):
795 """
800 """
796 represents a SubModule of Git or SubRepo of Mercurial
801 represents a SubModule of Git or SubRepo of Mercurial
797 """
802 """
798 is_binary = False
803 is_binary = False
799 size = 0
804 size = 0
800
805
801 def __init__(self, name, url=None, commit=None, alias=None):
806 def __init__(self, name, url=None, commit=None, alias=None):
802 self.path = name
807 self.path = name
803 self.kind = NodeKind.SUBMODULE
808 self.kind = NodeKind.SUBMODULE
804 self.alias = alias
809 self.alias = alias
805
810
806 # we have to use EmptyCommit here since this can point to svn/git/hg
811 # we have to use EmptyCommit here since this can point to svn/git/hg
807 # submodules we cannot get from repository
812 # submodules we cannot get from repository
808 self.commit = EmptyCommit(str(commit), alias=alias)
813 self.commit = EmptyCommit(str(commit), alias=alias)
809 self.url = url or self._extract_submodule_url()
814 self.url = url or self._extract_submodule_url()
810
815
811 def __repr__(self):
816 def __repr__(self):
812 return '<%s %r @ %s>' % (self.__class__.__name__, self.path,
817 return '<%s %r @ %s>' % (self.__class__.__name__, self.path,
813 getattr(self.commit, 'short_id', ''))
818 getattr(self.commit, 'short_id', ''))
814
819
815 def _extract_submodule_url(self):
820 def _extract_submodule_url(self):
816 # TODO: find a way to parse gits submodule file and extract the
821 # TODO: find a way to parse gits submodule file and extract the
817 # linking URL
822 # linking URL
818 return self.path
823 return self.path
819
824
820 @LazyProperty
825 @LazyProperty
821 def name(self):
826 def name(self):
822 """
827 """
823 Returns name of the node so if its path
828 Returns name of the node so if its path
824 then only last part is returned.
829 then only last part is returned.
825 """
830 """
826 org = safe_unicode(self.path.rstrip('/').split('/')[-1])
831 org = safe_unicode(self.path.rstrip('/').split('/')[-1])
827 return u'%s @ %s' % (org, self.commit.short_id)
832 return u'%s @ %s' % (org, self.commit.short_id)
828
833
829
834
830 class LargeFileNode(FileNode):
835 class LargeFileNode(FileNode):
831
836
832 def __init__(self, path, url=None, commit=None, alias=None, org_path=None):
837 def __init__(self, path, url=None, commit=None, alias=None, org_path=None):
833 self.path = path
838 self.path = path
834 self.org_path = org_path
839 self.org_path = org_path
835 self.kind = NodeKind.LARGEFILE
840 self.kind = NodeKind.LARGEFILE
836 self.alias = alias
841 self.alias = alias
837
842
838 def _validate_path(self, path):
843 def _validate_path(self, path):
839 """
844 """
840 we override check since the LargeFileNode path is system absolute
845 we override check since the LargeFileNode path is system absolute
841 """
846 """
842 pass
847 pass
843
848
844 def __repr__(self):
849 def __repr__(self):
845 return '<%s %r>' % (self.__class__.__name__, self.path)
850 return '<%s %r>' % (self.__class__.__name__, self.path)
846
851
847 @LazyProperty
852 @LazyProperty
848 def size(self):
853 def size(self):
849 return os.stat(self.path).st_size
854 return os.stat(self.path).st_size
850
855
851 @LazyProperty
856 @LazyProperty
852 def raw_bytes(self):
857 def raw_bytes(self):
853 with open(self.path, 'rb') as f:
858 with open(self.path, 'rb') as f:
854 content = f.read()
859 content = f.read()
855 return content
860 return content
856
861
857 @LazyProperty
862 @LazyProperty
858 def name(self):
863 def name(self):
859 """
864 """
860 Overwrites name to be the org lf path
865 Overwrites name to be the org lf path
861 """
866 """
862 return self.org_path
867 return self.org_path
863
868
864 def stream_bytes(self):
869 def stream_bytes(self):
865 with open(self.path, 'rb') as stream:
870 with open(self.path, 'rb') as stream:
866 while True:
871 while True:
867 data = stream.read(16 * 1024)
872 data = stream.read(16 * 1024)
868 if not data:
873 if not data:
869 break
874 break
870 yield data
875 yield data
@@ -1,1008 +1,1014 b''
1 # -*- coding: utf-8 -*-
1 # -*- coding: utf-8 -*-
2
2
3 # Copyright (C) 2010-2019 RhodeCode GmbH
3 # Copyright (C) 2010-2019 RhodeCode GmbH
4 #
4 #
5 # This program is free software: you can redistribute it and/or modify
5 # This program is free software: you can redistribute it and/or modify
6 # it under the terms of the GNU Affero General Public License, version 3
6 # it under the terms of the GNU Affero General Public License, version 3
7 # (only), as published by the Free Software Foundation.
7 # (only), as published by the Free Software Foundation.
8 #
8 #
9 # This program is distributed in the hope that it will be useful,
9 # This program is distributed in the hope that it will be useful,
10 # but WITHOUT ANY WARRANTY; without even the implied warranty of
10 # but WITHOUT ANY WARRANTY; without even the implied warranty of
11 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
11 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 # GNU General Public License for more details.
12 # GNU General Public License for more details.
13 #
13 #
14 # You should have received a copy of the GNU Affero General Public License
14 # You should have received a copy of the GNU Affero General Public License
15 # along with this program. If not, see <http://www.gnu.org/licenses/>.
15 # along with this program. If not, see <http://www.gnu.org/licenses/>.
16 #
16 #
17 # This program is dual-licensed. If you wish to learn more about the
17 # This program is dual-licensed. If you wish to learn more about the
18 # RhodeCode Enterprise Edition, including its added features, Support services,
18 # RhodeCode Enterprise Edition, including its added features, Support services,
19 # and proprietary license terms, please see https://rhodecode.com/licenses/
19 # and proprietary license terms, please see https://rhodecode.com/licenses/
20
20
21 """
21 """
22 Scm model for RhodeCode
22 Scm model for RhodeCode
23 """
23 """
24
24
25 import os.path
25 import os.path
26 import traceback
26 import traceback
27 import logging
27 import logging
28 import cStringIO
28 import cStringIO
29
29
30 from sqlalchemy import func
30 from sqlalchemy import func
31 from zope.cachedescriptors.property import Lazy as LazyProperty
31 from zope.cachedescriptors.property import Lazy as LazyProperty
32
32
33 import rhodecode
33 import rhodecode
34 from rhodecode.lib.vcs import get_backend
34 from rhodecode.lib.vcs import get_backend
35 from rhodecode.lib.vcs.exceptions import RepositoryError, NodeNotChangedError
35 from rhodecode.lib.vcs.exceptions import RepositoryError, NodeNotChangedError
36 from rhodecode.lib.vcs.nodes import FileNode
36 from rhodecode.lib.vcs.nodes import FileNode
37 from rhodecode.lib.vcs.backends.base import EmptyCommit
37 from rhodecode.lib.vcs.backends.base import EmptyCommit
38 from rhodecode.lib import helpers as h, rc_cache
38 from rhodecode.lib import helpers as h, rc_cache
39 from rhodecode.lib.auth import (
39 from rhodecode.lib.auth import (
40 HasRepoPermissionAny, HasRepoGroupPermissionAny,
40 HasRepoPermissionAny, HasRepoGroupPermissionAny,
41 HasUserGroupPermissionAny)
41 HasUserGroupPermissionAny)
42 from rhodecode.lib.exceptions import NonRelativePathError, IMCCommitError
42 from rhodecode.lib.exceptions import NonRelativePathError, IMCCommitError
43 from rhodecode.lib import hooks_utils
43 from rhodecode.lib import hooks_utils
44 from rhodecode.lib.utils import (
44 from rhodecode.lib.utils import (
45 get_filesystem_repos, make_db_config)
45 get_filesystem_repos, make_db_config)
46 from rhodecode.lib.utils2 import (safe_str, safe_unicode)
46 from rhodecode.lib.utils2 import (safe_str, safe_unicode)
47 from rhodecode.lib.system_info import get_system_info
47 from rhodecode.lib.system_info import get_system_info
48 from rhodecode.model import BaseModel
48 from rhodecode.model import BaseModel
49 from rhodecode.model.db import (
49 from rhodecode.model.db import (
50 Repository, CacheKey, UserFollowing, UserLog, User, RepoGroup,
50 Repository, CacheKey, UserFollowing, UserLog, User, RepoGroup,
51 PullRequest)
51 PullRequest)
52 from rhodecode.model.settings import VcsSettingsModel
52 from rhodecode.model.settings import VcsSettingsModel
53 from rhodecode.model.validation_schema.validators import url_validator, InvalidCloneUrl
53 from rhodecode.model.validation_schema.validators import url_validator, InvalidCloneUrl
54
54
55 log = logging.getLogger(__name__)
55 log = logging.getLogger(__name__)
56
56
57
57
58 class UserTemp(object):
58 class UserTemp(object):
59 def __init__(self, user_id):
59 def __init__(self, user_id):
60 self.user_id = user_id
60 self.user_id = user_id
61
61
62 def __repr__(self):
62 def __repr__(self):
63 return "<%s('id:%s')>" % (self.__class__.__name__, self.user_id)
63 return "<%s('id:%s')>" % (self.__class__.__name__, self.user_id)
64
64
65
65
66 class RepoTemp(object):
66 class RepoTemp(object):
67 def __init__(self, repo_id):
67 def __init__(self, repo_id):
68 self.repo_id = repo_id
68 self.repo_id = repo_id
69
69
70 def __repr__(self):
70 def __repr__(self):
71 return "<%s('id:%s')>" % (self.__class__.__name__, self.repo_id)
71 return "<%s('id:%s')>" % (self.__class__.__name__, self.repo_id)
72
72
73
73
74 class SimpleCachedRepoList(object):
74 class SimpleCachedRepoList(object):
75 """
75 """
76 Lighter version of of iteration of repos without the scm initialisation,
76 Lighter version of of iteration of repos without the scm initialisation,
77 and with cache usage
77 and with cache usage
78 """
78 """
79 def __init__(self, db_repo_list, repos_path, order_by=None, perm_set=None):
79 def __init__(self, db_repo_list, repos_path, order_by=None, perm_set=None):
80 self.db_repo_list = db_repo_list
80 self.db_repo_list = db_repo_list
81 self.repos_path = repos_path
81 self.repos_path = repos_path
82 self.order_by = order_by
82 self.order_by = order_by
83 self.reversed = (order_by or '').startswith('-')
83 self.reversed = (order_by or '').startswith('-')
84 if not perm_set:
84 if not perm_set:
85 perm_set = ['repository.read', 'repository.write',
85 perm_set = ['repository.read', 'repository.write',
86 'repository.admin']
86 'repository.admin']
87 self.perm_set = perm_set
87 self.perm_set = perm_set
88
88
89 def __len__(self):
89 def __len__(self):
90 return len(self.db_repo_list)
90 return len(self.db_repo_list)
91
91
92 def __repr__(self):
92 def __repr__(self):
93 return '<%s (%s)>' % (self.__class__.__name__, self.__len__())
93 return '<%s (%s)>' % (self.__class__.__name__, self.__len__())
94
94
95 def __iter__(self):
95 def __iter__(self):
96 for dbr in self.db_repo_list:
96 for dbr in self.db_repo_list:
97 # check permission at this level
97 # check permission at this level
98 has_perm = HasRepoPermissionAny(*self.perm_set)(
98 has_perm = HasRepoPermissionAny(*self.perm_set)(
99 dbr.repo_name, 'SimpleCachedRepoList check')
99 dbr.repo_name, 'SimpleCachedRepoList check')
100 if not has_perm:
100 if not has_perm:
101 continue
101 continue
102
102
103 tmp_d = {
103 tmp_d = {
104 'name': dbr.repo_name,
104 'name': dbr.repo_name,
105 'dbrepo': dbr.get_dict(),
105 'dbrepo': dbr.get_dict(),
106 'dbrepo_fork': dbr.fork.get_dict() if dbr.fork else {}
106 'dbrepo_fork': dbr.fork.get_dict() if dbr.fork else {}
107 }
107 }
108 yield tmp_d
108 yield tmp_d
109
109
110
110
111 class _PermCheckIterator(object):
111 class _PermCheckIterator(object):
112
112
113 def __init__(
113 def __init__(
114 self, obj_list, obj_attr, perm_set, perm_checker,
114 self, obj_list, obj_attr, perm_set, perm_checker,
115 extra_kwargs=None):
115 extra_kwargs=None):
116 """
116 """
117 Creates iterator from given list of objects, additionally
117 Creates iterator from given list of objects, additionally
118 checking permission for them from perm_set var
118 checking permission for them from perm_set var
119
119
120 :param obj_list: list of db objects
120 :param obj_list: list of db objects
121 :param obj_attr: attribute of object to pass into perm_checker
121 :param obj_attr: attribute of object to pass into perm_checker
122 :param perm_set: list of permissions to check
122 :param perm_set: list of permissions to check
123 :param perm_checker: callable to check permissions against
123 :param perm_checker: callable to check permissions against
124 """
124 """
125 self.obj_list = obj_list
125 self.obj_list = obj_list
126 self.obj_attr = obj_attr
126 self.obj_attr = obj_attr
127 self.perm_set = perm_set
127 self.perm_set = perm_set
128 self.perm_checker = perm_checker
128 self.perm_checker = perm_checker
129 self.extra_kwargs = extra_kwargs or {}
129 self.extra_kwargs = extra_kwargs or {}
130
130
131 def __len__(self):
131 def __len__(self):
132 return len(self.obj_list)
132 return len(self.obj_list)
133
133
134 def __repr__(self):
134 def __repr__(self):
135 return '<%s (%s)>' % (self.__class__.__name__, self.__len__())
135 return '<%s (%s)>' % (self.__class__.__name__, self.__len__())
136
136
137 def __iter__(self):
137 def __iter__(self):
138 checker = self.perm_checker(*self.perm_set)
138 checker = self.perm_checker(*self.perm_set)
139 for db_obj in self.obj_list:
139 for db_obj in self.obj_list:
140 # check permission at this level
140 # check permission at this level
141 name = getattr(db_obj, self.obj_attr, None)
141 name = getattr(db_obj, self.obj_attr, None)
142 if not checker(name, self.__class__.__name__, **self.extra_kwargs):
142 if not checker(name, self.__class__.__name__, **self.extra_kwargs):
143 continue
143 continue
144
144
145 yield db_obj
145 yield db_obj
146
146
147
147
148 class RepoList(_PermCheckIterator):
148 class RepoList(_PermCheckIterator):
149
149
150 def __init__(self, db_repo_list, perm_set=None, extra_kwargs=None):
150 def __init__(self, db_repo_list, perm_set=None, extra_kwargs=None):
151 if not perm_set:
151 if not perm_set:
152 perm_set = [
152 perm_set = [
153 'repository.read', 'repository.write', 'repository.admin']
153 'repository.read', 'repository.write', 'repository.admin']
154
154
155 super(RepoList, self).__init__(
155 super(RepoList, self).__init__(
156 obj_list=db_repo_list,
156 obj_list=db_repo_list,
157 obj_attr='repo_name', perm_set=perm_set,
157 obj_attr='repo_name', perm_set=perm_set,
158 perm_checker=HasRepoPermissionAny,
158 perm_checker=HasRepoPermissionAny,
159 extra_kwargs=extra_kwargs)
159 extra_kwargs=extra_kwargs)
160
160
161
161
162 class RepoGroupList(_PermCheckIterator):
162 class RepoGroupList(_PermCheckIterator):
163
163
164 def __init__(self, db_repo_group_list, perm_set=None, extra_kwargs=None):
164 def __init__(self, db_repo_group_list, perm_set=None, extra_kwargs=None):
165 if not perm_set:
165 if not perm_set:
166 perm_set = ['group.read', 'group.write', 'group.admin']
166 perm_set = ['group.read', 'group.write', 'group.admin']
167
167
168 super(RepoGroupList, self).__init__(
168 super(RepoGroupList, self).__init__(
169 obj_list=db_repo_group_list,
169 obj_list=db_repo_group_list,
170 obj_attr='group_name', perm_set=perm_set,
170 obj_attr='group_name', perm_set=perm_set,
171 perm_checker=HasRepoGroupPermissionAny,
171 perm_checker=HasRepoGroupPermissionAny,
172 extra_kwargs=extra_kwargs)
172 extra_kwargs=extra_kwargs)
173
173
174
174
175 class UserGroupList(_PermCheckIterator):
175 class UserGroupList(_PermCheckIterator):
176
176
177 def __init__(self, db_user_group_list, perm_set=None, extra_kwargs=None):
177 def __init__(self, db_user_group_list, perm_set=None, extra_kwargs=None):
178 if not perm_set:
178 if not perm_set:
179 perm_set = ['usergroup.read', 'usergroup.write', 'usergroup.admin']
179 perm_set = ['usergroup.read', 'usergroup.write', 'usergroup.admin']
180
180
181 super(UserGroupList, self).__init__(
181 super(UserGroupList, self).__init__(
182 obj_list=db_user_group_list,
182 obj_list=db_user_group_list,
183 obj_attr='users_group_name', perm_set=perm_set,
183 obj_attr='users_group_name', perm_set=perm_set,
184 perm_checker=HasUserGroupPermissionAny,
184 perm_checker=HasUserGroupPermissionAny,
185 extra_kwargs=extra_kwargs)
185 extra_kwargs=extra_kwargs)
186
186
187
187
188 class ScmModel(BaseModel):
188 class ScmModel(BaseModel):
189 """
189 """
190 Generic Scm Model
190 Generic Scm Model
191 """
191 """
192
192
193 @LazyProperty
193 @LazyProperty
194 def repos_path(self):
194 def repos_path(self):
195 """
195 """
196 Gets the repositories root path from database
196 Gets the repositories root path from database
197 """
197 """
198
198
199 settings_model = VcsSettingsModel(sa=self.sa)
199 settings_model = VcsSettingsModel(sa=self.sa)
200 return settings_model.get_repos_location()
200 return settings_model.get_repos_location()
201
201
202 def repo_scan(self, repos_path=None):
202 def repo_scan(self, repos_path=None):
203 """
203 """
204 Listing of repositories in given path. This path should not be a
204 Listing of repositories in given path. This path should not be a
205 repository itself. Return a dictionary of repository objects
205 repository itself. Return a dictionary of repository objects
206
206
207 :param repos_path: path to directory containing repositories
207 :param repos_path: path to directory containing repositories
208 """
208 """
209
209
210 if repos_path is None:
210 if repos_path is None:
211 repos_path = self.repos_path
211 repos_path = self.repos_path
212
212
213 log.info('scanning for repositories in %s', repos_path)
213 log.info('scanning for repositories in %s', repos_path)
214
214
215 config = make_db_config()
215 config = make_db_config()
216 config.set('extensions', 'largefiles', '')
216 config.set('extensions', 'largefiles', '')
217 repos = {}
217 repos = {}
218
218
219 for name, path in get_filesystem_repos(repos_path, recursive=True):
219 for name, path in get_filesystem_repos(repos_path, recursive=True):
220 # name need to be decomposed and put back together using the /
220 # name need to be decomposed and put back together using the /
221 # since this is internal storage separator for rhodecode
221 # since this is internal storage separator for rhodecode
222 name = Repository.normalize_repo_name(name)
222 name = Repository.normalize_repo_name(name)
223
223
224 try:
224 try:
225 if name in repos:
225 if name in repos:
226 raise RepositoryError('Duplicate repository name %s '
226 raise RepositoryError('Duplicate repository name %s '
227 'found in %s' % (name, path))
227 'found in %s' % (name, path))
228 elif path[0] in rhodecode.BACKENDS:
228 elif path[0] in rhodecode.BACKENDS:
229 backend = get_backend(path[0])
229 backend = get_backend(path[0])
230 repos[name] = backend(path[1], config=config,
230 repos[name] = backend(path[1], config=config,
231 with_wire={"cache": False})
231 with_wire={"cache": False})
232 except OSError:
232 except OSError:
233 continue
233 continue
234 log.debug('found %s paths with repositories', len(repos))
234 log.debug('found %s paths with repositories', len(repos))
235 return repos
235 return repos
236
236
237 def get_repos(self, all_repos=None, sort_key=None):
237 def get_repos(self, all_repos=None, sort_key=None):
238 """
238 """
239 Get all repositories from db and for each repo create it's
239 Get all repositories from db and for each repo create it's
240 backend instance and fill that backed with information from database
240 backend instance and fill that backed with information from database
241
241
242 :param all_repos: list of repository names as strings
242 :param all_repos: list of repository names as strings
243 give specific repositories list, good for filtering
243 give specific repositories list, good for filtering
244
244
245 :param sort_key: initial sorting of repositories
245 :param sort_key: initial sorting of repositories
246 """
246 """
247 if all_repos is None:
247 if all_repos is None:
248 all_repos = self.sa.query(Repository)\
248 all_repos = self.sa.query(Repository)\
249 .filter(Repository.group_id == None)\
249 .filter(Repository.group_id == None)\
250 .order_by(func.lower(Repository.repo_name)).all()
250 .order_by(func.lower(Repository.repo_name)).all()
251 repo_iter = SimpleCachedRepoList(
251 repo_iter = SimpleCachedRepoList(
252 all_repos, repos_path=self.repos_path, order_by=sort_key)
252 all_repos, repos_path=self.repos_path, order_by=sort_key)
253 return repo_iter
253 return repo_iter
254
254
255 def get_repo_groups(self, all_groups=None):
255 def get_repo_groups(self, all_groups=None):
256 if all_groups is None:
256 if all_groups is None:
257 all_groups = RepoGroup.query()\
257 all_groups = RepoGroup.query()\
258 .filter(RepoGroup.group_parent_id == None).all()
258 .filter(RepoGroup.group_parent_id == None).all()
259 return [x for x in RepoGroupList(all_groups)]
259 return [x for x in RepoGroupList(all_groups)]
260
260
    def mark_for_invalidation(self, repo_name, delete=False):
        """
        Mark caches of this repo invalid in the database. `delete` flag
        removes the cache entries.

        :param repo_name: the repo_name for which caches should be marked
            invalid, or deleted
        :param delete: delete the entry keys instead of setting bool
            flag on them, and also purge caches used by the dogpile
        """
        repo = Repository.get_by_repo_name(repo_name)

        # silently do nothing when the repository does not exist
        if repo:
            invalidation_namespace = CacheKey.REPO_INVALIDATION_NAMESPACE.format(
                repo_id=repo.repo_id)
            CacheKey.set_invalidate(invalidation_namespace, delete=delete)

            repo_id = repo.repo_id
            config = repo._config
            # recompute the commit cache with largefiles disabled
            config.set('extensions', 'largefiles', '')
            repo.update_commit_cache(config=config, cs_cache=None)
            if delete:
                # also purge the per-repo dogpile cache region
                cache_namespace_uid = 'cache_repo.{}'.format(repo_id)
                rc_cache.clear_cache_namespace('cache_repo', cache_namespace_uid)
285
285
286 def toggle_following_repo(self, follow_repo_id, user_id):
286 def toggle_following_repo(self, follow_repo_id, user_id):
287
287
288 f = self.sa.query(UserFollowing)\
288 f = self.sa.query(UserFollowing)\
289 .filter(UserFollowing.follows_repo_id == follow_repo_id)\
289 .filter(UserFollowing.follows_repo_id == follow_repo_id)\
290 .filter(UserFollowing.user_id == user_id).scalar()
290 .filter(UserFollowing.user_id == user_id).scalar()
291
291
292 if f is not None:
292 if f is not None:
293 try:
293 try:
294 self.sa.delete(f)
294 self.sa.delete(f)
295 return
295 return
296 except Exception:
296 except Exception:
297 log.error(traceback.format_exc())
297 log.error(traceback.format_exc())
298 raise
298 raise
299
299
300 try:
300 try:
301 f = UserFollowing()
301 f = UserFollowing()
302 f.user_id = user_id
302 f.user_id = user_id
303 f.follows_repo_id = follow_repo_id
303 f.follows_repo_id = follow_repo_id
304 self.sa.add(f)
304 self.sa.add(f)
305 except Exception:
305 except Exception:
306 log.error(traceback.format_exc())
306 log.error(traceback.format_exc())
307 raise
307 raise
308
308
309 def toggle_following_user(self, follow_user_id, user_id):
309 def toggle_following_user(self, follow_user_id, user_id):
310 f = self.sa.query(UserFollowing)\
310 f = self.sa.query(UserFollowing)\
311 .filter(UserFollowing.follows_user_id == follow_user_id)\
311 .filter(UserFollowing.follows_user_id == follow_user_id)\
312 .filter(UserFollowing.user_id == user_id).scalar()
312 .filter(UserFollowing.user_id == user_id).scalar()
313
313
314 if f is not None:
314 if f is not None:
315 try:
315 try:
316 self.sa.delete(f)
316 self.sa.delete(f)
317 return
317 return
318 except Exception:
318 except Exception:
319 log.error(traceback.format_exc())
319 log.error(traceback.format_exc())
320 raise
320 raise
321
321
322 try:
322 try:
323 f = UserFollowing()
323 f = UserFollowing()
324 f.user_id = user_id
324 f.user_id = user_id
325 f.follows_user_id = follow_user_id
325 f.follows_user_id = follow_user_id
326 self.sa.add(f)
326 self.sa.add(f)
327 except Exception:
327 except Exception:
328 log.error(traceback.format_exc())
328 log.error(traceback.format_exc())
329 raise
329 raise
330
330
331 def is_following_repo(self, repo_name, user_id, cache=False):
331 def is_following_repo(self, repo_name, user_id, cache=False):
332 r = self.sa.query(Repository)\
332 r = self.sa.query(Repository)\
333 .filter(Repository.repo_name == repo_name).scalar()
333 .filter(Repository.repo_name == repo_name).scalar()
334
334
335 f = self.sa.query(UserFollowing)\
335 f = self.sa.query(UserFollowing)\
336 .filter(UserFollowing.follows_repository == r)\
336 .filter(UserFollowing.follows_repository == r)\
337 .filter(UserFollowing.user_id == user_id).scalar()
337 .filter(UserFollowing.user_id == user_id).scalar()
338
338
339 return f is not None
339 return f is not None
340
340
341 def is_following_user(self, username, user_id, cache=False):
341 def is_following_user(self, username, user_id, cache=False):
342 u = User.get_by_username(username)
342 u = User.get_by_username(username)
343
343
344 f = self.sa.query(UserFollowing)\
344 f = self.sa.query(UserFollowing)\
345 .filter(UserFollowing.follows_user == u)\
345 .filter(UserFollowing.follows_user == u)\
346 .filter(UserFollowing.user_id == user_id).scalar()
346 .filter(UserFollowing.user_id == user_id).scalar()
347
347
348 return f is not None
348 return f is not None
349
349
350 def get_followers(self, repo):
350 def get_followers(self, repo):
351 repo = self._get_repo(repo)
351 repo = self._get_repo(repo)
352
352
353 return self.sa.query(UserFollowing)\
353 return self.sa.query(UserFollowing)\
354 .filter(UserFollowing.follows_repository == repo).count()
354 .filter(UserFollowing.follows_repository == repo).count()
355
355
356 def get_forks(self, repo):
356 def get_forks(self, repo):
357 repo = self._get_repo(repo)
357 repo = self._get_repo(repo)
358 return self.sa.query(Repository)\
358 return self.sa.query(Repository)\
359 .filter(Repository.fork == repo).count()
359 .filter(Repository.fork == repo).count()
360
360
361 def get_pull_requests(self, repo):
361 def get_pull_requests(self, repo):
362 repo = self._get_repo(repo)
362 repo = self._get_repo(repo)
363 return self.sa.query(PullRequest)\
363 return self.sa.query(PullRequest)\
364 .filter(PullRequest.target_repo == repo)\
364 .filter(PullRequest.target_repo == repo)\
365 .filter(PullRequest.status != PullRequest.STATUS_CLOSED).count()
365 .filter(PullRequest.status != PullRequest.STATUS_CLOSED).count()
366
366
367 def mark_as_fork(self, repo, fork, user):
367 def mark_as_fork(self, repo, fork, user):
368 repo = self._get_repo(repo)
368 repo = self._get_repo(repo)
369 fork = self._get_repo(fork)
369 fork = self._get_repo(fork)
370 if fork and repo.repo_id == fork.repo_id:
370 if fork and repo.repo_id == fork.repo_id:
371 raise Exception("Cannot set repository as fork of itself")
371 raise Exception("Cannot set repository as fork of itself")
372
372
373 if fork and repo.repo_type != fork.repo_type:
373 if fork and repo.repo_type != fork.repo_type:
374 raise RepositoryError(
374 raise RepositoryError(
375 "Cannot set repository as fork of repository with other type")
375 "Cannot set repository as fork of repository with other type")
376
376
377 repo.fork = fork
377 repo.fork = fork
378 self.sa.add(repo)
378 self.sa.add(repo)
379 return repo
379 return repo
380
380
    def pull_changes(self, repo, username, remote_uri=None, validate_uri=True):
        """
        Fetch changes from a remote uri into the given repository and
        invalidate its caches on success.

        :param repo: repository (db object / name / id) to pull into
        :param username: user performing the action (informational)
        :param remote_uri: explicit remote; falls back to the stored clone uri
        :param validate_uri: validate `remote_uri` before fetching
        :raises InvalidCloneUrl: when validation of `remote_uri` fails
        """
        dbrepo = self._get_repo(repo)
        remote_uri = remote_uri or dbrepo.clone_uri
        if not remote_uri:
            raise Exception("This repository doesn't have a clone uri")

        # detach hooks so the local fetch does not fire them
        repo = dbrepo.scm_instance(cache=False)
        repo.config.clear_section('hooks')

        try:
            # NOTE(marcink): add extra validation so we skip invalid urls
            # this is due this tasks can be executed via scheduler without
            # proper validation of remote_uri
            if validate_uri:
                config = make_db_config(clear_session=False)
                url_validator(remote_uri, dbrepo.repo_type, config)
        except InvalidCloneUrl:
            raise

        repo_name = dbrepo.repo_name
        try:
            # TODO: we need to make sure those operations call proper hooks !
            repo.fetch(remote_uri)

            self.mark_for_invalidation(repo_name)
        except Exception:
            log.error(traceback.format_exc())
            raise
409
409
410 def push_changes(self, repo, username, remote_uri=None, validate_uri=True):
410 def push_changes(self, repo, username, remote_uri=None, validate_uri=True):
411 dbrepo = self._get_repo(repo)
411 dbrepo = self._get_repo(repo)
412 remote_uri = remote_uri or dbrepo.push_uri
412 remote_uri = remote_uri or dbrepo.push_uri
413 if not remote_uri:
413 if not remote_uri:
414 raise Exception("This repository doesn't have a clone uri")
414 raise Exception("This repository doesn't have a clone uri")
415
415
416 repo = dbrepo.scm_instance(cache=False)
416 repo = dbrepo.scm_instance(cache=False)
417 repo.config.clear_section('hooks')
417 repo.config.clear_section('hooks')
418
418
419 try:
419 try:
420 # NOTE(marcink): add extra validation so we skip invalid urls
420 # NOTE(marcink): add extra validation so we skip invalid urls
421 # this is due this tasks can be executed via scheduler without
421 # this is due this tasks can be executed via scheduler without
422 # proper validation of remote_uri
422 # proper validation of remote_uri
423 if validate_uri:
423 if validate_uri:
424 config = make_db_config(clear_session=False)
424 config = make_db_config(clear_session=False)
425 url_validator(remote_uri, dbrepo.repo_type, config)
425 url_validator(remote_uri, dbrepo.repo_type, config)
426 except InvalidCloneUrl:
426 except InvalidCloneUrl:
427 raise
427 raise
428
428
429 try:
429 try:
430 repo.push(remote_uri)
430 repo.push(remote_uri)
431 except Exception:
431 except Exception:
432 log.error(traceback.format_exc())
432 log.error(traceback.format_exc())
433 raise
433 raise
434
434
    def commit_change(self, repo, repo_name, commit, user, author, message,
                      content, f_path):
        """
        Commit a change to a single file and trigger the post-push hook.

        :param repo: SCM instance (vcs backend repository)
        :param repo_name: repository name, used for cache invalidation and
            the push hook
        :param commit: parent commit the change is based on
        :param user: RhodeCode User object or user_id, the committer
        :param author: commit author, may differ from the committer
        :param message: commit message
        :param content: new file content
        :param f_path: path of the changed file
        :raises IMCCommitError: when the in-memory commit fails
        :returns: the newly created tip commit
        """
        user = self._get_user(user)

        # decoding here will force that we have proper encoded values
        # in any other case this will throw exceptions and deny commit
        content = safe_str(content)
        path = safe_str(f_path)
        # message and author needs to be unicode
        # proper backend should then translate that into required type
        message = safe_unicode(message)
        author = safe_unicode(author)
        imc = repo.in_memory_commit
        imc.change(FileNode(path, content, mode=commit.get_file_mode(f_path)))
        try:
            # TODO: handle pre-push action !
            tip = imc.commit(
                message=message, author=author, parents=[commit],
                branch=commit.branch)
        except Exception as e:
            log.error(traceback.format_exc())
            raise IMCCommitError(str(e))
        finally:
            # always clear caches, if commit fails we want fresh object also
            self.mark_for_invalidation(repo_name)

        # We trigger the post-push action
        hooks_utils.trigger_post_push_hook(
            username=user.username, action='push_local', hook_type='post_push',
            repo_name=repo_name, repo_alias=repo.alias, commit_ids=[tip.raw_id])
        return tip
472
472
473 def _sanitize_path(self, f_path):
473 def _sanitize_path(self, f_path):
474 if f_path.startswith('/') or f_path.startswith('./') or '../' in f_path:
474 if f_path.startswith('/') or f_path.startswith('./') or '../' in f_path:
475 raise NonRelativePathError('%s is not an relative path' % f_path)
475 raise NonRelativePathError('%s is not an relative path' % f_path)
476 if f_path:
476 if f_path:
477 f_path = os.path.normpath(f_path)
477 f_path = os.path.normpath(f_path)
478 return f_path
478 return f_path
479
479
    def get_dirnode_metadata(self, request, commit, dir_node):
        """
        Collect display metadata for every direct file child of `dir_node`.

        :param request: current request, used to render the gravatar widget
        :param commit: commit the nodes belong to (not used directly here)
        :param dir_node: directory node to inspect
        :returns: list of dicts with name/size/last-commit info; empty list
            when `dir_node` is not a directory
        """
        if not dir_node.is_dir():
            return []

        data = []
        for node in dir_node:
            if not node.is_file():
                # only interested in file nodes; skip sub-directories etc.
                continue

            last_commit = node.last_commit
            last_commit_date = last_commit.date
            data.append({
                'name': node.name,
                'size': h.format_byte_size_binary(node.size),
                'modified_at': h.format_date(last_commit_date),
                'modified_ts': last_commit_date.isoformat(),
                'revision': last_commit.revision,
                'short_id': last_commit.short_id,
                'message': h.escape(last_commit.message),
                'author': h.escape(last_commit.author),
                'user_profile': h.gravatar_with_user(
                    request, last_commit.author),
            })

        return data
506
506
507 def get_nodes(self, repo_name, commit_id, root_path='/', flat=True,
507 def get_nodes(self, repo_name, commit_id, root_path='/', flat=True,
508 extended_info=False, content=False, max_file_bytes=None):
508 extended_info=False, content=False, max_file_bytes=None):
509 """
509 """
510 recursive walk in root dir and return a set of all path in that dir
510 recursive walk in root dir and return a set of all path in that dir
511 based on repository walk function
511 based on repository walk function
512
512
513 :param repo_name: name of repository
513 :param repo_name: name of repository
514 :param commit_id: commit id for which to list nodes
514 :param commit_id: commit id for which to list nodes
515 :param root_path: root path to list
515 :param root_path: root path to list
516 :param flat: return as a list, if False returns a dict with description
516 :param flat: return as a list, if False returns a dict with description
517 :param extended_info: show additional info such as md5, binary, size etc
517 :param extended_info: show additional info such as md5, binary, size etc
518 :param content: add nodes content to the return data
518 :param content: add nodes content to the return data
519 :param max_file_bytes: will not return file contents over this limit
519 :param max_file_bytes: will not return file contents over this limit
520
520
521 """
521 """
522 _files = list()
522 _files = list()
523 _dirs = list()
523 _dirs = list()
524 try:
524 try:
525 _repo = self._get_repo(repo_name)
525 _repo = self._get_repo(repo_name)
526 commit = _repo.scm_instance().get_commit(commit_id=commit_id)
526 commit = _repo.scm_instance().get_commit(commit_id=commit_id)
527 root_path = root_path.lstrip('/')
527 root_path = root_path.lstrip('/')
528 for __, dirs, files in commit.walk(root_path):
528 for __, dirs, files in commit.walk(root_path):
529
529
530 for f in files:
530 for f in files:
531 _content = None
531 _content = None
532 _data = f_name = f.unicode_path
532 _data = f_name = f.unicode_path
533
533
534 if not flat:
534 if not flat:
535 _data = {
535 _data = {
536 "name": h.escape(f_name),
536 "name": h.escape(f_name),
537 "type": "file",
537 "type": "file",
538 }
538 }
539 if extended_info:
539 if extended_info:
540 _data.update({
540 _data.update({
541 "md5": f.md5,
541 "md5": f.md5,
542 "binary": f.is_binary,
542 "binary": f.is_binary,
543 "size": f.size,
543 "size": f.size,
544 "extension": f.extension,
544 "extension": f.extension,
545 "mimetype": f.mimetype,
545 "mimetype": f.mimetype,
546 "lines": f.lines()[0]
546 "lines": f.lines()[0]
547 })
547 })
548
548
549 if content:
549 if content:
550 over_size_limit = (max_file_bytes is not None
550 over_size_limit = (max_file_bytes is not None
551 and f.size > max_file_bytes)
551 and f.size > max_file_bytes)
552 full_content = None
552 full_content = None
553 if not f.is_binary and not over_size_limit:
553 if not f.is_binary and not over_size_limit:
554 full_content = safe_str(f.content)
554 full_content = safe_str(f.content)
555
555
556 _data.update({
556 _data.update({
557 "content": full_content,
557 "content": full_content,
558 })
558 })
559 _files.append(_data)
559 _files.append(_data)
560
560
561 for d in dirs:
561 for d in dirs:
562 _data = d_name = d.unicode_path
562 _data = d_name = d.unicode_path
563 if not flat:
563 if not flat:
564 _data = {
564 _data = {
565 "name": h.escape(d_name),
565 "name": h.escape(d_name),
566 "type": "dir",
566 "type": "dir",
567 }
567 }
568 if extended_info:
568 if extended_info:
569 _data.update({
569 _data.update({
570 "md5": None,
570 "md5": None,
571 "binary": None,
571 "binary": None,
572 "size": None,
572 "size": None,
573 "extension": None,
573 "extension": None,
574 })
574 })
575 if content:
575 if content:
576 _data.update({
576 _data.update({
577 "content": None
577 "content": None
578 })
578 })
579 _dirs.append(_data)
579 _dirs.append(_data)
580 except RepositoryError:
580 except RepositoryError:
581 log.exception("Exception in get_nodes")
581 log.exception("Exception in get_nodes")
582 raise
582 raise
583
583
584 return _dirs, _files
584 return _dirs, _files
585
585
586 def get_quick_filter_nodes(self, repo_name, commit_id, root_path='/'):
586 def get_quick_filter_nodes(self, repo_name, commit_id, root_path='/'):
587 """
587 """
588 Generate files for quick filter in files view
588 Generate files for quick filter in files view
589 """
589 """
590
590
591 _files = list()
591 _files = list()
592 _dirs = list()
592 _dirs = list()
593 try:
593 try:
594 _repo = self._get_repo(repo_name)
594 _repo = self._get_repo(repo_name)
595 commit = _repo.scm_instance().get_commit(commit_id=commit_id)
595 commit = _repo.scm_instance().get_commit(commit_id=commit_id)
596 root_path = root_path.lstrip('/')
596 root_path = root_path.lstrip('/')
597 for __, dirs, files in commit.walk(root_path):
597 for __, dirs, files in commit.walk(root_path):
598
598
599 for f in files:
599 for f in files:
600
600
601 _data = {
601 _data = {
602 "name": h.escape(f.unicode_path),
602 "name": h.escape(f.unicode_path),
603 "type": "file",
603 "type": "file",
604 }
604 }
605
605
606 _files.append(_data)
606 _files.append(_data)
607
607
608 for d in dirs:
608 for d in dirs:
609
609
610 _data = {
610 _data = {
611 "name": h.escape(d.unicode_path),
611 "name": h.escape(d.unicode_path),
612 "type": "dir",
612 "type": "dir",
613 }
613 }
614
614
615 _dirs.append(_data)
615 _dirs.append(_data)
616 except RepositoryError:
616 except RepositoryError:
617 log.exception("Exception in get_quick_filter_nodes")
617 log.exception("Exception in get_quick_filter_nodes")
618 raise
618 raise
619
619
620 return _dirs, _files
620 return _dirs, _files
621
621
    def get_node(self, repo_name, commit_id, file_path,
                 extended_info=False, content=False, max_file_bytes=None, cache=True):
        """
        Retrieve a single file node from a commit.

        :param repo_name: name of repository
        :param commit_id: commit id to read the node from
        :param file_path: path of the file node
        :param extended_info: include md5, binary flag, size, extension,
            mimetype
        :param content: include the file content and its line count
        :param max_file_bytes: do not return content over this limit
        :param cache: read node metadata/content via the cached properties;
            when False use a single uncached metadata read
        :raises RepositoryError: when `file_path` points to a directory
        :returns: dict describing the file node
        """
        try:

            _repo = self._get_repo(repo_name)
            commit = _repo.scm_instance().get_commit(commit_id=commit_id)

            file_node = commit.get_node(file_path)
            if file_node.is_dir():
                raise RepositoryError('The given path is a directory')

            _content = None
            f_name = file_node.unicode_path

            file_data = {
                "name": h.escape(f_name),
                "type": "file",
            }

            if extended_info:
                file_data.update({
                    "extension": file_node.extension,
                    "mimetype": file_node.mimetype,
                })

                if cache:
                    md5 = file_node.md5
                    is_binary = file_node.is_binary
                    size = file_node.size
                else:
                    # single uncached read also yields the raw content,
                    # reused below by the `elif content:` branch
                    is_binary, md5, size, _content = file_node.metadata_uncached()

                file_data.update({
                    "md5": md5,
                    "binary": is_binary,
                    "size": size,
                })

            if content and cache:
                # get content + cache
                size = file_node.size
                over_size_limit = (max_file_bytes is not None and size > max_file_bytes)
                full_content = None
                all_lines = 0
                if not file_node.is_binary and not over_size_limit:
                    full_content = safe_unicode(file_node.content)
                    all_lines, empty_lines = file_node.count_lines(full_content)

                file_data.update({
                    "content": full_content,
                    "lines": all_lines
                })
            elif content:
                # get content *without* cache
                if _content is None:
                    is_binary, md5, size, _content = file_node.metadata_uncached()

                over_size_limit = (max_file_bytes is not None and size > max_file_bytes)
                full_content = None
                all_lines = 0
                if not is_binary and not over_size_limit:
                    full_content = safe_unicode(_content)
                    all_lines, empty_lines = file_node.count_lines(full_content)

                file_data.update({
                    "content": full_content,
                    "lines": all_lines
                })

        except RepositoryError:
            log.exception("Exception in get_node")
            raise

        return file_data
693
699
694 def get_fts_data(self, repo_name, commit_id, root_path='/'):
700 def get_fts_data(self, repo_name, commit_id, root_path='/'):
695 """
701 """
696 Fetch node tree for usage in full text search
702 Fetch node tree for usage in full text search
697 """
703 """
698
704
699 tree_info = list()
705 tree_info = list()
700
706
701 try:
707 try:
702 _repo = self._get_repo(repo_name)
708 _repo = self._get_repo(repo_name)
703 commit = _repo.scm_instance().get_commit(commit_id=commit_id)
709 commit = _repo.scm_instance().get_commit(commit_id=commit_id)
704 root_path = root_path.lstrip('/')
710 root_path = root_path.lstrip('/')
705 for __, dirs, files in commit.walk(root_path):
711 for __, dirs, files in commit.walk(root_path):
706
712
707 for f in files:
713 for f in files:
708 is_binary, md5, size, _content = f.metadata_uncached()
714 is_binary, md5, size, _content = f.metadata_uncached()
709 _data = {
715 _data = {
710 "name": f.unicode_path,
716 "name": f.unicode_path,
711 "md5": md5,
717 "md5": md5,
712 "extension": f.extension,
718 "extension": f.extension,
713 "binary": is_binary,
719 "binary": is_binary,
714 "size": size
720 "size": size
715 }
721 }
716
722
717 tree_info.append(_data)
723 tree_info.append(_data)
718
724
719 except RepositoryError:
725 except RepositoryError:
720 log.exception("Exception in get_nodes")
726 log.exception("Exception in get_nodes")
721 raise
727 raise
722
728
723 return tree_info
729 return tree_info
724
730
    def create_nodes(self, user, repo, message, nodes, parent_commit=None,
                     author=None, trigger_push_hook=True):
        """
        Commits given multiple nodes into repo.

        :param user: RhodeCode User object or user_id, the committer
        :param repo: RhodeCode Repository object
        :param message: commit message
        :param nodes: mapping {filename:{'content':content},...}
        :param parent_commit: parent commit; when empty this is the
            initial commit
        :param author: author of commit, can be different than the
            committer; only for git
        :param trigger_push_hook: trigger push hooks

        :returns: new committed commit
        """

        user = self._get_user(user)
        scm_instance = repo.scm_instance(cache=False)

        processed_nodes = []
        for f_path in nodes:
            f_path = self._sanitize_path(f_path)
            # NOTE(review): the *sanitized* path is used as the lookup key;
            # presumably callers pass already-normalized keys -- verify
            content = nodes[f_path]['content']
            f_path = safe_str(f_path)
            # decoding here will force that we have proper encoded values
            # in any other case this will throw exceptions and deny commit
            if isinstance(content, (basestring,)):
                content = safe_str(content)
            elif isinstance(content, (file, cStringIO.OutputType,)):
                content = content.read()
            else:
                raise Exception('Content is of unrecognized type %s' % (
                    type(content)
                ))
            processed_nodes.append((f_path, content))

        message = safe_unicode(message)
        commiter = user.full_contact
        author = safe_unicode(author) if author else commiter

        imc = scm_instance.in_memory_commit

        if not parent_commit:
            parent_commit = EmptyCommit(alias=scm_instance.alias)

        if isinstance(parent_commit, EmptyCommit):
            # EmptyCommit means we're editing an empty repository
            parents = None
        else:
            parents = [parent_commit]
        # add multiple nodes
        for path, content in processed_nodes:
            imc.add(FileNode(path, content=content))
        # TODO: handle pre push scenario
        tip = imc.commit(message=message,
                         author=author,
                         parents=parents,
                         branch=parent_commit.branch)

        self.mark_for_invalidation(repo.repo_name)
        if trigger_push_hook:
            hooks_utils.trigger_post_push_hook(
                username=user.username, action='push_local',
                repo_name=repo.repo_name, repo_alias=scm_instance.alias,
                hook_type='post_push',
                commit_ids=[tip.raw_id])
        return tip
794
800
795 def update_nodes(self, user, repo, message, nodes, parent_commit=None,
801 def update_nodes(self, user, repo, message, nodes, parent_commit=None,
796 author=None, trigger_push_hook=True):
802 author=None, trigger_push_hook=True):
797 user = self._get_user(user)
803 user = self._get_user(user)
798 scm_instance = repo.scm_instance(cache=False)
804 scm_instance = repo.scm_instance(cache=False)
799
805
800 message = safe_unicode(message)
806 message = safe_unicode(message)
801 commiter = user.full_contact
807 commiter = user.full_contact
802 author = safe_unicode(author) if author else commiter
808 author = safe_unicode(author) if author else commiter
803
809
804 imc = scm_instance.in_memory_commit
810 imc = scm_instance.in_memory_commit
805
811
806 if not parent_commit:
812 if not parent_commit:
807 parent_commit = EmptyCommit(alias=scm_instance.alias)
813 parent_commit = EmptyCommit(alias=scm_instance.alias)
808
814
809 if isinstance(parent_commit, EmptyCommit):
815 if isinstance(parent_commit, EmptyCommit):
810 # EmptyCommit means we we're editing empty repository
816 # EmptyCommit means we we're editing empty repository
811 parents = None
817 parents = None
812 else:
818 else:
813 parents = [parent_commit]
819 parents = [parent_commit]
814
820
815 # add multiple nodes
821 # add multiple nodes
816 for _filename, data in nodes.items():
822 for _filename, data in nodes.items():
817 # new filename, can be renamed from the old one, also sanitaze
823 # new filename, can be renamed from the old one, also sanitaze
818 # the path for any hack around relative paths like ../../ etc.
824 # the path for any hack around relative paths like ../../ etc.
819 filename = self._sanitize_path(data['filename'])
825 filename = self._sanitize_path(data['filename'])
820 old_filename = self._sanitize_path(_filename)
826 old_filename = self._sanitize_path(_filename)
821 content = data['content']
827 content = data['content']
822 file_mode = data.get('mode')
828 file_mode = data.get('mode')
823 filenode = FileNode(old_filename, content=content, mode=file_mode)
829 filenode = FileNode(old_filename, content=content, mode=file_mode)
824 op = data['op']
830 op = data['op']
825 if op == 'add':
831 if op == 'add':
826 imc.add(filenode)
832 imc.add(filenode)
827 elif op == 'del':
833 elif op == 'del':
828 imc.remove(filenode)
834 imc.remove(filenode)
829 elif op == 'mod':
835 elif op == 'mod':
830 if filename != old_filename:
836 if filename != old_filename:
831 # TODO: handle renames more efficient, needs vcs lib changes
837 # TODO: handle renames more efficient, needs vcs lib changes
832 imc.remove(filenode)
838 imc.remove(filenode)
833 imc.add(FileNode(filename, content=content, mode=file_mode))
839 imc.add(FileNode(filename, content=content, mode=file_mode))
834 else:
840 else:
835 imc.change(filenode)
841 imc.change(filenode)
836
842
837 try:
843 try:
838 # TODO: handle pre push scenario commit changes
844 # TODO: handle pre push scenario commit changes
839 tip = imc.commit(message=message,
845 tip = imc.commit(message=message,
840 author=author,
846 author=author,
841 parents=parents,
847 parents=parents,
842 branch=parent_commit.branch)
848 branch=parent_commit.branch)
843 except NodeNotChangedError:
849 except NodeNotChangedError:
844 raise
850 raise
845 except Exception as e:
851 except Exception as e:
846 log.exception("Unexpected exception during call to imc.commit")
852 log.exception("Unexpected exception during call to imc.commit")
847 raise IMCCommitError(str(e))
853 raise IMCCommitError(str(e))
848 finally:
854 finally:
849 # always clear caches, if commit fails we want fresh object also
855 # always clear caches, if commit fails we want fresh object also
850 self.mark_for_invalidation(repo.repo_name)
856 self.mark_for_invalidation(repo.repo_name)
851
857
852 if trigger_push_hook:
858 if trigger_push_hook:
853 hooks_utils.trigger_post_push_hook(
859 hooks_utils.trigger_post_push_hook(
854 username=user.username, action='push_local', hook_type='post_push',
860 username=user.username, action='push_local', hook_type='post_push',
855 repo_name=repo.repo_name, repo_alias=scm_instance.alias,
861 repo_name=repo.repo_name, repo_alias=scm_instance.alias,
856 commit_ids=[tip.raw_id])
862 commit_ids=[tip.raw_id])
857
863
858 return tip
864 return tip
859
865
860 def delete_nodes(self, user, repo, message, nodes, parent_commit=None,
866 def delete_nodes(self, user, repo, message, nodes, parent_commit=None,
861 author=None, trigger_push_hook=True):
867 author=None, trigger_push_hook=True):
862 """
868 """
863 Deletes given multiple nodes into `repo`
869 Deletes given multiple nodes into `repo`
864
870
865 :param user: RhodeCode User object or user_id, the committer
871 :param user: RhodeCode User object or user_id, the committer
866 :param repo: RhodeCode Repository object
872 :param repo: RhodeCode Repository object
867 :param message: commit message
873 :param message: commit message
868 :param nodes: mapping {filename:{'content':content},...}
874 :param nodes: mapping {filename:{'content':content},...}
869 :param parent_commit: parent commit, can be empty than it's initial
875 :param parent_commit: parent commit, can be empty than it's initial
870 commit
876 commit
871 :param author: author of commit, cna be different that commiter only
877 :param author: author of commit, cna be different that commiter only
872 for git
878 for git
873 :param trigger_push_hook: trigger push hooks
879 :param trigger_push_hook: trigger push hooks
874
880
875 :returns: new commit after deletion
881 :returns: new commit after deletion
876 """
882 """
877
883
878 user = self._get_user(user)
884 user = self._get_user(user)
879 scm_instance = repo.scm_instance(cache=False)
885 scm_instance = repo.scm_instance(cache=False)
880
886
881 processed_nodes = []
887 processed_nodes = []
882 for f_path in nodes:
888 for f_path in nodes:
883 f_path = self._sanitize_path(f_path)
889 f_path = self._sanitize_path(f_path)
884 # content can be empty but for compatabilty it allows same dicts
890 # content can be empty but for compatabilty it allows same dicts
885 # structure as add_nodes
891 # structure as add_nodes
886 content = nodes[f_path].get('content')
892 content = nodes[f_path].get('content')
887 processed_nodes.append((f_path, content))
893 processed_nodes.append((f_path, content))
888
894
889 message = safe_unicode(message)
895 message = safe_unicode(message)
890 commiter = user.full_contact
896 commiter = user.full_contact
891 author = safe_unicode(author) if author else commiter
897 author = safe_unicode(author) if author else commiter
892
898
893 imc = scm_instance.in_memory_commit
899 imc = scm_instance.in_memory_commit
894
900
895 if not parent_commit:
901 if not parent_commit:
896 parent_commit = EmptyCommit(alias=scm_instance.alias)
902 parent_commit = EmptyCommit(alias=scm_instance.alias)
897
903
898 if isinstance(parent_commit, EmptyCommit):
904 if isinstance(parent_commit, EmptyCommit):
899 # EmptyCommit means we we're editing empty repository
905 # EmptyCommit means we we're editing empty repository
900 parents = None
906 parents = None
901 else:
907 else:
902 parents = [parent_commit]
908 parents = [parent_commit]
903 # add multiple nodes
909 # add multiple nodes
904 for path, content in processed_nodes:
910 for path, content in processed_nodes:
905 imc.remove(FileNode(path, content=content))
911 imc.remove(FileNode(path, content=content))
906
912
907 # TODO: handle pre push scenario
913 # TODO: handle pre push scenario
908 tip = imc.commit(message=message,
914 tip = imc.commit(message=message,
909 author=author,
915 author=author,
910 parents=parents,
916 parents=parents,
911 branch=parent_commit.branch)
917 branch=parent_commit.branch)
912
918
913 self.mark_for_invalidation(repo.repo_name)
919 self.mark_for_invalidation(repo.repo_name)
914 if trigger_push_hook:
920 if trigger_push_hook:
915 hooks_utils.trigger_post_push_hook(
921 hooks_utils.trigger_post_push_hook(
916 username=user.username, action='push_local', hook_type='post_push',
922 username=user.username, action='push_local', hook_type='post_push',
917 repo_name=repo.repo_name, repo_alias=scm_instance.alias,
923 repo_name=repo.repo_name, repo_alias=scm_instance.alias,
918 commit_ids=[tip.raw_id])
924 commit_ids=[tip.raw_id])
919 return tip
925 return tip
920
926
    def strip(self, repo, commit_id, branch):
        """
        Strip the given commit from `repo` via the vcs backend.

        :param repo: RhodeCode Repository object
        :param commit_id: commit to strip
        :param branch: branch name, forwarded to the backend's strip call
        """
        # use a fresh, uncached scm instance for this history rewrite
        scm_instance = repo.scm_instance(cache=False)
        # clear the 'hooks' config section — presumably so vcs hooks do not
        # fire during the strip; TODO confirm against the backend behavior
        scm_instance.config.clear_section('hooks')
        scm_instance.strip(commit_id, branch)
        # history changed, drop cached repo objects
        self.mark_for_invalidation(repo.repo_name)
926
932
    def get_unread_journal(self):
        """Return the number of journal (UserLog) entries."""
        # NOTE(review): this counts *all* UserLog rows; despite the name,
        # no read/unread filtering is visible here
        return self.sa.query(UserLog).count()
929
935
930 @classmethod
936 @classmethod
931 def backend_landing_ref(cls, repo_type):
937 def backend_landing_ref(cls, repo_type):
932 """
938 """
933 Return a default landing ref based on a repository type.
939 Return a default landing ref based on a repository type.
934 """
940 """
935
941
936 landing_ref = {
942 landing_ref = {
937 'hg': ('branch:default', 'default'),
943 'hg': ('branch:default', 'default'),
938 'git': ('branch:master', 'master'),
944 'git': ('branch:master', 'master'),
939 'svn': ('rev:tip', 'latest tip'),
945 'svn': ('rev:tip', 'latest tip'),
940 'default': ('rev:tip', 'latest tip'),
946 'default': ('rev:tip', 'latest tip'),
941 }
947 }
942
948
943 return landing_ref.get(repo_type) or landing_ref['default']
949 return landing_ref.get(repo_type) or landing_ref['default']
944
950
945 def get_repo_landing_revs(self, translator, repo=None):
951 def get_repo_landing_revs(self, translator, repo=None):
946 """
952 """
947 Generates select option with tags branches and bookmarks (for hg only)
953 Generates select option with tags branches and bookmarks (for hg only)
948 grouped by type
954 grouped by type
949
955
950 :param repo:
956 :param repo:
951 """
957 """
952 _ = translator
958 _ = translator
953 repo = self._get_repo(repo)
959 repo = self._get_repo(repo)
954
960
955 if repo:
961 if repo:
956 repo_type = repo.repo_type
962 repo_type = repo.repo_type
957 else:
963 else:
958 repo_type = 'default'
964 repo_type = 'default'
959
965
960 default_landing_ref, landing_ref_lbl = self.backend_landing_ref(repo_type)
966 default_landing_ref, landing_ref_lbl = self.backend_landing_ref(repo_type)
961
967
962 default_ref_options = [
968 default_ref_options = [
963 [default_landing_ref, landing_ref_lbl]
969 [default_landing_ref, landing_ref_lbl]
964 ]
970 ]
965 default_choices = [
971 default_choices = [
966 default_landing_ref
972 default_landing_ref
967 ]
973 ]
968
974
969 if not repo:
975 if not repo:
970 return default_choices, default_ref_options
976 return default_choices, default_ref_options
971
977
972 repo = repo.scm_instance()
978 repo = repo.scm_instance()
973
979
974 ref_options = [('rev:tip', 'latest tip')]
980 ref_options = [('rev:tip', 'latest tip')]
975 choices = ['rev:tip']
981 choices = ['rev:tip']
976
982
977 # branches
983 # branches
978 branch_group = [(u'branch:%s' % safe_unicode(b), safe_unicode(b)) for b in repo.branches]
984 branch_group = [(u'branch:%s' % safe_unicode(b), safe_unicode(b)) for b in repo.branches]
979 if not branch_group:
985 if not branch_group:
980 # new repo, or without maybe a branch?
986 # new repo, or without maybe a branch?
981 branch_group = default_ref_options
987 branch_group = default_ref_options
982
988
983 branches_group = (branch_group, _("Branches"))
989 branches_group = (branch_group, _("Branches"))
984 ref_options.append(branches_group)
990 ref_options.append(branches_group)
985 choices.extend([x[0] for x in branches_group[0]])
991 choices.extend([x[0] for x in branches_group[0]])
986
992
987 # bookmarks for HG
993 # bookmarks for HG
988 if repo.alias == 'hg':
994 if repo.alias == 'hg':
989 bookmarks_group = (
995 bookmarks_group = (
990 [(u'book:%s' % safe_unicode(b), safe_unicode(b))
996 [(u'book:%s' % safe_unicode(b), safe_unicode(b))
991 for b in repo.bookmarks],
997 for b in repo.bookmarks],
992 _("Bookmarks"))
998 _("Bookmarks"))
993 ref_options.append(bookmarks_group)
999 ref_options.append(bookmarks_group)
994 choices.extend([x[0] for x in bookmarks_group[0]])
1000 choices.extend([x[0] for x in bookmarks_group[0]])
995
1001
996 # tags
1002 # tags
997 tags_group = (
1003 tags_group = (
998 [(u'tag:%s' % safe_unicode(t), safe_unicode(t))
1004 [(u'tag:%s' % safe_unicode(t), safe_unicode(t))
999 for t in repo.tags],
1005 for t in repo.tags],
1000 _("Tags"))
1006 _("Tags"))
1001 ref_options.append(tags_group)
1007 ref_options.append(tags_group)
1002 choices.extend([x[0] for x in tags_group[0]])
1008 choices.extend([x[0] for x in tags_group[0]])
1003
1009
1004 return choices, ref_options
1010 return choices, ref_options
1005
1011
1006 def get_server_info(self, environ=None):
1012 def get_server_info(self, environ=None):
1007 server_info = get_system_info(environ)
1013 server_info = get_system_info(environ)
1008 return server_info
1014 return server_info
General Comments 0
You need to be logged in to leave comments. Login now