upstream/kallithea Files · rhodecode/lib/indexers/daemon.py

fixed issue with public journal rss/atom feeds after journal filter implementation

marcink - - Load All Authors

File last commit:

r3016:b3c8a3a5 beta


                r3075:25029d6f

beta

Download file

             daemon.py
        
                    416 lines
            
             | 16.1 KiB
            
                | text/x-python
            
             |
                PythonLexer
            
             / rhodecode / lib / indexers / daemon.py
          
                    History
                
                 |
                  Source
                 | Raw
                 |Copy content
                 |Copy permalink

        marcink
    
fixes to #92, updated changelog

              r885
            
      # -*- coding: utf-8 -*-

      """

          rhodecode.lib.indexers.daemon

          ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~

        marcink
    
fixed daemon typos

              r1377
            
          A daemon will read from task table and run tasks

        marcink
    
Fixed whoosh daemon, for deprecated walk method

              r947
            
        marcink
    
fixes to #92, updated changelog

              r885
            
          :created_on: Jan 26, 2010

          :author: marcink

        marcink
    
2012 copyrights

              r1824
            
          :copyright: (C) 2010-2012 Marcin Kuzminski <marcin@python-works.com>

        marcink
    
fixes to #92, updated changelog

              r885
            
          :license: GPLv3, see COPYING for more details.

      """

        marcink
    
fixed license  issue #149

              r1206
            
      # This program is free software: you can redistribute it and/or modify

      # it under the terms of the GNU General Public License as published by

      # the Free Software Foundation, either version 3 of the License, or

      # (at your option) any later version.

        marcink
    
Fixed whoosh daemon, for deprecated walk method

              r947
            
      #

        marcink
    
renamed project to rhodecode

              r547
            
      # This program is distributed in the hope that it will be useful,

      # but WITHOUT ANY WARRANTY; without even the implied warranty of

      # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the

      # GNU General Public License for more details.

        marcink
    
Fixed whoosh daemon, for deprecated walk method

              r947
            
      #

        marcink
    
renamed project to rhodecode

              r547
            
      # You should have received a copy of the GNU General Public License

        marcink
    
fixed license  issue #149

              r1206
            
      # along with this program.  If not, see <http://www.gnu.org/licenses/>.

        Indra Talip
    
import with_statement to make daemon.py python 2.5 compatible

              r2641
            
      from __future__ import with_statement

        marcink
    
renamed project to rhodecode

              r547
            
        marcink
    
simplified str2bool, and moved safe_unicode out of helpers since it was not html specific function

              r1154
            
      import os

        marcink
    
renamed project to rhodecode

              r547
            
      import sys

        marcink
    
simplified str2bool, and moved safe_unicode out of helpers since it was not html specific function

              r1154
            
      import logging

        marcink
    
fixes to #92, updated changelog

              r885
            
      import traceback

        marcink
    
simplified str2bool, and moved safe_unicode out of helpers since it was not html specific function

              r1154
            
      from shutil import rmtree

      from time import mktime

        marcink
    
renamed project to rhodecode

              r547
            
      from os.path import dirname as dn

      from os.path import join as jn

      # extend sys.path so that the rhodecode package can be imported

      project_path = dn(dn(dn(dn(os.path.realpath(__file__)))))

      sys.path.append(project_path)

        marcink
    
utils/conf...

              r2109
            
      from rhodecode.config.conf import INDEX_EXTENSIONS

        marcink
    
Refactor codes for scm model...

              r691
            
      from rhodecode.model.scm import ScmModel

        marcink
    
fixed issues some people had with whoosh indexers and unicode decode...

              r3016
            
      from rhodecode.lib.utils2 import safe_unicode, safe_str

        marcink
    
little code cleanup...

              r2648
            
      from rhodecode.lib.indexers import SCHEMA, IDX_NAME, CHGSETS_SCHEMA, \

          CHGSET_IDX_NAME

        marcink
    
renamed project to rhodecode

              r547
            
        marcink
    
Added VCS into rhodecode core for faster and easier deployments of new versions

              r2007
            
      from rhodecode.lib.vcs.exceptions import ChangesetError, RepositoryError, \

        marcink
    
fixes issue with whoosh reindexing files that were removed or renamed

              r1711
            
          NodeDoesNotExistError

        marcink
    
rewrote whoosh indexing to run internal repository.walk() instead of filesystem....

              r560
            
        Indra Talip
    
create an index for commit messages and the ability to search them and see results

              r2640
            
      from whoosh.index import create_in, open_dir, exists_in

      from whoosh.query import *

      from whoosh.qparser import QueryParser

        marcink
    
simplified str2bool, and moved safe_unicode out of helpers since it was not html specific function

              r1154
            
        marcink
    
code garden

              r2101
            
      log = logging.getLogger('whoosh_indexer')

        marcink
    
renamed project to rhodecode

              r547
            
        marcink
    
bumped whoosh to 2.3.X series...

              r1995
            
        marcink
    
renamed project to rhodecode

              r547
            
      class WhooshIndexingDaemon(object):

        marcink
    
rewrote whoosh indexing to run internal repository.walk() instead of filesystem....

              r560
            
          """

        marcink
    
#469 added --update-only option to whoosh to re-index only given list...

              r2373
            
          Daemon for atomic indexing jobs

        marcink
    
rewrote whoosh indexing to run internal repository.walk() instead of filesystem....

              r560
            
          """

        marcink
    
renamed project to rhodecode

              r547
            
        marcink
    
bumped whoosh to 2.3.X series...

              r1995
            
          def __init__(self, indexname=IDX_NAME, index_location=None,
                       repo_location=None, sa=None, repo_list=None,
                       repo_update_list=None):
              """
              Scan the repositories, apply the optional name filters and
              decide whether a full (initial) index build is required

              :param indexname: name of the file content index
              :param index_location: directory holding the whoosh indexes,
                it is created when it does not exist yet
              :param repo_location: location handed to ``ScmModel.repo_scan``
              :param sa: passed as is to ``ScmModel``
              :param repo_list: optional repository names, when given only
                the scanned repositories with those names are kept
              :param repo_update_list: optional repository names, when given
                only those of the remaining repositories are kept
              :raises Exception: when ``index_location`` or
                ``repo_location`` is empty
              """
              self.indexname = indexname

              self.index_location = index_location
              if not index_location:
                  raise Exception('You have to provide index location')

              self.repo_location = repo_location
              if not repo_location:
                  raise Exception('You have to provide repositories location')

              self.repo_paths = ScmModel(sa).repo_scan(self.repo_location)

              # keep only the repositories that were explicitly asked for
              if repo_list:
                  # names may be non-ascii, so compare them as unicode
                  wanted = map(safe_unicode, repo_list)
                  self.filtered_repo_paths = dict(
                      (name, scanned)
                      for name, scanned in self.repo_paths.items()
                      if name in wanted
                  )
                  self.repo_paths = self.filtered_repo_paths

              # keep only the repositories selected for update
              self.filtered_repo_update_paths = {}
              if repo_update_list:
                  self.filtered_repo_update_paths = dict(
                      (name, scanned)
                      for name, scanned in self.repo_paths.items()
                      if name in repo_update_list
                  )
                  self.repo_paths = self.filtered_repo_update_paths

              # a full build stays selected unless the index directory and
              # both indexes are already in place
              self.initial = True

              if not os.path.isdir(self.index_location):
                  os.makedirs(self.index_location)
                  log.info('Cannot run incremental index since it does not'
                           ' yet exist running full build')
                  return

              if not exists_in(self.index_location, IDX_NAME):
                  log.info('Running full index build as the file content'
                           ' index does not exist')
                  return

              if not exists_in(self.index_location, CHGSET_IDX_NAME):
                  log.info('Running full index build as the changeset'
                           ' index does not exist')
                  return

              self.initial = False

        marcink
    
Hacking for git support,and new faster repo scan

              r631
            
        marcink
    
fixed reindexing, and made some optimizations to reuse repo instances from repo scan list.

              r561
            
          def get_paths(self, repo):
              """
              Walk the ``tip`` changeset of ``repo`` and collect the path of
              every file found, each joined onto the repository path

              :param repo: vcs repository instance
              :returns: set of paths; when a ``RepositoryError`` is raised
                the traceback is logged at debug level and the paths
                collected up to that point are returned
              """
              collected = set()
              try:
                  tip_changeset = repo.get_changeset('tip')
                  for _root, _subdirs, file_nodes in tip_changeset.walk('/'):
                      collected.update(
                          jn(safe_str(repo.path), safe_str(file_node.path))
                          for file_node in file_nodes
                      )
              except RepositoryError:
                  # best effort only, e.g. nothing can be walked in the repo
                  log.debug(traceback.format_exc())
              return collected

        marcink
    
fixed reindexing, and made some optimizations to reuse repo instances from repo scan list.

              r561
            
          def get_node(self, repo, path):
              """
              Return the node for ``path`` taken from the changeset that
              ``repo.get_changeset()`` gives back

              :param repo: vcs repository instance
              :param path: full path of the file; the first
                ``len(repo.path) + 1`` characters are cut off before the
                lookup
              """
              # drop the repository path and the separator that follows it
              relative_path = path[len(repo.path) + 1:]
              return repo.get_changeset().get_node(relative_path)

        marcink
    
Hacking for git support,and new faster repo scan

              r631
            
        marcink
    
fixed reindexing, and made some optimizations to reuse repo instances from repo scan list.

              r561
            
          def get_node_mtime(self, node):
              """
              Return the date of the last changeset of ``node`` converted
              with ``time.mktime``
              """
              changed_on = node.last_changeset.date
              return mktime(changed_on.timetuple())

        marcink
    
Hacking for git support,and new faster repo scan

              r631
            
        marcink
    
changes for #56

              r1171
            
          def add_doc(self, writer, path, repo, repo_name):
              """
              Fetch the node for ``path`` from the vcs backend and add one
              document describing it to ``writer``

              The content is stored only for non binary files whose extension
              is listed in INDEX_EXTENSIONS and whose content is unicode, any
              other file is added with empty content.

              :param writer: whoosh index writer to add the document to
              :param path: full path of the file, as returned by ``get_paths``
              :param repo: vcs repository instance
              :param repo_name: name of the repository
              :returns: tuple ``(indexed, indexed_w_content)`` with the
                counters this call incremented
              """
              node = self.get_node(repo, path)
              without_content = with_content = 0
              text = u''

              content_wanted = (node.extension in INDEX_EXTENSIONS
                                and not node.is_binary)
              if not content_wanted:
                  # only the file name gets indexed, without its content
                  log.debug('    >> %s' % path)
                  without_content += 1
              else:
                  candidate = node.content
                  if isinstance(candidate, unicode):
                      log.debug('    >> %s [WITH CONTENT]' % path)
                      text = candidate
                      with_content += 1
                  else:
                      # NOTE(review): the document is still added below with
                      # empty content, but neither counter is incremented
                      log.warning('  >> %s Could not get this content as unicode '
                                  'replacing with empty content' % path)

              unicode_path = safe_unicode(path)
              document = dict(
                  fileid=unicode_path,
                  owner=unicode(repo.contact),
                  repository=safe_unicode(repo_name),
                  path=unicode_path,
                  content=text,
                  modtime=self.get_node_mtime(node),
                  extension=node.extension,
              )
              writer.add_document(**document)
              return without_content, with_content

        marcink
    
Hacking for git support,and new faster repo scan

              r631
            
        Indra Talip
    
when indexing changesets use the raw_id to locate the point from...

              r2643
            
          def index_changesets(self, writer, repo_name, repo, start_rev=None):
              """
              Add the changesets of ``repo``, beginning at ``start_rev``, to
              the given index writer

              :param writer: the whoosh index writer to add to
              :param repo_name: name of the repository the changesets come
                from, including the repository group
              :param repo: the vcs repository instance to index changesets
                for, it is presumed to have changesets to index
              :param start_rev: the full sha id to start indexing from, when
                None the ``raw_id`` of ``repo[0]`` is used
              :returns: number of documents added to the writer
              """
              def joined_paths(nodes):
                  # space separated, lower-cased paths of the given nodes
                  return u' '.join(
                      [safe_unicode(node.path) for node in nodes]
                  ).lower()

              if start_rev is None:
                  start_rev = repo[0].raw_id

              log.debug('indexing changesets in %s starting at rev: %s' %
                        (repo_name, start_rev))

              total = 0
              for changeset in repo.get_changesets(start=start_rev):
                  log.debug('    >> %s' % changeset)
                  writer.add_document(
                      raw_id=unicode(changeset.raw_id),
                      owner=unicode(repo.contact),
                      date=changeset._timestamp,
                      repository=safe_unicode(repo_name),
                      author=changeset.author,
                      message=changeset.message,
                      last=changeset.last,
                      added=joined_paths(changeset.added),
                      removed=joined_paths(changeset.removed),
                      changed=joined_paths(changeset.changed),
                      parents=u' '.join(
                          [parent.raw_id for parent in changeset.parents]
                      ),
                  )
                  total += 1

              log.debug('indexed %d changesets for repo %s' % (total, repo_name))
              return total

        Indra Talip
    
create an index for commit messages and the ability to search them and see results

              r2640
            
          def index_files(self, file_idx_writer, repo_name, repo):
              """
              Add a document for every path returned by ``get_paths`` for the
              given repository

              :param file_idx_writer: the whoosh index writer to add to
              :param repo_name: name of the repository we're indexing
              :param repo: instance of vcs repo
              :returns: tuple with the summed up counters reported by
                ``add_doc``: (without content, with content)
              """
              log.debug('building index for [%s]' % repo.path)

              plain_total = content_total = 0
              for file_path in self.get_paths(repo):
                  plain, with_content = self.add_doc(file_idx_writer, file_path,
                                                     repo, repo_name)
                  plain_total += plain
                  content_total += with_content

              summary = (plain_total + content_total, content_total, repo.path)
              log.debug('added %s files %s with content for repo %s' % summary)
              return plain_total, content_total

        Indra Talip
    
create an index for commit messages and the ability to search them and see results

              r2640
            
          def update_changeset_index(self):
              """
              Incrementally update the changeset index

              For every repository in ``self.repo_paths`` that has at least
              one revision, the document flagged ``last`` is looked up in the
              index. When nothing is indexed yet, or the repository holds
              more revisions than were indexed, the previous ``last``
              document(s) are deleted and the changesets are indexed again
              starting from that changeset.

              The writer is committed when anything was written, otherwise
              it is cancelled so that it does not keep hold of the index.
              """
              idx = open_dir(self.index_location, indexname=CHGSET_IDX_NAME)

              with idx.searcher() as searcher:
                  writer = idx.writer()
                  writer_is_dirty = False
                  try:
                      indexed_total = 0
                      # defined up front so the summary log below also works
                      # when there is no repository to loop over
                      repo_name = None
                      for repo_name, repo in self.repo_paths.items():
                          # skip indexing if there aren't any revs in the repo
                          num_of_revs = len(repo)
                          if num_of_revs < 1:
                              continue

                          qp = QueryParser('repository', schema=CHGSETS_SCHEMA)
                          q = qp.parse(u"last:t AND %s" % repo_name)
                          results = searcher.search(q)

                          # default to scanning the entire repo
                          last_rev = 0
                          start_id = None
                          if len(results) > 0:
                              # assuming that there is only one result, if not
                              # this may require a full re-index.
                              start_id = results[0]['raw_id']
                              last_rev = repo.get_changeset(
                                  revision=start_id).revision

                          # there are new changesets to index or a new repo
                          # to index
                          if last_rev == 0 or num_of_revs > last_rev + 1:
                              # delete the docs in the index for the previous
                              # last changeset(s)
                              for hit in results:
                                  q = qp.parse(u"last:t AND %s AND raw_id:%s" %
                                                  (repo_name, hit['raw_id']))
                                  writer.delete_by_query(q)

                              # index from the previous last changeset + all
                              # new ones
                              indexed_total += self.index_changesets(writer,
                                                      repo_name, repo, start_id)
                              writer_is_dirty = True

                      log.debug('indexed %s changesets for repo %s' % (
                                   indexed_total, repo_name)
                      )
                  finally:
                      if writer_is_dirty:
                          log.debug('>> COMMITING CHANGES TO CHANGESET INDEX<<')
                          writer.commit(merge=True)
                          log.debug('>>> FINISHED REBUILDING CHANGESET INDEX <<<')
                      else:
                          # cancel has to be called; the bare attribute access
                          # used here before did nothing at all
                          writer.cancel()
                          log.debug('>> NOTHING TO COMMIT TO CHANGESET INDEX<<')

        Indra Talip
    
create an index for commit messages and the ability to search them and see results

              r2640
            
          def update_file_index(self):
              """
              Incrementally refresh the file index.

              First pass: walk the documents already stored in the index. For
              documents whose repository is listed in
              ``self.filtered_repo_update_paths`` the node is looked up again;
              if its mtime is newer than the stored ``modtime`` the document is
              deleted and queued for re-indexing, and if the lookup raises
              ``ChangesetError`` or ``NodeDoesNotExistError`` the document is
              deleted from the index.

              Second pass: walk the paths of every repository that has at least
              one revision and add, through ``self.add_doc``, each path that was
              queued or is not stored in the index yet.

              The writer is committed when anything was changed and cancelled
              otherwise; because this happens in a ``finally`` clause it also
              runs when an exception interrupts one of the passes.
              """
              log.debug((u'STARTING INCREMENTAL INDEXING UPDATE FOR EXTENSIONS %s '
                         'AND REPOS %s') % (INDEX_EXTENSIONS, self.repo_paths.keys()))

              idx = open_dir(self.index_location, indexname=self.indexname)
              known_paths = set()  # every path currently stored in the index
              stale_paths = set()  # stored paths that have to be indexed again

              writer = idx.writer()
              writer_is_dirty = False
              try:
                  with idx.reader() as reader:
                      for stored in reader.all_stored_fields():
                          stored_path = stored['path']
                          stored_repo = stored['repository']
                          known_paths.add(stored_path)

                          # only repositories selected for update are re-checked
                          if stored_repo not in self.filtered_repo_update_paths:
                              continue

                          repo = self.repo_paths[stored_repo]
                          try:
                              node = self.get_node(repo, stored_path)
                              stored_mtime = stored['modtime']
                              node_mtime = self.get_node_mtime(node)
                              if not node_mtime > stored_mtime:
                                  # unchanged since it was indexed
                                  continue

                              # changed since it was indexed: drop the old
                              # document and remember to index the file again
                              log.debug(
                                  'adding to reindex list %s mtime: %s vs %s' % (
                                      stored_path, node_mtime, stored_mtime)
                              )
                              writer.delete_by_term('fileid', stored_path)
                              writer_is_dirty = True
                              stale_paths.add(stored_path)
                          except (ChangesetError, NodeDoesNotExistError):
                              # the file was deleted since it was indexed
                              log.debug('removing from index %s' % stored_path)
                              writer.delete_by_term('path', stored_path)
                              writer_is_dirty = True

                  # walk the files of every repository and index whatever is
                  # new or was queued above
                  files_total = 0  # indexed
                  with_content_total = 0  # indexed with content
                  for repo_name, repo in self.repo_paths.items():
                      # skip indexing if there aren't any revisions
                      if len(repo) < 1:
                          continue

                      without_content = 0  # indexed
                      with_content = 0  # indexed with content
                      for path in self.get_paths(repo):
                          path = safe_unicode(path)
                          if path not in stale_paths and path in known_paths:
                              # already indexed and still up to date
                              continue

                          # either a changed file or one never indexed before
                          added, added_with_content = self.add_doc(
                              writer, path, repo, repo_name)
                          writer_is_dirty = True
                          log.debug('re indexing %s' % path)
                          without_content += added
                          with_content += added_with_content
                          files_total += 1
                          with_content_total += added_with_content

                      log.debug('added %s files %s with content for repo %s' % (
                                   without_content + with_content, with_content,
                                   repo.path)
                      )

                  log.debug('indexed %s files in total and %s with content' % (
                              files_total, with_content_total)
                  )
              finally:
                  if not writer_is_dirty:
                      log.debug('>> NOTHING TO COMMIT TO FILE INDEX <<')
                      writer.cancel()
                  else:
                      log.debug('>> COMMITING CHANGES TO FILE INDEX <<')
                      writer.commit(merge=True)
                      log.debug('>>> FINISHED REBUILDING FILE INDEX <<<')

          def build_indexes(self):
              """
              Build the changeset index and the file index from scratch.

              An existing index directory is removed and an empty one is created
              in its place. Both indexes are then created, every repository with
              at least one revision is fed to ``self.index_files`` and
              ``self.index_changesets``, and finally both writers are committed.
              """
              location = self.index_location
              if os.path.exists(location):
                  log.debug('removing previous index')
                  rmtree(location)

              if not os.path.exists(location):
                  os.mkdir(location)

              # changeset index first, then the file index
              changeset_writer = create_in(
                  location, CHGSETS_SCHEMA, indexname=CHGSET_IDX_NAME
              ).writer()
              file_writer = create_in(
                  location, SCHEMA, indexname=IDX_NAME
              ).writer()

              log.debug('BUILDING INDEX FOR EXTENSIONS %s '
                        'AND REPOS %s' % (INDEX_EXTENSIONS, self.repo_paths.keys()))

              for repo_name, repo in self.repo_paths.items():
                  # repositories without any revisions are not indexed
                  if len(repo) >= 1:
                      self.index_files(file_writer, repo_name, repo)
                      self.index_changesets(changeset_writer, repo_name, repo)

              log.debug('>> COMMITING CHANGES <<')
              file_writer.commit(merge=True)
              changeset_writer.commit(merge=True)
              log.debug('>>> FINISHED BUILDING INDEX <<<')

        marcink
    
#453 added ID field in whoosh SCHEMA that solves the issue of reindexing modified files

              r2388
            
        Indra Talip
    
create an index for commit messages and the ability to search them and see results

              r2640
            
          def update_indexes(self):
              """Incrementally update the file index, then the changeset index."""
              # order matters: files first, changesets second
              for refresh in (self.update_file_index, self.update_changeset_index):
                  refresh()

        marcink
    
Hacking for git support,and new faster repo scan

              r631
            
        marcink
    
renamed project to rhodecode

              r547
            
          def run(self, full_index=False):
              """Run daemon

              Rebuilds the indexes from scratch when ``full_index`` is true or
              ``self.initial`` is set; otherwise updates the existing indexes.
              """
              rebuild = full_index or self.initial
              action = self.build_indexes if rebuild else self.update_indexes
              action()

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages