# Copyright (C) 2012-2023 RhodeCode GmbH # # This program is free software: you can redistribute it and/or modify # it under the terms of the GNU Affero General Public License, version 3 # (only), as published by the Free Software Foundation. # # This program is distributed in the hope that it will be useful, # but WITHOUT ANY WARRANTY; without even the implied warranty of # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the # GNU General Public License for more details. # # You should have received a copy of the GNU Affero General Public License # along with this program. If not, see <http://www.gnu.org/licenses/>. # # This program is dual-licensed. If you wish to learn more about the # RhodeCode Enterprise Edition, including its added features, Support services, # and proprietary license terms, please see https://rhodecode.com/licenses/ """ Index schema for RhodeCode """ import importlib import logging from rhodecode.lib.index.search_utils import normalize_text_for_matching log = logging.getLogger(__name__) # leave defaults for backward compat default_searcher = 'rhodecode.lib.index.whoosh' default_location = '%(here)s/data/index' ES_VERSION_2 = '2' ES_VERSION_6 = '6' # for legacy reasons we keep 2 compat as default DEFAULT_ES_VERSION = ES_VERSION_2 try: from rhodecode_tools.lib.fts_index.elasticsearch_engine_6 import ES_CONFIG # pragma: no cover except ImportError: log.warning('rhodecode_tools not available, use of full text search is limited') pass class BaseSearcher(object): query_lang_doc = '' es_version = None name = None DIRECTION_ASC = 'asc' DIRECTION_DESC = 'desc' def __init__(self): pass def cleanup(self): pass def search(self, query, document_type, search_user, repo_name=None, repo_group_name=None, raise_on_exc=True): raise Exception('NotImplemented') @staticmethod def query_to_mark(query, default_field=None): """ Formats the query to mark token for jquery.mark.js highlighting. ES could have a different format optionally. :param default_field: :param query: """ return ' '.join(normalize_text_for_matching(query).split()) @property def is_es_6(self): return self.es_version == ES_VERSION_6 def get_handlers(self): return {} @staticmethod def extract_search_tags(query): return [] @staticmethod def escape_specials(val): """ Handle and escape reserved chars for search """ return val def sort_def(self, search_type, direction, sort_field): """ Defines sorting for search. This function should decide if for given search_type, sorting can be done with sort_field. It also should translate common sort fields into backend specific. e.g elasticsearch """ raise NotImplementedError() @staticmethod def get_sort(search_type, search_val): """ Method used to parse the GET search sort value to a field and direction. e.g asc:lines == asc, lines There's also a legacy support for newfirst/oldfirst which defines commit sorting only """ direction = BaseSearcher.DIRECTION_ASC sort_field = None if not search_val: return direction, sort_field if search_val.startswith('asc:'): sort_field = search_val[4:] direction = BaseSearcher.DIRECTION_ASC elif search_val.startswith('desc:'): sort_field = search_val[5:] direction = BaseSearcher.DIRECTION_DESC elif search_val == 'newfirst' and search_type == 'commit': sort_field = 'date' direction = BaseSearcher.DIRECTION_DESC elif search_val == 'oldfirst' and search_type == 'commit': sort_field = 'date' direction = BaseSearcher.DIRECTION_ASC return direction, sort_field def search_config(config, prefix='search.'): _config = {} for key in config.keys(): if key.startswith(prefix): _config[key[len(prefix):]] = config[key] return _config def searcher_from_config(config, prefix='search.'): _config = search_config(config, prefix) if 'location' not in _config: _config['location'] = default_location if 'es_version' not in _config: # use an old legacy ES version set to 2 _config['es_version'] = '2' imported = importlib.import_module(_config.get('module', default_searcher)) searcher = imported.Searcher(config=_config) return searcher