redis: some cleanups and use of pipelines for better performance
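The commit batches the Redis counter updates that used to be issued one call at a time into a single pipeline round trip. A minimal sketch of the pattern, using the redis-py client that backs Datastores.redis (the key names and values below are illustrative, not the application's real ones):

    import redis

    client = redis.StrictRedis()  # stand-in for Datastores.redis
    pipe = client.pipeline(transaction=False)  # batch commands without MULTI/EXEC
    pipe.incr('appenlight:data:reports_per_minute:2016-01-01 10:00', 5)
    pipe.expire('appenlight:data:reports_per_minute:2016-01-01 10:00', 3600 * 24)
    pipe.sadd('appenlight:data:apps_that_got_new_data_per_hour', 1)
    results = pipe.execute()  # one network round trip; one result per queued command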
@@ -1,635 +1,650 b''
# -*- coding: utf-8 -*-

# Copyright (C) 2010-2016 RhodeCode GmbH
#
# This program is free software: you can redistribute it and/or modify
# it under the terms of the GNU Affero General Public License, version 3
# (only), as published by the Free Software Foundation.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU Affero General Public License
# along with this program. If not, see <http://www.gnu.org/licenses/>.
#
# This program is dual-licensed. If you wish to learn more about the
# AppEnlight Enterprise Edition, including its added features, Support
# services, and proprietary license terms, please see
# https://rhodecode.com/licenses/

import bisect
import collections
import math
from datetime import datetime, timedelta

import sqlalchemy as sa
import pyelasticsearch

from celery.utils.log import get_task_logger
from zope.sqlalchemy import mark_changed
from pyramid.threadlocal import get_current_request, get_current_registry
from appenlight.celery import celery
from appenlight.models.report_group import ReportGroup
from appenlight.models import DBSession, Datastores
from appenlight.models.report import Report
from appenlight.models.log import Log
from appenlight.models.metric import Metric
from appenlight.models.event import Event

from appenlight.models.services.application import ApplicationService
from appenlight.models.services.event import EventService
from appenlight.models.services.log import LogService
from appenlight.models.services.report import ReportService
from appenlight.models.services.report_group import ReportGroupService
from appenlight.models.services.user import UserService
from appenlight.models.tag import Tag
from appenlight.lib import print_traceback
from appenlight.lib.utils import parse_proto, in_batches
from appenlight.lib.ext_json import json
from appenlight.lib.redis_keys import REDIS_KEYS
from appenlight.lib.enums import ReportType

log = get_task_logger(__name__)

sample_boundries = list(range(100, 1000, 100)) + \
                   list(range(1000, 10000, 1000)) + \
                   list(range(10000, 100000, 5000))


def pick_sample(total_occurences, report_type=None):
    every = 1.0
    position = bisect.bisect_left(sample_boundries, total_occurences)
    if position > 0:
        if report_type == ReportType.not_found:
            divide = 10.0
        else:
            divide = 100.0
        every = sample_boundries[position - 1] / divide
    return total_occurences % every == 0


@celery.task(queue="default", default_retry_delay=1, max_retries=2)
def test_exception_task():
    log.error('test celery log', extra={'location': 'celery'})
    log.warning('test celery log', extra={'location': 'celery'})
    raise Exception('Celery exception test')


@celery.task(queue="default", default_retry_delay=1, max_retries=2)
def test_retry_exception_task():
    try:
        import time

        time.sleep(1.3)
        log.error('test retry celery log', extra={'location': 'celery'})
        log.warning('test retry celery log', extra={'location': 'celery'})
        raise Exception('Celery exception test')
    except Exception as exc:
        test_retry_exception_task.retry(exc=exc)


@celery.task(queue="reports", default_retry_delay=600, max_retries=144)
-def add_reports(resource_id, params, dataset, environ=None, **kwargs):
-    proto_version = parse_proto(params.get('protocol_version', ''))
+def add_reports(resource_id, request_params, dataset, **kwargs):
+    proto_version = parse_proto(request_params.get('protocol_version', ''))
    current_time = datetime.utcnow().replace(second=0, microsecond=0)
    try:
        # we will store solr docs here for single insert
        es_report_docs = {}
        es_report_group_docs = {}
        resource = ApplicationService.by_id(resource_id)

        tags = []
        es_slow_calls_docs = {}
        es_reports_stats_rows = {}
        for report_data in dataset:
            # build report details for later
            added_details = 0
            report = Report()
            report.set_data(report_data, resource, proto_version)
            report._skip_ft_index = True

            report_group = ReportGroupService.by_hash_and_resource(
                report.resource_id,
                report.grouping_hash
            )
            occurences = report_data.get('occurences', 1)
            if not report_group:
                # total reports will be +1 moment later
                report_group = ReportGroup(grouping_hash=report.grouping_hash,
                                           occurences=0, total_reports=0,
                                           last_report=0,
                                           priority=report.priority,
                                           error=report.error,
                                           first_timestamp=report.start_time)
                report_group._skip_ft_index = True
                report_group.report_type = report.report_type
            report.report_group_time = report_group.first_timestamp
            add_sample = pick_sample(report_group.occurences,
                                     report_type=report_group.report_type)
            if add_sample:
                resource.report_groups.append(report_group)
                report_group.reports.append(report)
                added_details += 1
                DBSession.flush()
                if report.partition_id not in es_report_docs:
                    es_report_docs[report.partition_id] = []
                es_report_docs[report.partition_id].append(report.es_doc())
                tags.extend(list(report.tags.items()))
                slow_calls = report.add_slow_calls(report_data, report_group)
                DBSession.flush()
                for s_call in slow_calls:
                    if s_call.partition_id not in es_slow_calls_docs:
                        es_slow_calls_docs[s_call.partition_id] = []
                    es_slow_calls_docs[s_call.partition_id].append(
                        s_call.es_doc())
                # try generating new stat rows if needed
            else:
                # required for postprocessing to not fail later
                report.report_group = report_group

            stat_row = ReportService.generate_stat_rows(
                report, resource, report_group)
            if stat_row.partition_id not in es_reports_stats_rows:
                es_reports_stats_rows[stat_row.partition_id] = []
            es_reports_stats_rows[stat_row.partition_id].append(
                stat_row.es_doc())

            # see if we should mark 10th occurence of report
            last_occurences_10 = int(math.floor(report_group.occurences / 10))
            curr_occurences_10 = int(math.floor(
                (report_group.occurences + report.occurences) / 10))
            last_occurences_100 = int(
                math.floor(report_group.occurences / 100))
            curr_occurences_100 = int(math.floor(
                (report_group.occurences + report.occurences) / 100))
            notify_occurences_10 = last_occurences_10 != curr_occurences_10
            notify_occurences_100 = last_occurences_100 != curr_occurences_100
            report_group.occurences = ReportGroup.occurences + occurences
            report_group.last_timestamp = report.start_time
            report_group.summed_duration = ReportGroup.summed_duration + report.duration
            summed_duration = ReportGroup.summed_duration + report.duration
            summed_occurences = ReportGroup.occurences + occurences
            report_group.average_duration = summed_duration / summed_occurences
            report_group.run_postprocessing(report)
            if added_details:
                report_group.total_reports = ReportGroup.total_reports + 1
                report_group.last_report = report.id
            report_group.set_notification_info(notify_10=notify_occurences_10,
                                               notify_100=notify_occurences_100)
            DBSession.flush()
            report_group.get_report().notify_channel(report_group)
            if report_group.partition_id not in es_report_group_docs:
                es_report_group_docs[report_group.partition_id] = []
            es_report_group_docs[report_group.partition_id].append(
                report_group.es_doc())

            action = 'REPORT'
            log_msg = '%s: %s %s, client: %s, proto: %s' % (
                action,
                report_data.get('http_status', 'unknown'),
                str(resource),
                report_data.get('client'),
                proto_version)
            log.info(log_msg)
        total_reports = len(dataset)
+        redis_pipeline = Datastores.redis.pipeline(transaction=False)
        key = REDIS_KEYS['counters']['reports_per_minute'].format(current_time)
-        Datastores.redis.incr(key, total_reports)
-        Datastores.redis.expire(key, 3600 * 24)
-        key = REDIS_KEYS['counters']['reports_per_minute_per_app'].format(
-            resource_id, current_time)
-        Datastores.redis.incr(key, total_reports)
-        Datastores.redis.expire(key, 3600 * 24)
+        redis_pipeline.incr(key, total_reports)
+        redis_pipeline.expire(key, 3600 * 24)
+        key = REDIS_KEYS['counters']['reports_per_hour_per_app'].format(
+            resource_id, current_time.replace(minute=0))
+        redis_pipeline.incr(key, total_reports)
+        redis_pipeline.expire(key, 3600 * 24 * 7)
+        redis_pipeline.sadd(
+            REDIS_KEYS['apps_that_got_new_data_per_hour'],
+            resource_id, current_time.replace(minute=0))
+        redis_pipeline.execute()

        add_reports_es(es_report_group_docs, es_report_docs)
        add_reports_slow_calls_es(es_slow_calls_docs)
        add_reports_stats_rows_es(es_reports_stats_rows)
        return True
    except Exception as exc:
        print_traceback(log)
        add_reports.retry(exc=exc)


@celery.task(queue="es", default_retry_delay=600, max_retries=144)
def add_reports_es(report_group_docs, report_docs):
    for k, v in report_group_docs.items():
        Datastores.es.bulk_index(k, 'report_group', v, id_field="_id")
    for k, v in report_docs.items():
        Datastores.es.bulk_index(k, 'report', v, id_field="_id",
                                 parent_field='_parent')


@celery.task(queue="es", default_retry_delay=600, max_retries=144)
def add_reports_slow_calls_es(es_docs):
    for k, v in es_docs.items():
        Datastores.es.bulk_index(k, 'log', v)


@celery.task(queue="es", default_retry_delay=600, max_retries=144)
def add_reports_stats_rows_es(es_docs):
    for k, v in es_docs.items():
        Datastores.es.bulk_index(k, 'log', v)


@celery.task(queue="logs", default_retry_delay=600, max_retries=144)
-def add_logs(resource_id, request, dataset, environ=None, **kwargs):
-    proto_version = request.get('protocol_version')
+def add_logs(resource_id, request_params, dataset, **kwargs):
+    proto_version = request_params.get('protocol_version')
    current_time = datetime.utcnow().replace(second=0, microsecond=0)

    try:
        es_docs = collections.defaultdict(list)
        application = ApplicationService.by_id(resource_id)
        ns_pairs = []
        for entry in dataset:
            # gather pk and ns so we can remove older versions of row later
            if entry['primary_key'] is not None:
                ns_pairs.append({"pk": entry['primary_key'],
                                 "ns": entry['namespace']})
            log_entry = Log()
            log_entry.set_data(entry, resource=application)
            log_entry._skip_ft_index = True
            application.logs.append(log_entry)
            DBSession.flush()
            # insert non pk rows first
            if entry['primary_key'] is None:
                es_docs[log_entry.partition_id].append(log_entry.es_doc())

        # 2nd pass to delete all log entries from db foe same pk/ns pair
        if ns_pairs:
            ids_to_delete = []
            es_docs = collections.defaultdict(list)
            es_docs_to_delete = collections.defaultdict(list)
            found_pkey_logs = LogService.query_by_primary_key_and_namespace(
                list_of_pairs=ns_pairs)
            log_dict = {}
            for log_entry in found_pkey_logs:
                log_key = (log_entry.primary_key, log_entry.namespace)
                if log_key not in log_dict:
                    log_dict[log_key] = []
                log_dict[log_key].append(log_entry)

            for ns, entry_list in log_dict.items():
                entry_list = sorted(entry_list, key=lambda x: x.timestamp)
                # newest row needs to be indexed in es
                log_entry = entry_list[-1]
                # delete everything from pg and ES, leave the last row in pg
                for e in entry_list[:-1]:
                    ids_to_delete.append(e.log_id)
                    es_docs_to_delete[e.partition_id].append(e.delete_hash)

                es_docs_to_delete[log_entry.partition_id].append(
                    log_entry.delete_hash)

                es_docs[log_entry.partition_id].append(log_entry.es_doc())

            if ids_to_delete:
                query = DBSession.query(Log).filter(
                    Log.log_id.in_(ids_to_delete))
                query.delete(synchronize_session=False)
            if es_docs_to_delete:
                # batch this to avoid problems with default ES bulk limits
                for es_index in es_docs_to_delete.keys():
                    for batch in in_batches(es_docs_to_delete[es_index], 20):
                        query = {'terms': {'delete_hash': batch}}

                        try:
                            Datastores.es.delete_by_query(
                                es_index, 'log', query)
                        except pyelasticsearch.ElasticHttpNotFoundError as exc:
                            msg = 'skipping index {}'.format(es_index)
                            log.info(msg)

        total_logs = len(dataset)

        log_msg = 'LOG_NEW: %s, entries: %s, proto:%s' % (
            str(application),
            total_logs,
            proto_version)
        log.info(log_msg)
        # mark_changed(session)
+        redis_pipeline = Datastores.redis.pipeline(transaction=False)
        key = REDIS_KEYS['counters']['logs_per_minute'].format(current_time)
-        Datastores.redis.incr(key, total_logs)
-        Datastores.redis.expire(key, 3600 * 24)
-        key = REDIS_KEYS['counters']['logs_per_minute_per_app'].format(
-            resource_id, current_time)
-        Datastores.redis.incr(key, total_logs)
-        Datastores.redis.expire(key, 3600 * 24)
+        redis_pipeline.incr(key, total_logs)
+        redis_pipeline.expire(key, 3600 * 24)
+        key = REDIS_KEYS['counters']['logs_per_hour_per_app'].format(
+            resource_id, current_time.replace(minute=0))
+        redis_pipeline.incr(key, total_logs)
+        redis_pipeline.expire(key, 3600 * 24 * 7)
+        redis_pipeline.sadd(
+            REDIS_KEYS['apps_that_got_new_data_per_hour'],
+            resource_id, current_time.replace(minute=0))
+        redis_pipeline.execute()
        add_logs_es(es_docs)
        return True
    except Exception as exc:
        print_traceback(log)
        add_logs.retry(exc=exc)


@celery.task(queue="es", default_retry_delay=600, max_retries=144)
def add_logs_es(es_docs):
    for k, v in es_docs.items():
        Datastores.es.bulk_index(k, 'log', v)


@celery.task(queue="metrics", default_retry_delay=600, max_retries=144)
-def add_metrics(resource_id, request, dataset, proto_version):
+def add_metrics(resource_id, request_params, dataset, proto_version):
    current_time = datetime.utcnow().replace(second=0, microsecond=0)
    try:
        application = ApplicationService.by_id_cached()(resource_id)
        application = DBSession.merge(application, load=False)
        es_docs = []
        rows = []
        for metric in dataset:
            tags = dict(metric['tags'])
            server_n = tags.get('server_name', metric['server_name']).lower()
            tags['server_name'] = server_n or 'unknown'
            new_metric = Metric(
                timestamp=metric['timestamp'],
                resource_id=application.resource_id,
                namespace=metric['namespace'],
                tags=tags)
            rows.append(new_metric)
            es_docs.append(new_metric.es_doc())
        session = DBSession()
        session.bulk_save_objects(rows)
        session.flush()

        action = 'METRICS'
        metrics_msg = '%s: %s, metrics: %s, proto:%s' % (
            action,
            str(application),
            len(dataset),
            proto_version
        )
        log.info(metrics_msg)

        mark_changed(session)
+        redis_pipeline = Datastores.redis.pipeline(transaction=False)
        key = REDIS_KEYS['counters']['metrics_per_minute'].format(current_time)
-        Datastores.redis.incr(key, len(rows))
-        Datastores.redis.expire(key, 3600 * 24)
-        key = REDIS_KEYS['counters']['metrics_per_minute_per_app'].format(
-            resource_id, current_time)
-        Datastores.redis.incr(key, len(rows))
-        Datastores.redis.expire(key, 3600 * 24)
+        redis_pipeline.incr(key, len(rows))
+        redis_pipeline.expire(key, 3600 * 24)
+        key = REDIS_KEYS['counters']['metrics_per_hour_per_app'].format(
+            resource_id, current_time.replace(minute=0))
+        redis_pipeline.incr(key, len(rows))
+        redis_pipeline.expire(key, 3600 * 24 * 7)
+        redis_pipeline.sadd(
+            REDIS_KEYS['apps_that_got_new_data_per_hour'],
+            resource_id, current_time.replace(minute=0))
+        redis_pipeline.execute()
        add_metrics_es(es_docs)
        return True
    except Exception as exc:
        print_traceback(log)
        add_metrics.retry(exc=exc)


@celery.task(queue="es", default_retry_delay=600, max_retries=144)
def add_metrics_es(es_docs):
    for doc in es_docs:
        partition = 'rcae_m_%s' % doc['timestamp'].strftime('%Y_%m_%d')
        Datastores.es.index(partition, 'log', doc)


@celery.task(queue="default", default_retry_delay=5, max_retries=2)
def check_user_report_notifications(resource_id):
    since_when = datetime.utcnow()
    try:
        request = get_current_request()
        application = ApplicationService.by_id(resource_id)
        if not application:
            return
        error_key = REDIS_KEYS['reports_to_notify_per_type_per_app'].format(
            ReportType.error, resource_id)
        slow_key = REDIS_KEYS['reports_to_notify_per_type_per_app'].format(
            ReportType.slow, resource_id)
        error_group_ids = Datastores.redis.smembers(error_key)
        slow_group_ids = Datastores.redis.smembers(slow_key)
        Datastores.redis.delete(error_key)
        Datastores.redis.delete(slow_key)
        err_gids = [int(g_id) for g_id in error_group_ids]
        slow_gids = [int(g_id) for g_id in list(slow_group_ids)]
        group_ids = err_gids + slow_gids
        occurence_dict = {}
        for g_id in group_ids:
            key = REDIS_KEYS['counters']['report_group_occurences'].format(
                g_id)
            val = Datastores.redis.get(key)
            Datastores.redis.delete(key)
            if val:
                occurence_dict[g_id] = int(val)
            else:
                occurence_dict[g_id] = 1
        report_groups = ReportGroupService.by_ids(group_ids)
        report_groups.options(sa.orm.joinedload(ReportGroup.last_report_ref))

        ApplicationService.check_for_groups_alert(
            application, 'alert', report_groups=report_groups,
            occurence_dict=occurence_dict)
        users = set([p.user for p in application.users_for_perm('view')])
        report_groups = report_groups.all()
        for user in users:
            UserService.report_notify(user, request, application,
                                      report_groups=report_groups,
                                      occurence_dict=occurence_dict)
        for group in report_groups:
            # marks report_groups as notified
            if not group.notified:
                group.notified = True
    except Exception as exc:
        print_traceback(log)
        raise


@celery.task(queue="default", default_retry_delay=5, max_retries=2)
def check_alerts(resource_id):
    since_when = datetime.utcnow()
    try:
        request = get_current_request()
        application = ApplicationService.by_id(resource_id)
        if not application:
            return
        error_key = REDIS_KEYS[
            'reports_to_notify_per_type_per_app_alerting'].format(
            ReportType.error, resource_id)
        slow_key = REDIS_KEYS[
            'reports_to_notify_per_type_per_app_alerting'].format(
            ReportType.slow, resource_id)
        error_group_ids = Datastores.redis.smembers(error_key)
        slow_group_ids = Datastores.redis.smembers(slow_key)
        Datastores.redis.delete(error_key)
        Datastores.redis.delete(slow_key)
        err_gids = [int(g_id) for g_id in error_group_ids]
        slow_gids = [int(g_id) for g_id in list(slow_group_ids)]
        group_ids = err_gids + slow_gids
        occurence_dict = {}
        for g_id in group_ids:
            key = REDIS_KEYS['counters'][
                'report_group_occurences_alerting'].format(
                g_id)
            val = Datastores.redis.get(key)
            Datastores.redis.delete(key)
            if val:
                occurence_dict[g_id] = int(val)
            else:
                occurence_dict[g_id] = 1
        report_groups = ReportGroupService.by_ids(group_ids)
        report_groups.options(sa.orm.joinedload(ReportGroup.last_report_ref))

        ApplicationService.check_for_groups_alert(
            application, 'alert', report_groups=report_groups,
            occurence_dict=occurence_dict, since_when=since_when)
    except Exception as exc:
        print_traceback(log)
        raise


@celery.task(queue="default", default_retry_delay=1, max_retries=2)
def close_alerts():
    log.warning('Checking alerts')
    since_when = datetime.utcnow()
    try:
        event_types = [Event.types['error_report_alert'],
                       Event.types['slow_report_alert'], ]
        statuses = [Event.statuses['active']]
        # get events older than 5 min
        events = EventService.by_type_and_status(
            event_types,
            statuses,
            older_than=(since_when - timedelta(minutes=5)))
        for event in events:
            # see if we can close them
            event.validate_or_close(
                since_when=(since_when - timedelta(minutes=1)))
    except Exception as exc:
        print_traceback(log)
        raise


@celery.task(queue="default", default_retry_delay=600, max_retries=144)
def update_tag_counter(tag_name, tag_value, count):
    try:
        query = DBSession.query(Tag).filter(Tag.name == tag_name).filter(
            sa.cast(Tag.value, sa.types.TEXT) == sa.cast(json.dumps(tag_value),
                                                         sa.types.TEXT))
        query.update({'times_seen': Tag.times_seen + count,
                      'last_timestamp': datetime.utcnow()},
                     synchronize_session=False)
        session = DBSession()
        mark_changed(session)
        return True
    except Exception as exc:
        print_traceback(log)
        update_tag_counter.retry(exc=exc)


@celery.task(queue="default")
def update_tag_counters():
    """
    Sets task to update counters for application tags
    """
    tags = Datastores.redis.lrange(REDIS_KEYS['seen_tag_list'], 0, -1)
    Datastores.redis.delete(REDIS_KEYS['seen_tag_list'])
    c = collections.Counter(tags)
    for t_json, count in c.items():
        tag_info = json.loads(t_json)
        update_tag_counter.delay(tag_info[0], tag_info[1], count)


@celery.task(queue="default")
def daily_digest():
    """
    Sends daily digest with top 50 error reports
    """
    request = get_current_request()
    apps = Datastores.redis.smembers(REDIS_KEYS['apps_that_had_reports'])
    Datastores.redis.delete(REDIS_KEYS['apps_that_had_reports'])
    since_when = datetime.utcnow() - timedelta(hours=8)
    log.warning('Generating daily digests')
    for resource_id in apps:
        resource_id = resource_id.decode('utf8')
        end_date = datetime.utcnow().replace(microsecond=0, second=0)
        filter_settings = {'resource': [resource_id],
                           'tags': [{'name': 'type',
                                     'value': ['error'], 'op': None}],
                           'type': 'error', 'start_date': since_when,
                           'end_date': end_date}

        reports = ReportGroupService.get_trending(
            request, filter_settings=filter_settings, limit=50)

        application = ApplicationService.by_id(resource_id)
        if application:
            users = set([p.user for p in application.users_for_perm('view')])
            for user in users:
                user.send_digest(request, application, reports=reports,
                                 since_when=since_when)


@celery.task(queue="default")
def notifications_reports():
    """
    Loop that checks redis for info and then issues new tasks to celery to
    issue notifications
    """
    apps = Datastores.redis.smembers(REDIS_KEYS['apps_that_had_reports'])
    Datastores.redis.delete(REDIS_KEYS['apps_that_had_reports'])
    for app in apps:
        log.warning('Notify for app: %s' % app)
        check_user_report_notifications.delay(app.decode('utf8'))

@celery.task(queue="default")
def alerting_reports():
    """
    Loop that checks redis for info and then issues new tasks to celery to
    perform the following:
    - which applications should have new alerts opened
    """

    apps = Datastores.redis.smembers(REDIS_KEYS['apps_that_had_reports_alerting'])
    Datastores.redis.delete(REDIS_KEYS['apps_that_had_reports_alerting'])
    for app in apps:
        log.warning('Notify for app: %s' % app)
        check_alerts.delay(app.decode('utf8'))


@celery.task(queue="default", soft_time_limit=3600 * 4,
             hard_time_limit=3600 * 4, max_retries=144)
def logs_cleanup(resource_id, filter_settings):
    request = get_current_request()
    request.tm.begin()
    es_query = {
        "_source": False,
        "size": 5000,
        "query": {
            "filtered": {
                "filter": {
                    "and": [{"term": {"resource_id": resource_id}}]
                }
            }
        }
    }

    query = DBSession.query(Log).filter(Log.resource_id == resource_id)
    if filter_settings['namespace']:
        query = query.filter(Log.namespace == filter_settings['namespace'][0])
        es_query['query']['filtered']['filter']['and'].append(
            {"term": {"namespace": filter_settings['namespace'][0]}}
        )
    query.delete(synchronize_session=False)
    request.tm.commit()
    result = request.es_conn.search(es_query, index='rcae_l_*',
                                    doc_type='log', es_scroll='1m',
                                    es_search_type='scan')
    scroll_id = result['_scroll_id']
    while True:
        log.warning('log_cleanup, app:{} ns:{} batch'.format(
            resource_id,
            filter_settings['namespace']
        ))
        es_docs_to_delete = []
        result = request.es_conn.send_request(
            'POST', ['_search', 'scroll'],
            body=scroll_id, query_params={"scroll": '1m'})
        scroll_id = result['_scroll_id']
        if not result['hits']['hits']:
            break
        for doc in result['hits']['hits']:
            es_docs_to_delete.append({"id": doc['_id'],
                                      "index": doc['_index']})

        for batch in in_batches(es_docs_to_delete, 10):
            Datastores.es.bulk([Datastores.es.delete_op(doc_type='log',
                                                        **to_del)
                                for to_del in batch])
@@ -1,83 +1,86 b''
# -*- coding: utf-8 -*-

# Copyright (C) 2010-2016 RhodeCode GmbH
#
# This program is free software: you can redistribute it and/or modify
# it under the terms of the GNU Affero General Public License, version 3
# (only), as published by the Free Software Foundation.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU Affero General Public License
# along with this program. If not, see <http://www.gnu.org/licenses/>.
#
# This program is dual-licensed. If you wish to learn more about the
# AppEnlight Enterprise Edition, including its added features, Support
# services, and proprietary license terms, please see
# https://rhodecode.com/licenses/

import datetime
import logging

from pyramid.httpexceptions import HTTPForbidden, HTTPTooManyRequests

from appenlight.models import Datastores
from appenlight.models.services.config import ConfigService
from appenlight.lib.redis_keys import REDIS_KEYS

log = logging.getLogger(__name__)


def rate_limiting(request, resource, section, to_increment=1):
    tsample = datetime.datetime.utcnow().replace(second=0, microsecond=0)
    key = REDIS_KEYS['rate_limits'][section].format(tsample,
                                                    resource.resource_id)
-    current_count = Datastores.redis.incr(key, to_increment)
-    Datastores.redis.expire(key, 3600 * 24)
+    redis_pipeline = request.registry.redis_conn.pipeline()
+    redis_pipeline.incr(key, to_increment)
+    redis_pipeline.expire(key, 3600 * 24)
+    results = redis_pipeline.execute()
+    current_count = results[0]
    config = ConfigService.by_key_and_section(section, 'global')
    limit = config.value if config else 1000
    if current_count > int(limit):
        log.info('RATE LIMITING: {}: {}, {}'.format(
            section, resource, current_count))
        abort_msg = 'Rate limits are in effect for this application'
        raise HTTPTooManyRequests(abort_msg,
                                  headers={'X-AppEnlight': abort_msg})


def check_cors(request, application, should_return=True):
    """
    Performs a check and validation if request comes from authorized domain for
    application, otherwise return 403
    """
    origin_found = False
    origin = request.headers.get('Origin')
    if should_return:
        log.info('CORS for %s' % origin)
    if not origin:
        return False
    for domain in application.domains.split('\n'):
        if domain in origin:
            origin_found = True
    if origin_found:
        request.response.headers.add('Access-Control-Allow-Origin', origin)
        request.response.headers.add('XDomainRequestAllowed', '1')
        request.response.headers.add('Access-Control-Allow-Methods',
                                     'GET, POST, OPTIONS')
        request.response.headers.add('Access-Control-Allow-Headers',
                                     'Accept-Encoding, Accept-Language, '
                                     'Content-Type, '
                                     'Depth, User-Agent, X-File-Size, '
                                     'X-Requested-With, If-Modified-Since, '
                                     'X-File-Name, '
                                     'Cache-Control, Host, Pragma, Accept, '
                                     'Origin, Connection, '
                                     'Referer, Cookie, '
                                     'X-appenlight-public-api-key, '
                                     'x-appenlight-public-api-key')
        request.response.headers.add('Access-Control-Max-Age', '86400')
        return request.response
    else:
        return HTTPForbidden()
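In rate_limiting the counter value is now read back from the pipeline rather than from a direct INCR call: execute() returns one result per queued command, in queueing order, so the INCR result is the first element. A small illustrative sketch (the client construction and key name are assumptions, not the application's code):

    import redis

    client = redis.StrictRedis()
    pipe = client.pipeline()
    pipe.incr('rate_limit:example:2016-01-01 10:00', 1)            # results[0] -> new count
    pipe.expire('rate_limit:example:2016-01-01 10:00', 3600 * 24)  # results[1] -> bool
    results = pipe.execute()
    current_count = results[0]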
@@ -1,67 +1,68 b''
1 # -*- coding: utf-8 -*-
1 # -*- coding: utf-8 -*-
2
2
3 # Copyright (C) 2010-2016 RhodeCode GmbH
3 # Copyright (C) 2010-2016 RhodeCode GmbH
4 #
4 #
5 # This program is free software: you can redistribute it and/or modify
5 # This program is free software: you can redistribute it and/or modify
6 # it under the terms of the GNU Affero General Public License, version 3
6 # it under the terms of the GNU Affero General Public License, version 3
7 # (only), as published by the Free Software Foundation.
7 # (only), as published by the Free Software Foundation.
8 #
8 #
9 # This program is distributed in the hope that it will be useful,
9 # This program is distributed in the hope that it will be useful,
10 # but WITHOUT ANY WARRANTY; without even the implied warranty of
10 # but WITHOUT ANY WARRANTY; without even the implied warranty of
11 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
11 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 # GNU General Public License for more details.
12 # GNU General Public License for more details.
13 #
13 #
14 # You should have received a copy of the GNU Affero General Public License
14 # You should have received a copy of the GNU Affero General Public License
15 # along with this program. If not, see <http://www.gnu.org/licenses/>.
15 # along with this program. If not, see <http://www.gnu.org/licenses/>.
16 #
16 #
17 # This program is dual-licensed. If you wish to learn more about the
17 # This program is dual-licensed. If you wish to learn more about the
18 # AppEnlight Enterprise Edition, including its added features, Support
18 # AppEnlight Enterprise Edition, including its added features, Support
19 # services, and proprietary license terms, please see
19 # services, and proprietary license terms, please see
20 # https://rhodecode.com/licenses/
20 # https://rhodecode.com/licenses/
21
21
22 BASE = 'appenlight:data:{}'
22 BASE = 'appenlight:data:{}'
23
23
24 REDIS_KEYS = {
24 REDIS_KEYS = {
25 'tasks': {
25 'tasks': {
26 'add_reports_lock': BASE.format('add_reports_lock:{}'),
26 'add_reports_lock': BASE.format('add_reports_lock:{}'),
27 'add_logs_lock': BASE.format('add_logs_lock:{}'),
27 'add_logs_lock': BASE.format('add_logs_lock:{}'),
28 },
28 },
29 'counters': {
29 'counters': {
30 'reports_per_minute': BASE.format('reports_per_minute:{}'),
30 'reports_per_minute': BASE.format('reports_per_minute:{}'),
31 'reports_per_minute_per_app': BASE.format(
31 'reports_per_hour_per_app': BASE.format(
32 'reports_per_minute_per_app:{}:{}'),
32 'reports_per_hour_per_app:{}:{}'),
33 'reports_per_type': BASE.format('reports_per_type:{}'),
33 'reports_per_type': BASE.format('reports_per_type:{}'),
34 'logs_per_minute': BASE.format('logs_per_minute:{}'),
34 'logs_per_minute': BASE.format('logs_per_minute:{}'),
35 'logs_per_minute_per_app': BASE.format(
35 'logs_per_hour_per_app': BASE.format(
36 'logs_per_minute_per_app:{}:{}'),
36 'logs_per_hour_per_app:{}:{}'),
37 'metrics_per_minute': BASE.format('metrics_per_minute:{}'),
37 'metrics_per_minute': BASE.format('metrics_per_minute:{}'),
38 'metrics_per_minute_per_app': BASE.format(
38 'metrics_per_hour_per_app': BASE.format(
39 'metrics_per_minute_per_app:{}:{}'),
39 'metrics_per_hour_per_app:{}:{}'),
40 'report_group_occurences': BASE.format('report_group_occurences:{}'),
40 'report_group_occurences': BASE.format('report_group_occurences:{}'),
41 'report_group_occurences_alerting': BASE.format(
41 'report_group_occurences_alerting': BASE.format(
42 'report_group_occurences_alerting:{}'),
42 'report_group_occurences_alerting:{}'),
43 'report_group_occurences_10th': BASE.format(
43 'report_group_occurences_10th': BASE.format(
44 'report_group_occurences_10th:{}'),
44 'report_group_occurences_10th:{}'),
45 'report_group_occurences_100th': BASE.format(
45 'report_group_occurences_100th': BASE.format(
46 'report_group_occurences_100th:{}'),
46 'report_group_occurences_100th:{}'),
47 },
47 },
48 'rate_limits': {
48 'rate_limits': {
49 'per_application_reports_rate_limit': BASE.format(
49 'per_application_reports_rate_limit': BASE.format(
50 'per_application_reports_limit:{}:{}'),
50 'per_application_reports_limit:{}:{}'),
51 'per_application_logs_rate_limit': BASE.format(
51 'per_application_logs_rate_limit': BASE.format(
52 'per_application_logs_rate_limit:{}:{}'),
52 'per_application_logs_rate_limit:{}:{}'),
53 'per_application_metrics_rate_limit': BASE.format(
53 'per_application_metrics_rate_limit': BASE.format(
54 'per_application_metrics_rate_limit:{}:{}'),
54 'per_application_metrics_rate_limit:{}:{}'),
55 },
55 },
56 'apps_that_got_new_data_per_hour': BASE.format('apps_that_got_new_data_per_hour'),
56 'apps_that_had_reports': BASE.format('apps_that_had_reports'),
57 'apps_that_had_reports': BASE.format('apps_that_had_reports'),
57 'apps_that_had_error_reports': BASE.format('apps_that_had_error_reports'),
58 'apps_that_had_error_reports': BASE.format('apps_that_had_error_reports'),
58 'apps_that_had_reports_alerting': BASE.format(
59 'apps_that_had_reports_alerting': BASE.format(
59 'apps_that_had_reports_alerting'),
60 'apps_that_had_reports_alerting'),
60 'apps_that_had_error_reports_alerting': BASE.format(
61 'apps_that_had_error_reports_alerting': BASE.format(
61 'apps_that_had_error_reports_alerting'),
62 'apps_that_had_error_reports_alerting'),
62 'reports_to_notify_per_type_per_app': BASE.format(
63 'reports_to_notify_per_type_per_app': BASE.format(
63 'reports_to_notify_per_type_per_app:{}:{}'),
64 'reports_to_notify_per_type_per_app:{}:{}'),
64 'reports_to_notify_per_type_per_app_alerting': BASE.format(
65 'reports_to_notify_per_type_per_app_alerting': BASE.format(
65 'reports_to_notify_per_type_per_app_alerting:{}:{}'),
66 'reports_to_notify_per_type_per_app_alerting:{}:{}'),
66 'seen_tag_list': BASE.format('seen_tag_list')
67 'seen_tag_list': BASE.format('seen_tag_list')
67 }
68 }
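Every value in REDIS_KEYS is a str.format template under the appenlight:data: namespace rather than a finished key; callers interpolate the remaining placeholders, typically a timestamp and, for the *_per_app counters, a resource id. A small illustrative sketch (the resource id, timestamp and its resolution are invented):

# Illustrative only: how the templates above become concrete Redis keys.
from datetime import datetime

from appenlight.lib.redis_keys import REDIS_KEYS

now = datetime.utcnow().replace(second=0, microsecond=0)
minute_key = REDIS_KEYS['counters']['reports_per_minute'].format(now)
# e.g. 'appenlight:data:reports_per_minute:2016-05-01 12:34:00'
per_app_key = REDIS_KEYS['counters']['reports_per_hour_per_app'].format(1, now)
# e.g. 'appenlight:data:reports_per_hour_per_app:1:2016-05-01 12:34:00'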
@@ -1,267 +1,268 b''
1 # -*- coding: utf-8 -*-
1 # -*- coding: utf-8 -*-
2
2
3 # Copyright (C) 2010-2016 RhodeCode GmbH
3 # Copyright (C) 2010-2016 RhodeCode GmbH
4 #
4 #
5 # This program is free software: you can redistribute it and/or modify
5 # This program is free software: you can redistribute it and/or modify
6 # it under the terms of the GNU Affero General Public License, version 3
6 # it under the terms of the GNU Affero General Public License, version 3
7 # (only), as published by the Free Software Foundation.
7 # (only), as published by the Free Software Foundation.
8 #
8 #
9 # This program is distributed in the hope that it will be useful,
9 # This program is distributed in the hope that it will be useful,
10 # but WITHOUT ANY WARRANTY; without even the implied warranty of
10 # but WITHOUT ANY WARRANTY; without even the implied warranty of
11 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
11 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 # GNU General Public License for more details.
12 # GNU General Public License for more details.
13 #
13 #
14 # You should have received a copy of the GNU Affero General Public License
14 # You should have received a copy of the GNU Affero General Public License
15 # along with this program. If not, see <http://www.gnu.org/licenses/>.
15 # along with this program. If not, see <http://www.gnu.org/licenses/>.
16 #
16 #
17 # This program is dual-licensed. If you wish to learn more about the
17 # This program is dual-licensed. If you wish to learn more about the
18 # AppEnlight Enterprise Edition, including its added features, Support
18 # AppEnlight Enterprise Edition, including its added features, Support
19 # services, and proprietary license terms, please see
19 # services, and proprietary license terms, please see
20 # https://rhodecode.com/licenses/
20 # https://rhodecode.com/licenses/
21
21
22 import logging
22 import logging
23 import sqlalchemy as sa
23 import sqlalchemy as sa
24
24
25 from datetime import datetime
25 from datetime import datetime
26
26
27 from pyramid.threadlocal import get_current_request
27 from pyramid.threadlocal import get_current_request
28 from sqlalchemy.dialects.postgresql import JSON
28 from sqlalchemy.dialects.postgresql import JSON
29 from ziggurat_foundations.models.base import BaseModel
29 from ziggurat_foundations.models.base import BaseModel
30
30
31 from appenlight.models import Base, get_db_session, Datastores
31 from appenlight.models import Base, get_db_session, Datastores
32 from appenlight.lib.enums import ReportType
32 from appenlight.lib.enums import ReportType
33 from appenlight.lib.rule import Rule
33 from appenlight.lib.rule import Rule
34 from appenlight.lib.redis_keys import REDIS_KEYS
34 from appenlight.lib.redis_keys import REDIS_KEYS
35 from appenlight.models.report import REPORT_TYPE_MATRIX
35 from appenlight.models.report import REPORT_TYPE_MATRIX
36
36
37 log = logging.getLogger(__name__)
37 log = logging.getLogger(__name__)
38
38
39
39
40 class ReportGroup(Base, BaseModel):
40 class ReportGroup(Base, BaseModel):
41 __tablename__ = 'reports_groups'
41 __tablename__ = 'reports_groups'
42 __table_args__ = {'implicit_returning': False}
42 __table_args__ = {'implicit_returning': False}
43
43
44 id = sa.Column(sa.BigInteger(), nullable=False, primary_key=True)
44 id = sa.Column(sa.BigInteger(), nullable=False, primary_key=True)
45 resource_id = sa.Column(sa.Integer(),
45 resource_id = sa.Column(sa.Integer(),
46 sa.ForeignKey('applications.resource_id',
46 sa.ForeignKey('applications.resource_id',
47 onupdate='CASCADE',
47 onupdate='CASCADE',
48 ondelete='CASCADE'),
48 ondelete='CASCADE'),
49 nullable=False,
49 nullable=False,
50 index=True)
50 index=True)
51 priority = sa.Column(sa.Integer, nullable=False, index=True, default=5,
51 priority = sa.Column(sa.Integer, nullable=False, index=True, default=5,
52 server_default='5')
52 server_default='5')
53 first_timestamp = sa.Column(sa.DateTime(), default=datetime.utcnow,
53 first_timestamp = sa.Column(sa.DateTime(), default=datetime.utcnow,
54 server_default=sa.func.now())
54 server_default=sa.func.now())
55 last_timestamp = sa.Column(sa.DateTime(), default=datetime.utcnow,
55 last_timestamp = sa.Column(sa.DateTime(), default=datetime.utcnow,
56 server_default=sa.func.now())
56 server_default=sa.func.now())
57 error = sa.Column(sa.UnicodeText(), index=True)
57 error = sa.Column(sa.UnicodeText(), index=True)
58 grouping_hash = sa.Column(sa.String(40), default='')
58 grouping_hash = sa.Column(sa.String(40), default='')
59 triggered_postprocesses_ids = sa.Column(JSON(), nullable=False,
59 triggered_postprocesses_ids = sa.Column(JSON(), nullable=False,
60 default=list)
60 default=list)
61 report_type = sa.Column(sa.Integer, default=1)
61 report_type = sa.Column(sa.Integer, default=1)
62 total_reports = sa.Column(sa.Integer, default=1)
62 total_reports = sa.Column(sa.Integer, default=1)
63 last_report = sa.Column(sa.Integer)
63 last_report = sa.Column(sa.Integer)
64 occurences = sa.Column(sa.Integer, default=1)
64 occurences = sa.Column(sa.Integer, default=1)
65 average_duration = sa.Column(sa.Float, default=0)
65 average_duration = sa.Column(sa.Float, default=0)
66 summed_duration = sa.Column(sa.Float, default=0)
66 summed_duration = sa.Column(sa.Float, default=0)
67 read = sa.Column(sa.Boolean(), index=True, default=False)
67 read = sa.Column(sa.Boolean(), index=True, default=False)
68 fixed = sa.Column(sa.Boolean(), index=True, default=False)
68 fixed = sa.Column(sa.Boolean(), index=True, default=False)
69 notified = sa.Column(sa.Boolean(), index=True, default=False)
69 notified = sa.Column(sa.Boolean(), index=True, default=False)
70 public = sa.Column(sa.Boolean(), index=True, default=False)
70 public = sa.Column(sa.Boolean(), index=True, default=False)
71
71
72 reports = sa.orm.relationship('Report',
72 reports = sa.orm.relationship('Report',
73 lazy='dynamic',
73 lazy='dynamic',
74 backref='report_group',
74 backref='report_group',
75 cascade="all, delete-orphan",
75 cascade="all, delete-orphan",
76 passive_deletes=True,
76 passive_deletes=True,
77 passive_updates=True, )
77 passive_updates=True, )
78
78
79 comments = sa.orm.relationship('ReportComment',
79 comments = sa.orm.relationship('ReportComment',
80 lazy='dynamic',
80 lazy='dynamic',
81 backref='report',
81 backref='report',
82 cascade="all, delete-orphan",
82 cascade="all, delete-orphan",
83 passive_deletes=True,
83 passive_deletes=True,
84 passive_updates=True,
84 passive_updates=True,
85 order_by="ReportComment.comment_id")
85 order_by="ReportComment.comment_id")
86
86
87 assigned_users = sa.orm.relationship('User',
87 assigned_users = sa.orm.relationship('User',
88 backref=sa.orm.backref(
88 backref=sa.orm.backref(
89 'assigned_reports_relation',
89 'assigned_reports_relation',
90 lazy='dynamic',
90 lazy='dynamic',
91 order_by=sa.desc(
91 order_by=sa.desc(
92 "reports_groups.id")
92 "reports_groups.id")
93 ),
93 ),
94 passive_deletes=True,
94 passive_deletes=True,
95 passive_updates=True,
95 passive_updates=True,
96 secondary='reports_assignments',
96 secondary='reports_assignments',
97 order_by="User.user_name")
97 order_by="User.user_name")
98
98
99 stats = sa.orm.relationship('ReportStat',
99 stats = sa.orm.relationship('ReportStat',
100 lazy='dynamic',
100 lazy='dynamic',
101 backref='report',
101 backref='report',
102 passive_deletes=True,
102 passive_deletes=True,
103 passive_updates=True, )
103 passive_updates=True, )
104
104
105 last_report_ref = sa.orm.relationship('Report',
105 last_report_ref = sa.orm.relationship('Report',
106 uselist=False,
106 uselist=False,
107 primaryjoin="ReportGroup.last_report "
107 primaryjoin="ReportGroup.last_report "
108 "== Report.id",
108 "== Report.id",
109 foreign_keys="Report.id",
109 foreign_keys="Report.id",
110 cascade="all, delete-orphan",
110 cascade="all, delete-orphan",
111 passive_deletes=True,
111 passive_deletes=True,
112 passive_updates=True, )
112 passive_updates=True, )
113
113
114 def __repr__(self):
114 def __repr__(self):
115 return '<ReportGroup id:{}>'.format(self.id)
115 return '<ReportGroup id:{}>'.format(self.id)
116
116
117 def get_report(self, report_id=None, public=False):
117 def get_report(self, report_id=None, public=False):
118 """
118 """
119 Gets report with specific id or latest report if id was not specified
119 Gets report with specific id or latest report if id was not specified
120 """
120 """
121 from .report import Report
121 from .report import Report
122
122
123 if not report_id:
123 if not report_id:
124 return self.last_report_ref
124 return self.last_report_ref
125 else:
125 else:
126 return self.reports.filter(Report.id == report_id).first()
126 return self.reports.filter(Report.id == report_id).first()
127
127
128 def get_public_url(self, request, _app_url=None):
128 def get_public_url(self, request, _app_url=None):
129 url = request.route_url('/', _app_url=_app_url)
129 url = request.route_url('/', _app_url=_app_url)
130 return (url + 'ui/report/%s') % self.id
130 return (url + 'ui/report/%s') % self.id
131
131
132 def run_postprocessing(self, report):
132 def run_postprocessing(self, report):
133 """
133 """
134 Alters report group priority based on postprocessing configuration
134 Alters report group priority based on postprocessing configuration
135 """
135 """
136 request = get_current_request()
136 request = get_current_request()
137 get_db_session(None, self).flush()
137 get_db_session(None, self).flush()
138 for action in self.application.postprocess_conf:
138 for action in self.application.postprocess_conf:
139 get_db_session(None, self).flush()
139 get_db_session(None, self).flush()
140 rule_obj = Rule(action.rule, REPORT_TYPE_MATRIX)
140 rule_obj = Rule(action.rule, REPORT_TYPE_MATRIX)
141 report_dict = report.get_dict(request)
141 report_dict = report.get_dict(request)
142 # if was not processed yet
142 # if was not processed yet
143 if (rule_obj.match(report_dict) and
143 if (rule_obj.match(report_dict) and
144 action.pkey not in self.triggered_postprocesses_ids):
144 action.pkey not in self.triggered_postprocesses_ids):
145 action.postprocess(self)
145 action.postprocess(self)
146 # this way sqla can track mutation of list
146 # this way sqla can track mutation of list
147 self.triggered_postprocesses_ids = \
147 self.triggered_postprocesses_ids = \
148 self.triggered_postprocesses_ids + [action.pkey]
148 self.triggered_postprocesses_ids + [action.pkey]
149
149
150 get_db_session(None, self).flush()
150 get_db_session(None, self).flush()
151 # do not go out of bounds
151 # do not go out of bounds
152 if self.priority < 1:
152 if self.priority < 1:
153 self.priority = 1
153 self.priority = 1
154 if self.priority > 10:
154 if self.priority > 10:
155 self.priority = 10
155 self.priority = 10
156
156
157 def get_dict(self, request):
157 def get_dict(self, request):
158 instance_dict = super(ReportGroup, self).get_dict()
158 instance_dict = super(ReportGroup, self).get_dict()
159 instance_dict['server_name'] = self.get_report().tags.get(
159 instance_dict['server_name'] = self.get_report().tags.get(
160 'server_name')
160 'server_name')
161 instance_dict['view_name'] = self.get_report().tags.get('view_name')
161 instance_dict['view_name'] = self.get_report().tags.get('view_name')
162 instance_dict['resource_name'] = self.application.resource_name
162 instance_dict['resource_name'] = self.application.resource_name
163 instance_dict['report_type'] = self.get_report().report_type
163 instance_dict['report_type'] = self.get_report().report_type
164 instance_dict['url_path'] = self.get_report().url_path
164 instance_dict['url_path'] = self.get_report().url_path
165 instance_dict['front_url'] = self.get_report().get_public_url(request)
165 instance_dict['front_url'] = self.get_report().get_public_url(request)
166 del instance_dict['triggered_postprocesses_ids']
166 del instance_dict['triggered_postprocesses_ids']
167 return instance_dict
167 return instance_dict
168
168
169 def es_doc(self):
169 def es_doc(self):
170 return {
170 return {
171 '_id': str(self.id),
171 '_id': str(self.id),
172 'pg_id': str(self.id),
172 'pg_id': str(self.id),
173 'resource_id': self.resource_id,
173 'resource_id': self.resource_id,
174 'error': self.error,
174 'error': self.error,
175 'fixed': self.fixed,
175 'fixed': self.fixed,
176 'public': self.public,
176 'public': self.public,
177 'read': self.read,
177 'read': self.read,
178 'priority': self.priority,
178 'priority': self.priority,
179 'occurences': self.occurences,
179 'occurences': self.occurences,
180 'average_duration': self.average_duration,
180 'average_duration': self.average_duration,
181 'summed_duration': self.summed_duration,
181 'summed_duration': self.summed_duration,
182 'first_timestamp': self.first_timestamp,
182 'first_timestamp': self.first_timestamp,
183 'last_timestamp': self.last_timestamp
183 'last_timestamp': self.last_timestamp
184 }
184 }
185
185
186 def set_notification_info(self, notify_10=False, notify_100=False):
186 def set_notification_info(self, notify_10=False, notify_100=False):
187 """
187 """
188 Update redis notification maps for notification job
188 Update redis notification maps for notification job
189 """
189 """
190 current_time = datetime.utcnow().replace(second=0, microsecond=0)
190 current_time = datetime.utcnow().replace(second=0, microsecond=0)
191 # global app counter
191 # global app counter
192 key = REDIS_KEYS['counters']['reports_per_type'].format(
192 key = REDIS_KEYS['counters']['reports_per_type'].format(
193 self.report_type, current_time)
193 self.report_type, current_time)
194 Datastores.redis.incr(key)
194 redis_pipeline = Datastores.redis.pipeline()
195 Datastores.redis.expire(key, 3600 * 24)
195 redis_pipeline.incr(key)
196 redis_pipeline.expire(key, 3600 * 24)
196 # detailed app notification for alerts and notifications
197 # detailed app notification for alerts and notifications
197 Datastores.redis.sadd(REDIS_KEYS['apps_that_had_reports'],
198 redis_pipeline.sadd(
198 self.resource_id)
199 REDIS_KEYS['apps_that_had_reports'], self.resource_id)
199 Datastores.redis.sadd(REDIS_KEYS['apps_that_had_reports_alerting'],
200 redis_pipeline.sadd(
200 self.resource_id)
201 REDIS_KEYS['apps_that_had_reports_alerting'], self.resource_id)
201 # only notify for exceptions here
202 # only notify for exceptions here
202 if self.report_type == ReportType.error:
203 if self.report_type == ReportType.error:
203 Datastores.redis.sadd(
204 redis_pipeline.sadd(
204 REDIS_KEYS['apps_that_had_reports'],
205 REDIS_KEYS['apps_that_had_reports'], self.resource_id)
205 self.resource_id)
206 redis_pipeline.sadd(
206 Datastores.redis.sadd(
207 REDIS_KEYS['apps_that_had_error_reports_alerting'],
207 REDIS_KEYS['apps_that_had_error_reports_alerting'],
208 self.resource_id)
208 self.resource_id)
209 key = REDIS_KEYS['counters']['report_group_occurences'].format(self.id)
209 key = REDIS_KEYS['counters']['report_group_occurences'].format(self.id)
210 Datastores.redis.incr(key)
210 redis_pipeline.incr(key)
211 Datastores.redis.expire(key, 3600 * 24)
211 redis_pipeline.expire(key, 3600 * 24)
212 key = REDIS_KEYS['counters']['report_group_occurences_alerting'].format(self.id)
212 key = REDIS_KEYS['counters']['report_group_occurences_alerting'].format(self.id)
213 Datastores.redis.incr(key)
213 redis_pipeline.incr(key)
214 Datastores.redis.expire(key, 3600 * 24)
214 redis_pipeline.expire(key, 3600 * 24)
215
215
216 if notify_10:
216 if notify_10:
217 key = REDIS_KEYS['counters'][
217 key = REDIS_KEYS['counters'][
218 'report_group_occurences_10th'].format(self.id)
218 'report_group_occurences_10th'].format(self.id)
219 Datastores.redis.setex(key, 3600 * 24, 1)
219 redis_pipeline.setex(key, 3600 * 24, 1)
220 if notify_100:
220 if notify_100:
221 key = REDIS_KEYS['counters'][
221 key = REDIS_KEYS['counters'][
222 'report_group_occurences_100th'].format(self.id)
222 'report_group_occurences_100th'].format(self.id)
223 Datastores.redis.setex(key, 3600 * 24, 1)
223 redis_pipeline.setex(key, 3600 * 24, 1)
224
224
225 key = REDIS_KEYS['reports_to_notify_per_type_per_app'].format(
225 key = REDIS_KEYS['reports_to_notify_per_type_per_app'].format(
226 self.report_type, self.resource_id)
226 self.report_type, self.resource_id)
227 Datastores.redis.sadd(key, self.id)
227 redis_pipeline.sadd(key, self.id)
228 Datastores.redis.expire(key, 3600 * 24)
228 redis_pipeline.expire(key, 3600 * 24)
229 key = REDIS_KEYS['reports_to_notify_per_type_per_app_alerting'].format(
229 key = REDIS_KEYS['reports_to_notify_per_type_per_app_alerting'].format(
230 self.report_type, self.resource_id)
230 self.report_type, self.resource_id)
231 Datastores.redis.sadd(key, self.id)
231 redis_pipeline.sadd(key, self.id)
232 Datastores.redis.expire(key, 3600 * 24)
232 redis_pipeline.expire(key, 3600 * 24)
233 redis_pipeline.execute()
233
234
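set_notification_info is the core of the pipeline cleanup: every incr/expire/sadd/setex that used to be issued one by one against Datastores.redis is now queued on a single pipeline and flushed with one execute(), so the notification bookkeeping costs one network round-trip instead of a dozen. The same pattern in isolation, with a standalone redis-py client (connection settings and key values are placeholders):

# Stand-alone sketch of the pipeline pattern adopted above; host, db and the
# concrete key values are invented for illustration.
import redis

client = redis.StrictRedis(host='localhost', port=6379, db=0)
pipe = client.pipeline()
key = 'appenlight:data:report_group_occurences:123'
pipe.incr(key)
pipe.expire(key, 3600 * 24)
pipe.sadd('appenlight:data:apps_that_had_reports', 1)
pipe.setex('appenlight:data:report_group_occurences_10th:123', 3600 * 24, 1)
results = pipe.execute()  # all queued commands go out in one round-trip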
234 @property
235 @property
235 def partition_id(self):
236 def partition_id(self):
236 return 'rcae_r_%s' % self.first_timestamp.strftime('%Y_%m')
237 return 'rcae_r_%s' % self.first_timestamp.strftime('%Y_%m')
237
238
238
239
239 def after_insert(mapper, connection, target):
240 def after_insert(mapper, connection, target):
240 if not hasattr(target, '_skip_ft_index'):
241 if not hasattr(target, '_skip_ft_index'):
241 data = target.es_doc()
242 data = target.es_doc()
242 data.pop('_id', None)
243 data.pop('_id', None)
243 Datastores.es.index(target.partition_id, 'report_group',
244 Datastores.es.index(target.partition_id, 'report_group',
244 data, id=target.id)
245 data, id=target.id)
245
246
246
247
247 def after_update(mapper, connection, target):
248 def after_update(mapper, connection, target):
248 if not hasattr(target, '_skip_ft_index'):
249 if not hasattr(target, '_skip_ft_index'):
249 data = target.es_doc()
250 data = target.es_doc()
250 data.pop('_id', None)
251 data.pop('_id', None)
251 Datastores.es.index(target.partition_id, 'report_group',
252 Datastores.es.index(target.partition_id, 'report_group',
252 data, id=target.id)
253 data, id=target.id)
253
254
254
255
255 def after_delete(mapper, connection, target):
256 def after_delete(mapper, connection, target):
256 query = {'term': {'group_id': target.id}}
257 query = {'term': {'group_id': target.id}}
257 # TODO: routing seems unnecessary, need to test a bit more
258 # TODO: routing seems unnecessary, need to test a bit more
258 #Datastores.es.delete_by_query(target.partition_id, 'report', query,
259 #Datastores.es.delete_by_query(target.partition_id, 'report', query,
259 # query_params={'routing':str(target.id)})
260 # query_params={'routing':str(target.id)})
260 Datastores.es.delete_by_query(target.partition_id, 'report', query)
261 Datastores.es.delete_by_query(target.partition_id, 'report', query)
261 query = {'term': {'pg_id': target.id}}
262 query = {'term': {'pg_id': target.id}}
262 Datastores.es.delete_by_query(target.partition_id, 'report_group', query)
263 Datastores.es.delete_by_query(target.partition_id, 'report_group', query)
263
264
264
265
265 sa.event.listen(ReportGroup, 'after_insert', after_insert)
266 sa.event.listen(ReportGroup, 'after_insert', after_insert)
266 sa.event.listen(ReportGroup, 'after_update', after_update)
267 sa.event.listen(ReportGroup, 'after_update', after_update)
267 sa.event.listen(ReportGroup, 'after_delete', after_delete)
268 sa.event.listen(ReportGroup, 'after_delete', after_delete)
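The three listeners above keep Elasticsearch in sync with the reports_groups table: on insert and update the group's es_doc() (minus its '_id') is written to the monthly partition index, and on delete the matching report and report_group documents are removed by query. For a group first seen in March 2016 the insert listener ends up performing roughly the call below; all field values are invented.

# Illustrative payload for the after_insert listener above; values invented.
from appenlight.models import Datastores

doc = {
    'pg_id': '1234',
    'resource_id': 1,
    'error': 'ValueError: boom',
    'fixed': False,
    'public': False,
    'read': False,
    'priority': 5,
    'occurences': 1,
    'average_duration': 0.0,
    'summed_duration': 0.0,
    'first_timestamp': '2016-03-01T10:00:00',
    'last_timestamp': '2016-03-01T10:00:00',
}
# partition_id -> 'rcae_r_2016_03' for a first_timestamp in March 2016
Datastores.es.index('rcae_r_2016_03', 'report_group', doc, id=1234)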
@@ -1,200 +1,199 b''
1 # -*- coding: utf-8 -*-
1 # -*- coding: utf-8 -*-
2
2
3 # Copyright (C) 2010-2016 RhodeCode GmbH
3 # Copyright (C) 2010-2016 RhodeCode GmbH
4 #
4 #
5 # This program is free software: you can redistribute it and/or modify
5 # This program is free software: you can redistribute it and/or modify
6 # it under the terms of the GNU Affero General Public License, version 3
6 # it under the terms of the GNU Affero General Public License, version 3
7 # (only), as published by the Free Software Foundation.
7 # (only), as published by the Free Software Foundation.
8 #
8 #
9 # This program is distributed in the hope that it will be useful,
9 # This program is distributed in the hope that it will be useful,
10 # but WITHOUT ANY WARRANTY; without even the implied warranty of
10 # but WITHOUT ANY WARRANTY; without even the implied warranty of
11 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
11 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 # GNU General Public License for more details.
12 # GNU General Public License for more details.
13 #
13 #
14 # You should have received a copy of the GNU Affero General Public License
14 # You should have received a copy of the GNU Affero General Public License
15 # along with this program. If not, see <http://www.gnu.org/licenses/>.
15 # along with this program. If not, see <http://www.gnu.org/licenses/>.
16 #
16 #
17 # This program is dual-licensed. If you wish to learn more about the
17 # This program is dual-licensed. If you wish to learn more about the
18 # AppEnlight Enterprise Edition, including its added features, Support
18 # AppEnlight Enterprise Edition, including its added features, Support
19 # services, and proprietary license terms, please see
19 # services, and proprietary license terms, please see
20 # https://rhodecode.com/licenses/
20 # https://rhodecode.com/licenses/
21
21
22 import logging
22 import logging
23 import os
23 import os
24 import pkg_resources
24 import pkg_resources
25
25
26 from datetime import datetime, timedelta
26 from datetime import datetime, timedelta
27
27
28 import psutil
28 import psutil
29 import redis
29 import redis
30
30
31 from pyramid.view import view_config
31 from pyramid.view import view_config
32 from appenlight.models import DBSession
32 from appenlight.models import DBSession
33 from appenlight.models import Datastores
33 from appenlight.models import Datastores
34 from appenlight.lib.redis_keys import REDIS_KEYS
34 from appenlight.lib.redis_keys import REDIS_KEYS
35
35
36
36
37 def bytes2human(total):
37 def bytes2human(total):
38 giga = 1024.0 ** 3
38 giga = 1024.0 ** 3
39 mega = 1024.0 ** 2
39 mega = 1024.0 ** 2
40 kilo = 1024.0
40 kilo = 1024.0
41 if giga <= total:
41 if giga <= total:
42 return '{:0.1f}G'.format(total / giga)
42 return '{:0.1f}G'.format(total / giga)
43 elif mega <= total:
43 elif mega <= total:
44 return '{:0.1f}M'.format(total / mega)
44 return '{:0.1f}M'.format(total / mega)
45 else:
45 else:
46 return '{:0.1f}K'.format(total / kilo)
46 return '{:0.1f}K'.format(total / kilo)
47
47
48
48
49 log = logging.getLogger(__name__)
49 log = logging.getLogger(__name__)
50
50
51
51
52 @view_config(route_name='section_view',
52 @view_config(route_name='section_view',
53 match_param=['section=admin_section', 'view=system'],
53 match_param=['section=admin_section', 'view=system'],
54 renderer='json', permission='root_administration')
54 renderer='json', permission='root_administration')
55 def system(request):
55 def system(request):
56 current_time = datetime.utcnow(). \
56 current_time = datetime.utcnow(). \
57 replace(second=0, microsecond=0) - timedelta(minutes=1)
57 replace(second=0, microsecond=0) - timedelta(minutes=1)
58 # global app counter
58 # global app counter
59
59 processed_reports = request.registry.redis_conn.get(
60 processed_reports = Datastores.redis.get(
61 REDIS_KEYS['counters']['reports_per_minute'].format(current_time))
60 REDIS_KEYS['counters']['reports_per_minute'].format(current_time))
62 processed_reports = int(processed_reports) if processed_reports else 0
61 processed_reports = int(processed_reports) if processed_reports else 0
63 processed_logs = Datastores.redis.get(
62 processed_logs = request.registry.redis_conn.get(
64 REDIS_KEYS['counters']['logs_per_minute'].format(current_time))
63 REDIS_KEYS['counters']['logs_per_minute'].format(current_time))
65 processed_logs = int(processed_logs) if processed_logs else 0
64 processed_logs = int(processed_logs) if processed_logs else 0
66 processed_metrics = Datastores.redis.get(
65 processed_metrics = request.registry.redis_conn.get(
67 REDIS_KEYS['counters']['metrics_per_minute'].format(current_time))
66 REDIS_KEYS['counters']['metrics_per_minute'].format(current_time))
68 processed_metrics = int(processed_metrics) if processed_metrics else 0
67 processed_metrics = int(processed_metrics) if processed_metrics else 0
69
68
70 waiting_reports = 0
69 waiting_reports = 0
71 waiting_logs = 0
70 waiting_logs = 0
72 waiting_metrics = 0
71 waiting_metrics = 0
73 waiting_other = 0
72 waiting_other = 0
74
73
75 if 'redis' in request.registry.settings['celery.broker_type']:
74 if 'redis' in request.registry.settings['celery.broker_type']:
76 redis_client = redis.StrictRedis.from_url(
75 redis_client = redis.StrictRedis.from_url(
77 request.registry.settings['celery.broker_url'])
76 request.registry.settings['celery.broker_url'])
78 waiting_reports = redis_client.llen('reports')
77 waiting_reports = redis_client.llen('reports')
79 waiting_logs = redis_client.llen('logs')
78 waiting_logs = redis_client.llen('logs')
80 waiting_metrics = redis_client.llen('metrics')
79 waiting_metrics = redis_client.llen('metrics')
81 waiting_other = redis_client.llen('default')
80 waiting_other = redis_client.llen('default')
82
81
83 # process
82 # process
84 def replace_inf(val):
83 def replace_inf(val):
85 return val if val != psutil.RLIM_INFINITY else 'unlimited'
84 return val if val != psutil.RLIM_INFINITY else 'unlimited'
86
85
87 p = psutil.Process()
86 p = psutil.Process()
88 fd = p.rlimit(psutil.RLIMIT_NOFILE)
87 fd = p.rlimit(psutil.RLIMIT_NOFILE)
89 memlock = p.rlimit(psutil.RLIMIT_MEMLOCK)
88 memlock = p.rlimit(psutil.RLIMIT_MEMLOCK)
90 self_info = {
89 self_info = {
91 'fds': {'soft': replace_inf(fd[0]),
90 'fds': {'soft': replace_inf(fd[0]),
92 'hard': replace_inf(fd[1])},
91 'hard': replace_inf(fd[1])},
93 'memlock': {'soft': replace_inf(memlock[0]),
92 'memlock': {'soft': replace_inf(memlock[0]),
94 'hard': replace_inf(memlock[1])},
93 'hard': replace_inf(memlock[1])},
95 }
94 }
96
95
97 # disks
96 # disks
98 disks = []
97 disks = []
99 for part in psutil.disk_partitions(all=False):
98 for part in psutil.disk_partitions(all=False):
100 if os.name == 'nt':
99 if os.name == 'nt':
101 if 'cdrom' in part.opts or part.fstype == '':
100 if 'cdrom' in part.opts or part.fstype == '':
102 continue
101 continue
103 usage = psutil.disk_usage(part.mountpoint)
102 usage = psutil.disk_usage(part.mountpoint)
104 disks.append({
103 disks.append({
105 'device': part.device,
104 'device': part.device,
106 'total': bytes2human(usage.total),
105 'total': bytes2human(usage.total),
107 'used': bytes2human(usage.used),
106 'used': bytes2human(usage.used),
108 'free': bytes2human(usage.free),
107 'free': bytes2human(usage.free),
109 'percentage': int(usage.percent),
108 'percentage': int(usage.percent),
110 'mountpoint': part.mountpoint,
109 'mountpoint': part.mountpoint,
111 'fstype': part.fstype
110 'fstype': part.fstype
112 })
111 })
113
112
114 # memory
113 # memory
115 memory_v = psutil.virtual_memory()
114 memory_v = psutil.virtual_memory()
116 memory_s = psutil.swap_memory()
115 memory_s = psutil.swap_memory()
117
116
118 memory = {
117 memory = {
119 'total': bytes2human(memory_v.total),
118 'total': bytes2human(memory_v.total),
120 'available': bytes2human(memory_v.available),
119 'available': bytes2human(memory_v.available),
121 'percentage': memory_v.percent,
120 'percentage': memory_v.percent,
122 'used': bytes2human(memory_v.used),
121 'used': bytes2human(memory_v.used),
123 'free': bytes2human(memory_v.free),
122 'free': bytes2human(memory_v.free),
124 'active': bytes2human(memory_v.active),
123 'active': bytes2human(memory_v.active),
125 'inactive': bytes2human(memory_v.inactive),
124 'inactive': bytes2human(memory_v.inactive),
126 'buffers': bytes2human(memory_v.buffers),
125 'buffers': bytes2human(memory_v.buffers),
127 'cached': bytes2human(memory_v.cached),
126 'cached': bytes2human(memory_v.cached),
128 'swap_total': bytes2human(memory_s.total),
127 'swap_total': bytes2human(memory_s.total),
129 'swap_used': bytes2human(memory_s.used)
128 'swap_used': bytes2human(memory_s.used)
130 }
129 }
131
130
132 # load
131 # load
133 system_load = os.getloadavg()
132 system_load = os.getloadavg()
134
133
135 # processes
134 # processes
136 min_mem = 1024 * 1024 * 40 # 40MB
135 min_mem = 1024 * 1024 * 40 # 40MB
137 process_info = []
136 process_info = []
138 for p in psutil.process_iter():
137 for p in psutil.process_iter():
139 mem_used = p.get_memory_info().rss
138 mem_used = p.get_memory_info().rss
140 if mem_used < min_mem:
139 if mem_used < min_mem:
141 continue
140 continue
142 process_info.append({'owner': p.username(),
141 process_info.append({'owner': p.username(),
143 'pid': p.pid,
142 'pid': p.pid,
144 'cpu': round(p.get_cpu_percent(interval=0), 1),
143 'cpu': round(p.get_cpu_percent(interval=0), 1),
145 'mem_percentage': round(p.get_memory_percent(),
144 'mem_percentage': round(p.get_memory_percent(),
146 1),
145 1),
147 'mem_usage': bytes2human(mem_used),
146 'mem_usage': bytes2human(mem_used),
148 'name': p.name(),
147 'name': p.name(),
149 'command': ' '.join(p.cmdline())
148 'command': ' '.join(p.cmdline())
150 })
149 })
151 process_info = sorted(process_info, key=lambda x: x['mem_percentage'],
150 process_info = sorted(process_info, key=lambda x: x['mem_percentage'],
152 reverse=True)
151 reverse=True)
153
152
154 # pg tables
153 # pg tables
155
154
156 db_size_query = '''
155 db_size_query = '''
157 SELECT tablename, pg_total_relation_size(tablename::text) size
156 SELECT tablename, pg_total_relation_size(tablename::text) size
158 FROM pg_tables WHERE tablename NOT LIKE 'pg_%' AND
157 FROM pg_tables WHERE tablename NOT LIKE 'pg_%' AND
159 tablename NOT LIKE 'sql_%' ORDER BY size DESC;'''
158 tablename NOT LIKE 'sql_%' ORDER BY size DESC;'''
160
159
161 db_tables = []
160 db_tables = []
162 for row in DBSession.execute(db_size_query):
161 for row in DBSession.execute(db_size_query):
163 db_tables.append({"size_human": bytes2human(row.size),
162 db_tables.append({"size_human": bytes2human(row.size),
164 "table_name": row.tablename})
163 "table_name": row.tablename})
165
164
166 # es indices
165 # es indices
167 es_indices = []
166 es_indices = []
168 result = Datastores.es.send_request(
167 result = Datastores.es.send_request(
169 'GET', ['_stats', 'store, docs'], query_params={})
168 'GET', ['_stats', 'store, docs'], query_params={})
170 for ix, stats in result['indices'].items():
169 for ix, stats in result['indices'].items():
171 size = stats['primaries']['store']['size_in_bytes']
170 size = stats['primaries']['store']['size_in_bytes']
172 es_indices.append({'name': ix,
171 es_indices.append({'name': ix,
173 'size': size,
172 'size': size,
174 'size_human': bytes2human(size)})
173 'size_human': bytes2human(size)})
175
174
176 # packages
175 # packages
177
176
178 packages = ({'name': p.project_name, 'version': p.version}
177 packages = ({'name': p.project_name, 'version': p.version}
179 for p in pkg_resources.working_set)
178 for p in pkg_resources.working_set)
180
179
181 return {'db_tables': db_tables,
180 return {'db_tables': db_tables,
182 'es_indices': sorted(es_indices,
181 'es_indices': sorted(es_indices,
183 key=lambda x: x['size'], reverse=True),
182 key=lambda x: x['size'], reverse=True),
184 'process_info': process_info,
183 'process_info': process_info,
185 'system_load': system_load,
184 'system_load': system_load,
186 'disks': disks,
185 'disks': disks,
187 'memory': memory,
186 'memory': memory,
188 'packages': sorted(packages, key=lambda x: x['name'].lower()),
187 'packages': sorted(packages, key=lambda x: x['name'].lower()),
189 'current_time': current_time,
188 'current_time': current_time,
190 'queue_stats': {
189 'queue_stats': {
191 'processed_reports': processed_reports,
190 'processed_reports': processed_reports,
192 'processed_logs': processed_logs,
191 'processed_logs': processed_logs,
193 'processed_metrics': processed_metrics,
192 'processed_metrics': processed_metrics,
194 'waiting_reports': waiting_reports,
193 'waiting_reports': waiting_reports,
195 'waiting_logs': waiting_logs,
194 'waiting_logs': waiting_logs,
196 'waiting_metrics': waiting_metrics,
195 'waiting_metrics': waiting_metrics,
197 'waiting_other': waiting_other
196 'waiting_other': waiting_other
198 },
197 },
199 'self_info': self_info
198 'self_info': self_info
200 }
199 }
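The reports_per_minute, logs_per_minute and metrics_per_minute counters read at the top of this view are populated elsewhere, in the ingestion tasks that are not part of this hunk; presumably the write side follows the same incr-plus-expire pipeline pattern as set_notification_info above, keyed by the current minute. A hedged sketch of what such a write could look like:

# Illustrative write side for the per-minute counters read by the view
# above; the real increments happen in the celery tasks, not shown here.
from datetime import datetime

from appenlight.models import Datastores
from appenlight.lib.redis_keys import REDIS_KEYS

current_time = datetime.utcnow().replace(second=0, microsecond=0)
key = REDIS_KEYS['counters']['reports_per_minute'].format(current_time)
pipeline = Datastores.redis.pipeline()
pipeline.incr(key, 5)            # e.g. a batch of five processed reports
pipeline.expire(key, 3600 * 24)  # keep the counter around for a day
pipeline.execute()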