mistral-extra/mistral_extra/monitoring/monitoring_server.py

114 lines
3.6 KiB
Python

# Copyright 2023 - NetCracker Technology Corp.
#
# Licensed under the Apache License, Version 2.0 (the "License"); you may
# not use this file except in compliance with the License. You may obtain
# a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
# License for the specific language governing permissions and limitations
# under the License.
import datetime
from flask import Flask
from flask import jsonify
from flask import Response
from importlib_metadata import entry_points
from mistral.service import base as service_base
from mistral_extra.monitoring.prometheus import format_to_prometheus
from oslo_config import cfg
from oslo_log import log as logging
CONF = cfg.CONF
LOG = logging.getLogger(__name__)
def get_oslo_service(setup_profiler=True):
return MonitoringServer(
setup_profiler=setup_profiler
)
class MonitoringServer(service_base.MistralService):
def __init__(self, setup_profiler=True):
super(MonitoringServer, self).__init__(
'monitoring_group',
setup_profiler
)
collectors = entry_points(group='monitoring.metric_collector')
self._metric_collectors = [collector.load()()
for collector in collectors]
self._jobs = []
self._standard_tags = {}
self._metrics = {}
self._prometheus_formatted_metrics = []
self._last_updated = None
self._timedelta = datetime.timedelta(
seconds=CONF.monitoring.metric_collection_interval
)
self.app = Flask(__name__)
self.app.add_url_rule('/metrics', 'metrics', self.metrics)
self.app.add_url_rule('/health', 'health', self.health)
def collect_metrics(self, to_json=False):
now = datetime.datetime.now()
if not self._last_updated or self._outdated(now):
metrics = []
for collector in self._metric_collectors:
metrics.extend(collector.collect())
for metric in metrics:
metric.tags.update(self._standard_tags)
self._metrics = metrics
self._last_updated = now
if to_json:
return list(map(lambda x: x.__dict__, self._metrics))
return self._metrics
def _outdated(self, now):
return self._last_updated <= now - self._timedelta
def _get_prometheus_metrics(self):
metrics = self.collect_metrics(to_json=True)
pr_metrics = format_to_prometheus(metrics)
return ''.join([line.decode('utf-8') for line in pr_metrics])
def metrics(self):
with self.app.app_context():
m = self._get_prometheus_metrics()
return Response(m, 200, content_type='text/plain')
def health(self):
with self.app.app_context():
return jsonify({'status': 'UP'})
def _init_monitoring_jobs(self):
if CONF.recovery_job.enabled:
recovery_jobs = entry_points(group='monitoring.recovery_jobs')
for job in recovery_jobs:
recovery_job = job.load()()
self._jobs.append(recovery_job)
recovery_job.start()
def start(self):
super(MonitoringServer, self).start()
self._init_monitoring_jobs()
self.app.run(host="0.0.0.0", port=9090)
def stop(self, graceful=False):
super(MonitoringServer, self).stop()
for job in self._jobs:
job.stop(graceful)