blob: 9049d953a48529f062f0e0f91828a30e6d53aab0 [file] [log] [blame]
# -*- coding: utf-8 -*-
# Copyright 2018 Whitestack, LLC
# *************************************************************
# This file is part of OSM Monitoring module
# All Rights Reserved to Whitestack, LLC
# Licensed under the Apache License, Version 2.0 (the "License"); you may
# not use this file except in compliance with the License. You may obtain
# a copy of the License at
# http://www.apache.org/licenses/LICENSE-2.0
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
# License for the specific language governing permissions and limitations
# under the License.
# For those usages not covered by the Apache License, Version 2.0 please
# contact: bdiaz@whitestack.com or glavado@whitestack.com
##
import logging
import multiprocessing
from enum import Enum
from typing import Tuple, List
from osm_mon.core.common_db import CommonDbClient
from osm_mon.core.config import Config
from osm_mon.core.models import Alarm
from osm_mon.evaluator.backends.prometheus import PrometheusBackend
# Module-level logger, named after this module.
log = logging.getLogger(__name__)
# Registry of metric backends: maps the backend name read from the
# "evaluator"/"backend" configuration option to the class that is
# instantiated to fetch metric values.
BACKENDS = {"prometheus": PrometheusBackend}
class AlarmStatus(Enum):
    """Statuses an alarm can have; each member's value is its string form."""

    # Reported when the metric value is past the alarm threshold
    # (above it for "GT" alarms, below it for "LT" alarms).
    ALARM = "alarm"
    # Reported when a metric value was obtained and the threshold is not crossed.
    OK = "ok"
    # Reported when the backend returned no value (None) for the metric.
    INSUFFICIENT = "insufficient-data"
    # Alarms whose stored status matches this value (case-insensitively) are
    # neither evaluated nor updated by EvaluatorService.
    DISABLED = "disabled"
class EvaluatorService:
    """Evaluate stored alarms against the current value of their metric.

    Every alarm returned by the common DB is evaluated in its own process.
    A worker reports its verdict by putting an ``(alarm, AlarmStatus)`` tuple
    on ``self.queue``; ``evaluate_alarms`` collects those tuples and returns
    them to the caller.
    """

    # Upper bound, in seconds, on how long evaluate_alarms waits for a single
    # worker process before giving up on it.
    _JOIN_TIMEOUT = 10
    # Length, in seconds, of one wait slice; the result queue is drained
    # between slices so workers are never blocked on a full pipe.
    _JOIN_POLL_INTERVAL = 0.5

    def __init__(self, config: Config):
        """Keep the configuration and create the DB client and result queue.

        :param config: configuration used to build the DB client and to pick
            and build the metric backend.
        """
        self.conf = config
        self.common_db = CommonDbClient(self.conf)
        self.queue = multiprocessing.Queue()

    def _get_metric_value(self, metric_name: str, tags: dict):
        """Fetch the current value of a metric from the configured backend.

        :param metric_name: name of the metric to query.
        :param tags: tags passed through to the backend query.
        :return: whatever the backend's ``get_metric_value`` returns.
        :raises KeyError: if the configured backend name is not in BACKENDS.
        """
        backend_name = self.conf.get("evaluator", "backend")
        backend = BACKENDS[backend_name](self.conf)
        return backend.get_metric_value(metric_name, tags)

    def _evaluate_metric(self, alarm: Alarm):
        """Evaluate one alarm and put its verdict on the result queue.

        Started as the target of a child process by ``evaluate_alarms``.
        Nothing is queued for disabled alarms or for alarms whose operation
        is neither "GT" nor "LT".

        :param alarm: alarm to evaluate.
        """
        log.debug("_evaluate_metric")
        # Check the disabled flag first: a disabled alarm never produces a
        # result, so querying the backend for it would be wasted work.
        if alarm.alarm_status.upper() == AlarmStatus.DISABLED.value.upper():
            return

        metric_value = self._get_metric_value(alarm.metric, alarm.tags)
        if metric_value is None:
            log.warning("No metric result for alarm %s", alarm.uuid)
            self.queue.put((alarm, AlarmStatus.INSUFFICIENT))
            return

        operation = alarm.operation.upper()
        if operation == "GT":
            threshold_crossed = metric_value > alarm.threshold
        elif operation == "LT":
            threshold_crossed = metric_value < alarm.threshold
        else:
            # Make the skipped evaluation visible instead of silently
            # producing no result.
            log.warning(
                "Unsupported operation %s for alarm %s",
                alarm.operation,
                alarm.uuid,
            )
            return

        status = AlarmStatus.ALARM if threshold_crossed else AlarmStatus.OK
        self.queue.put((alarm, status))

    def update_alarm_status(self, alarm_state, uuid):
        """Persist a new status for an alarm unless the alarm is disabled.

        :param alarm_state: status value handed to the common DB client.
        :param uuid: identifier of the alarm to update.
        """
        alarm_data = self.common_db.get_alarm_by_uuid(uuid)
        # NOTE(review): guards against the lookup yielding nothing, e.g. an
        # alarm removed while it was being evaluated -- confirm what
        # get_alarm_by_uuid returns for an unknown uuid.
        if not alarm_data:
            log.warning("Alarm %s not found, status not updated", uuid)
            return

        # A record without "alarm_status" is treated as not disabled rather
        # than failing on None.upper().
        stored_status = alarm_data.get("alarm_status") or ""
        if stored_status.upper() != AlarmStatus.DISABLED.value.upper():
            self.common_db.update_alarm_status(alarm_state, uuid)

    def _drain_queue(self, results: list) -> None:
        """Move every result currently available on the queue into *results*."""
        while not self.queue.empty():
            results.append(self.queue.get())

    def evaluate_alarms(self) -> List[Tuple[Alarm, AlarmStatus]]:
        """Evaluate all alarms in parallel and collect their verdicts.

        One process is started per alarm. Each process is given up to
        ``_JOIN_TIMEOUT`` seconds to finish; one that is still running after
        that is terminated so that hung workers do not pile up across calls.

        :return: the ``(alarm, AlarmStatus)`` tuples produced by the workers.
        """
        log.debug("evaluate_alarms")
        processes = []
        for alarm in self.common_db.get_alarms():
            p = multiprocessing.Process(target=self._evaluate_metric, args=(alarm,))
            processes.append(p)
            p.start()

        alarms_tuples = []
        wait_slices = int(self._JOIN_TIMEOUT / self._JOIN_POLL_INTERVAL)
        for process in processes:
            for _ in range(wait_slices):
                # Drain before every join: a child that has put data on the
                # queue cannot exit until that data has been consumed, so
                # joining without reading could stall until the timeout.
                self._drain_queue(alarms_tuples)
                process.join(timeout=self._JOIN_POLL_INTERVAL)
                if not process.is_alive():
                    break
            else:
                # Still alive after the full timeout. The queue has been
                # drained throughout, so the worker is presumably stuck
                # before producing a result.
                log.warning(
                    "Alarm evaluation process %s timed out, terminating it",
                    process.pid,
                )
                process.terminate()
                process.join(timeout=self._JOIN_POLL_INTERVAL)

        # Pick up results delivered after the last drain inside the loop.
        self._drain_queue(alarms_tuples)
        return alarms_tuples