Add prometheus data source for watcher decision engine

This adds a new data source for the Watcher decision engine that implements the watcher.decision_engine.datasources.DataSourceBase. related spec was merged at [1]. Implements: blueprint prometheus-datasource [1] https://review.opendev.org/c/openstack/watcher-specs/+/933300 Change-Id: I6a70c4acc70a864c418cf347f5f6951cb92ec906
2024-11-01 10:48:36 +02:00
parent d6cb38289e
commit 3f26dc47f2
9 changed files with 1076 additions and 0 deletions
--- a/watcher/decision_engine/datasources/manager.py
+++ b/watcher/decision_engine/datasources/manager.py
@@ -25,6 +25,7 @@ from watcher.decision_engine.datasources import ceilometer as ceil
 from watcher.decision_engine.datasources import gnocchi as gnoc
 from watcher.decision_engine.datasources import grafana as graf
 from watcher.decision_engine.datasources import monasca as mon
+from watcher.decision_engine.datasources import prometheus as prom

 LOG = log.getLogger(__name__)

@@ -36,6 +37,7 @@ class DataSourceManager(object):
        (ceil.CeilometerHelper.NAME, ceil.CeilometerHelper.METRIC_MAP),
        (mon.MonascaHelper.NAME, mon.MonascaHelper.METRIC_MAP),
        (graf.GrafanaHelper.NAME, graf.GrafanaHelper.METRIC_MAP),
+        (prom.PrometheusHelper.NAME, prom.PrometheusHelper.METRIC_MAP),
    ])
    """Dictionary with all possible datasources, dictionary order is
    the default order for attempting to use datasources
@@ -48,6 +50,7 @@ class DataSourceManager(object):
        self._monasca = None
        self._gnocchi = None
        self._grafana = None
+        self._prometheus = None

        # Dynamically update grafana metric map, only available at runtime
        # The metric map can still be overridden by a yaml config file
@@ -104,6 +107,16 @@ class DataSourceManager(object):
    def grafana(self, grafana):
        self._grafana = grafana

+    @property
+    def prometheus(self):
+        if self._prometheus is None:
+            self._prometheus = prom.PrometheusHelper()
+        return self._prometheus
+
+    @prometheus.setter
+    def prometheus(self, prometheus):
+        self._prometheus = prometheus
+
    def get_backend(self, metrics):
        """Determine the datasource to use from the configuration

--- a/watcher/decision_engine/datasources/prometheus.py
+++ b/watcher/decision_engine/datasources/prometheus.py
@@ -0,0 +1,442 @@
+# Copyright 2024 Red Hat, Inc.
+#
+# Licensed under the Apache License, Version 2.0 (the "License"); you may
+# not use this file except in compliance with the License. You may obtain
+# a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
+# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
+# License for the specific language governing permissions and limitations
+# under the License.
+#
+from observabilityclient import prometheus_client
+from oslo_config import cfg
+from oslo_log import log
+import re
+from watcher._i18n import _
+from watcher.common import exception
+from watcher.decision_engine.datasources import base
+
+CONF = cfg.CONF
+LOG = log.getLogger(__name__)
+
+
+class PrometheusHelper(base.DataSourceBase):
+    """PrometheusHelper class for retrieving metrics from Prometheus server
+
+    This class implements the DataSourceBase to allow Watcher to query
+    Prometheus as a data source for metrics.
+    """
+
+    NAME = 'prometheus'
+    METRIC_MAP = dict(host_cpu_usage='node_cpu_seconds_total',
+                      host_ram_usage='node_memory_MemAvailable_bytes',
+                      host_outlet_temp=None,
+                      host_inlet_temp=None,
+                      host_airflow=None,
+                      host_power=None,
+                      instance_cpu_usage=None,
+                      instance_ram_usage=None,
+                      instance_ram_allocated=None,
+                      instance_l3_cache_usage=None,
+                      instance_root_disk_size=None,
+                      )
+    AGGREGATES_MAP = dict(mean='avg', max='max', min='min', count='avg')
+
+    def __init__(self):
+        """Initialise the PrometheusHelper
+
+        The prometheus helper uses the PrometheusAPIClient provided by
+        python-observabilityclient.
+        The prometheus_fqdn_instance_map maps the fqdn of each node to the
+        Prometheus instance label added to all metrics on that node. When
+        making queries to Prometheus we use the instance label to specify
+        the node for which metrics are to be retrieved.
+        host, port and fqdn_label come from watcher_client
+        config. The prometheus_fqdn_label allows override of the required label
+        in Prometheus scrape configs that specifies each target's fqdn.
+        """
+        self.prometheus = self._setup_prometheus_client()
+        self.prometheus_fqdn_label = (
+            CONF.prometheus_client.fqdn_label
+        )
+        self.prometheus_fqdn_instance_map = (
+            self._build_prometheus_fqdn_instance_map()
+        )
+        self.prometheus_host_instance_map = (
+            self._build_prometheus_host_instance_map()
+        )
+
+    def _setup_prometheus_client(self):
+        """Initialise the prometheus client with config options
+
+        Use the prometheus_client options in watcher.conf to setup
+        the PrometheusAPIClient client object and return it.
+        :raises watcher.common.exception.MissingParameter if
+                prometheus host or port is not set in the watcher.conf
+                under the [prometheus_client] section.
+        :raises watcher.common.exception.InvalidParameter if
+                the prometheus host or port have invalid format.
+        """
+        def _validate_host_port(host, port):
+            if len(host) > 255:
+                return (False, "hostname is too long: '%s'" % host)
+            if host[-1] == '.':
+                host = host[:-1]
+            legal_hostname = re.compile(
+                "(?!-)[a-z0-9-]{1,63}(?<!-)$", re.IGNORECASE)
+            if not all(legal_hostname.match(host_part)
+                       for host_part in host.split(".")):
+                return (False, "hostname '%s' failed regex match " % host)
+            try:
+                assert bool(1 <= int(port) <= 65535)
+            except (AssertionError, ValueError):
+                return (False, "missing or invalid port number '%s' "
+                        % port)
+            return (True, "all good")
+
+        _host = CONF.prometheus_client.host
+        _port = CONF.prometheus_client.port
+        if (not _host or not _port):
+            raise exception.MissingParameter(
+                message=(_(
+                    "prometheus host and port must be set in watcher.conf "
+                    "under the [prometheus_client] section. Can't initialise "
+                    "the datasource without valid host and port."))
+            )
+        validated, reason = _validate_host_port(_host, _port)
+        if (not validated):
+            raise exception.InvalidParameter(
+                message=(_(
+                    "A valid prometheus host and port are required. The #"
+                    "values found in watcher.conf are '%(host)s' '%(port)s'. "
+                    "This fails validation for the following reason: "
+                    "%(reason)s.")
+                    % {'host': _host, 'port': _port, 'reason': reason})
+            )
+        the_client = prometheus_client.PrometheusAPIClient(
+            "%s:%s" % (_host, _port))
+
+        # check if tls options or basic_auth options are set and use them
+        prometheus_user = CONF.prometheus_client.username
+        prometheus_pass = CONF.prometheus_client.password
+        prometheus_ca_cert = CONF.prometheus_client.cafile
+        prometheus_client_cert = CONF.prometheus_client.certfile
+        prometheus_client_key = CONF.prometheus_client.keyfile
+        if (prometheus_ca_cert):
+            the_client.set_ca_cert(prometheus_ca_cert)
+            if (prometheus_client_cert and prometheus_client_key):
+                the_client.set_client_cert(
+                    prometheus_client_cert, prometheus_client_key)
+        if (prometheus_user and prometheus_pass):
+            the_client.set_basic_auth(prometheus_user, prometheus_pass)
+
+        return the_client
+
+    def _build_prometheus_fqdn_instance_map(self):
+        """Build the fqdn<-->instance_label mapping needed for queries
+
+        Watcher knows nodes by their hostname. In Prometheus however the
+        scrape targets (also known as 'instances') are specified by I.P.
+        (or hostname) and port number. This function creates a mapping between
+        the fully qualified domain name of each node and the corresponding
+        instance label used in the scrape config. This relies on a custom
+        'fqdn' label added to Prometheus scrape_configs. Operators can use
+        a different custom label instead by setting the prometheus_fqdn_label
+        config option under the prometheus_client section of watcher config.
+        The built prometheus_fqdn_instance_map is used to match watcher
+        node.hostname if watcher stores fqdn and otherwise the
+        host_instance_map is used instead.
+        :return a dict mapping fqdn to instance label. For example:
+                {'marios-env-again.controlplane.domain': '10.1.2.3:9100'}
+        """
+        prometheus_targets = self.prometheus._get(
+            "targets?state=active")['data']['activeTargets']
+        # >>> prometheus_targets[0]['labels']
+        # {'fqdn': 'marios-env-again.controlplane.domain',
+        #  'instance': 'localhost:9100', 'job': 'node'}
+        fqdn_instance_map = {
+            fqdn: instance for (fqdn, instance) in (
+                (target['labels'].get(self.prometheus_fqdn_label),
+                 target['labels'].get('instance'))
+                for target in prometheus_targets
+                if target.get('labels', {}).get(self.prometheus_fqdn_label)
+            )
+        }
+        if not fqdn_instance_map:
+            LOG.error(
+                "Could not create fqdn instance map from Prometheus "
+                "targets config. Prometheus returned the following: %s",
+                prometheus_targets
+            )
+            return {}
+        return fqdn_instance_map
+
+    def _build_prometheus_host_instance_map(self):
+        """Build the hostname<-->instance_label mapping needed for queries
+
+        The prometheus_fqdn_instance_map has the fully qualified domain name
+        for hosts. This will create a duplicate map containing only the host
+        name part. Depending on the watcher node.hostname either the
+        fqdn_instance_map or the host_instance_map will be used to resolve
+        the correct prometheus instance label for queries. In the event the
+        fqdn_instance_map keys are not valid fqdn (for example it contains
+        hostnames, not fqdn) the host_instance_map cannot be created and
+        an empty dictionary is returned with a warning logged.
+        :return a dict mapping hostname to instance label. For example:
+                {'marios-env-again': 'localhost:9100'}
+        """
+        if not self.prometheus_fqdn_instance_map:
+            LOG.error("Cannot build host_instance_map without "
+                      "fqdn_instance_map")
+            return {}
+        host_instance_map = {
+            host: instance for (host, instance) in (
+                (fqdn.split('.')[0], inst)
+                for fqdn, inst in self.prometheus_fqdn_instance_map.items()
+                if '.' in fqdn
+            )
+        }
+        if not host_instance_map:
+            LOG.warning("Creating empty host instance map. Are the keys "
+                        "in prometheus_fqdn_instance_map valid fqdn?")
+            return {}
+        return host_instance_map
+
+    def _resolve_prometheus_instance_label(self, node_name):
+        """Resolve the prometheus instance label to use in queries
+
+        Given the watcher node.hostname, resolve the prometheus instance
+        label for use in queries, first trying the fqdn_instance_map and
+        then the host_instance_map (watcher.node_name can be fqdn or hostname).
+        If the name is not resolved after the first attempt, rebuild the fqdn
+        and host instance maps and try again. This allows for new hosts added
+        after the initialisation of the fqdn_instance_map.
+        :param node_name: the watcher node.hostname
+        :return String for the prometheus instance label and None if not found
+        """
+        def _query_maps(node):
+            return self.prometheus_fqdn_instance_map.get(
+                node, self.prometheus_host_instance_map.get(node, None))
+
+        instance_label = _query_maps(node_name)
+        # refresh the fqdn and host instance maps and retry
+        if not instance_label:
+            self.prometheus_fqdn_instance_map = (
+                self._build_prometheus_fqdn_instance_map()
+            )
+            self.prometheus_host_instance_map = (
+                self._build_prometheus_host_instance_map()
+            )
+            instance_label = _query_maps(node_name)
+
+        if not instance_label:
+            LOG.error("Cannot query prometheus without instance label. "
+                      "Could not resolve %s", node_name)
+            return None
+        return instance_label
+
+    def _resolve_prometheus_aggregate(self, watcher_aggregate, meter):
+        """Resolve the prometheus aggregate using self.AGGREGATES_MAP
+
+        This uses the AGGREGATES_MAP to resolve the correct prometheus
+        aggregate to use in queries, from the given watcher aggregate
+        """
+        if watcher_aggregate == 'count':
+            LOG.warning('Prometheus data source does not currently support '
+                        ' the count aggregate. Proceeding with mean (avg).')
+        promql_aggregate = self.AGGREGATES_MAP.get(watcher_aggregate)
+        if not promql_aggregate:
+            raise exception.InvalidParameter(
+                message=(_("Unknown Watcher aggregate %s. This does not "
+                           "resolve to any valid prometheus query aggregate.")
+                         % watcher_aggregate)
+            )
+        return promql_aggregate
+
+    def _build_prometheus_query(self, aggregate, meter, instance_label,
+                                period):
+        """Build and return the prometheus query string with the given args
+
+        This function builds and returns the string query that will be sent
+        to the Prometheus server /query endpoint. For host cpu usage we use:
+
+        100 - (avg by (instance)(rate(node_cpu_seconds_total{mode='idle',
+                                       instance='some_host'}[300s])) * 100)
+
+        so using prometheus rate function over the specified period, we average
+        per instance (all cpus) idle time and then 'everything else' is cpu
+        usage time.
+
+        For host memory usage we use:
+
+        (node_memory_MemTotal_bytes{instance='the_host'} -
+        avg_over_time(
+            node_memory_MemAvailable_bytes{instance='the_host'}[300s]))
+            / 1024 / 1024
+
+        So we take total and subtract available memory to determine
+        how much is in use. We use the prometheus xxx_over_time functions
+        avg/max/min depending on the aggregate with the specified time period.
+
+        :param aggregate: one of the values of self.AGGREGATES_MAP
+        :param meter: the name of the Prometheus meter to use
+        :param instance_label: the Prometheus instance label (scrape target).
+        :param period: the period in seconds for which to query
+        :return: a String containing the Prometheus query
+        :raises watcher.common.exception.InvalidParameter if params are None
+        :raises watcher.common.exception.InvalidParameter if meter is not
+                known or currently supported (prometheus meter name).
+        """
+        query_args = None
+        if (meter is None or aggregate is None or instance_label is None or
+                period is None):
+            raise exception.InvalidParameter(
+                message=(_(
+                    "Cannot build prometheus query without args. "
+                    "You provided: meter %(mtr)s, aggregate %(agg)s, "
+                    "instance_label %(inst)s, period %(prd)s")
+                    % {'mtr': meter, 'agg': aggregate,
+                       'inst': instance_label, 'prd': period})
+            )
+
+        if meter == 'node_cpu_seconds_total':
+            query_args = (
+                "100 - (%s by (instance)(rate(%s"
+                "{mode='idle',instance='%s'}[%ss])) * 100)" %
+                (aggregate, meter, instance_label, period)
+            )
+        elif meter == 'node_memory_MemAvailable_bytes':
+            query_args = (
+                "(node_memory_MemTotal_bytes{instance='%s'} "
+                "- %s_over_time(%s{instance='%s'}[%ss])) "
+                "/ 1024 / 1024" %
+                (instance_label, aggregate, meter,
+                 instance_label, period)
+            )
+        else:
+            raise exception.InvalidParameter(
+                message=(_("Cannot process prometheus meter %s") % meter)
+            )
+
+        return query_args
+
+    def check_availability(self):
+        """check if Prometheus server is available for queries
+
+         Performs HTTP get on the prometheus API /status/runtimeinfo endpoint.
+         The prometheus_client will raise a PrometheuAPIClientError if the
+         call is unsuccessful, which is caught here and a warning logged.
+        """
+        try:
+            self.prometheus._get("status/runtimeinfo")
+        except prometheus_client.PrometheusAPIClientError:
+            LOG.warning(
+                "check_availability raised PrometheusAPIClientError. "
+                "Is Prometheus server down?"
+            )
+            return 'not available'
+        return 'available'
+
+    def list_metrics(self):
+        """Fetch all prometheus metrics from api/v1/label/__name__/values
+
+        The prometheus_client will raise a PrometheuAPIClientError if the
+        call is unsuccessful, which is caught here and a warning logged.
+        """
+        try:
+            response = self.prometheus._get("label/__name__/values")
+        except prometheus_client.PrometheusAPIClientError:
+            LOG.warning(
+                "list_metrics raised PrometheusAPIClientError. Is Prometheus"
+                "server down?"
+            )
+            return set()
+        return set(response['data'])
+
+    def statistic_aggregation(self, resource=None, resource_type=None,
+                              meter_name=None, period=300, aggregate='mean',
+                              granularity=300):
+
+        meter = self._get_meter(meter_name)
+        query_args = ''
+        instance_label = ''
+
+        if resource_type == 'compute_node':
+            instance_label = self._resolve_prometheus_instance_label(
+                resource.hostname)
+        else:
+            LOG.warning(
+                "Prometheus data source does not currently support "
+                "resource_type %s", resource_type
+            )
+            return None
+
+        promql_aggregate = self._resolve_prometheus_aggregate(aggregate, meter)
+        query_args = self._build_prometheus_query(
+            promql_aggregate, meter, instance_label, period
+        )
+        if not query_args:
+            LOG.error("Cannot proceed without valid prometheus query")
+            return None
+
+        result = self.query_retry(
+            self.prometheus.query, query_args,
+            ignored_exc=prometheus_client.PrometheusAPIClientError,
+        )
+
+        return float(result[0].value) if result else None
+
+    def statistic_series(self, resource=None, resource_type=None,
+                         meter_name=None, start_time=None, end_time=None,
+                         granularity=300):
+        raise NotImplementedError(
+            _('Prometheus helper currently does not support statistic_series. '
+              'This can be considered for future enhancement.'))
+
+    def _invert_max_min_aggregate(self, agg):
+        """Invert max and min for node/host metric queries from node-exporter
+
+            because we query for 'idle'/'unused' cpu and memory.
+            For Watcher 'max cpu used' we query for prometheus 'min idle time'.
+            For Watcher 'max memory used' we retrieve min 'unused'/'available'
+            memory from Prometheus. This internal function is used exclusively
+            by get_host_cpu_usage and get_host_ram_usage.
+            :param agg: the metric collection aggregate
+            :return: a String aggregate
+
+        """
+        if agg == 'max':
+            return 'min'
+        elif agg == 'min':
+            return 'max'
+        return agg
+
+    def get_host_cpu_usage(self, resource, period=300,
+                           aggregate="mean", granularity=None):
+        """Query prometheus for node_cpu_seconds_total
+
+        This calculates the host cpu usage and returns it as a percentage
+        The calculation is made by using the cpu 'idle' time, per
+        instance (so all CPUs are included). For example the query looks like
+        (100 - (avg by (instance)(rate(node_cpu_seconds_total
+            {mode='idle',instance='localhost:9100'}[300s])) * 100))
+        """
+        aggregate = self._invert_max_min_aggregate(aggregate)
+        cpu_usage = self.statistic_aggregation(
+            resource, 'compute_node',
+            'host_cpu_usage', period=period,
+            granularity=granularity, aggregate=aggregate)
+        return float(cpu_usage) if cpu_usage else None
+
+    def get_host_ram_usage(self, resource, period=300,
+                           aggregate="mean", granularity=None):
+        aggregate = self._invert_max_min_aggregate(aggregate)
+        ram_usage = self.statistic_aggregation(
+            resource, 'compute_node',
+            'host_ram_usage', period=period,
+            granularity=granularity, aggregate=aggregate)
+        return float(ram_usage) if ram_usage else None