277 changes: 80 additions & 197 deletions slo_generator/backends/cloud_monitoring.py
@@ -13,181 +13,57 @@
# limitations under the License.
"""
`cloud_monitoring.py`
-Cloud Monitoring backend implementation.
+Cloud Monitoring backend implementation with MQF (Monitoring Query Filters).
"""
 import logging
 import pprint
-import warnings
-from collections import OrderedDict
+from typing import List, Optional

-from google.cloud import monitoring_v3
+from google.api.distribution_pb2 import Distribution
+from google.cloud.monitoring_v3 import Aggregation, ListTimeSeriesRequest, TimeInterval
+from google.cloud.monitoring_v3.services.metric_service import MetricServiceClient
+from google.cloud.monitoring_v3.services.metric_service.pagers import (
+    ListTimeSeriesPager,
+)
+from google.cloud.monitoring_v3.types.metric import TimeSeries

-from slo_generator.constants import NO_DATA
+from .cloud_monitoring_abc import CloudMonitoringBackendABC

LOGGER = logging.getLogger(__name__)


-class CloudMonitoringBackend:
-    """Backend for querying metrics from Cloud Monitoring.
+class CloudMonitoringBackend(CloudMonitoringBackendABC):
+    """Backend for querying metrics from Cloud Monitoring with MQF.

    Args:
        project_id (str): Cloud Monitoring host project id.
-        client (google.cloud.monitoring_v3.MetricServiceClient, optional):
-            Existing Cloud Monitoring Metrics client. Initialize a new client
-            if omitted.
+        client (monitoring_v3.services.metric_service.MetricServiceClient, optional):
+            Existing Cloud Monitoring Metrics client. Initialize a new client if
+            omitted.
"""

def __init__(self, project_id, client=None):
def __init__(self, project_id: str, client=None):
self.client = client
if client is None:
self.client = monitoring_v3.MetricServiceClient()
self.client = MetricServiceClient()
self.parent = self.client.common_project_path(project_id)

-    # pylint: disable=duplicate-code
-    def good_bad_ratio(self, timestamp, window, slo_config):
-        """Query two timeseries, one containing 'good' events, one containing
-        'bad' events.
-
-        Args:
-            timestamp (int): UNIX timestamp.
-            window (int): Window size (in seconds).
-            slo_config (dict): SLO configuration.
-
-        Returns:
-            tuple: A tuple (good_event_count, bad_event_count)
-        """
-        measurement = slo_config["spec"]["service_level_indicator"]
-        filter_good = measurement["filter_good"]
-        filter_bad = measurement.get("filter_bad")
-        filter_valid = measurement.get("filter_valid")
-
-        # Query 'good events' timeseries
-        good_ts = self.query(
-            timestamp=timestamp,
-            window=window,
-            filter=filter_good,
-        )
-        good_ts = list(good_ts)
-        good_event_count = CM.count(good_ts)
-
-        # Query 'bad events' timeseries
-        if filter_bad:
-            bad_ts = self.query(
-                timestamp=timestamp,
-                window=window,
-                filter=filter_bad,
-            )
-            bad_ts = list(bad_ts)
-            bad_event_count = CM.count(bad_ts)
-        elif filter_valid:
-            valid_ts = self.query(
-                timestamp=timestamp,
-                window=window,
-                filter=filter_valid,
-            )
-            valid_ts = list(valid_ts)
-            bad_event_count = CM.count(valid_ts) - good_event_count
-        else:
-            raise Exception("One of `filter_bad` or `filter_valid` is required.")
-
-        LOGGER.debug(
-            f"Good events: {good_event_count} | " f"Bad events: {bad_event_count}"
-        )
-
-        return good_event_count, bad_event_count
-
-    # pylint: disable=duplicate-code,too-many-locals
-    def distribution_cut(self, timestamp, window, slo_config):
-        """Query one timeseries of type 'exponential'.
-
-        Args:
-            timestamp (int): UNIX timestamp.
-            window (int): Window size (in seconds).
-            slo_config (dict): SLO configuration.
-
-        Returns:
-            tuple: A tuple (good_event_count, bad_event_count).
-        """
-        measurement = slo_config["spec"]["service_level_indicator"]
-        filter_valid = measurement["filter_valid"]
-        threshold_bucket = int(measurement["threshold_bucket"])
-        good_below_threshold = measurement.get("good_below_threshold", True)
-
-        # Query 'valid' events
-        series = self.query(
-            timestamp=timestamp,
-            window=window,
-            filter=filter_valid,
-        )
-        series = list(series)
-
-        if not series:
-            return NO_DATA, NO_DATA  # no timeseries
-
-        distribution_value = series[0].points[0].value.distribution_value
-        # bucket_options = distribution_value.bucket_options
-        bucket_counts = distribution_value.bucket_counts
-        valid_events_count = distribution_value.count
-        # growth_factor = bucket_options.exponential_buckets.growth_factor
-        # scale = bucket_options.exponential_buckets.scale
-
-        # Explicit the exponential distribution result
-        count_sum = 0
-        distribution = OrderedDict()
-        for i, bucket_count in enumerate(bucket_counts):
-            count_sum += bucket_count
-            # upper_bound = scale * math.pow(growth_factor, i)
-            distribution[i] = {
-                # 'upper_bound': upper_bound,
-                # 'bucket_count': bucket_count,
-                "count_sum": count_sum
-            }
-        LOGGER.debug(pprint.pformat(distribution))
-
-        if len(distribution) - 1 < threshold_bucket:
-            # maximum measured metric is below the cut after bucket number
-            lower_events_count = valid_events_count
-            upper_events_count = 0
-        else:
-            lower_events_count = distribution[threshold_bucket]["count_sum"]
-            upper_events_count = valid_events_count - lower_events_count
-
-        if good_below_threshold:
-            good_event_count = lower_events_count
-            bad_event_count = upper_events_count
-        else:
-            good_event_count = upper_events_count
-            bad_event_count = lower_events_count
-
-        return good_event_count, bad_event_count
-
-    def exponential_distribution_cut(self, *args, **kwargs):
-        """Alias for `distribution_cut` method to allow for backwards
-        compatibility.
-        """
-        warnings.warn(
-            "exponential_distribution_cut will be deprecated in version 2.0, "
-            "please use distribution_cut instead",
-            FutureWarning,
-        )
-        return self.distribution_cut(*args, **kwargs)

    # pylint: disable=redefined-builtin,too-many-arguments
    def query(
        self,
-        timestamp,
-        window,
-        filter,
-        aligner="ALIGN_SUM",
-        reducer="REDUCE_SUM",
-        group_by=None,
-    ):
-        """Query timeseries from Cloud Monitoring.
+        timestamp: float,
+        window: int,
+        filter_or_query: str,
+        aligner: str = "ALIGN_SUM",
+        reducer: str = "REDUCE_SUM",
+        group_by: Optional[List[str]] = None,
+    ) -> List[TimeSeries]:
+        """Query timeseries from Cloud Monitoring using MQF.

        Args:
-            timestamp (int): Current timestamp.
+            timestamp (float): Current timestamp.
            window (int): Window size (in seconds).
-            filter (str): Query filter.
+            filter_or_query (str): Query filter.
            aligner (str, optional): Aligner to use.
            reducer (str, optional): Reducer to use.
            group_by (list, optional): List of fields to group by.
@@ -197,53 +73,41 @@ def query(
"""
if group_by is None:
group_by = []
measurement_window = CM.get_window(timestamp, window)
aggregation = CM.get_aggregation(
window, aligner=aligner, reducer=reducer, group_by=group_by
measurement_window = self.get_window(timestamp, window)
aggregation = self.get_aggregation(window, aligner, reducer, group_by)
request = ListTimeSeriesRequest(
{
"name": self.parent,
"filter": filter_or_query,
"interval": measurement_window,
"view": ListTimeSeriesRequest.TimeSeriesView.FULL,
"aggregation": aggregation,
}
)
request = monitoring_v3.ListTimeSeriesRequest()
request.name = self.parent
request.filter = filter
request.interval = measurement_window
request.view = monitoring_v3.ListTimeSeriesRequest.TimeSeriesView.FULL
request.aggregation = aggregation
timeseries = self.client.list_time_series(request)
timeseries_pager: ListTimeSeriesPager = self.client.list_time_series(request)
timeseries: List[TimeSeries] = list(timeseries_pager)
LOGGER.debug(pprint.pformat(timeseries))
return timeseries
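A minimal usage sketch of the refactored `query` path; the project ID, filter string, and window below are placeholders, not values from this PR:

```python
import time

from slo_generator.backends.cloud_monitoring import CloudMonitoringBackend

backend = CloudMonitoringBackend(project_id="my-project")  # hypothetical project

# Count events over the last hour. The filter string is a standard Cloud
# Monitoring filter, passed through unchanged as `filter_or_query`.
timeseries = backend.query(
    timestamp=time.time(),
    window=3600,
    filter_or_query=(
        'project="my-project" '
        'metric.type="appengine.googleapis.com/http/server/response_count"'
    ),
)
# With the ALIGN_SUM/REDUCE_SUM defaults, a non-empty result collapses to a
# single aggregated series whose first point carries the event count.
if timeseries:
    count = CloudMonitoringBackend.get_nb_events_from_timeseries(timeseries)
```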

-    @staticmethod
-    def count(timeseries):
-        """Count events in time series assuming it was aligned with ALIGN_SUM
-        and reduced with REDUCE_SUM (default).
-
-        Args:
-            :obj:`monitoring_v3.TimeSeries`: Timeseries object.
-
-        Returns:
-            int: Event count.
-        """
-        try:
-            return timeseries[0].points[0].value.int64_value
-        except (IndexError, AttributeError) as exception:
-            LOGGER.debug(exception, exc_info=True)
-            return NO_DATA  # no events in timeseries
-
    @staticmethod
-    def get_window(timestamp, window):
+    def get_window(
+        timestamp: float,
+        window: int,
+    ) -> TimeInterval:
"""Helper for measurement window.

Args:
timestamp (int): Current timestamp.
timestamp (float): Current timestamp.
window (int): Window size (in seconds).

Returns:
:obj:`monitoring_v3.types.TimeInterval`: Measurement window object.
:obj:`monitoring_v3.TimeInterval`: Measurement window object.
"""
end_time_seconds = int(timestamp)
end_time_nanos = int((timestamp - end_time_seconds) * 10**9)
start_time_seconds = int(timestamp - window)
start_time_nanos = end_time_nanos
measurement_window = monitoring_v3.TimeInterval(
measurement_window = TimeInterval(
{
"end_time": {
"seconds": end_time_seconds,
Expand All @@ -260,11 +124,11 @@ def get_window(timestamp, window):

    @staticmethod
    def get_aggregation(
-        window,
-        aligner="ALIGN_SUM",
-        reducer="REDUCE_SUM",
-        group_by=None,
-    ):
+        window: int,
+        aligner: str = "ALIGN_SUM",
+        reducer: str = "REDUCE_SUM",
+        group_by: Optional[List[str]] = None,
+    ) -> Aggregation:
        """Helper for aggregation object.

        Default aggregation is `ALIGN_SUM`.
@@ -274,27 +138,46 @@ def get_aggregation(
        Args:
            window (int): Window size (in seconds).
            aligner (str): Aligner type.
            reducer (str): Reducer type.
-            group_by (list): List of fields to group by.
+            group_by (list, optional): List of fields to group by.

        Returns:
-            :obj:`monitoring_v3.types.Aggregation`: Aggregation object.
+            :obj:`monitoring_v3.Aggregation`: Aggregation object.
        """
        if group_by is None:
            group_by = []
-        aggregation = monitoring_v3.Aggregation(
+        aggregation = Aggregation(
            {
                "alignment_period": {"seconds": window},
-                "per_series_aligner": getattr(
-                    monitoring_v3.Aggregation.Aligner, aligner
-                ),
-                "cross_series_reducer": getattr(
-                    monitoring_v3.Aggregation.Reducer, reducer
-                ),
+                "per_series_aligner": getattr(Aggregation.Aligner, aligner),
+                "cross_series_reducer": getattr(Aggregation.Reducer, reducer),
                "group_by_fields": group_by,
            }
        )
        LOGGER.debug(pprint.pformat(aggregation))
        return aggregation
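A short sketch of calling the aggregation helper with the default aligner and reducer; the group-by field is a hypothetical label, not one used in this PR:

```python
from slo_generator.backends.cloud_monitoring import CloudMonitoringBackend

# 300 s alignment period; values summed within each series, then across series.
aggregation = CloudMonitoringBackend.get_aggregation(
    window=300,
    group_by=["resource.labels.zone"],  # hypothetical grouping field
)
# Aligner/reducer names are resolved with getattr(), so a typo such as
# "ALIGN_SUMM" raises AttributeError rather than a friendlier error.
```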

+    @staticmethod
+    def get_distribution_value_from_timeseries(
+        timeseries: List[TimeSeries],
+    ) -> Distribution:
+        """Extract a distribution from a list of timeseries.
+
+        Args:
+            timeseries (list): List of timeseries.
+
+        Returns:
+            :obj:`google.api.distribution_pb2.Distribution`: Distribution.
+        """
+        return timeseries[0].points[0].value.distribution_value
+
+    @staticmethod
+    def get_nb_events_from_timeseries(timeseries: List[TimeSeries]) -> int:
+        """Count the events from a list of timeseries.
+
+        Args:
+            timeseries (list): List of timeseries.
+
+        Returns:
+            int: Number of events.
+        """
+        return timeseries[0].points[0].value.int64_value
-
-CM = CloudMonitoringBackend
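Presumably the deleted `good_bad_ratio` logic now lives in `CloudMonitoringBackendABC` and calls these hooks; a hedged sketch of the good/bad arithmetic using the new helpers (not the ABC's actual code — filters, project, and window are placeholders):

```python
import time

from slo_generator.backends.cloud_monitoring import CloudMonitoringBackend

backend = CloudMonitoringBackend(project_id="my-project")  # hypothetical
now = time.time()

# Stand-ins for an SLI's filter_good / filter_valid filter strings.
good_ts = backend.query(now, 3600, 'metric.type="custom.googleapis.com/good"')
valid_ts = backend.query(now, 3600, 'metric.type="custom.googleapis.com/valid"')

good = CloudMonitoringBackend.get_nb_events_from_timeseries(good_ts)
bad = CloudMonitoringBackend.get_nb_events_from_timeseries(valid_ts) - good
# Unlike the removed `count`, these helpers do not catch IndexError on empty
# results, so the caller must handle the no-data case itself.
```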