"""Prometheus monitoring queries.""" # pylint: disable=too-few-public-methods import requests import strawberry from strawberry.scalars import JSON from dataclasses import dataclass from typing import Optional from datetime import datetime, timedelta PROMETHEUS_URL = "http://localhost:9001" @strawberry.type @dataclass class PrometheusQueryResult: result_type: str result: JSON class PrometheusQueries: @staticmethod def _send_query(query: str, start: int, end: int, step: int): try: response = requests.get( f"{PROMETHEUS_URL}/api/v1/query", params={ "query": query, "start": start, "end": end, "step": step, }, ) if response.status_code != 200: raise Exception("Prometheus returned unexpected HTTP status code") json = response.json() return PrometheusQueryResult( result_type=json["resultType"], result=json["result"] ) except Exception as error: raise Exception("Prometheus request failed! " + str(error)) @staticmethod def cpu_usage( start: Optional[int] = None, end: Optional[int] = None, step: int = 60, # seconds ) -> PrometheusQueryResult: """ Get CPU information. Args: start (int, optional): Unix timestamp indicating the start time. Defaults to 20 minutes ago if not provided. end (int, optional): Unix timestamp indicating the end time. Defaults to current time if not provided. step (int): Interval in seconds for querying disk usage data. """ if not start: start = int((datetime.now() - timedelta(minutes=20)).timestamp()) if not end: end = int(datetime.now().timestamp()) query = '100 - (avg by (instance) (rate(node_cpu_seconds_total{mode="idle"}[5m])) * 100)' return PrometheusQueries._send_query(query, start, end, step) @staticmethod def memory_usage( start: Optional[int] = None, end: Optional[int] = None, step: int = 60, # seconds ) -> PrometheusQueryResult: """ Get memory usage. Args: start (int, optional): Unix timestamp indicating the start time. Defaults to 20 minutes ago if not provided. end (int, optional): Unix timestamp indicating the end time. Defaults to current time if not provided. step (int): Interval in seconds for querying memory usage data. """ if not start: start = int((datetime.now() - timedelta(minutes=20)).timestamp()) if not end: end = int(datetime.now().timestamp()) query = "100 - (100 * (node_memory_MemAvailable_bytes / node_memory_MemTotal_bytes))" return PrometheusQueries._send_query(query, start, end, step) @staticmethod def disk_usage( start: Optional[int] = None, end: Optional[int] = None, step: int = 60, # seconds ) -> PrometheusQueryResult: """ Get disk usage information. Args: start (int, optional): Unix timestamp indicating the start time. Defaults to 20 minutes ago if not provided. end (int, optional): Unix timestamp indicating the end time. Defaults to current time if not provided. step (int): Interval in seconds for querying disk usage data. """ if not start: start = int((datetime.now() - timedelta(minutes=20)).timestamp()) if not end: end = int(datetime.now().timestamp()) query = """100 - (100 * sum by (device) (node_filesystem_avail_bytes{fstype!="rootfs"}) / sum by (device) (node_filesystem_size_bytes{fstype!="rootfs"}))""" return PrometheusQueries._send_query(query, start, end, step)