-
Notifications
You must be signed in to change notification settings - Fork 6
Expand file tree
/
Copy pathmonitor.py
More file actions
131 lines (102 loc) · 5.58 KB
/
monitor.py
File metadata and controls
131 lines (102 loc) · 5.58 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
import time
import aiohttp
from typing import Iterator, AsyncGenerator
from urllib.parse import urljoin
from django.conf import settings
# PromQL templates used by the query helpers in this module. Every "%s" is a
# positional placeholder filled with the "%" operator at the call site, so the
# number and order of arguments must match the template exactly.

# Placeholders: metric-name regex ("|"-joined names), namespace, range window.
query_last_metrics_promql_tpl = """
last_over_time({__name__=~"%s",namespace="%s"}[%s])
"""
# Placeholder: namespace regex ("|"-joined namespaces).
query_loadbalancer_promql_tpl = """
kube_service_status_load_balancer_ingress{namespace=~"%s"}
"""
# Placeholders: namespace regex, range window (e.g. "3600s").
query_network_receive_flow_promql_tpl = """
increase(container_network_receive_bytes_total{namespace=~"%s"}[%s])
"""
# Placeholders: namespace regex, range window (e.g. "3600s").
query_network_transmit_flow_promql_tpl = """
increase(container_network_transmit_bytes_total{namespace=~"%s"}[%s])
"""
# Placeholders: pod-name prefix, namespace, range window. Result is grouped by pod.
query_cpu_usage_promql_tpl = """
sum (rate (container_cpu_usage_seconds_total{pod=~"^%s-.*$",namespace="%s"}[%s]))
by (pod)
"""
# Placeholders: pod-name prefix, namespace, range window. Result is grouped by pod.
query_memory_usage_promql_tpl = """
sum (avg_over_time (container_memory_working_set_bytes{pod=~"^%s-.*$",namespace="%s"}[%s]))
by (pod)
"""
# Placeholders: pod-name prefix, namespace, range window. Result is grouped by pod.
query_network_receive_usage_promql_tpl = """
sum (rate (container_network_receive_bytes_total{pod=~"^%s-.*$",namespace="%s"}[%s]))
by (pod)
"""
# Placeholders: pod-name prefix, namespace, range window. Result is grouped by pod.
query_network_transmit_usage_promql_tpl = """
sum (rate (container_network_transmit_bytes_total{pod=~"^%s-.*$",namespace="%s"}[%s]))
by (pod)
"""
async def query_prom(url, params) -> list[tuple[dict[str, str], int]]:
    """Send one GET query to a Prometheus-compatible HTTP API and return its results.

    Args:
        url: Full URL of the query endpoint.
        params: Query-string parameters forwarded unchanged to the request.

    Returns:
        The ``data.result`` list of the JSON response, or an empty list when the
        HTTP status is not 200, the API ``status`` is not ``"success"``, or the
        payload does not have the expected ``data.result`` shape.

    Exceptions raised by aiohttp (connection errors, JSON decoding errors) are
    not caught here and propagate to the caller.

    NOTE(review): the return annotation is kept for compatibility with the
    other helpers in this module, but callers index the items as dicts
    (``item['metric']``, ``item['value']``) — consider correcting it module-wide.
    """
    # A new session is opened for every call and closed when the block exits.
    async with aiohttp.ClientSession() as session:
        async with session.get(url, params=params) as response:
            if response.status != 200:
                return []
            payload = await response.json()
    # Treat a malformed body the same way as a failed query instead of
    # raising KeyError/TypeError from deep inside the helper.
    if not isinstance(payload, dict) or payload.get('status') != 'success':
        return []
    data = payload.get('data')
    if not isinstance(data, dict):
        return []
    return data.get('result') or []
def _escape_label_value(value) -> str:
    """Escape backslash, double quote and newline for a text-exposition label value."""
    # Backslash must be escaped first so the escapes added below are not doubled.
    return str(value).replace('\\', '\\\\').replace('"', '\\"').replace('\n', '\\n')


async def last_metrics(namespace) -> AsyncGenerator[str, None]:
    """Yield the latest samples of the configured metrics as exposition-format lines.

    Args:
        namespace: Namespace used for the exact-match ``namespace`` label filter.

    Yields:
        One ``name{label="value",...} sample\\n`` string per series returned by
        the query. Only labels listed for that metric in
        ``settings.DRYCC_METRICS_CONFIG`` are emitted, and label values are
        escaped so that quotes, backslashes and newlines cannot break the line.

    Nothing is yielded when ``settings.DRYCC_METRICS_CONFIG`` is empty.
    """
    if not settings.DRYCC_METRICS_CONFIG:
        return
    url = urljoin(settings.DRYCC_VICTORIAMETRICS_URL, "/select/0/prometheus/api/v1/query")
    promql = query_last_metrics_promql_tpl % (
        '|'.join(settings.DRYCC_METRICS_CONFIG.keys()),
        namespace,
        settings.DRYCC_METRICS_INTERVAL,
    )
    # NOTE(review): the Prometheus instant-query endpoint documents a `time`
    # parameter rather than `start`; confirm the backend honours `start`.
    params = {"query": promql, "start": int(time.time() - 60)}
    for item in await query_prom(url, params):
        labels = item['metric']
        name = labels['__name__']
        # Look up the allowed label names once per series, not once per label.
        allowed = settings.DRYCC_METRICS_CONFIG[name]
        rendered = ','.join(
            f'{key}="{_escape_label_value(value)}"'
            for key, value in labels.items()
            if key in allowed
        )
        yield '%s{%s} %s\n' % (name, rendered, item['value'][1])
async def query_loadbalancer(
    namespaces: Iterator[str], start: int, stop: int
) -> list[tuple[dict[str, str], int]]:
    """Query load balancer ingress status series for the given namespaces.

    Args:
        namespaces: Namespace names; joined with "|" into a regex matcher.
        start: Sent as the ``start`` request parameter.
        stop: Sent as the ``end`` request parameter.

    Returns:
        Whatever ``query_prom`` returns for the built query.
    """
    endpoint = urljoin(
        settings.DRYCC_VICTORIAMETRICS_URL,
        "/select/0/prometheus/api/v1/query",
    )
    namespace_regex = "|".join(namespaces)
    request_params = {
        "query": query_loadbalancer_promql_tpl % namespace_regex,
        "start": start,
        "end": stop,
    }
    return await query_prom(endpoint, request_params)
async def query_network_receive_flow(
    namespaces: Iterator[str], start: int, stop: int
) -> list[tuple[dict[str, str], int]]:
    """Query the increase in received network bytes for the given namespaces.

    Args:
        namespaces: Namespace names; joined with "|" into a regex matcher.
        start: Sent as the ``start`` request parameter.
        stop: Sent as the ``end`` request parameter.

    The range window of the query is ``stop - start`` seconds.

    Returns:
        Whatever ``query_prom`` returns for the built query.
    """
    endpoint = urljoin(
        settings.DRYCC_VICTORIAMETRICS_URL,
        "/select/0/prometheus/api/v1/query",
    )
    namespace_regex = "|".join(namespaces)
    window = f"{stop - start}s"
    request_params = {
        "query": query_network_receive_flow_promql_tpl % (namespace_regex, window),
        "start": start,
        "end": stop,
    }
    return await query_prom(endpoint, request_params)
async def query_network_transmit_flow(
    namespaces: Iterator[str], start: int, stop: int
) -> list[tuple[dict[str, str], int]]:
    """Query the increase in transmitted network bytes for the given namespaces.

    Args:
        namespaces: Namespace names; joined with "|" into a regex matcher.
        start: Sent as the ``start`` request parameter.
        stop: Sent as the ``end`` request parameter.

    The range window of the query is ``stop - start`` seconds.

    Returns:
        Whatever ``query_prom`` returns for the built query.
    """
    endpoint = urljoin(
        settings.DRYCC_VICTORIAMETRICS_URL,
        "/select/0/prometheus/api/v1/query",
    )
    namespace_regex = "|".join(namespaces)
    window = f"{stop - start}s"
    request_params = {
        "query": query_network_transmit_flow_promql_tpl % (namespace_regex, window),
        "start": start,
        "end": stop,
    }
    return await query_prom(endpoint, request_params)
async def query_cpu_usage(
    namespace: str, ptype: str, every: str,
    start: int, stop: int, step: int,
) -> list[tuple[dict[str, str], int]]:
    """Run a range query for per-pod CPU usage rate.

    Args:
        namespace: Namespace label value; also the first part of the pod prefix.
        ptype: Second part of the pod prefix (``<namespace>-<ptype>``).
        every: Range window inserted into the query selector.
        start: Sent as the ``start`` request parameter.
        stop: Sent as the ``end`` request parameter.
        step: Sent as the ``step`` request parameter.

    Returns:
        Whatever ``query_prom`` returns for the built query.
    """
    endpoint = urljoin(
        settings.DRYCC_VICTORIAMETRICS_URL,
        "/select/0/prometheus/api/v1/query_range",
    )
    prefix = f"{namespace}-{ptype}"
    request_params = {
        "query": query_cpu_usage_promql_tpl % (prefix, namespace, every),
        "start": start,
        "end": stop,
        "step": step,
    }
    return await query_prom(endpoint, request_params)
async def query_memory_usage(
    namespace: str, ptype: str, every: str,
    start: int, stop: int, step: int,
) -> list[tuple[dict[str, str], int]]:
    """Run a range query for per-pod average working-set memory.

    Args:
        namespace: Namespace label value; also the first part of the pod prefix.
        ptype: Second part of the pod prefix (``<namespace>-<ptype>``).
        every: Range window inserted into the query selector.
        start: Sent as the ``start`` request parameter.
        stop: Sent as the ``end`` request parameter.
        step: Sent as the ``step`` request parameter.

    Returns:
        Whatever ``query_prom`` returns for the built query.
    """
    endpoint = urljoin(
        settings.DRYCC_VICTORIAMETRICS_URL,
        "/select/0/prometheus/api/v1/query_range",
    )
    prefix = f"{namespace}-{ptype}"
    request_params = {
        "query": query_memory_usage_promql_tpl % (prefix, namespace, every),
        "start": start,
        "end": stop,
        "step": step,
    }
    return await query_prom(endpoint, request_params)
async def query_network_receive_usage(
    namespace: str, ptype: str, every: str,
    start: int, stop: int, step: int,
) -> list[tuple[dict[str, str], int]]:
    """Run a range query for the per-pod rate of received network bytes.

    Args:
        namespace: Namespace label value; also the first part of the pod prefix.
        ptype: Second part of the pod prefix (``<namespace>-<ptype>``).
        every: Range window inserted into the query selector.
        start: Sent as the ``start`` request parameter.
        stop: Sent as the ``end`` request parameter.
        step: Sent as the ``step`` request parameter.

    Returns:
        Whatever ``query_prom`` returns for the built query.
    """
    endpoint = urljoin(
        settings.DRYCC_VICTORIAMETRICS_URL,
        "/select/0/prometheus/api/v1/query_range",
    )
    prefix = f"{namespace}-{ptype}"
    request_params = {
        "query": query_network_receive_usage_promql_tpl % (prefix, namespace, every),
        "start": start,
        "end": stop,
        "step": step,
    }
    return await query_prom(endpoint, request_params)
async def query_network_transmit_usage(
    namespace: str, ptype: str, every: str,
    start: int, stop: int, step: int,
) -> list[tuple[dict[str, str], int]]:
    """Run a range query for the per-pod rate of transmitted network bytes.

    Args:
        namespace: Namespace label value; also the first part of the pod prefix.
        ptype: Second part of the pod prefix (``<namespace>-<ptype>``).
        every: Range window inserted into the query selector.
        start: Sent as the ``start`` request parameter.
        stop: Sent as the ``end`` request parameter.
        step: Sent as the ``step`` request parameter.

    Returns:
        Whatever ``query_prom`` returns for the built query.
    """
    endpoint = urljoin(
        settings.DRYCC_VICTORIAMETRICS_URL,
        "/select/0/prometheus/api/v1/query_range",
    )
    prefix = f"{namespace}-{ptype}"
    request_params = {
        "query": query_network_transmit_usage_promql_tpl % (prefix, namespace, every),
        "start": start,
        "end": stop,
        "step": step,
    }
    return await query_prom(endpoint, request_params)