This commit is contained in:
Mitch Ross 2023-02-26 20:31:22 -05:00
parent 92b5606ed4
commit 6c407911f6
3 changed files with 147 additions and 79 deletions

View File

@ -1,7 +1,8 @@
import json
import re
from urllib.request import urlopen
from prometheus_client import CollectorRegistry from prometheus_client import CollectorRegistry
from prometheus_client.metrics_core import GaugeMetricFamily from prometheus_client.metrics_core import GaugeMetricFamily, InfoMetricFamily
from frigate.requester import Requester
@ -11,26 +12,155 @@ def setupRegistry():
return myregistry return myregistry
def add_metric(metric, label, data, key, multiplier=1.0):
try:
string = str(data[key])
value = float(re.findall(r'\d+', string)[0])
metric.add_metric([label], value * multiplier)
except (KeyError, TypeError, IndexError):
pass
class CustomCollector(): class CustomCollector():
def __init__(self): def __init__(self):
self.service_unavailable_url = "https://httpstat.us/503" self.stats_url = "http://localhost:5000/api/stats"
self.ok_url = "https://httpstat.us/200"
def collect(self): def collect(self):
server_unavailable_requester = Requester(self.service_unavailable_url)
ok_requester = Requester(self.ok_url)
server_unavailable_response = server_unavailable_requester.get_request()
ok_response = ok_requester.get_request()
url_up_gauge = GaugeMetricFamily('sample_external_url_up', 'Help text', labels=['url']) data = json.loads(urlopen(self.stats_url).read())
url_response_ms_gauge = GaugeMetricFamily('sample_external_url_response_ms', 'Help text', labels=['url'])
url_up_gauge.add_metric([server_unavailable_response.url], server_unavailable_response.up_or_down) # camera stats
url_response_ms_gauge.add_metric([server_unavailable_response.url], server_unavailable_response.response_ms) ffmpeg_pid = GaugeMetricFamily('frigate_ffmpeg_pid', 'PID for ffmpeg process', labels=['camera'])
capture_pid = GaugeMetricFamily('frigate_capture_pid', 'PID for the ffmpeg process that consumes this camera',
labels=['camera'])
detect_pid = GaugeMetricFamily('frigate_detect_pid', 'PID for the process that runs detection for this camera',
labels=['camera'])
camera_fps = GaugeMetricFamily('frigate_camera_fps', 'Frames per second being consumed from your camera.',
labels=['camera'])
detection_fps = GaugeMetricFamily('frigate_detection_fps', 'Number of times detection is run per second.',
labels=['camera'])
process_fps = GaugeMetricFamily('frigate_process_fps', 'Frames per second being processed by frigate.',
labels=['camera'])
skipped_fps = GaugeMetricFamily('frigate_skipped_fps', 'Frames per second skip for processing by frigate.',
labels=['camera'])
detection_enabled = GaugeMetricFamily('frigate_detection_enabled', 'Detection enabled for camera',
labels=['camera'])
url_up_gauge.add_metric([ok_response.url], ok_response.up_or_down) for k, d in data.items():
url_response_ms_gauge.add_metric([ok_response.url], ok_response.response_ms) add_metric(ffmpeg_pid, k, d, 'ffmpeg_pid')
add_metric(detect_pid, k, d, 'pid')
add_metric(capture_pid, k, d, 'capture_pid')
add_metric(camera_fps, k, d, 'camera_fps')
add_metric(detection_fps, k, d, 'detection_fps')
add_metric(process_fps, k, d, 'process_fps')
add_metric(skipped_fps, k, d, 'skipped_fps')
add_metric(detection_enabled, k, d, 'detection_enabled')
yield ffmpeg_pid
yield capture_pid
yield detect_pid
yield camera_fps
yield detection_fps
yield process_fps
yield skipped_fps
yield detection_enabled
# detector stats
try:
yield GaugeMetricFamily('frigate_detection_total_fps',
'Sum of detection_fps across all cameras and detectors.',
value=data['detection_fps'])
except KeyError:
pass
detector_inference_speed = GaugeMetricFamily('frigate_detector_inference_speed_seconds',
'Time spent running object detection in seconds.', labels=['name'])
detector_pid = GaugeMetricFamily('frigate_detector_pid',
'PID for the shared process that runs object detection on the detector',
labels=['name'])
detector_detection_start = GaugeMetricFamily('frigate_detection_start',
'Detector start time (unix timestamp)',
labels=['name'])
try:
for k, d in data['detectors'].items():
add_metric(detector_inference_speed, k, d, 'inference_speed', 0.001) # ms to seconds
add_metric(detector_pid, k, d, 'pid')
add_metric(detector_detection_start, k, d, 'detection_start')
except KeyError:
pass
yield detector_inference_speed
yield detector_pid
yield detector_detection_start
# process stats
cpu_usages = GaugeMetricFamily('frigate_cpu_usage_percent', 'Process CPU usage %', labels=['pid'])
mem_usages = GaugeMetricFamily('frigate_mem_usage_percent', 'Process memory usage %', labels=['pid'])
try:
for k, d in data['cpu_usages'].items():
add_metric(cpu_usages, k, d, 'cpu')
add_metric(mem_usages, k, d, 'mem')
except KeyError:
pass
yield cpu_usages
yield mem_usages
# gpu stats
gpu_usages = GaugeMetricFamily('frigate_gpu_usage_percent', 'GPU utilisation %', labels=['gpu'])
gpu_mem_usages = GaugeMetricFamily('frigate_gpu_mem_usage_percent', 'GPU memory usage %', labels=['gpu'])
try:
for k, d in data['gpu_usages'].items():
add_metric(gpu_usages, k, d, 'gpu')
add_metric(gpu_usages, k, d, 'mem')
except KeyError:
pass
yield gpu_usages
yield gpu_mem_usages
# service stats
uptime_seconds = GaugeMetricFamily('frigate_service_uptime_seconds', 'Uptime seconds')
last_updated_timestamp = GaugeMetricFamily('frigate_service_last_updated_timestamp',
'Stats recorded time (unix timestamp)')
try:
s = data['service']
add_metric(uptime_seconds, '', s, 'uptime')
add_metric(last_updated_timestamp, '', s, 'last_updated')
info = {'latest_version': data['service']['latest_version'], 'version': data['service']['version']}
yield InfoMetricFamily('frigate_service', 'Frigate version info', value=info)
except KeyError:
pass
yield uptime_seconds
yield last_updated_timestamp
# service->temperatures: no data for me
storage_free = GaugeMetricFamily('frigate_storage_free_bytes', 'Storage free bytes', labels=['storage'])
storage_mount_type = InfoMetricFamily('frigate_storage_mount_type', 'Storage mount type', labels=['storage'])
storage_total = GaugeMetricFamily('frigate_storage_total_bytes', 'Storage total bytes', labels=['storage'])
storage_used = GaugeMetricFamily('frigate_storage_used_bytes', 'Storage used bytes', labels=['storage'])
try:
for k, d in data['service']['storage'].items():
add_metric(storage_free, k, d, 'free', 1e6) # MB to bytes
add_metric(storage_total, k, d, 'total', 1e6) # MB to bytes
add_metric(storage_used, k, d, 'used', 1e6) # MB to bytes
storage_mount_type.add_metric(k, {'mount_type': d['mount_type']})
except KeyError:
pass
yield storage_free
yield storage_mount_type
yield storage_total
yield storage_used
yield url_up_gauge
yield url_response_ms_gauge

View File

@ -1,28 +0,0 @@
import json
from urllib.request import urlopen
from prometheus_client import CollectorRegistry
from prometheus_client.metrics_core import GaugeMetricFamily
from requester import Requester
def setupRegistry():
myregistry = CollectorRegistry()
myregistry.register(CustomCollector())
return myregistry
class CustomCollector():
def __init__(self):
self.stats_url = "http://localhost:5000/api/stats"
def collect(self):
data = json.loads(urlopen(self.url).read())
for k, d in data.items():
print("".format(k, d))

View File

@ -1,34 +0,0 @@
import requests
def convertMicroToMilliSeconds(microseconds):
if microseconds is not None:
return microseconds / 1000
return 0
class CustomResponse:
def __init__(self, url, response_ms, up_or_down):
self.url = url
self.response_ms = response_ms
self.up_or_down = up_or_down
def __str__(self):
return f"{self.url}:\nstatus -> {self.up_or_down}\nresponse_ms -> {self.response_ms}\n"
class Requester:
def __init__(self, url):
self.url = url
def get_request(self):
res = requests.get(self.url)
if res is not None:
upDown = 0
if res.status_code == 200:
upDown = 1
milliseconds = convertMicroToMilliSeconds(res.elapsed.microseconds)
return CustomResponse(self.url, milliseconds, upDown)
else:
# The request did not return anything
return CustomResponse(self.url, 0, 0)