add gemini handler and revert docker-compose

2026-02-07 03:35:26 +03:00 · 2023-12-14 03:13:46 -05:00 · 2023-12-14 03:13:46 -05:00 · 338a635056
commit 338a635056
parent af7cfee82d
2 changed files with 86 additions and 7 deletions
--- a/docker-compose.yml
+++ b/docker-compose.yml
@ -15,13 +15,13 @@ services:
      # Use target devcontainer-trt for TensorRT dev
      target: devcontainer
    ## Uncomment this block for nvidia gpu support
-    deploy:
-          resources:
-              reservations:
-                  devices:
-                      - driver: nvidia
-                        count: 1
-                        capabilities: [gpu]
+    # deploy:
+    #       resources:
+    #           reservations:
+    #               devices:
+    #                   - driver: nvidia
+    #                     count: 1
+    #                     capabilities: [gpu]
    environment:
      YOLO_MODELS: yolov7-320
    devices:
--- a/frigate/gemini.py
+++ b/frigate/gemini.py
@ -0,0 +1,79 @@
+"""Process captions through Google Gemini."""
+
+import base64
+import logging
+import queue
+import threading
+import time
+from multiprocessing import Queue
+from multiprocessing.synchronize import Event as MpEvent
+
+import google.generativeai as genai
+
+from frigate.config import FrigateConfig
+from frigate.models import Event
+
+logger = logging.getLogger(__name__)
+
+
+class GeminiProcessor(threading.Thread):
+    """Handle gemini queue and post event updates."""
+
+    def __init__(
+        self,
+        config: FrigateConfig,
+        queue: Queue,
+        stop_event: MpEvent,
+    ) -> None:
+        threading.Thread.__init__(self)
+        self.name = "gemini_processor"
+        self.config = config
+        self.queue = queue
+        self.stop_event = stop_event
+        genai.configure(api_key=config.gemini.api_key)
+        self.model = genai.GenerativeModel("gemini-pro-vision")
+
+    def run(self) -> None:
+        while not self.stop_event.is_set():
+            try:
+                (
+                    camera,
+                    event_data,
+                ) = self.queue.get(timeout=1)
+            except queue.Empty:
+                continue
+
+            camera_config = self.config.cameras[camera]
+
+            st = time.time()
+            thumbnail = {
+                "mime_type": "image/jpeg",
+                "data": base64.b64decode(event_data["thumbnail"]),
+            }
+            prompt = camera_config.gemini.object_prompts.get(
+                event_data["label"], camera_config.gemini.prompt
+            )
+
+            response = self.model.generate_content(
+                [thumbnail, prompt],
+                generation_config=genai.types.GenerationConfig(
+                    candidate_count=1,
+                    stop_sequences=["."],
+                ),
+            )
+
+            sub_label = response.text.strip()
+            Event.update(sub_label=sub_label).where(
+                Event.id == event_data["id"]
+                and (
+                    camera_config.gemini.override_existing or Event.sub_label.is_null()
+                )
+            ).execute()
+
+            logger.info(
+                "Generated sub label for %s on %s in %.4f seconds: %s",
+                event_data["id"],
+                camera,
+                time.time() - st,
+                sub_label,
+            )