mirror of https://github.com/blakeblackshear/frigate.git
synced 2026-02-07 11:45:24 +03:00

Initial vector similarity implementation
commit 3b529ede36 (parent 21609631f9)
.devcontainer/devcontainer.json

@@ -10,7 +10,7 @@
   "features": {
     "ghcr.io/devcontainers/features/common-utils:1": {}
   },
-  "forwardPorts": [5000, 5001, 5173, 1935, 8554, 8555],
+  "forwardPorts": [5000, 5001, 5173, 1935, 8000, 8554, 8555],
   "portsAttributes": {
     "5000": {
       "label": "NGINX",
@@ -28,6 +28,10 @@
       "label": "RTMP",
       "onAutoForward": "silent"
     },
+    "8000": {
+      "label": "Chroma",
+      "onAutoForward": "silent"
+    },
     "8554": {
       "label": "gortc RTSP",
       "onAutoForward": "silent"
docker/main/Dockerfile

@@ -8,7 +8,7 @@ ARG SLIM_BASE=debian:11-slim
 
 FROM ${BASE_IMAGE} AS base
 
-FROM --platform=${BUILDPLATFORM} debian:11 AS base_host
+FROM --platform=${BUILDPLATFORM} ${BASE_IMAGE} AS base_host
 
 FROM ${SLIM_BASE} AS slim-base
@@ -176,6 +176,9 @@ ARG APT_KEY_DONT_WARN_ON_DANGEROUS_USAGE=DontWarn
 ENV NVIDIA_VISIBLE_DEVICES=all
 ENV NVIDIA_DRIVER_CAPABILITIES="compute,video,utility"
 
+# Turn off Chroma Telemetry: https://docs.trychroma.com/telemetry#opting-out
+ENV ANONYMIZED_TELEMETRY=False
+
 ENV PATH="/usr/lib/btbn-ffmpeg/bin:/usr/local/go2rtc/bin:/usr/local/nginx/sbin:${PATH}"
 
 # Install dependencies
docker/main/requirements-wheels.txt

@@ -27,3 +27,9 @@ unidecode == 1.3.*
 # Openvino Library - Custom built with MYRIAD support
 openvino @ https://github.com/NateMeyer/openvino-wheels/releases/download/multi-arch_2022.3.1/openvino-2022.3.1-1-cp39-cp39-manylinux_2_31_x86_64.whl; platform_machine == 'x86_64'
 openvino @ https://github.com/NateMeyer/openvino-wheels/releases/download/multi-arch_2022.3.1/openvino-2022.3.1-1-cp39-cp39-linux_aarch64.whl; platform_machine == 'aarch64'
+# Embeddings
+onnxruntime == 1.16.*
+onnx_clip == 4.0.*
+pysqlite3-binary == 0.5.2
+chromadb == 0.4.20
+google-generativeai == 0.3.*
@@ -0,0 +1 @@
chroma

@@ -0,0 +1 @@
chroma-pipeline
docker/main/rootfs/etc/s6-overlay/s6-rc.d/chroma-log/run (Executable file, 4 lines)
@@ -0,0 +1,4 @@
#!/command/with-contenv bash
# shellcheck shell=bash

exec logutil-service /dev/shm/logs/chroma
@@ -0,0 +1 @@
longrun
docker/main/rootfs/etc/s6-overlay/s6-rc.d/chroma/finish (Executable file, 28 lines)
@@ -0,0 +1,28 @@
#!/command/with-contenv bash
# shellcheck shell=bash
# Take down the S6 supervision tree when the service exits

set -o errexit -o nounset -o pipefail

# Logs should be sent to stdout so that s6 can collect them

declare exit_code_container
exit_code_container=$(cat /run/s6-linux-init-container-results/exitcode)
readonly exit_code_container
readonly exit_code_service="${1}"
readonly exit_code_signal="${2}"
readonly service="ChromaDB"

echo "[INFO] Service ${service} exited with code ${exit_code_service} (by signal ${exit_code_signal})"

if [[ "${exit_code_service}" -eq 256 ]]; then
  if [[ "${exit_code_container}" -eq 0 ]]; then
    echo $((128 + exit_code_signal)) >/run/s6-linux-init-container-results/exitcode
  fi
elif [[ "${exit_code_service}" -ne 0 ]]; then
  if [[ "${exit_code_container}" -eq 0 ]]; then
    echo "${exit_code_service}" >/run/s6-linux-init-container-results/exitcode
  fi
fi

exec /run/s6/basedir/bin/halt
@@ -0,0 +1 @@
chroma-log
docker/main/rootfs/etc/s6-overlay/s6-rc.d/chroma/run (Executable file, 16 lines)
@@ -0,0 +1,16 @@
#!/command/with-contenv bash
# shellcheck shell=bash
# Start the ChromaDB service

set -o errexit -o nounset -o pipefail

# Logs should be sent to stdout so that s6 can collect them

# Tell S6-Overlay not to restart this service
s6-svc -O .

echo "[INFO] Starting ChromaDB..."

# Replace the bash process with the ChromaDB process, redirecting stderr to stdout
exec 2>&1
exec /usr/local/chroma run --path /config/chroma --host 127.0.0.1
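The server above is bound to 127.0.0.1 and uses chromadb's default port, 8000, which matches the port forwarded in the devcontainer change earlier. A minimal connection sketch, assuming chromadb 0.4.x and a running server (this snippet is illustrative, not part of the commit):

# Illustrative only: Frigate reaches this server over HTTP on localhost;
# chromadb's HttpClient defaults to host "localhost" and port 8000.
from chromadb import HttpClient
from chromadb.config import Settings

client = HttpClient(settings=Settings(anonymized_telemetry=False))
print(client.heartbeat())  # returns a nanosecond timestamp when the server is up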
@@ -0,0 +1 @@
120000

docker/main/rootfs/etc/s6-overlay/s6-rc.d/chroma/type (Normal file, 1 line)
@@ -0,0 +1 @@
longrun
@@ -4,7 +4,7 @@
 
 set -o errexit -o nounset -o pipefail
 
-dirs=(/dev/shm/logs/frigate /dev/shm/logs/go2rtc /dev/shm/logs/nginx)
+dirs=(/dev/shm/logs/frigate /dev/shm/logs/go2rtc /dev/shm/logs/nginx /dev/shm/logs/chroma)
 
 mkdir -p "${dirs[@]}"
 chown nobody:nogroup "${dirs[@]}"
docker/main/rootfs/usr/local/chroma (Executable file, 14 lines)
@@ -0,0 +1,14 @@
#!/usr/bin/python3
# -*- coding: utf-8 -*-
__import__("pysqlite3")

import re
import sys

sys.modules["sqlite3"] = sys.modules.pop("pysqlite3")

from chromadb.cli.cli import app

if __name__ == "__main__":
    sys.argv[0] = re.sub(r"(-script\.pyw|\.exe)?$", "", sys.argv[0])
    sys.exit(app())
frigate/app.py

@@ -1,3 +1,8 @@
+__import__("pysqlite3")
+import sys
+
+sys.modules["sqlite3"] = sys.modules.pop("pysqlite3")
+
 import faulthandler
 import threading
@@ -31,6 +31,7 @@ from frigate.const import (
     MODEL_CACHE_DIR,
     RECORD_DIR,
 )
+from frigate.embeddings.processor import EmbeddingProcessor
 from frigate.events.audio import listen_to_audio
 from frigate.events.cleanup import EventCleanup
 from frigate.events.external import ExternalEventProcessor
@@ -273,6 +274,9 @@ class FrigateApp:
         # Queue for timeline events
         self.timeline_queue: Queue = mp.Queue()
 
+        # Queue for embeddings process
+        self.embeddings_queue: Queue = mp.Queue()
+
         # Queue for inter process communication
         self.inter_process_queue: Queue = mp.Queue()
@@ -584,6 +588,12 @@ class FrigateApp:
         )
         self.timeline_processor.start()
 
+    def start_embeddings_processor(self) -> None:
+        self.embeddings_processor = EmbeddingProcessor(
+            self.config, self.embeddings_queue, self.stop_event
+        )
+        self.embeddings_processor.start()
+
     def start_event_processor(self) -> None:
         self.event_processor = EventProcessor(
             self.config,
@@ -591,6 +601,7 @@ class FrigateApp:
             self.event_queue,
             self.event_processed_queue,
             self.timeline_queue,
+            self.embeddings_queue,
             self.stop_event,
         )
         self.event_processor.start()
@@ -700,6 +711,7 @@ class FrigateApp:
         self.init_external_event_processor()
         self.init_web_server()
         self.start_timeline_processor()
+        self.start_embeddings_processor()
         self.start_event_processor()
         self.start_event_cleanup()
         self.start_record_cleanup()
@@ -742,6 +754,7 @@ class FrigateApp:
         self.record_cleanup.join()
         self.stats_emitter.join()
         self.frigate_watchdog.join()
+        self.embeddings_processor.join()
         self.db.stop()
 
         while len(self.detection_shms) > 0:
@@ -758,6 +771,7 @@ class FrigateApp:
             self.audio_recordings_info_queue,
             self.log_queue,
             self.inter_process_queue,
+            self.embeddings_queue,
         ]:
             if queue is not None:
                 while not queue.empty():
frigate/config.py

@@ -680,6 +680,23 @@ class SnapshotsConfig(FrigateBaseModel):
     )
 
 
+class SemanticSearchConfig(FrigateBaseModel):
+    enabled: bool = Field(default=False, title="Enable semantic search.")
+
+
+class GeminiConfig(FrigateBaseModel):
+    enabled: bool = Field(default=False, title="Enable Google Gemini captioning.")
+    override_existing: bool = Field(
+        default=False, title="Override existing sub labels."
+    )
+    api_key: str = Field(default="", title="Google AI Studio API Key.")
+    prompt: str = Field(
+        default="Describe the {label} in this image with as much detail as possible. Do not describe the background.",
+        title="Default caption prompt.",
+    )
+    object_prompts: Dict[str, str] = Field(default={}, title="Object specific prompts.")
+
+
 class ColorConfig(FrigateBaseModel):
     red: int = Field(default=255, ge=0, le=255, title="Red")
     green: int = Field(default=255, ge=0, le=255, title="Green")
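A minimal sketch of the new config models in use; the field names come straight from the classes above, while the values and the env-var placeholder are illustrative:

# Illustrative only: instantiate the pydantic models added in this commit.
from frigate.config import GeminiConfig, SemanticSearchConfig

semantic_search = SemanticSearchConfig(enabled=True)
gemini = GeminiConfig(
    enabled=True,
    # "{FRIGATE_GEMINI_API_KEY}" is a hypothetical variable name; placeholders
    # like this are expanded from FRIGATE_ENV_VARS in the hunks further down.
    api_key="{FRIGATE_GEMINI_API_KEY}",
    object_prompts={"person": "Describe the person in this image."},
)
print(gemini.prompt)  # falls back to the default caption prompt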
@@ -783,6 +800,9 @@ class CameraConfig(FrigateBaseModel):
     onvif: OnvifConfig = Field(
         default_factory=OnvifConfig, title="Camera Onvif Configuration."
     )
+    gemini: GeminiConfig = Field(
+        default_factory=GeminiConfig, title="Google Gemini Configuration."
+    )
     ui: CameraUiConfig = Field(
         default_factory=CameraUiConfig, title="Camera UI Modifications."
     )
@@ -1051,6 +1071,12 @@ class FrigateConfig(FrigateBaseModel):
     snapshots: SnapshotsConfig = Field(
         default_factory=SnapshotsConfig, title="Global snapshots configuration."
     )
+    semantic_search: SemanticSearchConfig = Field(
+        default_factory=SemanticSearchConfig, title="Semantic Search configuration."
+    )
+    gemini: GeminiConfig = Field(
+        default_factory=GeminiConfig, title="Global Google Gemini Configuration."
+    )
     live: CameraLiveConfig = Field(
         default_factory=CameraLiveConfig, title="Live playback settings."
     )
@@ -1090,6 +1116,10 @@ class FrigateConfig(FrigateBaseModel):
         config.mqtt.user = config.mqtt.user.format(**FRIGATE_ENV_VARS)
         config.mqtt.password = config.mqtt.password.format(**FRIGATE_ENV_VARS)
 
+        # Gemini API Key substitutions
+        if config.gemini.api_key:
+            config.gemini.api_key = config.gemini.api_key.format(**FRIGATE_ENV_VARS)
+
         # set default min_score for object attributes
         for attribute in ALL_ATTRIBUTE_LABELS:
             if not config.objects.filters.get(attribute):
@@ -1110,6 +1140,7 @@ class FrigateConfig(FrigateBaseModel):
                 "detect": ...,
                 "ffmpeg": ...,
                 "timestamp_style": ...,
+                "gemini": ...,
             },
             exclude_unset=True,
         )
@@ -1176,6 +1207,13 @@ class FrigateConfig(FrigateBaseModel):
             camera_config.onvif.password = camera_config.onvif.password.format(
                 **FRIGATE_ENV_VARS
             )
 
+            # Gemini substitution
+            if camera_config.gemini.api_key:
+                camera_config.gemini.api_key = camera_config.gemini.api_key.format(
+                    **FRIGATE_ENV_VARS
+                )
+
             # set config pre-value
             camera_config.record.enabled_in_config = camera_config.record.enabled
             camera_config.audio.enabled_in_config = camera_config.audio.enabled
frigate/const.py

@@ -1,6 +1,7 @@
 CONFIG_DIR = "/config"
 DEFAULT_DB_PATH = f"{CONFIG_DIR}/frigate.db"
 MODEL_CACHE_DIR = f"{CONFIG_DIR}/model_cache"
+DEFAULT_CHROMA_DB_PATH = f"{CONFIG_DIR}/chroma"
 BASE_DIR = "/media/frigate"
 CLIPS_DIR = f"{BASE_DIR}/clips"
 RECORD_DIR = f"{BASE_DIR}/recordings"
frigate/embeddings/__init__.py (Normal file, 0 lines)

frigate/embeddings/functions/clip.py (Normal file, 62 lines)
@@ -0,0 +1,62 @@
"""CLIP Embeddings for Frigate."""
import os
from typing import Tuple, Union

import onnxruntime as ort
from chromadb import EmbeddingFunction, Embeddings
from chromadb.api.types import (
    Documents,
    Images,
    is_document,
    is_image,
)
from onnx_clip import OnnxClip

from frigate.const import MODEL_CACHE_DIR


class Clip(OnnxClip):
    """Override load models to download to cache directory."""

    @staticmethod
    def _load_models(
        model: str,
        silent: bool,
    ) -> Tuple[ort.InferenceSession, ort.InferenceSession]:
        """
        These models are a part of the container. Treat them as such.
        """
        if model == "ViT-B/32":
            IMAGE_MODEL_FILE = "clip_image_model_vitb32.onnx"
            TEXT_MODEL_FILE = "clip_text_model_vitb32.onnx"
        elif model == "RN50":
            IMAGE_MODEL_FILE = "clip_image_model_rn50.onnx"
            TEXT_MODEL_FILE = "clip_text_model_rn50.onnx"
        else:
            raise ValueError(f"Unexpected model {model}. No `.onnx` file found.")

        models = []
        for model_file in [IMAGE_MODEL_FILE, TEXT_MODEL_FILE]:
            path = os.path.join(MODEL_CACHE_DIR, "clip", model_file)
            models.append(OnnxClip._load_model(path, silent))

        return models[0], models[1]


class ClipEmbedding(EmbeddingFunction):
    """Embedding function for CLIP model used in Chroma."""

    def __init__(self, model: str = "ViT-B/32"):
        """Initialize CLIP Embedding function."""
        self.model = Clip(model)

    def __call__(self, input: Union[Documents, Images]) -> Embeddings:
        embeddings: Embeddings = []
        for item in input:
            if is_image(item):
                result = self.model.get_image_embeddings([item])
                embeddings.append(result[0, :].tolist())
            elif is_document(item):
                result = self.model.get_text_embeddings([item])
                embeddings.append(result[0, :].tolist())
        return embeddings
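A short usage sketch of this embedding function; the dummy numpy frame and the printout are illustrative, and the ViT-B/32 .onnx files must already sit in the model cache:

# Illustrative only: one callable embeds both text and image inputs, which is
# what lets a text query be compared against stored thumbnail embeddings.
import numpy as np

from frigate.embeddings.functions.clip import ClipEmbedding

embed = ClipEmbedding(model="ViT-B/32")
text_vecs = embed(["a person walking a dog"])             # is_document branch
image_vecs = embed([np.zeros((224, 224, 3), np.uint8)])   # is_image branch
print(len(text_vecs[0]), len(image_vecs[0]))              # 512-d vectors for ViT-B/32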
frigate/embeddings/functions/minilm_l6_v2.py (Normal file, 12 lines)
@@ -0,0 +1,12 @@
"""Embedding function for ONNX MiniLM-L6 model used in Chroma."""


from chromadb.utils.embedding_functions import ONNXMiniLM_L6_V2

from frigate.const import MODEL_CACHE_DIR


class MiniLMEmbedding(ONNXMiniLM_L6_V2):
    """Override DOWNLOAD_PATH to download to cache directory."""

    DOWNLOAD_PATH = f"{MODEL_CACHE_DIR}/all-MiniLM-L6-v2"
frigate/embeddings/processor.py (Normal file, 170 lines)
@@ -0,0 +1,170 @@
"""Create a Chroma vector database for semantic search."""

import base64
import io
import logging
import queue
import threading
from multiprocessing import Queue
from multiprocessing.synchronize import Event as MpEvent

import google.generativeai as genai
import numpy as np
from chromadb import Collection
from chromadb import HttpClient as ChromaClient
from chromadb.config import Settings
from peewee import DoesNotExist
from PIL import Image
from playhouse.shortcuts import model_to_dict

from frigate.config import FrigateConfig
from frigate.models import Event

from .functions.clip import ClipEmbedding
from .functions.minilm_l6_v2 import MiniLMEmbedding

logger = logging.getLogger(__name__)


class EmbeddingProcessor(threading.Thread):
    """Handle the embeddings queue and post event updates."""

    def __init__(
        self,
        config: FrigateConfig,
        queue: Queue,
        stop_event: MpEvent,
    ) -> None:
        threading.Thread.__init__(self)
        self.name = "chroma"
        self.config = config
        self.queue = queue
        self.stop_event = stop_event
        self.chroma: ChromaClient = None
        self.thumbnail: Collection = None
        self.description: Collection = None
        self.gemini: genai.GenerativeModel = None

    def run(self) -> None:
        """Maintain a Chroma vector database for semantic search."""

        # Exit if disabled
        if not self.config.semantic_search.enabled:
            return

        # Create the database
        self.chroma = ChromaClient(settings=Settings(anonymized_telemetry=False))

        # Create/Load the collection(s)
        self.thumbnail = self.chroma.get_or_create_collection(
            name="event_thumbnail", embedding_function=ClipEmbedding()
        )
        self.description = self.chroma.get_or_create_collection(
            name="event_description", embedding_function=MiniLMEmbedding()
        )

        ## Initialize Gemini
        if self.config.gemini.enabled:
            genai.configure(api_key=self.config.gemini.api_key)
            self.gemini = genai.GenerativeModel("gemini-pro-vision")

        # Process events
        while not self.stop_event.is_set():
            try:
                (
                    event_id,
                    camera,
                ) = self.queue.get(timeout=1)
            except queue.Empty:
                continue

            camera_config = self.config.cameras[camera]

            try:
                event: Event = Event.get(Event.id == event_id)
            except DoesNotExist:
                continue

            # Extract valid event metadata
            metadata = {
                k: v
                for k, v in model_to_dict(event).items()
                if k not in ["id", "thumbnail"]
                and v is not None
                and isinstance(v, (str, int, float, bool))
            }
            thumbnail = base64.b64decode(event.thumbnail)

            # Encode the thumbnail
            self._embed_thumbnail(event.id, thumbnail, metadata)

            # Skip if we aren't generating descriptions with Gemini
            if not camera_config.gemini.enabled or (
                not camera_config.gemini.override_existing
                and event.data.get("description") is not None
            ):
                continue

            # Generate the description. Call happens in a thread since it is network bound.
            threading.Thread(
                target=self._embed_description,
                name=f"_embed_description_{event.id}",
                daemon=True,
                args=(
                    event,
                    thumbnail,
                    metadata,
                ),
            ).start()

    def _embed_thumbnail(self, event_id: str, thumbnail: bytes, metadata: dict) -> None:
        """Embed the thumbnail for an event."""

        # Encode the thumbnail
        img = np.array(Image.open(io.BytesIO(thumbnail)).convert("RGB"))
        self.thumbnail.add(
            images=[img],
            metadatas=[metadata],
            ids=[event_id],
        )

    def _embed_description(
        self, event: Event, thumbnail: bytes, metadata: dict
    ) -> None:
        """Embed the description for an event."""

        content = {
            "mime_type": "image/jpeg",
            "data": thumbnail,
        }

        # Fetch the prompt from the config and format the string replacing variables from the event
        prompt = self.config.gemini.object_prompts.get(
            event.label, self.config.gemini.prompt
        ).format(**metadata)

        response = self.gemini.generate_content(
            [content, prompt],
            generation_config=genai.types.GenerationConfig(
                candidate_count=1,
            ),
        )

        try:
            description = response.text.strip()
        except ValueError:
            # No description was generated
            return

        # Update the event to add the description
        event.data["description"] = description
        event.save()

        # Encode the description
        self.description.add(
            documents=[description],
            metadatas=[metadata],
            ids=[event.id],
        )

        logger.info("Generated description for %s: %s", event.id, description)
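For the prompt templating in _embed_description, a tiny worked example (the prompts and metadata values here are invented): the per-label prompt wins over the default, and "{label}"-style placeholders resolve from the event metadata:

# Illustrative only: how the caption prompt is resolved for a single event.
object_prompts = {"car": "Describe the {label}'s color and direction of travel."}
default_prompt = "Describe the {label} in this image with as much detail as possible."
metadata = {"label": "car", "camera": "driveway", "top_score": 0.87}

prompt = object_prompts.get(metadata["label"], default_prompt).format(**metadata)
print(prompt)  # -> Describe the car's color and direction of travel.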
frigate/events/maintainer.py

@@ -62,6 +62,7 @@ class EventProcessor(threading.Thread):
         event_queue: Queue,
         event_processed_queue: Queue,
         timeline_queue: Queue,
+        embeddings_queue: Queue,
         stop_event: MpEvent,
     ):
         threading.Thread.__init__(self)
@@ -71,6 +72,7 @@ class EventProcessor(threading.Thread):
         self.event_queue = event_queue
         self.event_processed_queue = event_processed_queue
         self.timeline_queue = timeline_queue
+        self.embeddings_queue = embeddings_queue
         self.events_in_process: Dict[str, Event] = {}
         self.stop_event = stop_event
@@ -240,6 +242,7 @@ class EventProcessor(threading.Thread):
         if event_type == "end":
             del self.events_in_process[event_data["id"]]
             self.event_processed_queue.put((event_data["id"], camera))
+            self.embeddings_queue.put((event_data["id"], camera))
 
     def handle_external_detection(self, event_type: str, event_data: Event) -> None:
         if event_type == "new":
frigate/http.py

@@ -17,6 +17,9 @@ import cv2
 import numpy as np
 import pytz
 import requests
+from chromadb import Collection, QueryResult
+from chromadb import HttpClient as ChromaClient
+from chromadb.config import Settings
 from flask import (
     Blueprint,
     Flask,
@@ -42,6 +45,8 @@ from frigate.const import (
     MAX_SEGMENT_DURATION,
     RECORD_DIR,
 )
+from frigate.embeddings.functions.clip import ClipEmbedding
+from frigate.embeddings.functions.minilm_l6_v2 import MiniLMEmbedding
 from frigate.events.external import ExternalEventProcessor
 from frigate.models import Event, Previews, Recordings, Regions, Timeline
 from frigate.object_processing import TrackedObject
@@ -103,6 +108,13 @@ def create_app(
     app.plus_api = plus_api
     app.camera_error_image = None
     app.hwaccel_errors = []
+    app.chroma = ChromaClient(settings=Settings(anonymized_telemetry=False))
+    app.thumbnail_collection = app.chroma.get_or_create_collection(
+        name="event_thumbnail", embedding_function=ClipEmbedding()
+    )
+    app.description_collection = app.chroma.get_or_create_collection(
+        name="event_description", embedding_function=MiniLMEmbedding()
+    )
 
     app.register_blueprint(bp)
@@ -998,6 +1010,7 @@ def events():
     is_submitted = request.args.get("is_submitted", type=int)
     min_length = request.args.get("min_length", type=float)
     max_length = request.args.get("max_length", type=float)
+    search = request.args.get("search", type=str) or None
 
     clauses = []
@@ -1019,16 +1032,24 @@ def events():
         Event.data,
     ]
 
+    # Start collecting filters for the embeddings metadata.
+    # We won't be able to do all the filters like we do against the DB
+    # because the table might have been modified after, but we should
+    # do what we can.
+    embeddings_filters = []
+
     if camera != "all":
         clauses.append((Event.camera == camera))
 
     if cameras != "all":
         camera_list = cameras.split(",")
         clauses.append((Event.camera << camera_list))
+        embeddings_filters.append({"camera": {"$in": camera_list}})
 
     if labels != "all":
         label_list = labels.split(",")
         clauses.append((Event.label << label_list))
+        embeddings_filters.append({"label": {"$in": label_list}})
 
     if sub_labels != "all":
         # use matching so joined sub labels are included
@@ -1071,9 +1092,11 @@ def events():
 
     if after:
         clauses.append((Event.start_time > after))
+        embeddings_filters.append({"start_time": {"$gt": after}})
 
     if before:
         clauses.append((Event.start_time < before))
+        embeddings_filters.append({"start_time": {"$lt": before}})
 
     if time_range != DEFAULT_TIME_RANGE:
         # get timezone arg to ensure browser times are used
@@ -1141,6 +1164,40 @@ def events():
     if len(clauses) == 0:
         clauses.append((True))
 
+    # Handle semantic search
+    event_order = None
+    if search is not None:
+        where = None
+        if len(embeddings_filters) > 1:
+            where = {"$and": embeddings_filters}
+        elif len(embeddings_filters) == 1:
+            where = embeddings_filters[0]
+
+        # Grab the ids of the events that match based on CLIP embeddings
+        thumbnails: Collection = current_app.thumbnail_collection
+        thumb_result: QueryResult = thumbnails.query(
+            query_texts=[search],
+            n_results=int(limit),
+            where=where,
+        )
+        thumb_ids = dict(zip(thumb_result["ids"][0], thumb_result["distances"][0]))
+
+        # Grab the ids of the events that match based on MiniLM embeddings
+        descriptions: Collection = current_app.description_collection
+        desc_result: QueryResult = descriptions.query(
+            query_texts=[search],
+            n_results=int(limit),
+            where=where,
+        )
+        desc_ids = dict(zip(desc_result["ids"][0], desc_result["distances"][0]))
+
+        event_order = {
+            k: min(i for i in (thumb_ids.get(k), desc_ids.get(k)) if i is not None)
+            for k in thumb_ids.keys() | desc_ids
+        }
+
+        clauses.append((Event.id << list(event_order.keys())))
+
     events = (
         Event.select(*selected_columns)
         .where(reduce(operator.and_, clauses))
@@ -1149,8 +1206,16 @@ def events():
         .dicts()
         .iterator()
     )
+    events = list(events)
 
-    return jsonify(list(events))
+    if event_order is not None:
+        events = [
+            {**events, "search_similarity": event_order[events["id"]]}
+            for events in events
+        ]
+        events = sorted(events, key=lambda x: x["search_similarity"])
+
+    return jsonify(events)
 
 
 @bp.route("/events/<camera_name>/<label>/create", methods=["POST"])
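A worked example of the ordering merge in the hunks above (the ids and distances are made up): each Chroma query returns ids with distances, the two result sets are combined per event id keeping the smaller (closer) distance, and the response is sorted ascending:

# Illustrative only: mirrors the event_order merge from the events() endpoint.
thumb_ids = {"evt_a": 0.42, "evt_b": 0.91}   # CLIP thumbnail matches
desc_ids = {"evt_b": 0.37, "evt_c": 0.58}    # MiniLM description matches

event_order = {
    k: min(i for i in (thumb_ids.get(k), desc_ids.get(k)) if i is not None)
    for k in thumb_ids.keys() | desc_ids
}
# {'evt_a': 0.42, 'evt_b': 0.37, 'evt_c': 0.58}; evt_b sorts first in the response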
@@ -2326,6 +2391,7 @@ def logs(service: str):
         "frigate": "/dev/shm/logs/frigate/current",
         "go2rtc": "/dev/shm/logs/go2rtc/current",
         "nginx": "/dev/shm/logs/nginx/current",
+        "chroma": "/dev/shm/logs/chroma/current",
     }
     service_location = log_locations.get(service)
web/src/components/TextField.jsx

@@ -71,7 +71,7 @@ export default function TextField({
       ) : null}
       <div className="relative w-full">
         <input
-          className="h-6 mt-6 w-full bg-transparent focus:outline-none focus:ring-0"
+          className="h-6 mt-6 w-full bg-transparent border-0 focus:outline-none focus:ring-0"
           onBlur={handleBlur}
           onFocus={handleFocus}
           onInput={handleChange}
web/src/routes/Events.jsx

@@ -27,6 +27,7 @@ import Button from '../components/Button';
 import Dialog from '../components/Dialog';
 import MultiSelect from '../components/MultiSelect';
 import { formatUnixTimestampToDateTime, getDurationFromTimestamps } from '../utils/dateUtil';
+import TextField from '../components/TextField';
 import TimeAgo from '../components/TimeAgo';
 import Timepicker from '../components/TimePicker';
 import TimelineSummary from '../components/TimelineSummary';
@@ -186,6 +187,17 @@ export default function Events({ path, ...props }) {
     }
   };
 
+  let searchTimeout;
+  const onChangeSearchText = (text) => {
+    if (searchParams?.search == text) {
+      return;
+    }
+    clearTimeout(searchTimeout);
+    searchTimeout = setTimeout(() => {
+      onFilter('search', text);
+    }, 500);
+  };
+
   const onToggleNamedFilter = (name, item) => {
     let items;
@@ -367,6 +379,9 @@ export default function Events({ path, ...props }) {
   return (
     <div className="space-y-4 p-2 px-4 w-full">
       <Heading>Events</Heading>
+      <div className="flex flex-wrap gap-2 items-center">
+        <TextField label="Search" onChangeText={(text) => onChangeSearchText(text)} />
+      </div>
       <div className="flex flex-wrap gap-2 items-center">
         <MultiSelect
           className="basis-1/5 cursor-pointer rounded dark:bg-slate-800"
@@ -801,7 +816,9 @@ function Event({
         {event.label.replaceAll('_', ' ')}
         {event.sub_label ? `: ${event.sub_label.replaceAll('_', ' ')}` : null}
       </div>
+      {event?.data?.description ? (
+        <div className="text-sm flex flex-col grow pb-2">{event.data.description}</div>
+      ) : null}
       <div className="text-sm flex">
         <Clock className="h-5 w-5 mr-2 inline" />
         {formatUnixTimestampToDateTime(event.start_time, { ...config.ui })}