Merge branch 'dev' of https://github.com/blakeblackshear/frigate into addon_config

This commit is contained in:
Felipe Santos 2025-03-09 14:29:42 -03:00
commit 12460e65f2
191 changed files with 7204 additions and 4120 deletions

View File

@ -8,9 +8,25 @@
"overrideCommand": false,
"remoteUser": "vscode",
"features": {
"ghcr.io/devcontainers/features/common-utils:1": {}
"ghcr.io/devcontainers/features/common-utils:2": {}
// Uncomment the following lines to use ONNX Runtime with CUDA support
// "ghcr.io/devcontainers/features/nvidia-cuda:1": {
// "installCudnn": true,
// "installNvtx": true,
// "installToolkit": true,
// "cudaVersion": "12.5",
// "cudnnVersion": "9.4.0.58"
// },
// "./features/onnxruntime-gpu": {}
},
"forwardPorts": [8971, 5000, 5001, 5173, 8554, 8555],
"forwardPorts": [
8971,
5000,
5001,
5173,
8554,
8555
],
"portsAttributes": {
"8971": {
"label": "External NGINX",
@ -64,10 +80,18 @@
"editor.formatOnType": true,
"python.testing.pytestEnabled": false,
"python.testing.unittestEnabled": true,
"python.testing.unittestArgs": ["-v", "-s", "./frigate/test"],
"python.testing.unittestArgs": [
"-v",
"-s",
"./frigate/test"
],
"files.trimTrailingWhitespace": true,
"eslint.workingDirectories": ["./web"],
"isort.args": ["--settings-path=./pyproject.toml"],
"eslint.workingDirectories": [
"./web"
],
"isort.args": [
"--settings-path=./pyproject.toml"
],
"[python]": {
"editor.defaultFormatter": "charliermarsh.ruff",
"editor.formatOnSave": true,
@ -86,9 +110,16 @@
],
"editor.tabSize": 2
},
"cSpell.ignoreWords": ["rtmp"],
"cSpell.words": ["preact", "astype", "hwaccel", "mqtt"]
"cSpell.ignoreWords": [
"rtmp"
],
"cSpell.words": [
"preact",
"astype",
"hwaccel",
"mqtt"
]
}
}
}
}
}

View File

@ -0,0 +1,22 @@
{
"id": "onnxruntime-gpu",
"version": "0.0.1",
"name": "ONNX Runtime GPU (Nvidia)",
"description": "Installs ONNX Runtime for Nvidia GPUs.",
"documentationURL": "",
"options": {
"version": {
"type": "string",
"proposals": [
"latest",
"1.20.1",
"1.20.0"
],
"default": "latest",
"description": "Version of ONNX Runtime to install"
}
},
"installsAfter": [
"ghcr.io/devcontainers/features/nvidia-cuda"
]
}

View File

@ -0,0 +1,15 @@
#!/usr/bin/env bash
set -e
VERSION=${VERSION}
python3 -m pip config set global.break-system-packages true
# if VERSION == "latest" or VERSION is empty, install the latest version
if [ "$VERSION" == "latest" ] || [ -z "$VERSION" ]; then
python3 -m pip install onnxruntime-gpu
else
python3 -m pip install onnxruntime-gpu==$VERSION
fi
echo "Done!"

View File

@ -19,7 +19,7 @@ sudo chown -R "$(id -u):$(id -g)" /media/frigate
# When started as a service, LIBAVFORMAT_VERSION_MAJOR is defined in the
# s6 service file. For dev, where frigate is started from an interactive
# shell, we define it in .bashrc instead.
echo 'export LIBAVFORMAT_VERSION_MAJOR=$(/usr/lib/ffmpeg/7.0/bin/ffmpeg -version | grep -Po "libavformat\W+\K\d+")' >> $HOME/.bashrc
echo 'export LIBAVFORMAT_VERSION_MAJOR=$("$(python3 /usr/local/ffmpeg/get_ffmpeg_path.py)" -version | grep -Po "libavformat\W+\K\d+")' >> "$HOME/.bashrc"
make version

View File

@ -42,7 +42,7 @@ jobs:
tags: ${{ steps.setup.outputs.image-name }}-amd64
cache-from: type=registry,ref=${{ steps.setup.outputs.cache-name }}-amd64
arm64_build:
runs-on: ubuntu-22.04
runs-on: ubuntu-22.04-arm
name: ARM Build
steps:
- name: Check out code
@ -107,7 +107,7 @@ jobs:
*.cache-from=type=registry,ref=${{ steps.setup.outputs.cache-name }}-jp5
*.cache-to=type=registry,ref=${{ steps.setup.outputs.cache-name }}-jp5,mode=max
jetson_jp6_build:
runs-on: ubuntu-22.04
runs-on: ubuntu-22.04-arm
name: Jetson Jetpack 6
steps:
- name: Check out code
@ -175,9 +175,10 @@ jobs:
files: docker/rocm/rocm.hcl
set: |
rocm.tags=${{ steps.setup.outputs.image-name }}-rocm
*.cache-to=type=registry,ref=${{ steps.setup.outputs.cache-name }}-rocm,mode=max
*.cache-from=type=gha
arm64_extra_builds:
runs-on: ubuntu-22.04
runs-on: ubuntu-22.04-arm
name: ARM Extra Build
needs:
- arm64_build

View File

@ -24,7 +24,7 @@ jobs:
persist-credentials: false
- uses: actions/setup-node@master
with:
node-version: 16.x
node-version: 20.x
- name: Install devcontainer cli
run: npm install --global @devcontainers/cli
- name: Build devcontainer
@ -64,6 +64,9 @@ jobs:
node-version: 20.x
- run: npm install
working-directory: ./web
- name: Build web
run: npm run build
working-directory: ./web
# - name: Test
# run: npm run test
# working-directory: ./web
@ -77,7 +80,7 @@ jobs:
with:
persist-credentials: false
- name: Set up Python ${{ env.DEFAULT_PYTHON }}
uses: actions/setup-python@v5.3.0
uses: actions/setup-python@v5.4.0
with:
python-version: ${{ env.DEFAULT_PYTHON }}
- name: Install requirements
@ -99,14 +102,6 @@ jobs:
uses: actions/checkout@v4
with:
persist-credentials: false
- uses: actions/setup-node@master
with:
node-version: 16.x
- run: npm install
working-directory: ./web
- name: Build web
run: npm run build
working-directory: ./web
- name: Set up QEMU
uses: docker/setup-qemu-action@v3
- name: Set up Docker Buildx

View File

@ -14,16 +14,18 @@ ARG BASE_HOOK=
FROM ${BASE_IMAGE} AS base
ARG PIP_BREAK_SYSTEM_PACKAGES
ARG BASE_HOOK
RUN ${BASE_HOOK}
RUN sh -c "$BASE_HOOK"
FROM --platform=${BUILDPLATFORM} debian:12 AS base_host
ARG PIP_BREAK_SYSTEM_PACKAGES
FROM ${SLIM_BASE} AS slim-base
ARG PIP_BREAK_SYSTEM_PACKAGES
ARG BASE_HOOK
RUN ${BASE_HOOK}
RUN sh -c "$BASE_HOOK"
FROM slim-base AS wget
ARG DEBIAN_FRONTEND
@ -37,10 +39,7 @@ ARG DEBIAN_FRONTEND
ENV CCACHE_DIR /root/.ccache
ENV CCACHE_MAXSIZE 2G
# bind /var/cache/apt to tmpfs to speed up nginx build
RUN --mount=type=tmpfs,target=/tmp --mount=type=tmpfs,target=/var/cache/apt \
--mount=type=bind,source=docker/main/build_nginx.sh,target=/deps/build_nginx.sh \
--mount=type=cache,target=/root/.ccache \
RUN --mount=type=bind,source=docker/main/build_nginx.sh,target=/deps/build_nginx.sh \
/deps/build_nginx.sh
FROM wget AS sqlite-vec
@ -223,14 +222,22 @@ ENV TRANSFORMERS_NO_ADVISORY_WARNINGS=1
# Set OpenCV ffmpeg loglevel to fatal: https://ffmpeg.org/doxygen/trunk/log_8h.html
ENV OPENCV_FFMPEG_LOGLEVEL=8
# Set HailoRT to disable logging
ENV HAILORT_LOGGER_PATH=NONE
ENV PATH="/usr/local/go2rtc/bin:/usr/local/tempio/bin:/usr/local/nginx/sbin:${PATH}"
# Install dependencies
RUN --mount=type=bind,source=docker/main/install_deps.sh,target=/deps/install_deps.sh \
/deps/install_deps.sh
ENV DEFAULT_FFMPEG_VERSION="7.0"
ENV INCLUDED_FFMPEG_VERSIONS="${DEFAULT_FFMPEG_VERSION}:5.0"
RUN wget -q https://bootstrap.pypa.io/get-pip.py -O get-pip.py \
&& python3 get-pip.py "pip"
RUN --mount=type=bind,from=wheels,source=/wheels,target=/deps/wheels \
python3 -m pip install --upgrade pip && \
pip3 install -U /deps/wheels/*.whl
COPY --from=deps-rootfs / /

View File

@ -6,13 +6,13 @@ apt-get -qq update
apt-get -qq install --no-install-recommends -y \
apt-transport-https \
ca-certificates \
gnupg \
wget \
lbzip2 \
procps vainfo \
unzip locales tzdata libxml2 xz-utils \
python3.11 \
python3-pip \
curl \
lsof \
jq \
@ -31,28 +31,28 @@ unset DEBIAN_FRONTEND
yes | dpkg -i /tmp/libedgetpu1-max.deb && export DEBIAN_FRONTEND=noninteractive
rm /tmp/libedgetpu1-max.deb
# btbn-ffmpeg -> amd64
# ffmpeg -> amd64
if [[ "${TARGETARCH}" == "amd64" ]]; then
mkdir -p /usr/lib/ffmpeg/5.0
wget -qO ffmpeg.tar.xz "https://github.com/NickM-27/FFmpeg-Builds/releases/download/autobuild-2022-07-31-12-37/ffmpeg-n5.1-2-g915ef932a3-linux64-gpl-5.1.tar.xz"
tar -xf ffmpeg.tar.xz -C /usr/lib/ffmpeg/5.0 --strip-components 1 amd64/bin/ffmpeg amd64/bin/ffprobe
rm -rf ffmpeg.tar.xz
mkdir -p /usr/lib/ffmpeg/7.0
wget -qO btbn-ffmpeg.tar.xz "https://github.com/NickM-27/FFmpeg-Builds/releases/download/autobuild-2022-07-31-12-37/ffmpeg-n5.1-2-g915ef932a3-linux64-gpl-5.1.tar.xz"
tar -xf btbn-ffmpeg.tar.xz -C /usr/lib/ffmpeg/5.0 --strip-components 1
rm -rf btbn-ffmpeg.tar.xz /usr/lib/ffmpeg/5.0/doc /usr/lib/ffmpeg/5.0/bin/ffplay
wget -qO btbn-ffmpeg.tar.xz "https://github.com/NickM-27/FFmpeg-Builds/releases/download/autobuild-2024-09-19-12-51/ffmpeg-n7.0.2-18-g3e6cec1286-linux64-gpl-7.0.tar.xz"
tar -xf btbn-ffmpeg.tar.xz -C /usr/lib/ffmpeg/7.0 --strip-components 1
rm -rf btbn-ffmpeg.tar.xz /usr/lib/ffmpeg/7.0/doc /usr/lib/ffmpeg/7.0/bin/ffplay
wget -qO ffmpeg.tar.xz "https://github.com/NickM-27/FFmpeg-Builds/releases/download/autobuild-2024-09-19-12-51/ffmpeg-n7.0.2-18-g3e6cec1286-linux64-gpl-7.0.tar.xz"
tar -xf ffmpeg.tar.xz -C /usr/lib/ffmpeg/7.0 --strip-components 1 amd64/bin/ffmpeg amd64/bin/ffprobe
rm -rf ffmpeg.tar.xz
fi
# ffmpeg -> arm64
if [[ "${TARGETARCH}" == "arm64" ]]; then
mkdir -p /usr/lib/ffmpeg/5.0
wget -qO ffmpeg.tar.xz "https://github.com/NickM-27/FFmpeg-Builds/releases/download/autobuild-2022-07-31-12-37/ffmpeg-n5.1-2-g915ef932a3-linuxarm64-gpl-5.1.tar.xz"
tar -xf ffmpeg.tar.xz -C /usr/lib/ffmpeg/5.0 --strip-components 1 arm64/bin/ffmpeg arm64/bin/ffprobe
rm -f ffmpeg.tar.xz
mkdir -p /usr/lib/ffmpeg/7.0
wget -qO btbn-ffmpeg.tar.xz "https://github.com/NickM-27/FFmpeg-Builds/releases/download/autobuild-2022-07-31-12-37/ffmpeg-n5.1-2-g915ef932a3-linuxarm64-gpl-5.1.tar.xz"
tar -xf btbn-ffmpeg.tar.xz -C /usr/lib/ffmpeg/5.0 --strip-components 1
rm -rf btbn-ffmpeg.tar.xz /usr/lib/ffmpeg/5.0/doc /usr/lib/ffmpeg/5.0/bin/ffplay
wget -qO btbn-ffmpeg.tar.xz "https://github.com/NickM-27/FFmpeg-Builds/releases/download/autobuild-2024-09-19-12-51/ffmpeg-n7.0.2-18-g3e6cec1286-linuxarm64-gpl-7.0.tar.xz"
tar -xf btbn-ffmpeg.tar.xz -C /usr/lib/ffmpeg/7.0 --strip-components 1
rm -rf btbn-ffmpeg.tar.xz /usr/lib/ffmpeg/7.0/doc /usr/lib/ffmpeg/7.0/bin/ffplay
wget -qO ffmpeg.tar.xz "https://github.com/NickM-27/FFmpeg-Builds/releases/download/autobuild-2024-09-19-12-51/ffmpeg-n7.0.2-18-g3e6cec1286-linuxarm64-gpl-7.0.tar.xz"
tar -xf ffmpeg.tar.xz -C /usr/lib/ffmpeg/7.0 --strip-components 1 arm64/bin/ffmpeg arm64/bin/ffprobe
rm -f ffmpeg.tar.xz
fi
# arch specific packages

View File

@ -1,7 +1,7 @@
aiofiles == 24.1.*
click == 8.1.*
# FastAPI
aiohttp == 3.11.2
aiohttp == 3.11.3
starlette == 0.41.2
starlette-context == 0.3.6
fastapi == 0.115.*
@ -20,9 +20,9 @@ pandas == 2.2.*
peewee == 3.17.*
peewee_migrate == 1.13.*
psutil == 6.1.*
pydantic == 2.8.*
pydantic == 2.10.*
git+https://github.com/fbcotter/py3nvml#egg=py3nvml
pytz == 2024.*
pytz == 2025.*
pyzmq == 26.2.*
ruamel.yaml == 0.18.*
tzlocal == 5.2
@ -34,8 +34,8 @@ ws4py == 0.5.*
unidecode == 1.3.*
# Image Manipulation
numpy == 1.26.*
opencv-python-headless == 4.10.0.*
opencv-contrib-python == 4.9.0.*
opencv-python-headless == 4.11.0.*
opencv-contrib-python == 4.11.0.*
scipy == 1.14.*
# OpenVino & ONNX
openvino == 2024.4.*
@ -46,7 +46,7 @@ transformers == 4.45.*
# Generative AI
google-generativeai == 0.8.*
ollama == 0.3.*
openai == 1.51.*
openai == 1.65.*
# push notifications
py-vapid == 1.9.*
pywebpush == 2.0.*
@ -54,7 +54,6 @@ pywebpush == 2.0.*
pyclipper == 1.3.*
shapely == 2.0.*
Levenshtein==0.26.*
prometheus-client == 0.21.*
# HailoRT Wheels
appdirs==1.4.*
argcomplete==2.0.*
@ -70,5 +69,5 @@ verboselogs==1.7.*
virtualenv==20.17.*
prometheus-client == 0.21.*
# TFLite
tflite_runtime @ https://github.com/feranick/TFlite-builds/releases/download/v2.17.1/tflite_runtime-2.17.1-cp311-cp311-linux_x86_64.whl; platform_machine == 'x86_64'
tflite_runtime @ https://github.com/frigate-nvr/TFlite-builds/releases/download/v2.17.1/tflite_runtime-2.17.1-cp311-cp311-linux_x86_64.whl; platform_machine == 'x86_64'
tflite_runtime @ https://github.com/feranick/TFlite-builds/releases/download/v2.17.1/tflite_runtime-2.17.1-cp311-cp311-linux_aarch64.whl; platform_machine == 'aarch64'

View File

@ -82,8 +82,10 @@ function migrate_db_from_media_to_config() {
}
function set_libva_version() {
local ffmpeg_path=$(python3 /usr/local/ffmpeg/get_ffmpeg_path.py)
export LIBAVFORMAT_VERSION_MAJOR=$($ffmpeg_path -version | grep -Po "libavformat\W+\K\d+")
local ffmpeg_path
ffmpeg_path=$(python3 /usr/local/ffmpeg/get_ffmpeg_path.py)
LIBAVFORMAT_VERSION_MAJOR=$("$ffmpeg_path" -version | grep -Po "libavformat\W+\K\d+")
export LIBAVFORMAT_VERSION_MAJOR
}
echo "[INFO] Preparing Frigate..."

View File

@ -44,10 +44,14 @@ function get_ip_and_port_from_supervisor() {
}
function set_libva_version() {
local ffmpeg_path=$(python3 /usr/local/ffmpeg/get_ffmpeg_path.py)
export LIBAVFORMAT_VERSION_MAJOR=$($ffmpeg_path -version | grep -Po "libavformat\W+\K\d+")
local ffmpeg_path
ffmpeg_path=$(python3 /usr/local/ffmpeg/get_ffmpeg_path.py)
LIBAVFORMAT_VERSION_MAJOR=$("$ffmpeg_path" -version | grep -Po "libavformat\W+\K\d+")
export LIBAVFORMAT_VERSION_MAJOR
}
set_libva_version
if [[ -f "/dev/shm/go2rtc.yaml" ]]; then
echo "[INFO] Removing stale config from last run..."
rm /dev/shm/go2rtc.yaml
@ -66,8 +70,6 @@ else
echo "[WARNING] Unable to remove existing go2rtc config. Changes made to your frigate config file may not be recognized. Please remove the /dev/shm/go2rtc.yaml from your docker host manually."
fi
set_libva_version
readonly config_path="/config"
if [[ -x "${config_path}/go2rtc" ]]; then

View File

@ -1,6 +1,5 @@
import json
import os
import shutil
import sys
from ruamel.yaml import YAML
@ -35,10 +34,7 @@ except FileNotFoundError:
path = config.get("ffmpeg", {}).get("path", "default")
if path == "default":
if shutil.which("ffmpeg") is None:
print(f"/usr/lib/ffmpeg/{DEFAULT_FFMPEG_VERSION}/bin/ffmpeg")
else:
print("ffmpeg")
print(f"/usr/lib/ffmpeg/{DEFAULT_FFMPEG_VERSION}/bin/ffmpeg")
elif path in INCLUDED_FFMPEG_VERSIONS:
print(f"/usr/lib/ffmpeg/{path}/bin/ffmpeg")
else:

View File

@ -2,7 +2,6 @@
import json
import os
import shutil
import sys
from pathlib import Path
@ -13,6 +12,7 @@ from frigate.const import (
BIRDSEYE_PIPE,
DEFAULT_FFMPEG_VERSION,
INCLUDED_FFMPEG_VERSIONS,
LIBAVFORMAT_VERSION_MAJOR,
)
from frigate.ffmpeg_presets import parse_preset_hardware_acceleration_encode
@ -115,10 +115,7 @@ else:
# ensure ffmpeg path is set correctly
path = config.get("ffmpeg", {}).get("path", "default")
if path == "default":
if shutil.which("ffmpeg") is None:
ffmpeg_path = f"/usr/lib/ffmpeg/{DEFAULT_FFMPEG_VERSION}/bin/ffmpeg"
else:
ffmpeg_path = "ffmpeg"
ffmpeg_path = f"/usr/lib/ffmpeg/{DEFAULT_FFMPEG_VERSION}/bin/ffmpeg"
elif path in INCLUDED_FFMPEG_VERSIONS:
ffmpeg_path = f"/usr/lib/ffmpeg/{path}/bin/ffmpeg"
else:
@ -130,14 +127,12 @@ elif go2rtc_config["ffmpeg"].get("bin") is None:
go2rtc_config["ffmpeg"]["bin"] = ffmpeg_path
# need to replace ffmpeg command when using ffmpeg4
if int(os.environ.get("LIBAVFORMAT_VERSION_MAJOR", "59") or "59") < 59:
if go2rtc_config["ffmpeg"].get("rtsp") is None:
go2rtc_config["ffmpeg"]["rtsp"] = (
"-fflags nobuffer -flags low_delay -stimeout 5000000 -user_agent go2rtc/ffmpeg -rtsp_transport tcp -i {input}"
)
else:
if LIBAVFORMAT_VERSION_MAJOR < 59:
rtsp_args = "-fflags nobuffer -flags low_delay -stimeout 5000000 -user_agent go2rtc/ffmpeg -rtsp_transport tcp -i {input}"
if go2rtc_config.get("ffmpeg") is None:
go2rtc_config["ffmpeg"] = {"path": ""}
go2rtc_config["ffmpeg"] = {"rtsp": rtsp_args}
elif go2rtc_config["ffmpeg"].get("rtsp") is None:
go2rtc_config["ffmpeg"]["rtsp"] = rtsp_args
for name in go2rtc_config.get("streams", {}):
stream = go2rtc_config["streams"][name]

View File

@ -1,14 +1,16 @@
## Send a subrequest to verify if the user is authenticated and has permission to access the resource.
auth_request /auth;
## Save the upstream metadata response headers from Authelia to variables.
## Save the upstream metadata response headers from the auth request to variables
auth_request_set $user $upstream_http_remote_user;
auth_request_set $role $upstream_http_remote_role;
auth_request_set $groups $upstream_http_remote_groups;
auth_request_set $name $upstream_http_remote_name;
auth_request_set $email $upstream_http_remote_email;
## Inject the metadata response headers from the variables into the request made to the backend.
proxy_set_header Remote-User $user;
proxy_set_header Remote-Role $role;
proxy_set_header Remote-Groups $groups;
proxy_set_header Remote-Email $email;
proxy_set_header Remote-Name $name;

View File

@ -3,6 +3,9 @@
# https://askubuntu.com/questions/972516/debian-frontend-environment-variable
ARG DEBIAN_FRONTEND=noninteractive
# Globally set pip break-system-packages option to avoid having to specify it every time
ARG PIP_BREAK_SYSTEM_PACKAGES=1
FROM wheels as rk-wheels
COPY docker/main/requirements-wheels.txt /requirements-wheels.txt
COPY docker/rockchip/requirements-wheels-rk.txt /requirements-wheels-rk.txt
@ -13,6 +16,7 @@ RUN rm -rf /rk-wheels/opencv_python-*
FROM deps AS rk-frigate
ARG TARGETARCH
ARG PIP_BREAK_SYSTEM_PACKAGES
RUN --mount=type=bind,from=rk-wheels,source=/rk-wheels,target=/deps/rk-wheels \
pip3 install --no-deps -U /deps/rk-wheels/*.whl
@ -24,8 +28,7 @@ COPY docker/rockchip/conv2rknn.py /opt/conv2rknn.py
ADD https://github.com/MarcA711/rknn-toolkit2/releases/download/v2.3.0/librknnrt.so /usr/lib/
RUN rm -rf /usr/lib/btbn-ffmpeg/bin/ffmpeg
RUN rm -rf /usr/lib/btbn-ffmpeg/bin/ffprobe
ADD --chmod=111 https://github.com/MarcA711/Rockchip-FFmpeg-Builds/releases/download/6.1-7/ffmpeg /usr/lib/ffmpeg/6.0/bin/
ADD --chmod=111 https://github.com/MarcA711/Rockchip-FFmpeg-Builds/releases/download/6.1-7/ffprobe /usr/lib/ffmpeg/6.0/bin/
ENV PATH="/usr/lib/ffmpeg/6.0/bin/:${PATH}"
ENV DEFAULT_FFMPEG_VERSION="6.0"
ENV INCLUDED_FFMPEG_VERSIONS="${DEFAULT_FFMPEG_VERSION}:${INCLUDED_FFMPEG_VERSIONS}"

View File

@ -2,79 +2,49 @@
# https://askubuntu.com/questions/972516/debian-frontend-environment-variable
ARG DEBIAN_FRONTEND=noninteractive
ARG ROCM=5.7.3
ARG ROCM=6.3.3
ARG AMDGPU=gfx900
ARG HSA_OVERRIDE_GFX_VERSION
ARG HSA_OVERRIDE
#######################################################################
FROM ubuntu:focal as rocm
FROM wget AS rocm
ARG ROCM
ARG AMDGPU
RUN apt-get update && apt-get -y upgrade
RUN apt-get -y install gnupg wget
RUN mkdir --parents --mode=0755 /etc/apt/keyrings
RUN wget https://repo.radeon.com/rocm/rocm.gpg.key -O - | gpg --dearmor | tee /etc/apt/keyrings/rocm.gpg > /dev/null
COPY docker/rocm/rocm.list /etc/apt/sources.list.d/
COPY docker/rocm/rocm-pin-600 /etc/apt/preferences.d/
RUN apt-get update
RUN apt-get -y install --no-install-recommends migraphx hipfft roctracer
RUN apt-get -y install --no-install-recommends migraphx-dev
RUN apt update && \
apt install -y wget gpg && \
wget -O rocm.deb https://repo.radeon.com/amdgpu-install/$ROCM/ubuntu/jammy/amdgpu-install_6.3.60303-1_all.deb && \
apt install -y ./rocm.deb && \
apt update && \
apt install -y rocm
RUN mkdir -p /opt/rocm-dist/opt/rocm-$ROCM/lib
RUN cd /opt/rocm-$ROCM/lib && cp -dpr libMIOpen*.so* libamd*.so* libhip*.so* libhsa*.so* libmigraphx*.so* librocm*.so* librocblas*.so* libroctracer*.so* librocfft*.so* /opt/rocm-dist/opt/rocm-$ROCM/lib/
RUN cd /opt/rocm-$ROCM/lib && \
cp -dpr libMIOpen*.so* libamd*.so* libhip*.so* libhsa*.so* libmigraphx*.so* librocm*.so* librocblas*.so* libroctracer*.so* librocfft*.so* librocprofiler*.so* libroctx*.so* /opt/rocm-dist/opt/rocm-$ROCM/lib/ && \
mkdir -p /opt/rocm-dist/opt/rocm-$ROCM/lib/migraphx/lib && \
cp -dpr migraphx/lib/* /opt/rocm-dist/opt/rocm-$ROCM/lib/migraphx/lib
RUN cd /opt/rocm-dist/opt/ && ln -s rocm-$ROCM rocm
RUN mkdir -p /opt/rocm-dist/etc/ld.so.conf.d/
RUN echo /opt/rocm/lib|tee /opt/rocm-dist/etc/ld.so.conf.d/rocm.conf
#######################################################################
FROM --platform=linux/amd64 debian:12 as debian-base
RUN apt-get update && apt-get -y upgrade
RUN apt-get -y install --no-install-recommends libelf1 libdrm2 libdrm-amdgpu1 libnuma1 kmod
RUN apt-get -y install python3
#######################################################################
# ROCm does not come with migraphx wrappers for python 3.9, so we build it here
FROM debian-base as debian-build
ARG ROCM
COPY --from=rocm /opt/rocm-$ROCM /opt/rocm-$ROCM
RUN ln -s /opt/rocm-$ROCM /opt/rocm
RUN apt-get -y install g++ cmake
RUN apt-get -y install python3-pybind11 python3-distutils python3-dev
WORKDIR /opt/build
COPY docker/rocm/migraphx .
RUN mkdir build && cd build && cmake .. && make install
#######################################################################
FROM deps AS deps-prelim
# need this to install libnuma1
RUN apt-get update
# no ugprade?!?!
RUN apt-get -y install libnuma1
RUN apt-get update && apt-get install -y libnuma1
WORKDIR /opt/frigate/
WORKDIR /opt/frigate
COPY --from=rootfs / /
# Temporarily disabled to see if a new wheel can be built to support py3.11
#COPY docker/rocm/requirements-wheels-rocm.txt /requirements.txt
#RUN python3 -m pip install --upgrade pip \
# && pip3 uninstall -y onnxruntime-openvino \
# && pip3 install -r /requirements.txt
RUN wget -q https://bootstrap.pypa.io/get-pip.py -O get-pip.py \
&& python3 get-pip.py "pip" --break-system-packages
RUN python3 -m pip config set global.break-system-packages true
COPY docker/rocm/requirements-wheels-rocm.txt /requirements.txt
RUN pip3 uninstall -y onnxruntime-openvino \
&& pip3 install -r /requirements.txt
#######################################################################
FROM scratch AS rocm-dist
@ -87,12 +57,11 @@ COPY --from=rocm /opt/rocm-$ROCM/share/miopen/db/*$AMDGPU* /opt/rocm-$ROCM/share
COPY --from=rocm /opt/rocm-$ROCM/share/miopen/db/*gfx908* /opt/rocm-$ROCM/share/miopen/db/
COPY --from=rocm /opt/rocm-$ROCM/lib/rocblas/library/*$AMDGPU* /opt/rocm-$ROCM/lib/rocblas/library/
COPY --from=rocm /opt/rocm-dist/ /
COPY --from=debian-build /opt/rocm/lib/migraphx.cpython-311-x86_64-linux-gnu.so /opt/rocm-$ROCM/lib/
#######################################################################
FROM deps-prelim AS rocm-prelim-hsa-override0
ENV HSA_ENABLE_SDMA=0
ENV HSA_ENABLE_SDMA=0
ENV MIGRAPHX_ENABLE_NHWC=1
COPY --from=rocm-dist / /

View File

@ -1,26 +0,0 @@
cmake_minimum_required(VERSION 3.1)
set(CMAKE_CXX_STANDARD 17)
set(CMAKE_CXX_STANDARD_REQUIRED ON)
set(CMAKE_CXX_EXTENSIONS OFF)
if(NOT CMAKE_BUILD_TYPE)
set(CMAKE_BUILD_TYPE Release)
endif()
SET(CMAKE_INSTALL_RPATH_USE_LINK_PATH TRUE)
project(migraphx_py)
include_directories(/opt/rocm/include)
find_package(pybind11 REQUIRED)
pybind11_add_module(migraphx migraphx_py.cpp)
target_link_libraries(migraphx PRIVATE /opt/rocm/lib/libmigraphx.so /opt/rocm/lib/libmigraphx_tf.so /opt/rocm/lib/libmigraphx_onnx.so)
install(TARGETS migraphx
COMPONENT python
LIBRARY DESTINATION /opt/rocm/lib
)

View File

@ -1,582 +0,0 @@
/*
* The MIT License (MIT)
*
* Copyright (c) 2015-2022 Advanced Micro Devices, Inc. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a copy
* of this software and associated documentation files (the "Software"), to deal
* in the Software without restriction, including without limitation the rights
* to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
* copies of the Software, and to permit persons to whom the Software is
* furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
* THE SOFTWARE.
*/
#include <pybind11/pybind11.h>
#include <pybind11/stl.h>
#include <pybind11/numpy.h>
#include <migraphx/program.hpp>
#include <migraphx/instruction_ref.hpp>
#include <migraphx/operation.hpp>
#include <migraphx/quantization.hpp>
#include <migraphx/generate.hpp>
#include <migraphx/instruction.hpp>
#include <migraphx/ref/target.hpp>
#include <migraphx/stringutils.hpp>
#include <migraphx/tf.hpp>
#include <migraphx/onnx.hpp>
#include <migraphx/load_save.hpp>
#include <migraphx/register_target.hpp>
#include <migraphx/json.hpp>
#include <migraphx/make_op.hpp>
#include <migraphx/op/common.hpp>
#ifdef HAVE_GPU
#include <migraphx/gpu/hip.hpp>
#endif
using half = half_float::half;
namespace py = pybind11;
#ifdef __clang__
#define MIGRAPHX_PUSH_UNUSED_WARNING \
_Pragma("clang diagnostic push") \
_Pragma("clang diagnostic ignored \"-Wused-but-marked-unused\"")
#define MIGRAPHX_POP_WARNING _Pragma("clang diagnostic pop")
#else
#define MIGRAPHX_PUSH_UNUSED_WARNING
#define MIGRAPHX_POP_WARNING
#endif
#define MIGRAPHX_PYBIND11_MODULE(...) \
MIGRAPHX_PUSH_UNUSED_WARNING \
PYBIND11_MODULE(__VA_ARGS__) \
MIGRAPHX_POP_WARNING
#define MIGRAPHX_PYTHON_GENERATE_SHAPE_ENUM(x, t) .value(#x, migraphx::shape::type_t::x)
namespace migraphx {
migraphx::value to_value(py::kwargs kwargs);
migraphx::value to_value(py::list lst);
template <class T, class F>
void visit_py(T x, F f)
{
if(py::isinstance<py::kwargs>(x))
{
f(to_value(x.template cast<py::kwargs>()));
}
else if(py::isinstance<py::list>(x))
{
f(to_value(x.template cast<py::list>()));
}
else if(py::isinstance<py::bool_>(x))
{
f(x.template cast<bool>());
}
else if(py::isinstance<py::int_>(x) or py::hasattr(x, "__index__"))
{
f(x.template cast<int>());
}
else if(py::isinstance<py::float_>(x))
{
f(x.template cast<float>());
}
else if(py::isinstance<py::str>(x))
{
f(x.template cast<std::string>());
}
else if(py::isinstance<migraphx::shape::dynamic_dimension>(x))
{
f(migraphx::to_value(x.template cast<migraphx::shape::dynamic_dimension>()));
}
else
{
MIGRAPHX_THROW("VISIT_PY: Unsupported data type!");
}
}
migraphx::value to_value(py::list lst)
{
migraphx::value v = migraphx::value::array{};
for(auto val : lst)
{
visit_py(val, [&](auto py_val) { v.push_back(py_val); });
}
return v;
}
migraphx::value to_value(py::kwargs kwargs)
{
migraphx::value v = migraphx::value::object{};
for(auto arg : kwargs)
{
auto&& key = py::str(arg.first);
auto&& val = arg.second;
visit_py(val, [&](auto py_val) { v[key] = py_val; });
}
return v;
}
} // namespace migraphx
namespace pybind11 {
namespace detail {
template <>
struct npy_format_descriptor<half>
{
static std::string format()
{
// following: https://docs.python.org/3/library/struct.html#format-characters
return "e";
}
static constexpr auto name() { return _("half"); }
};
} // namespace detail
} // namespace pybind11
template <class F>
void visit_type(const migraphx::shape& s, F f)
{
s.visit_type(f);
}
template <class T, class F>
void visit(const migraphx::raw_data<T>& x, F f)
{
x.visit(f);
}
template <class F>
void visit_types(F f)
{
migraphx::shape::visit_types(f);
}
template <class T>
py::buffer_info to_buffer_info(T& x)
{
migraphx::shape s = x.get_shape();
assert(s.type() != migraphx::shape::tuple_type);
if(s.dynamic())
MIGRAPHX_THROW("MIGRAPHX PYTHON: dynamic shape argument passed to to_buffer_info");
auto strides = s.strides();
std::transform(
strides.begin(), strides.end(), strides.begin(), [&](auto i) { return i * s.type_size(); });
py::buffer_info b;
visit_type(s, [&](auto as) {
// migraphx use int8_t data to store bool type, we need to
// explicitly specify the data type as bool for python
if(s.type() == migraphx::shape::bool_type)
{
b = py::buffer_info(x.data(),
as.size(),
py::format_descriptor<bool>::format(),
s.ndim(),
s.lens(),
strides);
}
else
{
b = py::buffer_info(x.data(),
as.size(),
py::format_descriptor<decltype(as())>::format(),
s.ndim(),
s.lens(),
strides);
}
});
return b;
}
migraphx::shape to_shape(const py::buffer_info& info)
{
migraphx::shape::type_t t;
std::size_t n = 0;
visit_types([&](auto as) {
if(info.format == py::format_descriptor<decltype(as())>::format() or
(info.format == "l" and py::format_descriptor<decltype(as())>::format() == "q") or
(info.format == "L" and py::format_descriptor<decltype(as())>::format() == "Q"))
{
t = as.type_enum();
n = sizeof(as());
}
else if(info.format == "?" and py::format_descriptor<decltype(as())>::format() == "b")
{
t = migraphx::shape::bool_type;
n = sizeof(bool);
}
});
if(n == 0)
{
MIGRAPHX_THROW("MIGRAPHX PYTHON: Unsupported data type " + info.format);
}
auto strides = info.strides;
std::transform(strides.begin(), strides.end(), strides.begin(), [&](auto i) -> std::size_t {
return n > 0 ? i / n : 0;
});
// scalar support
if(info.shape.empty())
{
return migraphx::shape{t};
}
else
{
return migraphx::shape{t, info.shape, strides};
}
}
MIGRAPHX_PYBIND11_MODULE(migraphx, m)
{
py::class_<migraphx::shape> shape_cls(m, "shape");
shape_cls
.def(py::init([](py::kwargs kwargs) {
auto v = migraphx::to_value(kwargs);
auto t = migraphx::shape::parse_type(v.get("type", "float"));
if(v.contains("dyn_dims"))
{
auto dyn_dims =
migraphx::from_value<std::vector<migraphx::shape::dynamic_dimension>>(
v.at("dyn_dims"));
return migraphx::shape(t, dyn_dims);
}
auto lens = v.get<std::size_t>("lens", {1});
if(v.contains("strides"))
return migraphx::shape(t, lens, v.at("strides").to_vector<std::size_t>());
else
return migraphx::shape(t, lens);
}))
.def("type", &migraphx::shape::type)
.def("lens", &migraphx::shape::lens)
.def("strides", &migraphx::shape::strides)
.def("ndim", &migraphx::shape::ndim)
.def("elements", &migraphx::shape::elements)
.def("bytes", &migraphx::shape::bytes)
.def("type_string", &migraphx::shape::type_string)
.def("type_size", &migraphx::shape::type_size)
.def("dyn_dims", &migraphx::shape::dyn_dims)
.def("packed", &migraphx::shape::packed)
.def("transposed", &migraphx::shape::transposed)
.def("broadcasted", &migraphx::shape::broadcasted)
.def("standard", &migraphx::shape::standard)
.def("scalar", &migraphx::shape::scalar)
.def("dynamic", &migraphx::shape::dynamic)
.def("__eq__", std::equal_to<migraphx::shape>{})
.def("__ne__", std::not_equal_to<migraphx::shape>{})
.def("__repr__", [](const migraphx::shape& s) { return migraphx::to_string(s); });
py::enum_<migraphx::shape::type_t>(shape_cls, "type_t")
MIGRAPHX_SHAPE_VISIT_TYPES(MIGRAPHX_PYTHON_GENERATE_SHAPE_ENUM);
py::class_<migraphx::shape::dynamic_dimension>(shape_cls, "dynamic_dimension")
.def(py::init<>())
.def(py::init<std::size_t, std::size_t>())
.def(py::init<std::size_t, std::size_t, std::set<std::size_t>>())
.def_readwrite("min", &migraphx::shape::dynamic_dimension::min)
.def_readwrite("max", &migraphx::shape::dynamic_dimension::max)
.def_readwrite("optimals", &migraphx::shape::dynamic_dimension::optimals)
.def("is_fixed", &migraphx::shape::dynamic_dimension::is_fixed);
py::class_<migraphx::argument>(m, "argument", py::buffer_protocol())
.def_buffer([](migraphx::argument& x) -> py::buffer_info { return to_buffer_info(x); })
.def(py::init([](py::buffer b) {
py::buffer_info info = b.request();
return migraphx::argument(to_shape(info), info.ptr);
}))
.def("get_shape", &migraphx::argument::get_shape)
.def("data_ptr",
[](migraphx::argument& x) { return reinterpret_cast<std::uintptr_t>(x.data()); })
.def("tolist",
[](migraphx::argument& x) {
py::list l{x.get_shape().elements()};
visit(x, [&](auto data) { l = py::cast(data.to_vector()); });
return l;
})
.def("__eq__", std::equal_to<migraphx::argument>{})
.def("__ne__", std::not_equal_to<migraphx::argument>{})
.def("__repr__", [](const migraphx::argument& x) { return migraphx::to_string(x); });
py::class_<migraphx::target>(m, "target");
py::class_<migraphx::instruction_ref>(m, "instruction_ref")
.def("shape", [](migraphx::instruction_ref i) { return i->get_shape(); })
.def("op", [](migraphx::instruction_ref i) { return i->get_operator(); });
py::class_<migraphx::module, std::unique_ptr<migraphx::module, py::nodelete>>(m, "module")
.def("print", [](const migraphx::module& mm) { std::cout << mm << std::endl; })
.def(
"add_instruction",
[](migraphx::module& mm,
const migraphx::operation& op,
std::vector<migraphx::instruction_ref>& args,
std::vector<migraphx::module*>& mod_args) {
return mm.add_instruction(op, args, mod_args);
},
py::arg("op"),
py::arg("args"),
py::arg("mod_args") = std::vector<migraphx::module*>{})
.def(
"add_literal",
[](migraphx::module& mm, py::buffer data) {
py::buffer_info info = data.request();
auto literal_shape = to_shape(info);
return mm.add_literal(literal_shape, reinterpret_cast<char*>(info.ptr));
},
py::arg("data"))
.def(
"add_parameter",
[](migraphx::module& mm, const std::string& name, const migraphx::shape shape) {
return mm.add_parameter(name, shape);
},
py::arg("name"),
py::arg("shape"))
.def(
"add_return",
[](migraphx::module& mm, std::vector<migraphx::instruction_ref>& args) {
return mm.add_return(args);
},
py::arg("args"))
.def("__repr__", [](const migraphx::module& mm) { return migraphx::to_string(mm); });
py::class_<migraphx::program>(m, "program")
.def(py::init([]() { return migraphx::program(); }))
.def("get_parameter_names", &migraphx::program::get_parameter_names)
.def("get_parameter_shapes", &migraphx::program::get_parameter_shapes)
.def("get_output_shapes", &migraphx::program::get_output_shapes)
.def("is_compiled", &migraphx::program::is_compiled)
.def(
"compile",
[](migraphx::program& p,
const migraphx::target& t,
bool offload_copy,
bool fast_math,
bool exhaustive_tune) {
migraphx::compile_options options;
options.offload_copy = offload_copy;
options.fast_math = fast_math;
options.exhaustive_tune = exhaustive_tune;
p.compile(t, options);
},
py::arg("t"),
py::arg("offload_copy") = true,
py::arg("fast_math") = true,
py::arg("exhaustive_tune") = false)
.def("get_main_module", [](const migraphx::program& p) { return p.get_main_module(); })
.def(
"create_module",
[](migraphx::program& p, const std::string& name) { return p.create_module(name); },
py::arg("name"))
.def("run",
[](migraphx::program& p, py::dict params) {
migraphx::parameter_map pm;
for(auto x : params)
{
std::string key = x.first.cast<std::string>();
py::buffer b = x.second.cast<py::buffer>();
py::buffer_info info = b.request();
pm[key] = migraphx::argument(to_shape(info), info.ptr);
}
return p.eval(pm);
})
.def("run_async",
[](migraphx::program& p,
py::dict params,
std::uintptr_t stream,
std::string stream_name) {
migraphx::parameter_map pm;
for(auto x : params)
{
std::string key = x.first.cast<std::string>();
py::buffer b = x.second.cast<py::buffer>();
py::buffer_info info = b.request();
pm[key] = migraphx::argument(to_shape(info), info.ptr);
}
migraphx::execution_environment exec_env{
migraphx::any_ptr(reinterpret_cast<void*>(stream), stream_name), true};
return p.eval(pm, exec_env);
})
.def("sort", &migraphx::program::sort)
.def("print", [](const migraphx::program& p) { std::cout << p << std::endl; })
.def("__eq__", std::equal_to<migraphx::program>{})
.def("__ne__", std::not_equal_to<migraphx::program>{})
.def("__repr__", [](const migraphx::program& p) { return migraphx::to_string(p); });
py::class_<migraphx::operation> op(m, "op");
op.def(py::init([](const std::string& name, py::kwargs kwargs) {
migraphx::value v = migraphx::value::object{};
if(kwargs)
{
v = migraphx::to_value(kwargs);
}
return migraphx::make_op(name, v);
}))
.def("name", &migraphx::operation::name);
py::enum_<migraphx::op::pooling_mode>(op, "pooling_mode")
.value("average", migraphx::op::pooling_mode::average)
.value("max", migraphx::op::pooling_mode::max)
.value("lpnorm", migraphx::op::pooling_mode::lpnorm);
py::enum_<migraphx::op::rnn_direction>(op, "rnn_direction")
.value("forward", migraphx::op::rnn_direction::forward)
.value("reverse", migraphx::op::rnn_direction::reverse)
.value("bidirectional", migraphx::op::rnn_direction::bidirectional);
m.def(
"argument_from_pointer",
[](const migraphx::shape shape, const int64_t address) {
return migraphx::argument(shape, reinterpret_cast<void*>(address));
},
py::arg("shape"),
py::arg("address"));
m.def(
"parse_tf",
[](const std::string& filename,
bool is_nhwc,
unsigned int batch_size,
std::unordered_map<std::string, std::vector<std::size_t>> map_input_dims,
std::vector<std::string> output_names) {
return migraphx::parse_tf(
filename, migraphx::tf_options{is_nhwc, batch_size, map_input_dims, output_names});
},
"Parse tf protobuf (default format is nhwc)",
py::arg("filename"),
py::arg("is_nhwc") = true,
py::arg("batch_size") = 1,
py::arg("map_input_dims") = std::unordered_map<std::string, std::vector<std::size_t>>(),
py::arg("output_names") = std::vector<std::string>());
m.def(
"parse_onnx",
[](const std::string& filename,
unsigned int default_dim_value,
migraphx::shape::dynamic_dimension default_dyn_dim_value,
std::unordered_map<std::string, std::vector<std::size_t>> map_input_dims,
std::unordered_map<std::string, std::vector<migraphx::shape::dynamic_dimension>>
map_dyn_input_dims,
bool skip_unknown_operators,
bool print_program_on_error,
int64_t max_loop_iterations) {
migraphx::onnx_options options;
options.default_dim_value = default_dim_value;
options.default_dyn_dim_value = default_dyn_dim_value;
options.map_input_dims = map_input_dims;
options.map_dyn_input_dims = map_dyn_input_dims;
options.skip_unknown_operators = skip_unknown_operators;
options.print_program_on_error = print_program_on_error;
options.max_loop_iterations = max_loop_iterations;
return migraphx::parse_onnx(filename, options);
},
"Parse onnx file",
py::arg("filename"),
py::arg("default_dim_value") = 0,
py::arg("default_dyn_dim_value") = migraphx::shape::dynamic_dimension{1, 1},
py::arg("map_input_dims") = std::unordered_map<std::string, std::vector<std::size_t>>(),
py::arg("map_dyn_input_dims") =
std::unordered_map<std::string, std::vector<migraphx::shape::dynamic_dimension>>(),
py::arg("skip_unknown_operators") = false,
py::arg("print_program_on_error") = false,
py::arg("max_loop_iterations") = 10);
m.def(
"parse_onnx_buffer",
[](const std::string& onnx_buffer,
unsigned int default_dim_value,
migraphx::shape::dynamic_dimension default_dyn_dim_value,
std::unordered_map<std::string, std::vector<std::size_t>> map_input_dims,
std::unordered_map<std::string, std::vector<migraphx::shape::dynamic_dimension>>
map_dyn_input_dims,
bool skip_unknown_operators,
bool print_program_on_error) {
migraphx::onnx_options options;
options.default_dim_value = default_dim_value;
options.default_dyn_dim_value = default_dyn_dim_value;
options.map_input_dims = map_input_dims;
options.map_dyn_input_dims = map_dyn_input_dims;
options.skip_unknown_operators = skip_unknown_operators;
options.print_program_on_error = print_program_on_error;
return migraphx::parse_onnx_buffer(onnx_buffer, options);
},
"Parse onnx file",
py::arg("filename"),
py::arg("default_dim_value") = 0,
py::arg("default_dyn_dim_value") = migraphx::shape::dynamic_dimension{1, 1},
py::arg("map_input_dims") = std::unordered_map<std::string, std::vector<std::size_t>>(),
py::arg("map_dyn_input_dims") =
std::unordered_map<std::string, std::vector<migraphx::shape::dynamic_dimension>>(),
py::arg("skip_unknown_operators") = false,
py::arg("print_program_on_error") = false);
m.def(
"load",
[](const std::string& name, const std::string& format) {
migraphx::file_options options;
options.format = format;
return migraphx::load(name, options);
},
"Load MIGraphX program",
py::arg("filename"),
py::arg("format") = "msgpack");
m.def(
"save",
[](const migraphx::program& p, const std::string& name, const std::string& format) {
migraphx::file_options options;
options.format = format;
return migraphx::save(p, name, options);
},
"Save MIGraphX program",
py::arg("p"),
py::arg("filename"),
py::arg("format") = "msgpack");
m.def("get_target", &migraphx::make_target);
m.def("create_argument", [](const migraphx::shape& s, const std::vector<double>& values) {
if(values.size() != s.elements())
MIGRAPHX_THROW("Values and shape elements do not match");
migraphx::argument a{s};
a.fill(values.begin(), values.end());
return a;
});
m.def("generate_argument", &migraphx::generate_argument, py::arg("s"), py::arg("seed") = 0);
m.def("fill_argument", &migraphx::fill_argument, py::arg("s"), py::arg("value"));
m.def("quantize_fp16",
&migraphx::quantize_fp16,
py::arg("prog"),
py::arg("ins_names") = std::vector<std::string>{"all"});
m.def("quantize_int8",
&migraphx::quantize_int8,
py::arg("prog"),
py::arg("t"),
py::arg("calibration") = std::vector<migraphx::parameter_map>{},
py::arg("ins_names") = std::vector<std::string>{"dot", "convolution"});
#ifdef HAVE_GPU
m.def("allocate_gpu", &migraphx::gpu::allocate_gpu, py::arg("s"), py::arg("host") = false);
m.def("to_gpu", &migraphx::gpu::to_gpu, py::arg("arg"), py::arg("host") = false);
m.def("from_gpu", &migraphx::gpu::from_gpu);
m.def("gpu_sync", [] { migraphx::gpu::gpu_sync(); });
#endif
#ifdef VERSION_INFO
m.attr("__version__") = VERSION_INFO;
#else
m.attr("__version__") = "dev";
#endif
}

View File

@ -1 +1 @@
onnxruntime-rocm @ https://github.com/NickM-27/frigate-onnxruntime-rocm/releases/download/v1.0.0/onnxruntime_rocm-1.17.3-cp39-cp39-linux_x86_64.whl
onnxruntime-rocm @ https://github.com/NickM-27/frigate-onnxruntime-rocm/releases/download/v6.3.3/onnxruntime_rocm-1.20.1-cp311-cp311-linux_x86_64.whl

View File

@ -1,3 +0,0 @@
Package: *
Pin: release o=repo.radeon.com
Pin-Priority: 600

View File

@ -2,7 +2,7 @@ variable "AMDGPU" {
default = "gfx900"
}
variable "ROCM" {
default = "5.7.3"
default = "6.3.3"
}
variable "HSA_OVERRIDE_GFX_VERSION" {
default = ""
@ -10,6 +10,13 @@ variable "HSA_OVERRIDE_GFX_VERSION" {
variable "HSA_OVERRIDE" {
default = "1"
}
target wget {
dockerfile = "docker/main/Dockerfile"
platforms = ["linux/amd64"]
target = "wget"
}
target deps {
dockerfile = "docker/main/Dockerfile"
platforms = ["linux/amd64"]
@ -26,6 +33,7 @@ target rocm {
dockerfile = "docker/rocm/Dockerfile"
contexts = {
deps = "target:deps",
wget = "target:wget",
rootfs = "target:rootfs"
}
platforms = ["linux/amd64"]

View File

@ -1 +0,0 @@
deb [arch=amd64 signed-by=/etc/apt/keyrings/rocm.gpg] https://repo.radeon.com/rocm/apt/5.7.3 focal main

View File

@ -6,11 +6,12 @@ ARG DEBIAN_FRONTEND=noninteractive
FROM deps AS rpi-deps
ARG TARGETARCH
RUN rm -rf /usr/lib/btbn-ffmpeg/
# Install dependencies
RUN --mount=type=bind,source=docker/rpi/install_deps.sh,target=/deps/install_deps.sh \
/deps/install_deps.sh
ENV DEFAULT_FFMPEG_VERSION="rpi"
ENV INCLUDED_FFMPEG_VERSIONS="${DEFAULT_FFMPEG_VERSION}:${INCLUDED_FFMPEG_VERSIONS}"
WORKDIR /opt/frigate/
COPY --from=rootfs / /

View File

@ -28,4 +28,7 @@ if [[ "${TARGETARCH}" == "arm64" ]]; then
echo "deb [signed-by=/usr/share/keyrings/raspbian.gpg] https://archive.raspberrypi.org/debian/ bookworm main" | tee /etc/apt/sources.list.d/raspi.list
apt-get -qq update
apt-get -qq install --no-install-recommends --no-install-suggests -y ffmpeg
mkdir -p /usr/lib/ffmpeg/rpi/bin
ln -svf /usr/bin/ffmpeg /usr/lib/ffmpeg/rpi/bin/ffmpeg
ln -svf /usr/bin/ffprobe /usr/lib/ffmpeg/rpi/bin/ffprobe
fi

View File

@ -3,22 +3,16 @@
# https://askubuntu.com/questions/972516/debian-frontend-environment-variable
ARG DEBIAN_FRONTEND=noninteractive
# Make this a separate target so it can be built/cached optionally
FROM wheels as trt-wheels
ARG DEBIAN_FRONTEND
ARG TARGETARCH
RUN python3 -m pip config set global.break-system-packages true
# Add TensorRT wheels to another folder
COPY docker/tensorrt/requirements-amd64.txt /requirements-tensorrt.txt
RUN mkdir -p /trt-wheels && pip3 wheel --wheel-dir=/trt-wheels -r /requirements-tensorrt.txt
# Globally set pip break-system-packages option to avoid having to specify it every time
ARG PIP_BREAK_SYSTEM_PACKAGES=1
FROM tensorrt-base AS frigate-tensorrt
ARG PIP_BREAK_SYSTEM_PACKAGES
ENV TRT_VER=8.6.1
RUN python3 -m pip config set global.break-system-packages true
RUN --mount=type=bind,from=trt-wheels,source=/trt-wheels,target=/deps/trt-wheels \
pip3 install -U /deps/trt-wheels/*.whl && \
ldconfig
# Install TensorRT wheels
COPY docker/tensorrt/requirements-amd64.txt /requirements-tensorrt.txt
RUN pip3 install -U -r /requirements-tensorrt.txt && ldconfig
WORKDIR /opt/frigate/
COPY --from=rootfs / /

View File

@ -76,8 +76,9 @@ RUN apt-get update \
&& apt-get install -y python-is-python3 libprotobuf23 \
&& rm -rf /var/lib/apt/lists/*
RUN rm -rf /usr/lib/btbn-ffmpeg/
COPY --from=jetson-ffmpeg /rootfs /
ENV DEFAULT_FFMPEG_VERSION="jetson"
ENV INCLUDED_FFMPEG_VERSIONS="${DEFAULT_FFMPEG_VERSION}:${INCLUDED_FFMPEG_VERSIONS}"
# ffmpeg runtime dependencies
RUN apt-get -qq update \

View File

@ -8,6 +8,7 @@ ARG TRT_BASE=nvcr.io/nvidia/tensorrt:23.12-py3
# Build TensorRT-specific library
FROM ${TRT_BASE} AS trt-deps
ARG TARGETARCH
ARG COMPUTE_LEVEL
RUN apt-get update \
@ -16,15 +17,26 @@ RUN apt-get update \
RUN --mount=type=bind,source=docker/tensorrt/detector/tensorrt_libyolo.sh,target=/tensorrt_libyolo.sh \
/tensorrt_libyolo.sh
# COPY required individual CUDA deps
RUN mkdir -p /usr/local/cuda-deps
RUN if [ "$TARGETARCH" = "amd64" ]; then \
cp /usr/local/cuda-12.3/targets/x86_64-linux/lib/libcurand.so.* /usr/local/cuda-deps/ && \
cp /usr/local/cuda-12.3/targets/x86_64-linux/lib/libnvrtc.so.* /usr/local/cuda-deps/ ; \
fi
# Frigate w/ TensorRT Support as separate image
FROM deps AS tensorrt-base
#Disable S6 Global timeout
ENV S6_CMD_WAIT_FOR_SERVICES_MAXTIME=0
# COPY TensorRT Model Generation Deps
COPY --from=trt-deps /usr/local/lib/libyolo_layer.so /usr/local/lib/libyolo_layer.so
COPY --from=trt-deps /usr/local/src/tensorrt_demos /usr/local/src/tensorrt_demos
COPY --from=trt-deps /usr/local/cuda-12.* /usr/local/cuda
# COPY Individual CUDA deps folder
COPY --from=trt-deps /usr/local/cuda-deps /usr/local/cuda
COPY docker/tensorrt/detector/rootfs/ /
ENV YOLO_MODELS=""

View File

@ -5,7 +5,7 @@
set -euxo pipefail
INSTALL_PREFIX=/rootfs/usr/local
INSTALL_PREFIX=/rootfs/usr/lib/ffmpeg/jetson
apt-get -qq update
apt-get -qq install -y --no-install-recommends build-essential ccache clang cmake pkg-config

View File

@ -1,5 +1,5 @@
/usr/local/lib
/usr/local/cuda/lib64
/usr/local/cuda
/usr/local/lib/python3.11/dist-packages/nvidia/cudnn/lib
/usr/local/lib/python3.11/dist-packages/nvidia/cuda_runtime/lib
/usr/local/lib/python3.11/dist-packages/nvidia/cublas/lib

View File

@ -20,7 +20,7 @@ FIRST_MODEL=true
MODEL_DOWNLOAD=""
MODEL_CONVERT=""
if [ -z "$YOLO_MODELS"]; then
if [ -z "$YOLO_MODELS" ]; then
echo "tensorrt model preparation disabled"
exit 0
fi
@ -64,7 +64,7 @@ fi
# order to run libyolo here.
# On Jetpack 5.0, these libraries are not mounted by the runtime and are supplied by the image.
if [[ "$(arch)" == "aarch64" ]]; then
if [[ ! -e /usr/lib/aarch64-linux-gnu/tegra ]]; then
if [[ ! -e /usr/lib/aarch64-linux-gnu/tegra && ! -e /usr/lib/aarch64-linux-gnu/tegra-egl ]]; then
echo "ERROR: Container must be launched with nvidia runtime"
exit 1
elif [[ ! -e /usr/lib/aarch64-linux-gnu/libnvinfer.so.8 ||

View File

@ -1,14 +1,17 @@
# NVidia TensorRT Support (amd64 only)
--extra-index-url 'https://pypi.nvidia.com'
numpy < 1.24; platform_machine == 'x86_64'
tensorrt == 8.6.1.*; platform_machine == 'x86_64'
tensorrt == 8.6.1; platform_machine == 'x86_64'
tensorrt_bindings == 8.6.1; platform_machine == 'x86_64'
cuda-python == 11.8.*; platform_machine == 'x86_64'
cython == 3.0.*; platform_machine == 'x86_64'
nvidia-cuda-runtime-cu12 == 12.1.*; platform_machine == 'x86_64'
nvidia-cuda-runtime-cu11 == 11.8.*; platform_machine == 'x86_64'
nvidia-cublas-cu11 == 11.11.3.6; platform_machine == 'x86_64'
nvidia-cudnn-cu11 == 8.6.0.*; platform_machine == 'x86_64'
nvidia-cudnn-cu12 == 9.5.0.*; platform_machine == 'x86_64'
nvidia-cufft-cu11==10.*; platform_machine == 'x86_64'
nvidia-cufft-cu12==11.*; platform_machine == 'x86_64'
onnx==1.16.*; platform_machine == 'x86_64'
onnxruntime-gpu==1.20.*; platform_machine == 'x86_64'
protobuf==3.20.3; platform_machine == 'x86_64'

View File

@ -14,12 +14,17 @@ variable "COMPUTE_LEVEL" {
default = ""
}
variable "BASE_HOOK" {
# Ensure an up-to-date python 3.11 is available in tensorrt/jetson image
# Ensure an up-to-date python 3.11 is available in jetson images
default = <<EOT
if grep -iq \"ubuntu\" /etc/os-release; then
apt-get update &&
apt-get install -y software-properties-common &&
add-apt-repository ppa:deadsnakes/ppa;
. /etc/os-release
# Add the deadsnakes PPA repository
echo "deb https://ppa.launchpadcontent.net/deadsnakes/ppa/ubuntu $VERSION_CODENAME main" >> /etc/apt/sources.list.d/deadsnakes.list
echo "deb-src https://ppa.launchpadcontent.net/deadsnakes/ppa/ubuntu $VERSION_CODENAME main" >> /etc/apt/sources.list.d/deadsnakes.list
# Add deadsnakes signing key
apt-key adv --keyserver keyserver.ubuntu.com --recv-keys F23C5A6CF475977595C89F51BA6932366A755776
fi
EOT
}
@ -90,7 +95,6 @@ target "tensorrt" {
wget = "target:wget",
tensorrt-base = "target:tensorrt-base",
rootfs = "target:rootfs"
wheels = "target:wheels"
}
target = "frigate-tensorrt"
inherits = ["_build_args"]

View File

@ -37,7 +37,7 @@ See [the go2rtc docs](https://github.com/AlexxIT/go2rtc?tab=readme-ov-file#modul
```yaml
go2rtc:
streams:
...
# ...
log:
exec: trace
```
@ -176,15 +176,13 @@ listen [::]:5000 ipv6only=off;
### Custom ffmpeg build
Included with Frigate is a build of ffmpeg that works for the vast majority of users. However, there exists some hardware setups which have incompatibilities with the included build. In this case, statically built ffmpeg binary can be downloaded to /config and used.
Included with Frigate is a build of ffmpeg that works for the vast majority of users. However, there exist some hardware setups which have incompatibilities with the included build. In this case, statically built `ffmpeg` and `ffprobe` binaries can be placed in `/config/custom-ffmpeg/bin` for Frigate to use.
To do this:
1. Download your ffmpeg build and uncompress to the Frigate config folder.
2. Update your docker-compose or docker CLI to include `'/home/appdata/frigate/custom-ffmpeg':'/usr/lib/btbn-ffmpeg':'ro'` in the volume mappings.
3. Restart Frigate and the custom version will be used if the mapping was done correctly.
NOTE: The folder that is set for the config needs to be the folder that contains `/bin`. So if the full structure is `/home/appdata/frigate/custom-ffmpeg/bin/ffmpeg` then the `ffmpeg -> path` field should be `/config/custom-ffmpeg/bin`.
1. Download your ffmpeg build and uncompress it to the `/config/custom-ffmpeg` folder. Verify that both the `ffmpeg` and `ffprobe` binaries are located in `/config/custom-ffmpeg/bin`.
2. Update the `ffmpeg.path` in your Frigate config to `/config/custom-ffmpeg`.
3. Restart Frigate and the custom version will be used if the steps above were done correctly.
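As a minimal sketch of step 2, the config change might look like this (assuming the folder layout described above):
```yaml
ffmpeg:
  # point Frigate at the folder that contains bin/ffmpeg and bin/ffprobe
  path: /config/custom-ffmpeg
```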
### Custom go2rtc version
@ -192,7 +190,7 @@ Frigate currently includes go2rtc v1.9.2, there may be certain cases where you w
To do this:
1. Download the go2rtc build to the /config folder.
1. Download the go2rtc build to the `/config` folder.
2. Rename the build to `go2rtc`.
3. Give `go2rtc` execute permission.
4. Restart Frigate and the custom version will be used; you can verify by checking the go2rtc logs.

View File

@ -7,7 +7,7 @@ title: Camera Configuration
Several inputs can be configured for each camera and the role of each input can be mixed and matched based on your needs. This allows you to use a lower resolution stream for object detection, but create recordings from a higher resolution stream, or vice versa.
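As a rough illustration (camera name and stream URLs are placeholders), mixing roles across two inputs might look like this:
```yaml
cameras:
  front_door:
    ffmpeg:
      inputs:
        # higher resolution stream used for recordings
        - path: rtsp://192.168.1.10:554/main
          roles:
            - record
        # lower resolution stream used for object detection
        - path: rtsp://192.168.1.10:554/sub
          roles:
            - detect
```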
A camera is enabled by default but can be temporarily disabled by using `enabled: False`. Existing tracked objects and recordings can still be accessed. Live streams, recording and detecting are not working. Camera specific configurations will be used.
A camera is enabled by default but can be disabled by using `enabled: False`. Cameras that are disabled through the configuration file will not appear in the Frigate UI and will not consume system resources.
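For example, a camera can be disabled in the config like this (camera name is illustrative):
```yaml
cameras:
  side_yard:
    enabled: False
```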
Each role can only be assigned to one input per camera. The options for roles are as follows:

View File

@ -9,7 +9,7 @@ Frigate has support for CV2 Local Binary Pattern Face Recognizer to recognize fa
## Configuration
Face recognition is disabled by default and requires semantic search to be enabled, face recognition must be enabled in your config file before it can be used. Semantic Search and face recognition are global configuration settings.
Face recognition is disabled by default and must be enabled in your config file before it can be used. Face recognition is a global configuration setting.
```yaml
face_recognition:
@ -36,6 +36,7 @@ The accuracy of face recognition is heavily dependent on the quality of data giv
:::tip
When choosing images to include in the face training set, it is recommended to always follow these guidelines:
- If it is difficult to make out details in a person's face, it will not be helpful in training.
- Avoid images with under/over-exposure.
- Avoid blurry / pixelated images.
@ -52,4 +53,4 @@ Then it is recommended to use the `Face Library` tab in Frigate to select and tr
### Step 2 - Expanding The Dataset
Once straight-on images are performing well, start choosing slightly off-angle images to include for training. It is important to still choose images where enough face detail is visible to recognize someone.
Once straight-on images are performing well, start choosing slightly off-angle images to include for training. It is important to still choose images where enough face detail is visible to recognize someone.

View File

@ -5,13 +5,7 @@ title: Generative AI
Generative AI can be used to automatically generate descriptive text based on the thumbnails of your tracked objects. This helps with [Semantic Search](/configuration/semantic_search) in Frigate to provide more context about your tracked objects. Descriptions are accessed via the _Explore_ view in the Frigate UI by clicking on a tracked object's thumbnail.
Requests for a description are sent off automatically to your AI provider at the end of the tracked object's lifecycle. Descriptions can also be regenerated manually via the Frigate UI.
:::info
Semantic Search must be enabled to use Generative AI.
:::
Requests for a description are sent off automatically to your AI provider at the end of the tracked object's lifecycle, or can optionally be sent earlier after a number of significantly changed frames, for example for use in more real-time notifications. Descriptions can also be regenerated manually via the Frigate UI. Note that if you manually enter a description for a tracked object before it ends, it will be overwritten by the generated response.
## Configuration
@ -154,6 +148,15 @@ While generating simple descriptions of detected objects is useful, understandin
Frigate provides an [MQTT topic](/integrations/mqtt), `frigate/tracked_object_update`, that is updated with a JSON payload containing `event_id` and `description` when your AI provider returns a description for a tracked object. This description could be used directly in notifications, such as sending alerts to your phone or making audio announcements. If additional details from the tracked object are needed, you can query the [HTTP API](/integrations/api/event-events-event-id-get) using the `event_id`, eg: `http://frigate_ip:5000/api/events/<event_id>`.
If you are looking to get notifications earlier than when an object ceases to be tracked, an additional send trigger, `after_significant_updates`, can be configured.
```yaml
genai:
send_triggers:
tracked_object_end: true # default
after_significant_updates: 3 # how many updates to a tracked object before we should send an image
```
## Custom Prompts
Frigate sends multiple frames from the tracked object along with a prompt to your Generative AI provider asking it to generate a description. The default prompt is as follows:

View File

@ -3,13 +3,28 @@ id: license_plate_recognition
title: License Plate Recognition (LPR)
---
Frigate can recognize license plates on vehicles and automatically add the detected characters as a `sub_label` to objects that are of type `car`. A common use case may be to read the license plates of cars pulling into a driveway or cars passing by on a street with a dedicated LPR camera.
Frigate can recognize license plates on vehicles and automatically add the detected characters or recognized name as a `sub_label` to objects that are of type `car`. A common use case may be to read the license plates of cars pulling into a driveway or cars passing by on a street.
LPR works best when the license plate is clearly visible to the camera. For moving vehicles, Frigate continuously refines the recognition process, keeping the most confident result. However, LPR does not run on stationary vehicles.
When a plate is recognized, the detected characters or recognized name is:
- Added as a `sub_label` to the `car` tracked object.
- Viewable in the Review Item Details pane in Review and the Tracked Object Details pane in Explore.
- Filterable through the More Filters menu in Explore.
- Published via the `frigate/events` MQTT topic as a `sub_label` for the tracked object.
## Model Requirements
Users running a Frigate+ model (or any custom model that natively detects license plates) should ensure that `license_plate` is added to the [list of objects to track](https://docs.frigate.video/plus/#available-label-types) either globally or for a specific camera. This will improve the accuracy and performance of the LPR model.
Users without a model that detects license plates can still run LPR. A small, CPU inference, YOLOv9 license plate detection model will be used instead. You should _not_ define `license_plate` in your list of objects to track.
Users without a model that detects license plates can still run LPR. Frigate uses a lightweight YOLOv9 license plate detection model that runs on your CPU. In this case, you should _not_ define `license_plate` in your list of objects to track.
LPR is most effective when the vehicle's license plate is fully visible to the camera. For moving vehicles, Frigate will attempt to read the plate continuously, refining recognition and keeping the most confident result. LPR will not run on stationary vehicles.
:::note
Frigate needs to first detect a `car` before it can recognize a license plate. If you're using a dedicated LPR camera or have a zoomed-in view, make sure the camera captures enough of the `car` for Frigate to detect it reliably.
:::
## Minimum System Requirements
@ -24,6 +39,10 @@ lpr:
enabled: True
```
Ensure that your camera is configured to detect objects of type `car`, and that a car is actually being detected by Frigate. Otherwise, LPR will not run.
Like the other real-time processors in Frigate, license plate recognition runs on the camera stream defined by the `detect` role in your config. To ensure optimal performance, select a suitable resolution for this stream in your camera's firmware that fits your specific scene and requirements.
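As a rough sketch, a dedicated LPR camera might be configured like this, with the camera name and stream URL as placeholders and `car` included in the tracked objects:

```yaml
lpr:
  enabled: True
cameras:
  driveway_lpr: # hypothetical camera name
    ffmpeg:
      inputs:
        - path: rtsp://192.168.1.10:554/stream # placeholder URL
          roles:
            - detect
    objects:
      track:
        - car
```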
## Advanced Configuration
Fine-tune the LPR feature using these optional parameters:
@ -35,17 +54,18 @@ Fine-tune the LPR feature using these optional parameters:
- Note: If you are using a Frigate+ model and you set the `threshold` in your objects config for `license_plate` higher than this value, recognition will never run. It's best to ensure these values match, or that this `detection_threshold` is lower than your object config `threshold` (see the example after this list).
- **`min_area`**: Defines the minimum size (in pixels) a license plate must be before recognition runs.
- Default: `1000` pixels.
- Depending on the resolution of your cameras, you can increase this value to ignore small or distant plates.
- Depending on the resolution of your camera's `detect` stream, you can increase this value to ignore small or distant plates.
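To illustrate the threshold note above, here is a sketch where the object `threshold` for `license_plate` and the LPR `detection_threshold` are kept aligned; the values are only examples:

```yaml
lpr:
  enabled: True
  detection_threshold: 0.7
objects:
  filters:
    license_plate:
      threshold: 0.7 # matching the LPR detection_threshold per the note above
```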
### Recognition
- **`recognition_threshold`**: Recognition confidence score required to add the plate to the object as a sub label.
- Default: `0.9`.
- **`min_plate_length`**: Specifies the minimum number of characters a detected license plate must have to be added as a sub-label to an object.
- **`min_plate_length`**: Specifies the minimum number of characters a detected license plate must have to be added as a sub label to an object.
- Use this to filter out short, incomplete, or incorrect detections.
- **`format`**: A regular expression defining the expected format of detected plates. Plates that do not match this format will be discarded.
- `"^[A-Z]{1,3} [A-Z]{1,2} [0-9]{1,4}$"` matches plates like "B AB 1234" or "M X 7"
- `"^[A-Z]{2}[0-9]{2} [A-Z]{3}$"` matches plates like "AB12 XYZ" or "XY68 ABC"
- Websites like https://regex101.com/ can help test regular expressions for your plates.
### Matching
@ -53,9 +73,9 @@ Fine-tune the LPR feature using these optional parameters:
- These labels appear in the UI, filters, and notifications.
- **`match_distance`**: Allows for minor variations (missing/incorrect characters) when matching a detected plate to a known plate.
- For example, setting `match_distance: 1` allows a plate `ABCDE` to match `ABCBE` or `ABCD`.
- This parameter will not operate on known plates that are defined as regular expressions. You should define the full string of your plate in `known_plates` in order to use `match_distance`.
- This parameter will _not_ operate on known plates that are defined as regular expressions. You should define the full string of your plate in `known_plates` in order to use `match_distance`.
### Examples
## Configuration Examples
```yaml
lpr:
@ -69,7 +89,9 @@ lpr:
Johnny:
- "J*N-*234" # Matches JHN-1234 and JMN-I234, but also note that "*" matches any number of characters
Sally:
- "[S5]LL-1234" # Matches both SLL-1234 and 5LL-1234
- "[S5]LL 1234" # Matches both SLL 1234 and 5LL 1234
Work Trucks:
- "EMP-[0-9]{3}[A-Z]" # Matches plates like EMP-123A, EMP-456Z
```
```yaml
@ -77,12 +99,54 @@ lpr:
enabled: True
min_area: 4000 # Run recognition on larger plates only
recognition_threshold: 0.85
format: "^[A-Z]{3}-[0-9]{4}$" # Only recognize plates that are three letters, followed by a dash, followed by 4 numbers
format: "^[A-Z]{2} [A-Z][0-9]{4}$" # Only recognize plates that are two letters, followed by a space, followed by a single letter and 4 numbers
match_distance: 1 # Allow one character variation in plate matching
known_plates:
Delivery Van:
- "RJK-5678"
- "UPS-1234"
Employee Parking:
- "EMP-[0-9]{3}[A-Z]" # Matches plates like EMP-123A, EMP-456Z
- "RJ K5678"
- "UP A1234"
Supervisor:
- "MN D3163"
```
## FAQ
### Why isn't my license plate being detected and recognized?
Ensure that:
- Your camera has a clear, human-readable, well-lit view of the plate. If you can't read the plate, Frigate certainly won't be able to. This may require changing video size, quality, or frame rate settings on your camera, depending on your scene and how fast the vehicles are traveling.
- The plate is large enough in the image (try adjusting `min_area` or increasing the resolution of your camera's stream).
- A `car` is detected first, as LPR only runs on recognized vehicles.
If you are using a Frigate+ model or a custom model that detects license plates, ensure that `license_plate` is added to your list of objects to track.
If you are using the free model that ships with Frigate, you should _not_ add `license_plate` to the list of objects to track.
### Can I run LPR without detecting `car` objects?
No, Frigate requires a `car` to be detected first before recognizing a license plate.
### How can I improve detection accuracy?
- Use high-quality cameras with good resolution.
- Adjust `detection_threshold` and `recognition_threshold` values.
- Define a `format` regex to filter out invalid detections.
### Does LPR work at night?
Yes, but performance depends on camera quality, lighting, and infrared capabilities. Make sure your camera can capture clear images of plates at night.
### How can I match known plates with minor variations?
Use `match_distance` to allow small character mismatches. Alternatively, define multiple variations in `known_plates`.
### How do I debug LPR issues?
- View MQTT messages for `frigate/events` to verify detected plates.
- Adjust `detection_threshold` and `recognition_threshold` settings.
- If you are using a Frigate+ model or a model that detects license plates, watch the debug view (Settings --> Debug) to ensure that `license_plate` is being detected with a `car`.
- Enable debug logs for LPR by adding `frigate.data_processing.common.license_plate: debug` to your `logger` configuration (see the example below). These logs are _very_ verbose, so only enable this when necessary.
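As a sketch, the relevant debug logging could be enabled like this, assuming the standard `logger` section layout:

```yaml
logger:
  default: info
  logs:
    frigate.data_processing.common.license_plate: debug
```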
### Will LPR slow down my system?
LPR runs on the CPU, so performance impact depends on your hardware. Ensure you have at least 4GB RAM and a capable CPU for optimal results.

View File

@ -183,32 +183,46 @@ The default dashboard ("All Cameras") will always use Smart Streaming and the fi
:::
### Disabling cameras
Cameras can be temporarily disabled through the Frigate UI and through [MQTT](/integrations/mqtt#frigatecamera_nameenabledset) to conserve system resources. When disabled, Frigate's ffmpeg processes are terminated — recording stops, object detection is paused, and the Live dashboard displays a blank image with a disabled message. Review items, tracked objects, and historical footage for disabled cameras can still be accessed via the UI.
For restreamed cameras, go2rtc remains active but does not use system resources for decoding or processing unless there are active external consumers (such as the Advanced Camera Card in Home Assistant using a go2rtc source).
Note that disabling a camera through the config file (`enabled: False`) removes all related UI elements, including historical footage access. To retain access while disabling the camera, keep it enabled in the config and use the UI or MQTT to disable it temporarily.
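For reference, disabling a camera permanently in the config looks like the following sketch (the camera name is a placeholder); prefer the UI or MQTT toggle if you want to keep access to its history:

```yaml
cameras:
  back_patio: # hypothetical camera name
    enabled: False
```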
## Live view FAQ
1. Why don't I have audio in my Live view?
1. **Why don't I have audio in my Live view?**
You must use go2rtc to hear audio in your live streams. If you have go2rtc already configured, you need to ensure your camera is sending PCMA/PCMU or AAC audio. If you can't change your camera's audio codec, you need to [transcode the audio](https://github.com/AlexxIT/go2rtc?tab=readme-ov-file#source-ffmpeg) using go2rtc.
Note that the low bandwidth mode player is a video-only stream. You should not expect to hear audio when in low bandwidth mode, even if you've set up go2rtc.
2. Frigate shows that my live stream is in "low bandwidth mode". What does this mean?
2. **Frigate shows that my live stream is in "low bandwidth mode". What does this mean?**
Frigate intelligently selects the live streaming technology based on a number of factors (user-selected modes like two-way talk, camera settings, browser capabilities, available bandwidth) and prioritizes showing an actual up-to-date live view of your camera's stream as quickly as possible.
When you have go2rtc configured, Live view initially attempts to load and play back your stream with a clearer, fluent stream technology (MSE). An initial timeout, a low bandwidth condition that would cause buffering of the stream, or decoding errors in the stream will cause Frigate to switch to the stream defined by the `detect` role, using the jsmpeg format. This is what the UI labels as "low bandwidth mode". On Live dashboards, the mode will automatically reset when smart streaming is configured and activity stops. You can also try using the _Reset_ button to force a reload of your stream.
If you are still experiencing Frigate falling back to low bandwidth mode, you may need to adjust your camera's settings per the recommendations above or ensure you have enough bandwidth available.
3. It doesn't seem like my cameras are streaming on the Live dashboard. Why?
3. **It doesn't seem like my cameras are streaming on the Live dashboard. Why?**
On the default Live dashboard ("All Cameras"), your camera images will update once per minute when no detectable activity is occurring to conserve bandwidth and resources. As soon as any activity is detected, cameras seamlessly switch to a full-resolution live stream. If you want to customize this behavior, use a camera group.
4. I see a strange diagonal line on my live view, but my recordings look fine. How can I fix it?
4. **I see a strange diagonal line on my live view, but my recordings look fine. How can I fix it?**
This is caused by incorrect dimensions set in your detect width or height (or dimensions that were incorrectly auto-detected), causing the jsmpeg player's rendering engine to display a slightly distorted image. You should enlarge the width and height of your `detect` resolution up to a standard aspect ratio (for example: 640x352 becomes 640x360, 800x443 becomes 800x450, and 2688x1520 becomes 2688x1512). If changing the resolution to match a standard aspect ratio (4:3, 16:9, 32:9, etc.) does not solve the issue, you can enable "compatibility mode" in your camera group dashboard's stream settings. Depending on your browser and device, more than a few cameras in compatibility mode may not be supported, so only use this option if changing your `detect` width and height fails to resolve the color artifacts and diagonal line.
5. How does "smart streaming" work?
5. **How does "smart streaming" work?**
Because a static image of a scene looks exactly the same as a live stream with no motion or activity, smart streaming updates your camera images once per minute when no detectable activity is occurring to conserve bandwidth and resources. As soon as any activity (motion or object/audio detection) occurs, cameras seamlessly switch to a live stream.
This static image is pulled from the stream defined in your config with the `detect` role. When activity is detected, images from the `detect` stream immediately begin updating at ~5 frames per second so you can see the activity until the live player is loaded and begins playing. This usually only takes a second or two. If the live player times out, buffers, or has streaming errors, the jsmpeg player is loaded and plays a video-only stream from the `detect` role. When activity ends, the players are destroyed and a static image is displayed until activity is detected again, and the process repeats.
This is Frigate's default and recommended setting because it results in a significant bandwidth savings, especially for high resolution cameras.
6. I have unmuted some cameras on my dashboard, but I do not hear sound. Why?
6. **I have unmuted some cameras on my dashboard, but I do not hear sound. Why?**
If your camera is streaming (as indicated by a red dot in the upper right, or if it has been set to continuous streaming mode), your browser may be blocking audio until you interact with the page. This is an intentional browser limitation. See [this article](https://developer.mozilla.org/en-US/docs/Web/Media/Autoplay_guide#autoplay_availability). Many browsers have a whitelist feature to change this behavior.

View File

@ -14,6 +14,7 @@ In order to use notifications the following requirements must be met:
- Frigate must be accessed via a secure `https` connection ([see the authorization docs](/configuration/authentication)).
- A supported browser must be used. Currently Chrome, Firefox, and Safari are known to be supported.
- In order for notifications to be usable externally, Frigate must be accessible externally.
- For iOS devices, some users have also indicated that the Notifications switch needs to be enabled in iOS Settings --> Apps --> Safari --> Advanced --> Features.
### Configuration

View File

@ -10,25 +10,31 @@ title: Object Detectors
Frigate supports multiple different detectors that work on different types of hardware:
**Most Hardware**
- [Coral EdgeTPU](#edge-tpu-detector): The Google Coral EdgeTPU is available in USB and m.2 format allowing for a wide range of compatibility with devices.
- [Hailo](#hailo-8l): The Hailo8 AI Acceleration module is available in m.2 format and with a HAT for RPi devices, offering broad compatibility.
**AMD**
- [ROCm](#amdrocm-gpu-detector): ROCm can run on AMD Discrete GPUs to provide efficient object detection.
- [ONNX](#onnx): ROCm will automatically be detected and used as a detector in the `-rocm` Frigate image when a supported ONNX model is configured.
**Intel**
- [OpenVino](#openvino-detector): OpenVino can run on Intel Arc GPUs, Intel integrated GPUs, and Intel CPUs to provide efficient object detection.
- [ONNX](#onnx): OpenVINO will automatically be detected and used as a detector in the default Frigate image when a supported ONNX model is configured.
**Nvidia**
- [TensorRT](#nvidia-tensorrt-detector): TensorRT can run on Nvidia GPUs and Jetson devices, using one of many default models.
- [ONNX](#onnx): TensorRT will automatically be detected and used as a detector in the `-tensorrt` or `-tensorrt-jp(4/5)` Frigate images when a supported ONNX model is configured.
**Rockchip**
- [RKNN](#rockchip-platform): RKNN models can run on Rockchip devices with included NPUs.
**For Testing**
- [CPU Detector (not recommended for actual use)](#cpu-detector-not-recommended): Use a CPU to run a tflite model. This is not recommended, and in most cases OpenVINO can be used in CPU mode with better results.
:::
@ -43,7 +49,7 @@ This does not affect using hardware for accelerating other tasks such as [semant
# Officially Supported Detectors
Frigate provides the following builtin detector types: `cpu`, `edgetpu`, `hailo8l`, `onnx`, `openvino`, `rknn`, `rocm`, and `tensorrt`. By default, Frigate will use a single CPU detector. Other detectors may require additional configuration as described below. When using multiple detectors they will run in dedicated processes, but pull from a common queue of detection requests from across all cameras.
Frigate provides the following builtin detector types: `cpu`, `edgetpu`, `hailo8l`, `onnx`, `openvino`, `rknn`, and `tensorrt`. By default, Frigate will use a single CPU detector. Other detectors may require additional configuration as described below. When using multiple detectors they will run in dedicated processes, but pull from a common queue of detection requests from across all cameras.
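As a sketch, multiple detectors can be defined side by side and Frigate will spread detection requests across them; the detector names are arbitrary and the `device` values depend on your hardware:

```yaml
detectors:
  coral1:
    type: edgetpu
    device: usb:0
  coral2:
    type: edgetpu
    device: usb:1
```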
## Edge TPU Detector
@ -147,7 +153,6 @@ model:
path: /config/model_cache/h8l_cache/ssd_mobilenet_v1.hef
```
## OpenVINO Detector
The OpenVINO detector type runs an OpenVINO IR model on AMD and Intel CPUs, Intel GPUs and Intel VPU hardware. To configure an OpenVINO detector, set the `"type"` attribute to `"openvino"`.
@ -225,7 +230,7 @@ Note that the labelmap uses a subset of the complete COCO label set that has onl
#### YOLOv9
[YOLOv9](https://github.com/MultimediaTechLab/YOLO) models are supported, but not included by default.
[YOLOv9](https://github.com/WongKinYiu/yolov9) models are supported, but not included by default.
:::tip
@ -362,7 +367,7 @@ model:
### Setup
The `rocm` detector supports running YOLO-NAS models on AMD GPUs. Use a frigate docker image with `-rocm` suffix, for example `ghcr.io/blakeblackshear/frigate:stable-rocm`.
Support for AMD GPUs is provided using the [ONNX detector](#ONNX). In order to utilize the AMD GPU for object detection use a frigate docker image with `-rocm` suffix, for example `ghcr.io/blakeblackshear/frigate:stable-rocm`.
### Docker settings for GPU access
@ -412,7 +417,7 @@ When using docker compose:
```yaml
services:
frigate:
...
environment:
HSA_OVERRIDE_GFX_VERSION: "9.0.0"
```
@ -441,29 +446,9 @@ $ docker exec -it frigate /bin/bash -c '(unset HSA_OVERRIDE_GFX_VERSION && /opt/
### Supported Models
There is no default model provided, the following formats are supported:
#### YOLO-NAS
[YOLO-NAS](https://github.com/Deci-AI/super-gradients/blob/master/YOLONAS.md) models are supported, but not included by default. See [the models section](#downloading-yolo-nas-model) for more information on downloading the YOLO-NAS model for use in Frigate.
After placing the downloaded onnx model in your config folder, you can use the following configuration:
```yaml
detectors:
rocm:
type: rocm
model:
model_type: yolonas
width: 320 # <--- should match whatever was set in notebook
height: 320 # <--- should match whatever was set in notebook
input_pixel_format: bgr
path: /config/yolo_nas_s.onnx
labelmap_path: /labelmap/coco-80.txt
```
Note that the labelmap uses a subset of the complete COCO label set that has only 80 objects.
See [ONNX supported models](#supported-models) for supported models; there are some caveats:
- D-FINE models are not supported
- YOLO-NAS models are known to not run well on integrated GPUs
## ONNX
@ -528,7 +513,7 @@ model:
#### YOLOv9
[YOLOv9](https://github.com/MultimediaTechLab/YOLO) models are supported, but not included by default.
[YOLOv9](https://github.com/WongKinYiu/yolov9) models are supported, but not included by default.
:::tip
@ -555,6 +540,35 @@ model:
Note that the labelmap uses a subset of the complete COCO label set that has only 80 objects.
#### D-FINE
[D-FINE](https://github.com/Peterande/D-FINE) is the [current state of the art](https://paperswithcode.com/sota/real-time-object-detection-on-coco?p=d-fine-redefine-regression-task-in-detrs-as) at the time of writing. The ONNX exported models are supported, but not included by default. See [the models section](#downloading-d-fine-model) for more information on downloading the D-FINE model for use in Frigate.
:::warning
D-FINE is currently not supported on OpenVINO
:::
After placing the downloaded onnx model in your config/model_cache folder, you can use the following configuration:
```yaml
detectors:
onnx:
type: onnx
model:
model_type: dfine
width: 640
height: 640
input_tensor: nchw
input_dtype: float
path: /config/model_cache/dfine_m_obj2coco.onnx
labelmap_path: /labelmap/coco-80.txt
```
Note that the labelmap uses a subset of the complete COCO label set that has only 80 objects.
## CPU Detector (not recommended)
The CPU detector type runs a TensorFlow Lite model utilizing the CPU without hardware acceleration. It is recommended to use a hardware accelerated detector type instead for better performance. To configure a CPU based detector, set the `"type"` attribute to `"cpu"`.
@ -704,7 +718,7 @@ To convert a onnx model to the rknn format using the [rknn-toolkit2](https://git
This is an example configuration file that you need to adjust to your specific onnx model:
```yaml
soc: ["rk3562","rk3566", "rk3568", "rk3576", "rk3588"]
soc: ["rk3562", "rk3566", "rk3568", "rk3576", "rk3588"]
quantization: false
output_name: "{input_basename}"
@ -735,6 +749,29 @@ Some model types are not included in Frigate by default.
Here are some tips for getting different model types
### Downloading D-FINE Model
To export as ONNX:
1. Clone: https://github.com/Peterande/D-FINE and install all dependencies.
2. Select and download a checkpoint from the [readme](https://github.com/Peterande/D-FINE).
3. Modify line 58 of `tools/deployment/export_onnx.py` and change batch size to 1: `data = torch.rand(1, 3, 640, 640)`
4. Run the export, making sure you select the right config for your checkpoint.
Example:
```
python3 tools/deployment/export_onnx.py -c configs/dfine/objects365/dfine_hgnetv2_m_obj2coco.yml -r output/dfine_m_obj2coco.pth
```
:::tip
Model export has only been tested on Linux (or WSL2). Not all dependencies are in `requirements.txt`. Some live in the deployment folder, and some are still missing entirely and must be installed manually.
Make sure you change the batch size to 1 before exporting.
:::
### Downloading YOLO-NAS Model
You can build and download a compatible model with pre-trained weights using [this notebook](https://github.com/blakeblackshear/frigate/blob/dev/notebooks/YOLO_NAS_Pretrained_Export.ipynb) [![Open In Colab](https://colab.research.google.com/assets/colab-badge.svg)](https://colab.research.google.com/github/blakeblackshear/frigate/blob/dev/notebooks/YOLO_NAS_Pretrained_Export.ipynb).

View File

@ -183,6 +183,8 @@ record:
sync_recordings: True
```
This feature is meant to fix variations in files, not completely delete entries in the database. If you delete all of your media, don't use `sync_recordings`; just stop Frigate, delete the `frigate.db` database, and restart.
:::warning
The sync operation uses considerable CPU resources and in most cases is not needed, only enable when necessary.

View File

@ -255,6 +255,8 @@ ffmpeg:
# Optional: Detect configuration
# NOTE: Can be overridden at the camera level
detect:
# Optional: enables detection for the camera (default: shown below)
enabled: False
# Optional: width of the frame for the input with the detect role (default: use native stream resolution)
width: 1280
# Optional: height of the frame for the input with the detect role (default: use native stream resolution)
@ -262,8 +264,6 @@ detect:
# Optional: desired fps for your camera for the input with the detect role (default: shown below)
# NOTE: Recommended value of 5. Ideally, try and reduce your FPS on the camera.
fps: 5
# Optional: enables detection for the camera (default: True)
enabled: True
# Optional: Number of consecutive detection hits required for an object to be initialized in the tracker. (default: 1/2 the frame rate)
min_initialized: 2
# Optional: Number of frames without a detection before Frigate considers an object to be gone. (default: 5x the frame rate)
@ -536,6 +536,8 @@ semantic_search:
enabled: False
# Optional: Re-index embeddings database from historical tracked objects (default: shown below)
reindex: False
# Optional: Set the model used for embeddings. (default: shown below)
model: "jinav1"
# Optional: Set the model size used for embeddings. (default: shown below)
# NOTE: small model runs on CPU and large model runs on GPU
model_size: "small"
@ -568,7 +570,6 @@ lpr:
known_plates: {}
# Optional: Configuration for AI generated tracked object descriptions
# NOTE: Semantic Search must be enabled for this to do anything.
# WARNING: Depending on the provider, this will send thumbnails over the internet
# to Google or OpenAI's LLMs to generate descriptions. It can be overridden at
# the camera level (enabled: False) to enhance privacy for indoor cameras.
@ -812,6 +813,12 @@ cameras:
- cat
# Optional: Restrict generation to objects that entered any of the listed zones (default: none, all zones qualify)
required_zones: []
# Optional: What triggers to use to send frames for a tracked object to generative AI (default: shown below)
send_triggers:
# Once the object is no longer tracked
tracked_object_end: True
# Optional: After X many significant updates are received (default: shown below)
after_significant_updates: None
# Optional: Save thumbnails sent to generative AI for review/debugging purposes (default: shown below)
debug_save_thumbnails: False

View File

@ -5,7 +5,7 @@ title: Semantic Search
Semantic Search in Frigate allows you to find tracked objects within your review items using either the image itself, a user-defined text description, or an automatically generated one. This feature works by creating _embeddings_ — numerical vector representations — for both the images and text descriptions of your tracked objects. By comparing these embeddings, Frigate assesses their similarities to deliver relevant search results.
Frigate uses [Jina AI's CLIP model](https://huggingface.co/jinaai/jina-clip-v1) to create and save embeddings to Frigate's database. All of this runs locally.
Frigate uses models from [Jina AI](https://huggingface.co/jinaai) to create and save embeddings to Frigate's database. All of this runs locally.
Semantic Search is accessed via the _Explore_ view in the Frigate UI.
@ -35,23 +35,47 @@ If you are enabling Semantic Search for the first time, be advised that Frigate
:::
### Jina AI CLIP
### Jina AI CLIP (version 1)
The vision model is able to embed both images and text into the same vector space, which allows `image -> image` and `text -> image` similarity searches. Frigate uses this model on tracked objects to encode the thumbnail image and store it in the database. When searching for tracked objects via text in the search box, Frigate will perform a `text -> image` similarity search against this embedding. When clicking "Find Similar" in the tracked object detail pane, Frigate will perform an `image -> image` similarity search to retrieve the closest matching thumbnails.
The [V1 model from Jina](https://huggingface.co/jinaai/jina-clip-v1) has a vision model which is able to embed both images and text into the same vector space, which allows `image -> image` and `text -> image` similarity searches. Frigate uses this model on tracked objects to encode the thumbnail image and store it in the database. When searching for tracked objects via text in the search box, Frigate will perform a `text -> image` similarity search against this embedding. When clicking "Find Similar" in the tracked object detail pane, Frigate will perform an `image -> image` similarity search to retrieve the closest matching thumbnails.
The text model is used to embed tracked object descriptions and perform searches against them. Descriptions can be created, viewed, and modified on the Explore page when clicking on thumbnail of a tracked object. See [the Generative AI docs](/configuration/genai.md) for more information on how to automatically generate tracked object descriptions.
The V1 text model is used to embed tracked object descriptions and perform searches against them. Descriptions can be created, viewed, and modified on the Explore page when clicking on the thumbnail of a tracked object. See [the Generative AI docs](/configuration/genai.md) for more information on how to automatically generate tracked object descriptions.
Differently weighted versions of the Jina model are available and can be selected by setting the `model_size` config option as `small` or `large`:
Differently weighted versions of the Jina models are available and can be selected by setting the `model_size` config option as `small` or `large`:
```yaml
semantic_search:
enabled: True
model: "jinav1"
model_size: small
```
- Configuring the `large` model employs the full Jina model and will automatically run on the GPU if applicable.
- Configuring the `small` model employs a quantized version of the Jina model that uses less RAM and runs on CPU with a very negligible difference in embedding quality.
### Jina AI CLIP (version 2)
Frigate also supports the [V2 model from Jina](https://huggingface.co/jinaai/jina-clip-v2), which introduces multilingual support (89 languages). In contrast, the V1 model only supports English.
V2 offers only a 3% performance improvement over V1 in both text-image and text-text retrieval tasks, an upgrade that is unlikely to yield noticeable real-world benefits. Additionally, V2 has _significantly_ higher RAM and GPU requirements, leading to increased inference time and memory usage. If you plan to use V2, ensure your system has ample RAM and a discrete GPU. CPU inference (with the `small` model) using V2 is not recommended.
To use the V2 model, update the `model` parameter in your config:
```yaml
semantic_search:
enabled: True
model: "jinav2"
model_size: large
```
For most users, especially native English speakers, the V1 model remains the recommended choice.
:::note
Switching between V1 and V2 requires reindexing your embeddings. To do this, set `reindex: True` in your Semantic Search configuration and restart Frigate. The embeddings from V1 and V2 are incompatible, and failing to reindex will result in incorrect search results.
:::
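For example, switching to the V2 model while forcing a reindex might look like this sketch:

```yaml
semantic_search:
  enabled: True
  model: "jinav2"
  model_size: large
  reindex: True
```

After the reindex completes, you will likely want to set `reindex` back to `False` (or remove it) so embeddings are not rebuilt on every restart.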
### GPU Acceleration
The CLIP models are downloaded in ONNX format, and the `large` model can be accelerated using GPU hardware, when available. This depends on the Docker build that is used.

View File

@ -140,12 +140,12 @@ cameras:
zones:
street:
coordinates: 0.033,0.306,0.324,0.138,0.439,0.185,0.042,0.428
distances: 10,12,11,13.5
distances: 10,12,11,13.5 # in meters or feet
```
Each number in the `distances` field represents the real-world distance between the points in the `coordinates` list. So in the example above, the distance between the first two points ([0.033,0.306] and [0.324,0.138]) is 10. The distance between the second and third set of points ([0.324,0.138] and [0.439,0.185]) is 12, and so on. The fastest and most accurate way to configure this is through the Zone Editor in the Frigate UI.
The `distance` values are measured in meters or feet, depending on how `unit_system` is configured in your `ui` config:
The values in `distances` are measured in meters (metric) or feet (imperial), depending on how `unit_system` is configured in your `ui` config:
```yaml
ui:
@ -153,7 +153,9 @@ ui:
unit_system: metric
```
The average speed of your object as it moved through your zone is saved in Frigate's database and can be seen in the UI in the Tracked Object Details pane in Explore. Current estimated speed can also be seen on the debug view as the third value in the object label (see the caveats below). Current estimated speed, average estimated speed, and velocity angle (the angle of the direction the object is moving relative to the frame) of tracked objects is also sent through the `events` MQTT topic. See the [MQTT docs](../integrations/mqtt.md#frigateevents). These speed values are output as a number in miles per hour (mph) or kilometers per hour (kph), depending on how `unit_system` is configured in your `ui` config.
The average speed of your object as it moved through your zone is saved in Frigate's database and can be seen in the UI in the Tracked Object Details pane in Explore. Current estimated speed can also be seen on the debug view as the third value in the object label (see the caveats below). Current estimated speed, average estimated speed, and velocity angle (the angle of the direction the object is moving relative to the frame) of tracked objects is also sent through the `events` MQTT topic. See the [MQTT docs](../integrations/mqtt.md#frigateevents).
These speed values are output as a number in miles per hour (mph) or kilometers per hour (kph). For miles per hour, set `unit_system` to `imperial`. For kilometers per hour, set `unit_system` to `metric`.
#### Best practices and caveats

View File

@ -80,12 +80,12 @@ The Frigate container also stores logs in shm, which can take up to **40MB**, so
You can calculate the **minimum** shm size for each camera with the following formula using the resolution specified for detect:
```console
# Replace <width> and <height>
# Template for one camera without logs, replace <width> and <height>
$ python -c 'print("{:.2f}MB".format((<width> * <height> * 1.5 * 20 + 270480) / 1048576))'
# Example for 1280x720, including logs
$ python -c 'print("{:.2f}MB".format((1280 * 720 * 1.5 * 20 + 270480) / 1048576)) + 40'
46.63MB
$ python -c 'print("{:.2f}MB".format((1280 * 720 * 1.5 * 20 + 270480) / 1048576 + 40))'
66.63MB
# Example for eight cameras detecting at 1280x720, including logs
$ python -c 'print("{:.2f}MB".format(((1280 * 720 * 1.5 * 20 + 270480) / 1048576) * 8 + 40))'

View File

@ -151,8 +151,6 @@ cameras:
- path: rtsp://10.0.10.10:554/rtsp # <----- The stream you want to use for detection
roles:
- detect
detect:
enabled: False # <---- disable detection until you have a working camera feed
```
### Step 2: Start Frigate
@ -177,7 +175,7 @@ services:
frigate:
...
devices:
- /dev/dri/renderD128 # for intel hwaccel, needs to be updated for your hardware
- /dev/dri/renderD128:/dev/dri/renderD128 # for intel hwaccel, needs to be updated for your hardware
...
```
@ -307,7 +305,7 @@ By default, Frigate will retain video of all tracked objects for 10 days. The fu
### Step 7: Complete config
At this point you have a complete config with basic functionality.
At this point you have a complete config with basic functionality.
- View [common configuration examples](../configuration/index.md#common-configuration-examples) for a list of common configuration examples.
- View [full config reference](../configuration/reference.md) for a complete list of configuration options.

View File

@ -222,6 +222,14 @@ Publishes the rms value for audio detected on this camera.
**NOTE:** Requires audio detection to be enabled
### `frigate/<camera_name>/enabled/set`
Topic to turn Frigate's processing of a camera on and off. Expected values are `ON` and `OFF`.
### `frigate/<camera_name>/enabled/state`
Topic with current state of processing for a camera. Published values are `ON` and `OFF`.
### `frigate/<camera_name>/detect/set`
Topic to turn object detection for a camera on and off. Expected values are `ON` and `OFF`.
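As an illustration, these topics can be driven from Home Assistant; this sketch assumes an MQTT integration on the same broker and a camera named `front_door`:

```yaml
automation:
  - alias: "Disable Frigate camera overnight" # illustrative name
    trigger:
      - platform: time
        at: "23:00:00"
    action:
      - service: mqtt.publish
        data:
          topic: frigate/front_door/enabled/set
          payload: "OFF"
```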

View File

@ -28,11 +28,11 @@ Not all model types are supported by all detectors, so it's important to choose
## Supported detector types
Currently, Frigate+ models support CPU (`cpu`), Google Coral (`edgetpu`), OpenVino (`openvino`), ONNX (`onnx`), and ROCm (`rocm`) detectors.
Currently, Frigate+ models support CPU (`cpu`), Google Coral (`edgetpu`), OpenVino (`openvino`), and ONNX (`onnx`) detectors.
:::warning
Using Frigate+ models with `onnx` and `rocm` is only available with Frigate 0.15 and later.
Using Frigate+ models with `onnx` is only available with Frigate 0.15 and later.
:::
@ -42,7 +42,7 @@ Using Frigate+ models with `onnx` and `rocm` is only available with Frigate 0.15
| [Coral (all form factors)](/configuration/object_detectors.md#edge-tpu-detector) | `edgetpu` | `mobiledet` |
| [Intel](/configuration/object_detectors.md#openvino-detector) | `openvino` | `yolonas` |
| [NVidia GPU](https://deploy-preview-13787--frigate-docs.netlify.app/configuration/object_detectors#onnx)\* | `onnx` | `yolonas` |
| [AMD ROCm GPU](https://deploy-preview-13787--frigate-docs.netlify.app/configuration/object_detectors#amdrocm-gpu-detector)\* | `rocm` | `yolonas` |
| [AMD ROCm GPU](https://deploy-preview-13787--frigate-docs.netlify.app/configuration/object_detectors#amdrocm-gpu-detector)\* | `onnx` | `yolonas` |
_\* Requires Frigate 0.15_

View File

@ -10,6 +10,12 @@ There are many possible causes for a USB coral not being detected and some are O
1. When the device is first plugged in and has not initialized it will appear as `1a6e:089a Global Unichip Corp.` when running `lsusb` or checking the hardware page in HA OS.
2. Once initialized, the device will appear as `18d1:9302 Google Inc.` when running `lsusb` or checking the hardware page in HA OS.
:::tip
Using `lsusb` or checking the hardware page in HA OS will show the device as `1a6e:089a Global Unichip Corp.` until Frigate runs an inference using the coral. So don't worry about the identification until after Frigate has attempted to detect the coral.
:::
If the coral does not initialize, then Frigate cannot interface with it. Some common reasons for the USB-based Coral not initializing are:
### Not Enough Power

View File

@ -22,6 +22,7 @@ from markupsafe import escape
from peewee import operator
from pydantic import ValidationError
from frigate.api.auth import require_role
from frigate.api.defs.query.app_query_parameters import AppTimelineHourlyQueryParameters
from frigate.api.defs.request.app_body import AppConfigSetBody
from frigate.api.defs.tags import Tags
@ -201,7 +202,7 @@ def config_raw():
)
@router.post("/config/save")
@router.post("/config/save", dependencies=[Depends(require_role(["admin"]))])
def config_save(save_option: str, body: Any = Body(media_type="text/plain")):
new_config = body.decode()
if not new_config:
@ -326,7 +327,7 @@ def config_save(save_option: str, body: Any = Body(media_type="text/plain")):
)
@router.put("/config/set")
@router.put("/config/set", dependencies=[Depends(require_role(["admin"]))])
def config_set(request: Request, body: AppConfigSetBody):
config_file = find_config_file()
@ -542,7 +543,7 @@ async def logs(
)
@router.post("/restart")
@router.post("/restart", dependencies=[Depends(require_role(["admin"]))])
def restart():
try:
restart_frigate()

View File

@ -11,8 +11,9 @@ import secrets
import time
from datetime import datetime
from pathlib import Path
from typing import List
from fastapi import APIRouter, Request, Response
from fastapi import APIRouter, Depends, HTTPException, Request, Response
from fastapi.responses import JSONResponse, RedirectResponse
from joserfc import jwt
from peewee import DoesNotExist
@ -22,6 +23,7 @@ from frigate.api.defs.request.app_body import (
AppPostLoginBody,
AppPostUsersBody,
AppPutPasswordBody,
AppPutRoleBody,
)
from frigate.api.defs.tags import Tags
from frigate.config import AuthConfig, ProxyConfig
@ -169,8 +171,10 @@ def verify_password(password, password_hash):
return secrets.compare_digest(password_hash, compare_hash)
def create_encoded_jwt(user, expiration, secret):
return jwt.encode({"alg": "HS256"}, {"sub": user, "exp": expiration}, secret)
def create_encoded_jwt(user, role, expiration, secret):
return jwt.encode(
{"alg": "HS256"}, {"sub": user, "role": role, "exp": expiration}, secret
)
def set_jwt_cookie(response: Response, cookie_name, encoded_jwt, expiration, secure):
@ -184,7 +188,48 @@ def set_jwt_cookie(response: Response, cookie_name, encoded_jwt, expiration, sec
)
# Endpoint for use with nginx auth_request
async def get_current_user(request: Request):
JWT_COOKIE_NAME = request.app.frigate_config.auth.cookie_name
encoded_token = request.cookies.get(JWT_COOKIE_NAME)
if not encoded_token:
return JSONResponse(content={"message": "No JWT token found"}, status_code=401)
try:
token = jwt.decode(encoded_token, request.app.jwt_token)
if "sub" not in token.claims or "role" not in token.claims:
return JSONResponse(
content={"message": "Invalid JWT token"}, status_code=401
)
return {"username": token.claims["sub"], "role": token.claims["role"]}
except Exception as e:
logger.error(f"Error parsing JWT: {e}")
return JSONResponse(content={"message": "Invalid JWT token"}, status_code=401)
def require_role(required_roles: List[str]):
async def role_checker(request: Request):
# Get role from header (could be comma-separated)
role_header = request.headers.get("remote-role")
roles = [r.strip() for r in role_header.split(",")] if role_header else []
# Check if we have any roles
if not roles:
raise HTTPException(status_code=403, detail="Role not provided")
# Check if any role matches required_roles
if not any(role in required_roles for role in roles):
raise HTTPException(
status_code=403,
detail=f"Role {', '.join(roles)} not authorized. Required: {', '.join(required_roles)}",
)
# Return the first matching role
return next((role for role in roles if role in required_roles), roles[0])
return role_checker
# Endpoints
@router.get("/auth")
def auth(request: Request):
auth_config: AuthConfig = request.app.frigate_config.auth
@ -195,6 +240,8 @@ def auth(request: Request):
# dont require auth if the request is on the internal port
# this header is set by Frigate's nginx proxy, so it cant be spoofed
if int(request.headers.get("x-server-port", default=0)) == 5000:
success_response.headers["remote-user"] = "anonymous"
success_response.headers["remote-role"] = "admin"
return success_response
fail_response = Response("", status_code=401)
@ -211,14 +258,18 @@ def auth(request: Request):
if not auth_config.enabled:
# pass the user header value from the upstream proxy if a mapping is specified
# or use anonymous if none are specified
if proxy_config.header_map.user is not None:
upstream_user_header_value = request.headers.get(
proxy_config.header_map.user,
default="anonymous",
)
success_response.headers["remote-user"] = upstream_user_header_value
else:
success_response.headers["remote-user"] = "anonymous"
user_header = proxy_config.header_map.user
role_header = proxy_config.header_map.get("role", "Remote-Role")
success_response.headers["remote-user"] = (
request.headers.get(user_header, default="anonymous")
if user_header
else "anonymous"
)
success_response.headers["remote-role"] = (
request.headers.get(role_header, default="viewer")
if role_header
else "viewer"
)
return success_response
# now apply authentication
@ -251,11 +302,15 @@ def auth(request: Request):
if "sub" not in token.claims:
logger.debug("user not set in jwt token")
return fail_response
if "role" not in token.claims:
logger.debug("role not set in jwt token")
return fail_response
if "exp" not in token.claims:
logger.debug("exp not set in jwt token")
return fail_response
user = token.claims.get("sub")
role = token.claims.get("role")
current_time = int(time.time())
# if the jwt is expired
@ -283,7 +338,7 @@ def auth(request: Request):
return fail_response
new_expiration = current_time + JWT_SESSION_LENGTH
new_encoded_jwt = create_encoded_jwt(
user, new_expiration, request.app.jwt_token
user, role, new_expiration, request.app.jwt_token
)
set_jwt_cookie(
success_response,
@ -294,6 +349,7 @@ def auth(request: Request):
)
success_response.headers["remote-user"] = user
success_response.headers["remote-role"] = role
return success_response
except Exception as e:
logger.error(f"Error parsing jwt: {e}")
@ -302,8 +358,16 @@ def auth(request: Request):
@router.get("/profile")
def profile(request: Request):
username = request.headers.get("remote-user")
return JSONResponse(content={"username": username})
username = request.headers.get("remote-user", "anonymous")
if username != "anonymous":
try:
user = User.get_by_id(username)
role = getattr(user, "role", "viewer")
except DoesNotExist:
role = "viewer" # Fallback if user deleted
else:
role = None
return JSONResponse(content={"username": username, "role": role})
@router.get("/logout")
@ -333,8 +397,11 @@ def login(request: Request, body: AppPostLoginBody):
password_hash = db_user.password_hash
if verify_password(password, password_hash):
role = getattr(db_user, "role", "viewer")
if role not in ["admin", "viewer"]:
role = "viewer" # Enforce valid roles
expiration = int(time.time()) + JWT_SESSION_LENGTH
encoded_jwt = create_encoded_jwt(user, expiration, request.app.jwt_token)
encoded_jwt = create_encoded_jwt(user, role, expiration, request.app.jwt_token)
response = Response("", 200)
set_jwt_cookie(
response, JWT_COOKIE_NAME, encoded_jwt, expiration, JWT_COOKIE_SECURE
@ -343,25 +410,31 @@ def login(request: Request, body: AppPostLoginBody):
return JSONResponse(content={"message": "Login failed"}, status_code=401)
@router.get("/users")
@router.get("/users", dependencies=[Depends(require_role(["admin"]))])
def get_users():
exports = User.select(User.username).order_by(User.username).dicts().iterator()
exports = (
User.select(User.username, User.role).order_by(User.username).dicts().iterator()
)
return JSONResponse([e for e in exports])
@router.post("/users")
def create_user(request: Request, body: AppPostUsersBody):
@router.post("/users", dependencies=[Depends(require_role(["admin"]))])
def create_user(
request: Request,
body: AppPostUsersBody,
):
HASH_ITERATIONS = request.app.frigate_config.auth.hash_iterations
if not re.match("^[A-Za-z0-9._]+$", body.username):
JSONResponse(content={"message": "Invalid username"}, status_code=400)
return JSONResponse(content={"message": "Invalid username"}, status_code=400)
role = body.role if body.role in ["admin", "viewer"] else "viewer"
password_hash = hash_password(body.password, iterations=HASH_ITERATIONS)
User.insert(
{
User.username: body.username,
User.password_hash: password_hash,
User.role: role,
User.notification_tokens: [],
}
).execute()
@ -375,15 +448,61 @@ def delete_user(username: str):
@router.put("/users/{username}/password")
def update_password(request: Request, username: str, body: AppPutPasswordBody):
async def update_password(
request: Request,
username: str,
body: AppPutPasswordBody,
):
current_user = await get_current_user(request)
if isinstance(current_user, JSONResponse):
# auth failed
return current_user
current_username = current_user.get("username")
current_role = current_user.get("role")
# viewers can only change their own password
if current_role == "viewer" and current_username != username:
raise HTTPException(
status_code=403, detail="Viewers can only update their own password"
)
HASH_ITERATIONS = request.app.frigate_config.auth.hash_iterations
password_hash = hash_password(body.password, iterations=HASH_ITERATIONS)
User.set_by_id(username, {User.password_hash: password_hash})
User.set_by_id(
username,
{
User.password_hash: password_hash,
},
)
return JSONResponse(content={"success": True})
@router.put(
"/users/{username}/role",
dependencies=[Depends(require_role(["admin"]))],
)
async def update_role(
request: Request,
username: str,
body: AppPutRoleBody,
):
current_user = await get_current_user(request)
if isinstance(current_user, JSONResponse):
# auth failed
return current_user
current_role = current_user.get("role")
# viewers can't change anyone's role
if current_role == "viewer":
raise HTTPException(
status_code=403, detail="Admin role is required to change user roles"
)
if username == "admin":
return JSONResponse(
content={"message": "Cannot modify admin user's role"}, status_code=403
)
if body.role not in ["admin", "viewer"]:
return JSONResponse(
content={"message": "Role must be 'admin' or 'viewer'"}, status_code=400
)
User.set_by_id(username, {User.role: body.role})
return JSONResponse(content={"success": True})

View File

@ -6,13 +6,17 @@ import random
import shutil
import string
from fastapi import APIRouter, Request, UploadFile
from fastapi import APIRouter, Depends, Request, UploadFile
from fastapi.responses import JSONResponse
from pathvalidate import sanitize_filename
from peewee import DoesNotExist
from playhouse.shortcuts import model_to_dict
from frigate.api.auth import require_role
from frigate.api.defs.tags import Tags
from frigate.const import FACE_DIR
from frigate.embeddings import EmbeddingsContext
from frigate.models import Event
logger = logging.getLogger(__name__)
@ -41,7 +45,7 @@ def get_faces():
return JSONResponse(status_code=200, content=face_dict)
@router.post("/faces/reprocess")
@router.post("/faces/reprocess", dependencies=[Depends(require_role(["admin"]))])
def reclassify_face(request: Request, body: dict = None):
if not request.app.frigate_config.face_recognition.enabled:
return JSONResponse(
@ -118,7 +122,7 @@ def train_face(request: Request, name: str, body: dict = None):
)
@router.post("/faces/{name}/create")
@router.post("/faces/{name}/create", dependencies=[Depends(require_role(["admin"]))])
async def create_face(request: Request, name: str):
if not request.app.frigate_config.face_recognition.enabled:
return JSONResponse(
@ -135,7 +139,7 @@ async def create_face(request: Request, name: str):
)
@router.post("/faces/{name}/register")
@router.post("/faces/{name}/register", dependencies=[Depends(require_role(["admin"]))])
async def register_face(request: Request, name: str, file: UploadFile):
if not request.app.frigate_config.face_recognition.enabled:
return JSONResponse(
@ -151,7 +155,7 @@ async def register_face(request: Request, name: str, file: UploadFile):
)
@router.post("/faces/{name}/delete")
@router.post("/faces/{name}/delete", dependencies=[Depends(require_role(["admin"]))])
def deregister_faces(request: Request, name: str, body: dict = None):
if not request.app.frigate_config.face_recognition.enabled:
return JSONResponse(
@ -176,3 +180,36 @@ def deregister_faces(request: Request, name: str, body: dict = None):
content=({"success": True, "message": "Successfully deleted faces."}),
status_code=200,
)
@router.put("/lpr/reprocess")
def reprocess_license_plate(request: Request, event_id: str):
if not request.app.frigate_config.lpr.enabled:
message = "License plate recognition is not enabled."
logger.error(message)
return JSONResponse(
content=(
{
"success": False,
"message": message,
}
),
status_code=400,
)
try:
event = Event.get(Event.id == event_id)
except DoesNotExist:
message = f"Event {event_id} not found"
logger.error(message)
return JSONResponse(
content=({"success": False, "message": message}), status_code=404
)
context: EmbeddingsContext = request.app.embeddings
response = context.reprocess_plate(model_to_dict(event))
return JSONResponse(
content=response,
status_code=200,
)

View File

@ -1,3 +1,5 @@
from typing import Optional
from pydantic import BaseModel
@ -12,8 +14,13 @@ class AppPutPasswordBody(BaseModel):
class AppPostUsersBody(BaseModel):
username: str
password: str
role: Optional[str] = "viewer"
class AppPostLoginBody(BaseModel):
user: str
password: str
class AppPutRoleBody(BaseModel):
role: str

View File

@ -12,7 +12,7 @@ class EventResponse(BaseModel):
end_time: Optional[float]
false_positive: Optional[bool]
zones: list[str]
thumbnail: str
thumbnail: Optional[str]
has_clip: bool
has_snapshot: bool
retain_indefinitely: bool

View File

@ -14,6 +14,7 @@ from fastapi.responses import JSONResponse
from peewee import JOIN, DoesNotExist, fn, operator
from playhouse.shortcuts import model_to_dict
from frigate.api.auth import require_role
from frigate.api.defs.query.events_query_parameters import (
DEFAULT_TIME_RANGE,
EventsQueryParams,
@ -708,7 +709,11 @@ def event(event_id: str):
return JSONResponse(content="Event not found", status_code=404)
@router.post("/events/{event_id}/retain", response_model=GenericResponse)
@router.post(
"/events/{event_id}/retain",
response_model=GenericResponse,
dependencies=[Depends(require_role(["admin"]))],
)
def set_retain(event_id: str):
try:
event = Event.get(Event.id == event_id)
@ -928,7 +933,11 @@ def false_positive(request: Request, event_id: str):
)
@router.delete("/events/{event_id}/retain", response_model=GenericResponse)
@router.delete(
"/events/{event_id}/retain",
response_model=GenericResponse,
dependencies=[Depends(require_role(["admin"]))],
)
def delete_retain(event_id: str):
try:
event = Event.get(Event.id == event_id)
@ -947,7 +956,11 @@ def delete_retain(event_id: str):
)
@router.post("/events/{event_id}/sub_label", response_model=GenericResponse)
@router.post(
"/events/{event_id}/sub_label",
response_model=GenericResponse,
dependencies=[Depends(require_role(["admin"]))],
)
def set_sub_label(
request: Request,
event_id: str,
@ -991,6 +1004,10 @@ def set_sub_label(
new_sub_label = body.subLabel
new_score = body.subLabelScore
if new_sub_label == "":
new_sub_label = None
new_score = None
if tracked_obj:
tracked_obj.obj_data["sub_label"] = (new_sub_label, new_score)
@ -1001,26 +1018,28 @@ def set_sub_label(
if event:
event.sub_label = new_sub_label
if new_score:
data = event.data
data = event.data
if new_sub_label is None:
data["sub_label_score"] = None
elif new_score is not None:
data["sub_label_score"] = new_score
event.data = data
event.data = data
event.save()
return JSONResponse(
content=(
{
"success": True,
"message": "Event " + event_id + " sub label set to " + new_sub_label,
}
),
content={
"success": True,
"message": f"Event {event_id} sub label set to {new_sub_label if new_sub_label is not None else 'None'}",
},
status_code=200,
)
@router.post("/events/{event_id}/description", response_model=GenericResponse)
@router.post(
"/events/{event_id}/description",
response_model=GenericResponse,
dependencies=[Depends(require_role(["admin"]))],
)
def set_description(
request: Request,
event_id: str,
@ -1067,7 +1086,11 @@ def set_description(
)
@router.put("/events/{event_id}/description/regenerate", response_model=GenericResponse)
@router.put(
"/events/{event_id}/description/regenerate",
response_model=GenericResponse,
dependencies=[Depends(require_role(["admin"]))],
)
def regenerate_description(
request: Request, event_id: str, params: RegenerateQueryParameters = Depends()
):
@ -1081,10 +1104,7 @@ def regenerate_description(
camera_config = request.app.frigate_config.cameras[event.camera]
if (
request.app.frigate_config.semantic_search.enabled
and camera_config.genai.enabled
):
if camera_config.genai.enabled:
request.app.event_metadata_updater.publish((event.id, params.source))
return JSONResponse(
@ -1138,14 +1158,22 @@ def delete_single_event(event_id: str, request: Request) -> dict:
return {"success": True, "message": f"Event {event_id} deleted"}
@router.delete("/events/{event_id}", response_model=GenericResponse)
@router.delete(
"/events/{event_id}",
response_model=GenericResponse,
dependencies=[Depends(require_role(["admin"]))],
)
def delete_event(request: Request, event_id: str):
result = delete_single_event(event_id, request)
status_code = 200 if result["success"] else 404
return JSONResponse(content=result, status_code=status_code)
@router.delete("/events/", response_model=EventMultiDeleteResponse)
@router.delete(
"/events/",
response_model=EventMultiDeleteResponse,
dependencies=[Depends(require_role(["admin"]))],
)
def delete_events(request: Request, body: EventsDeleteBody):
if not body.event_ids:
return JSONResponse(
@ -1171,7 +1199,11 @@ def delete_events(request: Request, body: EventsDeleteBody):
return JSONResponse(content=response, status_code=200)
@router.post("/events/{camera_name}/{label}/create", response_model=EventCreateResponse)
@router.post(
"/events/{camera_name}/{label}/create",
response_model=EventCreateResponse,
dependencies=[Depends(require_role(["admin"]))],
)
def create_event(
request: Request,
camera_name: str,
@ -1227,7 +1259,11 @@ def create_event(
)
@router.put("/events/{event_id}/end", response_model=GenericResponse)
@router.put(
"/events/{event_id}/end",
response_model=GenericResponse,
dependencies=[Depends(require_role(["admin"]))],
)
def end_event(request: Request, event_id: str, body: EventsEndBody):
try:
end_time = body.end_time or datetime.datetime.now().timestamp()

View File

@ -6,11 +6,12 @@ import string
from pathlib import Path
import psutil
from fastapi import APIRouter, Request
from fastapi import APIRouter, Depends, Request
from fastapi.responses import JSONResponse
from peewee import DoesNotExist
from playhouse.shortcuts import model_to_dict
from frigate.api.auth import require_role
from frigate.api.defs.request.export_recordings_body import ExportRecordingsBody
from frigate.api.defs.request.export_rename_body import ExportRenameBody
from frigate.api.defs.tags import Tags
@ -130,7 +131,9 @@ def export_recording(
)
@router.patch("/export/{event_id}/rename")
@router.patch(
"/export/{event_id}/rename", dependencies=[Depends(require_role(["admin"]))]
)
def export_rename(event_id: str, body: ExportRenameBody):
try:
export: Export = Export.get(Export.id == event_id)
@ -158,7 +161,7 @@ def export_rename(event_id: str, body: ExportRenameBody):
)
@router.delete("/export/{event_id}")
@router.delete("/export/{event_id}", dependencies=[Depends(require_role(["admin"]))])
def export_delete(event_id: str):
try:
export: Export = Export.get(Export.id == event_id)

View File

@ -31,6 +31,7 @@ from frigate.config import FrigateConfig
from frigate.const import (
CACHE_DIR,
CLIPS_DIR,
INSTALL_DIR,
MAX_SEGMENT_DURATION,
PREVIEW_FRAME_TYPE,
RECORD_DIR,
@ -155,7 +156,9 @@ def latest_frame(
frame_processor.get_current_frame_time(camera_name) + retry_interval
):
if request.app.camera_error_image is None:
error_image = glob.glob("/opt/frigate/frigate/images/camera-error.jpg")
error_image = glob.glob(
os.path.join(INSTALL_DIR, "frigate/images/camera-error.jpg")
)
if len(error_image) > 0:
request.app.camera_error_image = cv2.imread(
@ -550,7 +553,7 @@ def recording_clip(
)
file_name = sanitize_filename(f"playlist_{camera_name}_{start_ts}-{end_ts}.txt")
file_path = f"/tmp/cache/{file_name}"
file_path = os.path.join(CACHE_DIR, file_name)
with open(file_path, "w") as file:
clip: Recordings
for clip in recordings:

View File

@ -9,7 +9,7 @@ from fastapi import APIRouter
from fastapi.responses import JSONResponse
from frigate.api.defs.tags import Tags
from frigate.const import CACHE_DIR, PREVIEW_FRAME_TYPE
from frigate.const import BASE_DIR, CACHE_DIR, PREVIEW_FRAME_TYPE
from frigate.models import Previews
logger = logging.getLogger(__name__)
@ -52,7 +52,7 @@ def preview_ts(camera_name: str, start_ts: float, end_ts: float):
clips.append(
{
"camera": preview["camera"],
"src": preview["path"].replace("/media/frigate", ""),
"src": preview["path"].replace(BASE_DIR, ""),
"type": "video/mp4",
"start": preview["start_time"],
"end": preview["end_time"],

View File

@ -12,6 +12,7 @@ from fastapi.responses import JSONResponse
from peewee import Case, DoesNotExist, fn, operator
from playhouse.shortcuts import model_to_dict
from frigate.api.auth import require_role
from frigate.api.defs.query.review_query_parameters import (
ReviewActivityMotionQueryParams,
ReviewQueryParams,
@ -343,7 +344,11 @@ def set_multiple_reviewed(body: ReviewModifyMultipleBody):
)
@router.post("/reviews/delete", response_model=GenericResponse)
@router.post(
"/reviews/delete",
response_model=GenericResponse,
dependencies=[Depends(require_role(["admin"]))],
)
def delete_reviews(body: ReviewModifyMultipleBody):
list_of_ids = body.ids
reviews = (

View File

@ -93,7 +93,13 @@ class FrigateApp:
self.log_queue: Queue = mp.Queue()
self.camera_metrics: dict[str, CameraMetrics] = {}
self.embeddings_metrics: DataProcessorMetrics | None = (
DataProcessorMetrics() if config.semantic_search.enabled else None
DataProcessorMetrics()
if (
config.semantic_search.enabled
or config.lpr.enabled
or config.face_recognition.enabled
)
else None
)
self.ptz_metrics: dict[str, PTZMetrics] = {}
self.processes: dict[str, int] = {}
@ -236,7 +242,16 @@ class FrigateApp:
logger.info(f"Review process started: {review_segment_process.pid}")
def init_embeddings_manager(self) -> None:
if not self.config.semantic_search.enabled:
genai_cameras = [
c for c in self.config.cameras.values() if c.enabled and c.genai.enabled
]
if (
not self.config.semantic_search.enabled
and not genai_cameras
and not self.config.lpr.enabled
and not self.config.face_recognition.enabled
):
return
embedding_process = util.Process(
@ -293,7 +308,16 @@ class FrigateApp:
migrate_exports(self.config.ffmpeg, list(self.config.cameras.keys()))
def init_embeddings_client(self) -> None:
if self.config.semantic_search.enabled:
genai_cameras = [
c for c in self.config.cameras.values() if c.enabled and c.genai.enabled
]
if (
self.config.semantic_search.enabled
or self.config.lpr.enabled
or genai_cameras
or self.config.face_recognition.enabled
):
# Create a client for other processes to use
self.embeddings = EmbeddingsContext(self.db)
@ -596,6 +620,7 @@ class FrigateApp:
)
User.replace(
username="admin",
role="admin",
password_hash=password_hash,
notification_tokens=[],
).execute()

View File

@ -20,7 +20,7 @@ class CameraActivityManager:
self.all_zone_labels: dict[str, set[str]] = {}
for camera_config in config.cameras.values():
if not camera_config.enabled:
if not camera_config.enabled_in_config:
continue
self.last_camera_activity[camera_config.name] = {}
@ -33,7 +33,11 @@ class CameraActivityManager:
self.zone_active_object_counts[zone] = Counter()
self.all_zone_labels[zone] = set()
self.all_zone_labels[zone].update(zone_config.objects)
self.all_zone_labels[zone].update(
zone_config.objects
if zone_config.objects
else camera_config.objects.track
)
def update_activity(self, new_activity: dict[str, dict[str, any]]) -> None:
all_objects: list[dict[str, any]] = []

View File

@ -32,7 +32,9 @@ class ConfigPublisher:
class ConfigSubscriber:
"""Simplifies receiving an updated config."""
def __init__(self, topic: str) -> None:
def __init__(self, topic: str, exact=False) -> None:
self.topic = topic
self.exact = exact
self.context = zmq.Context()
self.socket = self.context.socket(zmq.SUB)
self.socket.setsockopt_string(zmq.SUBSCRIBE, topic)
@ -42,7 +44,12 @@ class ConfigSubscriber:
"""Returns updated config or None if no update."""
try:
topic = self.socket.recv_string(flags=zmq.NOBLOCK)
return (topic, self.socket.recv_pyobj())
obj = self.socket.recv_pyobj()
if not self.exact or self.topic == topic:
return (topic, obj)
else:
return (None, None)
except zmq.ZMQError:
return (None, None)
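
A short usage sketch of the new exact flag: a ZMQ prefix subscription still delivers sibling topics, so exact=True lets a consumer drop anything that is not an exact topic match. The camera name and handler below are placeholders.

    sub = ConfigSubscriber("config/enabled/front_door", exact=True)

    topic, updated_config = sub.check_for_update()
    if topic:
        # Only a publish to exactly config/enabled/front_door reaches this point;
        # a prefix match like config/enabled/front_door_porch is filtered out.
        handle_enabled_change(updated_config)  # hypothetical handler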

View File

@ -55,6 +55,7 @@ class Dispatcher:
self._camera_settings_handlers: dict[str, Callable] = {
"audio": self._on_audio_command,
"detect": self._on_detect_command,
"enabled": self._on_enabled_command,
"improve_contrast": self._on_motion_improve_contrast_command,
"ptz_autotracker": self._on_ptz_autotracker_command,
"motion": self._on_motion_command,
@ -167,6 +168,7 @@ class Dispatcher:
for camera in camera_status.keys():
camera_status[camera]["config"] = {
"detect": self.config.cameras[camera].detect.enabled,
"enabled": self.config.cameras[camera].enabled,
"snapshots": self.config.cameras[camera].snapshots.enabled,
"record": self.config.cameras[camera].record.enabled,
"audio": self.config.cameras[camera].audio.enabled,
@ -278,6 +280,27 @@ class Dispatcher:
self.config_updater.publish(f"config/detect/{camera_name}", detect_settings)
self.publish(f"{camera_name}/detect/state", payload, retain=True)
def _on_enabled_command(self, camera_name: str, payload: str) -> None:
"""Callback for camera enabled topic."""
camera_settings = self.config.cameras[camera_name]
if payload == "ON":
if not self.config.cameras[camera_name].enabled_in_config:
logger.error(
"Camera must be enabled in the config to be turned on via MQTT."
)
return
if not camera_settings.enabled:
logger.info(f"Turning on camera {camera_name}")
camera_settings.enabled = True
elif payload == "OFF":
if camera_settings.enabled:
logger.info(f"Turning off camera {camera_name}")
camera_settings.enabled = False
self.config_updater.publish(f"config/enabled/{camera_name}", camera_settings)
self.publish(f"{camera_name}/enabled/state", payload, retain=True)
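
For reference, toggling a camera from an MQTT client would look roughly like the sketch below, assuming the usual <topic_prefix>/<camera_name>/enabled/set command topic with the default frigate prefix; the host and camera name are placeholders.

    import paho.mqtt.publish as publish

    # Disable the camera; publish "ON" to the same topic to re-enable it.
    publish.single("frigate/front_door/enabled/set", payload="OFF", hostname="mqtt.local")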
def _on_motion_command(self, camera_name: str, payload: str) -> None:
"""Callback for motion topic."""
detect_settings = self.config.cameras[camera_name].detect

View File

@ -15,6 +15,7 @@ class EmbeddingsRequestEnum(Enum):
generate_search = "generate_search"
register_face = "register_face"
reprocess_face = "reprocess_face"
reprocess_plate = "reprocess_plate"
class EmbeddingsResponder:

View File

@ -43,6 +43,11 @@ class MqttClient(Communicator): # type: ignore[misc]
def _set_initial_topics(self) -> None:
"""Set initial state topics."""
for camera_name, camera in self.config.cameras.items():
self.publish(
f"{camera_name}/enabled/state",
"ON" if camera.enabled_in_config else "OFF",
retain=True,
)
self.publish(
f"{camera_name}/recordings/state",
"ON" if camera.record.enabled_in_config else "OFF",
@ -196,6 +201,7 @@ class MqttClient(Communicator): # type: ignore[misc]
# register callbacks
callback_types = [
"enabled",
"recordings",
"snapshots",
"detect",

View File

@ -0,0 +1,36 @@
"""Facilitates communication between processes."""
import logging
from enum import Enum
from .zmq_proxy import Publisher, Subscriber
logger = logging.getLogger(__name__)
class RecordingsDataTypeEnum(str, Enum):
all = ""
recordings_available_through = "recordings_available_through"
class RecordingsDataPublisher(Publisher):
"""Publishes latest recording data."""
topic_base = "recordings/"
def __init__(self, topic: RecordingsDataTypeEnum) -> None:
topic = topic.value
super().__init__(topic)
def publish(self, payload: tuple[str, float]) -> None:
super().publish(payload)
class RecordingsDataSubscriber(Subscriber):
"""Receives latest recording data."""
topic_base = "recordings/"
def __init__(self, topic: RecordingsDataTypeEnum) -> None:
topic = topic.value
super().__init__(topic)
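
A rough usage sketch of this new channel: the recording side publishes the latest timestamp a camera has recordings through, and a consumer (such as the embeddings maintainer) reads it before attempting recording-based post processing. The read helper name is assumed from the shared Subscriber base in zmq_proxy.

    publisher = RecordingsDataPublisher(
        RecordingsDataTypeEnum.recordings_available_through
    )
    publisher.publish(("front_door", 1741522800.0))  # (camera, latest recorded time)

    subscriber = RecordingsDataSubscriber(
        RecordingsDataTypeEnum.recordings_available_through
    )
    update = subscriber.check_for_update()  # assumed Subscriber helper; actual name may differ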

View File

@ -102,6 +102,9 @@ class CameraConfig(FrigateBaseModel):
zones: dict[str, ZoneConfig] = Field(
default_factory=dict, title="Zone configuration."
)
enabled_in_config: Optional[bool] = Field(
default=None, title="Keep track of original state of camera."
)
_ffmpeg_cmds: list[dict[str, list[str]]] = PrivateAttr()

View File

@ -32,6 +32,7 @@ class StationaryConfig(FrigateBaseModel):
class DetectConfig(FrigateBaseModel):
enabled: bool = Field(default=False, title="Detection Enabled.")
height: Optional[int] = Field(
default=None, title="Height of the stream for the detect role."
)
@ -41,7 +42,6 @@ class DetectConfig(FrigateBaseModel):
fps: int = Field(
default=5, title="Number of frames per second to process through detection."
)
enabled: bool = Field(default=True, title="Detection Enabled.")
min_initialized: Optional[int] = Field(
default=None,
title="Minimum number of consecutive hits for an object to be initialized by the tracker.",

View File

@ -1,4 +1,3 @@
import shutil
from enum import Enum
from typing import Union
@ -71,10 +70,7 @@ class FfmpegConfig(FrigateBaseModel):
@property
def ffmpeg_path(self) -> str:
if self.path == "default":
if shutil.which("ffmpeg") is None:
return f"/usr/lib/ffmpeg/{DEFAULT_FFMPEG_VERSION}/bin/ffmpeg"
else:
return "ffmpeg"
return f"/usr/lib/ffmpeg/{DEFAULT_FFMPEG_VERSION}/bin/ffmpeg"
elif self.path in INCLUDED_FFMPEG_VERSIONS:
return f"/usr/lib/ffmpeg/{self.path}/bin/ffmpeg"
else:
@ -83,10 +79,7 @@ class FfmpegConfig(FrigateBaseModel):
@property
def ffprobe_path(self) -> str:
if self.path == "default":
if shutil.which("ffprobe") is None:
return f"/usr/lib/ffmpeg/{DEFAULT_FFMPEG_VERSION}/bin/ffprobe"
else:
return "ffprobe"
return f"/usr/lib/ffmpeg/{DEFAULT_FFMPEG_VERSION}/bin/ffprobe"
elif self.path in INCLUDED_FFMPEG_VERSIONS:
return f"/usr/lib/ffmpeg/{self.path}/bin/ffprobe"
else:

View File

@ -16,6 +16,17 @@ class GenAIProviderEnum(str, Enum):
ollama = "ollama"
class GenAISendTriggersConfig(BaseModel):
tracked_object_end: bool = Field(
default=True, title="Send once the object is no longer tracked."
)
after_significant_updates: Optional[int] = Field(
default=None,
title="Send an early request to generative AI when X frames accumulated.",
ge=1,
)
# uses BaseModel because some global attributes are not available at the camera level
class GenAICameraConfig(BaseModel):
enabled: bool = Field(default=False, title="Enable GenAI for camera.")
@ -42,6 +53,10 @@ class GenAICameraConfig(BaseModel):
default=False,
title="Save thumbnails sent to generative AI for debugging purposes.",
)
send_triggers: GenAISendTriggersConfig = Field(
default_factory=GenAISendTriggersConfig,
title="What triggers to use to send frames to generative AI for a tracked object.",
)
@field_validator("required_zones", mode="before")
@classmethod
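
A small sketch of the new trigger options, instantiated directly against the model above: this combination skips the end-of-tracking request and instead sends a frame to the GenAI provider once three significant updates have accumulated. The values are illustrative.

    triggers = GenAISendTriggersConfig(
        tracked_object_end=False,
        after_significant_updates=3,
    )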

View File

@ -1,3 +1,4 @@
from enum import Enum
from typing import Dict, List, Optional
from pydantic import Field
@ -11,6 +12,11 @@ __all__ = [
]
class SemanticSearchModelEnum(str, Enum):
jinav1 = "jinav1"
jinav2 = "jinav2"
class BirdClassificationConfig(FrigateBaseModel):
enabled: bool = Field(default=False, title="Enable bird classification.")
threshold: float = Field(
@ -30,7 +36,11 @@ class ClassificationConfig(FrigateBaseModel):
class SemanticSearchConfig(FrigateBaseModel):
enabled: bool = Field(default=False, title="Enable semantic search.")
reindex: Optional[bool] = Field(
default=False, title="Reindex all detections on startup."
default=False, title="Reindex all tracked objects on startup."
)
model: Optional[SemanticSearchModelEnum] = Field(
default=SemanticSearchModelEnum.jinav1,
title="The CLIP model to use for semantic search.",
)
model_size: str = Field(
default="small", title="The size of the embeddings model used."
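
A sketch of opting into the new Jina V2 model using the fields defined above; later in this change the embeddings manager loads a single combined text/vision model for jinav2 and drops the reindex batch size to 4.

    semantic_search = SemanticSearchConfig(
        enabled=True,
        model=SemanticSearchModelEnum.jinav2,
        model_size="large",
    )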

View File

@ -172,16 +172,6 @@ class RestreamConfig(BaseModel):
model_config = ConfigDict(extra="allow")
def verify_semantic_search_dependent_configs(config: FrigateConfig) -> None:
"""Verify that semantic search is enabled if required features are enabled."""
if not config.semantic_search.enabled:
if config.genai.enabled:
raise ValueError("Genai requires semantic search to be enabled.")
if config.face_recognition.enabled:
raise ValueError("Face recognition requires semantic to be enabled.")
def verify_config_roles(camera_config: CameraConfig) -> None:
"""Verify that roles are setup in the config correctly."""
assigned_roles = list(
@ -526,6 +516,7 @@ class FrigateConfig(FrigateBaseModel):
camera_config.detect.stationary.interval = stationary_threshold
# set config pre-value
camera_config.enabled_in_config = camera_config.enabled
camera_config.audio.enabled_in_config = camera_config.audio.enabled
camera_config.record.enabled_in_config = camera_config.record.enabled
camera_config.notifications.enabled_in_config = (
@ -647,7 +638,6 @@ class FrigateConfig(FrigateBaseModel):
detector_config.model = model
self.detectors[key] = detector_config
verify_semantic_search_dependent_configs(self)
return self
@field_validator("cameras")

View File

@ -12,6 +12,10 @@ class HeaderMappingConfig(FrigateBaseModel):
user: str = Field(
default=None, title="Header name from upstream proxy to identify user."
)
role: str = Field(
default=None,
title="Header name from upstream proxy to identify user role.",
)
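
A minimal sketch of mapping upstream proxy headers onto the new role field alongside the existing user field; the header names below are examples, not defaults.

    headers = HeaderMappingConfig(
        user="x-forwarded-user",
        role="x-forwarded-role",
    )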
class ProxyConfig(FrigateBaseModel):

View File

@ -1,5 +1,7 @@
import os
import re
INSTALL_DIR = "/opt/frigate"
CONFIG_DIR = "/config"
DEFAULT_DB_PATH = f"{CONFIG_DIR}/frigate.db"
MODEL_CACHE_DIR = f"{CONFIG_DIR}/model_cache"
@ -61,8 +63,9 @@ MAX_WAL_SIZE = 10 # MB
# Ffmpeg constants
DEFAULT_FFMPEG_VERSION = "7.0"
INCLUDED_FFMPEG_VERSIONS = ["7.0", "5.0"]
DEFAULT_FFMPEG_VERSION = os.environ.get("DEFAULT_FFMPEG_VERSION", "")
INCLUDED_FFMPEG_VERSIONS = os.environ.get("INCLUDED_FFMPEG_VERSIONS", "").split(":")
LIBAVFORMAT_VERSION_MAJOR = int(os.environ.get("LIBAVFORMAT_VERSION_MAJOR", "59"))
FFMPEG_HWACCEL_NVIDIA = "preset-nvidia"
FFMPEG_HWACCEL_VAAPI = "preset-vaapi"
FFMPEG_HWACCEL_VULKAN = "preset-vulkan"

View File

@ -13,29 +13,21 @@ from Levenshtein import distance
from pyclipper import ET_CLOSEDPOLYGON, JT_ROUND, PyclipperOffset
from shapely.geometry import Polygon
from frigate.comms.inter_process import InterProcessRequestor
from frigate.config import FrigateConfig
from frigate.const import FRIGATE_LOCALHOST
from frigate.embeddings.functions.onnx import GenericONNXEmbedding, ModelTypeEnum
from frigate.util.image import area
from ..types import DataProcessorMetrics
from .api import RealTimeProcessorApi
logger = logging.getLogger(__name__)
WRITE_DEBUG_IMAGES = False
class LicensePlateProcessor(RealTimeProcessorApi):
def __init__(self, config: FrigateConfig, metrics: DataProcessorMetrics):
super().__init__(config, metrics)
self.requestor = InterProcessRequestor()
self.lpr_config = config.lpr
class LicensePlateProcessingMixin:
def __init__(self, *args, **kwargs):
super().__init__(*args, **kwargs)
self.requires_license_plate_detection = (
"license_plate" not in self.config.objects.all_objects
)
self.detected_license_plates: dict[str, dict[str, any]] = {}
self.ctc_decoder = CTCDecoder()
@ -47,65 +39,6 @@ class LicensePlateProcessor(RealTimeProcessorApi):
self.box_thresh = 0.8
self.mask_thresh = 0.8
self.lpr_detection_model = None
self.lpr_classification_model = None
self.lpr_recognition_model = None
if self.config.lpr.enabled:
self.detection_model = GenericONNXEmbedding(
model_name="paddleocr-onnx",
model_file="detection.onnx",
download_urls={
"detection.onnx": "https://github.com/hawkeye217/paddleocr-onnx/raw/refs/heads/master/models/detection.onnx"
},
model_size="large",
model_type=ModelTypeEnum.lpr_detect,
requestor=self.requestor,
device="CPU",
)
self.classification_model = GenericONNXEmbedding(
model_name="paddleocr-onnx",
model_file="classification.onnx",
download_urls={
"classification.onnx": "https://github.com/hawkeye217/paddleocr-onnx/raw/refs/heads/master/models/classification.onnx"
},
model_size="large",
model_type=ModelTypeEnum.lpr_classify,
requestor=self.requestor,
device="CPU",
)
self.recognition_model = GenericONNXEmbedding(
model_name="paddleocr-onnx",
model_file="recognition.onnx",
download_urls={
"recognition.onnx": "https://github.com/hawkeye217/paddleocr-onnx/raw/refs/heads/master/models/recognition.onnx"
},
model_size="large",
model_type=ModelTypeEnum.lpr_recognize,
requestor=self.requestor,
device="CPU",
)
self.yolov9_detection_model = GenericONNXEmbedding(
model_name="yolov9_license_plate",
model_file="yolov9-256-license-plates.onnx",
download_urls={
"yolov9-256-license-plates.onnx": "https://github.com/hawkeye217/yolov9-license-plates/raw/refs/heads/master/models/yolov9-256-license-plates.onnx"
},
model_size="large",
model_type=ModelTypeEnum.yolov9_lpr_detect,
requestor=self.requestor,
device="CPU",
)
if self.lpr_config.enabled:
# all models need to be loaded to run LPR
self.detection_model._load_model_and_utils()
self.classification_model._load_model_and_utils()
self.recognition_model._load_model_and_utils()
self.yolov9_detection_model._load_model_and_utils()
def _detect(self, image: np.ndarray) -> List[np.ndarray]:
"""
Detect possible license plates in the input image by first resizing and normalizing it,
@ -132,7 +65,7 @@ class LicensePlateProcessor(RealTimeProcessorApi):
resized_image,
)
outputs = self.detection_model([normalized_image])[0]
outputs = self.model_runner.detection_model([normalized_image])[0]
outputs = outputs[0, :, :]
boxes, _ = self._boxes_from_bitmap(outputs, outputs > self.mask_thresh, w, h)
@ -161,7 +94,7 @@ class LicensePlateProcessor(RealTimeProcessorApi):
norm_img = norm_img[np.newaxis, :]
norm_images.append(norm_img)
outputs = self.classification_model(norm_images)
outputs = self.model_runner.classification_model(norm_images)
return self._process_classification_output(images, outputs)
@ -201,7 +134,7 @@ class LicensePlateProcessor(RealTimeProcessorApi):
norm_image = norm_image[np.newaxis, :]
norm_images.append(norm_image)
outputs = self.recognition_model(norm_images)
outputs = self.model_runner.recognition_model(norm_images)
return self.ctc_decoder(outputs)
def _process_license_plate(
@ -217,9 +150,9 @@ class LicensePlateProcessor(RealTimeProcessorApi):
Tuple[List[str], List[float], List[int]]: Detected license plate texts, confidence scores, and areas of the plates.
"""
if (
self.detection_model.runner is None
or self.classification_model.runner is None
or self.recognition_model.runner is None
self.model_runner.detection_model.runner is None
or self.model_runner.classification_model.runner is None
or self.model_runner.recognition_model.runner is None
):
# we might still be downloading the models
logger.debug("Model runners not loaded")
@ -683,7 +616,9 @@ class LicensePlateProcessor(RealTimeProcessorApi):
input_w = int(input_h * max_wh_ratio)
# check for model-specific input width
model_input_w = self.recognition_model.runner.ort.get_inputs()[0].shape[3]
model_input_w = self.model_runner.recognition_model.runner.ort.get_inputs()[
0
].shape[3]
if isinstance(model_input_w, int) and model_input_w > 0:
input_w = model_input_w
@ -750,19 +685,13 @@ class LicensePlateProcessor(RealTimeProcessorApi):
image = np.rot90(image, k=3)
return image
def __update_metrics(self, duration: float) -> None:
"""
Update inference metrics.
"""
self.metrics.alpr_pps.value = (self.metrics.alpr_pps.value * 9 + duration) / 10
def _detect_license_plate(self, input: np.ndarray) -> tuple[int, int, int, int]:
"""
Use a lightweight YOLOv9 model to detect license plates for users without Frigate+
Return the dimensions of the detected plate as [x1, y1, x2, y2].
"""
predictions = self.yolov9_detection_model(input)
predictions = self.model_runner.yolov9_detection_model(input)
confidence_threshold = self.lpr_config.detection_threshold
@ -788,8 +717,8 @@ class LicensePlateProcessor(RealTimeProcessorApi):
# Return the top scoring bounding box if found
if top_box is not None:
# expand box by 15% to help with OCR
expansion = (top_box[2:] - top_box[:2]) * 0.1
# expand box by 30% to help with OCR
expansion = (top_box[2:] - top_box[:2]) * 0.30
# Expand box
expanded_box = np.array(
@ -887,9 +816,22 @@ class LicensePlateProcessor(RealTimeProcessorApi):
# 5. Return True if we should keep the previous plate (i.e., if it scores higher)
return prev_score > curr_score
def process_frame(self, obj_data: dict[str, any], frame: np.ndarray):
def __update_yolov9_metrics(self, duration: float) -> None:
"""
Update inference metrics.
"""
self.metrics.yolov9_lpr_fps.value = (
self.metrics.yolov9_lpr_fps.value * 9 + duration
) / 10
def __update_lpr_metrics(self, duration: float) -> None:
"""
Update inference metrics.
"""
self.metrics.alpr_pps.value = (self.metrics.alpr_pps.value * 9 + duration) / 10
def lpr_process(self, obj_data: dict[str, any], frame: np.ndarray):
"""Look for license plates in image."""
start = datetime.datetime.now().timestamp()
id = obj_data["id"]
@ -915,6 +857,7 @@ class LicensePlateProcessor(RealTimeProcessorApi):
if self.requires_license_plate_detection:
logger.debug("Running manual license_plate detection.")
car_box = obj_data.get("box")
if not car_box:
@ -939,6 +882,9 @@ class LicensePlateProcessor(RealTimeProcessorApi):
logger.debug(
f"YOLOv9 LPD inference time: {(datetime.datetime.now().timestamp() - yolov9_start) * 1000:.2f} ms"
)
self.__update_yolov9_metrics(
datetime.datetime.now().timestamp() - yolov9_start
)
if not license_plate:
logger.debug("Detected no license plates for car object.")
@ -952,7 +898,7 @@ class LicensePlateProcessor(RealTimeProcessorApi):
# check that license plate is valid
# double the value because we've doubled the size of the car
if license_plate_area < self.config.lpr.min_area * 2:
if license_plate_area < self.lpr_config.min_area * 2:
logger.debug("License plate is less than min_area")
return
@ -990,7 +936,7 @@ class LicensePlateProcessor(RealTimeProcessorApi):
# check that license plate is valid
if (
not license_plate_box
or area(license_plate_box) < self.config.lpr.min_area
or area(license_plate_box) < self.lpr_config.min_area
):
logger.debug(f"Invalid license plate box {license_plate}")
return
@ -1017,11 +963,15 @@ class LicensePlateProcessor(RealTimeProcessorApi):
license_plate_frame,
)
start = datetime.datetime.now().timestamp()
# run detection, returns results sorted by confidence, best first
license_plates, confidences, areas = self._process_license_plate(
license_plate_frame
)
self.__update_lpr_metrics(datetime.datetime.now().timestamp() - start)
logger.debug(f"Text boxes: {license_plates}")
logger.debug(f"Confidences: {confidences}")
logger.debug(f"Areas: {areas}")
@ -1096,10 +1046,9 @@ class LicensePlateProcessor(RealTimeProcessorApi):
"plate": top_plate,
"char_confidences": top_char_confidences,
"area": top_area,
"obj_data": obj_data,
}
self.__update_metrics(datetime.datetime.now().timestamp() - start)
def handle_request(self, topic, request_data) -> dict[str, any] | None:
return

View File

@ -0,0 +1,31 @@
from frigate.embeddings.onnx.lpr_embedding import (
LicensePlateDetector,
PaddleOCRClassification,
PaddleOCRDetection,
PaddleOCRRecognition,
)
from ...types import DataProcessorModelRunner
class LicensePlateModelRunner(DataProcessorModelRunner):
def __init__(self, requestor, device: str = "CPU", model_size: str = "large"):
super().__init__(requestor, device, model_size)
self.detection_model = PaddleOCRDetection(
model_size=model_size, requestor=requestor, device=device
)
self.classification_model = PaddleOCRClassification(
model_size=model_size, requestor=requestor, device=device
)
self.recognition_model = PaddleOCRRecognition(
model_size=model_size, requestor=requestor, device=device
)
self.yolov9_detection_model = LicensePlateDetector(
model_size=model_size, requestor=requestor, device=device
)
# Load all models once
self.detection_model._load_model_and_utils()
self.classification_model._load_model_and_utils()
self.recognition_model._load_model_and_utils()
self.yolov9_detection_model._load_model_and_utils()
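
The intent of this runner is to load the four ONNX models once and share them between the real-time and post processors. A rough wiring sketch follows; the names of the surrounding objects are assumptions about the calling code.

    detected_license_plates: dict[str, dict] = {}  # shared between both processors
    model_runner = LicensePlateModelRunner(requestor, device="CPU", model_size="large")

    realtime_lpr = LicensePlateRealTimeProcessor(
        config, metrics, model_runner, detected_license_plates
    )
    post_lpr = LicensePlatePostProcessor(
        config, metrics, model_runner, detected_license_plates
    )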

View File

@ -5,16 +5,22 @@ from abc import ABC, abstractmethod
from frigate.config import FrigateConfig
from ..types import DataProcessorMetrics, PostProcessDataEnum
from ..types import DataProcessorMetrics, DataProcessorModelRunner, PostProcessDataEnum
logger = logging.getLogger(__name__)
class PostProcessorApi(ABC):
@abstractmethod
def __init__(self, config: FrigateConfig, metrics: DataProcessorMetrics) -> None:
def __init__(
self,
config: FrigateConfig,
metrics: DataProcessorMetrics,
model_runner: DataProcessorModelRunner,
) -> None:
self.config = config
self.metrics = metrics
self.model_runner = model_runner
pass
@abstractmethod

View File

@ -0,0 +1,224 @@
"""Handle post processing for license plate recognition."""
import datetime
import logging
import cv2
import numpy as np
from peewee import DoesNotExist
from frigate.comms.embeddings_updater import EmbeddingsRequestEnum
from frigate.config import FrigateConfig
from frigate.data_processing.common.license_plate.mixin import (
WRITE_DEBUG_IMAGES,
LicensePlateProcessingMixin,
)
from frigate.data_processing.common.license_plate.model import (
LicensePlateModelRunner,
)
from frigate.data_processing.types import PostProcessDataEnum
from frigate.models import Recordings
from frigate.util.image import get_image_from_recording
from ..types import DataProcessorMetrics
from .api import PostProcessorApi
logger = logging.getLogger(__name__)
class LicensePlatePostProcessor(LicensePlateProcessingMixin, PostProcessorApi):
def __init__(
self,
config: FrigateConfig,
metrics: DataProcessorMetrics,
model_runner: LicensePlateModelRunner,
detected_license_plates: dict[str, dict[str, any]],
):
self.detected_license_plates = detected_license_plates
self.model_runner = model_runner
self.lpr_config = config.lpr
self.config = config
super().__init__(config, metrics, model_runner)
def process_data(
self, data: dict[str, any], data_type: PostProcessDataEnum
) -> None:
"""Look for license plates in recording stream image
Args:
data (dict): containing data about the input.
data_type (enum): Describing the data that is being processed.
Returns:
None.
"""
event_id = data["event_id"]
camera_name = data["camera"]
if data_type == PostProcessDataEnum.recording:
obj_data = data["obj_data"]
frame_time = obj_data["frame_time"]
recordings_available_through = data["recordings_available"]
if frame_time > recordings_available_through:
logger.debug(
f"LPR post processing: No recordings available for this frame time {frame_time}, available through {recordings_available_through}"
)
elif data_type == PostProcessDataEnum.tracked_object:
# non-functional, need to think about snapshot time
obj_data = data["event"]["data"]
obj_data["id"] = data["event"]["id"]
obj_data["camera"] = data["event"]["camera"]
# TODO: snapshot time?
frame_time = data["event"]["start_time"]
else:
logger.error("No data type passed to LPR postprocessing")
return
recording_query = (
Recordings.select(
Recordings.path,
Recordings.start_time,
)
.where(
(
(frame_time >= Recordings.start_time)
& (frame_time <= Recordings.end_time)
)
)
.where(Recordings.camera == camera_name)
.order_by(Recordings.start_time.desc())
.limit(1)
)
try:
recording: Recordings = recording_query.get()
time_in_segment = frame_time - recording.start_time
codec = "mjpeg"
image_data = get_image_from_recording(
self.config.ffmpeg, recording.path, time_in_segment, codec, None
)
if not image_data:
logger.debug(
"LPR post processing: Unable to fetch license plate from recording"
)
return
# Convert bytes to numpy array
image_array = np.frombuffer(image_data, dtype=np.uint8)
if len(image_array) == 0:
logger.debug("LPR post processing: No image")
return
image = cv2.imdecode(image_array, cv2.IMREAD_COLOR)
except DoesNotExist:
logger.debug("Error fetching license plate for postprocessing")
return
if WRITE_DEBUG_IMAGES:
cv2.imwrite(
f"debug/frames/lpr_post_{datetime.datetime.now().timestamp()}.jpg",
image,
)
# convert to yuv for processing
frame = cv2.cvtColor(image, cv2.COLOR_BGR2YUV_I420)
detect_width = self.config.cameras[camera_name].detect.width
detect_height = self.config.cameras[camera_name].detect.height
# Scale the boxes based on detect dimensions
scale_x = image.shape[1] / detect_width
scale_y = image.shape[0] / detect_height
# Determine which box to enlarge based on detection mode
if self.requires_license_plate_detection:
# Scale and enlarge the car box
box = obj_data.get("box")
if not box:
return
# Scale original car box to detection dimensions
left = int(box[0] * scale_x)
top = int(box[1] * scale_y)
right = int(box[2] * scale_x)
bottom = int(box[3] * scale_y)
box = [left, top, right, bottom]
else:
# Get the license plate box from attributes
if not obj_data.get("current_attributes"):
return
license_plate = None
for attr in obj_data["current_attributes"]:
if attr.get("label") != "license_plate":
continue
if license_plate is None or attr.get("score", 0.0) > license_plate.get(
"score", 0.0
):
license_plate = attr
if not license_plate or not license_plate.get("box"):
return
# Scale license plate box to detection dimensions
orig_box = license_plate["box"]
left = int(orig_box[0] * scale_x)
top = int(orig_box[1] * scale_y)
right = int(orig_box[2] * scale_x)
bottom = int(orig_box[3] * scale_y)
box = [left, top, right, bottom]
width_box = right - left
height_box = bottom - top
# Enlarge box slightly to account for drift in detect vs recording stream
enlarge_factor = 0.3
new_left = max(0, int(left - (width_box * enlarge_factor / 2)))
new_top = max(0, int(top - (height_box * enlarge_factor / 2)))
new_right = min(image.shape[1], int(right + (width_box * enlarge_factor / 2)))
new_bottom = min(
image.shape[0], int(bottom + (height_box * enlarge_factor / 2))
)
keyframe_obj_data = obj_data.copy()
if self.requires_license_plate_detection:
# car box
keyframe_obj_data["box"] = [new_left, new_top, new_right, new_bottom]
else:
# Update the license plate box in the attributes
new_attributes = []
for attr in obj_data["current_attributes"]:
if attr.get("label") == "license_plate":
new_attr = attr.copy()
new_attr["box"] = [new_left, new_top, new_right, new_bottom]
new_attributes.append(new_attr)
else:
new_attributes.append(attr)
keyframe_obj_data["current_attributes"] = new_attributes
# run the frame through lpr processing
logger.debug(f"Post processing plate: {event_id}, {frame_time}")
self.lpr_process(keyframe_obj_data, frame)
def handle_request(self, topic, request_data) -> dict[str, any] | None:
if topic == EmbeddingsRequestEnum.reprocess_plate.value:
event = request_data["event"]
self.process_data(
{
"event_id": event["id"],
"camera": event["camera"],
"event": event,
},
PostProcessDataEnum.tracked_object,
)
return {
"message": "Successfully requested reprocessing of license plate.",
"success": True,
}
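
A sketch of the recording-path call into process_data(), using the keys the method reads above; the surrounding variables are assumptions about how the embeddings maintainer invokes it.

    lpr_post_processor.process_data(
        {
            "event_id": event.id,
            "camera": event.camera,
            "obj_data": final_obj_data,  # tracked object data captured at the keyframe
            "recordings_available": recordings_available_through,
        },
        PostProcessDataEnum.recording,
    )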

View File

@ -14,7 +14,11 @@ logger = logging.getLogger(__name__)
class RealTimeProcessorApi(ABC):
@abstractmethod
def __init__(self, config: FrigateConfig, metrics: DataProcessorMetrics) -> None:
def __init__(
self,
config: FrigateConfig,
metrics: DataProcessorMetrics,
) -> None:
self.config = config
self.metrics = metrics
pass

View File

@ -22,7 +22,7 @@ except ModuleNotFoundError:
logger = logging.getLogger(__name__)
class BirdProcessor(RealTimeProcessorApi):
class BirdRealTimeProcessor(RealTimeProcessorApi):
def __init__(self, config: FrigateConfig, metrics: DataProcessorMetrics):
super().__init__(config, metrics)
self.interpreter: Interpreter = None

View File

@ -27,7 +27,7 @@ logger = logging.getLogger(__name__)
MIN_MATCHING_FACES = 2
class FaceProcessor(RealTimeProcessorApi):
class FaceRealTimeProcessor(RealTimeProcessorApi):
def __init__(self, config: FrigateConfig, metrics: DataProcessorMetrics):
super().__init__(config, metrics)
self.face_config = config.face_recognition
@ -76,14 +76,16 @@ class FaceProcessor(RealTimeProcessorApi):
def __build_detector(self) -> None:
self.face_detector = cv2.FaceDetectorYN.create(
"/config/model_cache/facedet/facedet.onnx",
os.path.join(MODEL_CACHE_DIR, "facedet/facedet.onnx"),
config="",
input_size=(320, 320),
score_threshold=0.8,
nms_threshold=0.3,
)
self.landmark_detector = cv2.face.createFacemarkLBF()
self.landmark_detector.loadModel("/config/model_cache/facedet/landmarkdet.yaml")
self.landmark_detector.loadModel(
os.path.join(MODEL_CACHE_DIR, "facedet/landmarkdet.yaml")
)
def __build_classifier(self) -> None:
if not self.landmark_detector:

View File

@ -0,0 +1,44 @@
"""Handle processing images for face detection and recognition."""
import logging
import numpy as np
from frigate.config import FrigateConfig
from frigate.data_processing.common.license_plate.mixin import (
LicensePlateProcessingMixin,
)
from frigate.data_processing.common.license_plate.model import (
LicensePlateModelRunner,
)
from ..types import DataProcessorMetrics
from .api import RealTimeProcessorApi
logger = logging.getLogger(__name__)
class LicensePlateRealTimeProcessor(LicensePlateProcessingMixin, RealTimeProcessorApi):
def __init__(
self,
config: FrigateConfig,
metrics: DataProcessorMetrics,
model_runner: LicensePlateModelRunner,
detected_license_plates: dict[str, dict[str, any]],
):
self.detected_license_plates = detected_license_plates
self.model_runner = model_runner
self.lpr_config = config.lpr
self.config = config
super().__init__(config, metrics)
def process_frame(self, obj_data: dict[str, any], frame: np.ndarray):
"""Look for license plates in image."""
self.lpr_process(obj_data, frame)
def handle_request(self, topic, request_data) -> dict[str, any] | None:
return
def expire_object(self, object_id: str):
if object_id in self.detected_license_plates:
self.detected_license_plates.pop(object_id)

View File

@ -10,12 +10,21 @@ class DataProcessorMetrics:
text_embeddings_sps: Synchronized
face_rec_fps: Synchronized
alpr_pps: Synchronized
yolov9_lpr_fps: Synchronized
def __init__(self):
self.image_embeddings_fps = mp.Value("d", 0.01)
self.text_embeddings_sps = mp.Value("d", 0.01)
self.face_rec_fps = mp.Value("d", 0.01)
self.alpr_pps = mp.Value("d", 0.01)
self.yolov9_lpr_fps = mp.Value("d", 0.01)
class DataProcessorModelRunner:
def __init__(self, requestor, device: str = "CPU", model_size: str = "large"):
self.requestor = requestor
self.device = device
self.model_size = model_size
class PostProcessDataEnum(str, Enum):

View File

@ -9,7 +9,7 @@ import requests
from pydantic import BaseModel, ConfigDict, Field
from pydantic.fields import PrivateAttr
from frigate.const import DEFAULT_ATTRIBUTE_LABEL_MAP
from frigate.const import DEFAULT_ATTRIBUTE_LABEL_MAP, MODEL_CACHE_DIR
from frigate.plus import PlusApi
from frigate.util.builtin import generate_color_palette, load_labels
@ -37,6 +37,7 @@ class ModelTypeEnum(str, Enum):
yolox = "yolox"
yolov9 = "yolov9"
yolonas = "yolonas"
dfine = "dfine"
class ModelConfig(BaseModel):
@ -122,7 +123,7 @@ class ModelConfig(BaseModel):
return
model_id = self.path[7:]
self.path = f"/config/model_cache/{model_id}"
self.path = os.path.join(MODEL_CACHE_DIR, model_id)
model_info_path = f"{self.path}.json"
# download the model if it doesn't exist

View File

@ -22,6 +22,7 @@ except ModuleNotFoundError:
from pydantic import BaseModel, Field
from typing_extensions import Literal
from frigate.const import MODEL_CACHE_DIR
from frigate.detectors.detection_api import DetectionApi
from frigate.detectors.detector_config import BaseDetectorConfig
@ -57,7 +58,7 @@ class HailoDetector(DetectionApi):
self.h8l_tensor_format = detector_config.model.input_tensor
self.h8l_pixel_format = detector_config.model.input_pixel_format
self.model_url = "https://hailo-model-zoo.s3.eu-west-2.amazonaws.com/ModelZoo/Compiled/v2.11.0/hailo8l/ssd_mobilenet_v1.hef"
self.cache_dir = "/config/model_cache/h8l_cache"
self.cache_dir = os.path.join(MODEL_CACHE_DIR, "h8l_cache")
self.expected_model_filename = "ssd_mobilenet_v1.hef"
output_type = "FLOAT32"

View File

@ -9,7 +9,11 @@ from frigate.detectors.detector_config import (
BaseDetectorConfig,
ModelTypeEnum,
)
from frigate.util.model import get_ort_providers, post_process_yolov9
from frigate.util.model import (
get_ort_providers,
post_process_dfine,
post_process_yolov9,
)
logger = logging.getLogger(__name__)
@ -41,6 +45,7 @@ class ONNXDetector(DetectionApi):
providers, options = get_ort_providers(
detector_config.device == "CPU", detector_config.device
)
self.model = ort.InferenceSession(
path, providers=providers, provider_options=options
)
@ -55,6 +60,16 @@ class ONNXDetector(DetectionApi):
logger.info(f"ONNX: {path} loaded")
def detect_raw(self, tensor_input: np.ndarray):
if self.onnx_model_type == ModelTypeEnum.dfine:
tensor_output = self.model.run(
None,
{
"images": tensor_input,
"orig_target_sizes": np.array([[self.h, self.w]], dtype=np.int64),
},
)
return post_process_dfine(tensor_output, self.w, self.h)
model_input_name = self.model.get_inputs()[0].name
tensor_output = self.model.run(None, {model_input_name: tensor_input})
@ -84,5 +99,5 @@ class ONNXDetector(DetectionApi):
return post_process_yolov9(predictions, self.w, self.h)
else:
raise Exception(
f"{self.onnx_model_type} is currently not supported for rocm. See the docs for more info on supported models."
f"{self.onnx_model_type} is currently not supported for onnx. See the docs for more info on supported models."
)

View File

@ -7,6 +7,7 @@ import openvino.properties as props
from pydantic import Field
from typing_extensions import Literal
from frigate.const import MODEL_CACHE_DIR
from frigate.detectors.detection_api import DetectionApi
from frigate.detectors.detector_config import BaseDetectorConfig, ModelTypeEnum
from frigate.util.model import post_process_yolov9
@ -41,8 +42,10 @@ class OvDetector(DetectionApi):
logger.error(f"OpenVino model file {detector_config.model.path} not found.")
raise FileNotFoundError
os.makedirs("/config/model_cache/openvino", exist_ok=True)
self.ov_core.set_property({props.cache_dir: "/config/model_cache/openvino"})
os.makedirs(os.path.join(MODEL_CACHE_DIR, "openvino"), exist_ok=True)
self.ov_core.set_property(
{props.cache_dir: os.path.join(MODEL_CACHE_DIR, "openvino")}
)
self.interpreter = self.ov_core.compile_model(
model=detector_config.model.path, device_name=detector_config.device
)

View File

@ -6,6 +6,7 @@ from typing import Literal
from pydantic import Field
from frigate.const import MODEL_CACHE_DIR
from frigate.detectors.detection_api import DetectionApi
from frigate.detectors.detector_config import BaseDetectorConfig, ModelTypeEnum
@ -17,7 +18,7 @@ supported_socs = ["rk3562", "rk3566", "rk3568", "rk3576", "rk3588"]
supported_models = {ModelTypeEnum.yolonas: "^deci-fp16-yolonas_[sml]$"}
model_cache_dir = "/config/model_cache/rknn_cache/"
model_cache_dir = os.path.join(MODEL_CACHE_DIR, "rknn_cache/")
class RknnDetectorConfig(BaseDetectorConfig):

View File

@ -1,169 +0,0 @@
import ctypes
import logging
import os
import subprocess
import sys
import cv2
import numpy as np
from pydantic import Field
from typing_extensions import Literal
from frigate.detectors.detection_api import DetectionApi
from frigate.detectors.detector_config import (
BaseDetectorConfig,
ModelTypeEnum,
PixelFormatEnum,
)
logger = logging.getLogger(__name__)
DETECTOR_KEY = "rocm"
def detect_gfx_version():
return subprocess.getoutput(
"unset HSA_OVERRIDE_GFX_VERSION && /opt/rocm/bin/rocminfo | grep gfx |head -1|awk '{print $2}'"
)
def auto_override_gfx_version():
# If environment variable already in place, do not override
gfx_version = detect_gfx_version()
old_override = os.getenv("HSA_OVERRIDE_GFX_VERSION")
if old_override not in (None, ""):
logger.warning(
f"AMD/ROCm: detected {gfx_version} but HSA_OVERRIDE_GFX_VERSION already present ({old_override}), not overriding!"
)
return old_override
mapping = {
"gfx90c": "9.0.0",
"gfx1031": "10.3.0",
"gfx1103": "11.0.0",
}
override = mapping.get(gfx_version)
if override is not None:
logger.warning(
f"AMD/ROCm: detected {gfx_version}, overriding HSA_OVERRIDE_GFX_VERSION={override}"
)
os.putenv("HSA_OVERRIDE_GFX_VERSION", override)
return override
return ""
class ROCmDetectorConfig(BaseDetectorConfig):
type: Literal[DETECTOR_KEY]
conserve_cpu: bool = Field(
default=True,
title="Conserve CPU at the expense of latency (and reduced max throughput)",
)
auto_override_gfx: bool = Field(
default=True, title="Automatically detect and override gfx version"
)
class ROCmDetector(DetectionApi):
type_key = DETECTOR_KEY
def __init__(self, detector_config: ROCmDetectorConfig):
if detector_config.auto_override_gfx:
auto_override_gfx_version()
try:
sys.path.append("/opt/rocm/lib")
import migraphx
logger.info("AMD/ROCm: loaded migraphx module")
except ModuleNotFoundError:
logger.error("AMD/ROCm: module loading failed, missing ROCm environment?")
raise
if detector_config.conserve_cpu:
logger.info("AMD/ROCm: switching HIP to blocking mode to conserve CPU")
ctypes.CDLL("/opt/rocm/lib/libamdhip64.so").hipSetDeviceFlags(4)
self.h = detector_config.model.height
self.w = detector_config.model.width
self.rocm_model_type = detector_config.model.model_type
self.rocm_model_px = detector_config.model.input_pixel_format
path = detector_config.model.path
mxr_path = os.path.splitext(path)[0] + ".mxr"
if path.endswith(".mxr"):
logger.info(f"AMD/ROCm: loading parsed model from {mxr_path}")
self.model = migraphx.load(mxr_path)
elif os.path.exists(mxr_path):
logger.info(f"AMD/ROCm: loading parsed model from {mxr_path}")
self.model = migraphx.load(mxr_path)
else:
logger.info(f"AMD/ROCm: loading model from {path}")
if (
path.endswith(".tf")
or path.endswith(".tf2")
or path.endswith(".tflite")
):
# untested
self.model = migraphx.parse_tf(path)
else:
self.model = migraphx.parse_onnx(path)
logger.info("AMD/ROCm: compiling the model")
self.model.compile(
migraphx.get_target("gpu"), offload_copy=True, fast_math=True
)
logger.info(f"AMD/ROCm: saving parsed model into {mxr_path}")
os.makedirs("/config/model_cache/rocm", exist_ok=True)
migraphx.save(self.model, mxr_path)
logger.info("AMD/ROCm: model loaded")
def detect_raw(self, tensor_input):
model_input_name = self.model.get_parameter_names()[0]
model_input_shape = tuple(
self.model.get_parameter_shapes()[model_input_name].lens()
)
tensor_input = cv2.dnn.blobFromImage(
tensor_input[0],
1.0,
(model_input_shape[3], model_input_shape[2]),
None,
swapRB=self.rocm_model_px == PixelFormatEnum.bgr,
).astype(np.uint8)
detector_result = self.model.run({model_input_name: tensor_input})[0]
addr = ctypes.cast(detector_result.data_ptr(), ctypes.POINTER(ctypes.c_float))
tensor_output = np.ctypeslib.as_array(
addr, shape=detector_result.get_shape().lens()
)
if self.rocm_model_type == ModelTypeEnum.yolonas:
predictions = tensor_output
detections = np.zeros((20, 6), np.float32)
for i, prediction in enumerate(predictions):
if i == 20:
break
(_, x_min, y_min, x_max, y_max, confidence, class_id) = prediction
# when running in GPU mode, empty predictions in the output have class_id of -1
if class_id < 0:
break
detections[i] = [
class_id,
confidence,
y_min / self.h,
x_min / self.w,
y_max / self.h,
x_max / self.w,
]
return detections
else:
raise Exception(
f"{self.rocm_model_type} is currently not supported for rocm. See the docs for more info on supported models."
)

View File

@ -17,7 +17,7 @@ from frigate.config import FrigateConfig
from frigate.const import CONFIG_DIR, FACE_DIR
from frigate.data_processing.types import DataProcessorMetrics
from frigate.db.sqlitevecq import SqliteVecQueueDatabase
from frigate.models import Event
from frigate.models import Event, Recordings
from frigate.util.builtin import serialize
from frigate.util.services import listen
@ -28,10 +28,6 @@ logger = logging.getLogger(__name__)
def manage_embeddings(config: FrigateConfig, metrics: DataProcessorMetrics) -> None:
# Only initialize embeddings if semantic search is enabled
if not config.semantic_search.enabled:
return
stop_event = mp.Event()
def receiveSignal(signalNumber: int, frame: Optional[FrameType]) -> None:
@ -55,7 +51,7 @@ def manage_embeddings(config: FrigateConfig, metrics: DataProcessorMetrics) -> N
timeout=max(60, 10 * len([c for c in config.cameras.values() if c.enabled])),
load_vec_extension=True,
)
models = [Event]
models = [Event, Recordings]
db.bind(models)
maintainer = EmbeddingMaintainer(
@ -234,3 +230,8 @@ class EmbeddingsContext:
EmbeddingsRequestEnum.embed_description.value,
{"id": event_id, "description": description},
)
def reprocess_plate(self, event: dict[str, any]) -> dict[str, any]:
return self.requestor.send_data(
EmbeddingsRequestEnum.reprocess_plate.value, {"event": event}
)
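
Callers go through the embeddings client, so an API handler asking for a plate re-run would look roughly like the sketch below, where context is an EmbeddingsContext instance and the event lookup is shown only for illustration.

    event = Event.get(Event.id == event_id)
    response = context.reprocess_plate(model_to_dict(event))
    # response is roughly {"message": "...", "success": True} from the post processor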

View File

@ -10,6 +10,7 @@ from playhouse.shortcuts import model_to_dict
from frigate.comms.inter_process import InterProcessRequestor
from frigate.config import FrigateConfig
from frigate.config.classification import SemanticSearchModelEnum
from frigate.const import (
CONFIG_DIR,
UPDATE_EMBEDDINGS_REINDEX_PROGRESS,
@ -22,7 +23,8 @@ from frigate.types import ModelStatusTypesEnum
from frigate.util.builtin import serialize
from frigate.util.path import get_event_thumbnail_bytes
from .functions.onnx import GenericONNXEmbedding, ModelTypeEnum
from .onnx.jina_v1_embedding import JinaV1ImageEmbedding, JinaV1TextEmbedding
from .onnx.jina_v2_embedding import JinaV2Embedding
logger = logging.getLogger(__name__)
@ -75,18 +77,7 @@ class Embeddings:
# Create tables if they don't exist
self.db.create_embeddings_tables()
models = [
"jinaai/jina-clip-v1-text_model_fp16.onnx",
"jinaai/jina-clip-v1-tokenizer",
"jinaai/jina-clip-v1-vision_model_fp16.onnx"
if config.semantic_search.model_size == "large"
else "jinaai/jina-clip-v1-vision_model_quantized.onnx",
"jinaai/jina-clip-v1-preprocessor_config.json",
"facenet-facenet.onnx",
"paddleocr-onnx-detection.onnx",
"paddleocr-onnx-classification.onnx",
"paddleocr-onnx-recognition.onnx",
]
models = self.get_model_definitions()
for model in models:
self.requestor.send_data(
@ -97,39 +88,64 @@ class Embeddings:
},
)
self.text_embedding = GenericONNXEmbedding(
model_name="jinaai/jina-clip-v1",
model_file="text_model_fp16.onnx",
tokenizer_file="tokenizer",
download_urls={
"text_model_fp16.onnx": "https://huggingface.co/jinaai/jina-clip-v1/resolve/main/onnx/text_model_fp16.onnx",
},
model_size=config.semantic_search.model_size,
model_type=ModelTypeEnum.text,
requestor=self.requestor,
device="CPU",
if self.config.semantic_search.model == SemanticSearchModelEnum.jinav2:
# Single JinaV2Embedding instance for both text and vision
self.embedding = JinaV2Embedding(
model_size=self.config.semantic_search.model_size,
requestor=self.requestor,
device="GPU"
if self.config.semantic_search.model_size == "large"
else "CPU",
)
self.text_embedding = lambda input_data: self.embedding(
input_data, embedding_type="text"
)
self.vision_embedding = lambda input_data: self.embedding(
input_data, embedding_type="vision"
)
else: # Default to jinav1
self.text_embedding = JinaV1TextEmbedding(
model_size=config.semantic_search.model_size,
requestor=self.requestor,
device="CPU",
)
self.vision_embedding = JinaV1ImageEmbedding(
model_size=config.semantic_search.model_size,
requestor=self.requestor,
device="GPU" if config.semantic_search.model_size == "large" else "CPU",
)
def get_model_definitions(self):
# Version-specific models
if self.config.semantic_search.model == SemanticSearchModelEnum.jinav2:
models = [
"jinaai/jina-clip-v2-tokenizer",
"jinaai/jina-clip-v2-model_fp16.onnx"
if self.config.semantic_search.model_size == "large"
else "jinaai/jina-clip-v2-model_quantized.onnx",
"jinaai/jina-clip-v2-preprocessor_config.json",
]
else: # Default to jinav1
models = [
"jinaai/jina-clip-v1-text_model_fp16.onnx",
"jinaai/jina-clip-v1-tokenizer",
"jinaai/jina-clip-v1-vision_model_fp16.onnx"
if self.config.semantic_search.model_size == "large"
else "jinaai/jina-clip-v1-vision_model_quantized.onnx",
"jinaai/jina-clip-v1-preprocessor_config.json",
]
# Add common models
models.extend(
[
"facenet-facenet.onnx",
"paddleocr-onnx-detection.onnx",
"paddleocr-onnx-classification.onnx",
"paddleocr-onnx-recognition.onnx",
]
)
model_file = (
"vision_model_fp16.onnx"
if self.config.semantic_search.model_size == "large"
else "vision_model_quantized.onnx"
)
download_urls = {
model_file: f"https://huggingface.co/jinaai/jina-clip-v1/resolve/main/onnx/{model_file}",
"preprocessor_config.json": "https://huggingface.co/jinaai/jina-clip-v1/resolve/main/preprocessor_config.json",
}
self.vision_embedding = GenericONNXEmbedding(
model_name="jinaai/jina-clip-v1",
model_file=model_file,
download_urls=download_urls,
model_size=config.semantic_search.model_size,
model_type=ModelTypeEnum.vision,
requestor=self.requestor,
device="GPU" if config.semantic_search.model_size == "large" else "CPU",
)
return models
def embed_thumbnail(
self, event_id: str, thumbnail: bytes, upsert: bool = True
@ -266,7 +282,11 @@ class Embeddings:
# Get total count of events to process
total_events = Event.select().count()
batch_size = 32
batch_size = (
4
if self.config.semantic_search.model == SemanticSearchModelEnum.jinav2
else 32
)
current_page = 1
totals = {

View File

@ -1,325 +0,0 @@
import logging
import os
import warnings
from enum import Enum
from io import BytesIO
from typing import Dict, List, Optional, Union
import cv2
import numpy as np
import requests
from PIL import Image
# importing this without pytorch or others causes a warning
# https://github.com/huggingface/transformers/issues/27214
# suppressed by setting env TRANSFORMERS_NO_ADVISORY_WARNINGS=1
from transformers import AutoFeatureExtractor, AutoTokenizer
from transformers.utils.logging import disable_progress_bar
from frigate.comms.inter_process import InterProcessRequestor
from frigate.const import MODEL_CACHE_DIR, UPDATE_MODEL_STATE
from frigate.types import ModelStatusTypesEnum
from frigate.util.downloader import ModelDownloader
from frigate.util.model import ONNXModelRunner
warnings.filterwarnings(
"ignore",
category=FutureWarning,
message="The class CLIPFeatureExtractor is deprecated",
)
# disables the progress bar for downloading tokenizers and feature extractors
disable_progress_bar()
logger = logging.getLogger(__name__)
FACE_EMBEDDING_SIZE = 160
LPR_EMBEDDING_SIZE = 256
class ModelTypeEnum(str, Enum):
face = "face"
vision = "vision"
text = "text"
lpr_detect = "lpr_detect"
lpr_classify = "lpr_classify"
lpr_recognize = "lpr_recognize"
yolov9_lpr_detect = "yolov9_lpr_detect"
class GenericONNXEmbedding:
"""Generic embedding function for ONNX models (text and vision)."""
def __init__(
self,
model_name: str,
model_file: str,
download_urls: Dict[str, str],
model_size: str,
model_type: ModelTypeEnum,
requestor: InterProcessRequestor,
tokenizer_file: Optional[str] = None,
device: str = "AUTO",
):
self.model_name = model_name
self.model_file = model_file
self.tokenizer_file = tokenizer_file
self.requestor = requestor
self.download_urls = download_urls
self.model_type = model_type
self.model_size = model_size
self.device = device
self.download_path = os.path.join(MODEL_CACHE_DIR, self.model_name)
self.tokenizer = None
self.feature_extractor = None
self.runner = None
files_names = list(self.download_urls.keys()) + (
[self.tokenizer_file] if self.tokenizer_file else []
)
if not all(
os.path.exists(os.path.join(self.download_path, n)) for n in files_names
):
logger.debug(f"starting model download for {self.model_name}")
self.downloader = ModelDownloader(
model_name=self.model_name,
download_path=self.download_path,
file_names=files_names,
download_func=self._download_model,
)
self.downloader.ensure_model_files()
else:
self.downloader = None
ModelDownloader.mark_files_state(
self.requestor,
self.model_name,
files_names,
ModelStatusTypesEnum.downloaded,
)
self._load_model_and_utils()
logger.debug(f"models are already downloaded for {self.model_name}")
def _download_model(self, path: str):
try:
file_name = os.path.basename(path)
if file_name in self.download_urls:
ModelDownloader.download_from_url(self.download_urls[file_name], path)
elif (
file_name == self.tokenizer_file
and self.model_type == ModelTypeEnum.text
):
if not os.path.exists(path + "/" + self.model_name):
logger.info(f"Downloading {self.model_name} tokenizer")
tokenizer = AutoTokenizer.from_pretrained(
self.model_name,
trust_remote_code=True,
cache_dir=f"{MODEL_CACHE_DIR}/{self.model_name}/tokenizer",
clean_up_tokenization_spaces=True,
)
tokenizer.save_pretrained(path)
self.downloader.requestor.send_data(
UPDATE_MODEL_STATE,
{
"model": f"{self.model_name}-{file_name}",
"state": ModelStatusTypesEnum.downloaded,
},
)
except Exception:
self.downloader.requestor.send_data(
UPDATE_MODEL_STATE,
{
"model": f"{self.model_name}-{file_name}",
"state": ModelStatusTypesEnum.error,
},
)
def _load_model_and_utils(self):
if self.runner is None:
if self.downloader:
self.downloader.wait_for_download()
if self.model_type == ModelTypeEnum.text:
self.tokenizer = self._load_tokenizer()
elif self.model_type == ModelTypeEnum.vision:
self.feature_extractor = self._load_feature_extractor()
elif self.model_type == ModelTypeEnum.face:
self.feature_extractor = []
elif self.model_type == ModelTypeEnum.lpr_detect:
self.feature_extractor = []
elif self.model_type == ModelTypeEnum.lpr_classify:
self.feature_extractor = []
elif self.model_type == ModelTypeEnum.lpr_recognize:
self.feature_extractor = []
elif self.model_type == ModelTypeEnum.yolov9_lpr_detect:
self.feature_extractor = []
self.runner = ONNXModelRunner(
os.path.join(self.download_path, self.model_file),
self.device,
self.model_size,
)
def _load_tokenizer(self):
tokenizer_path = os.path.join(f"{MODEL_CACHE_DIR}/{self.model_name}/tokenizer")
return AutoTokenizer.from_pretrained(
self.model_name,
cache_dir=tokenizer_path,
trust_remote_code=True,
clean_up_tokenization_spaces=True,
)
def _load_feature_extractor(self):
return AutoFeatureExtractor.from_pretrained(
f"{MODEL_CACHE_DIR}/{self.model_name}",
)
def _preprocess_inputs(self, raw_inputs: any) -> any:
if self.model_type == ModelTypeEnum.text:
max_length = max(len(self.tokenizer.encode(text)) for text in raw_inputs)
return [
self.tokenizer(
text,
padding="max_length",
truncation=True,
max_length=max_length,
return_tensors="np",
)
for text in raw_inputs
]
elif self.model_type == ModelTypeEnum.vision:
processed_images = [self._process_image(img) for img in raw_inputs]
return [
self.feature_extractor(images=image, return_tensors="np")
for image in processed_images
]
elif self.model_type == ModelTypeEnum.face:
if isinstance(raw_inputs, list):
raise ValueError("Face embedding does not support batch inputs.")
pil = self._process_image(raw_inputs)
# handle images larger than input size
width, height = pil.size
if width != FACE_EMBEDDING_SIZE or height != FACE_EMBEDDING_SIZE:
if width > height:
new_height = int(((height / width) * FACE_EMBEDDING_SIZE) // 4 * 4)
pil = pil.resize((FACE_EMBEDDING_SIZE, new_height))
else:
new_width = int(((width / height) * FACE_EMBEDDING_SIZE) // 4 * 4)
pil = pil.resize((new_width, FACE_EMBEDDING_SIZE))
og = np.array(pil).astype(np.float32)
# Image must be FACE_EMBEDDING_SIZExFACE_EMBEDDING_SIZE
og_h, og_w, channels = og.shape
frame = np.full(
(FACE_EMBEDDING_SIZE, FACE_EMBEDDING_SIZE, channels),
(0, 0, 0),
dtype=np.float32,
)
# compute center offset
x_center = (FACE_EMBEDDING_SIZE - og_w) // 2
y_center = (FACE_EMBEDDING_SIZE - og_h) // 2
# copy img image into center of result image
frame[y_center : y_center + og_h, x_center : x_center + og_w] = og
frame = np.expand_dims(frame, axis=0)
return [{"input_2": frame}]
elif self.model_type == ModelTypeEnum.lpr_detect:
preprocessed = []
for x in raw_inputs:
preprocessed.append(x)
return [{"x": preprocessed[0]}]
elif self.model_type == ModelTypeEnum.lpr_classify:
processed = []
for img in raw_inputs:
processed.append({"x": img})
return processed
elif self.model_type == ModelTypeEnum.lpr_recognize:
processed = []
for img in raw_inputs:
processed.append({"x": img})
return processed
elif self.model_type == ModelTypeEnum.yolov9_lpr_detect:
if isinstance(raw_inputs, list):
raise ValueError(
"License plate embedding does not support batch inputs."
)
# Get image as numpy array
img = self._process_image(raw_inputs)
height, width, channels = img.shape
# Resize maintaining aspect ratio
if width > height:
new_height = int(((height / width) * LPR_EMBEDDING_SIZE) // 4 * 4)
img = cv2.resize(img, (LPR_EMBEDDING_SIZE, new_height))
else:
new_width = int(((width / height) * LPR_EMBEDDING_SIZE) // 4 * 4)
img = cv2.resize(img, (new_width, LPR_EMBEDDING_SIZE))
# Get new dimensions after resize
og_h, og_w, channels = img.shape
# Create black square frame
frame = np.full(
(LPR_EMBEDDING_SIZE, LPR_EMBEDDING_SIZE, channels),
(0, 0, 0),
dtype=np.float32,
)
# Center the resized image in the square frame
x_center = (LPR_EMBEDDING_SIZE - og_w) // 2
y_center = (LPR_EMBEDDING_SIZE - og_h) // 2
frame[y_center : y_center + og_h, x_center : x_center + og_w] = img
# Normalize to 0-1
frame = frame / 255.0
# Convert from HWC to CHW format and add batch dimension
frame = np.transpose(frame, (2, 0, 1))
frame = np.expand_dims(frame, axis=0)
return [{"images": frame}]
else:
raise ValueError(f"Unable to preprocess inputs for {self.model_type}")
def _process_image(self, image, output: str = "RGB") -> Image.Image:
if isinstance(image, str):
if image.startswith("http"):
response = requests.get(image)
image = Image.open(BytesIO(response.content)).convert(output)
elif isinstance(image, bytes):
image = Image.open(BytesIO(image)).convert(output)
return image
def __call__(
self, inputs: Union[List[str], List[Image.Image]]
) -> List[np.ndarray]:
self._load_model_and_utils()
if self.runner is None or (
self.tokenizer is None and self.feature_extractor is None
):
logger.error(
f"{self.model_name} model or tokenizer/feature extractor is not loaded."
)
return []
processed_inputs = self._preprocess_inputs(inputs)
input_names = self.runner.get_input_names()
onnx_inputs = {name: [] for name in input_names}
input: dict[str, any]
for input in processed_inputs:
for key, value in input.items():
if key in input_names:
onnx_inputs[key].append(value[0])
for key in input_names:
if onnx_inputs.get(key):
onnx_inputs[key] = np.stack(onnx_inputs[key])
else:
logger.warning(f"Expected input '{key}' not found in onnx_inputs")
embeddings = self.runner.run(onnx_inputs)[0]
return [embedding for embedding in embeddings]
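For reference, the __call__ path above gathers one dict of tensors per preprocessed item, groups them by the model's ONNX input names, and stacks each group along a new batch axis. A minimal standalone sketch of that batching (the input name "input_ids" and the shapes are assumptions for illustration, not taken from a specific model):
import numpy as np
# two preprocessed items, each a dict of input name -> (1, seq_len) array
processed = [
    {"input_ids": np.zeros((1, 8), dtype=np.int64)},
    {"input_ids": np.ones((1, 8), dtype=np.int64)},
]
onnx_inputs = {"input_ids": []}
for item in processed:
    # drop the per-item batch dim, mirroring value[0] above
    onnx_inputs["input_ids"].append(item["input_ids"][0])
# stacking yields a (2, 8) batch ready to feed to the ONNX session
onnx_inputs["input_ids"] = np.stack(onnx_inputs["input_ids"])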

View File

@ -20,24 +20,39 @@ from frigate.comms.event_metadata_updater import (
)
from frigate.comms.events_updater import EventEndSubscriber, EventUpdateSubscriber
from frigate.comms.inter_process import InterProcessRequestor
from frigate.comms.recordings_updater import (
RecordingsDataSubscriber,
RecordingsDataTypeEnum,
)
from frigate.config import FrigateConfig
from frigate.const import (
CLIPS_DIR,
UPDATE_EVENT_DESCRIPTION,
)
from frigate.data_processing.real_time.api import RealTimeProcessorApi
from frigate.data_processing.real_time.bird_processor import BirdProcessor
from frigate.data_processing.real_time.face_processor import FaceProcessor
from frigate.data_processing.real_time.license_plate_processor import (
LicensePlateProcessor,
from frigate.data_processing.common.license_plate.model import (
LicensePlateModelRunner,
)
from frigate.data_processing.types import DataProcessorMetrics
from frigate.data_processing.post.api import PostProcessorApi
from frigate.data_processing.post.license_plate import (
LicensePlatePostProcessor,
)
from frigate.data_processing.real_time.api import RealTimeProcessorApi
from frigate.data_processing.real_time.bird import BirdRealTimeProcessor
from frigate.data_processing.real_time.face import FaceRealTimeProcessor
from frigate.data_processing.real_time.license_plate import (
LicensePlateRealTimeProcessor,
)
from frigate.data_processing.types import DataProcessorMetrics, PostProcessDataEnum
from frigate.events.types import EventTypeEnum
from frigate.genai import get_genai_client
from frigate.models import Event
from frigate.types import TrackedObjectUpdateTypesEnum
from frigate.util.builtin import serialize
from frigate.util.image import SharedMemoryFrameManager, calculate_region
from frigate.util.image import (
SharedMemoryFrameManager,
calculate_region,
ensure_jpeg_bytes,
)
from frigate.util.path import get_event_thumbnail_bytes
from .embeddings import Embeddings
@ -60,46 +75,81 @@ class EmbeddingMaintainer(threading.Thread):
super().__init__(name="embeddings_maintainer")
self.config = config
self.metrics = metrics
self.embeddings = Embeddings(config, db, metrics)
self.embeddings = None
# Check if we need to re-index events
if config.semantic_search.reindex:
self.embeddings.reindex()
if config.semantic_search.enabled:
self.embeddings = Embeddings(config, db, metrics)
# Check if we need to re-index events
if config.semantic_search.reindex:
self.embeddings.reindex()
# create communication for updating event descriptions
self.requestor = InterProcessRequestor()
self.event_subscriber = EventUpdateSubscriber()
self.event_end_subscriber = EventEndSubscriber()
self.event_metadata_subscriber = EventMetadataSubscriber(
EventMetadataTypeEnum.regenerate_description
)
self.recordings_subscriber = RecordingsDataSubscriber(
RecordingsDataTypeEnum.recordings_available_through
)
self.embeddings_responder = EmbeddingsResponder()
self.frame_manager = SharedMemoryFrameManager()
self.processors: list[RealTimeProcessorApi] = []
self.detected_license_plates: dict[str, dict[str, any]] = {}
# model runners to share between realtime and post processors
if self.config.lpr.enabled:
lpr_model_runner = LicensePlateModelRunner(self.requestor)
# realtime processors
self.realtime_processors: list[RealTimeProcessorApi] = []
if self.config.face_recognition.enabled:
self.processors.append(FaceProcessor(self.config, metrics))
self.realtime_processors.append(FaceRealTimeProcessor(self.config, metrics))
if self.config.classification.bird.enabled:
self.processors.append(BirdProcessor(self.config, metrics))
self.realtime_processors.append(BirdRealTimeProcessor(self.config, metrics))
if self.config.lpr.enabled:
self.processors.append(LicensePlateProcessor(self.config, metrics))
self.realtime_processors.append(
LicensePlateRealTimeProcessor(
self.config, metrics, lpr_model_runner, self.detected_license_plates
)
)
# post processors
self.post_processors: list[PostProcessorApi] = []
if self.config.lpr.enabled:
self.post_processors.append(
LicensePlatePostProcessor(
self.config, metrics, lpr_model_runner, self.detected_license_plates
)
)
# create communication for updating event descriptions
self.requestor = InterProcessRequestor()
self.stop_event = stop_event
self.tracked_events: dict[str, list[any]] = {}
self.early_request_sent: dict[str, bool] = {}
self.genai_client = get_genai_client(config)
# recordings data
self.recordings_available_through: dict[str, float] = {}
def run(self) -> None:
"""Maintain a SQLite-vec database for semantic search."""
while not self.stop_event.is_set():
self._process_requests()
self._process_updates()
self._process_recordings_updates()
self._process_finalized()
self._process_event_metadata()
self.event_subscriber.stop()
self.event_end_subscriber.stop()
self.recordings_subscriber.stop()
self.event_metadata_subscriber.stop()
self.embeddings_responder.stop()
self.requestor.stop()
@ -110,32 +160,34 @@ class EmbeddingMaintainer(threading.Thread):
def _handle_request(topic: str, data: dict[str, any]) -> str:
try:
if topic == EmbeddingsRequestEnum.embed_description.value:
return serialize(
self.embeddings.embed_description(
data["id"], data["description"]
),
pack=False,
)
elif topic == EmbeddingsRequestEnum.embed_thumbnail.value:
thumbnail = base64.b64decode(data["thumbnail"])
return serialize(
self.embeddings.embed_thumbnail(data["id"], thumbnail),
pack=False,
)
elif topic == EmbeddingsRequestEnum.generate_search.value:
return serialize(
self.embeddings.embed_description("", data, upsert=False),
pack=False,
)
else:
for processor in self.processors:
# First handle the embedding-specific topics when semantic search is enabled
if self.config.semantic_search.enabled:
if topic == EmbeddingsRequestEnum.embed_description.value:
return serialize(
self.embeddings.embed_description(
data["id"], data["description"]
),
pack=False,
)
elif topic == EmbeddingsRequestEnum.embed_thumbnail.value:
thumbnail = base64.b64decode(data["thumbnail"])
return serialize(
self.embeddings.embed_thumbnail(data["id"], thumbnail),
pack=False,
)
elif topic == EmbeddingsRequestEnum.generate_search.value:
return serialize(
self.embeddings.embed_description("", data, upsert=False),
pack=False,
)
processors = [self.realtime_processors, self.post_processors]
for processor_list in processors:
for processor in processor_list:
resp = processor.handle_request(topic, data)
if resp is not None:
return resp
except Exception as e:
logger.error(f"Unable to handle embeddings request {e}")
logger.error(f"Unable to handle embeddings request {e}", exc_info=True)
self.embeddings_responder.check_for_request(_handle_request)
@ -154,7 +206,7 @@ class EmbeddingMaintainer(threading.Thread):
camera_config = self.config.cameras[camera]
# no need to process updated objects if face recognition, lpr, genai are disabled
if not camera_config.genai.enabled and len(self.processors) == 0:
if not camera_config.genai.enabled and len(self.realtime_processors) == 0:
return
# Create our own thumbnail based on the bounding box and the frame time
@ -171,7 +223,7 @@ class EmbeddingMaintainer(threading.Thread):
)
return
for processor in self.processors:
for processor in self.realtime_processors:
processor.process_frame(data, yuv_frame)
# no need to save our own thumbnails if genai is not enabled
@ -189,6 +241,43 @@ class EmbeddingMaintainer(threading.Thread):
self.tracked_events[data["id"]].append(data)
# check if we're configured to send an early request after a minimum number of updates received
if (
self.genai_client is not None
and camera_config.genai.send_triggers.after_significant_updates
):
if (
len(self.tracked_events.get(data["id"], []))
>= camera_config.genai.send_triggers.after_significant_updates
and data["id"] not in self.early_request_sent
):
if data["has_clip"] and data["has_snapshot"]:
event: Event = Event.get(Event.id == data["id"])
if (
not camera_config.genai.objects
or event.label in camera_config.genai.objects
) and (
not camera_config.genai.required_zones
or set(data["entered_zones"])
& set(camera_config.genai.required_zones)
):
logger.debug(f"{camera} sending early request to GenAI")
self.early_request_sent[data["id"]] = True
threading.Thread(
target=self._genai_embed_description,
name=f"_genai_embed_description_{event.id}",
daemon=True,
args=(
event,
[
data["thumbnail"]
for data in self.tracked_events[data["id"]]
],
),
).start()
self.frame_manager.close(frame_name)
def _process_finalized(self) -> None:
@ -202,7 +291,32 @@ class EmbeddingMaintainer(threading.Thread):
event_id, camera, updated_db = ended
camera_config = self.config.cameras[camera]
for processor in self.processors:
# call any defined post processors
for processor in self.post_processors:
if isinstance(processor, LicensePlatePostProcessor):
recordings_available = self.recordings_available_through.get(camera)
if (
recordings_available is not None
and event_id in self.detected_license_plates
):
processor.process_data(
{
"event_id": event_id,
"camera": camera,
"recordings_available": self.recordings_available_through[
camera
],
"obj_data": self.detected_license_plates[event_id][
"obj_data"
],
},
PostProcessDataEnum.recording,
)
else:
processor.process_data(event_id, PostProcessDataEnum.event_id)
# expire in realtime processors
for processor in self.realtime_processors:
processor.expire_object(event_id)
if updated_db:
@ -221,10 +335,11 @@ class EmbeddingMaintainer(threading.Thread):
# Embed the thumbnail
self._embed_thumbnail(event_id, thumbnail)
# Run GenAI
if (
camera_config.genai.enabled
and camera_config.genai.send_triggers.tracked_object_end
and self.genai_client is not None
and event.data.get("description") is None
and (
not camera_config.genai.objects
or event.label in camera_config.genai.objects
@ -234,87 +349,30 @@ class EmbeddingMaintainer(threading.Thread):
or set(event.zones) & set(camera_config.genai.required_zones)
)
):
if event.has_snapshot and camera_config.genai.use_snapshot:
with open(
os.path.join(CLIPS_DIR, f"{event.camera}-{event.id}.jpg"),
"rb",
) as image_file:
snapshot_image = image_file.read()
img = cv2.imdecode(
np.frombuffer(snapshot_image, dtype=np.int8),
cv2.IMREAD_COLOR,
)
# crop snapshot based on region before sending off to genai
height, width = img.shape[:2]
x1_rel, y1_rel, width_rel, height_rel = event.data["region"]
x1, y1 = int(x1_rel * width), int(y1_rel * height)
cropped_image = img[
y1 : y1 + int(height_rel * height),
x1 : x1 + int(width_rel * width),
]
_, buffer = cv2.imencode(".jpg", cropped_image)
snapshot_image = buffer.tobytes()
num_thumbnails = len(self.tracked_events.get(event_id, []))
embed_image = (
[snapshot_image]
if event.has_snapshot and camera_config.genai.use_snapshot
else (
[
data["thumbnail"]
for data in self.tracked_events[event_id]
]
if num_thumbnails > 0
else [thumbnail]
)
)
if camera_config.genai.debug_save_thumbnails and num_thumbnails > 0:
logger.debug(
f"Saving {num_thumbnails} thumbnails for event {event.id}"
)
Path(
os.path.join(CLIPS_DIR, f"genai-requests/{event.id}")
).mkdir(parents=True, exist_ok=True)
for idx, data in enumerate(self.tracked_events[event_id], 1):
jpg_bytes: bytes = data["thumbnail"]
if jpg_bytes is None:
logger.warning(
f"Unable to save thumbnail {idx} for {event.id}."
)
else:
with open(
os.path.join(
CLIPS_DIR,
f"genai-requests/{event.id}/{idx}.jpg",
),
"wb",
) as j:
j.write(jpg_bytes)
# Generate the description. Call happens in a thread since it is network bound.
threading.Thread(
target=self._embed_description,
name=f"_embed_description_{event.id}",
daemon=True,
args=(
event,
embed_image,
),
).start()
self._process_genai_description(event, camera_config, thumbnail)
# Delete tracked events based on the event_id
if event_id in self.tracked_events:
del self.tracked_events[event_id]
def _process_recordings_updates(self) -> None:
"""Process recordings updates."""
while True:
recordings_data = self.recordings_subscriber.check_for_update(timeout=0.01)
if recordings_data is None:
break
camera, recordings_available_through_timestamp = recordings_data
self.recordings_available_through[camera] = (
recordings_available_through_timestamp
)
logger.debug(
f"{camera} now has recordings available through {recordings_available_through_timestamp}"
)
def _process_event_metadata(self):
# Check for regenerate description requests
(topic, event_id, source) = self.event_metadata_subscriber.check_for_update(
@ -345,9 +403,66 @@ class EmbeddingMaintainer(threading.Thread):
def _embed_thumbnail(self, event_id: str, thumbnail: bytes) -> None:
"""Embed the thumbnail for an event."""
if not self.config.semantic_search.enabled:
return
self.embeddings.embed_thumbnail(event_id, thumbnail)
def _embed_description(self, event: Event, thumbnails: list[bytes]) -> None:
def _process_genai_description(self, event, camera_config, thumbnail) -> None:
if event.has_snapshot and camera_config.genai.use_snapshot:
snapshot_image = self._read_and_crop_snapshot(event, camera_config)
if not snapshot_image:
return
num_thumbnails = len(self.tracked_events.get(event.id, []))
# ensure we have a jpeg to pass to the model
thumbnail = ensure_jpeg_bytes(thumbnail)
embed_image = (
[snapshot_image]
if event.has_snapshot and camera_config.genai.use_snapshot
else (
[data["thumbnail"] for data in self.tracked_events[event.id]]
if num_thumbnails > 0
else [thumbnail]
)
)
if camera_config.genai.debug_save_thumbnails and num_thumbnails > 0:
logger.debug(f"Saving {num_thumbnails} thumbnails for event {event.id}")
Path(os.path.join(CLIPS_DIR, f"genai-requests/{event.id}")).mkdir(
parents=True, exist_ok=True
)
for idx, data in enumerate(self.tracked_events[event.id], 1):
jpg_bytes: bytes = data["thumbnail"]
if jpg_bytes is None:
logger.warning(f"Unable to save thumbnail {idx} for {event.id}.")
else:
with open(
os.path.join(
CLIPS_DIR,
f"genai-requests/{event.id}/{idx}.jpg",
),
"wb",
) as j:
j.write(jpg_bytes)
# Generate the description. Call happens in a thread since it is network bound.
threading.Thread(
target=self._genai_embed_description,
name=f"_genai_embed_description_{event.id}",
daemon=True,
args=(
event,
embed_image,
),
).start()
def _genai_embed_description(self, event: Event, thumbnails: list[bytes]) -> None:
"""Embed the description for an event."""
camera_config = self.config.cameras[event.camera]
@ -370,7 +485,8 @@ class EmbeddingMaintainer(threading.Thread):
)
# Embed the description
self.embeddings.embed_description(event.id, description)
if self.config.semantic_search.enabled:
self.embeddings.embed_description(event.id, description)
logger.debug(
"Generated description for %s (%d images): %s",
@ -379,6 +495,45 @@ class EmbeddingMaintainer(threading.Thread):
description,
)
def _read_and_crop_snapshot(self, event: Event, camera_config) -> bytes | None:
"""Read, decode, and crop the snapshot image."""
snapshot_file = os.path.join(CLIPS_DIR, f"{event.camera}-{event.id}.jpg")
if not os.path.isfile(snapshot_file):
logger.error(
f"Cannot load snapshot for {event.id}, file not found: {snapshot_file}"
)
return None
try:
with open(snapshot_file, "rb") as image_file:
snapshot_image = image_file.read()
img = cv2.imdecode(
np.frombuffer(snapshot_image, dtype=np.int8),
cv2.IMREAD_COLOR,
)
# Crop snapshot based on region
# provide full image if region doesn't exist (manual events)
height, width = img.shape[:2]
x1_rel, y1_rel, width_rel, height_rel = event.data.get(
"region", [0, 0, 1, 1]
)
x1, y1 = int(x1_rel * width), int(y1_rel * height)
cropped_image = img[
y1 : y1 + int(height_rel * height),
x1 : x1 + int(width_rel * width),
]
_, buffer = cv2.imencode(".jpg", cropped_image)
return buffer.tobytes()
except Exception:
return None
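# Worked example of the relative-region crop above (values assumed for
# illustration): a region of [0.25, 0.25, 0.5, 0.5] on a 1920x1080 snapshot
# gives x1 = int(0.25 * 1920) = 480, y1 = int(0.25 * 1080) = 270, and a crop
# of int(0.5 * 1920) x int(0.5 * 1080) = 960 x 540 pixels, i.e.
# img[270:810, 480:1440].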
def handle_regenerate_description(self, event_id: str, source: str) -> None:
try:
event: Event = Event.get(Event.id == event_id)
@ -393,39 +548,18 @@ class EmbeddingMaintainer(threading.Thread):
thumbnail = get_event_thumbnail_bytes(event)
# ensure we have a jpeg to pass to the model
thumbnail = ensure_jpeg_bytes(thumbnail)
logger.debug(
f"Trying {source} regeneration for {event}, has_snapshot: {event.has_snapshot}"
)
if event.has_snapshot and source == "snapshot":
snapshot_file = os.path.join(CLIPS_DIR, f"{event.camera}-{event.id}.jpg")
if not os.path.isfile(snapshot_file):
logger.error(
f"Cannot regenerate description for {event.id}, snapshot file not found: {snapshot_file}"
)
snapshot_image = self._read_and_crop_snapshot(event, camera_config)
if not snapshot_image:
return
with open(snapshot_file, "rb") as image_file:
snapshot_image = image_file.read()
img = cv2.imdecode(
np.frombuffer(snapshot_image, dtype=np.int8), cv2.IMREAD_COLOR
)
# crop snapshot based on region before sending off to genai
# provide full image if region doesn't exist (manual events)
region = event.data.get("region", [0, 0, 1, 1])
height, width = img.shape[:2]
x1_rel, y1_rel, width_rel, height_rel = region
x1, y1 = int(x1_rel * width), int(y1_rel * height)
cropped_image = img[
y1 : y1 + int(height_rel * height), x1 : x1 + int(width_rel * width)
]
_, buffer = cv2.imencode(".jpg", cropped_image)
snapshot_image = buffer.tobytes()
embed_image = (
[snapshot_image]
if event.has_snapshot and source == "snapshot"
@ -436,4 +570,4 @@ class EmbeddingMaintainer(threading.Thread):
)
)
self._embed_description(event, embed_image)
self._genai_embed_description(event, embed_image)

View File

@ -0,0 +1,100 @@
"""Base class for onnx embedding implementations."""
import logging
import os
from abc import ABC, abstractmethod
from enum import Enum
from io import BytesIO
import numpy as np
import requests
from PIL import Image
from frigate.const import UPDATE_MODEL_STATE
from frigate.types import ModelStatusTypesEnum
from frigate.util.downloader import ModelDownloader
logger = logging.getLogger(__name__)
class EmbeddingTypeEnum(str, Enum):
thumbnail = "thumbnail"
description = "description"
class BaseEmbedding(ABC):
"""Base embedding class."""
def __init__(self, model_name: str, model_file: str, download_urls: dict[str, str]):
self.model_name = model_name
self.model_file = model_file
self.download_urls = download_urls
self.downloader: ModelDownloader = None
def _download_model(self, path: str):
try:
file_name = os.path.basename(path)
if file_name in self.download_urls:
ModelDownloader.download_from_url(self.download_urls[file_name], path)
self.downloader.requestor.send_data(
UPDATE_MODEL_STATE,
{
"model": f"{self.model_name}-{file_name}",
"state": ModelStatusTypesEnum.downloaded,
},
)
except Exception:
self.downloader.requestor.send_data(
UPDATE_MODEL_STATE,
{
"model": f"{self.model_name}-{file_name}",
"state": ModelStatusTypesEnum.error,
},
)
@abstractmethod
def _load_model_and_utils(self):
pass
@abstractmethod
def _preprocess_inputs(self, raw_inputs: any) -> any:
pass
def _process_image(self, image, output: str = "RGB") -> Image.Image:
if isinstance(image, str):
if image.startswith("http"):
response = requests.get(image)
image = Image.open(BytesIO(response.content)).convert(output)
elif isinstance(image, bytes):
image = Image.open(BytesIO(image)).convert(output)
return image
def _postprocess_outputs(self, outputs: any) -> any:
return outputs
def __call__(
self, inputs: list[str] | list[Image.Image]
) -> list[np.ndarray]:
self._load_model_and_utils()
processed = self._preprocess_inputs(inputs)
input_names = self.runner.get_input_names()
onnx_inputs = {name: [] for name in input_names}
input: dict[str, any]
for input in processed:
for key, value in input.items():
if key in input_names:
onnx_inputs[key].append(value[0])
for key in input_names:
if onnx_inputs.get(key):
onnx_inputs[key] = np.stack(onnx_inputs[key])
else:
logger.warning(f"Expected input '{key}' not found in onnx_inputs")
outputs = self.runner.run(onnx_inputs)[0]
embeddings = self._postprocess_outputs(outputs)
return [embedding for embedding in embeddings]
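A minimal subclass sketch showing the contract the abstract methods above impose. Everything here is illustrative: the model name, file, URL, download path, and the ONNX input name "input" are made up, and it assumes ONNXModelRunner is imported from the sibling runner module the way the concrete embeddings do.
class ToyEmbedding(BaseEmbedding):
    """Illustrative subclass only; names and URLs are placeholders."""

    def __init__(self):
        super().__init__(
            model_name="toy-model",
            model_file="toy.onnx",
            download_urls={"toy.onnx": "https://example.com/toy.onnx"},
        )
        self.download_path = "/tmp/toy-model"
        self.runner = None

    def _load_model_and_utils(self):
        # concrete subclasses wait for downloads and build an ONNXModelRunner here
        if self.runner is None:
            self.runner = ONNXModelRunner(
                os.path.join(self.download_path, self.model_file), "AUTO"
            )

    def _preprocess_inputs(self, raw_inputs):
        # return one dict per input, keyed by the ONNX model's input name
        return [
            {"input": np.asarray(x, dtype=np.float32)[np.newaxis, ...]}
            for x in raw_inputs
        ]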

View File

@ -0,0 +1,216 @@
"""JinaV1 Embeddings."""
import logging
import os
import warnings
# importing this without pytorch or others causes a warning
# https://github.com/huggingface/transformers/issues/27214
# suppressed by setting env TRANSFORMERS_NO_ADVISORY_WARNINGS=1
from transformers import AutoFeatureExtractor, AutoTokenizer
from transformers.utils.logging import disable_progress_bar
from frigate.comms.inter_process import InterProcessRequestor
from frigate.const import MODEL_CACHE_DIR, UPDATE_MODEL_STATE
from frigate.types import ModelStatusTypesEnum
from frigate.util.downloader import ModelDownloader
from .base_embedding import BaseEmbedding
from .runner import ONNXModelRunner
warnings.filterwarnings(
"ignore",
category=FutureWarning,
message="The class CLIPFeatureExtractor is deprecated",
)
# disables the progress bar for downloading tokenizers and feature extractors
disable_progress_bar()
logger = logging.getLogger(__name__)
class JinaV1TextEmbedding(BaseEmbedding):
def __init__(
self,
model_size: str,
requestor: InterProcessRequestor,
device: str = "AUTO",
):
super().__init__(
model_name="jinaai/jina-clip-v1",
model_file="text_model_fp16.onnx",
download_urls={
"text_model_fp16.onnx": "https://huggingface.co/jinaai/jina-clip-v1/resolve/main/onnx/text_model_fp16.onnx",
},
)
self.tokenizer_file = "tokenizer"
self.requestor = requestor
self.model_size = model_size
self.device = device
self.download_path = os.path.join(MODEL_CACHE_DIR, self.model_name)
self.tokenizer = None
self.feature_extractor = None
self.runner = None
files_names = list(self.download_urls.keys()) + [self.tokenizer_file]
if not all(
os.path.exists(os.path.join(self.download_path, n)) for n in files_names
):
logger.debug(f"starting model download for {self.model_name}")
self.downloader = ModelDownloader(
model_name=self.model_name,
download_path=self.download_path,
file_names=files_names,
download_func=self._download_model,
)
self.downloader.ensure_model_files()
else:
self.downloader = None
ModelDownloader.mark_files_state(
self.requestor,
self.model_name,
files_names,
ModelStatusTypesEnum.downloaded,
)
self._load_model_and_utils()
logger.debug(f"models are already downloaded for {self.model_name}")
def _download_model(self, path: str):
try:
file_name = os.path.basename(path)
if file_name in self.download_urls:
ModelDownloader.download_from_url(self.download_urls[file_name], path)
elif file_name == self.tokenizer_file:
if not os.path.exists(path + "/" + self.model_name):
logger.info(f"Downloading {self.model_name} tokenizer")
tokenizer = AutoTokenizer.from_pretrained(
self.model_name,
trust_remote_code=True,
cache_dir=f"{MODEL_CACHE_DIR}/{self.model_name}/tokenizer",
clean_up_tokenization_spaces=True,
)
tokenizer.save_pretrained(path)
self.downloader.requestor.send_data(
UPDATE_MODEL_STATE,
{
"model": f"{self.model_name}-{file_name}",
"state": ModelStatusTypesEnum.downloaded,
},
)
except Exception:
self.downloader.requestor.send_data(
UPDATE_MODEL_STATE,
{
"model": f"{self.model_name}-{file_name}",
"state": ModelStatusTypesEnum.error,
},
)
def _load_model_and_utils(self):
if self.runner is None:
if self.downloader:
self.downloader.wait_for_download()
tokenizer_path = os.path.join(
f"{MODEL_CACHE_DIR}/{self.model_name}/tokenizer"
)
self.tokenizer = AutoTokenizer.from_pretrained(
self.model_name,
cache_dir=tokenizer_path,
trust_remote_code=True,
clean_up_tokenization_spaces=True,
)
self.runner = ONNXModelRunner(
os.path.join(self.download_path, self.model_file),
self.device,
self.model_size,
)
def _preprocess_inputs(self, raw_inputs):
max_length = max(len(self.tokenizer.encode(text)) for text in raw_inputs)
return [
self.tokenizer(
text,
padding="max_length",
truncation=True,
max_length=max_length,
return_tensors="np",
)
for text in raw_inputs
]
class JinaV1ImageEmbedding(BaseEmbedding):
def __init__(
self,
model_size: str,
requestor: InterProcessRequestor,
device: str = "AUTO",
):
model_file = (
"vision_model_fp16.onnx"
if model_size == "large"
else "vision_model_quantized.onnx"
)
super().__init__(
model_name="jinaai/jina-clip-v1",
model_file=model_file,
download_urls={
model_file: f"https://huggingface.co/jinaai/jina-clip-v1/resolve/main/onnx/{model_file}",
"preprocessor_config.json": "https://huggingface.co/jinaai/jina-clip-v1/resolve/main/preprocessor_config.json",
},
)
self.requestor = requestor
self.model_size = model_size
self.device = device
self.download_path = os.path.join(MODEL_CACHE_DIR, self.model_name)
self.feature_extractor = None
self.runner: ONNXModelRunner | None = None
files_names = list(self.download_urls.keys())
if not all(
os.path.exists(os.path.join(self.download_path, n)) for n in files_names
):
logger.debug(f"starting model download for {self.model_name}")
self.downloader = ModelDownloader(
model_name=self.model_name,
download_path=self.download_path,
file_names=files_names,
download_func=self._download_model,
)
self.downloader.ensure_model_files()
else:
self.downloader = None
ModelDownloader.mark_files_state(
self.requestor,
self.model_name,
files_names,
ModelStatusTypesEnum.downloaded,
)
self._load_model_and_utils()
logger.debug(f"models are already downloaded for {self.model_name}")
def _load_model_and_utils(self):
if self.runner is None:
if self.downloader:
self.downloader.wait_for_download()
self.feature_extractor = AutoFeatureExtractor.from_pretrained(
f"{MODEL_CACHE_DIR}/{self.model_name}",
)
self.runner = ONNXModelRunner(
os.path.join(self.download_path, self.model_file),
self.device,
self.model_size,
)
def _preprocess_inputs(self, raw_inputs):
processed_images = [self._process_image(img) for img in raw_inputs]
return [
self.feature_extractor(images=image, return_tensors="np")
for image in processed_images
]

View File

@ -0,0 +1,231 @@
"""JinaV2 Embeddings."""
import io
import logging
import os
import numpy as np
from PIL import Image
from transformers import AutoTokenizer
from transformers.utils.logging import disable_progress_bar, set_verbosity_error
from frigate.comms.inter_process import InterProcessRequestor
from frigate.const import MODEL_CACHE_DIR, UPDATE_MODEL_STATE
from frigate.types import ModelStatusTypesEnum
from frigate.util.downloader import ModelDownloader
from .base_embedding import BaseEmbedding
from .runner import ONNXModelRunner
# disables the progress bar and download logging for downloading tokenizers and image processors
disable_progress_bar()
set_verbosity_error()
logger = logging.getLogger(__name__)
class JinaV2Embedding(BaseEmbedding):
def __init__(
self,
model_size: str,
requestor: InterProcessRequestor,
device: str = "AUTO",
embedding_type: str = None,
):
model_file = (
"model_fp16.onnx" if model_size == "large" else "model_quantized.onnx"
)
super().__init__(
model_name="jinaai/jina-clip-v2",
model_file=model_file,
download_urls={
model_file: f"https://huggingface.co/jinaai/jina-clip-v2/resolve/main/onnx/{model_file}",
"preprocessor_config.json": "https://huggingface.co/jinaai/jina-clip-v2/resolve/main/preprocessor_config.json",
},
)
self.tokenizer_file = "tokenizer"
self.embedding_type = embedding_type
self.requestor = requestor
self.model_size = model_size
self.device = device
self.download_path = os.path.join(MODEL_CACHE_DIR, self.model_name)
self.tokenizer = None
self.image_processor = None
self.runner = None
files_names = list(self.download_urls.keys()) + [self.tokenizer_file]
if not all(
os.path.exists(os.path.join(self.download_path, n)) for n in files_names
):
logger.debug(f"starting model download for {self.model_name}")
self.downloader = ModelDownloader(
model_name=self.model_name,
download_path=self.download_path,
file_names=files_names,
download_func=self._download_model,
)
self.downloader.ensure_model_files()
else:
self.downloader = None
ModelDownloader.mark_files_state(
self.requestor,
self.model_name,
files_names,
ModelStatusTypesEnum.downloaded,
)
self._load_model_and_utils()
logger.debug(f"models are already downloaded for {self.model_name}")
def _download_model(self, path: str):
try:
file_name = os.path.basename(path)
if file_name in self.download_urls:
ModelDownloader.download_from_url(self.download_urls[file_name], path)
elif file_name == self.tokenizer_file:
if not os.path.exists(os.path.join(path, self.model_name)):
logger.info(f"Downloading {self.model_name} tokenizer")
tokenizer = AutoTokenizer.from_pretrained(
self.model_name,
trust_remote_code=True,
cache_dir=os.path.join(
MODEL_CACHE_DIR, self.model_name, "tokenizer"
),
clean_up_tokenization_spaces=True,
)
tokenizer.save_pretrained(path)
self.requestor.send_data(
UPDATE_MODEL_STATE,
{
"model": f"{self.model_name}-{file_name}",
"state": ModelStatusTypesEnum.downloaded,
},
)
except Exception:
self.requestor.send_data(
UPDATE_MODEL_STATE,
{
"model": f"{self.model_name}-{file_name}",
"state": ModelStatusTypesEnum.error,
},
)
def _load_model_and_utils(self):
if self.runner is None:
if self.downloader:
self.downloader.wait_for_download()
tokenizer_path = os.path.join(
f"{MODEL_CACHE_DIR}/{self.model_name}/tokenizer"
)
self.tokenizer = AutoTokenizer.from_pretrained(
self.model_name,
cache_dir=tokenizer_path,
trust_remote_code=True,
clean_up_tokenization_spaces=True,
)
self.runner = ONNXModelRunner(
os.path.join(self.download_path, self.model_file),
self.device,
self.model_size,
)
def _preprocess_image(self, image_data: bytes | Image.Image) -> np.ndarray:
"""
Manually preprocess a single image from bytes or PIL.Image to (3, 512, 512).
"""
if isinstance(image_data, bytes):
image = Image.open(io.BytesIO(image_data))
else:
image = image_data
if image.mode != "RGB":
image = image.convert("RGB")
image = image.resize((512, 512), Image.Resampling.LANCZOS)
# Convert to numpy array, normalize to [0, 1], and transpose to (channels, height, width)
image_array = np.array(image, dtype=np.float32) / 255.0
image_array = np.transpose(image_array, (2, 0, 1)) # (H, W, C) -> (C, H, W)
return image_array
def _preprocess_inputs(self, raw_inputs):
"""
Preprocess inputs into a list of real input tensors (no dummies).
- For text: Returns list of input_ids.
- For vision: Returns list of pixel_values.
"""
if not isinstance(raw_inputs, list):
raw_inputs = [raw_inputs]
processed = []
if self.embedding_type == "text":
for text in raw_inputs:
input_ids = self.tokenizer([text], return_tensors="np")["input_ids"]
processed.append(input_ids)
elif self.embedding_type == "vision":
for img in raw_inputs:
pixel_values = self._preprocess_image(img)
processed.append(
pixel_values[np.newaxis, ...]
) # Add batch dim: (1, 3, 512, 512)
else:
raise ValueError(
f"Invalid embedding_type: {self.embedding_type}. Must be 'text' or 'vision'."
)
return processed
def _postprocess_outputs(self, outputs):
"""
Process ONNX model outputs, truncating each embedding in the array to truncate_dim.
- outputs: NumPy array of embeddings.
- Returns: List of truncated embeddings.
"""
# size of vector in database
truncate_dim = 768
# jina v2 defaults to 1024 and uses Matryoshka representation, so
# truncating only causes an extremely minor decrease in retrieval accuracy
if outputs.shape[-1] > truncate_dim:
outputs = outputs[..., :truncate_dim]
return outputs
def __call__(
self, inputs: list[str] | list[Image.Image], embedding_type=None
) -> list[np.ndarray]:
self.embedding_type = embedding_type
if not self.embedding_type:
raise ValueError(
"embedding_type must be specified either in __init__ or __call__"
)
self._load_model_and_utils()
processed = self._preprocess_inputs(inputs)
batch_size = len(processed)
# Prepare ONNX inputs with matching batch sizes
onnx_inputs = {}
if self.embedding_type == "text":
onnx_inputs["input_ids"] = np.stack([x[0] for x in processed])
onnx_inputs["pixel_values"] = np.zeros(
(batch_size, 3, 512, 512), dtype=np.float32
)
elif self.embedding_type == "vision":
onnx_inputs["input_ids"] = np.zeros((batch_size, 16), dtype=np.int64)
onnx_inputs["pixel_values"] = np.stack([x[0] for x in processed])
else:
raise ValueError("Invalid embedding type")
# Run inference
outputs = self.runner.run(onnx_inputs)
if self.embedding_type == "text":
embeddings = outputs[2] # text embeddings
elif self.embedding_type == "vision":
embeddings = outputs[3] # image embeddings
else:
raise ValueError("Invalid embedding type")
embeddings = self._postprocess_outputs(embeddings)
return [embedding for embedding in embeddings]
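A usage sketch of the class above; the requestor and the inputs are placeholders, and "large" is simply one of the sizes the constructor recognizes. It illustrates how the same instance serves both modalities by switching embedding_type per call, with each returned vector truncated to 768 dimensions by _postprocess_outputs.
# embedder = JinaV2Embedding("large", requestor, device="AUTO")
# text_vecs = embedder(["a red car parked outside"], embedding_type="text")
# image_vecs = embedder([jpeg_bytes], embedding_type="vision")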

View File

@ -0,0 +1,297 @@
import logging
import os
import warnings
import cv2
import numpy as np
from frigate.comms.inter_process import InterProcessRequestor
from frigate.const import MODEL_CACHE_DIR
from frigate.types import ModelStatusTypesEnum
from frigate.util.downloader import ModelDownloader
from .base_embedding import BaseEmbedding
from .runner import ONNXModelRunner
warnings.filterwarnings(
"ignore",
category=FutureWarning,
message="The class CLIPFeatureExtractor is deprecated",
)
logger = logging.getLogger(__name__)
LPR_EMBEDDING_SIZE = 256
class PaddleOCRDetection(BaseEmbedding):
def __init__(
self,
model_size: str,
requestor: InterProcessRequestor,
device: str = "AUTO",
):
super().__init__(
model_name="paddleocr-onnx",
model_file="detection.onnx",
download_urls={
"detection.onnx": "https://github.com/hawkeye217/paddleocr-onnx/raw/refs/heads/master/models/detection.onnx"
},
)
self.requestor = requestor
self.model_size = model_size
self.device = device
self.download_path = os.path.join(MODEL_CACHE_DIR, self.model_name)
self.runner: ONNXModelRunner | None = None
files_names = list(self.download_urls.keys())
if not all(
os.path.exists(os.path.join(self.download_path, n)) for n in files_names
):
logger.debug(f"starting model download for {self.model_name}")
self.downloader = ModelDownloader(
model_name=self.model_name,
download_path=self.download_path,
file_names=files_names,
download_func=self._download_model,
)
self.downloader.ensure_model_files()
else:
self.downloader = None
ModelDownloader.mark_files_state(
self.requestor,
self.model_name,
files_names,
ModelStatusTypesEnum.downloaded,
)
self._load_model_and_utils()
logger.debug(f"models are already downloaded for {self.model_name}")
def _load_model_and_utils(self):
if self.runner is None:
if self.downloader:
self.downloader.wait_for_download()
self.runner = ONNXModelRunner(
os.path.join(self.download_path, self.model_file),
self.device,
self.model_size,
)
def _preprocess_inputs(self, raw_inputs):
preprocessed = []
for x in raw_inputs:
preprocessed.append(x)
return [{"x": preprocessed[0]}]
class PaddleOCRClassification(BaseEmbedding):
def __init__(
self,
model_size: str,
requestor: InterProcessRequestor,
device: str = "AUTO",
):
super().__init__(
model_name="paddleocr-onnx",
model_file="classification.onnx",
download_urls={
"classification.onnx": "https://github.com/hawkeye217/paddleocr-onnx/raw/refs/heads/master/models/classification.onnx"
},
)
self.requestor = requestor
self.model_size = model_size
self.device = device
self.download_path = os.path.join(MODEL_CACHE_DIR, self.model_name)
self.runner: ONNXModelRunner | None = None
files_names = list(self.download_urls.keys())
if not all(
os.path.exists(os.path.join(self.download_path, n)) for n in files_names
):
logger.debug(f"starting model download for {self.model_name}")
self.downloader = ModelDownloader(
model_name=self.model_name,
download_path=self.download_path,
file_names=files_names,
download_func=self._download_model,
)
self.downloader.ensure_model_files()
else:
self.downloader = None
ModelDownloader.mark_files_state(
self.requestor,
self.model_name,
files_names,
ModelStatusTypesEnum.downloaded,
)
self._load_model_and_utils()
logger.debug(f"models are already downloaded for {self.model_name}")
def _load_model_and_utils(self):
if self.runner is None:
if self.downloader:
self.downloader.wait_for_download()
self.runner = ONNXModelRunner(
os.path.join(self.download_path, self.model_file),
self.device,
self.model_size,
)
def _preprocess_inputs(self, raw_inputs):
processed = []
for img in raw_inputs:
processed.append({"x": img})
return processed
class PaddleOCRRecognition(BaseEmbedding):
def __init__(
self,
model_size: str,
requestor: InterProcessRequestor,
device: str = "AUTO",
):
super().__init__(
model_name="paddleocr-onnx",
model_file="recognition.onnx",
download_urls={
"recognition.onnx": "https://github.com/hawkeye217/paddleocr-onnx/raw/refs/heads/master/models/recognition.onnx"
},
)
self.requestor = requestor
self.model_size = model_size
self.device = device
self.download_path = os.path.join(MODEL_CACHE_DIR, self.model_name)
self.runner: ONNXModelRunner | None = None
files_names = list(self.download_urls.keys())
if not all(
os.path.exists(os.path.join(self.download_path, n)) for n in files_names
):
logger.debug(f"starting model download for {self.model_name}")
self.downloader = ModelDownloader(
model_name=self.model_name,
download_path=self.download_path,
file_names=files_names,
download_func=self._download_model,
)
self.downloader.ensure_model_files()
else:
self.downloader = None
ModelDownloader.mark_files_state(
self.requestor,
self.model_name,
files_names,
ModelStatusTypesEnum.downloaded,
)
self._load_model_and_utils()
logger.debug(f"models are already downloaded for {self.model_name}")
def _load_model_and_utils(self):
if self.runner is None:
if self.downloader:
self.downloader.wait_for_download()
self.runner = ONNXModelRunner(
os.path.join(self.download_path, self.model_file),
self.device,
self.model_size,
)
def _preprocess_inputs(self, raw_inputs):
processed = []
for img in raw_inputs:
processed.append({"x": img})
return processed
class LicensePlateDetector(BaseEmbedding):
def __init__(
self,
model_size: str,
requestor: InterProcessRequestor,
device: str = "AUTO",
):
super().__init__(
model_name="yolov9_license_plate",
model_file="yolov9-256-license-plates.onnx",
download_urls={
"yolov9-256-license-plates.onnx": "https://github.com/hawkeye217/yolov9-license-plates/raw/refs/heads/master/models/yolov9-256-license-plates.onnx"
},
)
self.requestor = requestor
self.model_size = model_size
self.device = device
self.download_path = os.path.join(MODEL_CACHE_DIR, self.model_name)
self.runner: ONNXModelRunner | None = None
files_names = list(self.download_urls.keys())
if not all(
os.path.exists(os.path.join(self.download_path, n)) for n in files_names
):
logger.debug(f"starting model download for {self.model_name}")
self.downloader = ModelDownloader(
model_name=self.model_name,
download_path=self.download_path,
file_names=files_names,
download_func=self._download_model,
)
self.downloader.ensure_model_files()
else:
self.downloader = None
ModelDownloader.mark_files_state(
self.requestor,
self.model_name,
files_names,
ModelStatusTypesEnum.downloaded,
)
self._load_model_and_utils()
logger.debug(f"models are already downloaded for {self.model_name}")
def _load_model_and_utils(self):
if self.runner is None:
if self.downloader:
self.downloader.wait_for_download()
self.runner = ONNXModelRunner(
os.path.join(self.download_path, self.model_file),
self.device,
self.model_size,
)
def _preprocess_inputs(self, raw_inputs):
if isinstance(raw_inputs, list):
raise ValueError("License plate embedding does not support batch inputs.")
# Get image as numpy array
img = self._process_image(raw_inputs)
height, width, channels = img.shape
# Resize maintaining aspect ratio
if width > height:
new_height = int(((height / width) * LPR_EMBEDDING_SIZE) // 4 * 4)
img = cv2.resize(img, (LPR_EMBEDDING_SIZE, new_height))
else:
new_width = int(((width / height) * LPR_EMBEDDING_SIZE) // 4 * 4)
img = cv2.resize(img, (new_width, LPR_EMBEDDING_SIZE))
# Get new dimensions after resize
og_h, og_w, channels = img.shape
# Create black square frame
frame = np.full(
(LPR_EMBEDDING_SIZE, LPR_EMBEDDING_SIZE, channels),
(0, 0, 0),
dtype=np.float32,
)
# Center the resized image in the square frame
x_center = (LPR_EMBEDDING_SIZE - og_w) // 2
y_center = (LPR_EMBEDDING_SIZE - og_h) // 2
frame[y_center : y_center + og_h, x_center : x_center + og_w] = img
# Normalize to 0-1
frame = frame / 255.0
# Convert from HWC to CHW format and add batch dimension
frame = np.transpose(frame, (2, 0, 1))
frame = np.expand_dims(frame, axis=0)
return [{"images": frame}]

View File

@ -0,0 +1,76 @@
"""Convenience runner for onnx models."""
import logging
import os.path
from typing import Any
import onnxruntime as ort
from frigate.const import MODEL_CACHE_DIR
from frigate.util.model import get_ort_providers
try:
import openvino as ov
except ImportError:
# openvino is not included
pass
logger = logging.getLogger(__name__)
class ONNXModelRunner:
"""Run onnx models optimally based on available hardware."""
def __init__(self, model_path: str, device: str, requires_fp16: bool = False):
self.model_path = model_path
self.ort: ort.InferenceSession = None
self.ov: ov.Core = None
providers, options = get_ort_providers(device == "CPU", device, requires_fp16)
self.interpreter = None
if "OpenVINOExecutionProvider" in providers:
try:
# use OpenVINO directly
self.type = "ov"
self.ov = ov.Core()
self.ov.set_property(
{ov.properties.cache_dir: os.path.join(MODEL_CACHE_DIR, "openvino")}
)
self.interpreter = self.ov.compile_model(
model=model_path, device_name=device
)
except Exception as e:
logger.warning(
f"OpenVINO failed to build model, using CPU instead: {e}"
)
self.interpreter = None
# Use ONNXRuntime
if self.interpreter is None:
self.type = "ort"
self.ort = ort.InferenceSession(
model_path,
providers=providers,
provider_options=options,
)
def get_input_names(self) -> list[str]:
if self.type == "ov":
input_names = []
for input in self.interpreter.inputs:
input_names.extend(input.names)
return input_names
elif self.type == "ort":
return [input.name for input in self.ort.get_inputs()]
def run(self, input: dict[str, Any]) -> Any:
if self.type == "ov":
infer_request = self.interpreter.create_infer_request()
outputs = infer_request.infer(input)
return outputs
elif self.type == "ort":
return self.ort.run(None, input)
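A short usage sketch; the model path and input name are placeholders. The caller does not need to know whether OpenVINO or ONNX Runtime was selected, since get_input_names() and run() behave the same either way.
# runner = ONNXModelRunner("/config/model_cache/toy/toy.onnx", device="AUTO")
# names = runner.get_input_names()                  # e.g. ["images"]
# outputs = runner.run({"images": np.zeros((1, 3, 256, 256), dtype=np.float32)})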

View File

@ -135,8 +135,13 @@ class AudioEventMaintainer(threading.Thread):
# create communication for audio detections
self.requestor = InterProcessRequestor()
self.config_subscriber = ConfigSubscriber(f"config/audio/{camera.name}")
self.enabled_subscriber = ConfigSubscriber(
f"config/enabled/{camera.name}", True
)
self.detection_publisher = DetectionPublisher(DetectionTypeEnum.audio)
self.was_enabled = camera.enabled
def detect_audio(self, audio) -> None:
if not self.config.audio.enabled or self.stop_event.is_set():
return
@ -248,6 +253,23 @@ class AudioEventMaintainer(threading.Thread):
f"Failed to end audio event {detection['id']} with status code {resp.status_code}"
)
def expire_all_detections(self) -> None:
"""Immediately end all current detections"""
now = datetime.datetime.now().timestamp()
for label, detection in list(self.detections.items()):
if detection:
self.requestor.send_data(f"{self.config.name}/audio/{label}", "OFF")
resp = requests.put(
f"{FRIGATE_LOCALHOST}/api/events/{detection['id']}/end",
json={"end_time": now},
)
if resp.status_code == 200:
self.detections[label] = None
else:
self.logger.warning(
f"Failed to end audio event {detection['id']} with status code {resp.status_code}"
)
def start_or_restart_ffmpeg(self) -> None:
self.audio_listener = start_or_restart_ffmpeg(
self.ffmpeg_cmd,
@ -283,10 +305,41 @@ class AudioEventMaintainer(threading.Thread):
self.logger.error(f"Error reading audio data from ffmpeg process: {e}")
log_and_restart()
def _update_enabled_state(self) -> bool:
"""Fetch the latest config and update enabled state."""
_, config_data = self.enabled_subscriber.check_for_update()
if config_data:
self.config.enabled = config_data.enabled
return config_data.enabled
return self.config.enabled
def run(self) -> None:
self.start_or_restart_ffmpeg()
if self._update_enabled_state():
self.start_or_restart_ffmpeg()
while not self.stop_event.is_set():
enabled = self._update_enabled_state()
if enabled != self.was_enabled:
if enabled:
self.logger.debug(
f"Enabling audio detections for {self.config.name}"
)
self.start_or_restart_ffmpeg()
else:
self.logger.debug(
f"Disabling audio detections for {self.config.name}, ending events"
)
self.expire_all_detections()
stop_ffmpeg(self.audio_listener, self.logger)
self.audio_listener = None
self.was_enabled = enabled
continue
if not enabled:
time.sleep(0.1)
continue
# check if there is an updated config
(
updated_topic,
@ -302,6 +355,7 @@ class AudioEventMaintainer(threading.Thread):
self.logpipe.close()
self.requestor.stop()
self.config_subscriber.stop()
self.enabled_subscriber.stop()
self.detection_publisher.stop()

View File

@ -10,6 +10,7 @@ from frigate.const import (
FFMPEG_HWACCEL_NVIDIA,
FFMPEG_HWACCEL_VAAPI,
FFMPEG_HWACCEL_VULKAN,
LIBAVFORMAT_VERSION_MAJOR,
)
from frigate.util.services import vainfo_hwaccel
from frigate.version import VERSION
@ -51,9 +52,8 @@ class LibvaGpuSelector:
return ""
LIBAV_VERSION = int(os.getenv("LIBAVFORMAT_VERSION_MAJOR", "59") or "59")
FPS_VFR_PARAM = "-fps_mode vfr" if LIBAV_VERSION >= 59 else "-vsync 2"
TIMEOUT_PARAM = "-timeout" if LIBAV_VERSION >= 59 else "-stimeout"
FPS_VFR_PARAM = "-fps_mode vfr" if LIBAVFORMAT_VERSION_MAJOR >= 59 else "-vsync 2"
TIMEOUT_PARAM = "-timeout" if LIBAVFORMAT_VERSION_MAJOR >= 59 else "-stimeout"
_gpu_selector = LibvaGpuSelector()
_user_agent_args = [
@ -65,8 +65,8 @@ PRESETS_HW_ACCEL_DECODE = {
"preset-rpi-64-h264": "-c:v:1 h264_v4l2m2m",
"preset-rpi-64-h265": "-c:v:1 hevc_v4l2m2m",
FFMPEG_HWACCEL_VAAPI: f"-hwaccel_flags allow_profile_mismatch -hwaccel vaapi -hwaccel_device {_gpu_selector.get_selected_gpu()} -hwaccel_output_format vaapi",
"preset-intel-qsv-h264": f"-hwaccel qsv -qsv_device {_gpu_selector.get_selected_gpu()} -hwaccel_output_format qsv -c:v h264_qsv{' -bsf:v dump_extra' if LIBAV_VERSION >= 61 else ''}", # https://trac.ffmpeg.org/ticket/9766#comment:17
"preset-intel-qsv-h265": f"-load_plugin hevc_hw -hwaccel qsv -qsv_device {_gpu_selector.get_selected_gpu()} -hwaccel_output_format qsv{' -bsf:v dump_extra' if LIBAV_VERSION >= 61 else ''}", # https://trac.ffmpeg.org/ticket/9766#comment:17
"preset-intel-qsv-h264": f"-hwaccel qsv -qsv_device {_gpu_selector.get_selected_gpu()} -hwaccel_output_format qsv -c:v h264_qsv{' -bsf:v dump_extra' if LIBAVFORMAT_VERSION_MAJOR >= 61 else ''}", # https://trac.ffmpeg.org/ticket/9766#comment:17
"preset-intel-qsv-h265": f"-load_plugin hevc_hw -hwaccel qsv -qsv_device {_gpu_selector.get_selected_gpu()} -hwaccel_output_format qsv{' -bsf:v dump_extra' if LIBAVFORMAT_VERSION_MAJOR >= 61 else ''}", # https://trac.ffmpeg.org/ticket/9766#comment:17
FFMPEG_HWACCEL_NVIDIA: "-hwaccel cuda -hwaccel_output_format cuda",
"preset-jetson-h264": "-c:v h264_nvmpi -resize {1}x{2}",
"preset-jetson-h265": "-c:v hevc_nvmpi -resize {1}x{2}",

Some files were not shown because too many files have changed in this diff.