# frigate/frigate/genai/__init__.py

"""Generative AI module for Frigate."""

import datetime
import importlib
import json
import logging
import os
import re
from typing import Any, Callable, Optional

import numpy as np
from playhouse.shortcuts import model_to_dict
from pydantic import ValidationError

from frigate.config import CameraConfig, GenAIConfig, GenAIProviderEnum
from frigate.const import CLIPS_DIR
from frigate.data_processing.post.types import ReviewMetadata
from frigate.genai.manager import GenAIClientManager
from frigate.models import Event

logger = logging.getLogger(__name__)

__all__ = [
    "GenAIClient",
    "GenAIClientManager",
    "GenAIConfig",
    "GenAIProviderEnum",
    "PROVIDERS",
    "load_providers",
    "register_genai_provider",
]

PROVIDERS = {}


def register_genai_provider(key: GenAIProviderEnum) -> Callable:
    """Build a class decorator that files a provider class under ``key``.

    The returned decorator stores the decorated class in the module-level
    ``PROVIDERS`` mapping (overwriting any earlier entry for the same key)
    and hands the class back unchanged.
    """

    def _register(provider_cls: type) -> type:
        PROVIDERS[key] = provider_cls
        return provider_cls

    return _register


class GenAIClient:
    """Generative AI client for Frigate."""

    def __init__(self, genai_config: GenAIConfig, timeout: int = 120) -> None:
        self.genai_config: GenAIConfig = genai_config
        self.timeout = timeout
        self.provider = self._init_provider()

    def generate_review_description(
        self,
        review_data: dict[str, Any],
        thumbnails: list[bytes],
        concerns: list[str],
        preferred_language: str | None,
        debug_save: bool,
        activity_context_prompt: str,
    ) -> ReviewMetadata | None:
        """Generate a description for the review item activity."""

        def get_concern_prompt() -> str:
            if concerns:
                concern_list = "\n    - ".join(concerns)
                return f"""- `other_concerns` (list of strings): Include a list of any of the following concerns that are occurring:
    - {concern_list}"""
            else:
                return ""

        def get_language_prompt() -> str:
            if preferred_language:
                return f"Provide your answer in {preferred_language}"
            else:
                return ""

        def get_objects_list() -> str:
            if review_data["unified_objects"]:
                return "\n- " + "\n- ".join(review_data["unified_objects"])
            else:
                return "\n- (No objects detected)"

        context_prompt = f"""
Your task is to analyze a sequence of images taken in chronological order from a security camera.

## Normal Activity Patterns for This Property

{activity_context_prompt}

## Task Instructions

Describe the scene based on observable actions and movements, evaluate the activity against the Activity Indicators above, and assign a potential_threat_level (0, 1, or 2) by applying the threat level indicators consistently.

## Analysis Guidelines

When forming your description:
- **CRITICAL: Only describe objects explicitly listed in "Objects in Scene" below.** Do not infer or mention additional people, vehicles, or objects not present in this list, even if visual patterns suggest them. If only a car is listed, do not describe a person interacting with it unless "person" is also in the objects list.
- **Only describe actions actually visible in the frames.** Do not assume or infer actions that you don't observe happening. If someone walks toward furniture but you never see them sit, do not say they sat. Stick to what you can see across the sequence.
- Describe what you observe: actions, movements, interactions with objects and the environment. Include any observable environmental changes (e.g., lighting changes triggered by activity).
- Note visible details such as clothing, items being carried or placed, tools or equipment present, and how they interact with the property or objects.
- Consider the full sequence chronologically: what happens from start to finish, how duration and actions relate to the location and objects involved.
- **Use the actual timestamp provided in "Activity started at"** below for time of day context—do not infer time from image brightness or darkness. Unusual hours (late night/early morning) should increase suspicion when the observable behavior itself appears questionable. However, recognize that some legitimate activities can occur at any hour.
- **Consider duration as a primary factor**: Apply the duration thresholds defined in the activity patterns above. Brief sequences during normal hours with apparent purpose typically indicate normal activity unless explicit suspicious actions are visible.
- **Weigh all evidence holistically**: Match the activity against the normal and suspicious patterns defined above, then evaluate based on the complete context (zone, objects, time, actions, duration). Apply the threat level indicators consistently. Use your judgment for edge cases.

## Response Field Guidelines

Respond with a JSON object matching the provided schema. Field-specific guidance:
- `scene`: Describe how the sequence begins, then the progression of events — all significant movements and actions in order. For example, if a vehicle arrives and then a person exits, describe both sequentially. For named subjects (those with a `←` separator in "Objects in Scene"), always use their name — do not replace them with generic terms. For unnamed objects (e.g., "person", "car"), refer to them naturally with articles (e.g., "a person", "the car"). Your description should align with and support the threat level you assign.
- `title`: Characterize **what took place and where** — interpret the overall purpose or outcome, do not simply compress the scene description into fewer words. Include the relevant location (zone, area, or entry point). For named subjects, always use their name. For unnamed objects, refer to them naturally with articles. No editorial qualifiers like "routine" or "suspicious."
- `potential_threat_level`: Must be consistent with your scene description and the activity patterns above.
{get_concern_prompt()}

## Sequence Details

- Camera: {review_data["camera"]}
- Total frames: {len(thumbnails)} (Frame 1 = earliest, Frame {len(thumbnails)} = latest)
- Activity started at {review_data["start"]} and lasted {review_data["duration"]} seconds
- Zones involved: {", ".join(review_data["zones"]) if review_data["zones"] else "None"}

## Objects in Scene

Each line represents a detection state, not necessarily unique individuals. The `←` symbol separates a recognized subject's name from their object type — use only the name (before the `←`) in your response, not the type after it. The same subject may appear across multiple lines if detected multiple times.

**Note: Unidentified objects (without names) are NOT indicators of suspicious activity—they simply mean the system hasn't identified that object.**
{get_objects_list()}

{get_language_prompt()}
"""
        logger.debug(
            f"Sending {len(thumbnails)} images to create review description on {review_data['camera']}"
        )

        if debug_save:
            with open(
                os.path.join(
                    CLIPS_DIR, "genai-requests", review_data["id"], "prompt.txt"
                ),
                "w",
            ) as f:
                f.write(context_prompt)

        # Build JSON schema for structured output from ReviewMetadata model
        schema = ReviewMetadata.model_json_schema()
        schema.get("properties", {}).pop("time", None)

        if "time" in schema.get("required", []):
            schema["required"].remove("time")
        if not concerns:
            schema.get("properties", {}).pop("other_concerns", None)
            if "other_concerns" in schema.get("required", []):
                schema["required"].remove("other_concerns")

        response_format = {
            "type": "json_schema",
            "json_schema": {
                "name": "review_metadata",
                "strict": True,
                "schema": schema,
            },
        }

        response = self._send(context_prompt, thumbnails, response_format)

        if debug_save and response:
            with open(
                os.path.join(
                    CLIPS_DIR, "genai-requests", review_data["id"], "response.txt"
                ),
                "w",
            ) as f:
                f.write(response)

        if response:
            clean_json = re.sub(
                r"\n?```$", "", re.sub(r"^```[a-zA-Z0-9]*\n?", "", response)
            )

            try:
                metadata = ReviewMetadata.model_validate_json(clean_json)
            except ValidationError as ve:
                # Constraint violations (length, item count, ranges) are logged
                # at debug and the response is kept anyway — a slightly
                # off-spec answer is still usable, and dropping the whole
                # response loses the narrative content the model produced.
                for err in ve.errors():
                    loc = ".".join(str(p) for p in err["loc"]) or "<root>"
                    logger.debug(
                        "Review metadata soft validation: %s — %s (input: %r)",
                        loc,
                        err["msg"],
                        err.get("input"),
                    )
                try:
                    raw = json.loads(clean_json)
                except json.JSONDecodeError as je:
                    logger.error("Failed to parse review description JSON: %s", je)
                    return None
                # observations and confidence are required on the model; fill an empty default
                # if the response omitted it so attribute access stays safe.
                raw.setdefault("observations", [])
                raw.setdefault("confidence", 0.0)
                metadata = ReviewMetadata.model_construct(**raw)
            except Exception as e:
                logger.error(
                    f"Failed to parse review description as the response did not match expected format. {e}"
                )
                return None

            try:
                # Normalize confidence if model returned a percentage (e.g. 85 instead of 0.85)
                if metadata.confidence > 1.0:
                    metadata.confidence = min(metadata.confidence / 100.0, 1.0)

                # If any verified objects (contain ← separator), set to 0
                if any("←" in obj for obj in review_data["unified_objects"]):
                    metadata.potential_threat_level = 0

                metadata.title = metadata.title[0].upper() + metadata.title[1:]
                metadata.time = review_data["start"]
                return metadata
            except Exception as e:
                logger.error(f"Failed to post-process review metadata: {e}")
                return None
        else:
            logger.debug(
                f"Invalid response received from GenAI provider for review description on {review_data['camera']}. Response: {response}",
            )
            return None

    def generate_review_summary(
        self,
        start_ts: float,
        end_ts: float,
        events: list[dict[str, Any]],
        preferred_language: str | None,
        debug_save: bool,
    ) -> str | None:
        """Generate a summary of review item descriptions over a period of time."""
        time_range = f"{datetime.datetime.fromtimestamp(start_ts).strftime('%B %d, %Y at %I:%M %p')} to {datetime.datetime.fromtimestamp(end_ts).strftime('%B %d, %Y at %I:%M %p')}"
        timeline_summary_prompt = f"""
You are a security officer writing a concise security report.

Time range: {time_range}

Input format: Each event is a JSON object with:
- "title", "scene", "confidence", "potential_threat_level" (0-2), "other_concerns", "camera", "time", "start_time", "end_time"
- "context": array of related events from other cameras that occurred during overlapping time periods

**Note: Use the "scene" field for event descriptions in the report. Ignore any "shortSummary" field if present.**

Report Structure - Use this EXACT format:

# Security Summary - {time_range}

## Overview
[Write 1-2 sentences summarizing the overall activity pattern during this period.]

---

## Timeline

[Group events by time periods (e.g., "Morning (6:00 AM - 12:00 PM)", "Afternoon (12:00 PM - 5:00 PM)", "Evening (5:00 PM - 9:00 PM)", "Night (9:00 PM - 6:00 AM)"). Use appropriate time blocks based on when events occurred.]

### [Time Block Name]

**HH:MM AM/PM** | [Camera Name] | [Threat Level Indicator]
- [Event title]: [Clear description incorporating contextual information from the "context" array]
- Context: [If context array has items, mention them here, e.g., "Delivery truck present on Front Driveway Cam (HH:MM AM/PM)"]
- Assessment: [Brief assessment incorporating context - if context explains the event, note it here]

[Repeat for each event in chronological order within the time block]

---

## Summary
[One sentence summarizing the period. If all events are normal/explained: "Routine activity observed." If review needed: "Some activity requires review but no security concerns." If security concerns: "Security concerns requiring immediate attention."]

Guidelines:
- List ALL events in chronological order, grouped by time blocks
- Threat level indicators: ✓ Normal, ⚠️ Needs review, 🔴 Security concern
- Integrate contextual information naturally - use the "context" array to enrich each event's description
- If context explains the event (e.g., delivery truck explains person at door), describe it accordingly (e.g., "delivery person" not "unidentified person")
- Be concise but informative - focus on what happened and what it means
- If contextual information makes an event clearly normal, reflect that in your assessment
- Only create time blocks that have events - don't create empty sections
"""

        timeline_summary_prompt += "\n\nEvents:\n"
        for event in events:
            timeline_summary_prompt += f"\n{event}\n"

        if preferred_language:
            timeline_summary_prompt += f"\nProvide your answer in {preferred_language}"

        if debug_save:
            with open(
                os.path.join(
                    CLIPS_DIR, "genai-requests", f"{start_ts}-{end_ts}", "prompt.txt"
                ),
                "w",
            ) as f:
                f.write(timeline_summary_prompt)

        response = self._send(timeline_summary_prompt, [])

        if debug_save and response:
            with open(
                os.path.join(
                    CLIPS_DIR, "genai-requests", f"{start_ts}-{end_ts}", "response.txt"
                ),
                "w",
            ) as f:
                f.write(response)

        return response

    def generate_object_description(
        self,
        camera_config: CameraConfig,
        thumbnails: list[bytes],
        event: Event,
    ) -> Optional[str]:
        """Generate a description for the frame.

        The prompt template is looked up in
        ``camera_config.objects.genai.object_prompts`` by the event's label,
        falling back to ``camera_config.objects.genai.prompt``. It is then
        filled in with the event's fields via ``str.format``.

        Args:
            camera_config: Camera configuration holding the prompt templates.
            thumbnails: Images forwarded to the provider with the prompt.
            event: Event whose fields are substituted into the template.

        Returns:
            The result of ``self._send``, or ``None`` when the template
            cannot be formatted.
        """
        genai_settings = camera_config.objects.genai
        template = genai_settings.object_prompts.get(
            str(event.label),
            genai_settings.prompt,
        )
        event_fields = model_to_dict(event)

        try:
            prompt = template.format(**event_fields)
        except (AttributeError, IndexError, KeyError, ValueError) as e:
            # The template is user-configured, and str.format can fail in more
            # ways than an unknown field name (KeyError): positional
            # placeholders such as "{}" raise IndexError, unbalanced braces
            # raise ValueError, and "{field.attr}" lookups raise AttributeError.
            logger.error(
                "Invalid GenAI prompt template (%s): %s", type(e).__name__, e
            )
            return None

        logger.debug(f"Sending images to genai provider with prompt: {prompt}")
        return self._send(prompt, thumbnails)

    def _init_provider(self) -> Any:
        """Initialize the client."""
        return None

    def _send(
        self,
        prompt: str,
        images: list[bytes],
        response_format: Optional[dict] = None,
    ) -> Optional[str]:
        """Submit a request to the provider."""
        return None

    @property
    def supports_vision(self) -> bool:
        """Whether the model supports vision/image input.

        Defaults to True for cloud providers. Providers that can detect
        capability at runtime (e.g. llama.cpp) should override this.
        """
        return True

    def list_models(self) -> list[str]:
        """Return the list of model names available from this provider.

        Providers should override this to query their backend.
        """
        return []

    def get_context_size(self) -> int:
        """Get the context window size for this provider in tokens."""
        return 4096

    def estimate_image_tokens(self, width: int, height: int) -> float:
        """Estimate prompt tokens consumed by a single image of the given dimensions.

        Default heuristic: ~1 token per 1250 pixels. Providers that can measure or
        know their model's exact image-token cost should override.
        """
        return (width * height) / 1250

    def embed(
        self,
        texts: list[str] | None = None,
        images: list[bytes] | None = None,
    ) -> list[np.ndarray]:
        """Produce embeddings for the given texts and/or images.

        The result is a list of numpy arrays, one per input. The expected
        dimension is 768 for Frigate semantic search compatibility.

        This base version cannot embed anything: it logs a warning naming the
        concrete class and yields an empty list. Providers that support
        embeddings should override it.
        """
        provider_name = self.__class__.__name__
        logger.warning(
            "%s does not support embeddings. "
            "This method should be overridden by the provider implementation.",
            provider_name,
        )
        no_embeddings: list[np.ndarray] = []
        return no_embeddings

    def chat_with_tools(
        self,
        messages: list[dict[str, Any]],
        tools: Optional[list[dict[str, Any]]] = None,
        tool_choice: Optional[str] = "auto",
    ) -> dict[str, Any]:
        """
        Send chat messages to LLM with optional tool definitions.

        This method handles conversation-style interactions with the LLM,
        including function calling/tool usage capabilities.

        The base implementation does not contact any model: it logs a warning
        naming the concrete class and returns an error result (see Returns).
        Each provider should override it.

        Args:
            messages: List of message dictionaries. Each message should have:
                - 'role': str - One of 'user', 'assistant', 'system', or 'tool'
                - 'content': str - The message content
                - 'tool_call_id': Optional[str] - For tool responses, the ID of the tool call
                - 'name': Optional[str] - For tool messages, the tool name
            tools: Optional list of tool definitions in OpenAI-compatible format.
                   Each tool should have 'type': 'function' and 'function' with:
                   - 'name': str - Tool name
                   - 'description': str - Tool description
                   - 'parameters': dict - JSON schema for parameters
            tool_choice: How the model should handle tools:
                - 'auto': Model decides whether to call tools
                - 'none': Model must not call tools
                - 'required': Model must call at least one tool
                - Or a dict specifying a specific tool to call (note that the
                  annotation on this base signature only declares ``str``)

        Returns:
            Dictionary with:
            - 'content': Optional[str] - The text response from the LLM, None if tool calls
            - 'tool_calls': Optional[List[Dict]] - List of tool calls if LLM wants to call tools.
              Each tool call dict has:
                - 'id': str - Unique identifier for this tool call
                - 'name': str - Tool name to call
                - 'arguments': dict - Arguments for the tool call (parsed JSON)
            - 'finish_reason': str - Reason generation stopped:
                - 'stop': Normal completion
                - 'tool_calls': LLM wants to call tools
                - 'length': Hit token limit
                - 'error': An error occurred

            The base implementation always returns 'content' and 'tool_calls'
            set to None with 'finish_reason' set to 'error'; it does not raise.
        """
        # Base implementation - each provider should override this.
        # Lazy %-style arguments match the logging style used by embed().
        logger.warning(
            "%s does not support chat_with_tools. "
            "This method should be overridden by the provider implementation.",
            self.__class__.__name__,
        )
        return {
            "content": None,
            "tool_calls": None,
            "finish_reason": "error",
        }


def load_providers() -> None:
    """Import every module file that sits next to this one.

    Each ``*.py`` entry in this package's directory, other than
    ``__init__.py``, is imported as ``frigate.genai.<name>``. Presumably this
    is what triggers the ``register_genai_provider`` decorators in those
    modules; confirm against the provider modules.
    """
    here = os.path.dirname(__file__)
    module_files = (
        entry
        for entry in os.listdir(here)
        if entry.endswith(".py") and entry != "__init__.py"
    )
    for entry in module_files:
        # Drop the trailing ".py" to get the module's name.
        importlib.import_module("frigate.genai." + entry[:-3])
-												Semantic Search for Detections (#11899)

* Initial re-implementation of semantic search

* put docker-compose back and make reindex match docs

* remove debug code and fix import

* fix docs

* manually build pysqlite3 as binaries are only available for x86-64

* update comment in build_pysqlite3.sh

* only embed objects

* better error handling when genai fails

* ask ollama to pull requested model at startup

* update ollama docs

* address some PR review comments

* fix lint

* use IPC to write description, update docs for reindex

* remove gemini-pro-vision from docs as it will be unavailable soon

* fix OpenAI doc available models

* fix api error in gemini and metadata for embeddings

											
										
										
											2024-06-22 00:30:19 +03:00
+								"""Generative AI module for Frigate."""
-												Genai review summaries (#19473)

* Generate review item summaries with requests

* Adjust logic to only send important items

* Don't mention ladder

* Adjust prompt to be more specific

* Add more relaxed nature for normal activity

* Cleanup summary

* Update ollama client

* Add more directions to analyze the frames in order

* Remove environment from prompt
											
										
										
											2025-08-13 01:27:35 +03:00
+								import datetime
-												Semantic Search for Detections (#11899)

* Initial re-implementation of semantic search

* put docker-compose back and make reindex match docs

* remove debug code and fix import

* fix docs

* manually build pysqlite3 as binaries are only available for x86-64

* update comment in build_pysqlite3.sh

* only embed objects

* better error handling when genai fails

* ask ollama to pull requested model at startup

* update ollama docs

* address some PR review comments

* fix lint

* use IPC to write description, update docs for reindex

* remove gemini-pro-vision from docs as it will be unavailable soon

* fix OpenAI doc available models

* fix api error in gemini and metadata for embeddings

											
										
										
											2024-06-22 00:30:19 +03:00
+								import importlib
-												Miscellaneous fixes (#23009)

* Reduce max frames per second to 1

* Use pydantic but don't fail if some constraints are not met.

* Adjust limits

* Adjust limits

* Cleanup

* add unsaved changes icon/popover to individual settings section

* allow changing camera friendly_name from camera management pane

---------

Co-authored-by: Josh Hawkins <32435876+hawkeye217@users.noreply.github.com>
											
										
										
											2026-04-27 01:09:35 +03:00
+								import json
-												Update ollama docs and add genai debug logging (#15012)


											
										
										
											2024-11-16 00:24:17 +03:00
+								import logging
-												Semantic Search for Detections (#11899)

* Initial re-implementation of semantic search

* put docker-compose back and make reindex match docs

* remove debug code and fix import

* fix docs

* manually build pysqlite3 as binaries are only available for x86-64

* update comment in build_pysqlite3.sh

* only embed objects

* better error handling when genai fails

* ask ollama to pull requested model at startup

* update ollama docs

* address some PR review comments

* fix lint

* use IPC to write description, update docs for reindex

* remove gemini-pro-vision from docs as it will be unavailable soon

* fix OpenAI doc available models

* fix api error in gemini and metadata for embeddings

											
										
										
											2024-06-22 00:30:19 +03:00
+								import os
-												Review Item GenAI metadata (#19442)

* Rename existing function

* Keep track of thumbnail updates

* Tinkering with genai prompt

* Adjust input format

* Create model for review description output

* testing prompt changes

* Prompt improvements and image saving

* Add config for review items genai

* Use genai review config

* Actual config usage

* Adjust debug image saving

* Fix

* Fix review creation

* Adjust prompt

* Prompt adjustment

* Run genai in thread

* Fix detections block

* Adjust prompt

* Prompt changes

* Save genai response to metadata model

* Handle metadata

* Send review update to dispatcher

* Save review metadata to DB

* Send review notification updates

* Quick fix

* Fix name

* Fix update type

* Correctly dump model

* Add card

* Add card

* Remove message

* Cleanup typing and UI

* Adjust prompt

* Formatting

* Add log

* Formatting

* Add inference speed and keep alive
											
										
										
											2025-08-10 14:57:54 +03:00
+								import re
-												Increase mypy coverage and fixes (#22632)
											
										
										
											2026-03-25 18:28:48 +03:00
+								from typing import Any, Callable, Optional
-												Semantic Search for Detections (#11899)

* Initial re-implementation of semantic search

* put docker-compose back and make reindex match docs

* remove debug code and fix import

* fix docs

* manually build pysqlite3 as binaries are only available for x86-64

* update comment in build_pysqlite3.sh

* only embed objects

* better error handling when genai fails

* ask ollama to pull requested model at startup

* update ollama docs

* address some PR review comments

* fix lint

* use IPC to write description, update docs for reindex

* remove gemini-pro-vision from docs as it will be unavailable soon

* fix OpenAI doc available models

* fix api error in gemini and metadata for embeddings

											
										
										
											2024-06-22 00:30:19 +03:00
-												Support using GenAI for embeddings / semantic search (#22323)

* Support GenAI for embeddings

* Add embed API support

* Add support for embedding via genai

* Basic docs

* undo

* Fix sending images

* Don't require download check

* Set model

* Handle emb correctly

* Clarification

* Cleanup

* Cleanup
											
										
										
											2026-03-08 18:55:00 +03:00
+								import numpy as np
-												Fix genai labels (#14330)

* Publish model state and embeddings reindex in dispatcher onConnect

* remove unneeded from explore

* add embeddings reindex progress to statusbar

* don't allow right click or show similar button if semantic search is disabled

* fix status bar

* Convert peewee model to dict before formatting for genai description

* add embeddings reindex progress to statusbar

* fix status bar

* Convert peewee model to dict before formatting for genai description
											
										
										
											2024-10-14 15:23:10 +03:00
+								from playhouse.shortcuts import model_to_dict
-												Miscellaneous fixes (#23009)

* Reduce max frames per second to 1

* Use pydantic but don't fail if some constraints are not met.

* Adjust limits

* Adjust limits

* Cleanup

* add unsaved changes icon/popover to individual settings section

* allow changing camera friendly_name from camera management pane

---------

Co-authored-by: Josh Hawkins <32435876+hawkeye217@users.noreply.github.com>
											
										
										
											2026-04-27 01:09:35 +03:00
+								from pydantic import ValidationError
-												Fix genai labels (#14330)

* Publish model state and embeddings reindex in dispatcher onConnect

* remove unneeded from explore

* add embeddings reindex progress to statusbar

* don't allow right click or show similar button if semantic search is disabled

* fix status bar

* Convert peewee model to dict before formatting for genai description

* add embeddings reindex progress to statusbar

* fix status bar

* Convert peewee model to dict before formatting for genai description
											
										
										
											2024-10-14 15:23:10 +03:00
-												Add support for multiple GenAI Providers (#22144)

* GenAI client manager

* Add config migration

* Convert to roles list

* Support getting client via manager

* Cleanup

* Fix import issues

* Set model in llama.cpp config

* Cleanup

* Use config update

* Cleanup

* Add new title and desc
											
										
										
											2026-02-27 18:35:33 +03:00
+								from frigate.config import CameraConfig, GenAIConfig, GenAIProviderEnum
-												Genai review summaries (#19473)

* Generate review item summaries with requests

* Adjust logic to only send important items

* Don't mention ladder

* Adjust prompt to be more specific

* Add more relaxed nature for normal activity

* Cleanup summary

* Update ollama client

* Add more directions to analyze the frames in order

* Remove environment from prompt
											
										
										
											2025-08-13 01:27:35 +03:00
+								from frigate.const import CLIPS_DIR
-												Review Item GenAI metadata (#19442)

* Rename existing function

* Keep track of thumbnail updates

* Tinkering with genai prompt

* Adjust input format

* Create model for review description output

* testing prompt changes

* Prompt improvements and image saving

* Add config for review items genai

* Use genai review config

* Actual config usage

* Adjust debug image saving

* Fix

* Fix review creation

* Adjust prompt

* Prompt adjustment

* Run genai in thread

* Fix detections block

* Adjust prompt

* Prompt changes

* Save genai response to metadata model

* Handle metadata

* Send review update to dispatcher

* Save review metadata to DB

* Send review notification updates

* Quick fix

* Fix name

* Fix update type

* Correctly dump model

* Add card

* Add card

* Remove message

* Cleanup typing and UI

* Adjust prompt

* Formatting

* Add log

* Formatting

* Add inference speed and keep alive
											
										
										
											2025-08-10 14:57:54 +03:00
+								from frigate.data_processing.post.types import ReviewMetadata
-												Add support for multiple GenAI Providers (#22144)

* GenAI client manager

* Add config migration

* Convert to roles list

* Support getting client via manager

* Cleanup

* Fix import issues

* Set model in llama.cpp config

* Cleanup

* Use config update

* Cleanup

* Add new title and desc
											
										
										
											2026-02-27 18:35:33 +03:00
+								from frigate.genai.manager import GenAIClientManager
-												Fix substitution on genai prompts (#14298)


											
										
										
											2024-10-12 15:19:24 +03:00
+								from frigate.models import Event
-												Semantic Search for Detections (#11899)

* Initial re-implementation of semantic search

* put docker-compose back and make reindex match docs

* remove debug code and fix import

* fix docs

* manually build pysqlite3 as binaries are only available for x86-64

* update comment in build_pysqlite3.sh

* only embed objects

* better error handling when genai fails

* ask ollama to pull requested model at startup

* update ollama docs

* address some PR review comments

* fix lint

* use IPC to write description, update docs for reindex

* remove gemini-pro-vision from docs as it will be unavailable soon

* fix OpenAI doc available models

* fix api error in gemini and metadata for embeddings

											
										
										
											2024-06-22 00:30:19 +03:00
-												Update ollama docs and add genai debug logging (#15012)


											
										
										
											2024-11-16 00:24:17 +03:00
+								logger = logging.getLogger(__name__)
-												Add support for multiple GenAI Providers (#22144)

* GenAI client manager

* Add config migration

* Convert to roles list

* Support getting client via manager

* Cleanup

* Fix import issues

* Set model in llama.cpp config

* Cleanup

* Use config update

* Cleanup

* Add new title and desc
											
										
										
											2026-02-27 18:35:33 +03:00
+								__all__ = [
 								    "GenAIClient",
 								    "GenAIClientManager",
 								    "GenAIConfig",
 								    "GenAIProviderEnum",
 								    "PROVIDERS",
 								    "load_providers",
 								    "register_genai_provider",
 								]
-												Semantic Search for Detections (#11899)

* Initial re-implementation of semantic search

* put docker-compose back and make reindex match docs

* remove debug code and fix import

* fix docs

* manually build pysqlite3 as binaries are only available for x86-64

* update comment in build_pysqlite3.sh

* only embed objects

* better error handling when genai fails

* ask ollama to pull requested model at startup

* update ollama docs

* address some PR review comments

* fix lint

* use IPC to write description, update docs for reindex

* remove gemini-pro-vision from docs as it will be unavailable soon

* fix OpenAI doc available models

* fix api error in gemini and metadata for embeddings

											
										
										
											2024-06-22 00:30:19 +03:00
+								PROVIDERS = {}
-												Increase mypy coverage and fixes (#22632)
											
										
										
											2026-03-25 18:28:48 +03:00
+								def register_genai_provider(key: GenAIProviderEnum) -> Callable:
-												Semantic Search for Detections (#11899)

* Initial re-implementation of semantic search

* put docker-compose back and make reindex match docs

* remove debug code and fix import

* fix docs

* manually build pysqlite3 as binaries are only available for x86-64

* update comment in build_pysqlite3.sh

* only embed objects

* better error handling when genai fails

* ask ollama to pull requested model at startup

* update ollama docs

* address some PR review comments

* fix lint

* use IPC to write description, update docs for reindex

* remove gemini-pro-vision from docs as it will be unavailable soon

* fix OpenAI doc available models

* fix api error in gemini and metadata for embeddings

											
										
										
											2024-06-22 00:30:19 +03:00
+								    """Register a GenAI provider."""
-												Increase mypy coverage and fixes (#22632)
											
										
										
											2026-03-25 18:28:48 +03:00
+								    def decorator(cls: type) -> type:
-												Semantic Search for Detections (#11899)

* Initial re-implementation of semantic search

* put docker-compose back and make reindex match docs

* remove debug code and fix import

* fix docs

* manually build pysqlite3 as binaries are only available for x86-64

* update comment in build_pysqlite3.sh

* only embed objects

* better error handling when genai fails

* ask ollama to pull requested model at startup

* update ollama docs

* address some PR review comments

* fix lint

* use IPC to write description, update docs for reindex

* remove gemini-pro-vision from docs as it will be unavailable soon

* fix OpenAI doc available models

* fix api error in gemini and metadata for embeddings

											
										
										
											2024-06-22 00:30:19 +03:00
+								        PROVIDERS[key] = cls
 								        return cls
 								    return decorator
 								class GenAIClient:
 								    """Generative AI client for Frigate."""
-												Refactor object genai to be a post-processor (#20331)

* Refactor object genai to be a post-processor

* Include function correctly
											
										
										
											2025-10-02 21:48:11 +03:00
+								    def __init__(self, genai_config: GenAIConfig, timeout: int = 120) -> None:
-												Semantic Search for Detections (#11899)

* Initial re-implementation of semantic search

* put docker-compose back and make reindex match docs

* remove debug code and fix import

* fix docs

* manually build pysqlite3 as binaries are only available for x86-64

* update comment in build_pysqlite3.sh

* only embed objects

* better error handling when genai fails

* ask ollama to pull requested model at startup

* update ollama docs

* address some PR review comments

* fix lint

* use IPC to write description, update docs for reindex

* remove gemini-pro-vision from docs as it will be unavailable soon

* fix OpenAI doc available models

* fix api error in gemini and metadata for embeddings

											
										
										
											2024-06-22 00:30:19 +03:00
+								        self.genai_config: GenAIConfig = genai_config
 								        self.timeout = timeout
 								        self.provider = self._init_provider()
-												Review Item GenAI metadata (#19442)

* Rename existing function

* Keep track of thumbnail updates

* Tinkering with genai prompt

* Adjust input format

* Create model for review description output

* testing prompt changes

* Prompt improvements and image saving

* Add config for review items genai

* Use genai review config

* Actual config usage

* Adjust debug image saving

* Fix

* Fix review creation

* Adjust prompt

* Prompt adjustment

* Run genai in thread

* Fix detections block

* Adjust prompt

* Prompt changes

* Save genai response to metadata model

* Handle metadata

* Send review update to dispatcher

* Save review metadata to DB

* Send review notification updates

* Quick fix

* Fix name

* Fix update type

* Correctly dump model

* Add card

* Add card

* Remove message

* Cleanup typing and UI

* Adjust prompt

* Formatting

* Add log

* Formatting

* Add inference speed and keep alive
											
										
										
											2025-08-10 14:57:54 +03:00
+								    def generate_review_description(
-												Add config for users to define additional concerns that GenAI should make note of in review summary (#19463)

* Don't default to openai

* Improve UI

* Allow configuring additional concerns that users may want the AI to note

* Formatting

* Add preferred language config

* Remove unused
											
										
										
											2025-08-11 22:17:25 +03:00
+								        self,
 								        review_data: dict[str, Any],
 								        thumbnails: list[bytes],
 								        concerns: list[str],
 								        preferred_language: str | None,
-												Genai review summaries (#19473)

* Generate review item summaries with requests

* Adjust logic to only send important items

* Don't mention ladder

* Adjust prompt to be more specific

* Add more relaxed nature for normal activity

* Cleanup summary

* Update ollama client

* Add more directions to analyze the frames in order

* Remove environment from prompt
											
										
										
											2025-08-13 01:27:35 +03:00
+								        debug_save: bool,
-												Customizable GenAI Review prompt (#20296)

* Add customizable prompt

* Update docs
											
										
										
											2025-10-01 02:07:16 +03:00
+								        activity_context_prompt: str,
-												Review Item GenAI metadata (#19442)

* Rename existing function

* Keep track of thumbnail updates

* Tinkering with genai prompt

* Adjust input format

* Create model for review description output

* testing prompt changes

* Prompt improvements and image saving

* Add config for review items genai

* Use genai review config

* Actual config usage

* Adjust debug image saving

* Fix

* Fix review creation

* Adjust prompt

* Prompt adjustment

* Run genai in thread

* Fix detections block

* Adjust prompt

* Prompt changes

* Save genai response to metadata model

* Handle metadata

* Send review update to dispatcher

* Save review metadata to DB

* Send review notification updates

* Quick fix

* Fix name

* Fix update type

* Correctly dump model

* Add card

* Add card

* Remove message

* Cleanup typing and UI

* Adjust prompt

* Formatting

* Add log

* Formatting

* Add inference speed and keep alive
											
										
										
											2025-08-10 14:57:54 +03:00
+								    ) -> ReviewMetadata | None:
 								        """Generate a description for the review item activity."""
-												Add config for users to define additional concerns that GenAI should make note of in review summary (#19463)

* Don't default to openai

* Improve UI

* Allow configuring additional concerns that users may want the AI to note

* Formatting

* Add preferred language config

* Remove unused
											
										
										
											2025-08-11 22:17:25 +03:00
-												Add ability to pass additional args to Ollama (#19484)

* Call out recognized objects more specifically

* Cleanup

* Make keep_alive and options configurable

* Generalize

* Use for other providers
											
										
										
											2025-08-13 18:28:01 +03:00
+								        def get_concern_prompt() -> str:
 								            if concerns:
 								                concern_list = "\n    - ".join(concerns)
-												Miscellaneous Fixes (#20866)

* Don't warn when event ids have expired for trigger sync

* Import faster_whisper conditionally to avoid illegal instruction

* Catch OpenVINO runtime error

* fix race condition in detail stream context

navigating between tracked objects in Explore would sometimes prevent the object track from appearing

* Handle case where classification images are deleted

* Adjust default rounded corners on larger screens

* Improve flow handling for classification state

* Remove images when wizard is cancelled

* Improve deletion handling for classes

* Set constraints on review buffers

* Update to support correct data format

* Set minimum duration for recording based review items

* Use friendly name in review genai prompt

---------

Co-authored-by: Nicolas Mowen <nickmowen213@gmail.com>
											
										
										
											2025-11-10 20:03:56 +03:00
+								                return f"""- `other_concerns` (list of strings): Include a list of any of the following concerns that are occurring:
-												Add ability to pass additional args to Ollama (#19484)

* Call out recognized objects more specifically

* Cleanup

* Make keep_alive and options configurable

* Generalize

* Use for other providers
											
										
										
											2025-08-13 18:28:01 +03:00
+								    - {concern_list}"""
 								            else:
 								                return ""
-												Add config for users to define additional concerns that GenAI should make note of in review summary (#19463)

* Don't default to openai

* Improve UI

* Allow configuring additional concerns that users may want the AI to note

* Formatting

* Add preferred language config

* Remove unused
											
										
										
											2025-08-11 22:17:25 +03:00
-												Add ability to pass additional args to Ollama (#19484)

* Call out recognized objects more specifically

* Cleanup

* Make keep_alive and options configurable

* Generalize

* Use for other providers
											
										
										
											2025-08-13 18:28:01 +03:00
+								        def get_language_prompt() -> str:
 								            if preferred_language:
 								                return f"Provide your answer in {preferred_language}"
 								            else:
 								                return ""
-												Add config for users to define additional concerns that GenAI should make note of in review summary (#19463)

* Don't default to openai

* Improve UI

* Allow configuring additional concerns that users may want the AI to note

* Formatting

* Add preferred language config

* Remove unused
											
										
										
											2025-08-11 22:17:25 +03:00
-												Unify list of objects under dedicated section (#20684)

* Unify list of objects under dedicated section

* Use helper function
											
										
										
											2025-10-27 00:37:57 +03:00
+								        def get_objects_list() -> str:
 								            if review_data["unified_objects"]:
 								                return "\n- " + "\n- ".join(review_data["unified_objects"])
-												Map verified objects to their sub label directly (#20413)

* Map verified objects to their sub label directly

* Simplify access

* Cleanup

* Add protection for mismatched object and index

* Keep track of verified objects separately
											
										
										
											2025-10-10 16:07:00 +03:00
+								            else:
-												Unify list of objects under dedicated section (#20684)

* Unify list of objects under dedicated section

* Use helper function
											
										
										
											2025-10-27 00:37:57 +03:00
+								                return "\n- (No objects detected)"
-												Map verified objects to their sub label directly (#20413)

* Map verified objects to their sub label directly

* Simplify access

* Cleanup

* Add protection for mismatched object and index

* Keep track of verified objects separately
											
										
										
											2025-10-10 16:07:00 +03:00
-												Review Item GenAI metadata (#19442)

* Rename existing function

* Keep track of thumbnail updates

* Tinkering with genai prompt

* Adjust input format

* Create model for review description output

* testing prompt changes

* Prompt improvements and image saving

* Add config for review items genai

* Use genai review config

* Actual config usage

* Adjust debug image saving

* Fix

* Fix review creation

* Adjust prompt

* Prompt adjustment

* Run genai in thread

* Fix detections block

* Adjust prompt

* Prompt changes

* Save genai response to metadata model

* Handle metadata

* Send review update to dispatcher

* Save review metadata to DB

* Send review notification updates

* Quick fix

* Fix name

* Fix update type

* Correctly dump model

* Add card

* Add card

* Remove message

* Cleanup typing and UI

* Adjust prompt

* Formatting

* Add log

* Formatting

* Add inference speed and keep alive
											
										
										
											2025-08-10 14:57:54 +03:00
+								        context_prompt = f"""
-												Add live context tool to LLM (#21754)

* Add live context tool

* Improve handling of images in request

* Improve prompt caching
											
										
										
											2026-01-22 22:04:40 +03:00
+								Your task is to analyze a sequence of images taken in chronological order from a security camera.
-												Add config for users to define additional concerns that GenAI should make note of in review summary (#19463)

* Don't default to openai

* Improve UI

* Allow configuring additional concerns that users may want the AI to note

* Formatting

* Add preferred language config

* Remove unused
											
										
										
											2025-08-11 22:17:25 +03:00
-												Various fixes (#20666)

* Remove nvidia pyindex

* Improve prompt
											
										
										
											2025-10-26 00:40:04 +03:00
+								## Normal Activity Patterns for This Property
-												Unify list of objects under dedicated section (#20684)

* Unify list of objects under dedicated section

* Use helper function
											
										
										
											2025-10-27 00:37:57 +03:00
-												Improve review summary performance (#20328)

* Undo vite

* Balance the prompt

* Round duration

* Calculate context size to determine number of images

* Increase number of images
											
										
										
											2025-10-02 18:17:25 +03:00
+								{activity_context_prompt}
-												Various fixes (#20666)

* Remove nvidia pyindex

* Improve prompt
											
										
										
											2025-10-26 00:40:04 +03:00
+								## Task Instructions
-												Refactor Review GenAI Prompt (#22353)

* Improve title to better capture activity

* Improve efficiency of prompt

* Use json format for llama.cpp

* Cleanup prompt

* Add output format for other LLMs
											
										
										
											2026-03-10 03:47:37 +03:00
+								Describe the scene based on observable actions and movements, evaluate the activity against the Activity Indicators above, and assign a potential_threat_level (0, 1, or 2) by applying the threat level indicators consistently.
-												Add config for users to define additional concerns that GenAI should make note of in review summary (#19463)

* Don't default to openai

* Improve UI

* Allow configuring additional concerns that users may want the AI to note

* Formatting

* Add preferred language config

* Remove unused
											
										
										
											2025-08-11 22:17:25 +03:00
-												Various fixes (#20666)

* Remove nvidia pyindex

* Improve prompt
											
										
										
											2025-10-26 00:40:04 +03:00
+								## Analysis Guidelines
-												Genai review summaries (#19473)

* Generate review item summaries with requests

* Adjust logic to only send important items

* Don't mention ladder

* Adjust prompt to be more specific

* Add more relaxed nature for normal activity

* Cleanup summary

* Update ollama client

* Add more directions to analyze the frames in order

* Remove environment from prompt
											
										
										
											2025-08-13 01:27:35 +03:00
+								When forming your description:
-												Unify list of objects under dedicated section (#20684)

* Unify list of objects under dedicated section

* Use helper function
											
										
										
											2025-10-27 00:37:57 +03:00
+								- **CRITICAL: Only describe objects explicitly listed in "Objects in Scene" below.** Do not infer or mention additional people, vehicles, or objects not present in this list, even if visual patterns suggest them. If only a car is listed, do not describe a person interacting with it unless "person" is also in the objects list.
-												Improve Review Summary Prompt (#20289)

* Improve prompt to have better discernment and logic based on detected objects

* Be more specific about the time of day

* Add re-inforcers for LLM to be accurate and not complete a narrative
											
										
										
											2025-09-30 15:52:38 +03:00
+								- **Only describe actions actually visible in the frames.** Do not assume or infer actions that you don't observe happening. If someone walks toward furniture but you never see them sit, do not say they sat. Stick to what you can see across the sequence.
 								- Describe what you observe: actions, movements, interactions with objects and the environment. Include any observable environmental changes (e.g., lighting changes triggered by activity).
 								- Note visible details such as clothing, items being carried or placed, tools or equipment present, and how they interact with the property or objects.
-												Customizable GenAI Review prompt (#20296)

* Add customizable prompt

* Update docs
											
										
										
											2025-10-01 02:07:16 +03:00
+								- Consider the full sequence chronologically: what happens from start to finish, how duration and actions relate to the location and objects involved.
 								- **Use the actual timestamp provided in "Activity started at"** below for time of day context—do not infer time from image brightness or darkness. Unusual hours (late night/early morning) should increase suspicion when the observable behavior itself appears questionable. However, recognize that some legitimate activities can occur at any hour.
-												Review description updates (#20723)

* Update docs for review descriptions

* Add logging for context tokens used

* Increase number of images due to lower than expected context usage

* Re-balance the suspicious activity checks

* Adjustments to context sizing

* optimize context usage

* Adjust context usage

* Make title more direct

* Update docs
											
										
										
											2025-10-30 17:52:55 +03:00
+								- **Consider duration as a primary factor**: Apply the duration thresholds defined in the activity patterns above. Brief sequences during normal hours with apparent purpose typically indicate normal activity unless explicit suspicious actions are visible.
 								- **Weigh all evidence holistically**: Match the activity against the normal and suspicious patterns defined above, then evaluate based on the complete context (zone, objects, time, actions, duration). Apply the threat level indicators consistently. Use your judgment for edge cases.
-												Customizable GenAI Review prompt (#20296)

* Add customizable prompt

* Update docs
											
										
										
											2025-10-01 02:07:16 +03:00
-												Refactor Review GenAI Prompt (#22353)

* Improve title to better capture activity

* Improve efficiency of prompt

* Use json format for llama.cpp

* Cleanup prompt

* Add output format for other LLMs
											
										
										
											2026-03-10 03:47:37 +03:00
+								## Response Field Guidelines
-												Various fixes (#20666)

* Remove nvidia pyindex

* Improve prompt
											
										
										
											2025-10-26 00:40:04 +03:00
-												Refactor Review GenAI Prompt (#22353)

* Improve title to better capture activity

* Improve efficiency of prompt

* Use json format for llama.cpp

* Cleanup prompt

* Add output format for other LLMs
											
										
										
											2026-03-10 03:47:37 +03:00
+								Respond with a JSON object matching the provided schema. Field-specific guidance:
-												Miscellaneous fixes (#22780)

* fix mobile export crash by removing stale iOS non-modal drawer workaround

* Remove titlecase to avoid Gemma4 handling plain labels as proper nouns

* Improve titling:

* Make directions more clear

* Properly capitalize delivery services

* update dispatcher config reference on save

* subscribe to review topic so ReviewDescriptionProcessor knows genai is enabled

* auto-send ON genai review WS message when enabled_in_config transitions to true

* remove unused object level

* update docs to clarify pre/post capture settings

* add ui docs links

* improve known_plates field in settings UI

* only show save all when multiple sections are changed

or if the section being changed is not currently being viewed

* fix docs

---------

Co-authored-by: Nicolas Mowen <nickmowen213@gmail.com>
											
										
										
											2026-04-07 16:16:19 +03:00
+								- `scene`: Describe how the sequence begins, then the progression of events — all significant movements and actions in order. For example, if a vehicle arrives and then a person exits, describe both sequentially. For named subjects (those with a `←` separator in "Objects in Scene"), always use their name — do not replace them with generic terms. For unnamed objects (e.g., "person", "car"), refer to them naturally with articles (e.g., "a person", "the car"). Your description should align with and support the threat level you assign.
 								- `title`: Characterize **what took place and where** — interpret the overall purpose or outcome, do not simply compress the scene description into fewer words. Include the relevant location (zone, area, or entry point). For named subjects, always use their name. For unnamed objects, refer to them naturally with articles. No editorial qualifiers like "routine" or "suspicious."
-												Refactor Review GenAI Prompt (#22353)

* Improve title to better capture activity

* Improve efficiency of prompt

* Use json format for llama.cpp

* Cleanup prompt

* Add output format for other LLMs
											
										
										
											2026-03-10 03:47:37 +03:00
+								- `potential_threat_level`: Must be consistent with your scene description and the activity patterns above.
-												Add ability to pass additional args to Ollama (#19484)

* Call out recognized objects more specifically

* Cleanup

* Make keep_alive and options configurable

* Generalize

* Use for other providers
											
										
										
											2025-08-13 18:28:01 +03:00
+								{get_concern_prompt()}
-												Add config for users to define additional concerns that GenAI should make note of in review summary (#19463)

* Don't default to openai

* Improve UI

* Allow configuring additional concerns that users may want the AI to note

* Formatting

* Add preferred language config

* Remove unused
											
										
										
											2025-08-11 22:17:25 +03:00
-												Various fixes (#20666)

* Remove nvidia pyindex

* Improve prompt
											
										
										
											2025-10-26 00:40:04 +03:00
+								## Sequence Details
-												Add live context tool to LLM (#21754)

* Add live context tool

* Improve handling of images in request

* Improve prompt caching
											
										
										
											2026-01-22 22:04:40 +03:00
+								- Camera: {review_data["camera"]}
 								- Total frames: {len(thumbnails)} (Frame 1 = earliest, Frame {len(thumbnails)} = latest)
-												Improve natural language of prompt (#19515)

* Make sequence details human-readable so they are used in natural language response

* Cleanup

* Improve prompt and image selection

* Adjust

* Adjust slightly

* Format time

* Adjust frame selection logic

* Debug save response

* Ignore extra fields

* Adjust docs
											
										
										
											2025-08-15 16:25:49 +03:00
+								- Activity started at {review_data["start"]} and lasted {review_data["duration"]} seconds
-												Miscellaneous Fixes (#20866)

* Don't warn when event ids have expired for trigger sync

* Import faster_whisper conditionally to avoid illegal instruction

* Catch OpenVINO runtime error

* fix race condition in detail stream context

navigating between tracked objects in Explore would sometimes prevent the object track from appearing

* Handle case where classification images are deleted

* Adjust default rounded corners on larger screens

* Improve flow handling for classification state

* Remove images when wizard is cancelled

* Improve deletion handling for classes

* Set constraints on review buffers

* Update to support correct data format

* Set minimum duration for recording based review items

* Use friendly name in review genai prompt

---------

Co-authored-by: Nicolas Mowen <nickmowen213@gmail.com>
											
										
										
											2025-11-10 20:03:56 +03:00
+								- Zones involved: {", ".join(review_data["zones"]) if review_data["zones"] else "None"}
-												Genai review summaries (#19473)

* Generate review item summaries with requests

* Adjust logic to only send important items

* Don't mention ladder

* Adjust prompt to be more specific

* Add more relaxed nature for normal activity

* Cleanup summary

* Update ollama client

* Add more directions to analyze the frames in order

* Remove environment from prompt
											
										
										
											2025-08-13 01:27:35 +03:00
-												Unify list of objects under dedicated section (#20684)

* Unify list of objects under dedicated section

* Use helper function
											
										
										
											2025-10-27 00:37:57 +03:00
+								## Objects in Scene
-												Review Summary Optimizations (#22533)

* Use different association method

* Clarify

* Remove extra details from ollama schema

* Fix Gemini Chat

* Fix incorrect instructions

* Improve name handling

* Change order of information for llama.cpp

* Simplify prompt

* Fix formatting
											
										
										
											2026-03-19 19:39:24 +03:00
+								Each line represents a detection state, not necessarily unique individuals. The `←` symbol separates a recognized subject's name from their object type — use only the name (before the `←`) in your response, not the type after it. The same subject may appear across multiple lines if detected multiple times.
-												Review prompt adjustments (#20704)

* Make prompt more fair and reduce time extension

* Adjust naming of unrecognized objects

* Improve object naming behavior

* Add more context image levels
											
										
										
											2025-10-28 16:28:36 +03:00
-												Various Tweaks (#20713)

* Adjust for commutes

* Tweaks

* Don't show no models view in grid

* Add text-md to inputs

* Adjust train title for mobile

* Cleanup prompt more

* Use i18n functions for tooltip

* Fix model complexity causing crash

* Cleanup
											
										
										
											2025-10-29 17:40:50 +03:00
+								**Note: Unidentified objects (without names) are NOT indicators of suspicious activity—they simply mean the system hasn't identified that object.**
-												Unify list of objects under dedicated section (#20684)

* Unify list of objects under dedicated section

* Use helper function
											
										
										
											2025-10-27 00:37:57 +03:00
+								{get_objects_list()}
-												Various fixes (#20666)

* Remove nvidia pyindex

* Improve prompt
											
										
										
											2025-10-26 00:40:04 +03:00
-												Add ability to pass additional args to Ollama (#19484)

* Call out recognized objects more specifically

* Cleanup

* Make keep_alive and options configurable

* Generalize

* Use for other providers
											
										
										
											2025-08-13 18:28:01 +03:00
+								{get_language_prompt()}
-												Improve review summary (#20216)

* Add debug logging for review summaries report

* Improve debug logging

* Improve review report prompt

* Cleanup

* Add date to report
											
										
										
											2025-09-26 05:05:22 +03:00
+								"""
-												Use preview frames for Review Descriptions (#19450)

* Use preview frames for genai

* Cleanup

* Adjust
											
										
										
											2025-08-10 19:24:08 +03:00
+								        logger.debug(
 								            f"Sending {len(thumbnails)} images to create review description on {review_data['camera']}"
 								        )
-												Genai review summaries (#19473)

* Generate review item summaries with requests

* Adjust logic to only send important items

* Don't mention ladder

* Adjust prompt to be more specific

* Add more relaxed nature for normal activity

* Cleanup summary

* Update ollama client

* Add more directions to analyze the frames in order

* Remove environment from prompt
											
										
										
											2025-08-13 01:27:35 +03:00
 								        if debug_save:
 								            with open(
 								                os.path.join(
 								                    CLIPS_DIR, "genai-requests", review_data["id"], "prompt.txt"
 								                ),
 								                "w",
 								            ) as f:
 								                f.write(context_prompt)
-												Refactor Review GenAI Prompt (#22353)

* Improve title to better capture activity

* Improve efficiency of prompt

* Use json format for llama.cpp

* Cleanup prompt

* Add output format for other LLMs
											
										
										
											2026-03-10 03:47:37 +03:00
+								        # Build JSON schema for structured output from ReviewMetadata model
 								        schema = ReviewMetadata.model_json_schema()
 								        schema.get("properties", {}).pop("time", None)
 								        if "time" in schema.get("required", []):
 								            schema["required"].remove("time")
 								        if not concerns:
 								            schema.get("properties", {}).pop("other_concerns", None)
 								            if "other_concerns" in schema.get("required", []):
 								                schema["required"].remove("other_concerns")
 								        response_format = {
 								            "type": "json_schema",
 								            "json_schema": {
 								                "name": "review_metadata",
 								                "strict": True,
 								                "schema": schema,
 								            },
 								        }
 								        response = self._send(context_prompt, thumbnails, response_format)
-												Review Item GenAI metadata (#19442)

* Rename existing function

* Keep track of thumbnail updates

* Tinkering with genai prompt

* Adjust input format

* Create model for review description output

* testing prompt changes

* Prompt improvements and image saving

* Add config for review items genai

* Use genai review config

* Actual config usage

* Adjust debug image saving

* Fix

* Fix review creation

* Adjust prompt

* Prompt adjustment

* Run genai in thread

* Fix detections block

* Adjust prompt

* Prompt changes

* Save genai response to metadata model

* Handle metadata

* Send review update to dispatcher

* Save review metadata to DB

* Send review notification updates

* Quick fix

* Fix name

* Fix update type

* Correctly dump model

* Add card

* Add card

* Remove message

* Cleanup typing and UI

* Adjust prompt

* Formatting

* Add log

* Formatting

* Add inference speed and keep alive
											
										
										
											2025-08-10 14:57:54 +03:00
-												Various Fixes (#19615)

* Don't write None response to file

* fix genai config migration

* Fix JP6 build

* Include base image ARG
											
										
										
											2025-08-19 15:49:55 +03:00
+								        if debug_save and response:
-												Improve natural language of prompt (#19515)

* Make sequence details human-readable so they are used in natural language response

* Cleanup

* Improve prompt and image selection

* Adjust

* Adjust slightly

* Format time

* Adjust frame selection logic

* Debug save response

* Ignore extra fields

* Adjust docs
											
										
										
											2025-08-15 16:25:49 +03:00
+								            with open(
 								                os.path.join(
 								                    CLIPS_DIR, "genai-requests", review_data["id"], "response.txt"
 								                ),
 								                "w",
 								            ) as f:
 								                f.write(response)
-												Review Item GenAI metadata (#19442)

* Rename existing function

* Keep track of thumbnail updates

* Tinkering with genai prompt

* Adjust input format

* Create model for review description output

* testing prompt changes

* Prompt improvements and image saving

* Add config for review items genai

* Use genai review config

* Actual config usage

* Adjust debug image saving

* Fix

* Fix review creation

* Adjust prompt

* Prompt adjustment

* Run genai in thread

* Fix detections block

* Adjust prompt

* Prompt changes

* Save genai response to metadata model

* Handle metadata

* Send review update to dispatcher

* Save review metadata to DB

* Send review notification updates

* Quick fix

* Fix name

* Fix update type

* Correctly dump model

* Add card

* Add card

* Remove message

* Cleanup typing and UI

* Adjust prompt

* Formatting

* Add log

* Formatting

* Add inference speed and keep alive
											
										
										
											2025-08-10 14:57:54 +03:00
+								        if response:
 								            clean_json = re.sub(
 								                r"\n?```$", "", re.sub(r"^```[a-zA-Z0-9]*\n?", "", response)
 								            )
 								            try:
-												Improve natural language of prompt (#19515)

* Make sequence details human-readable so they are used in natural language response

* Cleanup

* Improve prompt and image selection

* Adjust

* Adjust slightly

* Format time

* Adjust frame selection logic

* Debug save response

* Ignore extra fields

* Adjust docs
											
										
										
											2025-08-15 16:25:49 +03:00
+								                metadata = ReviewMetadata.model_validate_json(clean_json)
-												Miscellaneous fixes (#23009)

* Reduce max frames per second to 1

* Use pydantic but don't fail if some constraints are not met.

* Adjust limits

* Adjust limits

* Cleanup

* add unsaved changes icon/popover to individual settings section

* allow changing camera friendly_name from camera management pane

---------

Co-authored-by: Josh Hawkins <32435876+hawkeye217@users.noreply.github.com>
											
										
										
											2026-04-27 01:09:35 +03:00
+								            except ValidationError as ve:
 								                # Constraint violations (length, item count, ranges) are logged
 								                # at debug and the response is kept anyway — a slightly
 								                # off-spec answer is still usable, and dropping the whole
 								                # response loses the narrative content the model produced.
 								                for err in ve.errors():
 								                    loc = ".".join(str(p) for p in err["loc"]) or "<root>"
 								                    logger.debug(
 								                        "Review metadata soft validation: %s — %s (input: %r)",
 								                        loc,
 								                        err["msg"],
 								                        err.get("input"),
 								                    )
 								                try:
 								                    raw = json.loads(clean_json)
 								                except json.JSONDecodeError as je:
 								                    logger.error("Failed to parse review description JSON: %s", je)
 								                    return None
-												Miscellaneous fixes (#23017)

* add ui to camera config update topics enum

* add mqtt to camera config update enum

* ensure cleanup runs when an event end skips post-processing

* end any in-progress audio events when audio detection is disabled

we already end in-progress audio events when we disable a camera, but this mirrors that logic for specifically disabling audio detection

* Improve GenAI metadata

* fix invalid recording segment topic being misrouted to the valid handler

* Add confidence default to avoid unnecessary field causing issues

---------

Co-authored-by: Nicolas Mowen <nickmowen213@gmail.com>
											
										
										
											2026-04-28 17:54:09 +03:00
+								                # observations and confidence are required on the model; fill an empty default
-												Miscellaneous fixes (#23009)

* Reduce max frames per second to 1

* Use pydantic but don't fail if some constraints are not met.

* Adjust limits

* Adjust limits

* Cleanup

* add unsaved changes icon/popover to individual settings section

* allow changing camera friendly_name from camera management pane

---------

Co-authored-by: Josh Hawkins <32435876+hawkeye217@users.noreply.github.com>
											
										
										
											2026-04-27 01:09:35 +03:00
+								                # if the response omitted it so attribute access stays safe.
 								                raw.setdefault("observations", [])
-												Miscellaneous fixes (#23017)

* add ui to camera config update topics enum

* add mqtt to camera config update enum

* ensure cleanup runs when an event end skips post-processing

* end any in-progress audio events when audio detection is disabled

we already end in-progress audio events when we disable a camera, but this mirrors that logic for specifically disabling audio detection

* Improve GenAI metadata

* fix invalid recording segment topic being misrouted to the valid handler

* Add confidence default to avoid unnecessary field causing issues

---------

Co-authored-by: Nicolas Mowen <nickmowen213@gmail.com>
											
										
										
											2026-04-28 17:54:09 +03:00
+								                raw.setdefault("confidence", 0.0)
-												Miscellaneous fixes (#23009)

* Reduce max frames per second to 1

* Use pydantic but don't fail if some constraints are not met.

* Adjust limits

* Adjust limits

* Cleanup

* add unsaved changes icon/popover to individual settings section

* allow changing camera friendly_name from camera management pane

---------

Co-authored-by: Josh Hawkins <32435876+hawkeye217@users.noreply.github.com>
											
										
										
											2026-04-27 01:09:35 +03:00
+								                metadata = ReviewMetadata.model_construct(**raw)
 								            except Exception as e:
 								                logger.error(
 								                    f"Failed to parse review description as the response did not match expected format. {e}"
 								                )
 								                return None
-												Improve natural language of prompt (#19515)

* Make sequence details human-readable so they are used in natural language response

* Cleanup

* Improve prompt and image selection

* Adjust

* Adjust slightly

* Format time

* Adjust frame selection logic

* Debug save response

* Ignore extra fields

* Adjust docs
											
										
										
											2025-08-15 16:25:49 +03:00
-												Miscellaneous fixes (#23009)

* Reduce max frames per second to 1

* Use pydantic but don't fail if some constraints are not met.

* Adjust limits

* Adjust limits

* Cleanup

* add unsaved changes icon/popover to individual settings section

* allow changing camera friendly_name from camera management pane

---------

Co-authored-by: Josh Hawkins <32435876+hawkeye217@users.noreply.github.com>
											
										
										
											2026-04-27 01:09:35 +03:00
+								            try:
-												Handle percentage as int (#22370)
											
										
										
											2026-03-10 16:35:00 +03:00
+								                # Normalize confidence if model returned a percentage (e.g. 85 instead of 0.85)
 								                if metadata.confidence > 1.0:
 								                    metadata.confidence = min(metadata.confidence / 100.0, 1.0)
-												Review Summary Optimizations (#22533)

* Use different association method

* Clarify

* Remove extra details from ollama schema

* Fix Gemini Chat

* Fix incorrect instructions

* Improve name handling

* Change order of information for llama.cpp

* Simplify prompt

* Fix formatting
											
										
										
											2026-03-19 19:39:24 +03:00
+								                # If any verified objects (contain ← separator), set to 0
 								                if any("←" in obj for obj in review_data["unified_objects"]):
-												Improve natural language of prompt (#19515)

* Make sequence details human-readable so they are used in natural language response

* Cleanup

* Improve prompt and image selection

* Adjust

* Adjust sligtly

* Format time

* Adjust frame selection logic

* Debug save response

* Ignore extra fields

* Adjust docs
											
										
										
											2025-08-15 16:25:49 +03:00
+								                    metadata.potential_threat_level = 0
-												Miscellaneous fixes (#22780)

* fix mobile export crash by removing stale iOS non-modal drawer workaround

* Remove titlecase to avoid Gemma4 handling plain labels as proper nouns

* Improve titling:

* Make directions more clear

* Properly capitalize delivery services

* update dispatcher config reference on save

* subscribe to review topic so ReviewDescriptionProcessor knows genai is enabled

* auto-send ON genai review WS message when enabled_in_config transitions to true

* remove unused object level

* update docs to clarify pre/post capture settings

* add ui docs links

* improve known_plates field in settings UI

* only show save all when multiple sections are changed

or if the section being changed is not currently being viewed

* fix docs

---------

Co-authored-by: Nicolas Mowen <nickmowen213@gmail.com>
											
										
										
											2026-04-07 16:16:19 +03:00
+								                metadata.title = metadata.title[0].upper() + metadata.title[1:]
-												Improve review summary (#20216)

* Add debug logging for review summaries report

* Improve debug logging

* Improve review report prompt

* Cleanup

* Add date to report
											
										
										
											2025-09-26 05:05:22 +03:00
+								                metadata.time = review_data["start"]
-												Improve natural language of prompt (#19515)

* Make sequence details human-readable so they are used in natural language response

* Cleanup

* Improve prompt and image selection

* Adjust

* Adjust slightly

* Format time

* Adjust frame selection logic

* Debug save response

* Ignore extra fields

* Adjust docs
											
										
										
											2025-08-15 16:25:49 +03:00
+								                return metadata
-												Review Item GenAI metadata (#19442)

* Rename existing function

* Keep track of thumbnail updates

* Tinkering with genai prompt

* Adjust input format

* Create model for review description output

* testing prompt changes

* Prompt improvements and image saving

* Add config for review items genai

* Use genai review config

* Actual config usage

* Adjust debug image saving

* Fix

* Fix review creation

* Adjust prompt

* Prompt adjustment

* Run genai in thread

* Fix detections block

* Adjust prompt

* Prompt changes

* Save genai response to metadata model

* Handle metadata

* Send review update to dispatcher

* Save review metadata to DB

* Send review notification updates

* Quick fix

* Fix name

* Fix update type

* Correctly dump model

* Add card

* Add card

* Remove message

* Cleanup typing and UI

* Adjust prompt

* Formatting

* Add log

* Formatting

* Add inference speed and keep alive
											
										
										
											2025-08-10 14:57:54 +03:00
+								            except Exception as e:
-												Miscellaneous fixes (#23009)

* Reduce max frames per second to 1

* Use pydantic but don't fail if some constraints are not met.

* Adjust limits

* Adjust limits

* Cleanup

* add unsaved changes icon/popover to individual settings section

* allow changing camera friendly_name from camera management pane

---------

Co-authored-by: Josh Hawkins <32435876+hawkeye217@users.noreply.github.com>
											
										
										
											2026-04-27 01:09:35 +03:00
+								                logger.error(f"Failed to post-process review metadata: {e}")
-												Review Item GenAI metadata (#19442)

* Rename existing function

* Keep track of thumbnail updates

* Tinkering with genai prompt

* Adjust input format

* Create model for review description output

* testing prompt changes

* Prompt improvements and image saving

* Add config for review items genai

* Use genai review config

* Actual config usage

* Adjust debug image saving

* Fix

* Fix review creation

* Adjust prompt

* Prompt adjustment

* Run genai in thread

* Fix detections block

* Adjust prompt

* Prompt changes

* Save genai response to metadata model

* Handle metadata

* Send review update to dispatcher

* Save review metadata to DB

* Send review notification updates

* Quick fix

* Fix name

* Fix update type

* Correctly dump model

* Add card

* Add card

* Remove message

* Cleanup typing and UI

* Adjust prompt

* Formatting

* Add log

* Formatting

* Add inference speed and keep alive
											
										
										
											2025-08-10 14:57:54 +03:00
+								                return None
 								        else:
-												Tweaks (#22770)

* radix pointer events fix

* add debug log for no genai responses

* tweak profiles docs

* add weblate to maintainers list
											
										
										
											2026-04-05 19:08:23 +03:00
+								            logger.debug(
 								                f"Invalid response received from GenAI provider for review description on {review_data['camera']}. Response: {response}",
 								            )
-												Review Item GenAI metadata (#19442)

* Rename existing function

* Keep track of thumbnail updates

* Tinkering with genai prompt

* Adjust input format

* Create model for review description output

* testing prompt changes

* Prompt improvements and image saving

* Add config for review items genai

* Use genai review config

* Actual config usage

* Adjust debug image saving

* Fix

* Fix review creation

* Adjust prompt

* Prompt adjustment

* Run genai in thread

* Fix detections block

* Adjust prompt

* Prompt changes

* Save genai response to metadata model

* Handle metadata

* Send review update to dispatcher

* Save review metadata to DB

* Send review notification updates

* Quick fix

* Fix name

* Fix update type

* Correctly dump model

* Add card

* Add card

* Remove message

* Cleanup typing and UI

* Adjust prompt

* Formatting

* Add log

* Formatting

* Add inference speed and keep alive
											
										
										
											2025-08-10 14:57:54 +03:00
+								            return None
-												Genai review summaries (#19473)

* Generate review item summaries with requests

* Adjust logic to only send important items

* Don't mention ladder

* Adjust prompt to be more specific

* Add more relaxed nature for normal activity

* Cleanup summary

* Update ollama client

* Add more directions to analyze the frames in order

* Remove environment from prompt
											
										
										
											2025-08-13 01:27:35 +03:00
+								    def generate_review_summary(
-												Improve review summary (#20216)

* Add debug logging for review summaries report

* Improve debug logging

* Improve review report prompt

* Cleanup

* Add date to report
											
										
										
											2025-09-26 05:05:22 +03:00
+								        self,
 								        start_ts: float,
 								        end_ts: float,
-												Miscellaneous Fixes (#21208)

* conditionally display actions for admin role only

* only allow admins to save annotation offset

* Fix classification reset filter

* fix explore context menu from blocking pointer events on the body element after dialog close

applying modal=false to the menu (not to the dialog) to fix this in the same way as elsewhere in the codebase

* add select all link to face library, classification, and explore

* Disable iOS image dragging for classification card

* add proxmox ballooning comment

* lpr docs tweaks

* yaml list

* clarify tls_insecure

* Improve security summary format and usefulness

---------

Co-authored-by: Nicolas Mowen <nickmowen213@gmail.com>
											
										
										
											2025-12-11 17:23:34 +03:00
+								        events: list[dict[str, Any]],
-												Miscellaneous fixes (#21373)

* Send preferred language for report service

* make object lifecycle scrollable in tracking details

* fix info popovers in live camera drawer

* ensure metrics are initialized if genai is enabled

* docs

* ollama cloud model docs

* Ensure object descriptions get claened up

---------

Co-authored-by: Josh Hawkins <32435876+hawkeye217@users.noreply.github.com>
											
										
										
											2025-12-21 03:30:34 +03:00
+								        preferred_language: str | None,
-												Improve review summary (#20216)

* Add debug logging for review summaries report

* Improve debug logging

* Improve review report prompt

* Cleanup

* Add date to report
											
										
										
											2025-09-26 05:05:22 +03:00
+								        debug_save: bool,
-												Genai review summaries (#19473)

* Generate review item summaries with requests

* Adjust logic to only send important items

* Don't mention ladder

* Adjust prompt to be more specific

* Add more relaxed nature for normal activity

* Cleanup summary

* Update ollama client

* Add more directions to analyze the frames in order

* Remove environment from prompt
											
										
										
											2025-08-13 01:27:35 +03:00
+								    ) -> str | None:
 								        """Generate a summary of review item descriptions over a period of time."""
-												Improve review summary (#20216)

* Add debug logging for review summaries report

* Improve debug logging

* Improve review report prompt

* Cleanup

* Add date to report
											
										
										
											2025-09-26 05:05:22 +03:00
+								        time_range = f"{datetime.datetime.fromtimestamp(start_ts).strftime('%B %d, %Y at %I:%M %p')} to {datetime.datetime.fromtimestamp(end_ts).strftime('%B %d, %Y at %I:%M %p')}"
-												Genai review summaries (#19473)

* Generate review item summaries with requests

* Adjust logic to only send important items

* Don't mention ladder

* Adjust prompt to be more specific

* Add more relaxed nature for normal activity

* Cleanup summary

* Update ollama client

* Add more directions to analyze the frames in order

* Remove environment from prompt
											
										
										
											2025-08-13 01:27:35 +03:00
+								        timeline_summary_prompt = f"""
-												Miscellaneous Fixes (#21208)

* conditionally display actions for admin role only

* only allow admins to save annotation offset

* Fix classification reset filter

* fix explore context menu from blocking pointer events on the body element after dialog close

applying modal=false to the menu (not to the dialog) to fix this in the same way as elsewhere in the codebase

* add select all link to face library, classification, and explore

* Disable iOS image dragging for classification card

* add proxmox ballooning comment

* lpr docs tweaks

* yaml list

* clarify tls_insecure

* Improve security summary format and usefulness

---------

Co-authored-by: Nicolas Mowen <nickmowen213@gmail.com>
											
										
										
											2025-12-11 17:23:34 +03:00
+								You are a security officer writing a concise security report.
 								Time range: {time_range}
 								Input format: Each event is a JSON object with:
 								- "title", "scene", "confidence", "potential_threat_level" (0-2), "other_concerns", "camera", "time", "start_time", "end_time"
 								- "context": array of related events from other cameras that occurred during overlapping time periods
-												Miscellaneous fixes (0.17 beta) (#21431)

* Add shortSummary field to review summary to be used for notifications

* pull in current config version into default config

* fix crash when dynamically adding cameras

depending on where we are in the update loop, camera configs might not be updated yet and we are receiving detections already

* add no tracked objects and icon to explore summary view

* reset add camera wizard when closing and saving

* don't flash no exports icon while loading

* Improve handling of homekit config

* Increase prompt tokens reservation

* Adjust

* Catch event not found object detection

* Use thread lock for JinaV2 in onnxruntime

* remove incorrect embeddings process from memray docs

* only show transcribe button if audio event has video

* apply aspect ratio and margin constraints to path overlay in detail stream on mobile

improves a specific case where the overlay was not aligned with 4:3 cameras on mobile phones

* show metadata title as tooltip on icon hover in detail stream

---------

Co-authored-by: Josh Hawkins <32435876+hawkeye217@users.noreply.github.com>
											
										
										
											2025-12-26 17:45:03 +03:00
+								**Note: Use the "scene" field for event descriptions in the report. Ignore any "shortSummary" field if present.**
-												Miscellaneous Fixes (#21208)

* conditionally display actions for admin role only

* only allow admins to save annotation offset

* Fix classification reset filter

* fix explore context menu from blocking pointer events on the body element after dialog close

applying modal=false to the menu (not to the dialog) to fix this in the same way as elsewhere in the codebase

* add select all link to face library, classification, and explore

* Disable iOS image dragging for classification card

* add proxmox ballooning comment

* lpr docs tweaks

* yaml list

* clarify tls_insecure

* Improve security summary format and usefulness

---------

Co-authored-by: Nicolas Mowen <nickmowen213@gmail.com>
											
										
										
											2025-12-11 17:23:34 +03:00
+								Report Structure - Use this EXACT format:
 								# Security Summary - {time_range}
 								## Overview
 								[Write 1-2 sentences summarizing the overall activity pattern during this period.]
 								---
 								## Timeline
 								[Group events by time periods (e.g., "Morning (6:00 AM - 12:00 PM)", "Afternoon (12:00 PM - 5:00 PM)", "Evening (5:00 PM - 9:00 PM)", "Night (9:00 PM - 6:00 AM)"). Use appropriate time blocks based on when events occurred.]
 								### [Time Block Name]
 								**HH:MM AM/PM** | [Camera Name] | [Threat Level Indicator]
 								- [Event title]: [Clear description incorporating contextual information from the "context" array]
 								- Context: [If context array has items, mention them here, e.g., "Delivery truck present on Front Driveway Cam (HH:MM AM/PM)"]
 								- Assessment: [Brief assessment incorporating context - if context explains the event, note it here]
 								[Repeat for each event in chronological order within the time block]
 								---
 								## Summary
 								[One sentence summarizing the period. If all events are normal/explained: "Routine activity observed." If review needed: "Some activity requires review but no security concerns." If security concerns: "Security concerns requiring immediate attention."]
 								Guidelines:
 								- List ALL events in chronological order, grouped by time blocks
 								- Threat level indicators: ✓ Normal, ⚠️ Needs review, 🔴 Security concern
 								- Integrate contextual information naturally - use the "context" array to enrich each event's description
 								- If context explains the event (e.g., delivery truck explains person at door), describe it accordingly (e.g., "delivery person" not "unidentified person")
 								- Be concise but informative - focus on what happened and what it means
 								- If contextual information makes an event clearly normal, reflect that in your assessment
 								- Only create time blocks that have events - don't create empty sections
-												Improve review summary (#20216)

* Add debug logging for review summaries report

* Improve debug logging

* Improve review report prompt

* Cleanup

* Add date to report
											
										
										
											2025-09-26 05:05:22 +03:00
+								"""
-												Genai review summaries (#19473)

* Generate review item summaries with requests

* Adjust logic to only send important items

* Don't mention ladder

* Adjust prompt to be more specific

* Add more relaxed nature for normal activity

* Cleanup summary

* Update ollama client

* Add more directions to analyze the frames in order

* Remove environment from prompt
											
										
										
											2025-08-13 01:27:35 +03:00
-												Miscellaneous Fixes (#21208)

* conditionally display actions for admin role only

* only allow admins to save annotation offset

* Fix classification reset filter

* fix explore context menu from blocking pointer events on the body element after dialog close

applying modal=false to the menu (not to the dialog) to fix this in the same way as elsewhere in the codebase

* add select all link to face library, classification, and explore

* Disable iOS image dragging for classification card

* add proxmox ballooning comment

* lpr docs tweaks

* yaml list

* clarify tls_insecure

* Improve security summary format and usefulness

---------

Co-authored-by: Nicolas Mowen <nickmowen213@gmail.com>
											
										
										
											2025-12-11 17:23:34 +03:00
+								        timeline_summary_prompt += "\n\nEvents:\n"
 								        for event in events:
 								            timeline_summary_prompt += f"\n{event}\n"
-												Genai review summaries (#19473)

* Generate review item summaries with requests

* Adjust logic to only send important items

* Don't mention ladder

* Adjust prompt to be more specific

* Add more relaxed nature for normal activity

* Cleanup summary

* Update ollama client

* Add more directions to analyze the frames in order

* Remove environment from prompt
											
										
										
											2025-08-13 01:27:35 +03:00
-												Miscellaneous fixes (#21373)

* Send preferred language for report service

* make object lifecycle scrollable in tracking details

* fix info popovers in live camera drawer

* ensure metrics are initialized if genai is enabled

* docs

* ollama cloud model docs

* Ensure object descriptions get claened up

---------

Co-authored-by: Josh Hawkins <32435876+hawkeye217@users.noreply.github.com>
											
										
										
											2025-12-21 03:30:34 +03:00
+								        if preferred_language:
 								            timeline_summary_prompt += f"\nProvide your answer in {preferred_language}"
-												Improve review summary (#20216)

* Add debug logging for review summaries report

* Improve debug logging

* Improve review report prompt

* Cleanup

* Add date to report
											
										
										
											2025-09-26 05:05:22 +03:00
+								        if debug_save:
 								            with open(
 								                os.path.join(
 								                    CLIPS_DIR, "genai-requests", f"{start_ts}-{end_ts}", "prompt.txt"
 								                ),
 								                "w",
 								            ) as f:
 								                f.write(timeline_summary_prompt)
 								        response = self._send(timeline_summary_prompt, [])
 								        if debug_save and response:
 								            with open(
 								                os.path.join(
 								                    CLIPS_DIR, "genai-requests", f"{start_ts}-{end_ts}", "response.txt"
 								                ),
 								                "w",
 								            ) as f:
 								                f.write(response)
 								        return response
-												Genai review summaries (#19473)

* Generate review item summaries with requests

* Adjust logic to only send important items

* Don't mention ladder

* Adjust prompt to be more specific

* Add more relaxed nature for normal activity

* Cleanup summary

* Update ollama client

* Add more directions to analyze the frames in order

* Remove environment from prompt
											
										
										
											2025-08-13 01:27:35 +03:00
-												Review Item GenAI metadata (#19442)

* Rename existing function

* Keep track of thumbnail updates

* Tinkering with genai prompt

* Adjust input format

* Create model for review description output

* testing prompt changes

* Prompt improvements and image saving

* Add config for review items genai

* Use genai review config

* Actual config usage

* Adjust debug image saving

* Fix

* Fix review creation

* Adjust prompt

* Prompt adjustment

* Run genai in thread

* Fix detections block

* Adjust prompt

* Prompt changes

* Save genai response to metadata model

* Handle metadata

* Send review update to dispatcher

* Save review metadata to DB

* Send review notification updates

* Quick fix

* Fix name

* Fix update type

* Correctly dump model

* Add card

* Add card

* Remove message

* Cleanup typing and UI

* Adjust prompt

* Formatting

* Add log

* Formatting

* Add inference speed and keep alive
											
										
										
											2025-08-10 14:57:54 +03:00
+								    def generate_object_description(
-												write prompts for genai at the camera level (#13767)


											
										
										
											2024-09-16 17:46:11 +03:00
+								        self,
 								        camera_config: CameraConfig,
 								        thumbnails: list[bytes],
-												Fix substitution on genai prompts (#14298)


											
										
										
											2024-10-12 15:19:24 +03:00
+								        event: Event,
-												Semantic Search for Detections (#11899)

* Initial re-implementation of semantic search

* put docker-compose back and make reindex match docs

* remove debug code and fix import

* fix docs

* manually build pysqlite3 as binaries are only available for x86-64

* update comment in build_pysqlite3.sh

* only embed objects

* better error handling when genai fails

* ask ollama to pull requested model at startup

* update ollama docs

* address some PR review comments

* fix lint

* use IPC to write description, update docs for reindex

* remove gemini-pro-vision from docs as it will be unavailable soon

* fix OpenAI doc available models

* fix api error in gemini and metadata for embeddings

											
										
										
											2024-06-22 00:30:19 +03:00
+								    ) -> Optional[str]:
 								        """Generate a description for the frame."""
-												Catch invalid key in genai prompt (#19657)


											
										
										
											2025-08-20 16:03:50 +03:00
+								        try:
-												Fix object genai prompt access (#20322)


											
										
										
											2025-10-02 14:48:16 +03:00
+								            prompt = camera_config.objects.genai.object_prompts.get(
-												Increase mypy coverage and fixes (#22632)
											
										
										
											2026-03-25 18:28:48 +03:00
+								                str(event.label),
-												Fix object genai prompt access (#20322)


											
										
										
											2025-10-02 14:48:16 +03:00
+								                camera_config.objects.genai.prompt,
-												Catch invalid key in genai prompt (#19657)


											
										
										
											2025-08-20 16:03:50 +03:00
+								            ).format(**model_to_dict(event))
 								        except KeyError as e:
 								            logger.error(f"Invalid key in GenAI prompt: {e}")
 								            return None
-												Update ollama docs and add genai debug logging (#15012)


											
										
										
											2024-11-16 00:24:17 +03:00
+								        logger.debug(f"Sending images to genai provider with prompt: {prompt}")
-												Semantic Search for Detections (#11899)

* Initial re-implementation of semantic search

* put docker-compose back and make reindex match docs

* remove debug code and fix import

* fix docs

* manually build pysqlite3 as binaries are only available for x86-64

* update comment in build_pysqlite3.sh

* only embed objects

* better error handling when genai fails

* ask ollama to pull requested model at startup

* update ollama docs

* address some PR review comments

* fix lint

* use IPC to write description, update docs for reindex

* remove gemini-pro-vision from docs as it will be unavailable soon

* fix OpenAI doc available models

* fix api error in gemini and metadata for embeddings

											
										
										
											2024-06-22 00:30:19 +03:00
+								        return self._send(prompt, thumbnails)
-												Increase mypy coverage and fixes (#22632)
											
										
										
											2026-03-25 18:28:48 +03:00
+								    def _init_provider(self) -> Any:
-												Semantic Search for Detections (#11899)

* Initial re-implementation of semantic search

* put docker-compose back and make reindex match docs

* remove debug code and fix import

* fix docs

* manually build pysqlite3 as binaries are only available for x86-64

* update comment in build_pysqlite3.sh

* only embed objects

* better error handling when genai fails

* ask ollama to pull requested model at startup

* update ollama docs

* address some PR review comments

* fix lint

* use IPC to write description, update docs for reindex

* remove gemini-pro-vision from docs as it will be unavailable soon

* fix OpenAI doc available models

* fix api error in gemini and metadata for embeddings

											
										
										
											2024-06-22 00:30:19 +03:00
+								        """Initialize the client."""
 								        return None
-												Refactor Review GenAI Prompt (#22353)

* Improve title to better capture activity

* Improve efficiency of prompt

* Use json format for llama.cpp

* Cleanup prompt

* Add output format for other LLMs
											
										
										
											2026-03-10 03:47:37 +03:00
+								    def _send(
 								        self,
 								        prompt: str,
 								        images: list[bytes],
 								        response_format: Optional[dict] = None,
 								    ) -> Optional[str]:
-												Revert "Miscellaneous fixes (0.17 beta) (#21764)" (#21825)

This reverts commit 50ac5a1483c94c86fca3a84c2a33a9e898a40de9.
											
										
										
											2026-01-29 21:30:21 +03:00
+								        """Submit a request to the provider."""
-												Semantic Search for Detections (#11899)

* Initial re-implementation of semantic search

* put docker-compose back and make reindex match docs

* remove debug code and fix import

* fix docs

* manually build pysqlite3 as binaries are only available for x86-64

* update comment in build_pysqlite3.sh

* only embed objects

* better error handling when genai fails

* ask ollama to pull requested model at startup

* update ollama docs

* address some PR review comments

* fix lint

* use IPC to write description, update docs for reindex

* remove gemini-pro-vision from docs as it will be unavailable soon

* fix OpenAI doc available models

* fix api error in gemini and metadata for embeddings

											
										
										
											2024-06-22 00:30:19 +03:00
+								        return None
-												Refactor genai (#22752)

* Switch to a feature-based roles so it is easier to choose models for different tasks

* Fallback and try llama-swap format

* List models supported by provider

* Cleanup

* Add frontend

* Improve model loading

* Make it possible to update genai without restarting

* Cleanup

* Cleanup

* Mypy
											
										
										
											2026-04-04 02:13:52 +03:00
+								    @property
 								    def supports_vision(self) -> bool:
 								        """Whether the model supports vision/image input.
 								        Defaults to True for cloud providers. Providers that can detect
 								        capability at runtime (e.g. llama.cpp) should override this.
 								        """
 								        return True
 								    def list_models(self) -> list[str]:
 								        """List the model names this provider makes available.

 								        The base implementation has no backend to ask, so it always hands
 								        back a new empty list; provider subclasses should override it to
 								        query their backend.
 								        """
 								        available: list[str] = []
 								        return available
-												Improve review summary performance (#20328)

* Undo vite

* Balance the prompt

* Round duration

* Calculate context size to determine number of images

* Increase number of images
											
										
										
											2025-10-02 18:17:25 +03:00
+								    def get_context_size(self) -> int:
 								        """Get the context window size for this provider in tokens."""
 								        return 4096
-												GenAI Optimizations (#23006)

* Test for image token usage in llama.cpp so we can more appropriately decide how many frames to include

* Limit based on frames per second

* handle zone case sensitivity

* Improve formatting

* Add observations field so model can build CoT before outputting used fields
											
										
										
											2026-04-26 01:38:18 +03:00
+								    def estimate_image_tokens(self, width: int, height: int) -> float:
 								        """Estimate prompt tokens consumed by a single image of the given dimensions.
 								        Default heuristic: ~1 token per 1250 pixels. Providers that can measure or
 								        know their model's exact image-token cost should override.
 								        """
 								        return (width * height) / 1250
-												Support using GenAI for embeddings / semantic search (#22323)

* Support GenAI for embeddings

* Add embed API support

* Add support for embedding via genai

* Basic docs

* undo

* Fix sending images

* Don't require download check

* Set model

* Handle emb correctly

* Clarification

* Cleanup

* Cleanup
											
										
										
											2026-03-08 18:55:00 +03:00
+								    def embed(
 								        self,
 								        texts: list[str] | None = None,
 								        images: list[bytes] | None = None,
 								    ) -> list[np.ndarray]:
 								        """Generate embeddings for text and/or images.
 								        Returns list of numpy arrays (one per input). Expected dimension is 768
 								        for Frigate semantic search compatibility.
 								        Providers that support embeddings should override this method.
 								        """
 								        logger.warning(
 								            "%s does not support embeddings. "
 								            "This method should be overridden by the provider implementation.",
 								            self.__class__.__name__,
 								        )
 								        return []
-												Implement LLM Chat API with tool calling support (#21731)

* Implement initial tools definition APIs

* Add initial chat completion API with tool support

* Implement other providers

* Cleanup
											
										
										
											2026-01-20 18:13:12 +03:00
+								    def chat_with_tools(
 								        self,
 								        messages: list[dict[str, Any]],
 								        tools: Optional[list[dict[str, Any]]] = None,
 								        tool_choice: Optional[str] = "auto",
 								    ) -> dict[str, Any]:
 								        """
 								        Send chat messages to LLM with optional tool definitions.
 								        This method handles conversation-style interactions with the LLM,
 								        including function calling/tool usage capabilities.
 								        Args:
 								            messages: List of message dictionaries. Each message should have:
 								                - 'role': str - One of 'user', 'assistant', 'system', or 'tool'
 								                - 'content': str - The message content
 								                - 'tool_call_id': Optional[str] - For tool responses, the ID of the tool call
 								                - 'name': Optional[str] - For tool messages, the tool name
 								            tools: Optional list of tool definitions in OpenAI-compatible format.
 								                   Each tool should have 'type': 'function' and 'function' with:
 								                   - 'name': str - Tool name
 								                   - 'description': str - Tool description
 								                   - 'parameters': dict - JSON schema for parameters
 								            tool_choice: How the model should handle tools:
 								                - 'auto': Model decides whether to call tools
 								                - 'none': Model must not call tools
 								                - 'required': Model must call at least one tool
 								                - Or a dict specifying a specific tool to call
 								            **kwargs: Additional provider-specific parameters.
 								        Returns:
 								            Dictionary with:
 								            - 'content': Optional[str] - The text response from the LLM, None if tool calls
 								            - 'tool_calls': Optional[List[Dict]] - List of tool calls if LLM wants to call tools.
 								              Each tool call dict has:
 								                - 'id': str - Unique identifier for this tool call
 								                - 'name': str - Tool name to call
 								                - 'arguments': dict - Arguments for the tool call (parsed JSON)
 								            - 'finish_reason': str - Reason generation stopped:
 								                - 'stop': Normal completion
 								                - 'tool_calls': LLM wants to call tools
 								                - 'length': Hit token limit
 								                - 'error': An error occurred
 								        Raises:
 								            NotImplementedError: If the provider doesn't implement this method.
 								        """
 								        # Base implementation - each provider should override this
 								        logger.warning(
 								            f"{self.__class__.__name__} does not support chat_with_tools. "
 								            "This method should be overridden by the provider implementation."
 								        )
 								        return {
 								            "content": None,
 								            "tool_calls": None,
 								            "finish_reason": "error",
 								        }
-												Semantic Search for Detections (#11899)

* Initial re-implementation of semantic search

* put docker-compose back and make reindex match docs

* remove debug code and fix import

* fix docs

* manually build pysqlite3 as binaries are only available for x86-64

* update comment in build_pysqlite3.sh

* only embed objects

* better error handling when genai fails

* ask ollama to pull requested model at startup

* update ollama docs

* address some PR review comments

* fix lint

* use IPC to write description, update docs for reindex

* remove gemini-pro-vision from docs as it will be unavailable soon

* fix OpenAI doc available models

* fix api error in gemini and metadata for embeddings

											
										
										
											2024-06-22 00:30:19 +03:00
-												Increase mypy coverage and fixes (#22632)
											
										
										
											2026-03-25 18:28:48 +03:00
+								def load_providers() -> None:
-												Semantic Search for Detections (#11899)

* Initial re-implementation of semantic search

* put docker-compose back and make reindex match docs

* remove debug code and fix import

* fix docs

* manually build pysqlite3 as binaries are only available for x86-64

* update comment in build_pysqlite3.sh

* only embed objects

* better error handling when genai fails

* ask ollama to pull requested model at startup

* update ollama docs

* address some PR review comments

* fix lint

* use IPC to write description, update docs for reindex

* remove gemini-pro-vision from docs as it will be unavailable soon

* fix OpenAI doc available models

* fix api error in gemini and metadata for embeddings

											
										
										
											2024-06-22 00:30:19 +03:00
+								    package_dir = os.path.dirname(__file__)
 								    for filename in os.listdir(package_dir):
 								        if filename.endswith(".py") and filename != "__init__.py":
 								            module_name = f"frigate.genai.{filename[:-3]}"
 								            importlib.import_module(module_name)