Merge 42453dad30 into 32e433cafc

Allow GenAI providers to be initialized lazily (#23482)
* allow GenAI providers to be initialized even if they failed on previous attempts
* mypy
2026-07-04 19:11:14 +03:00 · 2026-06-14 17:32:37 -05:00 · 2026-06-14 11:40:33 -05:00 · 2026-06-09 11:33:16 +00:00
3 changed files with 38 additions and 3 deletions
--- a/docker/tensorrt/requirements-amd64.txt
+++ b/docker/tensorrt/requirements-amd64.txt
@@ -11,7 +11,7 @@ nvidia-cuda-nvrtc-cu12==12.8.93; platform_machine == 'x86_64'
 nvidia-cuda-runtime-cu12==12.8.90; platform_machine == 'x86_64'
 nvidia-cusolver-cu12==11.7.3.90; platform_machine == 'x86_64'
 nvidia-cusparse-cu12==12.5.8.93; platform_machine == 'x86_64'
-nvidia-nccl-cu12==2.26.2.post1; platform_machine == 'x86_64'
+nvidia-nccl-cu12==2.30.7; platform_machine == 'x86_64'
 nvidia-nvjitlink-cu12==12.8.93; platform_machine == 'x86_64'
 onnx==1.16.*; platform_machine == 'x86_64'
 onnxruntime-gpu==1.24.*; platform_machine == 'x86_64'
--- a/frigate/genai/__init__.py
+++ b/frigate/genai/__init__.py
@@ -5,6 +5,7 @@ import json
 import logging
 import os
 import re
+import time
 from typing import Any, AsyncGenerator, Callable, Optional

 import numpy as np
@@ -50,6 +51,10 @@ def register_genai_provider(key: GenAIProviderEnum) -> Callable:
 class GenAIClient:
    """Generative AI client for Frigate."""

+    # Minimum seconds between re-initialization attempts when the provider was
+    # offline at startup
+    REINIT_INTERVAL = 60.0
+
    def __init__(
        self,
        genai_config: GenAIConfig,
@@ -60,6 +65,34 @@ class GenAIClient:
        self.timeout = timeout
        self.validate_model = validate_model
        self.provider = self._init_provider()
+        self._last_init_attempt = time.monotonic()
+
+    def ensure_provider(self) -> bool:
+        """Ensure a provider is available, retrying initialization if needed.
+
+        Providers can fail to initialize at startup when their backing service
+        isn't online yet (common when both are started together). This retries
+        ``_init_provider`` lazily — throttled to ``REINIT_INTERVAL`` — so the
+        client recovers on its own once the service is reachable, without a
+        config reload.
+
+        Returns True if a provider is available.
+        """
+        if self.provider is not None:
+            return True
+
+        now = time.monotonic()
+        if now - self._last_init_attempt < self.REINIT_INTERVAL:
+            return False
+
+        self._last_init_attempt = now
+        self.provider = self._init_provider()
+        if self.provider is not None:
+            logger.info(
+                "GenAI provider %s is now available",
+                self.genai_config.provider,
+            )
+        return self.provider is not None

    def generate_review_description(
        self,
--- a/frigate/genai/manager.py
+++ b/frigate/genai/manager.py
@@ -62,7 +62,9 @@ class GenAIClientManager:
    def _get_client(self, name: str) -> "Optional[GenAIClient]":
        """Return the client for *name*, creating it on first access."""
        if name in self._clients:
-            return self._clients[name]
+            client = self._clients[name]
+            client.ensure_provider()
+            return client

        from frigate.genai import PROVIDERS

@@ -78,7 +80,7 @@ class GenAIClientManager:
            return None

        try:
-            client: "GenAIClient" = provider_cls(genai_cfg)
+            client = provider_cls(genai_cfg)
        except Exception as e:
            logger.exception(
                "Failed to create GenAI client for provider %s: %s",
Author	SHA1	Message	Date
dependabot[bot]	f790ed6159	Merge `42453dad30` into `32e433cafc`	2026-06-14 17:32:37 -05:00
Nicolas Mowen	32e433cafc	Allow GenAI providers to be initialized lazily (#23482 ) Some checks are pending CI / AMD64 Build (push) Waiting to run Details CI / ARM Build (push) Waiting to run Details CI / Jetson Jetpack 6 (push) Waiting to run Details CI / AMD64 Extra Build (push) Blocked by required conditions Details CI / ARM Extra Build (push) Blocked by required conditions Details CI / Synaptics Build (push) Blocked by required conditions Details CI / Assemble and push default build (push) Blocked by required conditions Details * allow GenAI providers to be initialized even if they failed on previous attempts * mypy	2026-06-14 11:40:33 -05:00
dependabot[bot]	42453dad30	Bump nvidia-nccl-cu12 from 2.26.2.post1 to 2.30.7 in /docker/tensorrt Bumps [nvidia-nccl-cu12](https://developer.nvidia.com/cuda-zone) from 2.26.2.post1 to 2.30.7. --- updated-dependencies: - dependency-name: nvidia-nccl-cu12 dependency-version: 2.30.7 dependency-type: direct:production update-type: version-update:semver-minor ... Signed-off-by: dependabot[bot] <support@github.com>	2026-06-09 11:33:16 +00:00