Adjustments to context sizing

2026-04-11 17:47:37 +03:00 · 2025-10-30 07:09:03 -06:00 · 2025-10-30 07:09:03 -06:00 · 09bf71b4f9
commit 09bf71b4f9
parent 31aed17ca2
2 changed files with 22 additions and 16 deletions
--- a/frigate/data_processing/post/review_descriptions.py
+++ b/frigate/data_processing/post/review_descriptions.py
@ -53,32 +53,38 @@ class ReviewDescriptionProcessor(PostProcessorApi):
    ) -> int:
        """Calculate optimal number of frames based on context size and image source.
-        Recordings (480p): ~250 tokens/image, capped at 20 frames
+        Recordings (480p): ~500 tokens/image, capped at 20 frames
-        Previews (180p): ~100 tokens/image, capped at 20 frames
+        Previews (180p): ~170 tokens/image, capped at 20 frames
-        Targets 70-80% context utilization while keeping inference time reasonable.
+        Targets 75% context utilization while keeping inference time reasonable.
        """
        context_size = self.genai_client.get_context_size()
        if image_source == ImageSourceEnum.recordings:
            if context_size > 16000:
                return 20
            elif context_size > 14000:
                return 18
            elif context_size > 12000:
                return 14
            elif context_size > 10000:
                return 10
            elif context_size > 8000:
                return 8
            elif context_size > 6000:
                return 6
            else:
                return 4
        else:
            if context_size > 12000:
                return 20
-            elif context_size > 10000:
+            elif context_size > 8000:
-                return 18
+                return 16
            elif context_size > 6000:
-                return 14
+                return 12
            elif context_size > 4000:
                return 10
            else:
                return 6
        else:
            if context_size > 10000:
                return 20
            elif context_size > 6000:
                return 16
            elif context_size > 4000:
                return 12
            else:
                return 8
    def process_data(self, data, data_type):
        self.metrics.review_desc_dps.value = self.review_descs_dps.eps()
--- a/frigate/genai/ollama.py
+++ b/frigate/genai/ollama.py
@ -68,7 +68,7 @@ class OllamaClient(GenAIClient):
                f"Ollama tokens used: eval_count={result.get('eval_count')}, prompt_eval_count={result.get('prompt_eval_count')}"
            )
            return result["response"].strip()
-        except (TimeoutException, ResponseError) as e:
+        except (TimeoutException, ResponseError, ConnectionError) as e:
            logger.warning("Ollama returned an error: %s", str(e))
            return None