From ae3427158c7d90f15059452126c8058fb643de49 Mon Sep 17 00:00:00 2001 From: Nicolas Mowen Date: Thu, 18 Sep 2025 22:23:29 -0600 Subject: [PATCH] Correctly enable cuda graphs --- frigate/detectors/detection_runners.py | 22 ++++++++++++++-------- 1 file changed, 14 insertions(+), 8 deletions(-) diff --git a/frigate/detectors/detection_runners.py b/frigate/detectors/detection_runners.py index 3e304d63c..20227b11d 100644 --- a/frigate/detectors/detection_runners.py +++ b/frigate/detectors/detection_runners.py @@ -420,16 +420,22 @@ def get_optimized_runner( if device != "CPU" and is_openvino_gpu_npu_available(): return OpenVINOModelRunner(model_path, device, model_type, **kwargs) - ortSession = ort.InferenceSession( - model_path, - providers=providers, - provider_options=options, - ) - if ( not CudaGraphRunner.is_complex_model(model_type) and providers[0] == "CUDAExecutionProvider" ): - return CudaGraphRunner(ortSession, options[0]["device_id"]) + options[0] = { + **options[0], + "enable_cuda_graph": True, + } + return CudaGraphRunner(ort.InferenceSession( + model_path, + providers=providers, + provider_options=options, + ), options[0]["device_id"]) - return ONNXModelRunner(ortSession) + return ONNXModelRunner(ort.InferenceSession( + model_path, + providers=providers, + provider_options=options, + ))