This commit is contained in:
Josh Hawkins 2025-05-27 08:52:46 -05:00
parent 27bfc81a20
commit 772190869f
3 changed files with 4 additions and 7 deletions

View File

@@ -44,7 +44,7 @@ class AudioTranscriptionRealTimeProcessor(RealTimeProcessorApi):
 if self.config.audio_transcription.model_size == "large":
 self.asr = FasterWhisperASR(
-modelsize="tiny", # could use 'base' for CPU, switch to 'small' or 'large-v2' for GPU
+modelsize="tiny",
 device="cuda"
 if self.config.audio_transcription.device == "GPU"
 else "cpu",

View File

@@ -179,12 +179,10 @@ class EmbeddingMaintainer(threading.Thread):
 )
 )
-audio_transcription_cameras = [
-c
+if any(
+c.enabled_in_config and c.audio_transcription.enabled
 for c in self.config.cameras.values()
-if c.enabled_in_config and c.audio_transcription.enabled
-]
-if audio_transcription_cameras:
+):
 self.post_processors.append(
 AudioTranscriptionPostProcessor(self.config, self.requestor, metrics)
 )

View File

@@ -226,7 +226,6 @@ class AudioEventMaintainer(threading.Thread):
 # run audio transcription
 if self.transcription_processor is not None and (
-# rms >= self.camera_config.audio.min_volume or self.is_endpoint is False
 self.camera_config.audio_transcription.live_enabled
 ):
 self.transcribing = True