Read audio frames from ffmpeg process directly

2026-02-05 18:55:23 +03:00 · 2023-07-25 16:58:17 -06:00 · 2023-07-25 16:58:17 -06:00 · 636de05738
commit 636de05738
parent ab60077294
1 changed files with 19 additions and 29 deletions
--- a/frigate/events/audio.py
+++ b/frigate/events/audio.py
@ -3,9 +3,9 @@
 import datetime
 import logging
 import multiprocessing as mp
 import os
 import signal
 import threading
 import time
 from types import FrameType
 from typing import Optional, Tuple
@ -21,7 +21,6 @@ from frigate.const import (
    AUDIO_MAX_BIT_RANGE,
    AUDIO_MIN_CONFIDENCE,
    AUDIO_SAMPLE_RATE,
    CACHE_DIR,
    FRIGATE_LOCALHOST,
 )
 from frigate.ffmpeg_presets import parse_preset_input
@ -40,12 +39,12 @@ except ModuleNotFoundError:
 logger = logging.getLogger(__name__)
-def get_ffmpeg_command(input_args: list[str], input_path: str, pipe: str) -> list[str]:
+def get_ffmpeg_command(input_args: list[str], input_path: str) -> list[str]:
    return get_ffmpeg_arg_list(
        f"ffmpeg {{}} -i {{}} -f {AUDIO_FORMAT} -ar {AUDIO_SAMPLE_RATE} -ac 1 -y {{}}".format(
            " ".join(input_args),
            input_path,
-            pipe,
+            "pipe:",
        )
    )
@ -169,14 +168,11 @@ class AudioEventMaintainer(threading.Thread):
        self.shape = (int(round(AUDIO_DURATION * AUDIO_SAMPLE_RATE)),)
        self.chunk_size = int(round(AUDIO_DURATION * AUDIO_SAMPLE_RATE * 2))
        self.logger = logging.getLogger(f"audio.{self.config.name}")
        self.pipe = f"{CACHE_DIR}/{self.config.name}-audio"
        self.ffmpeg_cmd = get_ffmpeg_command(
            get_ffmpeg_arg_list(self.config.ffmpeg.global_args)
            + parse_preset_input("preset-rtsp-audio-only", 1),
            [i.path for i in self.config.ffmpeg.inputs if "audio" in i.roles][0],
            self.pipe,
        )
        self.pipe_file = None
        self.logpipe = LogPipe(f"ffmpeg.{self.config.name}.audio")
        self.audio_listener = None
@ -279,40 +275,34 @@ class AudioEventMaintainer(threading.Thread):
                        f"Failed to end audio event {detection['id']} with status code {resp.status_code}"
                    )
-    def restart_audio_pipe(self) -> None:
+    def start_or_restart_ffmpeg(self) -> None:
        try:
            if self.pipe_file:
                os.close(self.pipe_file)
            if os.path.exists(self.pipe):
                os.remove(self.pipe)
            self.pipe_file = None
            os.mkfifo(self.pipe)
        except FileExistsError:
            pass
        self.audio_listener = start_or_restart_ffmpeg(
-            self.ffmpeg_cmd, self.logger, self.logpipe, None, self.audio_listener
+            self.ffmpeg_cmd,
            self.logger,
            self.logpipe,
            self.chunk_size,
            self.audio_listener,
        )
    def read_audio(self) -> None:
        if self.pipe_file is None:
            self.pipe_file = open(self.pipe, "rb")
        try:
-            audio = np.frombuffer(self.pipe_file.read(self.chunk_size), dtype=np.int16)
+            self.logger.error("Trying to read from process")
            audio = np.frombuffer(self.audio_listener.stdout.read(self.chunk_size), dtype=np.int16)
            self.logger.error("Finished reading from process")
            self.detect_audio(audio)
-        except BrokenPipeError:
+        except Exception:
            self.logger.error(
                "Error reading audio data from ffmpeg process, restarting..."
            )
            time.sleep(self.config.ffmpeg.retry_interval)
            self.logpipe.dump()
-            self.restart_audio_pipe()
+            self.start_or_restart_ffmpeg()
    def run(self) -> None:
-        self.restart_audio_pipe()
+        self.start_or_restart_ffmpeg()
        while not self.stop_event.is_set():
            self.read_audio()
        self.pipe_file.close()
        stop_ffmpeg(self.audio_listener, self.logger)
        self.logpipe.close()