mirror of
https://github.com/blakeblackshear/frigate.git
synced 2026-05-01 19:17:41 +03:00
Use float16 and the "small" model on GPU for real-time transcription
This commit is contained in:
parent
e60b51d036
commit
43a3943c50
@ -122,9 +122,9 @@ class FasterWhisperASR(ASRBase):
|
||||
|
||||
# this worked fast and reliably on NVIDIA L40
|
||||
model = WhisperModel(
|
||||
model_size_or_path="tiny",
|
||||
model_size_or_path="small" if device == "cuda" else "tiny",
|
||||
device=device,
|
||||
compute_type="int8",
|
||||
compute_type="float16" if device == "cuda" else "int8",
|
||||
local_files_only=False,
|
||||
download_root=model_dir,
|
||||
)
|
||||
|
||||
Loading…
Reference in New Issue
Block a user