diff --git a/openlrc/defaults.py b/openlrc/defaults.py index 3e8438b..215cff1 100644 --- a/openlrc/defaults.py +++ b/openlrc/defaults.py @@ -34,11 +34,10 @@ # Check https://github.com/guillaumekln/faster-whisper/blob/3b4a6aa1c22d293ddde9f08bdd31fc842086a6ea/faster_whisper/vad.py#L14 for details default_vad_options = { - "threshold": 0.382, + "threshold": 0.15001, "min_speech_duration_ms": 250, "max_speech_duration_s": float("inf"), "min_silence_duration_ms": 2000, - "window_size_samples": 1024, "speech_pad_ms": 400, } diff --git a/pyproject.toml b/pyproject.toml index 9b1191a..0846bf1 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -56,7 +56,7 @@ filetype = "^1.2.0" jaconvV2 = "^0.4" spacy = "^3.5.4" pysbd = "^0.3.4" -faster-whisper = "^1.0.0" +faster-whisper = "^1.0.3" soundfile = "^0.12.1" ffmpeg-normalize = "^1.27.5" deepfilternet = "^0.5.6"