From c2bf036234c3c9d2520f6223878f7fb61dcf4531 Mon Sep 17 00:00:00 2001
From: Mahmoud Ashraf
Date: Wed, 13 Nov 2024 16:07:46 +0200
Subject: [PATCH] change `language_detection_threshold` default value (#1134)

---
 faster_whisper/transcribe.py | 7 ++-----
 1 file changed, 2 insertions(+), 5 deletions(-)

diff --git a/faster_whisper/transcribe.py b/faster_whisper/transcribe.py
index 199bb09..0918328 100644
--- a/faster_whisper/transcribe.py
+++ b/faster_whisper/transcribe.py
@@ -692,7 +692,7 @@ class WhisperModel:
         clip_timestamps: Union[str, List[float]] = "0",
         hallucination_silence_threshold: Optional[float] = None,
         hotwords: Optional[str] = None,
-        language_detection_threshold: Optional[float] = None,
+        language_detection_threshold: Optional[float] = 0.5,
         language_detection_segments: int = 1,
     ) -> Tuple[Iterable[Segment], TranscriptionInfo]:
         """Transcribes an input file.
@@ -882,10 +882,7 @@ class WhisperModel:
                     ]
                     # Get top language token and probability
                     language, language_probability = all_language_probs[0]
-                    if (
-                        language_detection_threshold is None
-                        or language_probability > language_detection_threshold
-                    ):
+                    if language_probability > language_detection_threshold:
                         break
                     detected_language_info.setdefault(language, []).append(
                         language_probability