Browse Source

faster transcription

KoljaB 9 months ago
parent
commit
94d7437e59
1 changed file with 4 additions and 3 deletions
  1. 4 3
      RealtimeSTT/audio_recorder.py

+ 4 - 3
RealtimeSTT/audio_recorder.py

@@ -160,7 +160,7 @@ class AudioToTextRecorder:
                  initial_prompt: Optional[Union[str, Iterable[int]]] = None,
                  initial_prompt: Optional[Union[str, Iterable[int]]] = None,
                  suppress_tokens: Optional[List[int]] = [-1],
                  suppress_tokens: Optional[List[int]] = [-1],
                  log_transcription_time: bool = False,
                  log_transcription_time: bool = False,
-                 early_transcription_on_silence: bool = True
+                 early_transcription_on_silence: bool = False
                  ):
                  ):
         """
         """
         Initializes an audio recorder and  transcription
         Initializes an audio recorder and  transcription
@@ -343,13 +343,14 @@ class AudioToTextRecorder:
             from the transcription output.
             from the transcription output.
         - log_transcription_time (bool, default=False): Logs processing time
         - log_transcription_time (bool, default=False): Logs processing time
             of main model transcription 
             of main model transcription 
-        - early_transcription_on_silence (bool, default=True):  If True, the
+        - early_transcription_on_silence (bool, default=False):  If True, the
             system will immediately transcribe audio when silence is detected.
             system will immediately transcribe audio when silence is detected.
             If silence lasts longer than post_speech_silence_duration, the 
             If silence lasts longer than post_speech_silence_duration, the 
             recording is stopped, and the transcription is submitted. If 
             recording is stopped, and the transcription is submitted. If 
             voice activity resumes within this period, the transcription 
             voice activity resumes within this period, the transcription 
             is discarded. Results in faster final transcriptions at the cost
             is discarded. Results in faster final transcriptions at the cost
-            of some unnecessary final transcriptions
+            of some unnecessary final transcriptions. Recommended only
+            when transcription occurs fast enough (strong GPU required).
 
 
         Raises:
         Raises:
             Exception: Errors related to initializing transcription
             Exception: Errors related to initializing transcription