hace 1 año · b684f9bb6d
--- a/README.md
+++ b/README.md
@@ -3,7 +3,6 @@
 
				 
			
 
				 *Easy-to-use, low-latency speech-to-text library for realtime applications*
			
 
				 
			
 
				-
			
 
				 ## About the Project
			
 
				 
			
 
				 RealtimeSTT listens to the microphone and transcribes voice into text.  
			
@@ -13,15 +12,16 @@ It's ideal for:
 
				 - **Voice Assistants**
			
 
				 - Applications requiring **fast and precise** speech-to-text conversion
			
 
				 
			
 
				+https://github.com/KoljaB/RealtimeSTT/assets/7604638/207cb9a2-4482-48e7-9d2b-0722c3ee6d14
			
 
				+
			
 
				 ### Features
			
 
				 
			
 
				 - **Voice Activity Detection**: Automatically detects when you start and stop speaking.
			
 
				-- **Wake Word Activation**: Only starts transcription upon hearing a specific wake word.
			
 
				 - **Realtime Transcription**: Transforms speech to text in real-time.
			
 
				+- **Wake Word Activation**: Can activate upon detecting a designated wake word.
			
 
				 
			
 
				 > **Hint**: *Check out [RealtimeTTS](https://github.com/KoljaB/RealtimeTTS), the output counterpart of this library, for text-to-voice capabilities. Together, they form a powerful realtime audio wrapper around large language models.*
			
 
				 
			
 
				-
			
 
				 ## Tech Stack
			
 
				 
			
 
				 This library uses:
			
--- a/example_app/install_cpu.bat
+++ b/example_app/install_cpu.bat
@@ -10,4 +10,4 @@ if not exist test_env\Scripts\python.exe (
 
				 )
			
 
				 
			
 
				 echo Activating VENV
			
 
				-start cmd /k "call test_env\Scripts\activate.bat && pip install --upgrade RealtimeSTT==0.1.3 && pip install --upgrade RealtimeTTS==0.1.3 && pip install pysoundfile==0.9.0.post1 openai==0.27.8 keyboard==0.13.5 PyQt5==5.15.9 sounddevice==0.4.6 wavio==0.0.7"
			
 
				+start cmd /k "call test_env\Scripts\activate.bat && pip install --upgrade RealtimeSTT==0.1.4 && pip install --upgrade RealtimeTTS==0.1.3 && pip install pysoundfile==0.9.0.post1 openai==0.27.8 keyboard==0.13.5 PyQt5==5.15.9 sounddevice==0.4.6 wavio==0.0.7"
			
--- a/example_app/install_gpu.bat
+++ b/example_app/install_gpu.bat
@@ -10,4 +10,4 @@ if not exist test_env\Scripts\python.exe (
 
				 )
			
 
				 
			
 
				 echo Activating VENV
			
 
				-start cmd /k "call test_env\Scripts\activate.bat && pip install --upgrade RealtimeSTT==0.1.3 && pip install --upgrade RealtimeTTS==0.1.3 && pip uninstall torch --yes && pip install torch torchvision torchaudio --index-url https://download.pytorch.org/whl/cu118 && pip install pysoundfile==0.9.0.post1 openai==0.27.8 keyboard==0.13.5 PyQt5==5.15.9 sounddevice==0.4.6 wavio==0.0.7"
			
 
				+start cmd /k "call test_env\Scripts\activate.bat && pip install --upgrade RealtimeSTT==0.1.4 && pip install --upgrade RealtimeTTS==0.1.3 && pip uninstall torch --yes && pip install torch torchvision torchaudio --index-url https://download.pytorch.org/whl/cu118 && pip install pysoundfile==0.9.0.post1 openai==0.27.8 keyboard==0.13.5 PyQt5==5.15.9 sounddevice==0.4.6 wavio==0.0.7"
			
--- a/example_app/start.bat
+++ b/example_app/start.bat
@@ -21,4 +21,4 @@ set ELEVENLABS_API_KEY=
 
				 
			
 
				 
			
 
				 echo Activating VENV
			
 
				-start cmd /k "call test_env\Scripts\activate.bat && python VoiceApp.py"
			
 
				+start cmd /k "call test_env\Scripts\activate.bat && python ui_openai_voice_interface.py"