11 maanden geleden · 0856319583
--- a/Dockerfile
+++ b/Dockerfile
@@ -21,14 +21,14 @@ CMD ["python3", "example_browserclient/server.py"]
 
				 
			
 
				 # --------------------------------------------
			
 
				 
			
 
				-FROM ubuntu22.04 as cpu
			
 
				+FROM ubuntu:22.04 as cpu
			
 
				 
			
 
				 WORKDIR /app
			
 
				 
			
 
				 RUN apt-get update -y && \
			
 
				   apt-get install -y python3 python3-pip portaudio19-dev
			
 
				 
			
 
				-RUN pip3 install torch==2.2.2+cu118 torchaudio==2.2.2 --index-url https://download.pytorch.org/whl/cu118
			
 
				+RUN pip3 install torch==2.3.0 torchaudio==2.3.0
			
 
				 
			
 
				 COPY requirements.txt /app/requirements.txt
			
 
				 RUN pip3 install -r /app/requirements.txt
			
@@ -36,4 +36,4 @@ RUN pip3 install -r /app/requirements.txt
 
				 EXPOSE 9001
			
 
				 ENV PYTHONPATH "${PYTHONPATH}:/app"
			
 
				 RUN export PYTHONPATH="${PYTHONPATH}:/app"
			
 
				-CMD ["python3", "example_browserclient/server.py"]
			
 
				+CMD ["python3", "example_browserclient/server.py"]
			
--- a/RealtimeSTT/audio_recorder.py
+++ b/RealtimeSTT/audio_recorder.py
@@ -443,7 +443,7 @@ class AudioToTextRecorder:
 
				         # Set device for model
			
 
				         self.device = "cuda" if self.device == "cuda" and torch.cuda.is_available() else "cpu"
			
 
				 
			
 
				-        self.transcript_process = mp.Process(
			
 
				+        self.transcript_process = self._start_thread(
			
 
				             target=AudioToTextRecorder._transcription_worker,
			
 
				             args=(
			
 
				                 child_transcription_pipe,
			
@@ -459,7 +459,6 @@ class AudioToTextRecorder:
 
				                 self.suppress_tokens
			
 
				             )
			
 
				         )
			
 
				-        self.transcript_process.start()
			
 
				 
			
 
				         # Start audio data reading process
			
 
				         if self.use_microphone.value:
			
@@ -468,7 +467,7 @@ class AudioToTextRecorder:
 
				                          f" sample rate: {self.sample_rate}"
			
 
				                          f" buffer size: {self.buffer_size}"
			
 
				                          )
			
 
				-            self.reader_process = mp.Process(
			
 
				+            self.reader_process = self._start_thread(
			
 
				                 target=AudioToTextRecorder._audio_data_worker,
			
 
				                 args=(
			
 
				                     self.audio_queue,
			
@@ -480,7 +479,6 @@ class AudioToTextRecorder:
 
				                     self.use_microphone
			
 
				                 )
			
 
				             )
			
 
				-            self.reader_process.start()
			
 
				 
			
 
				         # Initialize the realtime transcription model
			
 
				         if self.enable_realtime_transcription:
			
@@ -642,13 +640,36 @@ class AudioToTextRecorder:
 
				         self.realtime_thread = threading.Thread(target=self._realtime_worker)
			
 
				         self.realtime_thread.daemon = True
			
 
				         self.realtime_thread.start()
			
 
				-
			
 
				+                   
			
 
				         # Wait for transcription models to start
			
 
				         logging.debug('Waiting for main transcription model to start')
			
 
				         self.main_transcription_ready_event.wait()
			
 
				         logging.debug('Main transcription model ready')
			
 
				 
			
 
				         logging.debug('RealtimeSTT initialization completed successfully')
			
 
				+                   
			
 
				+    def _start_thread(self, target=None, args=()):
				+        """
				+        Start a worker using one consistent concurrency model for the library.
				+
				+        On Linux the worker runs in a daemon `threading.Thread`; on all other
				+        platforms it runs in the pytorch MultiProcessing library 'Process'
				+        (`mp.Process`). The worker is already started when it is returned,
				+        so callers must not call `start()` on it again.
				+
				+        Args:
				+            target (callable object): is the callable object to be invoked by
				+              the run() method. Defaults to None, meaning nothing is called.
				+            args (tuple): is a list or tuple of arguments for the target
				+              invocation. Defaults to ().
				+
				+        Returns:
				+            The started `threading.Thread` (Linux) or `mp.Process` (any other
				+            platform).
				+        """
				+        if platform.system() == 'Linux':
				+            worker = threading.Thread(target=target, args=args)
				+            # The attribute must be spelled `daemon`; a misspelled name is
				+            # silently stored as an unused attribute and leaves the thread
				+            # non-daemon, which can keep the interpreter alive at exit.
				+            worker.daemon = True
				+        else:
				+            worker = mp.Process(target=target, args=args)
				+        worker.start()
				+        return worker
			
 
				 
			
 
				     @staticmethod
			
 
				     def _transcription_worker(conn,