2 jaren geleden · cd3e70dbbc
--- a/.github/workflows/docker.yml
+++ b/.github/workflows/docker.yml
@@ -34,7 +34,9 @@ jobs:
 
				           context: .
			
 
				           platforms: linux/amd64,linux/arm64
			
 
				           push: true
			
 
				-          tags: ftcaplan/matrix-stt-bot:latest
			
 
				+          tags: ftcaplan/matrix-stt-bot:tiny
			
 
				+          build-args: |
			
 
				+            "PRELOAD_MODEL=tiny"
			
 
				       -
			
 
				         name: Build and push
			
 
				         uses: docker/build-push-action@v2
			
@@ -42,9 +44,7 @@ jobs:
 
				           context: .
			
 
				           platforms: linux/amd64,linux/arm64
			
 
				           push: true
			
 
				-          tags: ftcaplan/matrix-stt-bot:tiny
			
 
				-          build-args: |
			
 
				-            "PRELOAD_MODEL=tiny"
			
 
				+          tags: ftcaplan/matrix-stt-bot:latest
			
 
				       -
			
 
				         name: Build and push
			
 
				         uses: docker/build-push-action@v2
			
--- a/main.py
+++ b/main.py
@@ -23,7 +23,7 @@ config.ignore_unverified_devices = True
 
				 config.store_path = '/data/crypto_store/'
			
 
				 bot = botlib.Bot(creds, config)
			
 
				 
			
 
				-asr = ASR(os.getenv('ASR_MODEL', 'tiny'), os.getenv('ASR_LANGUAGE', 'en'))
			
 
				+asr = ASR(os.getenv('ASR_MODEL', os.getenv('PRELOAD_MODEL', 'tiny')), os.getenv('ASR_LANGUAGE', 'en'))
			
 
				 
			
 
				 @bot.listener.on_custom_event(nio.RoomMessage)
			
 
				 async def on_message(room, event):
			
--- a/speech_recognition.py
+++ b/speech_recognition.py
@@ -3,7 +3,6 @@ import ffmpeg
 
				 import asyncio
			
 
				 import subprocess
			
 
				 import os
			
 
				-import shutil
			
 
				 
			
 
				 SAMPLE_RATE = 16000
			
 
				 
			
@@ -37,19 +36,20 @@ class ASR():
 
				     self.model = model
			
 
				     self.language = language
			
 
				 
			
 
				-    if not os.path.exists("/data/models"):
			
 
				-      os.mkdir("/data/models")
			
 
				-    self.model_path = f"/data/models/ggml-{model}.bin"
			
 
				+    if os.path.exists(f"/app/ggml-model-whisper-{model}.bin"):
			
 
				+      self.model_path = f"/app/ggml-model-whisper-{model}.bin"
			
 
				+    else:
			
 
				+      self.model_path = f"/data/models/ggml-{model}.bin"
			
 
				+      if not os.path.exists("/data/models"):
			
 
				+        os.mkdir("/data/models")
			
 
				+        
			
 
				     self.model_url = f"https://ggml.ggerganov.com/ggml-model-whisper-{self.model}.bin"
			
 
				     self.lock = asyncio.Lock()
			
 
				 
			
 
				   def load_model(self):
			
 
				     if not os.path.exists(self.model_path) or os.path.getsize(self.model_path) == 0:
			
 
				-      print("Fetching model...")
			
 
				-      if os.path.exists(f"ggml-model-whisper-{self.model}.bin"):
			
 
				-        shutil.copy(f"ggml-model-whisper-{self.model}.bin", self.model_path)
			
 
				-      else:
			
 
				-        subprocess.run(["wget", self.model_url, "-O", self.model_path], check=True)
			
 
				+      print("Downloading model...")
			
 
				+      subprocess.run(["wget", self.model_url, "-O", self.model_path], check=True)
			
 
				       print("Done.")
			
 
				 
			
 
				   async def transcribe(self, audio: bytes) -> str: