Spaces:

utkarsh-dixit
/

WhisperFusion

Paused

App Files Files Community

makaveli10 committed on Dec 20, 2023

Commit

456c9bb

1 Parent(s): a291214

add whisper bot client

Browse files

Files changed (2) hide show

whisper_live/__version__.py +0 -1
whisper_live/client.py +27 -12

whisper_live/__version__.py DELETED Viewed

	@@ -1 +0,0 @@
1	- __version__="0.0.9"

whisper_live/client.py CHANGED Viewed

@@ -50,7 +50,7 @@ class Client:
     INSTANCES = {}
     def __init__(
-        self, host=None, port=None, is_multilingual=False, lang=None, translate=False
     ):
         """
         Initializes a Client instance for audio recording and streaming to a server.
@@ -66,7 +66,7 @@ class Client:
             lang (str, optional): The selected language for transcription when multilingual is disabled. Default is None.
             translate (bool, optional): Specifies if the task is translation. Default is False.
         """
-        self.chunk = 1024
         self.format = pyaudio.paInt16
         self.channels = 1
         self.rate = 16000
@@ -80,7 +80,9 @@ class Client:
         self.last_response_recieved = None
         self.disconnect_if_no_response_for = 15
         self.multilingual = is_multilingual
-        self.language = lang if is_multilingual else "en"
         if translate:
             self.task = "translate"
@@ -140,11 +142,16 @@ class Client:
             print("[ERROR]: invalid client uid")
             return
-        if "status" in message.keys() and message["status"] == "WAIT":
-            self.waiting = True
-            print(
-                f"[INFO]:Server is full. Estimated wait time {round(message['message'])} minutes."
-            )
         if "message" in message.keys() and message["message"] == "DISCONNECT":
             print("[INFO]: Server overtime disconnected.")
@@ -162,11 +169,18 @@ class Client:
             )
             return
         if "segments" not in message.keys():
             return
         message = message["segments"]
         text = []
         if len(message):
             for seg in message:
                 if text and text[-1] == seg["text"]:
@@ -213,6 +227,7 @@ class Client:
                     "multilingual": self.multilingual,
                     "language": self.language,
                     "task": self.task,
                 }
             )
         )
@@ -497,8 +512,8 @@ class TranscriptionClient:
         transcription_client()
         ```
     """
-    def __init__(self, host, port, is_multilingual=False, lang=None, translate=False):
-        self.client = Client(host, port, is_multilingual, lang, translate)
     def __call__(self, audio=None, hls_url=None):
         """
@@ -514,10 +529,10 @@ class TranscriptionClient:
         """
         print("[INFO]: Waiting for server ready ...")
         while not self.client.recording:
-            if self.client.waiting:
                 self.client.close_websocket()
                 return
-            pass
         print("[INFO]: Server Ready!")
         if hls_url is not None:
             self.client.process_hls_stream(hls_url)

     INSTANCES = {}
     def __init__(
+        self, host=None, port=None, is_multilingual=False, lang=None, translate=False, model_size="small"
     ):
         """
         Initializes a Client instance for audio recording and streaming to a server.
             lang (str, optional): The selected language for transcription when multilingual is disabled. Default is None.
             translate (bool, optional): Specifies if the task is translation. Default is False.
         """
+        self.chunk = 1024 * 3
         self.format = pyaudio.paInt16
         self.channels = 1
         self.rate = 16000
         self.last_response_recieved = None
         self.disconnect_if_no_response_for = 15
         self.multilingual = is_multilingual
+        self.language = lang
+        self.model_size = model_size
+        self.server_error = False
         if translate:
             self.task = "translate"
             print("[ERROR]: invalid client uid")
             return
+        if "status" in message.keys():
+            if message["status"] == "WAIT":
+                self.waiting = True
+                print(
+                    f"[INFO]:Server is full. Estimated wait time {round(message['message'])} minutes."
+                )
+            elif message["status"] == "ERROR":
+                print(f"Message from Server: {message['message']}")
+                self.server_error = True
+            return
         if "message" in message.keys() and message["message"] == "DISCONNECT":
             print("[INFO]: Server overtime disconnected.")
             )
             return
+        if "llm_output" in message.keys():
+            print("LLM output: ")
+            for item in message["llm_output"]:
+                print(item)
         if "segments" not in message.keys():
             return
         message = message["segments"]
         text = []
+        print(message)
         if len(message):
             for seg in message:
                 if text and text[-1] == seg["text"]:
                     "multilingual": self.multilingual,
                     "language": self.language,
                     "task": self.task,
+                    "model_size": self.model_size,
                 }
             )
         )
         transcription_client()
         ```
     """
+    def __init__(self, host, port, is_multilingual=False, lang=None, translate=False, model_size="small"):
+        self.client = Client(host, port, is_multilingual, lang, translate, model_size)
     def __call__(self, audio=None, hls_url=None):
         """
         """
         print("[INFO]: Waiting for server ready ...")
         while not self.client.recording:
+            if self.client.waiting or self.client.server_error:
                 self.client.close_websocket()
                 return
         print("[INFO]: Server Ready!")
         if hls_url is not None:
             self.client.process_hls_stream(hls_url)