Exodia

Sleeping

KleinPenny committed on Sep 13, 2024

Commit

867343a

verified ·

1 Parent(s): 9d03774

Update app.py

Update ASR Module

Files changed (1) hide show

app.py CHANGED Viewed

@@ -4,6 +4,7 @@ from huggingface_hub import InferenceClient
 import os
 import requests
 import scipy.io.wavfile
 client = InferenceClient(
     "meta-llama/Meta-Llama-3-8B-Instruct",
@@ -56,23 +57,22 @@ def process_audio(audio_data):
     else:
         return "Invalid audio data format"
-    # Define the local file path to save the WAV file
-    local_wav_file = "converted_audio.wav"
-    # Save the audio data as a WAV file
-    scipy.io.wavfile.write(local_wav_file, sample_rate, data)
     API_URL = "https://api-inference.huggingface.co/models/openai/whisper-large-v2"
     headers = {"Authorization": f"Bearer {os.getenv('hf_token')}"}
-    def query(filename):
-        with open(filename, "rb") as f:
-            file_data = f.read()
-        response = requests.post(API_URL, headers=headers, data=file_data)
         return response.json()
     # Call the API to process the audio
-    output = query(local_wav_file)
     print(output)

 import os
 import requests
 import scipy.io.wavfile
+import io
 client = InferenceClient(
     "meta-llama/Meta-Llama-3-8B-Instruct",
     else:
         return "Invalid audio data format"
+    # Convert the audio data to WAV format in memory
+    buf = io.BytesIO()
+    scipy.io.wavfile.write(buf, sample_rate, data)
+    wav_bytes = buf.getvalue()
+    buf.close()
     API_URL = "https://api-inference.huggingface.co/models/openai/whisper-large-v2"
     headers = {"Authorization": f"Bearer {os.getenv('hf_token')}"}
+    def query(wav_data):
+        response = requests.post(API_URL, headers=headers, data=wav_data)
         return response.json()
     # Call the API to process the audio
+    output = query(wav_bytes)
     print(output)