Spaces:
Runtime error
Runtime error
Update app.py
Browse files
app.py
CHANGED
@@ -195,16 +195,20 @@ def process_speech(input_language, audio_input):
|
|
195 |
return f"{e}"
|
196 |
|
197 |
|
198 |
-
def
|
199 |
-
|
200 |
-
return
|
|
|
|
|
201 |
|
|
|
202 |
client = Client("https://facebook-seamless-m4t.hf.space/--replicas/8cllp/")
|
203 |
|
204 |
try:
|
|
|
205 |
result = client.predict(
|
206 |
"T2ST",
|
207 |
-
"text",
|
208 |
None,
|
209 |
None,
|
210 |
input_text,
|
@@ -212,44 +216,31 @@ def convert_text_to_speech(input_text: str, source_language: str, target_languag
|
|
212 |
target_language,
|
213 |
api_name="/run"
|
214 |
)
|
215 |
-
except Exception as e:
|
216 |
-
return None, f"Error during prediction: {str(e)}"
|
217 |
|
218 |
-
|
|
|
|
|
|
|
219 |
translated_text = ""
|
220 |
audio_file_path = ""
|
221 |
|
|
|
222 |
if result:
|
223 |
for item in result:
|
224 |
if isinstance(item, str):
|
225 |
-
if item
|
226 |
-
|
|
|
|
|
227 |
else:
|
|
|
228 |
translated_text += item + " "
|
229 |
-
except Exception as e:
|
230 |
-
return None, f"Error processing result: {str(e)}"
|
231 |
|
232 |
-
|
233 |
-
return None, "No audio file path found in the result."
|
234 |
|
235 |
-
|
236 |
-
|
237 |
-
|
238 |
-
def process_image(image_input):
|
239 |
-
# Initialize the Gradio client with the URL of the Gradio server
|
240 |
-
client = Client("https://adept-fuyu-8b-demo.hf.space/--replicas/pqjvl/")
|
241 |
-
|
242 |
-
# Assuming image_input is a URL path to the image
|
243 |
-
image_path = image_input
|
244 |
-
|
245 |
-
# Call the predict method of the client
|
246 |
-
result = client.predict(
|
247 |
-
image_path, # URL of the image
|
248 |
-
True, # Additional parameter for the server (e.g., enable detailed captioning)
|
249 |
-
fn_index=2
|
250 |
-
)
|
251 |
-
|
252 |
-
return result
|
253 |
|
254 |
|
255 |
def query_vectara(text):
|
|
|
195 |
return f"{e}"
|
196 |
|
197 |
|
198 |
+
def is_base64(s):
|
199 |
+
try:
|
200 |
+
return base64.b64encode(base64.b64decode(s)) == s.encode()
|
201 |
+
except Exception:
|
202 |
+
return False
|
203 |
|
204 |
+
def convert_text_to_speech(input_text: str, source_language: str, target_language: str) -> tuple[str, str]:
|
205 |
client = Client("https://facebook-seamless-m4t.hf.space/--replicas/8cllp/")
|
206 |
|
207 |
try:
|
208 |
+
# Make a prediction request to the client
|
209 |
result = client.predict(
|
210 |
"T2ST",
|
211 |
+
"text", # Since we are doing text-to-speech
|
212 |
None,
|
213 |
None,
|
214 |
input_text,
|
|
|
216 |
target_language,
|
217 |
api_name="/run"
|
218 |
)
|
|
|
|
|
219 |
|
220 |
+
# Print or log the raw API response for inspection
|
221 |
+
print("Raw API Response:", result)
|
222 |
+
|
223 |
+
# Initialize variables
|
224 |
translated_text = ""
|
225 |
audio_file_path = ""
|
226 |
|
227 |
+
# Process the result
|
228 |
if result:
|
229 |
for item in result:
|
230 |
if isinstance(item, str):
|
231 |
+
# Check if the item is a URL pointing to an audio file or a base64 encoded string
|
232 |
+
if any(ext in item.lower() for ext in ['.mp3', '.wav', '.ogg']) or is_base64(item):
|
233 |
+
if not audio_file_path: # Store only the first audio file path or base64 string
|
234 |
+
audio_file_path = item
|
235 |
else:
|
236 |
+
# Concatenate the translated text
|
237 |
translated_text += item + " "
|
|
|
|
|
238 |
|
239 |
+
return audio_file_path, translated_text.strip()
|
|
|
240 |
|
241 |
+
except Exception as e:
|
242 |
+
print(f"Error in text-to-speech conversion: {str(e)}")
|
243 |
+
return None, f"Error in text-to-speech conversion: {str(e)}"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
244 |
|
245 |
|
246 |
def query_vectara(text):
|