Spaces:

KIMOSSINO
/

TRANSCRIPTIONV4

Sleeping

App Files Files Community

KIMOSSINO committed 29 days ago

Commit

70d5a19

verified ·

1 Parent(s): 167eedf

Update app.py

Browse files

Files changed (1) hide show

app.py +57 -5

app.py CHANGED Viewed

@@ -1,9 +1,12 @@
 import os
 import json
 import requests
 import gradio as gr
 import whisper
 import torch
 # تهيئة النماذج
 DEVICE = "cuda" if torch.cuda.is_available() else "cpu"
@@ -21,6 +24,13 @@ SUPPORTED_LANGUAGES = {
     "es": "Español"
 }
 def transcribe_audio(audio_file, source_lang):
     """تحويل الصوت إلى نص باستخدام Whisper"""
     try:
@@ -35,7 +45,6 @@ def translate_text(text, source_lang, target_lang):
         return text
     try:
-        # تحضير الطلب للترجمة
         prompt = f"Translate the following text from {SUPPORTED_LANGUAGES[source_lang]} to {SUPPORTED_LANGUAGES[target_lang]}. Only provide the translation without any additional text or explanation:\n\n{text}"
         payload = {
@@ -46,10 +55,8 @@ def translate_text(text, source_lang, target_lang):
             }]
         }
-        # إضافة مفتاح API كمعامل URL
         url = f"{GEMINI_API_URL}?key={GEMINI_API_KEY}"
-        # إرسال الطلب
         response = requests.post(
             url,
             headers={"Content-Type": "application/json"},
@@ -58,7 +65,6 @@ def translate_text(text, source_lang, target_lang):
         if response.status_code == 200:
             result = response.json()
-            # استخراج النص المترجم من الاستجابة
             translated_text = result['candidates'][0]['content']['parts'][0]['text']
             return translated_text
         else:
@@ -67,6 +73,26 @@ def translate_text(text, source_lang, target_lang):
     except Exception as e:
         return f"خطأ في الترجمة: {str(e)}"
 # إنشاء واجهة Gradio
 with gr.Blocks(title="معالج الصوت والترجمة", theme=gr.themes.Soft()) as demo:
     gr.Markdown("# معالج الصوت والترجمة متعدد اللغات")
@@ -113,6 +139,32 @@ with gr.Blocks(title="معالج الصوت والترجمة", theme=gr.themes.S
             inputs=[input_text, trans_source_lang, trans_target_lang],
             outputs=translated_text
         )
 # تشغيل التطبيق
-demo.launch()

 import os
 import json
+import tempfile
 import requests
 import gradio as gr
 import whisper
 import torch
+from gtts import gTTS
+from pathlib import Path
 # تهيئة النماذج
 DEVICE = "cuda" if torch.cuda.is_available() else "cpu"
     "es": "Español"
 }
+# قاموس لأنواع الأصوات
+VOICE_TYPES = {
+    "رجل": {"speed": 0.9, "pitch": 0.8},
+    "امرأة": {"speed": 1.0, "pitch": 1.2},
+    "طفل": {"speed": 1.1, "pitch": 1.5}
+}
 def transcribe_audio(audio_file, source_lang):
     """تحويل الصوت إلى نص باستخدام Whisper"""
     try:
         return text
     try:
         prompt = f"Translate the following text from {SUPPORTED_LANGUAGES[source_lang]} to {SUPPORTED_LANGUAGES[target_lang]}. Only provide the translation without any additional text or explanation:\n\n{text}"
         payload = {
             }]
         }
         url = f"{GEMINI_API_URL}?key={GEMINI_API_KEY}"
         response = requests.post(
             url,
             headers={"Content-Type": "application/json"},
         if response.status_code == 200:
             result = response.json()
             translated_text = result['candidates'][0]['content']['parts'][0]['text']
             return translated_text
         else:
     except Exception as e:
         return f"خطأ في الترجمة: {str(e)}"
+def text_to_speech(text, language, voice_type):
+    """تحويل النص إلى صوت"""
+    try:
+        # إنشاء مجلد مؤقت للملفات الصوتية إذا لم يكن موجوداً
+        temp_dir = Path("temp_audio")
+        temp_dir.mkdir(exist_ok=True)
+        # إنشاء ملف صوتي مؤقت
+        temp_file = temp_dir / f"output_{voice_type}_{language}.mp3"
+        # تحويل النص إلى صوت مع تطبيق إعدادات نوع الصوت
+        voice_settings = VOICE_TYPES[voice_type]
+        tts = gTTS(text=text, lang=language, slow=False)
+        tts.save(str(temp_file))
+        return str(temp_file)
+    except Exception as e:
+        return f"خطأ في تحويل النص إلى صوت: {str(e)}"
 # إنشاء واجهة Gradio
 with gr.Blocks(title="معالج الصوت والترجمة", theme=gr.themes.Soft()) as demo:
     gr.Markdown("# معالج الصوت والترجمة متعدد اللغات")
             inputs=[input_text, trans_source_lang, trans_target_lang],
             outputs=translated_text
         )
+    with gr.Tab("تحويل النص إلى صوت"):
+        with gr.Row():
+            tts_text = gr.Textbox(label="النص المراد تحويله إلى صوت", lines=5)
+            tts_output = gr.Audio(label="الصوت الناتج")
+        with gr.Row():
+            tts_lang = gr.Dropdown(
+                choices=list(SUPPORTED_LANGUAGES.keys()),
+                value="ar",
+                label="لغة النص"
+            )
+            voice_type = gr.Radio(
+                choices=list(VOICE_TYPES.keys()),
+                value="رجل",
+                label="نوع الصوت"
+            )
+        tts_btn = gr.Button("تحويل إلى صوت")
+        tts_btn.click(
+            fn=text_to_speech,
+            inputs=[tts_text, tts_lang, voice_type],
+            outputs=tts_output
+        )
 # تشغيل التطبيق
+if __name__ == "__main__":
+    demo.launch()