Spaces:

ixxan
/

uyghur-speech-models

Running

Irpan committed 12 days ago

Commit

ed17acd

•

1 Parent(s): b1dd882

asr

Files changed (5) hide show

app.py CHANGED Viewed

@@ -9,7 +9,7 @@ mms_transcribe = gr.Interface(
         gr.Audio(),
         gr.Dropdown(
             choices=[model for model in asr.models_info] + ["Compare All Models"],
-            label="Select Model for ASR",
             value="ixxan/wav2vec2-large-mms-1b-uyghur-latin",
             interactive=True
         ),
@@ -18,12 +18,11 @@ mms_transcribe = gr.Interface(
         gr.Textbox(label="Uyghur Arabic Transcription"),
         gr.Textbox(label="Uyghur Latin Transcription"),
     ],
-    #examples=ASR_EXAMPLES,
     title="Speech-to-text",
     description=(
         "Transcribe Uyghur speech audio from a microphone or input file."
     ),
-    #article=ASR_NOTE,
     allow_flagging="never",
 )
@@ -33,7 +32,7 @@ mms_synthesize = gr.Interface(
         gr.Text(label="Input text"),
         gr.Dropdown(
             choices=[model for model in tts.models_info],
-            label="Select Model for TTS",
             value="Meta-MMS",
             interactive=True
         )
@@ -43,7 +42,9 @@ mms_synthesize = gr.Interface(
     ],
     examples=util.tts_examples,
     title="Text-to-speech",
-    description=("Generate audio from input text."),
     allow_flagging="never",
 )

         gr.Audio(),
         gr.Dropdown(
             choices=[model for model in asr.models_info] + ["Compare All Models"],
+            label="Select a Model for ASR",
             value="ixxan/wav2vec2-large-mms-1b-uyghur-latin",
             interactive=True
         ),
         gr.Textbox(label="Uyghur Arabic Transcription"),
         gr.Textbox(label="Uyghur Latin Transcription"),
     ],
+    examples=util.asr_examples,
     title="Speech-to-text",
     description=(
         "Transcribe Uyghur speech audio from a microphone or input file."
     ),
     allow_flagging="never",
 )
         gr.Text(label="Input text"),
         gr.Dropdown(
             choices=[model for model in tts.models_info],
+            label="Select a Model for TTS",
             value="Meta-MMS",
             interactive=True
         )
     ],
     examples=util.tts_examples,
     title="Text-to-speech",
+    description=(
+        "Generate audio from input Uyghur text."
+        ),
     allow_flagging="never",
 )

examples/.DS_Store ADDED Viewed

Binary file (6.15 kB). View file

examples/1.wav ADDED Viewed

Binary file (221 kB). View file

examples/2.wav ADDED Viewed

Binary file (184 kB). View file

util.py CHANGED Viewed

@@ -4,6 +4,9 @@ from umsc import UgMultiScriptConverter
 ug_arab_to_latn = UgMultiScriptConverter('UAS', 'ULS')
 ug_latn_to_arab = UgMultiScriptConverter('ULS', 'UAS')
 tts_examples = [
     ["مەكتەپكە بارغاندا تېخىمۇ بىلىملىك بولۇمەن.", "Meta-MMS"],
     ["قىلىچ قان تامغۇزسا، بەگ ئەل ئالىدۇ؛ قەلەمدىن سىياھتانسا، ئالتۇن كېلىدۇ.", "Meta-MMS"],

 ug_arab_to_latn = UgMultiScriptConverter('UAS', 'ULS')
 ug_latn_to_arab = UgMultiScriptConverter('ULS', 'UAS')
+asr_examples = [['examples/1.wav', 'ixxan/wav2vec2-large-mms-1b-uyghur-latin'],
+                ['examples/2.wav', 'ixxan/wav2vec2-large-mms-1b-uyghur-latin']]
 tts_examples = [
     ["مەكتەپكە بارغاندا تېخىمۇ بىلىملىك بولۇمەن.", "Meta-MMS"],
     ["قىلىچ قان تامغۇزسا، بەگ ئەل ئالىدۇ؛ قەلەمدىن سىياھتانسا، ئالتۇن كېلىدۇ.", "Meta-MMS"],