Spaces:

katospiegel
/

amanu

Runtime error

App Files Files Community

katospiegel committed on Oct 19, 2023

Commit

9dba6bb

1 Parent(s): 2cce248

method for creating the final text

Browse files

Files changed (2) hide show

app.py +3 -2
helpers.py +41 -0

app.py CHANGED Viewed

@@ -88,7 +88,7 @@ def transcribeWhisperX(audiofile, model, language, patiente,
     #     write_srt(result_aligned["segments"], file=srt)
     ###########################################################################
-    return audio_path, audio_normalized_path, vocal_path, novocal_path, vocal_path, guardar_dataframe_en_csv(diarize_segments), json.dumps(result_speakers)
 transcribeI = gr.Interface(
@@ -133,7 +133,8 @@ transcribeII = gr.Interface(
              gr.Audio(type="filepath", label="normalized"),
              gr.Audio(type="filepath", label="vocal"),
              gr.Audio(type="filepath", label="no_vocal"),
-            gr.File(label="Archivo SRT generado"),
              gr.File(label="Tabla con diarización generada"),
              gr.JSON(label="JSON Output"),
              #gr.JSON(label="JSON Output"),

     #     write_srt(result_aligned["segments"], file=srt)
     ###########################################################################
+    return audio_path, audio_normalized_path, vocal_path, novocal_path, vocal_path, str(file_path.stem), guardar_dataframe_en_csv(diarize_segments), json.dumps(result_speakers)
 transcribeI = gr.Interface(
              gr.Audio(type="filepath", label="normalized"),
              gr.Audio(type="filepath", label="vocal"),
              gr.Audio(type="filepath", label="no_vocal"),
+             gr.File(label="Archivo SRT generado"),
+             gr.File(label="Archivo CSV generado"),
              gr.File(label="Tabla con diarización generada"),
              gr.JSON(label="JSON Output"),
              #gr.JSON(label="JSON Output"),

helpers.py CHANGED Viewed

@@ -38,3 +38,44 @@ def dataframe_a_lista(df):
     lista_strings = df_str.apply(lambda row: ' '.join(row), axis=1).tolist()
     return lista_strings

     lista_strings = df_str.apply(lambda row: ' '.join(row), axis=1).tolist()
     return lista_strings
def generar_transcripcion(dataframe):
    """Build a per-speaker transcript from ``dataframe`` and save it to a file.

    The rows are sorted by the ``Timestamp`` column and the ``text`` values
    are grouped by ``speaker``. One line is produced per speaker, in order of
    first appearance after sorting, formatted as
    ``"<timestamp> - <speaker>: <texts>"``. The timestamp is the one of the
    speaker's earliest row, and the speaker's texts are joined with single
    spaces.

    Args:
        dataframe: DataFrame providing ``Timestamp``, ``speaker`` and
            ``text`` columns. The ``text`` values must be strings, since they
            are combined with ``str.join``.

    Returns:
        The value returned by ``guardar_en_archivo`` for the list of
        transcript lines (presumably the name of the written file; confirm
        against that helper).
    """
    # Sort chronologically so each speaker's texts are collected in order and
    # the first row seen for a speaker carries their earliest timestamp.
    dataframe = dataframe.sort_values(by='Timestamp')

    # Texts collected per speaker; dict insertion order keeps the speakers in
    # order of first appearance.
    textos_por_speaker = {}
    # Timestamp of the first row of each speaker. Previously the line was
    # built with the loop variable left over from the last row, so every
    # speaker was stamped with the final timestamp of the whole table.
    primer_timestamp = {}
    for _, row in dataframe.iterrows():
        speaker = row['speaker']
        if speaker not in textos_por_speaker:
            textos_por_speaker[speaker] = []
            primer_timestamp[speaker] = row['Timestamp']
        textos_por_speaker[speaker].append(row['text'])

    # One paragraph per speaker, prefixed with their first timestamp.
    lineas_transcripcion = [
        f"{primer_timestamp[speaker]} - {speaker}: {' '.join(textos)}"
        for speaker, textos in textos_por_speaker.items()
    ]

    # Persist the transcript and hand back whatever the helper reports.
    nombre_archivo = guardar_en_archivo(lineas_transcripcion)
    return nombre_archivo