fixd
- app.py +13 -13
- logs/sentence_analyzer_2024-12-02.log +18 -0
app.py CHANGED

@@ -28,7 +28,7 @@ def gpu_decorator(func):
 
 # Importing the new F5TTS API
 from f5_tts.api import F5TTS
-from f5_tts.infer.utils_infer import preprocess_ref_audio_text
+from f5_tts.infer.utils_infer import preprocess_ref_audio_text
 
 import os
 from huggingface_hub import hf_hub_download
@@ -51,8 +51,8 @@ def load_f5tts():
     return F5TTS(
         model_type="F5-TTS",  # Adjust the model name if necessary
         ckpt_file=ckpt_path,
-        vocab_file="/home/user/app/data/Emilia_ZH_EN_pinyin/vocab.txt",
-        device="cuda" if torch.cuda.is_available() else "cpu",
+        vocab_file="/home/user/app/data/Emilia_ZH_EN_pinyin/vocab.txt",  # Path to the vocab.txt file
+        device="cuda" if torch.cuda.is_available() else "cpu",  # Select the device
         use_ema=True
     )
 
@@ -84,7 +84,7 @@ def infer(
         last_device = device_test
     if last_ema != use_ema:
         last_ema = use_ema
-    vocab_file = "/home/user/app/data/Emilia_ZH_EN_pinyin/vocab.txt"
+    vocab_file = "/home/user/app/data/Emilia_ZH_EN_pinyin/vocab.txt"
     tts_api = F5TTS(
         model_type=exp_name, ckpt_file=file_checkpoint, vocab_file=vocab_file, device=device_test, use_ema=use_ema
     )
@@ -202,16 +202,16 @@ with gr.Blocks(css=custom_css) as app:
             # Process each chunk
             audio_segments = []
             for chunk in chunks:
-                # Using the correct infer function here
-                audio_file,
-                "Emilia_ZH_EN_pinyin",
-                "/home/user/app/model_1200000.safetensors",
-                "F5-TTS",
+                # Using the correct infer function here, ignoring device_used
+                audio_file, _, seed_used = infer(
+                    "Emilia_ZH_EN_pinyin",  # Replace with your project name
+                    "/home/user/app/model_1200000.safetensors",  # Replace with the path to your checkpoint
+                    "F5-TTS",  # Or "E2-TTS" depending on your model
                     ref_text_input,
                     ref_audio_input,
                     chunk,
                     nfe_slider,
-                True,
+                    True,  # use_ema - adjust if necessary
                     speed_slider,
                     seed_input,
                     remove_silence,
@@ -253,8 +253,8 @@ with gr.Blocks(css=custom_css) as app:
         ],
         outputs=[
             audio_output,
-            ref_text_input,
-            seed_output,
+            ref_text_input,
+            seed_output,
         ],
     )
 
@@ -279,4 +279,4 @@ if __name__ == "__main__":
     if not USING_SPACES:
         main()
     else:
-        app.queue().launch()
+        app.queue().launch()
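The heart of this fix is the per-chunk call into infer() in the @@ -202 hunk above: the return value is now unpacked so that the device actually used is discarded and the seed is kept. Below is a minimal sketch of that calling pattern, assuming infer() and the Gradio input values from app.py are in scope; the synthesize_chunks wrapper name and the collection of results are illustrative only, and the argument list stops where the hunk does.

def synthesize_chunks(chunks, ref_text_input, ref_audio_input,
                      nfe_slider, speed_slider, seed_input, remove_silence):
    # Collect one generated audio file per text chunk.
    audio_segments = []
    seed_used = None
    for chunk in chunks:
        # Call infer() and ignore its second return value (the device used).
        audio_file, _, seed_used = infer(
            "Emilia_ZH_EN_pinyin",                       # project / vocab name
            "/home/user/app/model_1200000.safetensors",  # checkpoint path
            "F5-TTS",                                    # or "E2-TTS"
            ref_text_input,
            ref_audio_input,
            chunk,
            nfe_slider,
            True,                                        # use_ema
            speed_slider,
            seed_input,
            remove_silence,
            # ...remaining arguments continue past the end of the hunk above
        )
        audio_segments.append(audio_file)
    return audio_segments, seed_used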
logs/sentence_analyzer_2024-12-02.log CHANGED

@@ -26,3 +26,21 @@
 2024-12-02 19:25:59,990 - SentenceAnalyzer - INFO - SentenceAnalyzer initialized successfully
 2024-12-02 19:28:56,156 - SentenceAnalyzer - DEBUG - Logger set up successfully
 2024-12-02 19:28:56,156 - SentenceAnalyzer - INFO - SentenceAnalyzer initialized successfully
+2024-12-02 19:30:06,733 - SentenceAnalyzer - DEBUG - Logger set up successfully
+2024-12-02 19:30:06,734 - SentenceAnalyzer - INFO - SentenceAnalyzer initialized successfully
+2024-12-02 19:30:28,918 - SentenceAnalyzer - DEBUG - Starting sentence splitting
+2024-12-02 19:30:28,918 - SentenceAnalyzer - DEBUG - Normalized text using NFC
+2024-12-02 19:30:28,919 - SentenceAnalyzer - DEBUG - Removed page numbers and chapter titles
+2024-12-02 19:30:28,919 - SentenceAnalyzer - DEBUG - Replaced hyphenated line breaks
+2024-12-02 19:30:28,919 - SentenceAnalyzer - DEBUG - Replaced multiple newlines with a space
+2024-12-02 19:30:28,919 - SentenceAnalyzer - DEBUG - Normalized whitespace
+2024-12-02 19:30:28,941 - SentenceAnalyzer - DEBUG - Split text into 1 sentences using NLTK
+2024-12-02 19:30:28,941 - SentenceAnalyzer - INFO - Split text into 1 sentences after cleanup
+2024-12-02 19:31:01,028 - SentenceAnalyzer - DEBUG - Starting sentence splitting
+2024-12-02 19:31:01,028 - SentenceAnalyzer - DEBUG - Normalized text using NFC
+2024-12-02 19:31:01,029 - SentenceAnalyzer - DEBUG - Removed page numbers and chapter titles
+2024-12-02 19:31:01,029 - SentenceAnalyzer - DEBUG - Replaced hyphenated line breaks
+2024-12-02 19:31:01,029 - SentenceAnalyzer - DEBUG - Replaced multiple newlines with a space
+2024-12-02 19:31:01,029 - SentenceAnalyzer - DEBUG - Normalized whitespace
+2024-12-02 19:31:01,051 - SentenceAnalyzer - DEBUG - Split text into 1 sentences using NLTK
+2024-12-02 19:31:01,051 - SentenceAnalyzer - INFO - Split text into 1 sentences after cleanup