salomonsky committed on
Commit
85e8a86
·
verified ·
1 Parent(s): 7a4f83c

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +7 -8
app.py CHANGED
@@ -1,10 +1,10 @@
1
  import streamlit as st
2
  import torch
3
  import numpy as np
4
- from transformers import Wav2Vec2Processor, Wav2Vec2ForCTC
5
  import pyaudio
6
- import sounddevice as sd
7
- from TTS.api import TTS
 
8
 
9
  class VoiceAssistant:
10
  def __init__(self):
@@ -12,9 +12,6 @@ class VoiceAssistant:
12
  self.processor = Wav2Vec2Processor.from_pretrained("facebook/wav2vec2-large-xlsr-53-spanish")
13
  self.model = Wav2Vec2ForCTC.from_pretrained("facebook/wav2vec2-large-xlsr-53-spanish")
14
 
15
- # Cargar modelo TTS para síntesis de voz en español (modelo corregido)
16
- self.tts_model = TTS(model_name="microsoft/speecht5_tts", progress_bar=False)
17
-
18
  # Parámetros de audio
19
  self.sample_rate = 16000
20
  self.chunk_size = 480
@@ -66,8 +63,10 @@ class VoiceAssistant:
66
  return "Respuesta generada para: " + text
67
 
68
  def text_to_speech(self, text):
69
- output_path = "response.wav"
70
- self.tts_model.tts_to_file(text=text, file_path=output_path)
 
 
71
  return output_path
72
 
73
  def run(self):
 
1
  import streamlit as st
2
  import torch
3
  import numpy as np
 
4
  import pyaudio
5
+ from transformers import Wav2Vec2Processor, Wav2Vec2ForCTC
6
+ from gtts import gTTS
7
+ import os
8
 
9
  class VoiceAssistant:
10
  def __init__(self):
 
12
  self.processor = Wav2Vec2Processor.from_pretrained("facebook/wav2vec2-large-xlsr-53-spanish")
13
  self.model = Wav2Vec2ForCTC.from_pretrained("facebook/wav2vec2-large-xlsr-53-spanish")
14
 
 
 
 
15
  # Parámetros de audio
16
  self.sample_rate = 16000
17
  self.chunk_size = 480
 
63
  return "Respuesta generada para: " + text
64
 
65
  def text_to_speech(self, text):
66
+ # Usar gTTS para convertir texto a voz
67
+ tts = gTTS(text=text, lang='es')
68
+ output_path = "response.mp3"
69
+ tts.save(output_path)
70
  return output_path
71
 
72
  def run(self):