# FinalTrans / app.py
# shahpalash10's picture
# Update app.py
# 24992c5
# raw
# history blame
# 2.39 kB
import streamlit as st
from transformers import pipeline
from gtts import gTTS
import speech_recognition as sr
import pyaudio
# Streamlit script: record a short English utterance from the default
# microphone, transcribe it with Google Speech Recognition, translate the
# transcript to Hindi, and play the translation back as synthesized speech.

# Recording parameters for the raw PyAudio capture.
SAMPLE_RATE = 16000            # samples per second
CHUNK_FRAMES = 1024            # frames read from the stream per call
RECORD_SECONDS = 5             # adjust the recording duration as needed
SAMPLE_FORMAT = pyaudio.paInt16
SAMPLE_WIDTH = pyaudio.get_sample_size(SAMPLE_FORMAT)  # bytes per sample

# Create a translation pipeline
pipe = pipeline('translation', model='Helsinki-NLP/opus-mt-en-hi')

# Initialize the SpeechRecognition recognizer
recognizer = sr.Recognizer()

# Placeholder for a single status message. st.empty() keeps only the most
# recent element written to it, so it is used for status updates only; the
# transcript, translation and audio player are rendered in the normal page
# flow below so they are not overwritten by one another.
audio_input = st.empty()

# PyAudio handle and stream are created only when recording is requested,
# so reruns with the checkbox unticked do not allocate audio resources.
p = None
stream = None

# Check if the microphone input is requested
if st.checkbox("Use Microphone for English Input"):
    audio_input.warning("Listening for audio input... Speak in English.")
    try:
        # Open the audio stream (mono, 16-bit PCM)
        p = pyaudio.PyAudio()
        stream = p.open(
            format=SAMPLE_FORMAT,
            channels=1,
            rate=SAMPLE_RATE,
            input=True,
            frames_per_buffer=CHUNK_FRAMES,
        )

        # Capture a fixed-length recording, one chunk at a time.
        chunk_count = int(SAMPLE_RATE / CHUNK_FRAMES * RECORD_SECONDS)
        frames = b"".join(stream.read(CHUNK_FRAMES) for _ in range(chunk_count))

        # recognize_google() requires an AudioData instance, not raw bytes,
        # so wrap the PCM data together with its rate and sample width.
        audio = sr.AudioData(frames, SAMPLE_RATE, SAMPLE_WIDTH)

        # Recognize the English speech
        english_text = recognizer.recognize_google(audio, language='en')
        audio_input.success("Audio input recorded. Translating...")

        # Translate the English text to Hindi
        out = pipe(english_text, src_lang='en', tgt_lang='hi')

        # Extract the translation
        translation_text = out[0]['translation_text']
        st.text(f"English Input: {english_text}")
        st.text(f"Hindi Translation: {translation_text}")

        # Convert the translated text to speech
        tts = gTTS(translation_text, lang='hi')
        tts.save("translated_audio.mp3")

        # Display the audio player for listening to the speech
        st.audio("translated_audio.mp3", format='audio/mp3')
    except sr.RequestError as e:
        audio_input.error(f"Could not request results from Google Speech Recognition service: {e}")
    except sr.UnknownValueError:
        audio_input.warning("Speech recognition could not understand the audio.")
    finally:
        # Clean up audio resources. The PyAudio instance is terminated even
        # when opening the stream failed and `stream` is still None.
        if stream is not None:
            stream.stop_stream()
            stream.close()
        if p is not None:
            p.terminate()