pratikshahp committed on
Commit
e63c96b
·
verified ·
1 Parent(s): b74da9a

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +6 -6
app.py CHANGED
@@ -1,16 +1,16 @@
1
  import torch
2
- #from transformers import Wav2Vec2ForCTC, Wav2Vec2Processor
3
- from transformers import Speech2Text2Processor, SpeechEncoderDecoderModel
4
  import streamlit as st
5
  from audio_recorder_streamlit import audio_recorder
6
  import numpy as np
7
 
8
  # Function to transcribe audio to text
9
  def transcribe_audio(audio_bytes):
10
- #processor = Wav2Vec2Processor.from_pretrained("facebook/wav2vec2-base-960h")
11
- processor = Speech2Text2Processor.from_pretrained("facebook/s2t-wav2vec2-large-en-de")
12
- model = SpeechEncoderDecoderModel.from_pretrained("facebook/s2t-wav2vec2-large-en-de")
13
- #model = Wav2Vec2ForCTC.from_pretrained("facebook/wav2vec2-base-960h")
14
 
15
 
16
  # Convert bytes to numpy array
 
1
  import torch
2
+ from transformers import Wav2Vec2ForCTC, Wav2Vec2Processor
3
+ #from transformers import Speech2Text2Processor, SpeechEncoderDecoderModel
4
  import streamlit as st
5
  from audio_recorder_streamlit import audio_recorder
6
  import numpy as np
7
 
8
  # Function to transcribe audio to text
9
  def transcribe_audio(audio_bytes):
10
+ processor = Wav2Vec2Processor.from_pretrained("facebook/wav2vec2-base-960h")
11
+ #processor = Speech2Text2Processor.from_pretrained("facebook/s2t-wav2vec2-large-en-de")
12
+ #model = SpeechEncoderDecoderModel.from_pretrained("facebook/s2t-wav2vec2-large-en-de")
13
+ model = Wav2Vec2ForCTC.from_pretrained("facebook/wav2vec2-base-960h")
14
 
15
 
16
  # Convert bytes to numpy array