Spaces:

Shubham09
/

samplewhisper

Runtime error

Shubham09 committed on Dec 5, 2022

Commit

cb420c2

1 Parent(s): 93ad2c2

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -8,9 +8,9 @@ nltk.download("punkt")
 model_name = "Shubham09/whisper31filescheck"
-processor = WhisperProcessor.from_pretrained(model_name)
-tokenizer = WhisperTokenizer.from_pretrained(model_name)
-model = WhisperForConditionalGeneration.from_pretrained(model_name,decoder_input_ids)
 def load_data(input_file):
@@ -33,14 +33,14 @@ def asr_transcript(input_file):
   speech = load_data(input_file)
   #Tokenize
-  input_features = processor(speech, return_tensors="pt").input_features  #, padding="longest" , return_tensors="pt"
   #input_values = tokenizer(speech, return_tensors="pt").input_values
   #Take logits
   logits = model(input_features).logits
   #Take argmax
   predicted_ids = torch.argmax(logits, dim=-1)
   #Get the words from predicted word ids
-  transcription = processor.batch_decode(predicted_ids[0])
   #Correcting the letter casing
   #transcription = correct_casing(transcription.lower())
   return transcription

 model_name = "Shubham09/whisper31filescheck"
+processor = WhisperProcessor.from_pretrained(model_name,task="transcribe")
+#tokenizer = WhisperTokenizer.from_pretrained(model_name)
+model = WhisperForConditionalGeneration.from_pretrained(model_name)
 def load_data(input_file):
   speech = load_data(input_file)
   #Tokenize
+  input_features = processor(speech).input_features  #, padding="longest" , return_tensors="pt"
   #input_values = tokenizer(speech, return_tensors="pt").input_values
   #Take logits
   logits = model(input_features).logits
   #Take argmax
   predicted_ids = torch.argmax(logits, dim=-1)
   #Get the words from predicted word ids
+  transcription = processor.batch_decode(predicted_ids)
   #Correcting the letter casing
   #transcription = correct_casing(transcription.lower())
   return transcription