moro23 committed on
Commit
900aeb7
·
1 Parent(s): deeb5cc

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -2
app.py CHANGED
@@ -12,7 +12,7 @@ nltk.download("punkt")
12
  #model_name = "moro23/wav2vec-large-xls-r-300-ha-colab_4"
13
  #tokenizer = Wav2Vec2Tokenizer.from_pretrained(model_name, use_auth_token=token_value)
14
  #tokenizer = Wav2Vec2Processor.from_pretrained(model_name, use_auth_token=token_value)
15
- #model = Wav2Vec2ForCTC.from_pretrained(model_name, use_auth_token=token_value)
16
 
17
  def load_data(input_file):
18
 
@@ -37,7 +37,8 @@ def asr_transcript(input_file):
37
  #Tokenize
38
  input_dict = tokenizer(speech, return_tensors="pt", padding=True)
39
  #Take logits
40
- logits = model(input_dict.input_values.to("cuda").logits
 
41
  #Take argmax
42
  predicted_ids = torch.argmax(logits, dim=-1)[0]
43
  #Get the words from predicted word ids
 
12
  #model_name = "moro23/wav2vec-large-xls-r-300-ha-colab_4"
13
  #tokenizer = Wav2Vec2Tokenizer.from_pretrained(model_name, use_auth_token=token_value)
14
  #tokenizer = Wav2Vec2Processor.from_pretrained(model_name, use_auth_token=token_value)
15
+ #model = Wav2Vec2ForCTC.from_pretrained(model_name, use_auth_token=token_value).to("cuda")
16
 
17
  def load_data(input_file):
18
 
 
37
  #Tokenize
38
  input_dict = tokenizer(speech, return_tensors="pt", padding=True)
39
  #Take logits
40
+ logits = model(input_dict.input_values.to("cuda")).logits
41
+
42
  #Take argmax
43
  predicted_ids = torch.argmax(logits, dim=-1)[0]
44
  #Get the words from predicted word ids