Marco-Cheung committed on
Commit
b503d5a
1 Parent(s): 18b1ae7

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +5 -5
app.py CHANGED
@@ -14,11 +14,7 @@ voices = {
14
  device = "cuda:0" if torch.cuda.is_available() else "cpu"
15
 
16
  # load speech translation checkpoint
17
- asr_pipe = pipeline("automatic-speech-recognition", model=ASR_MODEL_NAME, chunk_length_s=10,device=device)
18
- # set the forced ids
19
- #asr_pipe.model.config.forced_decoder_ids = asr_pipe.tokenizer.get_decoder_prompt_ids(language='de', task="transcribe")
20
- asr_pipe.config.forced_decoder_ids = None
21
- asr_pipe.config.suppress_tokens = []
22
 
23
  MULTILINGUAL = True # set True for multilingual models, False for English-only
24
 
@@ -30,6 +26,10 @@ processor = AutoProcessor.from_pretrained("suno/bark-small")
30
  model = BarkModel.from_pretrained("suno/bark-small").to(device)
31
  sampling_rate = model.generation_config.sample_rate
32
 
 
 
 
 
33
  def translate(audio):
34
  outputs = asr_pipe(audio, max_new_tokens=256, generate_kwargs={"task": "translate"})
35
  return outputs["text"]
 
14
  device = "cuda:0" if torch.cuda.is_available() else "cpu"
15
 
16
  # load speech translation checkpoint
17
+ asr_pipe = pipeline("automatic-speech-recognition", model=ASR_MODEL_NAME, chunk_length_s=30,device=device)
 
 
 
 
18
 
19
  MULTILINGUAL = True # set True for multilingual models, False for English-only
20
 
 
26
  model = BarkModel.from_pretrained("suno/bark-small").to(device)
27
  sampling_rate = model.generation_config.sample_rate
28
 
29
+ # set the forced ids
30
+ model.config.forced_decoder_ids = None
31
+ model.config.suppress_tokens = []
32
+
33
  def translate(audio):
34
  outputs = asr_pipe(audio, max_new_tokens=256, generate_kwargs={"task": "translate"})
35
  return outputs["text"]