Marco-Cheung
committed on
Commit
•
b503d5a
1
Parent(s):
18b1ae7
Update app.py
Browse files
app.py
CHANGED
@@ -14,11 +14,7 @@ voices = {
|
|
14 |
device = "cuda:0" if torch.cuda.is_available() else "cpu"
|
15 |
|
16 |
# load speech translation checkpoint
|
17 |
-
asr_pipe = pipeline("automatic-speech-recognition", model=ASR_MODEL_NAME, chunk_length_s=
|
18 |
-
# set the forced ids
|
19 |
-
#asr_pipe.model.config.forced_decoder_ids = asr_pipe.tokenizer.get_decoder_prompt_ids(language='de', task="transcribe")
|
20 |
-
asr_pipe.config.forced_decoder_ids = None
|
21 |
-
asr_pipe.config.suppress_tokens = []
|
22 |
|
23 |
MULTILINGUAL = True # set True for multilingual models, False for English-only
|
24 |
|
@@ -30,6 +26,10 @@ processor = AutoProcessor.from_pretrained("suno/bark-small")
|
|
30 |
model = BarkModel.from_pretrained("suno/bark-small").to(device)
|
31 |
sampling_rate = model.generation_config.sample_rate
|
32 |
|
|
|
|
|
|
|
|
|
33 |
def translate(audio):
|
34 |
outputs = asr_pipe(audio, max_new_tokens=256, generate_kwargs={"task": "translate"})
|
35 |
return outputs["text"]
|
|
|
14 |
device = "cuda:0" if torch.cuda.is_available() else "cpu"
|
15 |
|
16 |
# load speech translation checkpoint
|
17 |
+
asr_pipe = pipeline("automatic-speech-recognition", model=ASR_MODEL_NAME, chunk_length_s=30,device=device)
|
|
|
|
|
|
|
|
|
18 |
|
19 |
MULTILINGUAL = True # set True for multilingual models, False for English-only
|
20 |
|
|
|
26 |
model = BarkModel.from_pretrained("suno/bark-small").to(device)
|
27 |
sampling_rate = model.generation_config.sample_rate
|
28 |
|
29 |
+
# set the forced ids
|
30 |
+
model.config.forced_decoder_ids = None
|
31 |
+
model.config.suppress_tokens = []
|
32 |
+
|
33 |
def translate(audio):
|
34 |
outputs = asr_pipe(audio, max_new_tokens=256, generate_kwargs={"task": "translate"})
|
35 |
return outputs["text"]
|