Spaces:
Runtime error
+ choosing model size
Browse files
app.py
CHANGED
@@ -11,9 +11,11 @@ AUTO_DETECT_LANG = "Auto Detect"
|
|
11 |
def transcribe(audio, state={}, model_size='base', delay=1.2, lang=None, translate=False):
|
12 |
time.sleep(delay - 1)
|
13 |
|
|
|
|
|
14 |
if model_size != current_size:
|
15 |
-
model = whisper.load_model(model_size)
|
16 |
current_size = model_size
|
|
|
17 |
|
18 |
transcription = model.transcribe(
|
19 |
audio,
|
@@ -35,11 +37,11 @@ def transcribe(audio, state={}, model_size='base', delay=1.2, lang=None, transla
|
|
35 |
|
36 |
|
37 |
title = "OpenAI's Whisper Real-time Demo"
|
38 |
-
description = "A simple demo of OpenAI's [**Whisper**](https://github.com/openai/whisper) speech recognition model."
|
39 |
|
40 |
model_size = gr.Dropdown(label="Model size", choices=['base', 'tiny', 'small', 'medium', 'large'], value='base')
|
41 |
|
42 |
-
delay_slider = gr.inputs.Slider(minimum=1, maximum=5, default=1.2, label="Rate of transcription
|
43 |
|
44 |
available_languages = sorted(tokenizer.TO_LANGUAGE_CODE.keys())
|
45 |
available_languages = [lang.capitalize() for lang in available_languages]
|
|
|
11 |
def transcribe(audio, state={}, model_size='base', delay=1.2, lang=None, translate=False):
|
12 |
time.sleep(delay - 1)
|
13 |
|
14 |
+
global current_size
|
15 |
+
global model
|
16 |
if model_size != current_size:
|
|
|
17 |
current_size = model_size
|
18 |
+
model = whisper.load_model(current_size)
|
19 |
|
20 |
transcription = model.transcribe(
|
21 |
audio,
|
|
|
37 |
|
38 |
|
39 |
title = "OpenAI's Whisper Real-time Demo"
|
40 |
+
description = "A simple demo of OpenAI's [**Whisper**](https://github.com/openai/whisper) speech recognition model. This demo runs on a CPU. For faster inference choose 'tiny' model size and set the language explicitly."
|
41 |
|
42 |
model_size = gr.Dropdown(label="Model size", choices=['base', 'tiny', 'small', 'medium', 'large'], value='base')
|
43 |
|
44 |
+
delay_slider = gr.inputs.Slider(minimum=1, maximum=5, default=1.2, label="Rate of transcription")
|
45 |
|
46 |
available_languages = sorted(tokenizer.TO_LANGUAGE_CODE.keys())
|
47 |
available_languages = [lang.capitalize() for lang in available_languages]
|