Spaces:
Running
on
CPU Upgrade
Running
on
CPU Upgrade
Update app.py
Browse files
app.py
CHANGED
@@ -1,11 +1,13 @@
|
|
1 |
import gradio as gr
|
2 |
from transformers import AutoModelForSeq2SeqLM, AutoTokenizer
|
|
|
3 |
import fasttext
|
4 |
|
5 |
# Initialize fastText model
|
6 |
-
model_path = 'lid.323.ftz'
|
7 |
-
language_model = fasttext.load_model(model_path)
|
8 |
|
|
|
9 |
model_path_translation = "anzorq/m2m100_418M_ft_ru-kbd_44K"
|
10 |
tgt_lang="zu"
|
11 |
|
@@ -14,7 +16,7 @@ model = AutoModelForSeq2SeqLM.from_pretrained(model_path_translation, use_safete
|
|
14 |
|
15 |
def translate(text, num_beams=4, num_return_sequences=4):
|
16 |
# Detect language
|
17 |
-
languages, _ = language_model.predict(text, k=1)
|
18 |
detected_language = languages[0].replace("__label__", "")
|
19 |
|
20 |
inputs = tokenizer(text, return_tensors="pt")
|
|
|
1 |
import gradio as gr
|
2 |
from transformers import AutoModelForSeq2SeqLM, AutoTokenizer
|
3 |
+
from huggingface_hub import hf_hub_download
|
4 |
import fasttext
|
5 |
|
6 |
# Initialize fastText model
|
7 |
+
# model_path = 'lid.323.ftz'
|
8 |
+
# language_model = fasttext.load_model(model_path)
|
9 |
|
10 |
+
lid_model = fasttext.load_model(hf_hub_download("facebook/fasttext-language-identification", "model.bin"))
|
11 |
model_path_translation = "anzorq/m2m100_418M_ft_ru-kbd_44K"
|
12 |
tgt_lang="zu"
|
13 |
|
|
|
16 |
|
17 |
def translate(text, num_beams=4, num_return_sequences=4):
|
18 |
# Detect language
|
19 |
+
languages, _ = lid_model.predict(text, k=1)
|
20 |
detected_language = languages[0].replace("__label__", "")
|
21 |
|
22 |
inputs = tokenizer(text, return_tensors="pt")
|