anzorq committed on
Commit
be21142
·
1 Parent(s): bf34975

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +5 -3
app.py CHANGED
@@ -1,11 +1,13 @@
1
  import gradio as gr
2
  from transformers import AutoModelForSeq2SeqLM, AutoTokenizer
 
3
  import fasttext
4
 
5
  # Initialize fastText model
6
- model_path = 'lid.323.ftz'
7
- language_model = fasttext.load_model(model_path)
8
 
 
9
  model_path_translation = "anzorq/m2m100_418M_ft_ru-kbd_44K"
10
  tgt_lang="zu"
11
 
@@ -14,7 +16,7 @@ model = AutoModelForSeq2SeqLM.from_pretrained(model_path_translation, use_safete
14
 
15
  def translate(text, num_beams=4, num_return_sequences=4):
16
  # Detect language
17
- languages, _ = language_model.predict(text, k=1)
18
  detected_language = languages[0].replace("__label__", "")
19
 
20
  inputs = tokenizer(text, return_tensors="pt")
 
1
  import gradio as gr
2
  from transformers import AutoModelForSeq2SeqLM, AutoTokenizer
3
+ from huggingface_hub import hf_hub_download
4
  import fasttext
5
 
6
  # Initialize fastText model
7
+ # model_path = 'lid.323.ftz'
8
+ # language_model = fasttext.load_model(model_path)
9
 
10
+ lid_model = fasttext.load_model(hf_hub_download("facebook/fasttext-language-identification", "model.bin"))
11
  model_path_translation = "anzorq/m2m100_418M_ft_ru-kbd_44K"
12
  tgt_lang="zu"
13
 
 
16
 
17
  def translate(text, num_beams=4, num_return_sequences=4):
18
  # Detect language
19
+ languages, _ = lid_model.predict(text, k=1)
20
  detected_language = languages[0].replace("__label__", "")
21
 
22
  inputs = tokenizer(text, return_tensors="pt")