Spaces:
Sleeping
Sleeping
Tried using Tswana-to-English as a substitute for Sesotho-to-English
Browse files
app.py
CHANGED
@@ -13,6 +13,8 @@ model = AutoModelForSeq2SeqLM.from_pretrained("souvorinkg/eng-ses-nllb", token=F
|
|
13 |
# tokenizer_kin_to_en = AutoTokenizer.from_pretrained("souvorinkg/eng-ses-nllb", token=False, src_lang="kin_Latn", tgt_lang="eng_Latn")
|
14 |
|
15 |
tokenizer_en_to_ses = AutoTokenizer.from_pretrained("souvorinkg/eng-ses-nllb", token=False, src_lang="eng_Latn", tgt_lang="ses_Latn")
|
|
|
|
|
16 |
|
17 |
|
18 |
# Define the translation function for English to Kinyarwanda
|
@@ -30,10 +32,10 @@ tokenizer_en_to_ses = AutoTokenizer.from_pretrained("souvorinkg/eng-ses-nllb", t
|
|
30 |
def translate_en_to_ses(SourceText):
|
31 |
inputs = tokenizer_en_to_ses(SourceText, return_tensors="pt")
|
32 |
translated_tokens = model.generate(**inputs, max_length=30)
|
33 |
-
return
|
34 |
|
35 |
def translate_ses_to_en(SourceText):
|
36 |
-
inputs = inputs =
|
37 |
translated_tokens = model.generate(**inputs, max_length=30)
|
38 |
return tokenizer_en_to_ses.batch_decode(translated_tokens, skip_special_tokens=True)[0]
|
39 |
|
@@ -50,8 +52,8 @@ def translate(SourceText, direction):
|
|
50 |
# return translate_kin_to_en(SourceText)
|
51 |
if direction == "English to Sesotho":
|
52 |
return translate_en_to_ses(SourceText)
|
53 |
-
|
54 |
-
|
55 |
# if direction == "English to Tswana":
|
56 |
# return translate == translate_en_to_tsn(SourceText)
|
57 |
|
|
|
13 |
# tokenizer_kin_to_en = AutoTokenizer.from_pretrained("souvorinkg/eng-ses-nllb", token=False, src_lang="kin_Latn", tgt_lang="eng_Latn")
|
14 |
|
15 |
tokenizer_en_to_ses = AutoTokenizer.from_pretrained("souvorinkg/eng-ses-nllb", token=False, src_lang="eng_Latn", tgt_lang="ses_Latn")
|
16 |
+
tokenizer_tsn_to_eng = AutoTokenizer.from_pretrained("souvorinkg/eng-ses-nllb", token=False, src_lang="tsn_Latn", tgt_lang="eng_Latn")
|
17 |
+
|
18 |
|
19 |
|
20 |
# Define the translation function for English to Kinyarwanda
|
|
|
32 |
def translate_en_to_ses(SourceText):
    """Translate English text to Sesotho using the module-level model.

    The text is encoded with ``tokenizer_en_to_ses`` and the generated ids
    are decoded with that same tokenizer, so the encode and decode steps of
    this direction no longer depend on the Tswana-to-English tokenizer.

    Args:
        SourceText: The text to translate.

    Returns:
        The first decoded sequence, with special tokens stripped.
    """
    tokenizer = tokenizer_en_to_ses
    inputs = tokenizer(SourceText, return_tensors="pt")
    # max_length=30 bounds the generated output, so long inputs may come
    # back truncated.
    # NOTE(review): no forced_bos_token_id is passed; presumably the
    # fine-tuned checkpoint emits the intended target language on its own --
    # confirm against the model's generation config.
    translated_tokens = model.generate(**inputs, max_length=30)
    return tokenizer.batch_decode(translated_tokens, skip_special_tokens=True)[0]
|
36 |
|
37 |
def translate_ses_to_en(SourceText):
    """Translate Sesotho text to English using the module-level model.

    The input is encoded with ``tokenizer_tsn_to_eng`` (source language
    ``tsn_Latn``): Tswana is used here as a stand-in source language for
    Sesotho. The generated ids are decoded with the same tokenizer so the
    encode and decode steps of this direction stay paired.

    Args:
        SourceText: The text to translate.

    Returns:
        The first decoded sequence, with special tokens stripped.
    """
    tokenizer = tokenizer_tsn_to_eng
    inputs = tokenizer(SourceText, return_tensors="pt")
    # max_length=30 bounds the generated output, so long inputs may come
    # back truncated.
    # NOTE(review): no forced_bos_token_id is passed; presumably the
    # fine-tuned checkpoint produces English for this input on its own --
    # confirm, otherwise force the "eng_Latn" token as the first output.
    translated_tokens = model.generate(**inputs, max_length=30)
    return tokenizer.batch_decode(translated_tokens, skip_special_tokens=True)[0]
|
41 |
|
|
|
52 |
# return translate_kin_to_en(SourceText)
|
53 |
if direction == "English to Sesotho":
|
54 |
return translate_en_to_ses(SourceText)
|
55 |
+
if direction == "Sesotho to English":
|
56 |
+
return translate_ses_to_en(SourceText)
|
57 |
# if direction == "English to Tswana":
|
58 |
# return translate == translate_en_to_tsn(SourceText)
|
59 |
|