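Update app.py: import sentencepiece and complete the tokenize, generate, and decode calls in translate_to_english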
Browse files
app.py
CHANGED
@@ -1,5 +1,6 @@
|
|
1 |
import logging
|
2 |
from transformers import MarianMTModel, MarianTokenizer
|
|
|
3 |
|
4 |
# Setup logging
|
5 |
logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s')
|
@@ -15,13 +16,13 @@ def translate_to_english(text):
|
|
15 |
model = MarianMTModel.from_pretrained(model_name)
|
16 |
|
17 |
logger.info("Tokenizing text")
|
18 |
-
tokenized_text = tokenizer
|
19 |
|
20 |
logger.info("Performing translation")
|
21 |
-
|
22 |
|
23 |
logger.info("Decoding translation")
|
24 |
-
translated_text = tokenizer.decode(
|
25 |
return translated_text
|
26 |
|
27 |
# Sample Russian text
|
|
|
1 |
import logging
|
2 |
from transformers import MarianMTModel, MarianTokenizer
|
3 |
+
import sentencepiece
|
4 |
|
5 |
# Setup logging
|
6 |
logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s')
|
|
|
16 |
model = MarianMTModel.from_pretrained(model_name)
|
17 |
|
18 |
logger.info("Tokenizing text")
|
19 |
+
tokenized_text = tokenizer(text, return_tensors='pt', padding=True, truncation=True)
|
20 |
|
21 |
logger.info("Performing translation")
|
22 |
+
translated_tokens = model.generate(**tokenized_text)
|
23 |
|
24 |
logger.info("Decoding translation")
|
25 |
+
translated_text = tokenizer.decode(translated_tokens[0], skip_special_tokens=True)
|
26 |
return translated_text
|
27 |
|
28 |
# Sample Russian text
|