Fralet committed on
Commit
6b8e76a
·
verified ·
1 Parent(s): b95583d

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +4 -3
app.py CHANGED
@@ -1,5 +1,6 @@
1
  import logging
2
  from transformers import MarianMTModel, MarianTokenizer
 
3
 
4
  # Setup logging
5
  logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s')
@@ -15,13 +16,13 @@ def translate_to_english(text):
15
  model = MarianMTModel.from_pretrained(model_name)
16
 
17
  logger.info("Tokenizing text")
18
- tokenized_text = tokenizer.prepare_seq2seq_batch([text], return_tensors='pt')
19
 
20
  logger.info("Performing translation")
21
- translation = model.generate(**tokenized_text)
22
 
23
  logger.info("Decoding translation")
24
- translated_text = tokenizer.decode(translation[0], skip_special_tokens=True)
25
  return translated_text
26
 
27
  # Sample Russian text
 
1
  import logging
2
  from transformers import MarianMTModel, MarianTokenizer
3
+ import sentencepiece
4
 
5
  # Setup logging
6
  logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s')
 
16
  model = MarianMTModel.from_pretrained(model_name)
17
 
18
  logger.info("Tokenizing text")
19
+ tokenized_text = tokenizer(text, return_tensors='pt', padding=True, truncation=True)
20
 
21
  logger.info("Performing translation")
22
+ translated_tokens = model.generate(**tokenized_text)
23
 
24
  logger.info("Decoding translation")
25
+ translated_text = tokenizer.decode(translated_tokens[0], skip_special_tokens=True)
26
  return translated_text
27
 
28
  # Sample Russian text