|
import gradio as gr |
|
from transformers import pipeline |
|
import json |
|
import re |
|
|
|
|
|
with open('phrase_mappings.json', 'r') as f: |
|
phrase_mapping = json.load(f) |
|
|
|
|
|
class UnifiedTranslator: |
|
def __init__(self, model_name, phrase_mapping): |
|
self.model = pipeline("translation", model=model_name) |
|
self.phrase_mapping = phrase_mapping |
|
|
|
def translate(self, text): |
|
|
|
text_lower = text.lower().strip() |
|
|
|
|
|
print(f"Input text: {text_lower}") |
|
|
|
|
|
for pattern, translation in self.phrase_mapping.items(): |
|
try: |
|
|
|
|
|
pattern_regex = re.compile( |
|
re.escape(pattern).replace(r"\{name\}", r"([\w'-]+)").strip(), |
|
re.IGNORECASE |
|
) |
|
match = pattern_regex.fullmatch(text_lower) |
|
if match: |
|
|
|
if '{name}' in pattern: |
|
return translation.format(name=match.group(1)) |
|
else: |
|
return translation |
|
except re.error as e: |
|
print(f"Regex error with pattern {pattern}: {e}") |
|
|
|
|
|
try: |
|
translation = self.model(text)[0] |
|
return translation['translation_text'] |
|
except Exception as e: |
|
print(f"Model translation error: {e}") |
|
return "Translation error occurred" |
|
|
|
|
|
translator = UnifiedTranslator("Bildad/Swahili-English_Translation", phrase_mapping) |
|
|
|
|
|
def translate_text(text): |
|
return translator.translate(text) |
|
|
|
iface = gr.Interface( |
|
fn=translate_text, |
|
inputs="text", |
|
outputs="text", |
|
title="Swahili-English Translation", |
|
description="Translate Swahili to English with custom phrase mappings." |
|
) |
|
|
|
|
|
iface.launch(share=True) |
|
|