File size: 865 Bytes
4a2c972
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
# src/translator.py — Multilingual translation using Hugging Face MarianMT

from transformers import MarianMTModel, MarianTokenizer

class Translator:
    def __init__(self, src_lang="en", tgt_lang="fr"):
        model_name = f"Helsinki-NLP/opus-mt-{src_lang}-{tgt_lang}"
        self.tokenizer = MarianTokenizer.from_pretrained(model_name)
        self.model = MarianMTModel.from_pretrained(model_name)

    def translate(self, text):
        inputs = self.tokenizer(text, return_tensors="pt", padding=True)
        translated = self.model.generate(**inputs)
        return self.tokenizer.decode(translated[0], skip_special_tokens=True)


if __name__ == "__main__":
    translator = Translator(src_lang="en", tgt_lang="es")
    text = "Hello, how are you?"
    print(f"Original: {text}")
    print(f"Translated: {translator.translate(text)}")