File size: 913 Bytes
45bcbb5
7925ce4
45bcbb5
 
 
 
 
7925ce4
45bcbb5
 
7925ce4
45bcbb5
 
c6d6c95
45bcbb5
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
import functools

from transformers import MarianMTModel, MarianTokenizer

@functools.lru_cache(maxsize=4)
def _load_marian(model_name):
    """Load the MarianMT model and tokenizer for *model_name*, memoized.

    The cache is bounded so that only a handful of language pairs are kept
    in memory at once; a failed load raises and is not cached.
    """
    model = MarianMTModel.from_pretrained(model_name)
    tokenizer = MarianTokenizer.from_pretrained(model_name)
    return model, tokenizer


def translate_text(input_text, source_lang="en", target_lang="hi"):
    """Translate *input_text* with a Helsinki-NLP MarianMT checkpoint.

    Args:
        input_text: The text to translate.
        source_lang: Language code of the input; used to build the
            checkpoint name ``Helsinki-NLP/opus-mt-{source}-{target}``.
        target_lang: Language code of the desired output.

    Returns:
        The decoded translation with special tokens stripped. An empty or
        whitespace-only string is returned as ``""`` without loading a model.

    Raises:
        Whatever ``from_pretrained`` raises when no checkpoint exists for the
        requested language pair.
    """
    # Nothing to translate: skip the (expensive) model load and avoid having
    # the model generate arbitrary text from an input with no content.
    if isinstance(input_text, str) and not input_text.strip():
        return ""

    model_name = f'Helsinki-NLP/opus-mt-{source_lang}-{target_lang}'
    # Reuse an already-loaded model/tokenizer instead of reloading per call.
    model, tokenizer = _load_marian(model_name)

    # Calling the tokenizer (rather than ``encode``) also yields the attention
    # mask; ``truncation=True`` asks it to clip over-long input to the
    # tokenizer's configured maximum length instead of failing in the model.
    batch = tokenizer(input_text, return_tensors="pt", truncation=True)

    # Generate the translation and decode the first (only) sequence.
    translation_ids = model.generate(**batch)
    return tokenizer.decode(translation_ids[0], skip_special_tokens=True)

if __name__ == "__main__":
    # Demo run: translate one sample sentence using translate_text's
    # default language arguments, then show the input next to the output.
    sample = "Hello, how are you?"
    result = translate_text(sample)

    print(f"Input Text: {sample}")
    print(f"Translated Text: {result}")