-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathtranslation.py
More file actions
31 lines (24 loc) · 1.21 KB
/
translation.py
File metadata and controls
31 lines (24 loc) · 1.21 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
from transformers import MarianMTModel, MarianTokenizer
# Step 1 of the round-trip demo: translate Arabic text to English with the
# Marian checkpoint named below (the "ar-en" suffix indicates Arabic -> English).
model_name = "Helsinki-NLP/opus-mt-ar-en"
src_text = ["ذهب الرئيس پوتن إلى القصر الرئاسي في العاصمة كييڤ"]

tokenizer = MarianTokenizer.from_pretrained(model_name)
model = MarianMTModel.from_pretrained(model_name)

# Tokenize the whole batch in one call: padded, returned as PyTorch tensors.
encoded_batch = tokenizer(src_text, return_tensors="pt", padding=True)
translated = model.generate(**encoded_batch)

# Decode each generated sequence and glue the sentences together with spaces.
# NOTE: despite its name, translated_text_to_AR holds the *output* of the
# ar -> en model (i.e. English text); the name is kept because later code in
# this file reads it.
translated_text_to_AR = ' '.join(
    tokenizer.decode(token_ids, skip_special_tokens=True)
    for token_ids in translated
)
print('translated_text_to_AR: ',translated_text_to_AR)
# NOTE(review): the sample output listed below does not appear to correspond
# to src_text (one sentence in, two unrelated lines listed) -- it looks like a
# leftover from another example; confirm and replace with the real output.
# expected output:
# Just follow your heart.
# Wayne Rahi Dosh?
from transformers import MarianTokenizer, MarianMTModel
# Step 2 of the round-trip demo: translate the English text produced above
# back to Arabic with the Marian checkpoint named below.
mname = "marefa-nlp/marefa-mt-en-ar"
tokenizer = MarianTokenizer.from_pretrained(mname)
model = MarianMTModel.from_pretrained(mname)

# English sample text: the output of the earlier Arabic -> English step.
# (Named english_text rather than `input` so the builtin is not shadowed.)
english_text = translated_text_to_AR

# Call the tokenizer directly instead of the deprecated
# `prepare_seq2seq_batch`; padding/truncation are passed explicitly to keep
# the behaviour that helper applied by default.
encoded_batch = tokenizer(
    [english_text],
    return_tensors="pt",
    padding=True,
    truncation=True,
)
translated_tokens = model.generate(**encoded_batch)

# One decoded string per generated sequence (a single-element list here).
translated_text = [
    tokenizer.decode(token_ids, skip_special_tokens=True)
    for token_ids in translated_tokens
]

# Translated Arabic text
print('translated_text: ',translated_text)
# Sample Arabic output for reference (this is also the original source
# sentence of the round trip; actual model output may differ):
# ذهب الرئيس پوتن إلى القصر الرئاسي في العاصمة كييڤ