anzorq committed on
Commit
58e3099
·
1 Parent(s): 503cf0f

Create README.md

Browse files
Files changed (1) hide show
  1. README.md +31 -0
README.md ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ### Inference
2
+
3
+ ```bash
4
+ pip install transformers sentencepiece
5
+ ```
6
+
7
+ ```Python
8
+ from transformers import AutoModelForSeq2SeqLM, AutoTokenizer
9
+
10
+ model_path = "anzorq/m2m100_1.2B_ft_ru-kbd_50K"
11
+ tgt_lang="zu"
12
+
13
+ tokenizer = AutoTokenizer.from_pretrained('facebook/m2m100_1.2B')
14
+ model = AutoModelForSeq2SeqLM.from_pretrained(model_path)
15
+ model.to('cuda')
16
+
17
+ def translate(text, num_beams=4, num_return_sequences=4):
18
+     inputs = tokenizer(text, return_tensors="pt")
19
+     inputs.to('cuda')
20
+     num_return_sequences = min(num_return_sequences, num_beams)
21
+
22
+     translated_tokens = model.generate(
23
+         **inputs,
24
+         forced_bos_token_id=tokenizer.lang_code_to_id[tgt_lang],
25
+         num_beams=num_beams,
26
+         num_return_sequences=num_return_sequences
27
+     )
28
+
29
+     translations = [tokenizer.decode(translation, skip_special_tokens=True) for translation in translated_tokens]
30
+     return translations
31
+ ```