blackhole33 committed on
Commit
5e430a5
·
verified ·
1 Parent(s): d979361

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +48 -3
README.md CHANGED
@@ -1,3 +1,48 @@
1
- ---
2
- license: apache-2.0
3
- ---
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: apache-2.0
3
+ datasets:
4
+ - booba-uz/translation-dataset-250k
5
+ language:
6
+ - en
7
+ - uz
8
+ metrics:
9
+ - bleu 35
10
+ base_model:
11
+ - facebook/nllb-200-distilled-600M
12
+ pipeline_tag: translation
13
+ library_name: transformers
14
+ ---
15
+
16
+
17
+ # Model usage
18
+
19
+
20
+ ```python
21
+
22
+ from transformers import AutoTokenizer, AutoModelForSeq2SeqLM
23
+
24
+ model_name = 'booba-uz/english-uzbek-translation_v2'
25
+ tokenizer = AutoTokenizer.from_pretrained(model_name)
26
+ model = AutoModelForSeq2SeqLM.from_pretrained(model_name)
27
+
28
+ tokenizer.src_lang = "en"
29
+ tokenizer.tgt_lang = "uz"
30
+ prefix = "Translate this text from English to uzbek: "
31
+
32
+ # Function to translate text
33
+ def translate_text(text: str, target_lang: str = 'uz'):
34
+
35
+ text = prefix + text
36
+ inputs = tokenizer.encode(text, return_tensors="pt", padding=True)
37
+ translated = model.generate(inputs, num_beams=5, max_length=200, early_stopping=True)
38
+ translated_text = tokenizer.decode(translated[0], skip_special_tokens=True)
39
+ return translated_text
40
+
41
+ input_text = "An Azerbaijan Airlines Embraer ERJ-190AR aircraft crashed at Aktau Airport in Kazakhstan while attempting an emergency landing. The plane, registered as 4K-AZ65, was carrying 67 passengers and five crew members at the time. Some media reports suggest that the number of passengers exceeded 100, with over 60 identified as Russian citizens."
42
+
43
+ # Translate the input text to Uzbek
44
+ output_text = translate_text(input_text)
45
+ print("Translated text:", output_text)
46
+
47
+
48
+ ```