entai2965
/

small100-ctranslate2

gsarti/flores_101

Model card · Files and versions

entai2965 committed on Nov 21, 2024

Commit

bb55154

·

verified ·

1 Parent(s): af447d0

Update README.md

Files changed (1) hide show

README.md +7 -3

README.md CHANGED Viewed

@@ -110,10 +110,14 @@ tags:
 - tico19
 - gmnlp/tico19
 - tatoeba
 datasets:
 - tico19
 - flores101
 - tatoeba
 ---
 From: https://huggingface.co/alirezamsh/small100
@@ -302,7 +306,8 @@ encoded_list=[]
 for text in raw_list:
     encoded_list.append(tokenizer.convert_ids_to_tokens(tokenizer.encode(text)))
-# translate
 translated_list=translator.translate_batch(encoded_list,target_prefix=[target_language_token]*len(raw_list))
 #decode
@@ -357,5 +362,4 @@ translated_list=[tokenizer.decode(tokenizer.convert_tokens_to_ids(token.hypothes
 #output
 for text in translated_list:
     print(text)
-```

 - tico19
 - gmnlp/tico19
 - tatoeba
+- nmt
 datasets:
 - tico19
 - flores101
 - tatoeba
+base_model:
+- alirezamsh/small100
+pipeline_tag: translation
 ---
 From: https://huggingface.co/alirezamsh/small100
 for text in raw_list:
     encoded_list.append(tokenizer.convert_ids_to_tokens(tokenizer.encode(text)))
+#translate
+#https://opennmt.net/CTranslate2/python/ctranslate2.Translator.html?#ctranslate2.Translator.translate_batch
 translated_list=translator.translate_batch(encoded_list,target_prefix=[target_language_token]*len(raw_list))
 #decode
 #output
 for text in translated_list:
     print(text)
+```