ur_en / usage_spm.py
datasetsANDmodels's picture
Update usage_spm.py
8faf5a6 verified
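# NOTE: if the process aborts with an OpenMP "duplicate runtime library" error,
# run this in the shell before starting Python: export KMP_DUPLICATE_LIB_OK=TRUE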
import ctranslate2
import sentencepiece as spm
from translate import Translator
# Usage example: translate one Urdu sentence with the CTranslate2 model stored
# in "ur_en/" and print the result.
#
# Sample Urdu input. The original script first assigned the English sentence
# "I am calling from tax office" to `text` and immediately overwrote it; that
# dead assignment is dropped here. Presumably it is the reference translation
# of the sentence below -- confirm against the model output.
text = "میں ٹیکس آفس سے کال کر رہا ہوں۔"

# Both paths are relative to the current working directory.
translator = ctranslate2.Translator("ur_en/")
sp = spm.SentencePieceProcessor(model_file="ur_en/sentencepiece.model")

# Encode to subword piece strings (out_type=str) rather than integer ids,
# because the translator is fed string tokens below.
tokens = sp.encode(text, out_type=str)

# translate_batch takes a batch of token lists, so the single sentence is
# wrapped in a list.
translated_tokens = translator.translate_batch([tokens])

# [0] selects the result for the only batch entry, the second [0] its first
# hypothesis, and "tokens" that hypothesis' piece strings. Any "▁" marker
# still present after decoding is turned into a plain space.
output = sp.decode(translated_tokens[0][0]["tokens"]).replace("▁", " ")
print(output)