AutoPage / docling /utils /ocr_utils.py
Mqleet's picture
upd code
fcaa164
raw
history blame
263 Bytes
def map_tesseract_script(script: str) -> str:
    """Map a script name onto its substitute name, if one is defined.

    The following substitutions are applied (comparison is exact and
    case-sensitive):

    * ``"Katakana"`` or ``"Hiragana"`` -> ``"Japanese"``
    * ``"Han"`` -> ``"HanS"``
    * ``"Korean"`` -> ``"Hangul"``

    Any other value is returned unchanged.

    NOTE(review): judging by the function name, the substitute names are
    presumably the ones Tesseract uses for its script models -- confirm
    against the caller.

    Args:
        script: Script name to translate.

    Returns:
        The substituted script name, or ``script`` itself when no
        substitution applies.
    """
    # Both Japanese syllabaries collapse onto a single name.
    if script in ("Katakana", "Hiragana"):
        return "Japanese"
    if script == "Han":
        return "HanS"
    if script == "Korean":
        return "Hangul"
    # No substitution defined: pass the name through untouched.
    return script