radiobee-aligner / tests /test_detect.py
freemt
Update slow-track for more lang pairs
7fd4e54
raw
history blame contribute delete
No virus
1.36 kB
"""Test detect."""
import pytest
from radiobee.detect import detect
@pytest.mark.parametrize(
"test_input,expected", [
("", "en"),
(" ", "en"),
(" \n ", "en"),
("注释", "zh"),
]
)
def test_detect(test_input, expected):
"""Test detect."""
assert detect(test_input) == expected
# expected set_languages[0], set_languages = ["en", "zh"]
assert detect(test_input, ["en", "zh"]) == expected
def test_detect_de():
"""Test detect de."""
text_de = "4\u3000In der Beschränkung zeigt sich erst der Meister, / Und das Gesetz nur kann uns Freiheit geben. 参见http://www.business-it.nl/files/7d413a5dca62fc735a072b16fbf050b1-27.php." # noqa
assert detect(text_de) == "de"
assert detect(text_de, ["en", "zh"]) == "zh"
def test_elm1():
"""Test ——撰文:Thomas Gibbons-Neff和Fahim Abed,摄影:Jim Huylebroek=."""
elm1 = "——撰文:Thomas Gibbons-Neff和Fahim Abed,摄影:Jim Huylebroek"
assert detect(elm1) == "ja"
assert detect(elm1, ["en", "zh"]) == "zh"
def test_elm2():
"""Test 在卢旺达基加利的一家牛奶吧。 JACQUES NKINZINGABO FOR THE NEW YORK TIMES."""
elm2 = "在卢旺达基加利的一家牛奶吧。 JACQUES NKINZINGABO FOR THE NEW YORK TIMES"
assert detect(elm2) == "zh"
assert detect(elm2, ["en", "zh"]) == "zh"