Spaces:
Runtime error
Runtime error
File size: 1,409 Bytes
e84d35a |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 |
"""Test seg_text."""
import pytest
from radiobee.seg_text import seg_text
def test_seg_text1():
"""Test seg_text 1."""
text = " text 1\n\n test 2. test 3"
_ = seg_text(text)
assert len(_) == 2
text = " text 1\n\n test 2. Test 3"
_ = seg_text(text)
assert len(_) == 3
@pytest.mark.parametrize(
"test_input,expected", [
("", []),
(" ", []),
(" \n ", []),
]
)
def test_seg_text_blanks(test_input, expected):
"""Test blanks."""
assert seg_text(test_input) == expected
def test_seg_text_semicolon():
"""Test semicolon."""
text = """ “元宇宙”,英文為“Metaverse”。該詞出自1992年;的科幻小說《雪崩》。 """
assert len(seg_text(text)) == 2
assert len(seg_text(text, 'zh')) == 2
assert len(seg_text(text, 'ja')) == 2
assert len(seg_text(text, 'ko')) == 2
assert len(seg_text(text, 'en')) == 1
def test_seg_text_semicolon_extra():
"""Test semicolon."""
extra = "[;;]"
text = """ “元宇宙”,英文為“Metaverse”。該詞出自1992年;的科幻小說《雪崩》。 """
assert len(seg_text(text, extra=extra)) == 2 + 1
assert len(seg_text(text, 'zh', extra=extra)) == 2 + 1
assert len(seg_text(text, 'ja', extra=extra)) == 2 + 1
assert len(seg_text(text, 'ko', extra=extra)) == 2 + 1
assert len(seg_text(text, 'en', extra=extra)) == 1 + 1
|