Spaces:
Running
Running
from myv_translit import cyr2lat, detect_script | |
def test_join_acute(): | |
assert cyr2lat('кель') == 'keĺ' | |
assert cyr2lat('кель', joint_acute=False) == 'keĺ' | |
assert len(cyr2lat('кель')) == 3 | |
assert len(cyr2lat('кель', joint_acute=False)) == 4 | |
def test_first_e(): | |
assert cyr2lat('эрзя') == 'ěrzä' | |
assert cyr2lat('эрзя', first_e_with_hacek=False) == 'erzä' | |
def test_soft_l(): | |
assert cyr2lat('пелькс') == 'peĺks' | |
assert cyr2lat('пелькс', soft_l_after_vowels=False) == 'pelks' | |
def test_detection(): | |
assert detect_script('123 456?? 8743 098543 ???...,.! @%%&&& хз') == 'unk' | |
assert detect_script('ěrzä') == 'lat' | |
assert detect_script('ěrzä ю') == 'lat' | |
assert detect_script('ЭРЗЯ') == 'cyr' | |
assert detect_script('ЭРЗЯ d') == 'cyr' | |
assert detect_script('ěrzä эрзянь') == 'mix' | |
# todo: test on a larger corpus | |
# todo: test cyclical consistency | |