mwmbl/test/test_indexdb.py
2023-05-20 22:11:51 +01:00

6 lines
165 B
Python

from mwmbl.tokenizer import clean_unicode
def test_clean_unicode():
    """Check that ``clean_unicode`` strips a trailing lone surrogate.

    The input ends with ``\\ud83c``, a surrogate code point with no partner.
    The expected output is the same text with that code point removed and
    the preceding space kept.
    """
    # NOTE(review): presumably the lone surrogate is dropped because it
    # cannot be encoded as UTF-8 -- confirm against mwmbl.tokenizer.
    result = clean_unicode('Bad extract text \ud83c')
    assert result == 'Bad extract text ', f"unexpected cleaned text: {result!r}"