6 lines
165 B
Python
6 lines
165 B
Python
from mwmbl.tokenizer import clean_unicode
|
|
|
|
|
|
def test_clean_unicode():
    """Check that clean_unicode drops a trailing unpaired surrogate.

    The input ends with the lone high surrogate U+D83C; the expected
    output is the same text with that code point removed and the
    trailing space kept.
    """
    dirty_text = 'Bad extract text \ud83c'
    expected_text = 'Bad extract text '

    cleaned_text = clean_unicode(dirty_text)

    assert cleaned_text == expected_text
|