You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

17 lines
361 B

import pytest
@pytest.mark.parametrize(
    "word,lemma",
    [
        ("새로운", "새롭"),
        ("빨간", "빨갛"),
        # NOTE(review): the three cases below expect an empty lemma. Confirm
        # this is intentional and not expected values that went missing.
        ("클수록", ""),
        ("뭡니까", ""),
        ("됐다", ""),
    ],
)
def test_ko_lemmatizer_assigns(ko_tokenizer, word, lemma):
    """Check the lemma reported for the first token of ``word``.

    Args:
        ko_tokenizer: Callable supplied by pytest as a fixture (defined
            outside this file). It is called with ``word`` and the first
            item of its result must expose a ``lemma_`` attribute.
        word: Input text handed to the tokenizer.
        lemma: Lemma expected on the first token.
    """
    test_lemma = ko_tokenizer(word)[0].lemma_
    assert test_lemma == lemma