You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

14 lines
398 B

import unittest
import nltk
from nltk.corpus.reader import pl196x
class TestCorpusViews(unittest.TestCase):
    """Smoke test for the ``pl196x`` corpus reader."""

    def test_corpus_reader(self):
        """Construct a ``Pl196xCorpusReader`` and request its tagged words.

        The test makes no assertions on the returned value; it fails only if
        resolving the corpus path, building the reader, or the
        ``tagged_words`` call raises.
        """
        # Resolve the corpus directory through NLTK's data lookup.
        corpus_root = nltk.data.find("corpora/pl196x/")

        reader = pl196x.Pl196xCorpusReader(
            corpus_root,
            r".*\.xml",
            textids="textids.txt",
            cat_file="cats.txt",
        )

        # Ask for tagged words over every file id the reader reports.
        all_fileids = reader.fileids()
        reader.tagged_words(fileids=all_fileids, categories="cats.txt")