import unittest import nltk from nltk.corpus.reader import pl196x class TestCorpusViews(unittest.TestCase): def test_corpus_reader(self): pl196x_dir = nltk.data.find('corpora/pl196x') pl = pl196x.Pl196xCorpusReader(pl196x_dir, r'.*\.xml', textids='textids.txt', cat_file='cats.txt') pl.tagged_words(fileids=pl.fileids(), categories='cats.txt')