You cannot select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
15 lines
454 B
Python
15 lines
454 B
Python
import unittest
|
|
|
|
import nltk
|
|
from nltk.corpus.reader import pl196x
|
|
|
|
|
|
class TestCorpusViews(unittest.TestCase):
    """Smoke test exercising the PL196x corpus reader."""

    def test_corpus_reader(self):
        """Construct a PL196x reader and request tagged words for all its files.

        The corpus location is resolved through ``nltk.data.find``. The test
        contains no assertions; it succeeds as long as none of the calls raise.
        """
        corpus_root = nltk.data.find('corpora/pl196x')
        reader = pl196x.Pl196xCorpusReader(
            corpus_root,
            r'.*\.xml',
            textids='textids.txt',
            cat_file='cats.txt',
        )
        # Every file id known to the reader is passed explicitly, alongside
        # the same ``categories`` value the call has always used.
        every_fileid = reader.fileids()
        reader.tagged_words(fileids=every_fileid, categories='cats.txt')
|