| 1234567891011121314 |
- import unittest
- import nltk
- from nltk.corpus.reader import pl196x
class TestCorpusViews(unittest.TestCase):
    """Smoke test for the pl196x corpus reader."""

    def test_corpus_reader(self):
        """Build a pl196x reader and request tagged words for all its files.

        The test contains no assertions; it passes when the reader can be
        constructed and the ``tagged_words`` call completes without raising.
        """
        # Locate the corpus directory through NLTK's data lookup.
        corpus_root = nltk.data.find('corpora/pl196x')
        reader = pl196x.Pl196xCorpusReader(
            corpus_root,
            r'.*\.xml',
            textids='textids.txt',
            cat_file='cats.txt',
        )
        all_fileids = reader.fileids()
        # NOTE(review): ``categories`` is given the category file name, not a
        # category label, alongside ``fileids`` -- presumably intentional for
        # this regression check; confirm against the reader's argument handling.
        reader.tagged_words(fileids=all_fileids, categories='cats.txt')
|