# test_pl196x.py

import unittest

import nltk
from nltk.corpus.reader import pl196x


  4. class TestCorpusViews(unittest.TestCase):
  5. def test_corpus_reader(self):
  6. pl196x_dir = nltk.data.find('corpora/pl196x')
  7. pl = pl196x.Pl196xCorpusReader(pl196x_dir, r'.*\.xml',
  8. textids='textids.txt',
  9. cat_file='cats.txt')
  10. pl.tagged_words(fileids=pl.fileids(), categories='cats.txt')