CofeehousePy/nlpfr/nltk/test/unit/test_pl196x.py

15 lines
468 B
Python

import unittest
import nltk
from nltk.corpus.reader import pl196x
class TestCorpusViews(unittest.TestCase):
    """Smoke test for the ``pl196x`` corpus reader."""

    def test_corpus_reader(self):
        """Build a ``Pl196xCorpusReader`` and request tagged words for its files.

        The test makes no assertions on the returned value; it passes as long
        as locating the corpus, constructing the reader, and calling
        ``tagged_words`` do not raise.
        """
        corpus_root = nltk.data.find('corpora/pl196x')

        # Keyword options forwarded unchanged to the reader constructor.
        reader_options = {'textids': 'textids.txt', 'cat_file': 'cats.txt'}
        reader = pl196x.Pl196xCorpusReader(
            corpus_root, r'.*\.xml', **reader_options
        )

        every_file = reader.fileids()
        # NOTE(review): ``categories`` is given the same string that is used
        # as ``cat_file`` above. Whether that is intentional cannot be told
        # from this file -- confirm against Pl196xCorpusReader before changing.
        reader.tagged_words(fileids=every_file, categories='cats.txt')