Code Coverage for nltk.corpus.reader.wordlist
Untested Functions
|
Partially Tested Functions
|
from nltk.corpus.reader.util import *
from nltk.corpus.reader.api import *
from nltk.internals import deprecated
from nltk.tokenize import line_tokenize
class WordListCorpusReader(CorpusReader):
    """
    List of words, one per line.  Blank lines are ignored.

    The word list is obtained by passing the raw file contents to
    ``line_tokenize``; the raw contents themselves are available
    through ``raw()``.
    """

    def words(self, files=None):
        """
        Return the words in the given files.

        :param files: A single file identifier (string), a sequence of
            file identifiers, or None to use every file of this corpus.
        :return: The result of ``line_tokenize`` applied to
            ``self.raw(files)``.
        """
        return line_tokenize(self.raw(files))

    def raw(self, files=None):
        """
        Return the unprocessed contents of the given files.

        :param files: A single file identifier (string), a sequence of
            file identifiers, or None to use ``self._files``.
        :return: The per-file contents, in the order the files were
            given, combined with ``concat``.
        """
        if files is None:
            files = self._files
        elif isinstance(files, basestring):
            files = [files]

        contents = []
        for f in files:
            stream = self.open(f)
            # Close every stream as soon as it has been read, even if
            # read() raises, so that no file handle is left open until
            # garbage collection.  try/finally is used (rather than
            # ``with``) to stay compatible with the Python 2 code base.
            try:
                contents.append(stream.read())
            finally:
                stream.close()
        return concat(contents)

    @deprecated("Use .raw() or .words() instead.")
    def read(self, items=None, format='listed'):
        """
        Return the given items in the requested format.

        :param items: Passed through to ``raw()`` or ``words()``.
        :param format: ``'raw'`` to get the result of ``raw()``, or
            ``'listed'`` (the default) to get the result of ``words()``.
        :raise ValueError: If ``format`` is neither ``'raw'`` nor
            ``'listed'``.
        """
        if format == 'raw':
            return self.raw(items)
        if format == 'listed':
            return self.words(items)
        raise ValueError('bad format %r' % format)

    @deprecated("Use .words() instead.")
    def listed(self, items=None):
        """
        Return the words in the given items; equivalent to
        ``self.words(items)``.
        """
        return self.words(items)