Package nltk :: Package corpus :: Package reader :: Module pl196x
[hide private]
[frames | no frames]

Module pl196x

source code

Classes [hide private]
TEICorpusView
Pl196xCorpusReader
Variables [hide private]
  PARA = re.compile(r'<p(?: [^>]*)?>(.*?)</p>')
  SENT = re.compile(r'<s(?: [^>]*)?>(.*?)</s>')
  TAGGEDWORD = re.compile(r'<([wc](?: [^>]*)?>)(.*?)</[wc]>')
  WORD = re.compile(r'<[wc](?: [^>]*)?>(.*?)</[wc]>')
  TYPE = re.compile(r'type="(.*?)"')
  ANA = re.compile(r'ana="(.*?)"')
  TEXTID = re.compile(r'text id="(.*?)"')