本文整理匯總了Python中nltk.corpus.reader.xmldocs.XMLCorpusView.__init__方法的典型用法代碼示例。如果您正苦於以下問題:Python XMLCorpusView.__init__方法的具體用法?Python XMLCorpusView.__init__怎麼用?Python XMLCorpusView.__init__使用的例子?那麼,這裡精選的方法代碼示例或許可以為您提供幫助。您也可以進一步了解該方法所在類nltk.corpus.reader.xmldocs.XMLCorpusView的用法示例。
在下文中一共展示了XMLCorpusView.__init__方法的5個代碼示例,這些例子默認根據受歡迎程度排序。您可以為喜歡或者感覺有用的代碼點讚,您的評價將有助於系統推薦出更棒的Python代碼示例。
示例1: __init__
# 需要導入模塊: from nltk.corpus.reader.xmldocs import XMLCorpusView [as 別名]
# 注意: __init__ 是 XMLCorpusView 類的方法,無法單獨導入;請先導入該類,再以 XMLCorpusView.__init__(self, ...) 的形式調用
def __init__(self, fileid, sent, tag, strip_space, stem):
    """
    Initialise the view and read the document header once.

    :param fileid: The name of the underlying file.
    :param sent: If true, include sentence bracketing.
    :param tag: The name of the tagset to use, or None for no tags.
    :param strip_space: If true, strip spaces from word tokens.
    :param stem: If true, then substitute stems for words.
    """
    # With sentence bracketing the view matches paths ending in ``s``;
    # otherwise it matches ``c``/``w`` paths found anywhere beneath ``s``.
    if sent:
        tagspec = '.*/s'
    else:
        tagspec = '.*/s/(.*/)?(c|w)'

    self._sent = sent
    self._tag = tag
    self._strip_space = strip_space
    self._stem = stem

    # Header metadata starts out empty.
    # NOTE(review): presumably filled in by ``handle_header`` below -- confirm.
    self.title = None  #: Title of the document.
    self.author = None  #: Author of the document.
    self.editor = None  #: Editor
    self.resps = None  #: Statement of responsibility

    XMLCorpusView.__init__(self, fileid, tagspec)

    # Read in the header.  The stream is closed in ``finally`` so that a
    # failure while parsing the header does not leave the file open.
    self._open()
    try:
        self.read_block(self._stream, '.*/teiHeader$', self.handle_header)
    finally:
        self.close()

    # Reset tag context.
    self._tag_context = {0: ()}
示例2: __init__
# 需要導入模塊: from nltk.corpus.reader.xmldocs import XMLCorpusView [as 別名]
# 注意: __init__ 是 XMLCorpusView 類的方法,無法單獨導入;請先導入該類,再以 XMLCorpusView.__init__(self, ...) 的形式調用
def __init__(self, filename, **kwargs):
    """
    Build a view over the preprocessed ``ann_morphosyntax.xml`` file.

    :param filename: Passed to ``XML_Tool`` together with the fixed name
        ``'ann_morphosyntax.xml'``.
    :param kwargs: Only ``tags`` is consumed (default ``None``); it is
        stored on ``self.tags``.
    """
    self.tags = kwargs.pop('tags', None)
    self.tagspec = '.*/seg/fs'
    self.xml_tool = XML_Tool(filename, 'ann_morphosyntax.xml')

    # The base view is initialised on the preprocessed file produced by
    # the XML tool, not on ``filename`` directly.
    preprocessed_path = self.xml_tool.build_preprocessed_file()
    XMLCorpusView.__init__(self, preprocessed_path, self.tagspec)
示例3: __init__
# 需要導入模塊: from nltk.corpus.reader.xmldocs import XMLCorpusView [as 別名]
# 注意: __init__ 是 XMLCorpusView 類的方法,無法單獨導入;請先導入該類,再以 XMLCorpusView.__init__(self, ...) 的形式調用
def __init__(self, filename, **kwargs):
    """
    Build a view over the preprocessed ``text.xml`` file.

    :param filename: Passed to ``XML_Tool`` together with the fixed name
        ``'text.xml'``.
    :param kwargs: Only ``mode`` is consumed (default ``0``); it is stored
        on ``self.mode``.
    """
    self.mode = kwargs.pop('mode', 0)
    self.tagspec = '.*/div/ab'
    self.segm_dict = {}

    # XML preprocessing: the tool produces the file the view will read.
    self.xml_tool = XML_Tool(filename, 'text.xml')
    preprocessed_path = self.xml_tool.build_preprocessed_file()

    # Base class initialisation on the preprocessed file.
    XMLCorpusView.__init__(self, preprocessed_path, self.tagspec)
示例4: __init__
# 需要導入模塊: from nltk.corpus.reader.xmldocs import XMLCorpusView [as 別名]
# 注意: __init__ 是 XMLCorpusView 類的方法,無法單獨導入;請先導入該類,再以 XMLCorpusView.__init__(self, ...) 的形式調用
def __init__(self, fileid, unit, bracket_sent, pos_tag, sem_tag):
    """
    Store the view options and initialise the underlying XML view.

    :param fileid: The name of the underlying file.
    :param unit: One of `'token'`, `'word'`, or `'chunk'`.
    :param bracket_sent: If true, include sentence bracketing.
    :param pos_tag: Whether to include part-of-speech tags.
    :param sem_tag: Whether to include semantic tags, namely WordNet lemma
        and OOV named entity status.
    """
    # Sentence bracketing selects ``s`` paths; otherwise the view selects
    # the ``punc``/``wf`` paths directly beneath ``s``.
    tagspec = '.*/s' if bracket_sent else '.*/s/(punc|wf)'

    self._unit = unit
    self._sent = bracket_sent
    self._pos_tag = pos_tag
    self._sem_tag = sem_tag

    XMLCorpusView.__init__(self, fileid, tagspec)
示例5: __init__
# 需要導入模塊: from nltk.corpus.reader.xmldocs import XMLCorpusView [as 別名]
# 注意: __init__ 是 XMLCorpusView 類的方法,無法單獨導入;請先導入該類,再以 XMLCorpusView.__init__(self, ...) 的形式調用
def __init__(self, fileid, tagspec, elt_handler=None):
    """
    Forward all arguments unchanged to ``XMLCorpusView.__init__``.

    :param fileid: Passed through as the first argument after ``self``.
    :param tagspec: Passed through as the second argument.
    :param elt_handler: Passed through as the third argument; defaults to
        ``None``.
    """
    base_init = XMLCorpusView.__init__
    base_init(self, fileid, tagspec, elt_handler)