本文整理汇总了 Python 中 html.parser.HTMLParser.__init__ 方法的典型用法代码示例。如果您正苦于以下问题：Python HTMLParser.__init__ 方法的具体用法？Python HTMLParser.__init__ 怎么用？Python HTMLParser.__init__ 使用的例子？那么恭喜您，这里精选的方法代码示例或许可以为您提供帮助。您也可以进一步了解该方法所在类 html.parser.HTMLParser 的用法示例。
在下文中一共展示了HTMLParser.__init__方法的15个代码示例,这些例子默认根据受欢迎程度排序。您可以为喜欢或者感觉有用的代码点赞,您的评价将有助于系统推荐出更棒的Python代码示例。
示例1: __init__
# 需要导入模块: from html.parser import HTMLParser [as 别名]
# 或者: from html.parser.HTMLParser import __init__ [as 别名]
def __init__(self, **kwargs):
    """Initialise the base ``HTMLParser`` and this parser's starting state.

    Args:
        **kwargs: Arbitrary keyword arguments; stored unchanged on
            ``self.kwargs``.
    """
    HTMLParser.__init__(self)
    self.kwargs = kwargs
    # Starting values: nothing active, empty last content, no rows yet.
    self.active, self.last_content = None, ""
    self.rows = []
    self.found_first_valid_num = False
示例2: __init__
# 需要导入模块: from html.parser import HTMLParser [as 别名]
# 或者: from html.parser.HTMLParser import __init__ [as 别名]
def __init__(self):
    """Initialise the base ``HTMLParser`` and this parser's default fields."""
    HTMLParser.__init__(self)
    self.collect_data = False
    self.bound = 20
    # NOTE(review): presumably the tag name and (attribute, value) pair the
    # handlers look for -- confirm against the handle_* methods.
    self.des_tag, self.des_attr = "div", ("id", "content")
    self.stations_info = None
示例3: __init__
# 需要导入模块: from html.parser import HTMLParser [as 别名]
# 或者: from html.parser.HTMLParser import __init__ [as 别名]
def __init__(self, builder=None, encoding=None):
    """Prepare the element stack, tree builder and encoding, then the parser.

    Args:
        builder: Object used as the tree builder. When ``None`` a new
            ``ElementTree.TreeBuilder()`` is created.
        encoding: Encoding name to store; any falsy value selects
            ``"iso-8859-1"``.
    """
    # Own state is assigned before the base initializer runs, as in the
    # original ordering (HTMLParser.__init__ calls reset()).
    self.__stack = []
    self.__builder = ElementTree.TreeBuilder() if builder is None else builder
    self.encoding = encoding if encoding else "iso-8859-1"
    HTMLParser.__init__(self)
示例4: __init__
# 需要导入模块: from html.parser import HTMLParser [as 别名]
# 或者: from html.parser.HTMLParser import __init__ [as 别名]
def __init__(self):
    """Initialise the base ``HTMLParser`` and the extraction state.

    ``self.data`` starts with an empty ``"body"`` string; both recording
    flags start off.
    """
    HTMLParser.__init__(self)
    # Built as a literal instead of dict() followed by a key assignment.
    self.data = {"body": ""}
    self.recordingAuthor = False
    self.recordingBody = False
    self.save_tags = ['p', 'blockquote', 'h1', 'h2', 'h3', 'h4', 'h5']
示例5: __init__
# 需要导入模块: from html.parser import HTMLParser [as 别名]
# 或者: from html.parser.HTMLParser import __init__ [as 别名]
def __init__(self):
    """Initialise the base ``HTMLParser`` and the form-related fields."""
    HTMLParser.__init__(self)
    self.url = None
    self.params = {}
    # Both form flags start cleared.
    self.in_form = self.form_parsed = False
    self.method = "GET"
示例6: __init__
# 需要导入模块: from html.parser import HTMLParser [as 别名]
# 或者: from html.parser.HTMLParser import __init__ [as 别名]
def __init__(self, results, url, trackers):
    """Initialise the base ``HTMLParser`` and keep the caller's arguments.

    Args:
        results: Stored as ``self.results``.
        url: Stored as ``self.url``.
        trackers: Stored as ``self.trackers``.
    """
    HTMLParser.__init__(self)
    self.results, self.url, self.trackers = results, url, trackers
    # No cell counter and no item in progress yet.
    self.td_counter = self.current_item = None
示例7: __init__
# 需要导入模块: from html.parser import HTMLParser [as 别名]
# 或者: from html.parser.HTMLParser import __init__ [as 别名]
def __init__(self, strict=False):
    """Initialise the base ``HTMLParser`` and every extraction field.

    Args:
        strict: Accepted only for backward compatibility and ignored.
            ``HTMLParser`` dropped its ``strict`` argument in Python 3.5
            and its initializer is keyword-only, so forwarding the value
            positionally raises ``TypeError`` on current interpreters.
    """
    # Constructor call of parent class (``strict`` is deliberately not
    # forwarded -- see the docstring).
    HTMLParser.__init__(self)
    # Defining variables of this class.
    # There are 3 types of variables.
    # data_variables: these are the required information
    # data_check_variables: boolean values corresponding to each of the
    #     data_variables, to keep a check on whether the data has already
    #     been extracted or not.
    # tag_check_variables: used for matching the proper format.
    self.h1 = False
    self.desc = False
    self.description = ' '
    self.sol = False
    self.solution = ' '
    self.p = False
    self.li = False
    self.ref = False
    self.references = ' '
    self.cvss = False
    self.cvss_score = 0.0
    self.cve = False
    self.cve_id = ' '
    self.links = []
    self.prod = False
    self.products = []
    self.last_h6 = ' '
    self.h6 = False
    self.h7 = False
    self.clas = False
    self.attack_from = ' '
    self.attk = False
    self.impact = ' '
    self.impt = False
示例8: __init__
# 需要导入模块: from html.parser import HTMLParser [as 别名]
# 或者: from html.parser.HTMLParser import __init__ [as 别名]
def __init__(self,
             remove_comments=False,
             remove_empty_space=False,
             remove_all_empty_space=False,
             reduce_empty_attributes=True,
             reduce_boolean_attributes=False,
             remove_optional_attribute_quotes=True,
             keep_pre=False,
             pre_tags=PRE_TAGS,
             pre_attr='pre'):
    """Initialise the base ``HTMLParser``, store the options, reset state.

    Each argument is stored unchanged on the attribute of the same name;
    the underscore-prefixed attributes are internal state and start
    empty, zero or ``False``.
    """
    # Compare the version as a tuple: testing major and minor separately
    # would wrongly reject a future X.0 release with X > 3.
    if sys.version_info >= (3, 4):
        # convert_charrefs is True by default in Python 3.5.0 and newer. It
        # was introduced in 3.4.
        HTMLParser.__init__(self, convert_charrefs=False)
    else:
        HTMLParser.__init__(self)
    self.keep_pre = keep_pre
    self.pre_tags = pre_tags
    self.remove_comments = remove_comments
    self.remove_empty_space = remove_empty_space
    self.remove_all_empty_space = remove_all_empty_space
    self.reduce_empty_attributes = reduce_empty_attributes
    self.reduce_boolean_attributes = reduce_boolean_attributes
    self.remove_optional_attribute_quotes = remove_optional_attribute_quotes
    self.pre_attr = pre_attr
    self._data_buffer = []
    self._in_pre_tag = 0
    self._in_head = False
    self._in_title = False
    self._after_doctype = False
    self._tag_stack = []
    self._title_newly_opened = False
    self.__title_trailing_whitespace = False
示例9: __init__
# 需要导入模块: from html.parser import HTMLParser [as 别名]
# 或者: from html.parser.HTMLParser import __init__ [as 别名]
def __init__(self):
    """Initialise the base ``HTMLParser`` plus the star and rating state."""
    HTMLParser.__init__(self)
    # Neither kind of parsing is in progress at start.
    self.starParsing = self.ratingParsing = False
    # Two separate Stack instances, one per kind.
    self.starStack, self.ratingStack = Stack(), Stack()
    self.ratingDict = {}
示例10: __init__
# 需要导入模块: from html.parser import HTMLParser [as 别名]
# 或者: from html.parser.HTMLParser import __init__ [as 别名]
def __init__(self):
    """Initialise the base ``HTMLParser`` and the item-collection fields."""
    HTMLParser.__init__(self)
    self.items = []
    # All three flags start cleared.
    self.foundItem = self.br_before = self.checkBr = False
    self.current_item_url = ""
示例11: __init__
# 需要导入模块: from html.parser import HTMLParser [as 别名]
# 或者: from html.parser.HTMLParser import __init__ [as 别名]
def __init__(self,
             remove_comments=False,
             remove_empty_space=False,
             remove_all_empty_space=False,
             reduce_empty_attributes=True,
             reduce_boolean_attributes=False,
             remove_optional_attribute_quotes=True,
             keep_pre=False,
             pre_tags=PRE_TAGS,
             pre_attr='pre'):
    """Initialise the base ``HTMLParser``, store the options, reset state.

    Each argument is stored unchanged on the attribute of the same name.
    """
    HTMLParser.__init__(self)

    # Options, copied verbatim from the arguments.
    self.keep_pre, self.pre_tags = keep_pre, pre_tags
    self.remove_comments = remove_comments
    self.remove_empty_space, self.remove_all_empty_space = (
        remove_empty_space, remove_all_empty_space)
    self.reduce_empty_attributes, self.reduce_boolean_attributes = (
        reduce_empty_attributes, reduce_boolean_attributes)
    self.remove_optional_attribute_quotes = remove_optional_attribute_quotes
    self.pre_attr = pre_attr

    # Internal state: empty buffers, zero counter, all flags cleared.
    self._data_buffer = []
    self._in_pre_tag = 0
    self._in_head = self._in_title = self._after_doctype = False
    self._tag_stack = []
    self._title_newly_opened = False
    self.__title_trailing_whitespace = False
示例12: __init__
# 需要导入模块: from html.parser import HTMLParser [as 别名]
# 或者: from html.parser.HTMLParser import __init__ [as 别名]
def __init__(self):
    """Initialise the base ``HTMLParser`` and the empty collection fields."""
    HTMLParser.__init__(self)
    self.links = []
    self.isNumber = 0
    # Three independent lists -- they must not share one object.
    self.stack, self.day, self.test = [], [], []
示例13: __init__
# 需要导入模块: from html.parser import HTMLParser [as 别名]
# 或者: from html.parser.HTMLParser import __init__ [as 别名]
def __init__(self, news):
    """Initialise the base ``HTMLParser`` and the scanning fields.

    Args:
        news: Stored unchanged as ``self.news``.
    """
    HTMLParser.__init__(self)
    self.count_a = 0
    self.current_tag = ""
    self.looking_for_testata = False
    self.news = news
示例14: __init__
# 需要导入模块: from html.parser import HTMLParser [as 别名]
# 或者: from html.parser.HTMLParser import __init__ [as 别名]
def __init__(self):
    """Initialise the base ``HTMLParser`` and the template bookkeeping."""
    HTMLParser.__init__(self)
    # Two independent empty lists.
    self.stack, self.template_names = [], []
    self.templates = {}
    # No current template yet: empty name, zero count.
    self.current_template, self.current_template_count = "", 0
示例15: __init__
# 需要导入模块: from html.parser import HTMLParser [as 别名]
# 或者: from html.parser.HTMLParser import __init__ [as 别名]
def __init__(self, url):
    """Initialise the base ``HTMLParser`` and the per-page fields.

    Args:
        url: Stored unchanged as ``self.url``.
    """
    HTMLParser.__init__(self)
    self.url = url
    # No item and no saved data yet.
    self.current_item = self.save_data = None
    self.seeds_leech = False
    # Pattern for a literal comma, built once per instance.
    self.size_repl = re_compile(",")