Python HTMLParser.__init__方法代碼示例

本文整理匯總了Python中html.parser.HTMLParser.__init__方法的典型用法代碼示例。如果您正苦於以下問題：Python HTMLParser.__init__方法的具體用法？Python HTMLParser.__init__怎麼用？Python HTMLParser.__init__使用的例子？那麼，這裡精選的方法代碼示例或許可以為您提供幫助。您也可以進一步了解該方法所在類html.parser.HTMLParser的用法示例。

在下文中一共展示了HTMLParser.__init__方法的15個代碼示例，這些例子默認根據受歡迎程度排序。您可以為喜歡或者感覺有用的代碼點讚，您的評價將有助於系統推薦出更棒的Python代碼示例。

示例1: __init__

# 需要導入模塊: from html.parser import HTMLParser [as 別名]
# 或者: from html.parser.HTMLParser import __init__ [as 別名]
def __init__(self, decode_html_entities=False, data_separator=' '):
        """Initialise the underlying ``HTMLParser`` and the table-collecting state.

        Args:
            decode_html_entities: Forwarded to ``HTMLParser.__init__`` as its
                ``convert_charrefs`` argument.
            data_separator: Stored unchanged as ``self._data_separator``.
        """
        HTMLParser.__init__(self, convert_charrefs=decode_html_entities)

        self._data_separator = data_separator

        # Both cell flags start out cleared.
        self._in_td = self._in_th = False

        # Three distinct, initially empty accumulators, then the result list.
        self._current_table, self._current_row, self._current_cell = [], [], []
        self.tables = []

開發者ID:schmijos，項目名稱:html-table-parser-python3，代碼行數:18，代碼來源:parser.py

示例2: __init__

# 需要導入模塊: from html.parser import HTMLParser [as 別名]
# 或者: from html.parser.HTMLParser import __init__ [as 別名]
def __init__(self, start_tag, start_attr, end_tag, end_attr):
        """Usage is fairly simple.

        html = '<div class="declare" id="J-declare">Notice: anyone can edit encyclopedia entries.<a class="declare-details"></a>'
        p = ParseHtml('div', ['class="declare"'], 'a', ['class="declare-details"'])
        p.feed(html)
        print(p.get_data())  # Notice: anyone can edit encyclopedia entries.

        :param start_tag: start tag; required
        :param start_attr: attributes inside the start tag; must be a list. Pass an empty list [] if there are none
        :param end_tag: end tag; required
        :param end_attr: attributes inside the end tag; must be a list. Pass an empty list [] if there are none
        """
        HTMLParser.__init__(self)
        # Initial values: empty text and a cleared flag.
        self._data = ''
        self._flag = False
        self._start_tag = start_tag
        # _split is defined elsewhere on the class; its result is what gets stored.
        self._start_attr = self._split(start_attr)
        self._end_tag = end_tag
        self._end_attr = self._split(end_attr)

開發者ID:jtyoui，項目名稱:Jtyoui，代碼行數:22，代碼來源:HTML.py

示例3: __init__

# 需要導入模塊: from html.parser import HTMLParser [as 別名]
# 或者: from html.parser.HTMLParser import __init__ [as 別名]
def __init__(self, *args, **kwargs):
        '''
            __init__ - Create an AdvancedTagSlim object.

                @see AdvancedTag

                Extra arguments:

                  slimSelfClosing <bool> default False - If True, slim endings are used on
                    self-closing tags, i.e. <br/> instead of <br />

                    This may break xhtml compatibility, but modern browsers are okay with it.

                All other positional and keyword arguments are forwarded to AdvancedTag.__init__
        '''
        # Remove our own option first so the parent constructor never sees it.
        use_slim_endings = kwargs.pop('slimSelfClosing', False)

        AdvancedTag.__init__(self, *args, **kwargs)

        # Assigned through object.__setattr__ rather than a plain attribute assignment.
        object.__setattr__(self, 'slimSelfClosing', use_slim_endings)

開發者ID:kata198，項目名稱:AdvancedHTMLParser，代碼行數:23，代碼來源:Formatter.py

示例4: __init__

# 需要導入模塊: from html.parser import HTMLParser [as 別名]
# 或者: from html.parser.HTMLParser import __init__ [as 別名]
def __init__(self, data):
        """
        Create a node whose ``data`` attribute holds the given characters.

        Example:

        html = Html()
        data = '<body><em>alpha</em></body>'
        dom = html.feed(data)
        x = dom.fst('em')
        x.append(Data('\nbeta'))

        It outputs.

        <body ><em >alpha
        beta</em></body>
        """

        # Root and DATA are defined elsewhere in the module.
        Root.__init__(self, DATA)
        self.data = data

開發者ID:iogf，項目名稱:ehp，代碼行數:22，代碼來源:ehp.py

示例5: __init__

# 需要導入模塊: from html.parser import HTMLParser [as 別名]
# 或者: from html.parser.HTMLParser import __init__ [as 別名]
def __init__(self, obj_type, results, heading, metadata):
        """Store the pieces that make up a report.

        Args:
            obj_type: String object type name (as returned by
                device_type).
            results: A list of Result objects to include in the
                report.
            heading: String heading describing the report.
            metadata: Dictionary of other data you want to output.
                key: Heading name.
                val: Another dictionary, with:
                    key: Subheading name.
                    val: String of data to print.
        """
        # Every argument is kept as-is under an attribute of the same name.
        self.obj_type, self.results = obj_type, results
        self.heading, self.metadata = heading, metadata

開發者ID:jssimporter，項目名稱:Spruce，代碼行數:21，代碼來源:spruce.py

示例6: __init__

# 需要導入模塊: from html.parser import HTMLParser [as 別名]
# 或者: from html.parser.HTMLParser import __init__ [as 別名]
def __init__(self, *args):
        """Read SMTP settings from ``self.rule`` and normalise recipient fields.

        All positional arguments are forwarded to the parent initialiser.
        Afterwards:

        * ``smtp_host``, ``smtp_ssl``, ``from_addr``, ``smtp_port``,
          ``smtp_key_file`` and ``smtp_cert_file`` are copied from the rule
          onto the instance (with the defaults visible below).
        * ``self.get_account`` is called when ``smtp_auth_file`` is set.
        * ``email``, ``cc`` and ``bcc`` are wrapped in a list when given as a
          single string. ``email`` is required (``KeyError`` otherwise).
        * ``email_add_domain`` gets a leading ``@`` if it lacks one.
        """
        super(EmailAlerter, self).__init__(*args)

        self.smtp_host = self.rule.get('smtp_host', 'localhost')
        self.smtp_ssl = self.rule.get('smtp_ssl', False)
        self.from_addr = self.rule.get('from_addr', 'ElastAlert')
        self.smtp_port = self.rule.get('smtp_port')
        if self.rule.get('smtp_auth_file'):
            self.get_account(self.rule['smtp_auth_file'])
        self.smtp_key_file = self.rule.get('smtp_key_file')
        self.smtp_cert_file = self.rule.get('smtp_cert_file')

        # The mandatory recipient: a lone string becomes a one-element list.
        recipients = self.rule['email']
        if isinstance(recipients, str):
            self.rule['email'] = [recipients]

        # Optional cc / bcc get the same treatment, but only when non-empty.
        for field in ('cc', 'bcc'):
            extra = self.rule.get(field)
            if extra and isinstance(extra, str):
                self.rule[field] = [extra]

        # Make sure a configured domain suffix begins with '@'.
        domain = self.rule.get('email_add_domain')
        if domain and not domain.startswith('@'):
            self.rule['email_add_domain'] = '@' + domain

開發者ID:Yelp，項目名稱:elastalert，代碼行數:27，代碼來源:alerts.py

示例7: __init__

# 需要導入模塊: from html.parser import HTMLParser [as 別名]
# 或者: from html.parser.HTMLParser import __init__ [as 別名]
def __init__(self, fileepub):
        """Open an EPUB archive and locate its package file and table of contents.

        Args:
            fileepub: Path of the EPUB (zip) file to open.

        Sets ``path``, ``file`` (the open ``ZipFile``), ``rootfile`` (the
        ``full-path`` from ``META-INF/container.xml``), ``rootdir`` (its
        directory with a trailing ``/``, or ``""``), ``version``, and, for
        versions ``"2.0"`` and ``"3.0"`` only, ``toc``. ``contents`` and
        ``toc_entries`` start as empty lists.
        """
        self.path = os.path.abspath(fileepub)
        self.file = zipfile.ZipFile(fileepub, "r")

        # container.xml points at the package (OPF) document.
        container = ET.parse(self.file.open("META-INF/container.xml"))
        rootfile_node = container.find("CONT:rootfiles/CONT:rootfile", self.NS)
        self.rootfile = rootfile_node.attrib["full-path"]

        package_dir = os.path.dirname(self.rootfile)
        self.rootdir = package_dir + "/" if package_dir != "" else ""

        package = ET.parse(self.file.open(self.rootfile))
        self.version = package.getroot().get("version")

        # The manifest entry holding the TOC is identified differently per version.
        toc_query = {
            "2.0": "OPF:manifest/*[@media-type='application/x-dtbncx+xml']",
            "3.0": "OPF:manifest/*[@properties='nav']",
        }.get(self.version)
        if toc_query is not None:
            self.toc = self.rootdir + package.find(toc_query, self.NS).get("href")

        self.contents = []
        self.toc_entries = []

開發者ID:wustho，項目名稱:epr，代碼行數:31，代碼來源:epr.py

示例8: __init__

# 需要導入模塊: from html.parser import HTMLParser [as 別名]
# 或者: from html.parser.HTMLParser import __init__ [as 別名]
def __init__(self):
        """Initialise the instance by delegating to ``HTMLParser.__init__``."""
        HTMLParser.__init__(self)

開發者ID:graalvm，項目名稱:mx，代碼行數:4，代碼來源:mx_mxtests.py

示例9: get_links

# 需要導入模塊: from html.parser import HTMLParser [as 別名]
# 或者: from html.parser.HTMLParser import __init__ [as 別名]
def get_links(html):
    """Return the ``href`` values of the ``<a>`` start tags found in *html*.

    Anchors without an ``href``, or with an empty one, are skipped. The
    result is a list of strings in document order.
    """
    class URLSeeker(HTMLParser):
        """Parser that records the non-empty ``href`` of each anchor tag."""

        def __init__(self):
            super().__init__()
            self.urls = []

        def handle_starttag(self, tag, attrs):
            if tag != 'a':
                return
            target = dict(attrs).get('href')
            if target:
                self.urls.append(target)

    seeker = URLSeeker()
    seeker.feed(html)
    return seeker.urls

開發者ID:tao12345666333，項目名稱:tornado-zh，代碼行數:16，代碼來源:webspider.py

示例10: __init__

# 需要導入模塊: from html.parser import HTMLParser [as 別名]
# 或者: from html.parser.HTMLParser import __init__ [as 別名]
def __init__(self):
        """Initialise the base ``HTMLParser`` and reset all parsing state.

        String attributes start empty, boolean flags start ``False``, and the
        ``info_name`` / ``info_value`` lists and ``info`` dict start empty.
        """
        HTMLParser.__init__(self)

        # Empty text values.
        self._data_flag = self.desc = ''

        # Boolean flags, all cleared.
        self._desc_flag = self._info_name = self._info_value = False

        # Separate containers for collected names, values and the final mapping.
        self.info_name, self.info_value = [], []
        self.info = {}

開發者ID:jtyoui，項目名稱:Jtyoui，代碼行數:12，代碼來源:Encyclopedias.py

示例11: __init__

# 需要導入模塊: from html.parser import HTMLParser [as 別名]
# 或者: from html.parser.HTMLParser import __init__ [as 別名]
def __init__(self):
        """Initialise the base ``HTMLParser`` and reset the parser's attributes.

        ``weather_7d`` and ``name`` start as ``False``, ``addr`` and
        ``string`` as empty strings, and ``data_7d`` as an empty list.
        """
        HTMLParser.__init__(self)
        self.weather_7d = self.name = False
        self.addr = self.string = ''
        self.data_7d = []

開發者ID:jtyoui，項目名稱:Jtyoui，代碼行數:9，代碼來源:WeatherAddress.py

示例12: __init__

# 需要導入模塊: from html.parser import HTMLParser [as 別名]
# 或者: from html.parser.HTMLParser import __init__ [as 別名]
def __init__(self, base_url, concurrency=10):
        """Set up the crawler's configuration and bookkeeping attributes.

        Args:
            base_url: Stored as ``self.base_url``.
            concurrency: Stored as ``self.concurrency`` (default 10).
        """
        # Caller-supplied settings.
        self.base_url = base_url
        self.concurrency = concurrency

        # Two independent queues and two independent URL sets, all empty.
        self.q, self.q2 = queues.Queue(), queues.Queue()
        self.fetching, self.fetched = set(), set()

        # Wall-clock time at construction, plus a counter starting at zero.
        self.start = time.time()
        self.i = 0

開發者ID:makelove，項目名稱:Python_Master_Courses，代碼行數:11，代碼來源:tornado-crawler-demo2.py

示例13: get_links

# 需要導入模塊: from html.parser import HTMLParser [as 別名]
# 或者: from html.parser.HTMLParser import __init__ [as 別名]
def get_links(self, html):
        """Collect the ``href`` of every ``<a>`` start tag in *html*.

        Returns a list of the non-empty ``href`` strings in document order.
        ``self`` is not used.
        """
        class URLSeeker(HTMLParser):
            """Parser that gathers anchor targets into ``self.urls``."""

            def __init__(self):
                super().__init__()
                self.urls = []

            def handle_starttag(self, tag, attrs):
                link = dict(attrs).get('href')
                if tag == 'a' and link:
                    self.urls.append(link)

        collector = URLSeeker()
        collector.feed(html)
        return collector.urls

開發者ID:makelove，項目名稱:Python_Master_Courses，代碼行數:16，代碼來源:tornado-crawler-demo2.py

示例14: get_links

# 需要導入模塊: from html.parser import HTMLParser [as 別名]
# 或者: from html.parser.HTMLParser import __init__ [as 別名]
def get_links(html):  # parse the HTML
    """Extract the link targets of all ``<a>`` start tags in *html*.

    Returns a list with each anchor's ``href`` value, in document order.
    Anchors whose ``href`` is missing or empty contribute nothing.
    """
    class URLSeeker(HTMLParser):
        """Parser that accumulates anchor ``href`` values in ``urls``."""

        def __init__(self):
            super().__init__()
            self.urls = []

        def handle_starttag(self, tag, attrs):
            if tag == 'a':
                destination = dict(attrs).get('href')
                if destination:
                    self.urls.append(destination)

    parser = URLSeeker()
    parser.feed(html)
    return parser.urls

開發者ID:makelove，項目名稱:Python_Master_Courses，代碼行數:16，代碼來源:tornado-crawler-demo1.py

示例15: __init__

# 需要導入模塊: from html.parser import HTMLParser [as 別名]
# 或者: from html.parser.HTMLParser import __init__ [as 別名]
def __init__(self, v, typ=None):
        """Store ``typ`` as ``self.type`` and a trimmed copy of ``v`` as ``self.value``.

        Leading and trailing newline, carriage-return, tab and space
        characters are stripped from ``v``.
        """
        self.type = typ
        trimmed_chars = "\n\r\t "
        self.value = v.strip(trimmed_chars)

開發者ID:manatlan，項目名稱:vbuild，代碼行數:5，代碼來源:__init__.py

注：本文中的html.parser.HTMLParser.__init__方法示例由純淨天空整理自Github/MSDocs等開源代碼及文檔管理平台，相關代碼片段篩選自各路編程大神貢獻的開源項目，源碼版權歸原作者所有，傳播和使用請參考對應項目的License；未經允許，請勿轉載。

示例1: __init__

示例2: __init__

示例3: __init__

示例4: __init__

示例5: __init__

示例6: __init__

示例7: __init__

示例8: __init__