當前位置: 首頁>>代碼示例>>Python>>正文


Python Detector.detect方法代碼示例

本文整理匯總了Python中Detector.Detector.detect方法的典型用法代碼示例。如果您正苦於以下問題:Python Detector.detect方法的具體用法?Python Detector.detect怎麼用?Python Detector.detect使用的例子?那麼, 這裏精選的方法代碼示例或許可以為您提供幫助。您也可以進一步了解該方法所在Detector.Detector的用法示例。


在下文中一共展示了Detector.detect方法的3個代碼示例,這些例子默認根據受歡迎程度排序。您可以為喜歡或者感覺有用的代碼點讚,您的評價將有助於系統推薦出更棒的Python代碼示例。

示例1: performAnalyse

# 需要導入模塊: from Detector import Detector [as 別名]
# 或者: from Detector.Detector import detect [as 別名]
 def performAnalyse(self, htmlnode):
     """Run the processing pipeline on ``htmlnode`` and score the result.

     The node is passed, in order, to ``StructureExtractor.drawFeature``,
     an ``Extractor`` (``process``) and a freshly created ``Detector``
     (``detect``); afterwards the accuracy helpers are evaluated on it.

     Returns:
         A 4-tuple: the three values unpacked from ``calcAccTitleLine``
         followed by the result of ``calcAccColumn``.
     """
     # Stage order is significant and kept exactly as in the pipeline.
     feature_drawer = StructureExtractor()
     feature_drawer.drawFeature(htmlnode)

     node_extractor = Extractor(htmlnode)
     node_extractor.process()

     fresh_detector = Detector()
     fresh_detector.detect(htmlnode)

     true_pos, false_pos, false_neg = self.calcAccTitleLine(htmlnode)
     column_errors = self.calcAccColumn(htmlnode)
     return (true_pos, false_pos, false_neg, column_errors)
開發者ID:cheungzq,項目名稱:WebParser,代碼行數:12,代碼來源:Analyser.py

示例2: process

# 需要導入模塊: from Detector import Detector [as 別名]
# 或者: from Detector.Detector import detect [as 別名]
 def process(self, root):
     """Run feature drawing, extraction and detection on ``root``.

     Stores the ``Extractor`` on ``self.extractor`` and hands the
     ``Detector`` that processed ``root`` to ``self.toolbox.setDetector``.
     ``Config.init()`` is called before the detector is constructed.
     """
     feature_drawer = StructureExtractor()
     feature_drawer.drawFeature(root)

     # Publish the extractor on the instance before running it.
     self.extractor = Extractor(root)
     self.extractor.process()

     Config.init()
     active_detector = Detector()
     active_detector.detect(root)
     self.toolbox.setDetector(active_detector)
開發者ID:cheungzq,項目名稱:WebParser,代碼行數:12,代碼來源:visualizer.py

示例3: __init__

# 需要導入模塊: from Detector import Detector [as 別名]
# 或者: from Detector.Detector import detect [as 別名]
class Analyser:
    def __init__(self):
        """Initialise the configuration and create the shared detector.

        ``Config.init()`` runs first; the ``Detector`` built afterwards is
        stored on ``self.detector``.
        """
        Config.init()
        # Detector is built without arguments.
        shared_detector = Detector()
        self.detector = shared_detector

    def analyse(self, xmlfilelist):
        """Evaluate detection accuracy over a list of XML files and print it.

        For every file the document is parsed with a recovering XML parser,
        the first child of the root element is run through
        ``StructureExtractor.drawFeature``, ``Extractor.process`` and
        ``self.detector.detect``, and the counts returned by
        ``calcAccTitleLine`` are added to the running totals.

        ``calcAccColumn`` is only evaluated for files with ``fn == 0``.
        Files with false positives / false negatives are counted per value
        of the root element's ``fid`` attribute.

        A progress line and the running report are printed before every
        200th file (starting with the first), and the final report is
        printed once after the loop.

        Args:
            xmlfilelist: Sequence of XML file paths; ``len()`` is taken of
                it for the progress fraction.

        Returns:
            None. All results are written to standard output.
        """
        parser = etree.XMLParser(recover=True)
        total_tp = 0
        total_fp = 0
        total_fn = 0
        fnfid = {}
        fpfid = {}
        cerrs = dict.fromkeys(['AUTHOR', 'COUNT_READ', 'COUNT_REPLY', 'TITLE', 'TM_POST', 'TM_REPLY'], 0)
        cerrfiles = {}
        for num, xmlfile in enumerate(xmlfilelist):
            if num % 200 == 0:
                # Fraction of files handled so far, then the running totals.
                print(num/len(xmlfilelist))
                self._printReport(total_tp, total_fp, total_fn,
                                  fnfid, fpfid, cerrs, cerrfiles)
            root = etree.parse(xmlfile, parser).getroot()
            htmlnode = root[0]
            se = StructureExtractor()
            se.drawFeature(htmlnode)
            extractor = Extractor(htmlnode)
            extractor.process()
            self.detector.detect(htmlnode)
            (tp, fp, fn) = self.calcAccTitleLine(htmlnode)
            total_tp += tp
            total_fp += fp
            total_fn += fn
            if fn == 0:
                # Column accuracy is only checked when no title line was missed.
                cerr = self.calcAccColumn(htmlnode)
                for k in cerr:
                    cerrs[k] += 1
                if len(cerr) > 0:
                    cerrfiles[path.basename(xmlfile)] = (cerr, root.attrib['fid'])
            if fp > 0:
                fpfid[root.attrib['fid']] = fpfid.get(root.attrib['fid'], 0) + 1
            if fn > 0:
                print(xmlfile)
                fnfid[root.attrib['fid']] = fnfid.get(root.attrib['fid'], 0) + 1
        self._printReport(total_tp, total_fp, total_fn,
                          fnfid, fpfid, cerrs, cerrfiles)

    def _printReport(self, total_tp, total_fp, total_fn, fnfid, fpfid, cerrs, cerrfiles):
        """Print the accumulated totals and error breakdowns used by ``analyse``."""
        print('REV.150')
        print('total_tp:', total_tp)
        print('total_fp:', total_fp)
        print('total_fn:', total_fn)
        print('fnfid:', fnfid)
        print('fpfid:', fpfid)

        print('cerrs:', cerrs)
        print('cerrfiles:', cerrfiles)

    def analyseOnce(self, xmlfile):
        """Parse one XML file and analyse the first child of its root.

        The file is read with a recovering XML parser; the result of
        ``performAnalyse`` on the root's first child is returned unchanged.
        """
        recovering_parser = etree.XMLParser(recover=True)
        document = etree.parse(xmlfile, recovering_parser)
        first_child = document.getroot()[0]
        return self.performAnalyse(first_child)

    def performAnalyse(self, htmlnode):
        """Run the processing pipeline on ``htmlnode`` and score the result.

        The node is passed, in order, to ``StructureExtractor.drawFeature``,
        an ``Extractor`` (``process``) and a newly created ``Detector``
        (``detect``); this method does not use ``self.detector``.

        Returns:
            A 4-tuple: the three values unpacked from ``calcAccTitleLine``
            followed by the result of ``calcAccColumn``.
        """
        # Stage order is significant and kept exactly as in the pipeline.
        feature_drawer = StructureExtractor()
        feature_drawer.drawFeature(htmlnode)

        node_extractor = Extractor(htmlnode)
        node_extractor.process()

        fresh_detector = Detector()
        fresh_detector.detect(htmlnode)

        true_pos, false_pos, false_neg = self.calcAccTitleLine(htmlnode)
        column_errors = self.calcAccColumn(htmlnode)
        return (true_pos, false_pos, false_neg, column_errors)

    def calcAccTitleLine(self, root):
        """Count true/false positives and false negatives for title lines.

        Elements under ``root`` whose ``predict`` attribute equals
        ``LABEL['TITLE_LINE']`` are compared with those whose ``label``
        attribute equals the same value.

        Returns:
            ``(tp, fp, fn)``: elements in both sets, predicted-only
            elements, and labelled-only elements.
        """
        title_line = LABEL['TITLE_LINE']
        predicted = set(root.findall('.//*[@predict="{}"]'.format(title_line)))
        labelled = set(root.findall('.//*[@label="{}"]'.format(title_line)))
        matched = len(predicted & labelled)
        return (matched, len(predicted) - matched, len(labelled) - matched)
    def calcAccColumn(self, root):
        k = 1
        columns = {}
        while True:
            cs = root.findall('.//*[@column="{}"]'.format(k))
            if len(cs) == 0:
                break
            columns[k] = set(cs)
            k += 1
        dls = ['AUTHOR', 'COUNT_READ', 'COUNT_REPLY', 'TITLE', 'TM_POST', 'TM_REPLY']
        err = set()
        for key in dls:
            ts = set(root.findall('.//*[@predict="{}"]//*[@label="{}"]'.format(LABEL['TITLE_LINE'],LABEL[key])))
            cs = set()
#.........這裏部分代碼省略.........
開發者ID:cheungzq,項目名稱:WebParser,代碼行數:103,代碼來源:Analyser.py


注:本文中的Detector.Detector.detect方法示例由純淨天空整理自Github/MSDocs等開源代碼及文檔管理平台,相關代碼片段篩選自各路編程大神貢獻的開源項目,源碼版權歸原作者所有,傳播和使用請參考對應項目的License;未經允許,請勿轉載。