当前位置: 首页>>代码示例>>Python>>正文


Python pyocr.get_available_tools方法代码示例

本文整理汇总了Python中pyocr.get_available_tools方法的典型用法代码示例。如果您正苦于以下问题:Python pyocr.get_available_tools方法的具体用法?Python pyocr.get_available_tools怎么用?Python pyocr.get_available_tools使用的例子?那么恭喜您, 这里精选的方法代码示例或许可以为您提供帮助。您也可以进一步了解该方法所在pyocr的用法示例。


在下文中一共展示了pyocr.get_available_tools方法的6个代码示例,这些例子默认根据受欢迎程度排序。您可以为喜欢或者感觉有用的代码点赞,您的评价将有助于系统推荐出更棒的Python代码示例。

示例1: __init__

# 需要导入模块: import pyocr [as 别名]
# 或者: from pyocr import get_available_tools [as 别名]
def __init__(self, ocr_language):
        """Select the first available OCR tool and choose the OCR language.

        Prints the selected tool and language to stdout. Terminates the
        process with exit status 1 when pyocr reports no OCR tool.

        Args:
            ocr_language: Preferred OCR language code. It is used when the
                selected tool lists it among its available languages.

        Sets:
            self.tool: The first tool returned by
                ``pyocr.get_available_tools()``.
            self.lang: ``ocr_language`` when the tool supports it, otherwise
                the tool's first available language. When the language list
                is empty or cannot be queried, ``ocr_language`` is kept as a
                best-effort fallback.
        """
        tools = pyocr.get_available_tools()
        if not tools:
            print("No OCR tool found")
            sys.exit(1)
        self.tool = tools[0]
        print("OCR tool: %s" % self.tool)

        # Define self.lang up front: previously any failure below (including
        # an empty language list) left the attribute unset, so later reads of
        # self.lang raised AttributeError far away from the real cause.
        self.lang = ocr_language
        try:
            langs = self.tool.get_available_languages()
        except Exception as e:
            # Best-effort: report the problem and keep the requested language.
            print("{}".format(e))
        else:
            if langs:
                if ocr_language not in langs:
                    self.lang = langs[0]
                print("OCR selected language: %s (available: %s)"
                      % (self.lang.upper(), ", ".join(langs)))
            else:
                print("No OCR language found")
开发者ID:lucab85,项目名称:PDFtoTXT,代码行数:18,代码来源:LocalOCR.py

示例2: __init__

# 需要导入模块: import pyocr [as 别名]
# 或者: from pyocr import get_available_tools [as 别名]
def __init__(self, path):
        """Select the first available OCR tool and choose the OCR language.

        Prints the selected tool and language to stdout. Terminates the
        process with exit status 1 when pyocr reports no OCR tool.

        Args:
            path: Accepted for interface compatibility; this constructor does
                not read or store it.

        Sets:
            self.tool: The first tool returned by
                ``pyocr.get_available_tools()``.
            self.lang: ``'eng'`` when the tool supports it, otherwise the
                tool's first available language. When the language list is
                empty or cannot be queried, ``'eng'`` is kept as a
                best-effort fallback.
        """
        ocr_language = 'eng'

        tools = pyocr.get_available_tools()
        if not tools:
            print("No OCR tool found")
            sys.exit(1)
        self.tool = tools[0]
        print("OCR tool: %s" % self.tool)

        # Define self.lang up front: previously any failure below (including
        # an empty language list) left the attribute unset, so later reads of
        # self.lang raised AttributeError far away from the real cause.
        self.lang = ocr_language
        try:
            langs = self.tool.get_available_languages()
        except Exception as e:
            # Best-effort: report the problem and keep the default language.
            print("{}".format(e))
        else:
            if langs:
                if ocr_language not in langs:
                    self.lang = langs[0]
                print("OCR selected language: %s (available: %s)"
                      % (self.lang.upper(), ", ".join(langs)))
            else:
                print("No OCR language found")
开发者ID:aryaminus,项目名称:saram,代码行数:26,代码来源:saram.py

示例3: check_required_software

# 需要导入模块: import pyocr [as 别名]
# 或者: from pyocr import get_available_tools [as 别名]
def check_required_software():
        """Verify that at least one OCR tool is available through pyocr.

        Logs an informational message when exactly one tool is found (results
        are expected to be better with both Tesseract and Cuneiform installed)
        and a different one when more than one tool is found.

        Raises:
            PyOCRIntegrationNoOCRFound: If pyocr reports no OCR tool.
        """
        logger = logging.getLogger(__name__)
        tools = pyocr.get_available_tools()
        if not tools:
            # The original message stopped at "Make sure it's on"; complete it
            # so the operator knows what to check.
            raise PyOCRIntegrationNoOCRFound('No OCR tool has been found on '
                                             'this system. Make sure it\'s on '
                                             'PATH variable of your system')
        if len(tools) == 1:
            # Lazy %-style arguments: the message is only formatted when the
            # INFO level is actually enabled.
            logger.info("I've found only one ocr tool [%s]. This is not exactly "
                        "an error but you should get better results if you have "
                        "both Tesseract and Cuneiform installed",
                        tools[0].get_name())
        else:
            logger.info("I've found all required software. We're good to go =)")
开发者ID:nfscan,项目名称:ocr-process-service,代码行数:15,代码来源:ocr.py

示例4: initialize

# 需要导入模块: import pyocr [as 别名]
# 或者: from pyocr import get_available_tools [as 别名]
def initialize(self):
		"""Pick the first OCR tool reported by pyocr and cache its languages.

		Prints a hint and exits the process with status 1 when pyocr reports
		no tool. Otherwise stores the first tool on ``self.tool`` and that
		tool's available languages on ``self.langs``.
		"""
		available = pyocr.get_available_tools()
		if not available:
			print("No tools found, do you have Tesseract installed?")
			sys.exit(1)

		# Only the first reported tool is used.
		self.tool = available[0]
		self.langs = self.tool.get_available_languages()
开发者ID:008karan,项目名称:PAN_OCR,代码行数:10,代码来源:tesseract_ocr.py

示例5: get_default_ocr_lang

# 需要导入模块: import pyocr [as 别名]
# 或者: from pyocr import get_available_tools [as 别名]
def get_default_ocr_lang():
    """Guess the OCR language to use from the result of ``find_language()``.

    Returns ``DEFAULT_OCR_LANG`` when pyocr reports no OCR tool, or when
    neither the ``iso639_3_code`` nor the ``terminology`` attribute of the
    detected language is among the first tool's available languages.
    Otherwise returns the first of those two codes that the tool supports.
    """
    tools = pyocr.get_available_tools()
    if not tools:
        return DEFAULT_OCR_LANG
    supported = tools[0].get_available_languages()

    detected = find_language()
    # Candidate attributes, checked in priority order.
    for attr_name in ('iso639_3_code', 'terminology'):
        if not hasattr(detected, attr_name):
            continue
        code = getattr(detected, attr_name)
        if code in supported:
            return code
    return DEFAULT_OCR_LANG
开发者ID:openpaperwork,项目名称:paperwork-backend,代码行数:17,代码来源:config.py

示例6: image_to_string

# 需要导入模块: import pyocr [as 别名]
# 或者: from pyocr import get_available_tools [as 别名]
def image_to_string(self, filename):
        """Run every available OCR tool on an image and collect the results.

        Two derived images are written next to ``filename``: a grayscale copy
        (``_gray`` inserted before the extension) and an adaptive-threshold
        copy (``_adt``). Both are passed to ``self._cleanup`` before
        returning. A tool named "Tesseract" is run on the original image
        only; every other tool is run on the original, the grayscale and the
        thresholded image. Each run happens in its own
        ``self._OCRProcessingThread`` using ``self.lang``.

        Args:
            filename: Path of the image to recognise.

        Returns:
            A list with the ``return_value`` of every worker, in the order
            the workers were started.

        Raises:
            PyOCRIntegrationNoOCRFound: If pyocr reports no OCR tool.
        """
        tools = pyocr.get_available_tools()
        if not tools:
            # A space was missing between the concatenated literals, which
            # produced "...it's onPATH variable...".
            raise PyOCRIntegrationNoOCRFound('No OCR tool has been found on '
                                             'this system. Make sure it\'s on '
                                             'PATH variable of your system')

        filename_split, fileextension_split = os.path.splitext(filename)

        grayscale_filename = filename_split + '_gray' + fileextension_split
        with WandImage(filename=filename) as img:
            img.type = 'grayscale'
            img.save(filename=grayscale_filename)

        adaptive_thresh_filename = filename_split + '_adt' + fileextension_split
        ScikitImageIntegration.adaptive_threshold(grayscale_filename, adaptive_thresh_filename)

        processes = []
        for tool in tools:
            if tool.get_name() == "Tesseract":
                inputs = (filename,)
            else:
                inputs = (filename, grayscale_filename,
                          adaptive_thresh_filename)

            for image_path in inputs:
                worker = self._OCRProcessingThread(tool, self.lang, image_path)
                worker.start()
                processes.append(worker)

        # Wait for all workers with join() rather than polling is_alive() in
        # a tight loop, which kept a CPU core busy for the whole OCR run.
        # NOTE(review): assumes _OCRProcessingThread derives from
        # threading.Thread (start()/is_alive() were already used on it) --
        # confirm join() is available.
        for worker in processes:
            worker.join()
        result = [worker.return_value for worker in processes]

        # Removing generated files
        self._cleanup(grayscale_filename)
        self._cleanup(adaptive_thresh_filename)

        return result
开发者ID:nfscan,项目名称:ocr-process-service,代码行数:62,代码来源:ocr.py


注:本文中的pyocr.get_available_tools方法示例由纯净天空整理自Github/MSDocs等开源代码及文档管理平台,相关代码片段筛选自各路编程大神贡献的开源项目,源码版权归原作者所有,传播和使用请参考对应项目的License;未经允许,请勿转载。