本文整理汇总了Java中net.sourceforge.tess4j.Tesseract.getInstance方法的典型用法代码示例。如果您正苦于以下问题:Java Tesseract.getInstance方法的具体用法?Java Tesseract.getInstance怎么用?Java Tesseract.getInstance使用的例子?那么，这里精选的方法代码示例或许可以为您提供帮助。您也可以进一步了解该方法所在类net.sourceforge.tess4j.Tesseract的用法示例。
在下文中一共展示了Tesseract.getInstance方法的11个代码示例,这些例子默认根据受欢迎程度排序。您可以为喜欢或者感觉有用的代码点赞,您的评价将有助于系统推荐出更棒的Java代码示例。
示例1: map
import net.sourceforge.tess4j.Tesseract; //导入方法依赖的package包/类
/**
 * Downloads the video referenced by {@code url}, splits it into frames, runs
 * OCR on every processed frame and emits each non-empty recognition result
 * keyed by the URL.
 *
 * @param key      unused by this method
 * @param url      location of the video to download
 * @param output   collector receiving one {@code (url, text)} pair per frame with text
 * @param reporter unused by this method
 * @throws IOException if the URL is malformed or the download directory
 *                     contains no file after the download
 */
public void map(LongWritable key, Text url, OutputCollector<Text, Text> output, Reporter reporter) throws IOException {
    File videoDownloadDir = Files.createTempDir();
    VGet v = new VGet(new URL(url.toString()), videoDownloadDir);
    v.download();
    System.loadLibrary(Core.NATIVE_LIBRARY_NAME);

    // listFiles() returns null on I/O error and an empty array when nothing
    // was downloaded; both would otherwise fail below with an unhelpful
    // NullPointerException / ArrayIndexOutOfBoundsException.
    File[] videoFiles = videoDownloadDir.listFiles();
    if (videoFiles == null || videoFiles.length == 0) {
        throw new IOException("No video file was downloaded for " + url);
    }
    Arrays.sort(videoFiles);

    // NOTE(review): the meaning of the second argument (70) is defined by
    // VideoProcessing.parseVideo, which is not visible here.
    File[] videoFramesFiles = VideoProcessing.parseVideo(videoFiles[0], 70);
    File[] processedVideoFrames = VideoProcessing.cutImages(videoFramesFiles);

    Tesseract instance = Tesseract.getInstance();
    instance.setDatapath("/usr/share/tesseract-ocr");
    instance.setTessVariable("LC_NUMERIC", "C");

    for (File image : processedVideoFrames) {
        String result;
        try {
            result = instance.doOCR(image);
        } catch (TesseractException e) {
            // A single unreadable frame must not abort the whole video:
            // report it and move on. Previously execution fell through with
            // result == null and crashed on result.isEmpty().
            e.printStackTrace();
            continue;
        }
        if (result != null && !result.isEmpty()) {
            // 'word' is declared outside this method.
            word.set(result);
            output.collect(url, word);
        }
    }
}
示例2: main
import net.sourceforge.tess4j.Tesseract; //导入方法依赖的package包/类
/**
 * Demo entry point: prints the JVM temp directory and the TESSDATA_PREFIX
 * environment variable, loads a fixed PNG, converts it to grayscale, scales
 * it to five times its width and height, and prints the text recognised with
 * the "chi_sim" language.
 *
 * @param args ignored
 */
public static void main(final String[] args) {
    try {
        System.out.println(System.getProperty("java.io.tmpdir"));
        System.out.println(System.getenv("TESSDATA_PREFIX"));

        final BufferedImage source = new Image("d:\\test\\pdf\\test10.png").getAsBufferedImage();
        final BufferedImage gray = ImageHelper.convertImageToGrayscale(source);
        final int scaledWidth = gray.getWidth() * 5;
        final int scaledHeight = gray.getHeight() * 5;
        final BufferedImage enlarged = ImageHelper.getScaledInstance(gray, scaledWidth, scaledHeight);

        final Tesseract ocr = Tesseract.getInstance();
        ocr.setLanguage("chi_sim");
        System.out.println("instance done");

        final String recognised = ocr.doOCR(enlarged);
        System.out.println(recognised);
    } catch (Throwable failure) {
        // Rethrow anything, checked or not, without declaring it.
        throw Exceptions.sneakyThrow(failure);
    }
}
示例3: recognizeText
import net.sourceforge.tess4j.Tesseract; //导入方法依赖的package包/类
/**
 * Recognises English text in the given image.
 * <p>
 * The image is first enlarged with {@code image.scale(8)} to make the text
 * easier to read, then passed to Tesseract using the default OCR engine mode.
 *
 * @param image the image containing the text
 * @return the text returned by Tesseract
 * @throws IllegalStateException if recognition fails for any reason; the
 *                               original exception is attached as the cause
 */
public static String recognizeText(Image image) {
    LibraryLoaderSingleton.getInstance();
    Image scaledImage = image.scale(8);
    Tesseract instance = Tesseract.getInstance(); // JNA Interface Mapping
    instance.setLanguage("eng");
    System.setProperty("jna.encoding", "UTF8");
    instance.setOcrEngineMode(TessAPI.TessOcrEngineMode.OEM_DEFAULT);
    try {
        return instance.doOCR(scaledImage.getInnerImage());
    } catch (TesseractException e) {
        throw new IllegalStateException(e);
    } catch (Exception ex) {
        // Keep the cause: without it the real failure is impossible to diagnose.
        throw new IllegalStateException("An error during text recognition was encountered.", ex);
    }
}
示例4: recognizeYText
import net.sourceforge.tess4j.Tesseract; //导入方法依赖的package包/类
/**
 * Recognises English text in the given image after enlarging it with
 * {@code image.scale(8)}, using Tesseract's default OCR engine mode.
 *
 * @param image the image containing the text
 * @return the text returned by Tesseract
 * @throws IllegalStateException if recognition fails for any reason; the
 *                               original exception is attached as the cause
 */
public static String recognizeYText(Image image) {
    LibraryLoaderSingleton.getInstance();
    Image scaledImage = image.scale(8);
    Tesseract instance = Tesseract.getInstance(); // JNA Interface Mapping
    instance.setLanguage("eng");
    System.setProperty("jna.encoding", "UTF8");
    instance.setOcrEngineMode(TessAPI.TessOcrEngineMode.OEM_DEFAULT);
    try {
        return instance.doOCR(scaledImage.getInnerImage());
    } catch (TesseractException e) {
        throw new IllegalStateException(e);
    } catch (Exception ex) {
        // Keep the cause: without it the real failure is impossible to diagnose.
        throw new IllegalStateException("An error during text recognition was encountered.", ex);
    }
}
示例5: main
import net.sourceforge.tess4j.Tesseract; //导入方法依赖的package包/类
/**
 * Demo entry point: reads a fixed captcha image, applies the binary, line
 * and mean filters from {@code ImageUtil}, writes the filtered image to disk
 * as JPEG and prints the text Tesseract recognises in that file.
 * <p>
 * Any failure is reported on standard error via the stack trace.
 *
 * @param args ignored
 */
public static void main(String[] args){
    try {
        BufferedImage image = ImageIO.read(new File("D:\\爬虫测试\\yzm\\11.jpg"));
        if (image == null) {
            // ImageIO.read returns null (rather than throwing) when no
            // registered reader can decode the file.
            throw new IllegalStateException("Input image could not be decoded");
        }

        image = ImageUtil.binaryFilter(image);
        image = ImageUtil.lineFilter(image);
        image = ImageUtil.meanFilter(image);

        File imageFile = new File("E:/captcha5.jpg");
        if (!ImageIO.write(image, "jpg", imageFile)) {
            // ImageIO.write returns false when no suitable writer exists; in
            // that case OCR would run against a missing or stale file.
            throw new IllegalStateException("Filtered image could not be written as jpg");
        }

        Tesseract tesseract = Tesseract.getInstance();
        tesseract.setLanguage("eng");
        String code = tesseract.doOCR(imageFile);
        System.out.println(code);
    } catch (Exception e) {
        e.printStackTrace();
    }
}
示例6: ocr
import net.sourceforge.tess4j.Tesseract; //导入方法依赖的package包/类
/**
 * Runs English-language OCR on the given file using the tessdata directory
 * configured in {@code tessdataPath}.
 *
 * @param file the image file to recognise
 * @return the recognised text, or an empty string when Tesseract reports an
 *         error (the error message is printed to standard error)
 */
public static String ocr(File file) {
    final Tesseract engine = Tesseract.getInstance(); // JNA Interface Mapping
    engine.setDatapath(tessdataPath);
    engine.setLanguage("eng");
    try {
        return engine.doOCR(file);
    } catch (TesseractException failure) {
        System.err.println(failure.getMessage());
        return "";
    }
}
示例7: recognizeXText
import net.sourceforge.tess4j.Tesseract; //导入方法依赖的package包/类
/**
 * Recognises text in the given image using Tesseract's
 * {@code OEM_TESSERACT_ONLY} engine mode.
 * <p>
 * Before recognition the inner image is scaled to twice its width and height
 * with {@code getScaledImage} and passed through {@code thresholdImage} with
 * a threshold argument of 165.
 *
 * @param image the image containing the text
 * @return the text returned by Tesseract
 * @throws IllegalStateException if recognition fails for any reason; the
 *                               original exception is attached as the cause
 */
public static String recognizeXText(Image image) {
    LibraryLoaderSingleton.getInstance();
    Tesseract instance = Tesseract.getInstance(); // JNA Interface Mapping
    instance.setOcrEngineMode(TessAPI.TessOcrEngineMode.OEM_TESSERACT_ONLY);
    BufferedImage inner = image.getInnerImage();
    BufferedImage img = getScaledImage(inner, inner.getWidth() * 2, inner.getHeight() * 2);
    img = thresholdImage(img, 165);
    try {
        return instance.doOCR(img);
    } catch (TesseractException e) {
        throw new IllegalStateException(e);
    } catch (Exception ex) {
        // Keep the cause: without it the real failure is impossible to diagnose.
        throw new IllegalStateException("An error during text recognition was encountered.", ex);
    }
}
示例8: performOcr
import net.sourceforge.tess4j.Tesseract; //导入方法依赖的package包/类
/**
 * Runs Tesseract on an image and returns the trimmed recognition result.
 * <p>
 * The page segmentation mode is chosen per call by
 * {@code getTesseractPageSegMode(iteration)}.
 *
 * @param image     the image to recognise; should already be cropped and
 *                  filtered so that the contrast is sufficient
 * @param iteration value forwarded to {@code getTesseractPageSegMode} to pick
 *                  the page segmentation mode
 * @return the recognised text with leading and trailing whitespace removed
 * @throws OcrException if anything goes wrong while configuring or running
 *                      Tesseract; the underlying exception is the cause
 */
protected String performOcr(BufferedImage image, int iteration) throws OcrException {
    try {
        final Tesseract engine = Tesseract.getInstance();
        engine.setPageSegMode(getTesseractPageSegMode(iteration));
        return engine.doOCR(image).trim();
    } catch (Exception cause) {
        throw new OcrException("Error performing OCR", cause);
    }
}
示例9: doOcrFile
import net.sourceforge.tess4j.Tesseract; //导入方法依赖的package包/类
/**
 * Decodes the Base64 image carried in the request body into a temporary
 * file, runs OCR on that file and logs the recognised text at debug level.
 * The temporary file is removed afterwards whether or not OCR succeeded.
 *
 * @param image request payload providing the Base64 image data and the file
 *              extension used as the temporary file's suffix
 * @return a {@code Status} of "success" when OCR completed
 * @throws Exception a {@code TesseractException} wrapping the original
 *                   failure if decoding, writing or OCR fails, or an
 *                   {@code IOException} if the temporary file cannot be created
 */
@RequestMapping(value = "ocr/v0.9/upload", method = RequestMethod.POST, consumes = MediaType.APPLICATION_JSON_VALUE, produces = MediaType.APPLICATION_JSON_VALUE)
public Status doOcrFile(@RequestBody final Image image) throws Exception {
    File tmpFile = File.createTempFile("ocr_image", image.getExtension());
    try {
        FileUtils.writeByteArrayToFile(tmpFile, Base64.decodeBase64(image.getImage()));
        Tesseract tesseract = Tesseract.getInstance(); // JNA Interface Mapping
        String imageText = tesseract.doOCR(tmpFile);
        LOGGER.debug("OCR Image Text = " + imageText);
    } catch (Exception e) {
        LOGGER.error("Exception while converting/uploading image: ", e);
        // Attach the cause so callers see why OCR failed instead of an
        // empty TesseractException.
        throw new TesseractException(e);
    } finally {
        // Best-effort cleanup of the temporary file.
        tmpFile.delete();
    }
    return new Status("success");
}
示例10: doOcr
import net.sourceforge.tess4j.Tesseract; //导入方法依赖的package包/类
/**
 * Decodes the Base64 image carried in the request body, runs OCR on it in
 * memory, stores the recognised text on the payload and saves the payload
 * through {@code repository}.
 *
 * @param image request payload providing the Base64 image data; its text is
 *              set to the OCR result before it is saved
 * @return a {@code Status} of "success" when OCR and saving completed
 * @throws Exception a {@code TesseractException} wrapping the original
 *                   failure if decoding, OCR or saving fails
 */
@RequestMapping(value = "ocr/v1/upload", method = RequestMethod.POST, consumes = MediaType.APPLICATION_JSON_VALUE, produces = MediaType.APPLICATION_JSON_VALUE)
public Status doOcr(@RequestBody Image image) throws Exception {
    try {
        ByteArrayInputStream bis = new ByteArrayInputStream(Base64.decodeBase64(image.getImage()));
        BufferedImage decoded = ImageIO.read(bis);
        if (decoded == null) {
            // ImageIO.read returns null when the bytes are not in any
            // supported image format; fail with a clear message instead of
            // passing null to Tesseract.
            throw new IllegalArgumentException("Uploaded data is not a supported image format");
        }
        Tesseract tesseract = Tesseract.getInstance(); // JNA Interface Mapping
        String imageText = tesseract.doOCR(decoded);
        image.setText(imageText);
        repository.save(image);
        LOGGER.debug("OCR Result = " + imageText);
    } catch (Exception e) {
        LOGGER.error("TessearctException while converting/uploading image: ", e);
        // Attach the cause so callers see why OCR failed instead of an
        // empty TesseractException.
        throw new TesseractException(e);
    }
    return new Status("success");
}
示例11: parse
import net.sourceforge.tess4j.Tesseract; //导入方法依赖的package包/类
/**
 * Recognises the text in an image using the configured {@code language},
 * strips every character outside the allowed set (word characters, newline,
 * space and a fixed list of punctuation marks), prints the cleaned text and
 * hands it to {@code read}.
 *
 * @param image the image to recognise
 * @throws Exception if OCR or the subsequent {@code read} call fails
 */
public static void parse(BufferedImage image) throws Exception {
    final Tesseract engine = Tesseract.getInstance();
    engine.setLanguage(language);

    final String recognised = engine.doOCR(image).trim();
    final String cleaned = recognised.replaceAll("[^\\w\n.,;!?\'\":»«„”\\(\\) ]", "");

    System.out.println(cleaned);
    read(cleaned);
}