import net.sourceforge.tess4j.ITesseract;
import net.sourceforge.tess4j.Tesseract;
import net.sourceforge.tess4j.TesseractException;
import javax.imageio.ImageIO;
import java.awt.*;
import java.awt.image.BufferedImage;
import java.io.File;
import java.util.HashMap;
import java.util.Map;
/**
 * Command-line driver that runs Tesseract OCR over a fixed set of rectangular
 * regions of one image and collects the recognised text per region.
 *
 * <p>The region coordinates are hard-coded for an image that is
 * {@value #TARGET_WIDTH} pixels wide; when the image has a different width,
 * {@code ImageUtils.zoomImage} is asked to resize it to
 * {@value #TARGET_WIDTH} x {@value #TARGET_HEIGHT} first.
 */
public class Tes_Cut {

    /** Image that is scanned. */
    private static final String IMAGE_PATH = "/home/ubt/ocr/2.jpg";

    /** Image size the region coordinates below were measured against. */
    private static final int TARGET_WIDTH = 2590;
    private static final int TARGET_HEIGHT = 3903;

    /** Left edge and width shared by every region except the first one. */
    private static final int FIELD_X = 476;
    private static final int FIELD_WIDTH = 1978;

    /** Height of every region except the last one. */
    private static final int ROW_HEIGHT = 245;

    /** Regions to recognise, in scan order, with the map key each result is stored under. */
    private static final Region[] REGIONS = {
        new Region("不动产", new Rectangle(50, 40, 2425, ROW_HEIGHT)),
        field("权利人", 285, ROW_HEIGHT),
        field("共有情况", 530, ROW_HEIGHT),
        field("坐落", 775, ROW_HEIGHT),
        field("不动产单元号", 1020, ROW_HEIGHT),
        field("权利类型", 1265, ROW_HEIGHT),
        field("权利性质", 1510, ROW_HEIGHT),
        field("用途", 1755, ROW_HEIGHT),
        field("面积", 2000, ROW_HEIGHT),
        field("使用期限", 2245, ROW_HEIGHT),
        field("权利其他状况", 2490, 1300),
    };

    /** Pairs a result key with the image area that is recognised for it. */
    private static final class Region {
        final String label;
        final Rectangle area;

        Region(String label, Rectangle area) {
            this.label = label;
            this.area = area;
        }
    }

    /** Builds a region in the shared value column ({@link #FIELD_X}, {@link #FIELD_WIDTH}). */
    private static Region field(String label, int y, int height) {
        return new Region(label, new Rectangle(FIELD_X, y, FIELD_WIDTH, height));
    }

    /**
     * Recognises every entry of {@link #REGIONS} in the image at {@link #IMAGE_PATH},
     * prints each cleaned result as it is produced and finally prints the whole
     * label-to-text map.
     *
     * <p>Returns early with a message on standard output when the file is missing
     * or cannot be decoded as an image. A {@link TesseractException} aborts the scan
     * and its stack trace is printed; the map is not printed in that case.
     *
     * @param args ignored
     * @throws Exception if reading the image fails, or if {@code ImageUtils.zoomImage}
     *                   or {@code TextUtils.clearFormat} throws
     */
    public static void main(String[] args) throws Exception {
        File imageFile = new File(IMAGE_PATH);
        if (!imageFile.exists()) {
            System.out.println("======== don't find this file! ========");
            return;
        }

        // ImageIO.read returns null (it does not throw) when no registered reader
        // understands the file, so guard before touching the image.
        BufferedImage image = ImageIO.read(imageFile);
        if (image == null) {
            System.out.println("======== can't decode this image! ========");
            return;
        }

        if (image.getWidth() != TARGET_WIDTH) {
            // NOTE(review): presumably zoomImage rewrites the file in place, since the
            // same path is handed to Tesseract afterwards - confirm against ImageUtils.
            ImageUtils.zoomImage(imageFile, TARGET_WIDTH, TARGET_HEIGHT);
        }

        ITesseract iTesseract = new Tesseract();
        iTesseract.setDatapath("./tessdata/");
        iTesseract.setLanguage("eng+chi_sim");

        Map<String, String> resultMap = new HashMap<>();
        try {
            for (Region region : REGIONS) {
                // clearFormat is applied once and the result reused for printing and storing;
                // assumes clearFormat has no side effects - confirm against TextUtils.
                String text = TextUtils.clearFormat(iTesseract.doOCR(imageFile, region.area));
                System.out.println(text);
                resultMap.put(region.label, text);
            }
            System.out.println(resultMap.toString());
        } catch (TesseractException e) {
            e.printStackTrace();
        }
    }
}