import java.awt.Color;
import java.awt.image.BufferedImage;
import java.io.File;
import java.util.ArrayList;
import java.util.HashMap;
import java.util.List;
import java.util.Map;

import javax.imageio.ImageIO;

/**
 * Minimal template-matching recognizer for fixed-layout CAPTCHA images.
 *
 * <p>The pipeline is: binarize the image ({@link #removeBackgroud(String)}),
 * cut it into four fixed glyph cells ({@link #splitImage(BufferedImage)}), and
 * label each cell with the template that differs from it in the fewest pixels
 * ({@link #getSingleCharOcr(BufferedImage, Map)}).
 */
public class ImagePreProcess {

	/** A pixel counts as white when the sum of its R, G and B channels exceeds this value. */
	private static final int WHITE_THRESHOLD = 590;

	/**
	 * Classifies a pixel as white or non-white by brightness.
	 *
	 * @param colorInt packed RGB value as returned by {@link BufferedImage#getRGB(int, int)};
	 *                 the alpha bits are ignored
	 * @return 1 if red + green + blue is greater than 590, otherwise 0
	 */
	public static int isWhite(int colorInt) {
		// Same channel extraction java.awt.Color performs, without allocating per pixel.
		int red = (colorInt >> 16) & 0xFF;
		int green = (colorInt >> 8) & 0xFF;
		int blue = colorInt & 0xFF;
		return red + green + blue > WHITE_THRESHOLD ? 1 : 0;
	}

	/**
	 * Reads an image file and binarizes it in place: every pixel that
	 * {@link #isWhite(int)} classifies as white becomes pure white, every other
	 * pixel becomes pure black.
	 *
	 * @param picFile path of the image file to load
	 * @return the loaded image after binarization
	 * @throws IllegalArgumentException if the file cannot be decoded as an image
	 * @throws Exception if reading the file fails
	 */
	public static BufferedImage removeBackgroud(String picFile)
			throws Exception {
		BufferedImage img = ImageIO.read(new File(picFile));
		if (img == null) {
			// ImageIO.read returns null (rather than throwing) when no reader understands the file.
			throw new IllegalArgumentException("Not a readable image: " + picFile);
		}
		int white = Color.WHITE.getRGB();
		int black = Color.BLACK.getRGB();
		int width = img.getWidth();
		int height = img.getHeight();
		for (int x = 0; x < width; ++x) {
			for (int y = 0; y < height; ++y) {
				img.setRGB(x, y, isWhite(img.getRGB(x, y)) == 1 ? white : black);
			}
		}
		return img;
	}

	/**
	 * Splits the CAPTCHA image into four single-character sub-images.
	 *
	 * <p>The cell coordinates are hard-coded and must be adjusted to the layout of
	 * the CAPTCHA being recognized. The image must be at least 69 pixels wide and
	 * 25 pixels high, otherwise {@link BufferedImage#getSubimage} throws.
	 *
	 * @param img the (binarized) CAPTCHA image
	 * @return the four glyph cells, left to right; they share pixel data with {@code img}
	 * @throws Exception declared for interface compatibility
	 */
	public static List<BufferedImage> splitImage(BufferedImage img)
			throws Exception {
		List<BufferedImage> subImgs = new ArrayList<BufferedImage>();
		// These numbers should be tuned to the size of the CAPTCHA.
		subImgs.add(img.getSubimage(25, 0, 12, 25));
		subImgs.add(img.getSubimage(38, 0, 11, 25));
		subImgs.add(img.getSubimage(48, 0, 11, 25));
		subImgs.add(img.getSubimage(58, 0, 11, 25));
		return subImgs;
	}

	/**
	 * Loads the template library: every regular file in {@code trainPath} whose
	 * name ends with {@code "jpg"} is read as an image and labelled with the first
	 * character of its file name. Files that cannot be decoded are skipped.
	 *
	 * @param trainPath directory containing the template images
	 * @return map from template image to its one-character label
	 * @throws IllegalArgumentException if {@code trainPath} is not a listable directory
	 * @throws Exception if reading a template file fails
	 */
	public static Map<BufferedImage, String> loadTrainData(String trainPath) throws Exception {
		Map<BufferedImage, String> map = new HashMap<BufferedImage, String>();
		File[] files = new File(trainPath).listFiles();
		if (files == null) {
			// listFiles() returns null when the path is not a directory or cannot be read.
			throw new IllegalArgumentException("Not a readable directory: " + trainPath);
		}
		for (File file : files) {
			String name = file.getName();
			if (!file.isFile() || !name.endsWith("jpg")) {
				continue;
			}
			BufferedImage template = ImageIO.read(file);
			if (template != null) {
				// A null key would blow up later during matching, so undecodable files are dropped.
				map.put(template, String.valueOf(name.charAt(0)));
			}
		}
		return map;
	}

	/**
	 * Recognizes a single glyph by comparing it against every template and
	 * returning the label of the template with the fewest differing pixels.
	 *
	 * <p>Only the region where the glyph and the template overlap is compared.
	 * A template is accepted only if its mismatch count is strictly below the
	 * best count so far, which starts at {@code width * height} of the glyph.
	 *
	 * @param img the glyph image to recognize
	 * @param map template images mapped to their labels
	 * @return the label of the best-matching template, or an empty string if no
	 *         template beats the initial bound
	 */
	public static String getSingleCharOcr(BufferedImage img,
			Map<BufferedImage, String> map) {
		String result = "";
		int width = img.getWidth();
		int height = img.getHeight();
		int min = width * height;
		for (Map.Entry<BufferedImage, String> entry : map.entrySet()) {
			BufferedImage template = entry.getKey();
			// Clamp to the overlap on BOTH axes; the row limit must use the template's height.
			int maxX = Math.min(width, template.getWidth());
			int maxY = Math.min(height, template.getHeight());
			int count = 0;
			scan: for (int x = 0; x < maxX; ++x) {
				for (int y = 0; y < maxY; ++y) {
					if (isWhite(img.getRGB(x, y)) != isWhite(template.getRGB(x, y))) {
						count++;
						if (count >= min) {
							// Already no better than the current best; stop scanning this template.
							break scan;
						}
					}
				}
			}
			if (count < min) {
				min = count;
				result = entry.getValue();
			}
		}
		return result;
	}

	/**
	 * Recognition entry point: binarizes the image, splits it into glyphs,
	 * recognizes each glyph against the templates in {@code C:/test/train}, and
	 * writes the binarized image to {@code C:/test/result/<text>.jpg}.
	 *
	 * @param file path of the CAPTCHA image
	 * @return the recognized text, one character per glyph cell
	 * @throws Exception if any image cannot be read or written
	 */
	public static String getAllOcr(String file) throws Exception {
		BufferedImage img = removeBackgroud(file);
		List<BufferedImage> listImg = splitImage(img);
		Map<BufferedImage, String> map = loadTrainData("C:/test/train");
		StringBuilder text = new StringBuilder();
		for (BufferedImage bi : listImg) {
			text.append(getSingleCharOcr(bi, map));
		}
		String result = text.toString();
		ImageIO.write(img, "JPG", new File("C:/test/result/"+result+".jpg"));
		return result;
	}


	/**
	 * Runs the recognizer on {@code C:/test/src.jpeg} and prints the result.
	 *
	 * @param args unused
	 * @throws Exception if recognition fails
	 */
	public static void main(String[] args) throws Exception {
		String text = getAllOcr("C:/test/src.jpeg");
		System.out.println("jpg = " + text);
	}
}

 

// posted on 2012-11-27 17:27 by codevoter | views (221) | comments (0) | edit | bookmark | report
//
// ASP.NET HOSTING