Canvas简单验证码识别

有感于canvas无穷的魅力,使用canvas折腾了一个简单的验证码识别。当然是最简单的验证码识别了,不过准确率还好能达到100%。

首先看一下我们准备识别的验证码,绿色的背景,白色的噪点,黑色的文字(数字0-9),位置和颜色固定,没有旋转,够简单吧。

p1

思路:

1、收集验证码样本,要包括0-9所有的数字。

2、用ps等图像处理工具分析我们将要识别的验证码,得出第一个文字距离左边的位置,字距离顶部的位置,字的宽高以及字与字之间的间隔。这个过程要尽可能的精确,这是我们后期验证码识别是否正确的基本。

3、对验证码样本进行二值化,得出每个数字对应的二值化序列组成素材库。

4、取需要识别的图片的每个数字的二值化序列和素材库中的序列进行比对,比较其相似程度,得出对应的数字。

实现代码:

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
<!DOCTYPE html>
<html>
<head>
<meta charset="utf-8">
<meta http-equiv="X-UA-Compatible" content="IE=edge,chrome=1">
<title>Canvas简单验证码识别</title>
<meta name="description" content="">
<meta name="keywords" content="">
<link href="" rel="stylesheet">
</head>
<body>
<img src="#" id="code" align="absmiddle"  alt="">
<button id="recognize">识别</button>
<p>点击图片刷新验证码</p>
<script type="text/javascript">
    var OCR = (function(window,document,undefined){
        var offsetX,offsetY = 6,fontWidth,fontHeight,gap = 13,source,srcs,kus,codeId,recId;
        function init(codeContainerId,recognizeId){
            offsetX = 5;
            offsetY = 6
            fontWidth = 8;
            fontHeight = 10;
            gap = 13;
            source = {};
            srcs = ['images/p1.png','images/p2.png','images/p3.png','images/p4.png','images/p5.png','images/p6.png','images/p7.png','images/p8.png','images/p9.png','images/p10.png','images/p11.png','images/p12.png','images/p13.png','images/p14.png'];
            kus = [["3","2","2","1"],["4","6","7","5"],["9","8","1","6"],["0","3","5","0"]];
            codeId = codeContainerId;
            recId = recognizeId;
            initSource();
            getCode();
            addEvent();
        }
        function initSource(){
            for(var i=0;i<4;i++){
                (function(){
                    addSource(srcs[i],kus[i]);
                })();
            }
        }
        function getCode(){
            var im = document.getElementById("code"),
                randPic = srcs[(~~(Math.random()*srcs.length))];
            im.src = randPic;
        }
        function addSource(pic,numArr){
            var im = new Image(),
                canvas = document.createElement("canvas"),
                ctx = canvas.getContext("2d");
            im.onload = function(){
                canvas.width = this.width;
                canvas.height = this.height;
                ctx.drawImage(im,0,0);
                var imgData = ctx.getImageData(0,0,80,20);
                imgData = binaryzationImageData(imgData);
                ctx.putImageData(imgData,0,0);
                for(var i=1;i<=4;i++){
                    (function(i){
                        var imgData = ctx.getImageData(offsetX+gap*(i-1)+fontWidth*(i-1),offsetY,fontWidth,fontHeight);
                        !source[numArr[i-1]] && (source[numArr[i-1]] = imgData.data.join("").replace(/255/g,"1"));
                    })(i);
                }
            }
            im.src = pic;
        }
        function binaryzationImageData(imgData){
            for(var i=0;i<imgData.width*imgData.height;i++){
                var r = imgData.data[i*4+0],
                    g = imgData.data[i*4+1],
                    b = imgData.data[i*4+2];
                var gray = 0.299 * r + 0.587 * g + 0.114 * b;
                if(gray<=130){
                    gray = 0;
                }else{
                    gray = 255;
                }
                imgData.data[i*4+0] = imgData.data[i*4+1] = imgData.data[i*4+2] = gray;
            }
            return imgData;
        }
        function recognize(im){
            var canvas = document.createElement("canvas"),
                ctx = canvas.getContext("2d"),
                code = '';
            canvas.width = im.width;
            canvas.height = im.height;
            ctx.drawImage(im,0,0);
            for(var i=1;i<=4;i++){
                var imgData = ctx.getImageData(offsetX+gap*(i-1)+fontWidth*(i-1),offsetY,fontWidth,fontHeight);
                imgData = binaryzationImageData(imgData);
                var str = imgData.data.join("").replace(/255/g,"1");
                for(var index in source){
                    if(compare(source[index],str)>=99){
                        code += index;
                        break;
                    }
                }
            }
            alert(code);
        }
        function getObjectLength(o){
            var len = 0;
            for(var index in o){
                if(o.hasOwnProperty(index)){
                    len ++;
                }
            }
            return len;
        }
        function compare(x, y) {
            var x = x.split(""),
                y = y.split(""),
                z = 0,
                s = Math.max(x.length,y.length),
                a = x.shift(),
                b = y.shift();
            while(a !== undefined && b !== undefined) {
                if (a === b) {
                    z++;
                }
                a = x.shift();
                b = y.shift();
            }
            return z/s * 100;
        }
        function addEvent(){
            document.getElementById(recId).onclick = function(){
                recognize(document.getElementById(codeId));
            }
            document.getElementById(codeId).onclick = function(){
                getCode();
            }
        }
        return { init : init }
    })(window,document);
 
    OCR.init("code","recognize");
</script>
</body>
</html>

在线Demo:http://demo.deanhan.cn/recognize

转自:https://www.deanhan.cn/js-ocr.html

posted @   笠航  阅读(651)  评论(0编辑  收藏  举报
编辑推荐:
· 开发者必知的日志记录最佳实践
· SQL Server 2025 AI相关能力初探
· Linux系列:如何用 C#调用 C方法造成内存泄露
· AI与.NET技术实操系列(二):开始使用ML.NET
· 记一次.NET内存居高不下排查解决与启示
阅读排行:
· 阿里最新开源QwQ-32B,效果媲美deepseek-r1满血版,部署成本又又又降低了!
· 开源Multi-agent AI智能体框架aevatar.ai,欢迎大家贡献代码
· Manus重磅发布:全球首款通用AI代理技术深度解析与实战指南
· 被坑几百块钱后,我竟然真的恢复了删除的微信聊天记录!
· AI技术革命,工作效率10个最佳AI工具
点击右上角即可分享
微信分享提示