字符识别

import cv2
import pytesseract
# Tell pytesseract which Tesseract executable to invoke. The path below is
# machine-specific (a Windows install on drive E:) and must be adjusted on
# other systems.
pytesseract.pytesseract.tesseract_cmd=r'E:\tesseract\tesseract.exe'
# Character recognition (English letters and digits)
# img = cv2.imread('img_1.png')
# img = cv2.cvtColor(img,cv2.COLOR_BGR2RGB)
# yimg,ximg,_ = img.shape #(y,x)
# # print(pytesseract.image_to_string(img)) # recognized text
# # print(pytesseract.image_to_boxes(img)) # per-character positions
# boxes = pytesseract.image_to_boxes(img)
# for i in boxes.splitlines():
#     i = i.split(' ')
#     print(i)
#     x,y,w,h = int(i[1]),int(i[2]),int(i[3]),int(i[4])
#     cv2.rectangle(img,(x,yimg-y),(w,yimg-h),(0,0,255),1)
#     cv2.putText(img,i[0],(x,yimg-y),cv2.FONT_HERSHEY_COMPLEX,1,(0,0,255),2)
# cv2.imshow('result',img)
# cv2.waitKey(0)

# Character recognition (whole words)
# pytesseract.pytesseract.tesseract_cmd=r'E:\tesseract\tesseract.exe'
# img = cv2.imread('img_1.png')
# img = cv2.cvtColor(img,cv2.COLOR_BGR2RGB)
# yimg,ximg,_ = img.shape #(y,x)
# boxes = pytesseract.image_to_data(img)
# print(boxes)
# Method 1: skip the header row by checking the line index
# for x,i in enumerate(boxes.splitlines()):
#     if x != 0:
#         i = i.split()
#         print(i)
# Method 2: skip the header row by slicing
# for i in boxes.splitlines()[1::]:
#     i = i.split()
#     print(i)
#     if len(i) == 12:
#         x,y,w,h = int(i[6]),int(i[7]),int(i[8]),int(i[9])
#         cv2.rectangle(img,(x,y),(x+w,y+h),(0,0,255),1)
#         cv2.putText(img,i[11],(x,y),cv2.FONT_HERSHEY_COMPLEX,1,(0,0,255),2)
# cv2.imshow('result',img)
# cv2.waitKey(0)

# Character recognition (digits only)
# pytesseract.pytesseract.tesseract_cmd=r'E:\tesseract\tesseract.exe'
# img = cv2.imread('img_1.png')
# img = cv2.cvtColor(img,cv2.COLOR_BGR2RGB)
# yimg,ximg,_ = img.shape #(y,x)
# cong = r'--oem 3 --psm 6 outputbase digits'
# boxes = pytesseract.image_to_boxes(img,config=cong)
# for i in boxes.splitlines():
#     i = i.split(' ')
#     x,y,w,h = int(i[1]),int(i[2]),int(i[3]),int(i[4])
#     cv2.rectangle(img,(x,yimg-y),(w,yimg-h),(0,0,255),1)
#     cv2.putText(img,i[0],(x,yimg-y),cv2.FONT_HERSHEY_COMPLEX,1,(0,0,255),2)
# cv2.imshow('result',img)
# cv2.waitKey(0)

# Chinese text recognition: run Tesseract on an image and print the result.
from PIL import Image

# Image.open is lazy and keeps the underlying file open, so use a context
# manager to make sure the handle is released once OCR has finished.
with Image.open('../img_5.png') as img:
    # lang='chi_sim' asks Tesseract for its Simplified Chinese language data,
    # which must be installed alongside Tesseract. A page segmentation mode
    # can be supplied as well, e.g. config='--psm 6'.
    text = pytesseract.image_to_string(img, lang='chi_sim')
print(text)
posted @   记录——去繁就简  阅读(76)  评论(0)  编辑  收藏  举报
相关博文:
阅读排行:
· DeepSeek 开源周回顾「GitHub 热点速览」
· 物流快递公司核心技术能力-地址解析分单基础技术分享
· .NET 10首个预览版发布:重大改进与新特性概览!
· AI与.NET技术实操系列(二):开始使用ML.NET
· 单线程的Redis速度为什么快?
点击右上角即可分享
微信分享提示