【Python】Python简单验证码识别-JobPlus

1.通过二值化处理去掉干扰线

2.对黑白图片进行降噪，去掉那些单独的黑色像素点

3.消除边框上附着的黑色像素点

4.识别图像中的文字，去掉空格与'.'

[python]

import os

from PIL import Image
from aip import AipOcr
file='1-1-7'
# Step 1: binarise the source image into a black-and-white copy.
def two_value(threshold=165):
    """Write a thresholded black-and-white copy of ``file + '.jpg'``.

    The image is converted to greyscale ('L'), every grey level is mapped
    through a 256-entry lookup table, and the resulting mode-'1' image is
    saved as ``file + '.1.jpg'``.

    Args:
        threshold: Grey levels strictly below this value map to 0 (black);
            all other levels map to 1 (white). Defaults to 165.
    """
    # One table entry per possible grey level, consumed by Image.point().
    table = [0 if level < threshold else 1 for level in range(256)]

    # The context manager releases the source file handle once we are done.
    with Image.open(file + '.jpg') as image:
        lim = image.convert('L')
        bim = lim.point(table, '1')
        # NOTE(review): the output is JPEG, which is lossy, so pixels read
        # back later are presumably not exactly 0/255 - the later steps
        # compare against tolerance values (< 50, < 5) rather than == 0.
        bim.save(file + '.1.jpg')


two_value()
# Step 2: noise removal - whiten dark pixels that have no dark 4-neighbour.
im = Image.open(file + '.1.jpg')
# Flat pixel sequence; pixel (x, y) is read at index w * y + x.
data = im.getdata()
w, h = im.size

# The outermost row/column is skipped so every tested pixel has 4 neighbours.
for x in range(1, w - 1):
    for y in range(1, h - 1):
        # Only dark centre pixels are candidates for removal.
        if data[w * y + x] >= 50:
            continue
        # Neighbours in the order: above, left, below, right.
        neighbours = (
            data[w * (y - 1) + x],
            data[w * y + (x - 1)],
            data[w * (y + 1) + x],
            data[w * y + (x + 1)],
        )
        # A neighbour counts as black only below 5 (stricter than the
        # centre test); with no black neighbour the pixel is an isolated
        # speck and is painted white.
        if not any(value < 5 for value in neighbours):
            im.putpixel((x, y), 255)

im.save(file + '.2.jpg')
# Step 3: whiten the one-pixel frame around the image so that dark pixels
# attached to the border do not reach the OCR step.
im = Image.open(file + '.2.jpg')
w, h = im.size

# Walk the complete frame explicitly. The earlier offset-based loop
# (writing to (x - 1, y - 1) / (x + 1, y + 1) while iterating 1..w-2 and
# 1..h-2) never reached the top-right and bottom-left corner pixels.
for x in range(w):
    im.putpixel((x, 0), 255)        # top row
    im.putpixel((x, h - 1), 255)    # bottom row
for y in range(h):
    im.putpixel((0, y), 255)        # left column
    im.putpixel((w - 1, y), 255)    # right column

im.save(file + '.3.jpg')
# Credentials for the OCR service client.
# SECURITY NOTE(review): the literal fallbacks below are credentials that
# were committed to source. Prefer supplying them through the environment
# variables named here; the committed values should be rotated and removed.
APP_ID = os.environ.get('AIP_APP_ID', '11352343')
API_KEY = os.environ.get('AIP_API_KEY', 'Nd5Z1NkGoLDvHwBnD2bFLpCE')
SECRET_KEY = os.environ.get('AIP_SECRET_KEY', 'A9FsnnPj1Ys2Gof70SNgYo23hKOIK8Os')
# Create the AipOcr client used for the recognition request.
aipOcr = AipOcr(APP_ID, API_KEY, SECRET_KEY)
# Path of the cleaned image produced by the border-clearing step.
filePath = file + '.3.jpg'
def get_file_content(filePath):
    """Return the full contents of the file at ``filePath`` as bytes."""
    with open(filePath, mode='rb') as image_file:
        payload = image_file.read()
    return payload
# Step 4: send the cleaned image to the OCR service and print the text.
# Request options passed through to the recognition call.
options = {
    'detect_direction': 'true',
    'language_type': 'CHN_ENG',
}
# Call the general text-recognition endpoint with the image bytes.
result = aipOcr.basicGeneral(get_file_content(filePath), options)
print(result)
# A failed request is expected to come back without a 'words_result' key
# (the raw reply is printed above); treat that as "no lines recognised"
# instead of raising KeyError.
words_result = result.get('words_result', [])
for entry in words_result:
    # Strip spaces and '.' characters the recogniser may have inserted.
    print(entry['words'].replace(' ', '').replace('.', ''))

1.通过二值化处理去掉干扰线2.对黑白图片进行降噪，去掉那些单独的黑色像素点3.消除边框上附着的黑色像素点4.识别图像中的文字，去掉空格与’.’[python] <ol><li>from PIL import Image  </li><li>from aip import AipOcr  </li><li>  </li><li>file='1-1-7'  </li><li>  </li><li># 二值化处理,转化为黑白图片  </li><li>def two_value():  </li><li>    for i in range(1, 5):  </li><li>        # 打开文件夹中的图片    </li><li>        image = Image.open(file+'.jpg')  </li><li>        # 灰度图    </li><li>        lim = image.convert('L')  </li><li>        # 灰度阈值设为165，低于这个值的点全部填白色    </li><li>        threshold = 165  </li><li>        table = []  </li><li>  </li><li>        for j in range(256):  </li><li>            if j < threshold:  </li><li>                table.append(0)  </li><li>            else:  </li><li>                table.append(1)  </li><li>  </li><li>        bim = lim.point(table, '1')  </li><li>        bim.save(file+'.1.jpg')  </li><li>  </li><li>two_value()  </li><li>  </li><li># 去除干扰线  </li><li>im = Image.open(file+'.1.jpg')  </li><li># 图像二值化  </li><li>data = im.getdata()  </li><li>w, h = im.size  </li><li>black_point = 0  </li><li>  </li><li>for x in range(1, w - 1):  </li><li>    for y in range(1, h - 1):  </li><li>        mid_pixel = data[w * y + x]  # 中央像素点像素值  </li><li>        if mid_pixel < 50:  # 找出上下左右四个方向像素点像素值  </li><li>            top_pixel = data[w * (y - 1) + x]  </li><li>            left_pixel = data[w * y + (x - 1)]  </li><li>            down_pixel = data[w * (y + 1) + x]  </li><li>            right_pixel = data[w * y + (x + 1)]  </li><li>  </li><li>            # 判断上下左右的黑色像素点总个数  </li><li>            if top_pixel < 5:   #小于5比小于10更精确  </li><li>                black_point += 1  </li><li>            if left_pixel < 5:  </li><li>                black_point += 1  </li><li>            if down_pixel < 5:  </li><li>                black_point += 1  </li><li>            if right_pixel < 5:  </li><li>                black_point += 1  </li><li>            if black_point < 1:  </li><li>                im.putpixel((x, y), 255)  </li><li>                # 
print(black_point)  </li><li>            black_point = 0  </li><li>  </li><li>im.save(file+'.2.jpg')  </li><li>  </li><li># 去除干扰线  </li><li>im = Image.open(file+'.2.jpg')  </li><li># 图像二值化  </li><li>data = im.getdata()  </li><li>w, h = im.size  </li><li>black_point = 0  </li><li>  </li><li>for x in range(1, w - 1):  </li><li>    for y in range(1, h - 1):  </li><li>        if x < 2 or y < 2:  </li><li>            im.putpixel((x - 1, y - 1), 255)  </li><li>        if x > w - 3 or y > h - 3:  </li><li>            im.putpixel((x + 1, y + 1), 255)  </li><li>  </li><li>im.save(file+'.3.jpg')  </li><li>  </li><li># 定义常量  </li><li>APP_ID = '11352343'  </li><li>API_KEY = 'Nd5Z1NkGoLDvHwBnD2bFLpCE'  </li><li>SECRET_KEY = 'A9FsnnPj1Ys2Gof70SNgYo23hKOIK8Os'  </li><li>  </li><li># 初始化AipFace对象  </li><li>aipOcr = AipOcr(APP_ID, API_KEY, SECRET_KEY)  </li><li>  </li><li># 读取图片  </li><li>filePath=file+'.3.jpg'  </li><li>def get_file_content(filePath):  </li><li>    with open(filePath, 'rb') as fp:  </li><li>        return fp.read()  </li><li>  </li><li># 定义参数变量  </li><li>options = {  </li><li>    'detect_direction': 'true',  </li><li>    'language_type': 'CHN_ENG',  </li><li>}  </li><li>  </li><li># 调用通用文字识别接口  </li><li>result = aipOcr.basicGeneral(get_file_content(filePath), options)  </li><li>print(result)  </li><li>words_result=result['words_result']  </li><li>for i in range(len(words_result)):  </li><li>    print(words_result[i]['words'].replace(' ','').replace('.',''))  #去掉可能被识别的空格与.  </li></ol><img src="https://file.jobplus.com.cn/2018/06/07/d4246f78b58e4f6cb9f5e505de514681.png" _src="https://file.jobplus.com.cn/2018/06/07/d4246f78b58e4f6cb9f5e505de514681.png" style=""/><img src="https://file.jobplus.com.cn/2018/06/07/b165fbbe5bb24f648038da62b8113f02.png" _src="https://file.jobplus.com.cn/2018/06/07/b165fbbe5bb24f648038da62b8113f02.png" style=""/>

关于我们

法律声明

帮助中心

商务合作

相关文章

关于我们

法律声明

帮助中心

商务合作