Python爬虫进阶-每日一学(GIF验证码识别)
2023-12-26 13:46:50
#!/usr/bin/python3
# -*- coding: utf-8 -*-
# @Time : 2023/12/26 11:26
# @Author : jia666666
# @FileName: 01 下载.py
import time
from PIL import Image
import ddddocr
import io
import requests
# HTTP request headers sent with every captcha download; they mimic a
# desktop Firefox browser talking to credit.customs.gov.cn.
headers = {
    "Host": "credit.customs.gov.cn",
    "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64; rv:121.0) Gecko/20100101 Firefox/121.0",
    "Accept": "text/html,application/xhtml+xml,application/xml;q=0.9,image/avif,image/webp,*/*;q=0.8",
    "Accept-Language": "zh-CN,zh;q=0.8,zh-TW;q=0.7,zh-HK;q=0.5,en-US;q=0.3,en;q=0.2",
    "Accept-Encoding": "gzip, deflate",
    "Upgrade-Insecure-Requests": "1",
    "Connection": "keep-alive",
}
def _recognize_frames(image, ocr, required_hits):
    """Run OCR over the frames of *image* until one reading repeats enough.

    Frames are visited in order starting at frame 0. A reading only counts
    when it is exactly 4 characters long, and the first reading seen
    ``required_hits`` times is returned. Readings are tallied per frame
    (whole-string equality), so a match can never straddle the output of two
    neighbouring frames.

    Returns an empty string when the frames run out before any reading
    reaches the threshold.
    """
    hits = {}
    frame = 0
    while True:
        try:
            image.seek(frame)
        except EOFError:
            # Pillow signals "no more frames" with EOFError; nothing else is
            # swallowed, so real failures surface instead of looping forever.
            return ''
        text = ocr.classification(image)
        if len(text) == 4:
            hits[text] = hits.get(text, 0) + 1
            if hits[text] >= required_hits:
                return text
        frame += 1


def get_yzm(*, required_hits=3, timeout=10):
    """Download the animated GIF captcha and return the recognised text.

    The captcha is fetched repeatedly until one download yields a 4-character
    reading that shows up on at least ``required_hits`` frames. When the
    module-level ``savesign`` flag is true, each downloaded GIF is also
    written to ``savepath``.

    Args:
        required_hits: How many frames must agree on a reading before it is
            accepted.
        timeout: Seconds to wait for the HTTP request before requests raises
            a timeout error, so a stalled connection cannot hang the script.

    Returns:
        The recognised 4-character captcha string.
    """
    # Build the recogniser once and reuse it for every frame and every retry
    # instead of constructing a new one per frame.
    ocr = ddddocr.DdddOcr()
    while True:
        # The millisecond timestamp makes every request URL unique.
        url = f"http://credit.customs.gov.cn/ccppserver/verifyCode/creator?{int(time.time() * 1000)}"
        response = requests.get(url, headers=headers, verify=False, timeout=timeout)
        if savesign:
            # Optionally keep a copy of the GIF on disk.
            with open(savepath, 'wb') as file:
                file.write(response.content)
        # Always decode from memory: the bytes are the same as the saved
        # file, and no handle on savepath stays open while the next retry
        # rewrites it.
        with Image.open(io.BytesIO(response.content)) as image:
            start_time = time.time()
            endres = _recognize_frames(image, ocr, required_hits)
        if endres:
            print("用时", time.time() - start_time)
            return endres
# Whether the downloaded GIF is also saved to disk (read by get_yzm).
savesign = True
# Path the GIF is written to when savesign is true (read by get_yzm).
savepath = r"yzm.gif"

# Only hit the network and print the result when run as a script, so that
# importing this module has no side effects.
if __name__ == "__main__":
    print("gif识别结果", get_yzm())
文章来源:https://blog.csdn.net/jia666666/article/details/135219149
本文来自互联网用户投稿,该文观点仅代表作者本人,不代表本站立场。本站仅提供信息存储空间服务,不拥有所有权,不承担相关法律责任。 如若内容造成侵权/违法违规/事实不符,请联系我的编程经验分享网邮箱:veading@qq.com进行投诉反馈,一经查实,立即删除!
本文来自互联网用户投稿,该文观点仅代表作者本人,不代表本站立场。本站仅提供信息存储空间服务,不拥有所有权,不承担相关法律责任。 如若内容造成侵权/违法违规/事实不符,请联系我的编程经验分享网邮箱:veading@qq.com进行投诉反馈,一经查实,立即删除!