Selenium 初步使用之自动登录（包含识别验证码），超级详细 – 小飞侠

Selenium 初步使用之自动登录（包含识别验证码），超级详细

Post author:xfxia
Post published:2023年9月8日
Post category:其他

一、简介

初次开始使用Selenium，于是开始用登录作为联手项目，是一个真实的登录界面，包含验证码（验证码是难点，获取与识别），以下会讲的很详细，我怕我下次又忘记了

我采用Selenium + python + 百度云OCR，安装等教程自行百度，我就不多说了

二、selenium打开浏览器获取相应el

from selenium import webdriver
from selenium.webdriver.common.by import By
import base64
#注册Chrome驱动,打开浏览器网址
driver = webdriver.Chrome()
url = "************"
driver.get(url)
#获取相应el
driver.find_element(By.NAME,"***").send_keys('***')
driver.find_element(By.NAME, "***").send_keys('***')
#获取图片
png = driver.find_element(By.CSS_SELECTOR,"****")
img_url = png.get_attribute("src")  # 获得图片的url，本次测试的是bs64生成，采用解码获得图片
head, context = img_url.split(",")  # 截取后字段的bas64编码
img_data = base64.b64decode(context)
image = Image.open(BytesIO(img_data));
image.save("capt.png")

这段代码主要是利用selenium打开网站，获取到相应的dom，

~~find_element_by_id~~

等写法已经统一换为find_element(By.ID, “***”)等了，先将图片保存下来考研方便后续的识别

三、验证码预处理

验证码一般无法直接识别，我们需要通过灰度、二值、降噪等手段，使得图片更加清晰，提高图片的识别准确率

下列代码需要提前引入以下包

from PIL import Image

1.灰度化

img = img.convert('L')  # P模式转换为L模式(灰度模式默认阈值127)

2.二值化

count = 230  # 设定阈值，阈值的大小由图片的清晰度等自行调节
table = []
for i in range(256):
    if i < count:
        table.append(0)
    else:
        table.append(1)
img = img.point(table, '1')
img.save('captcha.png')

3.降噪

pixdata = img.load()
w,h = img.size
for y in range(1,h-1):
   for x in range(1,w-1):
        count = 0
        if pixdata[x,y-1] > 245:
            count = count + 1
        if pixdata[x,y+1] > 245:
            count = count + 1
        if pixdata[x-1,y] > 245:
            count = count + 1
        if pixdata[x+1,y] > 245:
            count = count + 1
        if count > 2:
            pixdata[x,y] = 255
return img

四、百度云识别

需要提前注册

from aip import AipOcr
# 识别码
APP_ID = '****'
API_KEY = '****'
SECRET_KEY = '****'
# 初始化对象
client = AipOcr(APP_ID, API_KEY, SECRET_KEY)
# 读取图片
def get_file_content(file_path):
    with open(file_path, 'rb') as f:
        return f.read()

image = get_file_content('end.png') # 传入图片
# 定义参数变量
options = {'language_type': 'ENG', }  # 识别语言类型，默认为'CHN_ENG'中英文混合
#  调用通用文字识别
result = client.basicGeneral(image, options)  # 高精度接口 basicAccurate
for word in result['words_result']:
    captcha = (word['words'])

print('识别结果：' + captcha)
return captcha

五、完整代码

import base64
from io import BytesIO
from selenium import webdriver
from selenium.webdriver.common.by import By
from PIL import Image
from time import sleep
from aip import AipOcr

# 对二值化的图像进行降噪处理，使得识别更加准确
def depoint(img):
    pixdata = img.load()
    w,h = img.size
    for y in range(1,h-1):
        for x in range(1,w-1):
            count = 0
            if pixdata[x,y-1] > 245:
                count = count + 1
            if pixdata[x,y+1] > 245:
                count = count + 1
            if pixdata[x-1,y] > 245:
                count = count + 1
            if pixdata[x+1,y] > 245:
                count = count + 1
            if count > 2:
                pixdata[x,y] = 255
    return img

# 获得验证码，并进行处理，二值化
def deal_image():
    png = driver.find_element(By.CSS_SELECTOR,".*******")
    img_url = png.get_attribute("src")  # 获得图片的url，本次测试的是bs64生成，采用解码获得图片
    head, context = img_url.split(",")  # 截取后字段的bas64编码
    img_data = base64.b64decode(context)
    image = Image.open(BytesIO(img_data));
    image.save("capt.png")

    img = Image.open('capt.png')
    img = img.convert('L')  # P模式转换为L模式(灰度模式默认阈值127)
    count = 230  # 设定阈值，阈值的大小由图片的清晰度等自行调节
    table = []
    for i in range(256):
        if i < count:
            table.append(0)
        else:
            table.append(1)

    # print(table)

    img = img.point(table, '1')
    img.save('captcha.png')

# 调用百度云OCR API 进行识别
def discern_captcha():
    # 识别码
    APP_ID = '****'
    API_KEY = '****'
    SECRET_KEY = '****'
    # 初始化对象
    client = AipOcr(APP_ID, API_KEY, SECRET_KEY)
    # 读取图片
    def get_file_content(file_path):
        with open(file_path, 'rb') as f:
            return f.read()

    image = get_file_content('end.png') # 传入图片
    # 定义参数变量
    options = {'language_type': 'ENG', }  # 识别语言类型，默认为'CHN_ENG'中英文混合
    #  调用通用文字识别
    result = client.basicGeneral(image, options)  # 高精度接口 basicAccurate
    for word in result['words_result']:
        captcha = (word['words'])

    print('识别结果：' + captcha)
    return captcha

# 登录事件，若识别不准确需点击第二次重复
def ClickRandomCode():
    deal_image()
    image = depoint(Image.open('captcha.png'))
    image.save('end.png')
    image = depoint(Image.open('end.png'))
    image.save("end.png")
    randomCode = discern_captcha()
    driver.find_element(By.NAME, "randomCode").send_keys(randomCode)
    driver.find_element(By.CSS_SELECTOR, ".card-z .el-button").click()
    sleep(2) # 错误或成功信息有延迟
    try:
        text = driver.find_element(By.CSS_SELECTOR, ".el-message__content").text
        if (text == "验证码错误"):
            driver.find_element(By.CSS_SELECTOR, ".verification-code > img").click()
            driver.find_element(By.CSS_SELECTOR, ".verification-code > img").clear()
            ClickRandomCode() # 递归调用直至正确
            print("验证码错误")
        else:
            print("登录成功")
    except:
        print("ok")

def login(***,***):
    driver.find_element(By.NAME,"****").send_keys(***)
    driver.find_element(By.NAME, "***").send_keys(***)
    ClickRandomCode()

if __name__ == '__main__':
    driver = webdriver.Chrome()
    url = "*****"
    driver.get(url)
    login("****","****")

版权声明：本文为weixin_45496777原创文章，遵循 CC 4.0 BY-SA 版权协议，转载请附上原文出处链接和本声明。

原文链接：https://blog.csdn.net/weixin_45496777/article/details/129957357