Python破解BiliBili滑块验证码,完美避开人机识别( 三 )

终章(完整代码)

Python破解BiliBili滑块验证码,完美避开人机识别

文章插图
 
本文完整示例代码如下# -*- coding: utf-8 -*-# @Date:2020/2/15 2:09# @Author: Lu# @Description bilibili滑块验证码识别 。B站有反爬限制 , 过快地拖拽会提示“怪物吃了拼图 , 请重试” 。# 目前B站有三张图片 , 只要对比完整图和缺失滑块背景图的像素 , 就可以得到偏移图片y轴距离 , 减去滑块空白距离=需要滑动的像素距离# 这里采用边缘检测 , 检测缺失滑块的底图是否存在一条灰色竖线 , 即认为是滑块目标位置 , 存在失败的概率 , 适用范围应该更大些 。from selenium import webdriverimport timeimport base64from PIL import Imagefrom io import BytesIOfrom selenium.webdriver.support.ui import WebDriverWaitimport randomimport copyclass VeriImageUtil():def __init__(self):self.defaultConfig = {"grayOffset": 20,"opaque": 1,"minVerticalLineCount": 30}self.config = copy.deepcopy(self.defaultConfig)def updateConfig(self, config):# temp = copy.deepcopy(config)for k in self.config:if k in config.keys():self.config[k] = config[k]def getMaxOffset(self, *args):# 计算偏移平均值最大的数av = sum(args) / len(args)maxOffset = 0for a in args:offset = abs(av - a)if offset > maxOffset:maxOffset = offsetreturn maxOffsetdef isGrayPx(self, r, g, b):# 是否是灰度像素点 , 允许波动offsetreturn self.getMaxOffset(r, g, b) < self.config["grayOffset"]def isDarkStyle(self, r, g, b):# 灰暗风格return r < 128 and g < 128 and b < 128def isOpaque(self, px):# 不透明return px[3] >= 255 * self.config["opaque"]def getVerticalLineOffsetX(self, bgImage):# bgImage = Image.open("./image/bg.png")# bgImage.im.mode = 'RGBA'bgBytes = bgImage.load()x = 0while x < bgImage.size[0]:y = 0# 点》》线 , 灰度线条数量verticalLineCount = 0while y < bgImage.size[1]:px = bgBytes[x, y]r = px[0]g = px[1]b = px[2]# alph = px[3]# print(px)if self.isDarkStyle(r, g, b) and self.isGrayPx(r, g, b) and self.isOpaque(px):verticalLineCount += 1else:verticalLineCount = 0y += 1continueif verticalLineCount >= self.config["minVerticalLineCount"]:# 连续多个像素都是灰度像素 , 直线 , 认为需要滑动这么多# print(x, y)return xy += 1x += 1passclass DragUtil():def __init__(self, driver):self.driver = driverdef __getRadomPauseScondes(self):""":return:随机的拖动暂停时间"""return random.uniform(0.6, 0.9)def simulateDragX(self, source, targetOffsetX):"""模仿人的拖拽动作:快速沿着X轴拖动(存在误差) , 再暂停 , 然后修正误差防止被检测为机器人 , 出现“图片被怪物吃掉了”等验证失败的情况:param source:要拖拽的html元素:param targetOffsetX: 拖拽目标x轴距离:return: None"""action_chains = webdriver.ActionChains(self.driver)# 点击 , 准备拖拽action_chains.click_and_hold(source)# 拖动次数 , 二到三次dragCount = random.randint(2, 3)if dragCount == 2:# 总误差值sumOffsetx = random.randint(-15, 15)action_chains.move_by_offset(targetOffsetX + sumOffsetx, 0)# 暂停一会action_chains.pause(self.__getRadomPauseScondes())# 修正误差 , 防止被检测为机器人 , 出现图片被怪物吃掉了等验证失败的情况action_chains.move_by_offset(-sumOffsetx, 0)elif dragCount == 3:# 总误差值sumOffsetx = random.randint(-15, 15)action_chains.move_by_offset(targetOffsetX + sumOffsetx, 0)# 暂停一会action_chains.pause(self.__getRadomPauseScondes())# 已修正误差的和fixedOffsetX = 0# 第一次修正误差if sumOffsetx < 0:offsetx = random.randint(sumOffsetx, 0)else:offsetx = random.randint(0, sumOffsetx)fixedOffsetX = fixedOffsetX + offsetxaction_chains.move_by_offset(-offsetx, 0)action_chains.pause(self.__getRadomPauseScondes())# 最后一次修正误差action_chains.move_by_offset(-sumOffsetx + fixedOffsetX, 0)action_chains.pause(self.__getRadomPauseScondes())else:raise Exception("莫不是系统出现了问题?!")# 参考action_chains.drag_and_drop_by_offset()action_chains.release()action_chains.perform()def simpleSimulateDragX(self, source, targetOffsetX):"""简单拖拽模仿人的拖拽:快速沿着X轴拖动 , 直接一步到达正确位置 , 再暂停一会儿 , 然后释放拖拽动作B站是依据是否有暂停时间来分辨人机的 , 这个方法适用 。:param source::param targetOffsetX::return: None"""action_chains = webdriver.ActionChains(self.driver)# 点击 , 准备拖拽action_chains.click_and_hold(source)action_chains.pause(0.2)action_chains.move_by_offset(targetOffsetX, 0)action_chains.pause(0.6)action_chains.release()action_chains.perform()def checkVeriImage(driver):WebDriverWait(driver, 5).until(lambda driver: driver.find_element_by_css_selector('.geetest_canvas_bg.geetest_absolute'))time.sleep(1)im_info = driver.execute_script('return document.getElementsByClassName("geetest_canvas_bg geetest_absolute")[0].toDataURL("image/png");')# 拿到base64编码的图片信息im_base64 = im_info.split(',')[1]# 转为bytes类型im_bytes = base64.b64decode(im_base64)with open('./temp_bg.png', 'wb') as f:# 保存图片到本地f.write(im_bytes)image_data = https://www.isolves.com/it/cxkf/yy/Python/res/res/webdriver/geckodriver_x64_0.26.0.exe",options=options)driver.get('https://passport.bilibili.com/login')time.sleep(3)driver.find_element_by_css_selector("#login-username").send_keys("1234567")driver.find_element_by_css_selector("#login-passwd").send_keys("abcdefg")driver.find_element_by_css_selector(".btn.btn-login").click()time.sleep(2)checkVeriImage(driver)pass#该方法用来确认元素是否存在 , 如果存在返回flag=true , 否则返回falsedef isElementExist(driver, css):try:driver.find_element_by_css_selector(css)return Trueexcept:return Falseif __name__ == '__main__':task()


推荐阅读