import reimport requestsimport cv2import timeimport randomfrom selenium import webdriverfrom selenium.webdriver.common.by import Byfrom selenium.webdriver.common.action_chains import ActionChainsfrom selenium.webdriver.chrome.options import Optionsdef download_image(url, path): headers = {"User-Agent": "Mozilla/5.0", "Referer": "https://www.douban.com/"} resp = requests.get(url, headers=headers)with open(path, "wb") as f: f.write(resp.content)print(f"已下载: {path}")def get_distance(bg_path, slider_path):"""计算滑块需要滑动的距离 bg_path: 背景图(有缺口的大图,原图尺寸 672x390) slider_path: 滑块大图(包含小滑块的完整图,原图尺寸 682x620) """# ========== 1. 读取图片 ==========bg = cv2.imread(bg_path) # 背景图,尺寸 672x390slider_big = cv2.imread(slider_path, cv2.IMREAD_UNCHANGED) # 滑块大图,尺寸 682x620,保留透明通道# ========== 2. 裁剪出小滑块 ========== # 为什么是 490:610 和 140:260?# 因为网页 CSS 里定义了滑块在屏幕上的显示位置和大小# 通过比例换算,得出在原图上小滑块的位置是 x=140, y=490, 宽高=120x120slider = slider_big[490:610, 140:260] # 从大图中切出 120x120 的小滑块# ========== 3. 提取滑块的形状 ========== # PNG图片有4个通道:R(红), G(绿), B(蓝), A(透明度) # 取第4个通道(Alpha通道),白色=滑块形状,黑色=透明背景slider_gray = slider[:, :, 3] # 只取透明度通道,得到滑块的形状轮廓# ========== 4. 背景图处理 ========== # 把彩色背景图转成黑白灰度图,去掉颜色干扰bg_gray = cv2.cvtColor(bg, cv2.COLOR_BGR2GRAY)# ========== 5. 边缘检测 ========== # Canny 边缘检测:把图片中物体的边缘用白线标出来# 参数 200,300 是高低阈值,值越大越敏感bg_edges = cv2.Canny(bg_gray, 200, 300) # 背景图的边缘轮廓slider_edges = cv2.Canny(slider_gray, 200, 300) # 滑块图的边缘轮廓# ========== 6. 模板匹配(核心算法)========== # 把滑块轮廓(slider_edges)作为模板,在背景轮廓(bg_edges)上滑动# TM_CCOEFF_NORMED:归一化相关系数匹配法,结果值范围 -1 到 1 # 值越大说明越像,1=完全相同,0=无关,-1=完全相反result = cv2.matchTemplate(bg_edges, slider_edges, cv2.TM_CCOEFF_NORMED)# 找到结果中最大值的位置(即最匹配的位置)# min_loc: 最小值位置, max_loc: 最大值位置_, _, _, max_loc = cv2.minMaxLoc(result)# ========== 7. 缺口在原图上的中心X坐标 ==========left = max_loc[0] # 缺口左上角的 X 坐标gap_original = left + 60 # 缺口中心X = 左上角X + 滑块宽度的一半(120/2=60) # 公式1:缺口中心X = 匹配到的左上角X + 滑块宽度 ÷ 2 # gap_original = left + 60 # ========== 8. 换算到网页显示尺寸 ========== # 原图宽度是 672px,但网页上显示的背景图宽度是 278px # 需要按比例缩放,才能得到真实的滑动距离display_width = 278 # 网页上背景图的显示宽度(固定值)original_width = bg.shape[1] # 原图宽度 = 672distance = gap_original * display_width / original_width# 公式2:网页滑动距离 = 原图缺口X × (网页显示宽度 ÷ 原图宽度) # distance = gap_original × (278 ÷ 672) # distance = gap_original × 0.413 # ========== 9. 输出并返回 ==========print(f"原图缺口X: {gap_original}, 最终距离: {distance:.2f}")return int(distance) - 10 # 减10是经验微调,实际测试后加的偏移量def extract_url_from_style(style): match = re.search(r'url\("([^"]+)"\)', style)return match.group(1) if match else Nonedef slide_simple(distance):"""直接滑到底"""return [distance]def get_tracks(distance):"""生成仿人滑动的轨迹数组 原理:模拟人的拖动习惯 —— 先加速后减速:param distance: 需要滑动的总距离(像素):return: 轨迹数组,每个元素是每次移动的偏移量(像素) """tracks = [] # 存储每一步移动的距离current = 0 # 当前已经移动的总距离mid = distance * 0.6 # 加速阶段的终点(前60%加速,后40%减速)t = 0.05 # 时间间隔(秒),越小轨迹越平滑v = 0 # 初始速度(像素/秒)# 循环生成轨迹,直到走完总距离while current < distance:# 根据当前位置决定加速度# 前60%:加速(a=20),模拟人启动时加快速度# 后40%:减速(a=-3),模拟人快到目标时减速a = 20 if current < mid else -3# 匀变速运动位移公式:s = v0 * t + 0.5 * a * t^2s = v * t + 0.5 * a * t * t# 累加位移current += s# 将本次移动距离取整后加入轨迹(像素必须是整数)tracks.append(round(s))# 更新速度:v = v0 + a * tv += a * t# 修正误差:因为取整可能导致总距离不等于目标距离total = sum(tracks)if total > distance:# 如果超了,从最后一步减去多余的部分tracks[-1] -= total - distanceelif total < distance:# 如果不够,补一步剩余距离tracks.append(distance - total)return tracksdef slide(driver):# 切换iframedriver.switch_to.frame(0) time.sleep(1) n = 1while n <= 5:try:# 获取背景图URLbg_element = driver.find_element(By.XPATH, '//*[@id="slideBg"]') style = bg_element.get_attribute("style") bg_url = style.split('url("')[1].split('")')[0]# 获取滑块大图元素(小方块那个)elem = driver.find_element(By.XPATH, '//*[@id="tcOperation"]/div[9]') style = elem.get_attribute("style") big_url = extract_url_from_style(style)print(f"背景图URL: {bg_url[:80]}...")print(f"滑块图URL: {big_url[:80]}...")# 下载图片download_image(bg_url, "bg.png") download_image(big_url, "slider_big.png")# 计算距离distance = get_distance("bg.png", "slider_big.png")print(f"需要滑动: {distance:.2f}px") tracks = slide_simple(distance)# 找滑块元素block = driver.find_element(By.XPATH, '//*[@id="tcOperation"]/div[7]')# 1. 按下滑块ActionChains(driver).click_and_hold(block).perform() time.sleep(0.1)# 2. 按轨迹滑动for track in tracks: ActionChains(driver).move_by_offset(xoffset=track, yoffset=random.uniform(-1, 1)).perform() time.sleep(random.uniform(0.01, 0.02))# 3. 松开滑块ActionChains(driver).release().perform() time.sleep(2)# 4. 检查验证是否成功# 如果验证成功,instructionText 会消失或变成其他状态block = driver.find_element(By.XPATH, '//*[@id="tcOperation"]/div[7]') n += 1print(f"第{n - 1}次验证失败,重试...")print(f"本次将会滑动:{distance}")except:print(f"第{n}次验证成功")breakdef main(): url = "https://www.已脱敏处理.com/login"options = Options() options.add_argument('--disable-blink-features=AutomationControlled') driver = webdriver.Chrome(options=options) driver.get(url) time.sleep(2)# 点击密码登录driver.find_element(By.CLASS_NAME, "account-tab-account").click() time.sleep(1)# 输入账号密码driver.find_element(By.NAME, "username").send_keys("20761430@qq.com") driver.find_element(By.NAME, "password").send_keys("wewewrqr") time.sleep(1)# 点击登录按钮driver.find_element(By.CLASS_NAME, "btn-account").click() time.sleep(3)# 滑动验证码(内部会自动下载图片、计算距离、滑动)slide(driver) # distance参数会被覆盖,随便传个0time.sleep(3)print("完成")# driver.quit()if __name__ == '__main__': main()