hCaptcha 是一種常見的驗證碼服務,用于區分人類用戶和自動化程序。由于其基于圖像識別和行為分析,下面介紹如何使用自動化點擊驗證碼完成登陸。
思路:登陸目標網站觸發驗證碼,截圖并發給打碼平臺返回坐標,模擬人工點擊完成驗證
1、注冊識別 hCaptcha API,獲取授權
import requests
def get_rect(base64_list, title_list):url = "https://api.acedata.cloud/captcha/recognition/hcaptcha"headers = {"accept": "application/json","authorization": "授權碼","content-type": "application/json"}payload = {"queries": base64_list,"question": ",".join(title_list)}response = requests.post(url, json=payload, headers=headers).json()return response
2、登陸目標網站,觸發網站驗證碼
co = ChromiumOptions().headless(False).auto_port()
co.set_argument('--enable-translate')
page = ChromiumPage(co)
co.incognito()
page.get('https://www.ebay.com/sh/ord/?filter=status%3AALL_ORDERS%2Ctimerange%3APREVIOUSMONTH')
if page.title != "Security Measure":login(page, username_str, password_str)
3、將驗證碼截圖獲取圖片并轉為base64編碼
def land():page.get_screenshot(path='tmp', name='pic.jpg', full_page=True)rangle = (74, 10, 474, 610) # 左、上、右、下img = Image.open(r'tmp/pic.jpg')cropped_img = img.crop(rangle)# 保存裁剪后的圖片cropped_img.save(r'tmp/cropped_image.png')title = (79, 15, 464, 130)img.crop(title).save(r"tmp/title.png")reader = easyocr.Reader(['ch_sim', 'en'])result = reader.readtext(img)title_list = []for detection in result:print(detection[1])title_list.append(detection[1])img1 = (79, 135, 209, 260)img.crop(img1).save(r"tmp/img1.png")img2 = (209, 135, 339, 260)img.crop(img2).save(r"tmp/img2.png")img3 = (339, 135, 469,260)img.crop(img3).save(r"tmp/img3.png")img4 = (79, 265, 209, 395)img.crop(img4).save(r"tmp/img4.png")img5 = (209, 265, 339, 395)img.crop(img5).save(r"tmp/img5.png")img6 = (339, 265, 469, 395)img.crop(img6).save(r"tmp/img6.png")img7 = (79, 395, 209, 525)img.crop(img7).save(r"tmp/img7.png")img8 = (209, 395, 339, 525)img.crop(img8).save(r"tmp/img8.png")img9 = (339, 395, 469, 525)img.crop(img9).save(r"tmp/img9.png")base64_list = []for i in range(1, 10):with open(f'tmp/img{i}.png', "rb") as img_file:encoded_string = base64.b64encode(img_file.read()).decode('utf-8')base64_list.append(encoded_string)return base64_list,title_list
4、將圖片列表和標題傳入圖片識別api返回目標坐標,模擬完成點擊
res = get_rect(base64_list, 'tmp/title.png')
objects = res["solution"]["objects"]
img_list = [img1, img2, img3, img4, img5, img6, img7, img8, img9]
print("1111", objects)
for i in range(9):if objects[i]:target = ((int(img_list[i][0]) + int(img_list[i][2])) / 2, (int(img_list[i][1]) + int(img_list[i][3])) / 2)page.actions.move_to(target).click()time.sleep(1)