验证码破解 | Selenium模拟登录简书
使用超级鹰打码平台处理登录的文字点击验证码
import time from io import BytesIO from PIL import Image from selenium import webdriver from selenium.webdriver import ActionChains from selenium.webdriver.common.by import By from selenium.webdriver.support.ui import WebDriverWait from selenium.webdriver.support import expected_conditions as EC from chaojiying import Chaojiying #为简书的用户账号和密码 EMAIL = PASSWORD = #此四者分别为,超级鹰的用户名,密码,软件ID,和验证码类型 CHAOJIYING_USERNAME = CHAOJIYING_PASSWORD = CHAOJIYING_SOFT_ID = CHAOJIYING_KIND = class Jianshu(): def __init__(self): self.url = 'https://www.jianshu.com/sign_in' self.browser = webdriver.Chrome() self.wait = WebDriverWait(self.browser, 20) self.email = EMAIL self.password = PASSWORD self.chaojiying = Chaojiying(CHAOJIYING_USERNAME, CHAOJIYING_PASSWORD, CHAOJIYING_SOFT_ID) def __del__(self): self.browser.close() def open(self): """ 打开网页输入用户名密码 :return: None """ self.browser.get(self.url) email = self.wait.until(EC.presence_of_element_located((By.ID, 'session_email_or_mobile_number'))) password = self.wait.until(EC.presence_of_element_located((By.ID, 'session_password'))) email.send_keys(self.email) password.send_keys(self.password) def get_touclick_button(self): """ 获取初始验证按钮 :return: """ button = self.wait.until(EC.element_to_be_clickable((By.CLASS_NAME, 'sign-in-button'))) return button def get_touclick_element(self): """ 获取验证图片对象 :return: 图片对象 """ element = self.wait.until(EC.presence_of_element_located((By.CLASS_NAME, 'geetest_widget'))) return element def get_position(self): """ 获取验证码位置 :return: 验证码位置元组 """ element = self.get_touclick_element() time.sleep(2) location = element.location size = element.size top, bottom, left, right = location['y'], location['y'] + size['height'], location['x'], location['x'] + size['width'] top = int(top) bottom = int(bottom) left = int(left) right = int(right) return (top, bottom, left, right) def get_screenshot(self): """ 获取网页截图 :return: 截图对象 """ screenshot = self.browser.get_screenshot_as_png() screenshot = Image.open(BytesIO(screenshot)) return screenshot def get_touclick_image(self, name='captch.png'): """ 获取验证码图片 :return: 图片对象 """ top, bottom, left, right = self.get_position() print('验证码位置', top, bottom, left, right) screenshot = self.get_screenshot() captcha = screenshot.crop((left, top, right, bottom)) captcha.save(name) return captcha def get_points(self, captcha_result): """ 解析识别结果 :param captcha_result: 识别结果 :return: 转化后的结果 """ groups = captcha_result.get('pic_str').split('|') locations = [[int(number) for number in group.split(',')] for group in groups] return locations def touch_click_words(self, locations): """ 点击验证图片 :param locations: 点击位置 :return: None """ for location in locations: print(location) ActionChains(self.browser).move_to_element_with_offset(self.get_touclick_element(), location[0],location[1]).click().perform() time.sleep(1) def touch_click_verify(self): """ 点击验证按钮 :return: None """ button = self.wait.until(EC.element_to_be_clickable((By.CLASS_NAME, 'geetest_commit'))) button.click() def login(self): """ 登录 :return: None """ submit = self.wait.until(EC.element_to_be_clickable((By.ID, '_submit'))) submit.click() time.sleep(10) print('登录成功') def crack(self): """ 破解入口 :return: None """ self.open() # 点击验证按钮 button = self.get_touclick_button() button.click() # 获取验证码图片 image = self.get_touclick_image() bytes_array = BytesIO() image.save(bytes_array, format='PNG') # 识别验证码 result = self.chaojiying.post_pic(bytes_array.getvalue(), CHAOJIYING_KIND) print(result) locations = self.get_points(result) self.touch_click_words(locations) self.touch_click_verify() # 判定是否成功 # time.sleep(10) try: success = self.wait.until( EC.text_to_be_present_in_element((By.CLASS_NAME, 'btn write-btn'), '验证成功')) print(success) except: # 失败后重试 # if not success: print("验证失败,重新尝试") self.crack() # else: # self.login() if __name__ == '__main__': crack = Jianshu() crack.crack()
输出结果:
验证码位置 256 664 354 672
{'err_no': 0, 'err_str': 'OK', 'pic_id': '2084311523163100007', 'pic_str': '216,256|91,189|142,243', 'md5': 'c25ad4f3e9746e9aa6fe4930ed10db4a'}
[216, 256]
[91, 189]
[142, 243]