Selenium模拟登录魅族

Selenium模拟登录魅族

  • 魅族的验证码采用了第三方「极验」验证码平台,破解比较复杂,故采用打码平台超级鹰进行识别。原理是将验证码图片转换成字节流发送给超级鹰,超级鹰会返回验证码所在的坐标。
  • 超级鹰注册后绑定微信会获取1000题分供测试使用。
  • 超级鹰python API
#!/usr/bin/env python
# coding:utf-8

import requests
from hashlib import md5


# 超级鹰打码平台

class Chaojiying(object):

    def __init__(self, username, password, soft_id):
        self.username = username
        password = password.encode('utf8')
        self.password = md5(password).hexdigest()
        self.soft_id = soft_id
        self.base_params = {
            'user': self.username,
            'pass2': self.password,
            'softid': self.soft_id,
        }
        self.headers = {
            'Connection': 'Keep-Alive',
            'User-Agent': 'Mozilla/4.0 (compatible; MSIE 8.0; Windows NT 5.1; Trident/4.0)',
        }

    def PostPic(self, im, codetype):
        """
        im: 图片字节
        codetype: 题目类型 参考 http://www.chaojiying.com/price.html
        """
        params = {
            'codetype': codetype,
        }
        params.update(self.base_params)
        files = {'userfile': ('ccc.jpg', im)}
        r = requests.post('http://upload.chaojiying.net/Upload/Processing.php', data=params, files=files,
                          headers=self.headers)
        return r.json()

    def ReportError(self, im_id):
        """
        im_id:报错题目的图片ID
        """
        params = {
            'id': im_id,
        }
        params.update(self.base_params)
        r = requests.post('http://upload.chaojiying.net/Upload/ReportError.php', data=params, headers=self.headers)
        return r.json()


if __name__ == '__main__':
    chaojiying = Chaojiying('xxxx', 'xxxx', 'xxxx')
    im = open('captch.png', 'rb').read()
    print(chaojiying.PostPic(im, 9004))

  • meizu_login.py
    ==难点是验证码图片的获取要完整,在这里我选择了通过URL去获取,获得的图片类似于下图:==


    captcha.png
import time
import urllib.request
from io import BytesIO
from PIL import Image
from selenium import webdriver
from selenium.webdriver import ActionChains
from selenium.webdriver.common.by import By
from selenium.webdriver.support.ui import WebDriverWait
from selenium.webdriver.support import expected_conditions as EC

from robot.media_admin.meizu_spider.chaojiying import Chaojiying
from utils.LogUtil import LogHandler

logger = LogHandler('meizu_login')

CHAOJIYING_USERNAME = 'xxx'
CHAOJIYING_PASSWORD = 'xxx'
CHAOJIYING_SOFT_ID = '901142' #软件ID官网生成
CHAOJIYING_KIND = '9004' 


class MeizuLogin():
    """
    主类
    通过调用 chaojiying 类中的 多个方法进行图片上传,结果获取
    """

    def __init__(self, username, password):
        self.url = "https://login.flyme.cn/sso?appuri=http%3A%2F%2Fmzdsp.meizu.com%2Flogin&useruri=&sid=&service=app&" \
                   "autodirct=true"
        path = '自己设备上chromedriver的路径'
        self.browser = webdriver.Chrome(executable_path=path)
        self.browser.maximize_window()
        self.wait = WebDriverWait(self.browser, 20)
        self.email = username
        self.password = password
        self.chaojiying = Chaojiying(CHAOJIYING_USERNAME, CHAOJIYING_PASSWORD, CHAOJIYING_SOFT_ID)

    def __del__(self):
        self.browser.close()

    def open(self):
        """
        打开网页输入用户名密码
        :return: None
        """
        self.browser.get(self.url)
        email = self.wait.until(EC.presence_of_element_located((By.ID, 'account')))
        password = self.wait.until(EC.presence_of_element_located((By.ID, 'password')))
        email.send_keys(self.email)
        password.send_keys(self.password)

    def get_touclick_element(self):
        """
        获取验证图片对象,就是验证码的点击区域
        :return: 图片对象
        """

        element = self.wait.until(EC.presence_of_element_located(
            (By.CLASS_NAME, 'geetest_item_img')))
        return element

    def get_position(self):
        """
        从节点对象,获取验证码位置
        :return: 验证码位置元组
        """
        element = self.get_touclick_element()
        time.sleep(2)
        location = element.location
        size = element.size
        top, bottom, left, right = location['y'], location['y'] + size['height'], location['x'], location['x'] + size[
            'width']
        return (top * 2, bottom * 2, left * 2, right * 2)

    def get_screenshot(self):
        """
        根据验证码位置,获取网页截图
        :return: 截图对象
        """
        screenshot = self.browser.get_screenshot_as_png()
        screenshot = Image.open(BytesIO(screenshot))
        return screenshot

    def get_touclick_image(self, name='captcha.png'):
        """
        保存验证码图片到本地
        :return: 图片对象
        """
        top, bottom, left, right = self.get_position()
        print('验证码位置', top, bottom, left, right)
        screenshot = self.get_screenshot()
        captcha = screenshot.crop((left, top, right, bottom))
        captcha.save(name)
        return captcha

    def get_points(self, captcha_result):
        """
        {'err_no': 0, 'err_str': 'OK', 'pic_id': '9069220022448500002', 'pic_str': '208,75|269,156', 'md5': 'a2175369130a2ca56a77573cbf5cc7dc'}
        解析识别结果,就是解析超级鹰返回的数据
        :param captcha_result: 识别结果
        :return: 转化后的结果
        """
        groups = captcha_result.get('pic_str').split('|')
        locations = [[int(number) for number in group.split(',')] for group in groups]
        return locations

    def touch_click_words(self, locations):
        """
        点击验证图片
        :param locations: 点击位置
        :return: None
        """
        for location in locations:
            print(location)
            ActionChains(self.browser).move_to_element_with_offset(self.get_touclick_element(), location[0],
                                                                   location[1]).click().perform()
            time.sleep(1)

    def crack(self):
        """
        破解入口
        :return: None
        """
        try:
            self.open()
            self.browser.find_element_by_class_name('geetest_radar_tip_content').click()
            time.sleep(2)
            # 获取验证码图片
            image_src = str(self.browser.find_element_by_class_name('geetest_item_img').get_attribute('src'))
            print(image_src)
            image_src = image_src + 'png'
            image = urllib.request.urlretrieve(image_src, filename='captcha.png')
            im = open('captcha.png', 'rb').read()
            # 识别验证码
            result = self.chaojiying.PostPic(im, CHAOJIYING_KIND)
            logger.info(result)
            locations = self.get_points(result)
            print(locations)
            # 进行点击图片
            self.touch_click_words(locations)
            time.sleep(2)

            # 点击登陆
            self.browser.find_element_by_class_name('geetest_commit_tip').click()
            time.sleep(1)
            submit = self.wait.until(EC.element_to_be_clickable((By.ID, 'login')))
            submit.click()
            time.sleep(2)
            login_id = self.browser.find_element_by_xpath('//*[@id="app"]/header/div[2]/div/p[2]/small').text
            print(login_id)
            return login_id
        except Exception as e:
            # 如果失败了超级鹰会返回分值
            logger.error('登录失败:%s', e)
            self.chaojiying.ReportError(result['pic_id'])
            return None
        finally:
            # 退出chrome-headless 浏览器
            self.browser.quit()


if __name__ == '__main__':
    username = 'xxx'
    password = 'xxx'
    for i in range(3):
        crack = MeizuLogin(username, password)
        uid = crack.crack()
        if uid is None:
            continue
        else:
            print(uid)
            break

©著作权归作者所有,转载或内容合作请联系作者
平台声明:文章内容(如有图片或视频亦包括在内)由作者上传并发布,文章内容仅代表作者本人观点,简书系信息发布平台,仅提供信息存储服务。

推荐阅读更多精彩内容

  • 爬虫验证码中还是有很多的特别难破解的,比如BT的12306 哈哈~,是不是被难倒了,没关系,这次说的是打码平台,可...
    煎炼阅读 5,110评论 0 2
  • 2018.8.21(545~403) 女儿今天继续赶着录制小时候听的录音磁带,她要把小时候听过的录音转化为电子...
    方正省阅读 1,192评论 0 0
  • 材料:梅心肉(高手说,要眉毛肉,关键我对猪身上的分布不清楚,大家自己问度娘,话说这块肉比较嫩) 调料:叉烧酱(推荐...
    阳的乐活阅读 984评论 0 2
  • 2017年12月7日,我有幸受邀参加了微博“V影响力峰会法律论坛”。各位大V、金V的经验分享、圆桌讨论,让我这个一...
    罗艺律师阅读 235评论 0 1