使用selenium添加cookie模拟登录

登录的网站为拉勾网,URL = https://www.lagou.com/jobs/list_python?labelWords=&fromSearch=true&suginput=
首先登录拉勾网,获取cookie

    def get_cookies(self, first_url='https://www.lagou.com/jobs/list_python?labelWords=&fromSearch=true&suginput='):
        # 获取登录cookie
        self.driver.get(first_url)
        self.driver.find_element_by_class_name('body-btn').click()
        self.driver.find_element_by_class_name('login').click()
        self.driver.find_element_by_xpath('//input[@type="text"]').send_keys('这里输入账号')
        self.driver.find_element_by_xpath('//input[@type="password"]').send_keys('这里输入密码')
        self.driver.find_element_by_class_name('login-password').click()

        # 休眠时间手动打码
        time.sleep(30)
        self.driver.find_element_by_class_name('body-btn').click()
        cookies = self.driver.get_cookies()  # 可以获取cookie下次登录使用
        with open('5-cookies.json', 'w') as f:
            json.dump(cookies, f)

然后使用保存在本地的cookie绕过验证码登录,要注意add_cookie方法中传递的cookie结构

    def get_page(self, first_url='https://www.lagou.com/jobs/list_python?labelWords=&fromSearch=true&suginput='):
        # 读取本地cookie
        with open('5-cookies.json', 'r') as f:
            cookies = json.load(f)

        # 添加的cookie的形式{'name' : 'foo', 'value' : 'bar', 'path' : '/', 'secure':True}
        add_cookies = []
        for cookie in cookies:
            add_cookie = {'name': cookie['name'],
                   'value': cookie['value'],
                   'path': cookie['path'],
                   'secure': cookie['secure']}
            add_cookies.append(add_cookie)
        print(add_cookies)

        # 获取页面使用cookie登录
        self.driver.get(first_url)
        time.sleep(3)
        self.driver.find_element_by_class_name('body-btn').click()
        self.driver.delete_all_cookies()
        # 逐条添加cookie
        for cookie in add_cookies:
            self.driver.add_cookie(cookie)
        self.driver.get(first_url)
        self.driver.find_element_by_class_name('body-btn').click()

        # 清空搜索框输入python
        ipt = self.driver.find_element_by_id('keyword')
        ipt.clear()
        ipt.send_keys('python')
        self.driver.find_element_by_id('submit').click()

你可能感兴趣的:(Python爬虫)