您现在的位置是：首页 > 其它

当前栏目

19.SimLogin_case07

时间：2023-09-11 14:21:24

# 模拟登录豆瓣

from urllib.request import urlretrieve
import requests
from bs4 import BeautifulSoup
from os import remove
try:
    import cookielib
except BaseException:
    import http.cookiejar as cookielib
try:
    from PIL import Image
except BaseException:
    pass

# Login endpoint that receives the credential form.
url = 'https://accounts.douban.com/login'

# Form fields posted on login; the account, password and captcha entries are
# added to this dict at runtime.
datas = {'source': 'index_nav',
         'remember': 'on'}

# Browser-like headers passed to the HTTP calls made through requests.
headers = {
    'Referer': 'https://www.douban.com/',
    'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36'
    ' (KHTML, like Gecko) Chrome/60.0.3112.101 Safari/537.36',
    'Accept': 'text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,image/apng,*/*;q=0.8',
    'Accept-Language': 'zh-CN,zh;q=0.8'}

# Try to reuse the cookie information saved by a previous run.
session = requests.session()
session.cookies = cookielib.LWPCookieJar(filename='cookies')
try:
    session.cookies.load(ignore_discard=True)
except (IOError, OSError, cookielib.LoadError):
    # Only a missing, unreadable or malformed cookie file lands here;
    # KeyboardInterrupt / SystemExit are no longer swallowed.
    print("Cookies未能加载")
    # Cookies could not be loaded, so ask for the account and password.
    datas['form_email'] = input('Please input your account:')
    datas['form_password'] = input('Please input your password:')

def get_captcha():
    '''
    Fetch the captcha from the login page and ask the user to solve it.

    Posts the current form data to the login URL, looks up the captcha
    image and the hidden ``captcha-id`` field in the returned HTML,
    downloads the image to ``captcha.jpg``, tries to display it, and reads
    the solution from standard input. The downloaded file is removed
    afterwards, even when reading the solution fails.

    Returns:
        A ``(captcha, captcha_id)`` tuple: the text typed by the user and
        the value of the hidden ``captcha-id`` input. ``(None, None)`` when
        the page contains no captcha image or no ``captcha-id`` field.
    '''
    r = requests.post(url, data=datas, headers=headers)
    soup = BeautifulSoup(r.text, "html.parser")
    # Locate the captcha image and its hidden id with bs4. find() returns
    # None when the element is absent, so check before dereferencing.
    img = soup.find('img', {'id': 'captcha_image'})
    id_field = soup.find('input', {'type': 'hidden', 'name': 'captcha-id'})
    if img is None or id_field is None:
        return None, None
    captcha_id = id_field.get('value')

    urlretrieve(img.get('src'), 'captcha.jpg')
    try:
        try:
            # Image is undefined when the optional PIL import failed; the
            # resulting NameError is handled like any other display failure.
            with Image.open('captcha.jpg') as im:
                im.show()
        except Exception:
            print('到本地目录打开captcha.jpg获取验证码')
        captcha = input('please input the captcha:')
    finally:
        # Always clean up the temporary image, even if the prompt is aborted.
        remove('captcha.jpg')
    return captcha, captcha_id

def isLogin():
    '''
    Report whether the current session is already logged in.

    Requests the account page without following redirects and treats a
    200 status code as "logged in"; any other status yields False.
    '''
    account_url = "https://www.douban.com/accounts/"
    response = session.get(
        account_url, headers=headers, allow_redirects=False)
    return response.status_code == 200

def login():
    '''
    Log in with account, password and captcha, then persist the cookies.

    Prompts for any credential that is still missing from the form data,
    obtains the captcha solution and id, posts the login form through the
    shared session, prints the link text of every ``div.title`` element on
    the returned page, and saves the session cookies to the cookie file.
    '''
    # Credentials are only requested at start-up when the cookie file could
    # not be loaded. With loaded but no longer valid cookies they are still
    # missing here, so ask for them before posting the form.
    if 'form_email' not in datas:
        datas['form_email'] = input('Please input your account:')
    if 'form_password' not in datas:
        datas['form_password'] = input('Please input your password:')

    captcha, captcha_id = get_captcha()
    # Add the captcha fields to the form data; never post valueless fields.
    if captcha is not None and captcha_id is not None:
        datas['captcha-solution'] = captcha
        datas['captcha-id'] = captcha_id

    login_page = session.post(url, data=datas, headers=headers)
    soup = BeautifulSoup(login_page.text, "html.parser")
    # On the page shown after login, print the popular content titles.
    for item in soup.find_all('div', attrs={'class': 'title'}):
        link = item.find('a')
        # A title block without a link has nothing to print.
        if link is not None:
            print(link.get_text())

    # Save the cookies to file so the next run can log in with them instead
    # of asking for account and password. ignore_discard=True mirrors the
    # load() call; without it session cookies are not written.
    session.cookies.save(ignore_discard=True)

if __name__ == '__main__':
    # Log in only when the stored cookies do not already give a session.
    if not isLogin():
        login()
    else:
        print('Login successfully')

猜你喜欢

【开发者思维】优秀开发者应该具备的25个思维习惯
拿下“[warn] (OS 64)指定的网络名不再可用”错误
辉芒微电子-使用verilog实现一个或门的电路。
nginx js、css多个请求合并为一个请求(concat模块)
160. 相交链表 ——【Leetcode每日一题】
IOCP(完成端口)开发手记(3)
tesseract图像识别验证码：安装使用和避免坑
(NO.00001)iOS游戏SpeedBoy Lite成形记(二十一)
常见的反爬措施：UA反爬和Cookie反爬
MVC 编程模型及其变种
SAP Emarsys 的前后台技术栈
ios开发UI篇—Kvc简单介绍
设计模式----解释器模式
第十三届蓝桥杯 C++ B组省赛 C 题——刷题统计（AC）
JS 异步错误捕获
java 23种设计模式深入理解
【English】20190418

相关主题

zl程序教程

当前栏目

19.SimLogin_case07

相关文章