码迷,mamicode.com
首页 > 其他好文 > 详细

抽屉网点赞爬虫

时间:2018-08-24 00:29:03      阅读:246      评论:0      收藏:0      [点我收藏+]

标签:pass   turn   gecko   认证   log   windows   ike   win   nbsp   

import requests
from bs4 import BeautifulSoup
import time


user_cookie = ""
# 注意:抽屉网    cookies中的gpsd是最要的验证数据
def login(phone_id, phone_pwd):
    global user_cookie
    # 因为抽屉的cookie设置比较特别,其cookie为未登录状态下的cookie通过登录成功来进行验证,从而认证为登录状态下的cookie
    r1 = requests.get(
        url= https://dig.chouti.com/,
        headers = {
            User-Agent: Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/68.0.3440.106 Safari/537.36,
        }
    )
    user_cookie = r1.cookies.get_dict()

    r2 = requests.post(
        url= https://dig.chouti.com/login,
        headers = {
            User-Agent: Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/68.0.3440.106 Safari/537.36,
        },
        data = {
            "phone": "86%d" % int(phone_id),
            "password": phone_pwd,
            "oneMonth": 1
        },
        cookies = user_cookie
    )
    # 返回认证后的cookie
    return user_cookie

def thumbsup():
    # 抽屉新热榜只有120页
    i=1
    while i <= 120:
        r3 = requests.get(
            url= https://dig.chouti.com/all/hot/recent/%d% i,
            headers = {
                User-Agent: Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/68.0.3440.106 Safari/537.36,
            },
            cookies = user_cookie,
        )
        print("正在给第%d页点赞" % i,)
        soup = BeautifulSoup(r3.text, html.parser)
        res_list = soup.find_all(name=div, attrs={class: item})
        for res in res_list:
            requests.post(
                url=https://dig.chouti.com/link/vote?linksId=%d % int(res.find(name=img).attrs[lang]),
                headers={
                    User-Agent: Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/68.0.3440.106 Safari/537.36,
                },
                cookies=user_cookie
            )
            time.sleep(0.5)
        i+=1
        print("准备执行下一页...")


def main():
    login("手机号", "密码")
    thumbsup()


if __name__ == "__main__":
    main()

 

抽屉网点赞爬虫

标签:pass   turn   gecko   认证   log   windows   ike   win   nbsp   

原文地址:https://www.cnblogs.com/fengbo1113/p/9527199.html

(0)
(0)
   
举报
评论 一句话评论(0
登录后才能评论!
© 2014 mamicode.com 版权所有  联系我们:gaon5@hotmail.com
迷上了代码!