模拟登录豆瓣

Python 3 使用 POST 提交表单登录豆瓣

import urllib.request
import requests
import http.cookiejar
import zlib
import json
import random
import time
import urllib
from lxml import etree

# Disable certificate verification globally.
# NOTE(review): this swaps ssl's private default-HTTPS-context factory for
# ssl._create_unverified_context, so it relies on a private ssl attribute and
# turns off certificate checks process-wide -- confirm this is acceptable.
import ssl
ssl._create_default_https_context = ssl._create_unverified_context

# Obtain a CookieJar object (cookie data stored on this machine) -- currently disabled:
#cookie = http.cookiejar.CookieJar()
#opener = urllib.request.install_opener(urllib.request.HTTPCookieProcessor(cookie))
# Address of the Douban login page.
url = 'https://accounts.douban.com/login'

# Pool of alternative request headers, one entry per browser User-Agent string.
# Each entry is a dict mapping the header name to its value. Note the colon:
# writing {'User-Agent', '...'} with a comma would create a two-element set,
# which cannot be used as a header mapping.
hds = [
    {'User-Agent': 'Mozilla/5.0 (Windows; U; Windows NT 6.1; en-US; rv:1.9.1.6) Gecko/20091201 Firefox/3.5.6'},
    {'User-Agent': 'Mozilla/5.0 (Windows NT 6.2) AppleWebKit/535.11 (KHTML, like Gecko) Chrome/17.0.963.12 Safari/535.11'},
    {'User-Agent': 'Mozilla/5.0 (compatible; MSIE 10.0; Windows NT 6.2; Trident/6.0)'},
    {'User-Agent': 'Mozilla/5.0 (X11; Ubuntu; Linux x86_64; rv:34.0) Gecko/20100101 Firefox/34.0'},
    {'User-Agent': 'Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Ubuntu Chromium/44.0.2403.89 Chrome/44.0.2403.89 Safari/537.36'},
    {'User-Agent': 'Mozilla/5.0 (Macintosh; U; Intel Mac OS X 10_6_8; en-us) AppleWebKit/534.50 (KHTML, like Gecko) Version/5.1 Safari/534.50'},
    {'User-Agent': 'Mozilla/5.0 (Windows; U; Windows NT 6.1; en-us) AppleWebKit/534.50 (KHTML, like Gecko) Version/5.1 Safari/534.50'},
    # NOTE(review): the closing ')' appears to be missing from this UA string;
    # left unchanged because it is sent verbatim -- confirm before editing.
    {'User-Agent': 'Mozilla/5.0 (compatible; MSIE 9.0; Windows NT 6.1; Trident/5.0'},
    {'User-Agent': 'Mozilla/5.0 (Macintosh; Intel Mac OS X 10.6; rv:2.0.1) Gecko/20100101 Firefox/4.0.1'},
    {'User-Agent': 'Mozilla/5.0 (Windows NT 6.1; rv:2.0.1) Gecko/20100101 Firefox/4.0.1'},
    {'User-Agent': 'Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_0) AppleWebKit/535.11 (KHTML, like Gecko) Chrome/17.0.963.56 Safari/535.11'},
    {'User-Agent': 'Opera/9.80 (Macintosh; Intel Mac OS X 10.6.8; U; en) Presto/2.8.131 Version/11.11'},
    {'User-Agent': 'Opera/9.80 (Windows NT 6.1; U; en) Presto/2.8.131 Version/11.11'},
]

# Fields of the login form for the first request; the credential values are
# placeholders to be replaced with a real account.
Formdata = {
    'redir': 'https://www.douban.com/people/175030420/',
    'form_email': 'xxxxxxxxxx',
    'form_password': 'xxxxxxxxxx',
    'login': '登陆',
}

headers = {'User-agent': 'Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/60.0.3112.113 Safari/537.36'}

# Hand the dict itself to requests: it form-encodes the fields and sets the
# application/x-www-form-urlencoded Content-Type header. A string that was
# already passed through urlencode() is posted as a raw body without that
# header, so the server may not treat it as form data.
# NOTE(review): verify=False turns off TLS certificate verification for this call.
content = requests.post(url, data=Formdata, headers=headers, verify=False)

import os  # used only to make sure the captcha output directory exists

# Parse the HTML returned by the first request and use XPath to pull the
# captcha image URL and captcha id out of the login form.
login_page = etree.HTML(content.text)
captcha_urls = login_page.xpath('//img[@id="captcha_image"]/@src')
captcha_ids = login_page.xpath('//input[@name="captcha-id"]/@value')

# xpath() returns a list that is empty when the page has no captcha; indexing
# it unconditionally would raise IndexError, so fall back to None instead.
captcha_url = captcha_urls[0] if captcha_urls else None
captcha_id = captcha_ids[0] if captcha_ids else None
captcha = None
captcha_solution = None

# Where the captcha image is saved so the user can open it and read it.
filename = '../爬虫数据/captcha.png'

# Login form for the second request; credential values are placeholders.
Formdata = {
    'redir': 'https://www.douban.com/people/175030420/',
    'form_email': 'your email',
    'form_password': 'your password',
    'login': '登陆',
}

if captcha_url and captcha_id:
    # urlretrieve() cannot create missing parent directories itself.
    os.makedirs(os.path.dirname(filename), exist_ok=True)
    urllib.request.urlretrieve(captcha_url, filename)
    # The captcha is solved manually: the user types what the image shows.
    captcha = input("please input the captcha:")
    captcha_solution = captcha
    Formdata['captcha-solution'] = captcha
    Formdata['captcha-id'] = captcha_id

# Submit the login form (with the captcha fields when one was presented) and
# print the HTML of the response.
# NOTE(review): verify=False turns off TLS certificate verification for this call.
con = requests.post(url, data=Formdata, headers=headers, verify=False)
page = con.text
print(page)
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值