更新后的登录,学习下有点意思

pull/4/head
xn055591 2018-01-31 19:13:30 +08:00
parent 936b39b8fd
commit bdb12778e7
1 changed files with 69 additions and 16 deletions

View File

@ -1,27 +1,80 @@
import requests,time # -*- coding:UTF-8 -*-
import requests , time
import hmac ,json
from bs4 import BeautifulSoup from bs4 import BeautifulSoup
url = 'https://www.zhihu.com/login/email' from hashlib import sha1
def get_captcha(data):
def get_captcha(data,need_cap):
''' 处理验证码 '''
if need_cap is False:
return
with open('captcha.gif','wb') as fb: with open('captcha.gif','wb') as fb:
fb.write(data) fb.write(data)
return input('captcha') return input('captcha:')
def get_signature(grantType,clientId,source,timestamp):
''' 处理签名 '''
hm = hmac.new(b'd1b964811afb40118a12068ff74a12f4',None,sha1)
hm.update(str.encode(grantType))
hm.update(str.encode(clientId))
hm.update(str.encode(source))
hm.update(str.encode(timestamp))
return str(hm.hexdigest())
def login(username,password,oncaptcha,sessiona,headers):
''' 处理登录 '''
resp1 = sessiona.get('https://www.zhihu.com/signin',headers=headers) # 拿cookie:_xsrf
resp2 = sessiona.get('https://www.zhihu.com/api/v3/oauth/captcha?lang=cn',headers=headers) # 拿cookie:capsion_ticket
need_cap = json.loads(resp2.text)["show_captcha"] # {"show_captcha":false} 表示不用验证码
grantType = 'password'
clientId = 'c3cef7c66a1843f8b3a9e6a1e3160e20'
source ='com.zhihu.web'
timestamp = str((time.time()*1000)).split('.')[0] # 签名只按这个时间戳变化
def login(username,password,oncaptcha):
sessiona = requests.Session()
headers = {'User-Agent':'Mozilla/5.0 (Windows NT 10.0; Win64; x64; rv:47.0) Gecko/20100101 Firefox/47.0'}
xyz = sessiona.get('https://www.zhihu.com/#signin',headers=headers).content
_xsrf = BeautifulSoup(sessiona.get('https://www.zhihu.com/#signin',headers=headers).content,'html.parser').find('input',attrs={'name':'_xsrf'}).get('value')
captcha_content = sessiona.get('https://www.zhihu.com/captcha.gif?r=%d&type=login'%(time.time()*1000),headers=headers).content captcha_content = sessiona.get('https://www.zhihu.com/captcha.gif?r=%d&type=login'%(time.time()*1000),headers=headers).content
data = { data = {
"_xsrf":_xsrf, "client_id":clientId,
"email":username, "grant_type":grantType,
"timestamp":timestamp,
"source":source,
"signature": get_signature(grantType,clientId,source,timestamp), # 获取签名
"username":username,
"password":password, "password":password,
"remember_me":True, "lang":"cn",
"captcha":oncaptcha(captcha_content) "captcha":oncaptcha(captcha_content,need_cap), # 获取图片验证码
"ref_source":"other_",
"utm_source":""
} }
resp = sessiona.post('https://www.zhihu.com/login/email',data,headers=headers).content
print(resp) print("**2**: "+str(data))
print("-"*50)
resp = sessiona.post('https://www.zhihu.com/api/v3/oauth/sign_in',data,headers=headers).content
print(BeautifulSoup(resp,'html.parser'))
print("-"*50)
return resp return resp
if __name__ == "__main__": if __name__ == "__main__":
login('email','password',get_captcha) sessiona = requests.Session()
headers = {'User-Agent':'Mozilla/5.0 (Windows NT 10.0; Win64; x64; rv:47.0) Gecko/20100101 Firefox/47.0','authorization':'oauth c3cef7c66a1843f8b3a9e6a1e3160e20'}
login('12345678@qq.com','12345678',get_captcha,sessiona,headers) # 用户名密码换自己的就好了
resp = sessiona.get('https://www.zhihu.com/inbox',headers=headers) # 登录进去了,可以看私信了
print(BeautifulSoup(resp.content ,'html.parser'))
### chcp 65001 (win下改变cmd字符集)
### python c:\python34\login_zhihu.py
### 有非常无语的事情发生,还以为代码没生效