Skip to content

Commit

Permalink
更新后的登录,学习下有点意思
Browse files Browse the repository at this point in the history
  • Loading branch information
xn055591 committed Jan 31, 2018
1 parent 936b39b commit bdb1277
Showing 1 changed file with 69 additions and 16 deletions.
85 changes: 69 additions & 16 deletions login_zhihu.py
Original file line number Diff line number Diff line change
@@ -1,27 +1,80 @@
import requests,time
# -*- coding:UTF-8 -*-

import requests , time
import hmac ,json
from bs4 import BeautifulSoup
url = 'https://www.zhihu.com/login/email'
def get_captcha(data):
from hashlib import sha1


def get_captcha(data,need_cap):
''' 处理验证码 '''
if need_cap is False:
return
with open('captcha.gif','wb') as fb:
fb.write(data)
return input('captcha')
return input('captcha:')

def get_signature(grantType,clientId,source,timestamp):
''' 处理签名 '''

hm = hmac.new(b'd1b964811afb40118a12068ff74a12f4',None,sha1)
hm.update(str.encode(grantType))
hm.update(str.encode(clientId))
hm.update(str.encode(source))
hm.update(str.encode(timestamp))

def login(username,password,oncaptcha):
sessiona = requests.Session()
headers = {'User-Agent':'Mozilla/5.0 (Windows NT 10.0; Win64; x64; rv:47.0) Gecko/20100101 Firefox/47.0'}
xyz = sessiona.get('https://www.zhihu.com/#signin',headers=headers).content
_xsrf = BeautifulSoup(sessiona.get('https://www.zhihu.com/#signin',headers=headers).content,'html.parser').find('input',attrs={'name':'_xsrf'}).get('value')
return str(hm.hexdigest())



def login(username,password,oncaptcha,sessiona,headers):
''' 处理登录 '''

resp1 = sessiona.get('https://www.zhihu.com/signin',headers=headers) # 拿cookie:_xsrf
resp2 = sessiona.get('https://www.zhihu.com/api/v3/oauth/captcha?lang=cn',headers=headers) # 拿cookie:capsion_ticket
need_cap = json.loads(resp2.text)["show_captcha"] # {"show_captcha":false} 表示不用验证码

grantType = 'password'
clientId = 'c3cef7c66a1843f8b3a9e6a1e3160e20'
source ='com.zhihu.web'
timestamp = str((time.time()*1000)).split('.')[0] # 签名只按这个时间戳变化

captcha_content = sessiona.get('https://www.zhihu.com/captcha.gif?r=%d&type=login'%(time.time()*1000),headers=headers).content

data = {
"_xsrf":_xsrf,
"email":username,
"client_id":clientId,
"grant_type":grantType,
"timestamp":timestamp,
"source":source,
"signature": get_signature(grantType,clientId,source,timestamp), # 获取签名
"username":username,
"password":password,
"remember_me":True,
"captcha":oncaptcha(captcha_content)
"lang":"cn",
"captcha":oncaptcha(captcha_content,need_cap), # 获取图片验证码
"ref_source":"other_",
"utm_source":""
}
resp = sessiona.post('https://www.zhihu.com/login/email',data,headers=headers).content
print(resp)

print("**2**: "+str(data))
print("-"*50)
resp = sessiona.post('https://www.zhihu.com/api/v3/oauth/sign_in',data,headers=headers).content
print(BeautifulSoup(resp,'html.parser'))

print("-"*50)
return resp

if __name__ == "__main__":
login('email','password',get_captcha)
sessiona = requests.Session()
headers = {'User-Agent':'Mozilla/5.0 (Windows NT 10.0; Win64; x64; rv:47.0) Gecko/20100101 Firefox/47.0','authorization':'oauth c3cef7c66a1843f8b3a9e6a1e3160e20'}

login('[email protected]','12345678',get_captcha,sessiona,headers) # 用户名密码换自己的就好了
resp = sessiona.get('https://www.zhihu.com/inbox',headers=headers) # 登录进去了,可以看私信了
print(BeautifulSoup(resp.content ,'html.parser'))




### chcp 65001 (win下改变cmd字符集)
### python c:\python34\login_zhihu.py
### 有非常无语的事情发生,还以为代码没生效

0 comments on commit bdb1277

Please sign in to comment.