1. 程式人生 > Python爬取知乎上問題下所有圖片

Python爬取知乎上問題下所有圖片

sts dal b- log email token db4 trie fin

技術分享圖片
from zhihu_oauth import ZhihuClient
from zhihu_oauth.exception import NeedCaptchaException

# Placeholders: substitute your own account before running. The same values
# are used for the first attempt and for the captcha retry; keep real
# credentials out of published source.
email_or_phone = 'email_or_phone'
password = 'password'

client = ZhihuClient()

# NOTE(review): the return value of login() is ignored here, so the success
# message is printed whenever no exception is raised — confirm against the
# zhihu_oauth documentation whether login() can report failure by return value.
try:
    client.login(email_or_phone, password)
    print(u"登陸成功!")
except NeedCaptchaException:
    # Save the captcha image, ask the user to type it in, then log in again.
    with open('a.gif', 'wb') as f:
        f.write(client.get_captcha())
    captcha = input('please input captcha:')
    client.login(email_or_phone, password, captcha)
    print(u"登陸成功!")

# Persist the token on both paths (with or without captcha) so that later
# scripts can call load_token('token.pkl') instead of logging in again.
client.save_token('token.pkl')
獲取Token 技術分享圖片
from __future__ import print_function # 使用python3的print方法
from zhihu_oauth import ZhihuClient
import re
import os
import urllib.request

client = ZhihuClient()
# 登錄 client.load_token(token.pkl) # 加載token文件 id = 46508954 # https://www.zhihu.com/question/24400664(長得好看是一種怎麽樣的體驗) question = client.question(id) print(u"問題:",question.title) print(u"回答數量:",question.answer_count) os.mkdir(question.title + u"(圖片)") path = question.title + u"(圖片)" index = 1 # 圖片序號 for answer in
question.answers: content = answer.content # 回答內容 re_compile = re.compile(r<img src="(https://pic\d\.zhimg\.com/.*?\.(jpg|png))".*?>) img_lists = re.findall(re_compile, content) if (img_lists): for img in img_lists: img_url = img[0] # 圖片url urllib.request.urlretrieve(img_url, path + u"/%d.jpg" % index) print(u"成功保存第%d張圖片" % index) index += 1
加載Token並讀取數據

Python爬取知乎上問題下所有圖片