爬百度100次
阿新 • • 發佈:2018-02-28
框架 url odin class range aid quest htm ise
"""Fetch a page repeatedly and report how long the whole run took."""

import time

import requests

# Sentinel string returned by getHTMLText when a request fails. Kept as the
# original literal so existing callers comparing against it keep working.
FETCH_FAILED = "異常退出"


def getHTMLText(url):
    """Download *url* and return the response body as text.

    Args:
        url: Address to request with HTTP GET (20 second timeout).

    Returns:
        The decoded response text, or the ``FETCH_FAILED`` sentinel string
        when the request fails or the server answers with an error status.
    """
    try:
        r = requests.get(url, timeout=20)
        # Turn 4xx/5xx answers into exceptions so they share the failure path.
        r.raise_for_status()
    except requests.RequestException:
        # Only request-related failures are swallowed; KeyboardInterrupt and
        # programming errors propagate instead of being hidden.
        return FETCH_FAILED
    else:
        # Use the encoding detected from the body rather than the header
        # default, which is often wrong for non-ASCII pages.
        r.encoding = r.apparent_encoding
        return r.text


def main(url="https://www.baidu.com", count=100):
    """Fetch *url* *count* times, print per-request status and total time.

    Args:
        url: Page to fetch on every iteration.
        count: Number of requests to issue.
    """
    # perf_counter is monotonic, so the interval is not affected by
    # wall-clock adjustments during the run.
    start = time.perf_counter()
    for i in range(count):
        # Report success only when the fetch did not return the sentinel.
        if getHTMLText(url) == FETCH_FAILED:
            print('第%d次失敗' % (i + 1))
        else:
            print('第%d次成功' % (i + 1))

    end = time.perf_counter()
    print("爬取用時為: ", (end - start), "秒")


if __name__ == "__main__":
    main()
基本爬蟲框架,註意 raise_for_status 與 try、except 的配合使用,方便檢查錯誤
爬百度100次