import http.cookiejar  # Python 3 name of Python 2's cookielib module
import urllib.request  # Python 3 merged urllib2 into urllib.request
# Page fetched by all three demonstrations below.
url = "https://dxy.com/faq"


def report(response):
    """Print the status code and the body length of *response*.

    Args:
        response: The object returned by ``urlopen``; it must provide
            ``getcode()`` and ``read()``.
    """
    print(response.getcode())  # 200 means the request succeeded
    # The body is read as raw, undecoded bytes; only its length is printed.
    print(len(response.read()))


def build_request(target_url):
    """Return a ``Request`` for *target_url* carrying a browser User-Agent.

    Args:
        target_url: The URL the request should point at.

    Returns:
        A ``urllib.request.Request`` with the ``user-agent`` header set.
    """
    # ``urllib.request`` is the module; the request class is ``Request``.
    request = urllib.request.Request(target_url)
    # Disguise the crawler as a browser.
    request.add_header("user-agent", "Mozilla/5.0")
    return request


def build_cookie_opener():
    """Build an opener that records cookies in a fresh cookie jar.

    Returns:
        A ``(opener, cookie_jar)`` tuple; ``cookie_jar`` is the
        ``http.cookiejar.CookieJar`` wired into the opener's
        ``HTTPCookieProcessor``.
    """
    cj = http.cookiejar.CookieJar()
    opener = urllib.request.build_opener(urllib.request.HTTPCookieProcessor(cj))
    return opener, cj


def main():
    """Fetch ``url`` three ways, printing status code and body length each time.

    Method one uses a bare ``urlopen``; method two sends a ``Request`` with a
    browser User-Agent header; method three installs a cookie-aware opener
    and additionally prints the cookie jar.
    """
    print("方法一")
    with urllib.request.urlopen(url) as response_1:
        report(response_1)

    print("\n方法二")
    with urllib.request.urlopen(build_request(url)) as response_2:
        report(response_2)

    print("\n方法三")
    opener, cj = build_cookie_opener()
    # install_opener() is called so that the plain urlopen() below goes
    # through the cookie-aware opener.
    urllib.request.install_opener(opener)
    with urllib.request.urlopen(url) as response_3:
        print(response_3.getcode())  # 200 means the request succeeded
        print(cj)
        print(len(response_3.read()))


if __name__ == "__main__":
    main()
# 2019-08-29
# 第三個地方我還用了?
# 2019-08-29
# 這裡是 request = urllib.request.Request(url)  # 返回的是一個 Request 對象