import urllib.request
# Fetch the Douban home page with a browser-like User-Agent header, print the
# decoded body, then print some metadata about the HTTP response.
weburl = "http://www.douban.com/"
webheader = {
    'User-Agent':
        'Mozilla/5.0 (Windows NT 6.1; WOW64; rv:23.0) Gecko/20100101 Firefox/23.0',
}
req = urllib.request.Request(url=weburl, headers=webheader)

# Use the response as a context manager so the underlying connection is
# closed even if reading or decoding raises.
with urllib.request.urlopen(req) as webPage:
    data = webPage.read()
    # NOTE(review): the body is assumed to be UTF-8 encoded; decode() raises
    # UnicodeDecodeError otherwise.
    data = data.decode('UTF-8')

    # The printed content is the page source, i.e. what the browser's
    # developer tools (F12) show.
    print(data)

    # Type of the response object returned by urlopen().
    print(type(webPage))

    # URL of the resource actually retrieved.
    print(webPage.geturl())

    # Response meta-information (the HTTP headers).
    print(webPage.info())

    # HTTP status code of the response (not a "verification code").
    print(webPage.getcode())