# 基本爬取代码
import requests
def getHTMLText(url, timeout=30):
    """Fetch *url* and return the first 1000 characters of its decoded body.

    The request is sent with a browser-like ``User-Agent`` header, and the
    response's encoding is replaced by ``apparent_encoding`` before the text
    is read.

    Args:
        url: Address to request.
        timeout: Seconds to wait on the server before giving up; forwarded
            unchanged to ``requests.get``. Without it a stalled server
            could block the call indefinitely.

    Returns:
        At most the first 1000 characters of the response text, or the
        literal string '产生异常' when the fetch fails for any reason
        (bad URL, connection problem, timeout, HTTP error status, ...).
    """
    headers = {'user-agent': 'Mozilla/5.0'}
    try:
        response = requests.get(url, headers=headers, timeout=timeout)
        # Treat HTTP error statuses as failures instead of returning
        # the error page's body.
        response.raise_for_status()
        response.encoding = response.apparent_encoding
        return response.text[:1000]
    except Exception:
        # Best-effort contract: callers get a sentinel string rather than an
        # exception. ``Exception`` (not a bare ``except``) is used so that
        # KeyboardInterrupt and SystemExit still propagate.
        return '产生异常'
if __name__ == "__main__":
    # Script entry point: fetch one fixed page and print whatever
    # getHTMLText returns for it (a text excerpt or its failure string).
    demo_url = 'http://www.baidu.com/'
    page_excerpt = getHTMLText(demo_url)
    print(page_excerpt)
# 转载请注明原文地址:https://ipadbbs.8miu.com/read-46901.html