# Python 爬虫通用框架

import requests


def getHTMLText(url):
    """Fetch *url* over HTTP and return the response body as text.

    The request uses a 30-second timeout. The response encoding is set
    from ``apparent_encoding`` (detected from the body) before the text
    is decoded, so pages with a missing or wrong charset header still
    decode sensibly.

    Args:
        url: Address of the page to download.

    Returns:
        The decoded page text on success, or the sentinel string
        ``"产生异常"`` when the request fails (connection error, timeout,
        invalid URL, or an HTTP error status).

    Note:
        Only ``requests.RequestException`` (and its subclasses) is
        handled. Unrelated errors and ``KeyboardInterrupt`` /
        ``SystemExit`` propagate to the caller instead of being
        silently turned into the sentinel string.
    """
    try:
        r = requests.get(url, timeout=30)
        # Raises requests.HTTPError for 4xx/5xx responses.
        r.raise_for_status()
        # Prefer the encoding guessed from the content over the header value.
        r.encoding = r.apparent_encoding
        return r.text
    except requests.RequestException:
        return "产生异常"


if __name__ == "__main__":
    # Demo run: download one sample product page and print whatever
    # getHTMLText returns (the page text or its failure string).
    url = "https://item.jd.com/5107323.html"
    html = getHTMLText(url)
    print(html)


猜你喜欢

转载自blog.51cto.com/13941177/2353820