爬虫学习

#通用爬虫框架
import requests as r
def getHTMLText(url):
    """Download ``url`` and return the response body as text.

    The request is issued with a 30-second timeout. An HTTP error status is
    treated as a failure. Before the body is decoded, the response encoding
    is replaced with the one detected from the content itself, which makes
    pages with a missing or wrong charset header more likely to decode
    properly.

    Args:
        url: Address of the page to fetch.

    Returns:
        The decoded page text, or the fixed string "产生异常" when the
        request fails.
    """
    try:
        resp = r.get(url, timeout=30)
        # Turn 4xx/5xx responses into HTTPError so they take the failure path.
        resp.raise_for_status()
        # Decode with the encoding guessed from the body, not the header value.
        resp.encoding = resp.apparent_encoding
        return resp.text
    except r.RequestException:
        # Catch only the base class of the errors requests raises, so that
        # KeyboardInterrupt, SystemExit and programming errors are not
        # silently turned into the failure string.
        return "产生异常"
if __name__ == "__main__":
    # Script entry point: fetch the Baidu home page and print whatever comes
    # back (the page text, or the failure message from getHTMLText).
    page = getHTMLText("http://www.baidu.com")
    print(page)

原文地址:https://www.cnblogs.com/xinqidian/p/10200805.html