爬虫-retrying用法

文档:https://pypi.org/project/retrying/

安装

pip install retrying

设置最大重试次数

# coding=utf-8
import requests
from retrying import retry

# Default request headers sent with every request made by this script.
headers = {
    "User-Agent": "Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/71.0.3578.80 Safari/537.36",
}

@retry(stop_max_attempt_number=3)  # on error, try again; stop_max_attempt_number caps the attempts at 3
def _parse_url(url, method, data, proxies):
    """Send one HTTP request and return the decoded response body.

    Args:
        url: Address to request.
        method: "POST" sends a POST with ``data`` as the body; any other
            value sends a GET.
        data: Payload passed to ``requests.post``; unused for GET.
        proxies: Proxy mapping forwarded to ``requests``.

    Returns:
        The response body decoded with ``bytes.decode()`` defaults (UTF-8).

    Raises:
        AssertionError: If the response status code is not 200.
        Exception: Whatever ``requests`` or the decode step raises. Any
            exception makes the ``retry`` decorator call this function again.
    """
    # One marker line per attempt, so retries are visible on stdout.
    print("*" * 20)
    if method == "POST":
        # Same timeout as GET: without it a stalled server would block
        # forever and the retry logic would never get a chance to run.
        response = requests.post(url, data=data, headers=headers, timeout=3, proxies=proxies)
    else:
        response = requests.get(url, headers=headers, timeout=3, proxies=proxies)
    # Raised explicitly instead of using ``assert`` so the check is not
    # stripped when Python runs with -O; the exception type is unchanged.
    if response.status_code != 200:
        raise AssertionError(
            "unexpected HTTP status %s for %s" % (response.status_code, url)
        )
    return response.content.decode()

def parse_url(url, method="GET", data=None, proxies=None):
    """Fetch ``url`` and return its body as text, or ``None`` on failure.

    Delegates to ``_parse_url`` and converts any error it raises into a
    ``None`` result, so callers can test the return value instead of
    handling exceptions.

    Args:
        url: Address to request.
        method: "GET" (default) or "POST".
        data: Payload for POST requests; defaults to ``None``.
        proxies: Optional proxy mapping; ``None`` (default) is treated as an
            empty mapping.

    Returns:
        The decoded response body, or ``None`` if the request failed.
    """
    # Avoid a shared mutable default; each call gets its own empty mapping.
    if proxies is None:
        proxies = {}
    try:
        return _parse_url(url, method, data, proxies)
    except Exception:
        # Best-effort fetch: report failure as None. Catching Exception
        # (not a bare except) lets KeyboardInterrupt/SystemExit propagate.
        return None

if __name__ == "__main__":
    # Demo run: fetch one page and print the result (None when fetching fails).
    # NOTE(review): the URL has no scheme ("http://"); presumably this is
    # deliberate so the request fails and the retries become visible - confirm.
    print(parse_url("www.baidu.com"))
原文地址:https://www.cnblogs.com/yifengs/p/11724629.html