Scrapy 自定义起始 URL

# -*- coding: utf-8 -*-
import scrapy
from scrapy.http import Request
from scrapy.core.engine import ExecutionEngine

class ChoutiSpider(scrapy.Spider):
    """Example spider showing how to customise the initial requests.

    Overrides ``start_requests`` so that every URL in ``start_urls`` is
    turned into a ``Request`` explicitly, instead of relying on the
    default implementation inherited from ``scrapy.Spider``.
    """

    name = 'baidu'
    allowed_domains = ['baidu.com']
    start_urls = ['http://baidu.com/']

    def start_requests(self):
        """Yield one ``Request`` per entry in ``start_urls``.

        Because this method contains ``yield`` it returns a generator,
        which the caller iterates to obtain the requests one by one.
        """
        for url in self.start_urls:
            # The callback must be a method that exists on the spider: the
            # previous ``self.parse1`` was never defined and raised
            # AttributeError as soon as the generator was iterated.
            # ``dont_filter=True`` is kept so the start request is not
            # dropped by the scheduler's duplicate filter.
            yield Request(url, dont_filter=True, callback=self.parse)

    def parse(self, response):
        """Handle the response of a start request (placeholder, does nothing)."""
        pass

  

原文地址:https://www.cnblogs.com/catherine007/p/8624805.html