scrapy自定义起始url

# -*- coding: utf-8 -*-
import scrapy
from scrapy.http import Request
from scrapy.core.engine import ExecutionEngine

class ChoutiSpider(scrapy.Spider):
    """Example spider that customises how its initial requests are built.

    Instead of relying on the default start-request handling, this spider
    overrides ``start_requests`` to construct each ``Request`` explicitly
    from ``start_urls``.
    """

    name = 'baidu'
    allowed_domains = ['baidu.com']
    start_urls = ['http://baidu.com/']

    def start_requests(self):
        """Yield one ``Request`` per URL in ``start_urls``.

        Each request is created with ``dont_filter=True`` and is routed to
        :meth:`parse`.

        Yields:
            Request: a request for each configured start URL.
        """
        for url in self.start_urls:
            # Because of ``yield`` this method is a generator; the caller
            # iterates over it to obtain the requests one by one.
            # The callback must be a method that exists on this class: the
            # original referenced ``self.parse1``, which is not defined and
            # raised AttributeError as soon as the generator was consumed.
            yield Request(url, dont_filter=True, callback=self.parse)

    def parse(self, response):
        """Handle the response of a start request.

        Placeholder: the response is currently ignored.
        """
        pass

  

posted @ 2018-03-22 16:43  老王的农场  阅读(161)  评论(0)  编辑  收藏  举报