4.1创建爬虫项目
mkvirtualenv article_spider
scrapy startproject AiticleSpider
scrapy genspider {爬虫名称} {网站域名}
scrapy genspider jobbole blog.jobbole.com
# -*- coding: utf-8 -*-
import scrapy
class JobboleSpider(scrapy.Spider):
    """Skeleton spider for blog.jobbole.com.

    This is the template produced by
    ``scrapy genspider jobbole blog.jobbole.com``; it declares where the
    crawl starts but does not extract anything yet.
    """

    # Identifier used to select this spider, e.g. ``scrapy crawl jobbole``.
    name = 'jobbole'
    # Domains the spider is allowed to crawl.
    allowed_domains = ['blog.jobbole.com']
    # URLs the crawl begins from.
    start_urls = ['http://blog.jobbole.com/']

    def parse(self, response):
        """Handle a downloaded response.

        Placeholder: currently does nothing and returns ``None``. Extraction
        logic for ``response`` is meant to be added here.
        """