Commit e9a72ff93a8a99a5107bbc6118235cc0f27c15a8
1 parent: 5867e020
Exists in: master
Tune to CentOS
Showing 1 changed file with 2 additions and 2 deletions
Show diff stats
crawler/crawler/spiders/ImgCrawler.py
1 | -from scrapy.spider import Spider | |
1 | +from scrapy.spider import BaseSpider | |
2 | 2 | from scrapy.http import Request |
3 | 3 | from crawler.items import CrawlerItem |
4 | 4 | import re |
5 | 5 | |
6 | -class Crawler(Spider): | |
6 | +class Crawler(BaseSpider): | |
7 | 7 | name = 'img' |
8 | 8 | allowed_domains = ['www.cs.tsinghua.edu.cn'] |
9 | 9 | start_urls = ['http://www.cs.tsinghua.edu.cn'] | ... | ... |