diff --git a/Chapter05_Scrapy/wikiSpider/wikiSpider/articleItems.py b/Chapter05_Scrapy/wikiSpider/wikiSpider/articleItems.py index 0ccd9c0..d322fed 100644 --- a/Chapter05_Scrapy/wikiSpider/wikiSpider/articleItems.py +++ b/Chapter05_Scrapy/wikiSpider/wikiSpider/articleItems.py @@ -1,5 +1,5 @@ -from scrapy.contrib.linkextractors import LinkExtractor -from scrapy.contrib.spiders import CrawlSpider, Rule +from scrapy.linkextractors import LinkExtractor +from scrapy.spiders import CrawlSpider, Rule from wikiSpider.items import Article class ArticleSpider(CrawlSpider): @@ -17,4 +17,4 @@ def parse_items(self, response): article['text'] = response.xpath('//div[@id="mw-content-text"]//text()').extract() lastUpdated = response.css('li#footer-info-lastmod::text').extract_first() article['lastUpdated'] = lastUpdated.replace('This page was last edited on ', '') - return article \ No newline at end of file + return article