問題描述:
執行 scrapy crawl jianshu 時拋出 ImportError:“ImportError: cannot import name jianshuItem”
[[email protected] jianshu]# scrapy crawl jianshu
Traceback (most recent call last):
File "/usr/bin/scrapy", line 11, in <module>
sys.exit(execute())
File "/usr/lib64/python2.7/site-packages/scrapy/cmdline.py", line 149, in execute
cmd.crawler_process = CrawlerProcess(settings)
File "/usr/lib64/python2.7/site-packages/scrapy/crawler.py", line 249, in __init__
super(CrawlerProcess, self).__init__(settings)
File "/usr/lib64/python2.7/site-packages/scrapy/crawler.py", line 137, in __init__
self.spider_loader = _get_spider_loader(settings)
File "/usr/lib64/python2.7/site-packages/scrapy/crawler.py", line 336, in _get_spider_loader
return loader_cls.from_settings(settings.frozencopy())
File "/usr/lib64/python2.7/site-packages/scrapy/spiderloader.py", line 61, in from_settings
return cls(settings)
File "/usr/lib64/python2.7/site-packages/scrapy/spiderloader.py", line 25, in __init__
self._load_all_spiders()
File "/usr/lib64/python2.7/site-packages/scrapy/spiderloader.py", line 47, in _load_all_spiders
for module in walk_modules(name):
File "/usr/lib64/python2.7/site-packages/scrapy/utils/misc.py", line 71, in walk_modules
submod = import_module(fullpath)
File "/usr/lib64/python2.7/importlib/__init__.py", line 37, in import_module
__import__(name)
File "/home/BS/scrapy/jianshu/jianshu/spiders/jianshu_Spider.py", line 2, in <module>
from jianshu.items import jianshuItem
ImportError: cannot import name jianshuItem
解決問題,過程如下:
[[email protected] jianshu]# cat items.py
# -*- coding: utf-8 -*-
# Define here the models for your scraped items
#
# See documentation in:
# https://doc.scrapy.org/en/latest/topics/items.html
import scrapy
class JianshuItem(scrapy.Item):
    """Item holding the fields collected for one scraped Jianshu article."""

    # Descriptive fields of the article.
    title = scrapy.Field()
    url = scrapy.Field()
    author = scrapy.Field()

    # Counter-style fields (names kept as-is; presumably read / comment /
    # like counts -- confirm against the spider that fills them).
    readNum = scrapy.Field()
    commentNum = scrapy.Field()
    likeNum = scrapy.Field()
~
~
"items.py" 18L, 420C written
[[email protected] spiders]# vi jianshu_Spider.py
import scrapy
from jianshu.items import JianshuItem
class jianshu_spider(scrapy.Spider):
    """Spider that scrapes article entries from the Jianshu monthly-top page.

    For every article ``<li>`` found in the listing, one ``JianshuItem`` is
    yielded with its ``title``, ``url`` and ``author`` fields filled in.
    """

    name = 'jianshu'
    allowed_domains = ['www.jianshu.com']
    start_urls = ['http://www.jianshu.com/top/monthly']

    def parse(self, response):
        """Yield one ``JianshuItem`` per article found in ``response``.

        :param response: the downloaded page for one of ``start_urls``.
        :returns: a generator of ``JianshuItem`` objects; each field holds
            the list returned by ``.extract()``.
        """
        # Query the response directly: ``Selector`` is not imported in this
        # module, and the XPath result must be kept so the loop below has
        # something to iterate over.
        articles = response.xpath(
            '//ul[@class="article-list thumbnails"]/li')
        for article in articles:
            # Build a fresh item per article; re-yielding a single shared
            # instance would make every result point at the same object.
            item = JianshuItem()
            # The leading "." keeps each XPath relative to this <li>; a bare
            # "//" would match across the whole document on every iteration.
            item['title'] = article.xpath('.//div/h4/a/text()').extract()
            item['url'] = article.xpath('.//div/h4/a/@href').extract()
            item['author'] = article.xpath('.//div/p/a/text()').extract()
            yield item
~
~
~
~
~
"jianshu_Spider.py" 21L, 625C written
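解決思路:
檢查 xx_spider.py 中的導入語句:from 項目名.items import <items.py 中定義的 class 名字>。導入的名字必須與 items.py 中 class 的名字完全一致(區分大小寫);scrapy startproject 預設生成的 class 名字為「項目名首字母大寫 + Item」。
如項目名為 jianshu,items.py 中 class 的名字為 JianshuItem,則此處應為:from jianshu.items import JianshuItem;若寫成 jianshuItem(首字母小寫),將會報出如上錯誤。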