def __init__(self, feed_file=None, feed_title=None, feed_link=None, feed_description=None,
             crawler_settings=None):
    """Create the crawler, a stub spider and the item processor for this context.

    :param feed_file: stored under ``FEED_FILE`` when truthy.
    :param feed_title: stored under ``FEED_TITLE`` when truthy.
    :param feed_link: stored under ``FEED_LINK`` when truthy.
    :param feed_description: stored under ``FEED_DESCRIPTION`` when truthy.
    :param crawler_settings: mapping of crawler settings used as the base;
        when it is ``None`` or empty, ``self.default_settings`` is used
        instead. The mapping passed in is copied and never modified.
    """
    # Always work on a private dict: the feed overrides below must not leak
    # back into the caller's mapping (or into the shared class defaults).
    # NOTE(review): assumes crawler_settings is dict-convertible -- confirm.
    settings = dict(crawler_settings if crawler_settings else self.default_settings)

    feed_overrides = (
        ('FEED_FILE', feed_file),
        ('FEED_TITLE', feed_title),
        ('FEED_LINK', feed_link),
        ('FEED_DESCRIPTION', feed_description),
    )
    for key, value in feed_overrides:
        # Falsy arguments leave whatever the base settings already contain.
        if value:
            settings[key] = value

    self.crawler = get_crawler(settings_dict=settings)
    self.spider = scrapy.Spider.from_crawler(self.crawler, 'example.com')
    # Replace parse with a stub that yields nothing for any response.
    self.spider.parse = lambda response: ()

    # ITEM_PROCESSOR may be missing/falsy (use the default manager), a string
    # (resolved with load_object), or any other object, which is used as is.
    item_processor = settings.get('ITEM_PROCESSOR')
    if not item_processor:
        item_processor = RaisedItemPipelineManager
    elif isinstance(item_processor, six.string_types):
        item_processor = load_object(item_processor)
    self.ipm = item_processor.from_crawler(self.crawler)
评论列表
文章目录