def process_item(self, item, spider):
if item['site'] == 'Qua':
if item['company']:
item['company'] = wash(item['company'])
if item['flight_time']:
item['flight_time'] = wash(item['flight_time'])
if item['airports']:
item['airports'] = wash(item['airports'])
if item['passtime']:
item['passtime'] = wash(item['passtime'])
if item['price']:
item['price'] = wash(item['price'])
for data in item:
if not data:
raise DropItem("Missing data!")
self.collection.insert(dict(item))
log.msg("Question added to MongoDB database!",
level=log.DEBUG, spider=spider)
elif item['site'] == 'Ctrip':
self.collection.insert(dict(item))
log.msg("Question added to MongoDB database!",
level=log.DEBUG, spider=spider)
return item
评论列表
文章目录