def process_item(self, item, spider):
    """Drop items whose (title, company) pair has already been seen.

    Args:
        item: Mapping-like scraped item; must provide ``'title'`` and
            ``'company'`` keys.
        spider: The spider that produced the item (not used here).

    Returns:
        The unchanged ``item`` the first time its title/company pair is
        seen by this instance.

    Raises:
        DropItem: If an item with the same title and company has already
            been recorded in ``self.title_company``.
    """
    # Key on the pair itself rather than on the concatenated string:
    # 'ab' + 'c' and 'a' + 'bc' concatenate to the same text, which would
    # cause a distinct item to be dropped as a false duplicate.
    # NOTE(review): self.title_company is created outside this method and is
    # assumed to be a set populated only here — confirm nothing else stores
    # concatenated strings in it.
    job_key = (item['title'], item['company'])
    if job_key in self.title_company:
        # Wrap in a 1-tuple so the item is always formatted as a single value.
        raise DropItem("Duplicate item found: %s" % (item,))
    self.title_company.add(job_key)
    return item
评论列表
文章目录