def process_item(self, item, spider):
    """Let an item through only the first time its 'link' value is seen.

    Args:
        item: Mapping-like object; its ``'link'`` entry is the
            de-duplication key.
        spider: Not used by this method.

    Returns:
        The same ``item`` object, unchanged, when its link has not been
        recorded in ``self.ids_seen`` before.

    Raises:
        DropItem: When the item's link is already in ``self.ids_seen``.
    """
    link = item['link']
    if link not in self.ids_seen:
        # First sighting: remember the link so later repeats are rejected.
        self.ids_seen.add(link)
        return item
    raise DropItem("Duplicate item found:%s" % item)