def process_item(self, item, spider):
    """Let *item* through only the first time its ``pid`` is encountered.

    The ``pid`` value of every accepted item is recorded in
    ``self.ids_seen``; a later item carrying an already-recorded ``pid``
    is rejected.

    Args:
        item: Mapping-like object indexed by the ``'pid'`` key.
        spider: Not used by this method.

    Returns:
        The same *item* object, unchanged, when its ``pid`` is new.

    Raises:
        DropItem: If the item's ``pid`` is already in ``self.ids_seen``.
    """
    pid = item['pid']
    if pid not in self.ids_seen:
        # First sighting: remember the id and pass the item along.
        self.ids_seen.add(pid)
        return item
    raise DropItem("Duplicate item found: %s" % item)