def run(self):
    """Stream every comment to a background bulk-index process.

    The document total is read from ``self.get_total()``; when that returns
    a falsy value a warning is printed and a fixed estimate of 5,000,000 is
    stored in ``self.total`` instead, so progress percentages can still be
    computed.

    Each comment yielded by ``self.iter_comments()`` is counted in
    ``self.stats['fetched']`` and put on a ``multiprocessing.Queue`` that is
    passed to ``self.bulk_index`` running in a child process. A progress
    line is printed every 500 fetched comments.

    Returns:
        The value of ``self.stats['fetched']`` once iteration has finished
        and the child process has been joined.
    """
    # Check the real total *before* applying the fallback. The previous
    # ``get_total() or 5000000`` form made ``self.total`` always truthy, so
    # the warning below could never be printed.
    self.total = self.get_total()
    if not self.total:
        print('error loading document total; using estimate')
        self.total = 5000000

    index_queue = multiprocessing.Queue()
    bulk_index_process = multiprocessing.Process(
        target=self.bulk_index, args=(index_queue,),
    )
    bulk_index_process.start()
    try:
        for comment in self.iter_comments():
            self.stats['fetched'] += 1
            if not self.stats['fetched'] % 500:
                print('fetched %s/%s\t%s%%\t%s' % (
                    self.stats['fetched'], self.total,
                    int(self.stats['fetched'] / self.total * 100),
                    comment['date_disseminated']))
            index_queue.put(comment)
    finally:
        # ``None`` marks the end of the stream; presumably ``bulk_index``
        # stops consuming when it sees it (confirm against bulk_index).
        # Sending it and joining in ``finally`` keeps the child process from
        # being left waiting on the queue if fetching raises part-way.
        index_queue.put(None)
        bulk_index_process.join()
    return self.stats['fetched']
评论列表
文章目录