excrawler.py 文件源码

python
阅读 24 收藏 0 点赞 0 评论 0

项目:ExHentaiCrawler 作者: nothinghappen 项目源码 文件源码
def doCrawlNewest(self):
    """Fetch listing pages five at a time and store entries not yet recorded.

    Starting at ``self.context['currentPage']``, five consecutive pages are
    requested concurrently through ``self.getMangaDataByPage``. The results
    are then processed in page order:

    * An entry whose ``posted`` value is less than or equal to
      ``self.context['newestPosted']`` ends the crawl: a message is logged,
      ``setConfig("app", "new_context", "")`` is called (presumably this
      clears the saved crawl context -- confirm against ``setConfig``) and
      the interpreter is asked to exit.
    * An entry whose ``posted`` value is lower than
      ``self.context['currentPosted']`` is inserted via
      ``self.db.insertEromanga`` and becomes the new ``currentPosted``.

    ``self.context['currentPage']`` is advanced by one for every page whose
    results have been fully processed.

    Raises:
        SystemExit: when an entry at or below ``newestPosted`` is reached.
            This is the only normal way out of the loop.
        Exception: anything raised by ``self.getMangaDataByPage`` in a worker
            thread is re-raised here by ``Future.result()``.
    """
    while True:
        first_page = self.context['currentPage']
        # Leaving the ``with`` block shuts the pool down and waits for every
        # submitted task, so all futures are complete once we are past it and
        # no separate wait() call is needed.
        with ThreadPoolExecutor(max_workers=5) as executor:
            futures = [
                executor.submit(self.getMangaDataByPage, page)
                for page in range(first_page, first_page + 5)
            ]
        # Consume the results in submission (page) order.
        for future in futures:
            for data in future.result():
                posted = int(data['posted'])
                # Reached an entry that is not newer than the stored newest one.
                if posted <= self.context['newestPosted']:
                    info("info","excrawler.crawlNewest","???????????? posted:" + str(data['posted']))
                    setConfig("app","new_context","")
                    # Raise SystemExit directly: the bare exit() helper is
                    # injected by the ``site`` module for interactive use and
                    # is not guaranteed to exist in every runtime.
                    raise SystemExit
                # Only store entries below the lowest ``posted`` value handled
                # so far, so entries seen again on a later page are skipped.
                if posted < self.context['currentPosted']:
                    self.db.insertEromanga(data)
                    self.context['currentPosted'] = posted
            self.context['currentPage'] += 1
评论列表
文章目录


问题


面经


文章

微信
公众号

扫码关注公众号