def accepted(self, response):
    """Collect the submissions listed on one result page and follow paging.

    Every row after the first one of the last ``<table>`` in *response*
    contributes a ``problem_id -> submit_time`` entry to ``self.solved``,
    and that mapping is exposed as ``self.item['solved']``.  While the page
    still lists rows, the third ``//p/a`` link is requested with this
    method as its callback.

    Args:
        response: The downloaded page to parse.

    Yields:
        A ``Request`` for the follow-up page when the current page
        contained rows, then ``self.item``.

    Raises:
        IndexError: If the page has no ``<table>``, a row lacks the
            expected cells, or a follow-up is needed but fewer than three
            ``//p/a`` links exist.
    """
    sel = Selector(response)
    # Drop the first row of the last table (presumably the header row).
    rows = sel.xpath('//table')[-1].xpath('.//tr')[1:]

    # self.solved is mutated in place below, so binding it once is enough
    # and the item carries the key even when the page has no rows.
    self.item['solved'] = self.solved
    for tr in rows:
        problem_id = tr.xpath('.//td[3]/a/text()').extract()[0].strip()
        # Last text node found directly under the row's <td> cells.
        submit_time = tr.xpath('.//td/text()').extract()[-1]
        self.solved[problem_id] = submit_time

    if rows:
        # Only look up the paging link when it is needed, so a page without
        # rows does not fail on a missing link.
        # NOTE(review): index 2 is presumably the "next page" link - confirm.
        next_url = sel.xpath('//p/a/@href')[2].extract()
        yield Request(
            'http://' + self.allowed_domains[0] + '/' + next_url,
            callback=self.accepted,
        )
    yield self.item
评论列表
文章目录