def get_data(self):
    """Fetch ``self.url`` and collect the schedule entries found on the page.

    This is a generator-style coroutine body: it yields the future returned
    by ``AsyncHTTPClient.fetch`` and hands its result back to the caller by
    raising ``gen.Return``.

    Returns (via ``gen.Return``):
        ``None`` when the response carries an error; otherwise a list of
        dicts, one per matched anchor, with the keys ``'weekday'`` (int,
        0-6), ``'url'`` (the anchor's ``href``), ``'title'`` and
        ``'update_time'`` (a ``datetime.time``).

    Anchors whose text is missing or does not match ``self.TIME_PATTERN``
    are skipped, so one malformed entry does not abort the whole scrape.
    """
    content = yield httpclient.AsyncHTTPClient().fetch(self.url)
    # NOTE(review): depending on the Tornado version / ``raise_error``
    # setting, ``fetch`` may raise instead of returning a response with
    # ``error`` set -- confirm this branch is reachable.
    if content.error:
        raise gen.Return(None)

    root = html.fromstring(content.body.decode('utf-8'))
    bangumi_info = []
    # The page exposes one tab per day, with ids tab_100895_1 .. tab_100895_7.
    for i in range(1, 8):
        # Tab 7 is stored as weekday 0; tabs 1-6 keep their own number.
        weekday = i % 7
        anchors = root.xpath(
            '//*[@id="tab_100895_%d"]//*[@class="v-meta-title"]/a' % i)
        for e in anchors:
            if e.text is None:
                # No direct text node on the anchor, nothing to parse.
                continue
            matched = self.TIME_PATTERN.match(e.text)
            if matched is None:
                # Text is not in the expected "title + time" shape.
                continue
            title, hour, minute = matched.groups()
            update_time = datetime.time(int(hour), int(minute))
            bangumi_info.append({
                'weekday': weekday,
                'url': e.attrib['href'],
                'title': title,
                'update_time': update_time,
            })
    raise gen.Return(bangumi_info)
评论列表
文章目录