def __init__(self, conf=None, conn=None):
    """Store conf/conn, define the start URL and crawl rules, then init the parent.

    Args:
        conf: Stored unchanged on the instance as ``self.conf``.
        conn: Stored unchanged on the instance as ``self.conn``.
    """
    self.conf, self.conn = conf, conn

    # Single entry point for the crawl.
    self.start_urls = [
        'http://www.takedaclinicaltrials.com/browse/?protocol_id=',
    ]

    # Links matching the summary pattern are passed to parse_record.
    summary_rule = Rule(
        LinkExtractor(allow=r'browse/summary/'),
        callback=parse_record,
    )
    # Links matching the broader pattern get a rule with no callback.
    browse_rule = Rule(LinkExtractor(allow=r'browse'))
    self.rules = [summary_rule, browse_rule]

    # NOTE(review): the parent initialiser is called last, after self.rules
    # is assigned; presumably the parent reads the rules during init, so
    # keep this ordering. Confirm against the base class.
    super(Spider, self).__init__()
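# NOTE: web-page navigation residue captured with the snippet, not part of
# the spider code: "Comment list" / "Article table of contents".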