def __init__(self, url):
    """Initialise the spider with a single seed URL and two link extractors.

    Args:
        url: Address stored as the only entry of ``start_urls``.
    """
    super(Spider, self).__init__()

    # Both extractors are built with canonicalisation switched off.
    extractor_options = {'canonicalize': False}

    self.start_urls = [url]

    # Extractor built with no restrictions other than the shared options.
    self.le = LinkExtractor(**extractor_options)

    # Extractor limited to <a href="..."> and given an empty
    # deny_extensions list.
    # NOTE(review): presumably the empty list stops links from being
    # filtered by file extension - confirm against the LinkExtractor docs.
    self.files_le = LinkExtractor(
        tags=['a'],
        attrs=['href'],
        deny_extensions=[],
        **extractor_options
    )
评论列表
文章目录