def parse_page(self, response):
    """Extract proxies from the table rows of a fetched page and register them.

    Every ``<tr>`` made of exactly five ``<td>`` cells is matched. The first
    match is skipped (presumably the table's header row -- confirm against
    the target page). For each remaining row a ``Proxy`` is filled from the
    first four cells (ip, port, country, anonymity) and passed to
    ``self.add_proxy``; the fifth cell is captured but not used.

    Args:
        response: object exposing the page markup as ``response.body``
            (looks like a Scrapy response -- TODO confirm). The body may be
            text or raw bytes.

    Returns:
        None. Results are delivered through ``self.add_proxy``.
    """
    # Pattern text is unchanged; re.S lets a cell's content span lines.
    row_pattern = re.compile(
        r'<tr><td>(.*?)</td><td>(.*?)</td><td>(.*?)</td>'
        r'<td>(.*?)</td><td>(.*?)</td></tr>',
        re.S)

    body = response.body
    # On Python 3 a raw body is ``bytes`` and a str pattern cannot search it.
    # On Python 2 ``bytes is str``, so this branch is skipped and the
    # original behaviour is preserved.
    if isinstance(body, bytes) and not isinstance(body, str):
        # Prefer the encoding the response declares, if any; otherwise
        # assume UTF-8. Undecodable bytes are replaced rather than raising.
        encoding = getattr(response, 'encoding', None) or 'utf-8'
        body = body.decode(encoding, 'replace')

    rows = row_pattern.findall(body)
    # rows[0] is skipped, exactly as the original ``if i >= 1`` guard did.
    for row in rows[1:]:
        proxy = Proxy()
        proxy.set_value(
            ip=row[0],
            port=row[1],
            country=row[2],
            anonymity=row[3],
            source=self.name
        )
        self.add_proxy(proxy=proxy)
评论列表
文章目录