def prepare_url(self):
    """Split ``self.raw_base_url`` into a base URL and its last path segment.

    The URL path is cut at its final ``/``. Everything before the cut is
    re-assembled with the scheme and network location into
    ``self.base_url``; params, query string and fragment are discarded.
    Everything after the cut is stored unchanged in ``self.first_item``
    (an empty string when the path is empty or ends with ``/``).

    If the last segment ends with ``.php``, ``.asp`` or ``.aspx``
    (compared case-insensitively), ``self.site_lang`` is set to ``'php'``,
    ``'asp'`` or ``'aspx'``; otherwise it is left untouched.

    Returns:
        None. Results are written to ``self.base_url``,
        ``self.first_item`` and, when an extension matches,
        ``self.site_lang``.
    """
    parsed = urlparse(self.raw_base_url)

    # rpartition always yields a 3-tuple, so a path without any '/' needs no
    # special case: the whole path becomes the last segment and the base
    # path is empty.
    base_path, _, last_segment = parsed.path.rpartition('/')
    base_url = urlunparse((parsed.scheme, parsed.netloc, base_path, '', '', ''))

    # Match on a lowercased copy so 'Index.PHP' is recognised too, while the
    # stored first_item keeps the casing the caller supplied.
    lowered_segment = last_segment.lower()
    for extension in ('.php', '.asp', '.aspx'):
        if lowered_segment.endswith(extension):
            self.site_lang = extension[1:]
            break

    # NOTE(review): self.site_lang is read here even when no extension
    # matched, so it is presumably initialised (likely to '') before this
    # method runs -- confirm against the constructor.
    if self.site_lang != '':
        logger.info('site_lang: %s', self.site_lang)

    self.base_url = base_url
    self.first_item = last_segment
    logger.info('base_url: %s', base_url)
    logger.info('first_item: %s', last_segment)
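# 评论列表 (comment list) -- web page navigation text captured with the snippet, not code
# 文章目录 (article table of contents) -- web page navigation text captured with the snippet, not code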