def _parse_url(self, url):
    """
    Download and parse a URL, returning the root element of the document.

    The content is obtained through ``self._read_url_as_StringIO(url)`` and
    handed to ``lxml.html.parse``.

    Parameters
    ----------
    url : str
        Address of the document to fetch and parse.

    Returns
    -------
    The object returned by ``getroot()`` on the parsed document.

    Raises
    ------
    ImportError
        If ``lxml`` cannot be imported.
    RemoteDataError
        If the parsed document has no root element.
    """
    # lxml is imported lazily so that it is only required when this
    # method is actually used.
    try:
        from lxml.html import parse
    except ImportError:  # pragma: no cover
        raise ImportError("Please install lxml if you want to use the "
                          "{0!r} class".format(self.__class__.__name__))
    doc = parse(self._read_url_as_StringIO(url))
    root = doc.getroot()
    if root is None:  # pragma: no cover
        # Note the trailing space before the line break: adjacent string
        # literals are concatenated verbatim, without any separator.
        raise RemoteDataError("Parsed URL {0!r} has no root "
                              "element".format(url))
    return root
评论列表
文章目录