def simple_parse_to_segments(html, debug=False, **kwargs):
    """Run an HTML fragment through ``simpleHTMLParser`` and return its result.

    The fragment is first passed through ``fix_urls`` and then enclosed in
    an ``<html>`` element before being handed to the parser.

    Args:
        html: HTML fragment to parse.
        debug: Forwarded to the ``simpleHTMLParser`` constructor.
        **kwargs: Accepted for call compatibility; not used here.

    Returns:
        Whatever ``simpleHTMLParser.feed`` returns for the wrapped markup
        (presumably the parsed segments, going by this function's name --
        confirm against the parser class).
    """
    # html.parser seems to ignore the final entityref unless the markup is
    # closed by an enclosing <html> element, so wrap the fragment first.
    wrapped_markup = '<html>' + fix_urls(html) + '</html>'
    return simpleHTMLParser(debug).feed(wrapped_markup)
评论列表
文章目录