def lrc2dict(lrc):
    """Strip the bracketed tags from LRC text and return the plain lyric.

    Despite the name, no dict is built: the result is a single string.
    Every ``[...]`` tag found in ``lrc`` is removed, together with all
    carriage returns, newlines and a fixed list of filler tokens, and
    HTML entities in what remains are decoded. The decoded text is also
    echoed to stdout before it is returned.

    Args:
        lrc: LRC-formatted lyric text.

    Returns:
        The cleaned, entity-decoded lyric as one line, or ``''`` when
        ``lrc`` contains no ``[...]`` tag at all.
    """
    # HTMLParser.unescape() was removed in Python 3.9; prefer html.unescape
    # and fall back to the Python 2 parser so the block runs on both.
    try:
        from html import unescape
    except ImportError:  # Python 2
        from HTMLParser import HTMLParser
        unescape = HTMLParser().unescape

    time_stamps = re.findall(r'\[[^\]]+\]', lrc)
    if not time_stamps:
        # Text without any bracketed tag yields an empty result.
        return ''

    # NOTE(review): the '?' runs below look like mis-encoded non-ASCII
    # literals (presumably credit labels in the original source) -- confirm
    # against the original file. They are kept byte-for-byte and in the
    # original order so the current behaviour is unchanged.
    fillers = (
        '\r', '\n',
        '????', '???', '?????', '???', '??', '??', '??', '??',
        '???', '??', '????', '???', '??', '???',
    )

    lyric = lrc
    for tplus in time_stamps:
        # tplus is one tag including its brackets, e.g. "[02:31.79]".
        lyric = lyric.replace(tplus, '')
        # The fillers are re-applied after each tag removal because deleting
        # a tag can join text on either side into a new filler match.
        for token in fillers:
            lyric = lyric.replace(token, '')

    # Decode entities once and reuse the result for both echo and return.
    text = unescape(lyric)
    # Echo retained from the original; the parenthesised form prints the
    # same output under Python 2 and Python 3.
    print(text)
    return text
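# Comment list (web-page navigation text, not part of the code)
# Article table of contents (web-page navigation text, not part of the code)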