def _clean_hujiang_comment(comment):
    """Reduce a raw ``Comment`` HTML fragment to a comma-separated string.

    Only the ``<br/>``-delimited segments that contain no Latin letters are
    kept; parenthesised asides are then removed from the joined text. The
    result is an empty string when no segment matches.
    """
    segments = re.findall("<br/>([^a-zA-Z]+)<br/>", comment)
    text = ", ".join(segments)
    # NOTE(review): the delimiters of this pattern were lost to an encoding
    # error (they had become literal "?"). They are assumed to be fullwidth
    # parentheses, mirroring the ASCII pattern below -- TODO confirm.
    text = re.sub(u"\uff08.+?\uff09", "", text)
    text = re.sub(r"\(.+?\)", "", text)
    # TODO(review): a third substitution followed here, but its pattern was
    # corrupted to "?+?", which is not a valid regular expression (re.error:
    # nothing to repeat). It is omitted until the intended character is known.
    return text


def query_hujiang(key_word):
    """Look up ``key_word`` through the Hujiang mobile Japanese dictionary API.

    Args:
        key_word: The word to look up. Text is UTF-8 encoded before being
            percent-quoted into the request URL.

    Returns:
        The list decoded from the JSON response, with each entry's
        ``Comment`` reduced to plain text and the square brackets stripped
        from its ``PronounceJp``. An empty list is returned when
        ``key_word`` is empty, when the body is not valid JSON, or when the
        decoded JSON is not a list.

    Raises:
        Exceptions raised by ``requests.get`` itself (connection errors,
        timeouts) are not caught here and propagate to the caller.
    """
    if not key_word:
        return []

    # Resolve quote() at call time so the function runs on Python 2 and 3.
    try:
        from urllib import quote  # Python 2
    except ImportError:
        from urllib.parse import quote  # Python 3

    # Python 2's quote() fails on non-ASCII unicode input, so always hand it
    # UTF-8 bytes (accepted by quote() on both major versions).
    if not isinstance(key_word, bytes):
        key_word = key_word.encode("utf-8")

    headers = {
        'User-Agent': 'Mozilla/5.0 (iPhone; CPU iPhone OS 9_1 like Mac OS X) AppleWebKit/601.1.46 (KHTML, like Gecko) Version/9.0 Mobile/13B143 Safari/601.1',
        'Accept-Encoding': 'gzip, deflate, sdch',
    }
    url = "https://m.hujiang.com/d/dict_jp_api.ashx?type=jc&w={0}".format(quote(key_word))

    # SECURITY NOTE(review): verify=False disables TLS certificate checking
    # and is kept only to preserve existing behaviour; enable verification if
    # the endpoint's certificate allows it.
    # The timeout prevents an unresponsive server from blocking forever.
    response = requests.get(url, headers=headers, verify=False, timeout=10)

    try:
        defines = response.json()
    except ValueError:
        # The body was not valid JSON.
        return []
    if not isinstance(defines, list):
        return []

    for entry in defines:
        if not isinstance(entry, dict):
            continue
        entry["Comment"] = _clean_hujiang_comment(entry.get("Comment") or u"")
        entry["PronounceJp"] = re.sub(r"\[|\]", "", entry.get("PronounceJp") or u"")
    return defines
### static files
# Comment list
# Article table of contents