Mmrz-Sync.py 文件源码

python
阅读 18 收藏 0 点赞 0 评论 0

项目:Mmrz-Sync 作者: zhanglintc 项目源码 文件源码
def query_hujiang(key_word):
    """Look up a word via the Hujiang Japanese dictionary API and tidy the result.

    The URL-quoted ``key_word`` is sent to the ``dict_jp_api.ashx`` endpoint on
    m.hujiang.com. Each entry of the decoded JSON is then rewritten in place:

    * ``"Comment"`` becomes the ``<br/>``-delimited fragments that contain no
      ASCII letters, joined with ``", "``, after the clean-up patterns in the
      body (ASCII-parenthesised spans among them) have been removed.
    * ``"PronounceJp"`` loses its square brackets.

    Args:
        key_word: Word to look up. A falsy value returns ``[]`` immediately,
            without any network access.

    Returns:
        The decoded JSON payload (indexed here as a sequence of dicts with
        ``"Comment"`` and ``"PronounceJp"`` keys) with those two fields
        rewritten, or ``[]`` when ``key_word`` is falsy or the response body
        cannot be decoded as JSON.

    Raises:
        Anything raised by ``requests.get`` itself is not caught here and
        propagates to the caller.
    """
    if not key_word:
        return []

    headers = {
        'User-Agent': 'Mozilla/5.0 (iPhone; CPU iPhone OS 9_1 like Mac OS X) AppleWebKit/601.1.46 (KHTML, like Gecko) Version/9.0 Mobile/13B143 Safari/601.1',
        'Accept-Encoding': 'gzip, deflate, sdch',
    }

    url = "https://m.hujiang.com/d/dict_jp_api.ashx?type=jc&w={0}".format(urllib.quote(key_word))

    proxies = {}
    # NOTE(review): verify=False disables TLS certificate verification, and no
    # timeout is passed, so a stalled server blocks the caller indefinitely.
    # Both are kept as-is to preserve existing behaviour; confirm they are intended.
    response = requests.get(url, headers=headers, verify=False, proxies=proxies)
    try:
        defines = response.json()
    except ValueError:
        # JSON decoding failures are ValueError subclasses; a non-JSON body is
        # treated as "no results". Unlike a bare ``except``, this lets
        # KeyboardInterrupt / SystemExit through.
        return []

    # Compile once instead of re-resolving the patterns for every entry.
    fragment_re = re.compile(r"<br/>([^a-zA-Z]+)<br/>")
    bracket_re = re.compile(r"[\[\]]")
    # NOTE(review): the "?" in the first and third patterns looks like a
    # non-ASCII character that was lost in an encoding conversion (the first is
    # probably a full-width counterpart of the ASCII parentheses next to it) --
    # restore both from the upstream source. The third pattern was "?+?", which
    # is not a valid regex and raised re.error on the first entry; it now
    # matches a literal "?" so the function no longer crashes.
    noise_res = (
        re.compile(r"\?.+?\?"),
        re.compile(r"\(.+?\)"),
        re.compile(r"\?+?"),
    )

    for define in defines:
        # Keep only the fragments between <br/> tags that have no ASCII letters.
        text = ", ".join(fragment_re.findall(define["Comment"]))

        # Strip the unwanted spans, in the same order as before.
        for noise_re in noise_res:
            text = noise_re.sub("", text)

        define["Comment"] = text
        define["PronounceJp"] = bracket_re.sub("", define["PronounceJp"])

    return defines

### static files
评论列表
文章目录


问题


面经


文章

微信
公众号

扫码关注公众号