downloadmiddle.py 文件源码

python
阅读 29 收藏 0 点赞 0 评论 0

项目:Spider 作者: poluo 项目源码 文件源码
def process_vcode(self, response):
    """Recognise the captcha on a verification page and submit its form.

    The captcha image URL is read from the page, handed to
    ``recognize_url`` and the recognised text is accepted only when it is
    an English dictionary word. On success the solution, the captcha id
    taken from ``response.url`` and the original URL are POSTed back to
    ``response.url``.

    Args:
        response: Object exposing ``css()``, ``url`` and ``headers``
            (looks like a Scrapy response -- confirm against the caller).

    Returns:
        None. The outcome of the POST is not inspected.
    """
    # Kept as function-scope imports, as in the original, so the module
    # still imports when these optional packages are missing.
    import enchant
    import requests

    vcode_url = response.css('#content > div > div.article > form > img::attr(src)').extract_first()
    vcode = recognize_url(vcode_url)

    # Validate the recognised text itself (the old code checked the literal
    # word "enchant", so the rejection branch could never run). The empty
    # case is tested first because the spell checker rejects empty strings.
    word = str(vcode).strip() if vcode else ''
    if not word or not enchant.Dict("en_US").check(word):
        print('wrong vcode')
        return

    # Everything after the first 'id=' is the captcha id, exactly as before;
    # partition() lets us detect a URL that carries no id at all instead of
    # silently slicing from a bogus index.
    _, marker, vcode_id = response.url.partition('id=')
    if not marker:
        print('captcha id not found in url')
        return

    # extract_first() yields None when nothing matches rather than raising,
    # so the fallback has to be chosen explicitly.
    original_url = response.css(
        '#content > div > div.article > form > input[type="hidden"]:nth-child(8)::attr(value)'
    ).extract_first() or 'https://movie.douban.com/search/%E6%B0%B8%E4%BD%9C%E5%8D%9A%E7%BE%8E'

    # Send the real values: "".format(x) always evaluates to "".
    frmdata = {
        "captcha-solution": word,
        "captcha-id": vcode_id,
        "original-url": original_url,
    }
    # NOTE(review): response.headers are the *response* headers; the request
    # headers were presumably intended, and no timeout is set on this
    # blocking call -- confirm both before relying on this in production.
    requests.post(url=response.url, data=frmdata, headers=response.headers)
评论列表
文章目录


问题


面经


文章

微信
公众号

扫码关注公众号