def process_vcode(self, response):
    """Recognise the captcha shown on ``response`` and post the answer back.

    The captcha image URL is read from the page's form, handed to
    ``recognize_url`` and the recognised text is validated against the
    en_US enchant dictionary.  When the text is a dictionary word, a form
    containing the solution, the captcha id (everything after the first
    ``id=`` in ``response.url``) and the original URL is POSTed to
    ``response.url``.  Otherwise ``'wrong vcode'`` is printed and nothing
    is sent.

    Args:
        response: page response exposing ``css()``, ``url`` and ``headers``
            (presumably a Scrapy ``Response`` -- confirm against caller).

    Returns:
        None.
    """
    # Imported locally, as in the original, so the module itself does not
    # require these packages unless a captcha page is actually handled.
    import enchant
    import requests

    form_css = '#content > div > div.article > form'

    vcode_url = response.css(form_css + ' > img::attr(src)').extract_first()
    vcode = recognize_url(vcode_url)

    # Validate the recognised text itself; an empty/None result can never be
    # a correct answer, so reject it before consulting the dictionary.
    if not vcode or not enchant.Dict("en_US").check(vcode):
        print('wrong vcode')
        return

    # extract_first() yields None (it does not raise) when the hidden input
    # is absent, so the fallback has to be applied with ``or``.
    original_url = response.css(
        form_css + ' > input[type="hidden"]:nth-child(8)::attr(value)'
    ).extract_first() or (
        'https://movie.douban.com/search/%E6%B0%B8%E4%BD%9C%E5%8D%9A%E7%BE%8E'
    )

    # partition() gives an empty id when 'id=' is missing, instead of the
    # arbitrary url[2:] slice that find() == -1 would produce.
    vcode_id = response.url.partition('id=')[2]

    frmdata = {
        "captcha-solution": str(vcode),
        "captcha-id": vcode_id,
        "original-url": str(original_url),
    }
    # NOTE(review): these look like the *response* headers being replayed as
    # request headers -- confirm whether the request's headers were intended.
    requests.post(url=response.url, data=frmdata, headers=response.headers)
评论列表
文章目录