main.py 文件源码

python
阅读 19 收藏 0 点赞 0 评论 0

项目:PythonSpider 作者: cccyb 项目源码 文件源码
def getPage(self, url, postdata=None, headers=None):
        try:
            cookie = cookielib.CookieJar()
            opener = urllib2.build_opener(urllib2.HTTPCookieProcessor(cookie))
            if postdata is None:
                if headers is None:
                    request = urllib2.Request(url)
                else:
                    request = urllib2.Request(url, headers=headers)
            else:
                if headers is not None:
                    request = urllib2.Request(url, postdata, headers)
            page = opener.open(request)
            redirect_url = opener.open(request).geturl()  # ?????url
            soup = BeautifulSoup(page, 'html.parser')
            return page, soup, redirect_url
        # ???????
        except urllib2.URLError, e:
            if hasattr(e, "reason"):
                print u"????,????", e.reason
                return None

    # ?????
评论列表
文章目录


问题


面经


文章

微信
公众号

扫码关注公众号