GetFans_Oracle.py 文件源码

python
阅读 29 收藏 0 点赞 0 评论 0

项目:danmu-bilibili 作者: saberxxy 项目源码 文件源码
def getSoup(start, stop):
    """Scrape and store fan data for every bilibili uid in ``[start, stop]``.

    For each uid the user's space page is rendered with PhantomJS and parsed
    with BeautifulSoup; the username is extracted by ``getInfo``, the fan
    uids and fan count come from ``GetFansUid(uid).get_uids()``, and the
    record is handed to ``saveData``.

    A failure on one uid is reported on stdout and that uid is skipped; the
    remaining uids up to and including ``stop`` are still processed. The
    range is never extended past ``stop``.

    Args:
        start: First uid to process (inclusive).
        stop: Last uid to process (inclusive).

    Returns:
        None.
    """
    for number in range(start, stop + 1):
        # Handle errors per uid instead of recursing: recursion grew the call
        # stack on every failure and also pushed the upper bound past ``stop``.
        try:
            content = _fetch_space_page(number)
            soup = BeautifulSoup(content, 'lxml')
            username = getInfo(soup)
            uid = number  # the loop counter is the uid itself
            get_fans_uid = GetFansUid(number)
            fansuid, fansnumber = get_fans_uid.get_uids()

            saveData(uid, username, fansnumber, fansuid)
        except Exception as exc:
            # Best-effort crawl: report which uid failed and move on.
            print("get page error", number, exc)


def _fetch_space_page(uid):
    """Return the PhantomJS-rendered page source of the space page for *uid*."""
    url = 'http://space.bilibili.com/' + str(uid) + '/#!/'
    dcap = dict(DesiredCapabilities.PHANTOMJS)
    dcap["phantomjs.page.settings.userAgent"] = (
        "Mozilla/5.0 (Windows NT 6.1; WOW64; rv:50.0) Gecko/20100101 Firefox/50.0"
    )
    dcap["phantomjs.page.settings.loadImages"] = False  # do not load images
    driver = webdriver.PhantomJS(executable_path='G:\\Anaconda3\\phantomjs\\bin\\phantomjs.exe',
                                 desired_capabilities=dcap)
    try:
        driver.get(url)
        return driver.page_source
    finally:
        # Always shut the browser process down, even when loading fails,
        # so failed uids do not leave orphaned PhantomJS instances behind.
        driver.quit()


# ????
评论列表
文章目录


问题


面经


文章

微信
公众号

扫码关注公众号