mian3.py 文件源码-python代码片段

mian3.py 文件源码

python

阅读 17 收藏 0 点赞 0 评论 0

项目：ProxyIPCrawler 作者: uilliu 项目源码文件源码

def caiji2(self):
    """Scrape proxy addresses from haodailiip.com into ``proxy.txt``.

    Fetches listing pages 1 through 19 under
    ``http://www.haodailiip.com/guonei/``, locates the table with CSS class
    ``proxy_table`` on each page, and for up to 30 data rows (the first
    ``<tr>`` is skipped, presumably a header row) writes one line of the form
    ``http=<ip>:<port>`` to ``proxy.txt``, echoing the same line to stdout.
    The output file is truncated on every call.

    Relies on ``requests``, ``BeautifulSoup`` and ``time`` being available in
    the enclosing module. Network errors raised by ``requests.get`` are not
    caught and propagate to the caller.
    """
    base_url = 'http://www.haodailiip.com/guonei/'
    # The context manager guarantees the file is flushed and closed even if a
    # request or parse step raises; the original only read the ``closed``
    # attribute and never actually called ``close()``.
    with open('proxy.txt', 'w') as of:
        for page in range(1, 20):
            page_url = base_url + str(page)
            print(u"????" + page_url)
            html = requests.get(page_url).text
            bs = BeautifulSoup(html)
            table = bs.find('table', {"class": "proxy_table"})
            if table is None:
                # Page layout changed or the request was blocked: skip this
                # page instead of crashing with AttributeError.
                print('no proxy_table found on ' + page_url)
            else:
                # Slice instead of indexing 1..30 so that short tables do not
                # raise IndexError; row 0 is skipped as before.
                for row in table.findAll('tr')[1:31]:
                    td = row.findAll('td')
                    if len(td) < 2:
                        # Not a data row (e.g. a spacer or colspan row).
                        continue
                    proxy_ip = td[0].text.strip()
                    proxy_port = td[1].text.strip()
                    line = 'http=%s:%s\n' % (proxy_ip, proxy_port)
                    of.write(line)
                    print(line)
            # Pause between page requests, as the original did.
            time.sleep(2)