def GetPg(self, code):
    """Scrape the ``type=2`` rows of a stock's Sina share-bonus page.

    Downloads the ``vISSUE_ShareBonus`` page for ``code``, serialises every
    ``<tbody>`` back to markup, splits that markup on ``_blank`` and, for
    each piece containing ``type=2``, takes the first nine attribute-less
    ``<td>`` cells as one record.

    NOTE(review): the method name and URL suggest this is the rights-issue
    ("Pg") table -- confirm against the live page.

    Args:
        code: Stock id; it is concatenated into the page URL as text.

    Returns:
        A ``pandas.DataFrame`` with one row per record, indexed by the
        record's first cell, or ``None`` if anything fails while
        downloading or parsing (best-effort contract of the original).
    """
    # NOTE(review): the original keys were mojibake placeholders ("????");
    # being duplicates they collapsed nine cells into three columns and
    # silently dropped the rest.  The names below are reconstructed from the
    # placeholder lengths (4,4,4,4,3,5,5,5,5) and the column headers of
    # Sina's rights-issue table -- confirm before relying on them.
    # Written as escapes so the file needs no source-encoding declaration.
    columns = (
        u"\u516c\u544a\u65e5\u671f",        # announcement date
        u"\u914d\u80a1\u65b9\u6848",        # rights-issue plan
        u"\u914d\u80a1\u4ef7\u683c",        # rights-issue price
        u"\u57fa\u51c6\u80a1\u672c",        # base share capital
        u"\u9664\u6743\u65e5",              # ex-rights date
        u"\u80a1\u6743\u767b\u8bb0\u65e5",  # record date
        u"\u7f34\u6b3e\u8d77\u59cb\u65e5",  # payment start date
        u"\u7f34\u6b3e\u7ec8\u6b62\u65e5",  # payment end date
        u"\u914d\u80a1\u4e0a\u5e02\u65e5",  # listing date of the new shares
    )
    cell_pattern = re.compile(r'<td>(.+?)</td>')

    try:
        url = ("http://money.finance.sina.com.cn/corp/go.php/"
               "vISSUE_ShareBonus/stockid/" + code + ".phtml")
        # urllib.urlopen is the Python 2 API, kept as in the original.
        response = urllib.urlopen(url)
        try:
            raw_page = response.read()
        finally:
            # Release the connection even when reading fails.
            response.close()

        soup = BeautifulSoup(Tools().smartCode(raw_page), "html.parser")

        rows = {}
        for tbody in soup.find_all('tbody'):
            for chunk in str(tbody).split('_blank'):
                if "type=2" not in chunk:
                    continue
                cells = cell_pattern.findall(chunk)
                # Explicit indexing on purpose: a chunk with fewer than nine
                # cells raises IndexError and the whole call yields None, as
                # before, instead of emitting a partially filled record.
                rows[cells[0]] = {
                    name: cells[position]
                    for position, name in enumerate(columns)
                }
        return pandas.DataFrame.from_dict(rows, orient="index")
    except Exception:
        # Best-effort: any download/parse problem is reported as None.
        # Unlike a bare ``except:``, this lets KeyboardInterrupt and
        # SystemExit propagate.
        return None
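# [scraped page navigation, not code] Comment list
# [scraped page navigation, not code] Article table of contents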