def get_pages(query, timeout=10):
    """Search Wikipedia for *query* and return the hits or a page summary.

    The query is percent-encoded, appended to ``SEARCH_URL`` and fetched.
    If the response is a search-results page (its ``<title>`` contains
    "search" and it has a ``ul.mw-search-results`` list), the hits are
    returned. Otherwise the call is delegated to ``wikipedia.summary``.

    Args:
        query: Text to search for. Converted with ``str()`` before use.
        timeout: Seconds to wait for the HTTP response. ``requests`` waits
            indefinitely when no timeout is given, so one is always passed.

    Returns:
        A list of ``(link, heading)`` tuples, one per search result, where
        ``link`` is the result's ``href`` prefixed with
        ``https://en.wikipedia.org``; or whatever
        ``wikipedia.summary(query)`` returns when the response is not a
        search-results page.

    Raises:
        ValueError: If *query* is ``None``, empty, or only whitespace.
    """
    # Local import keeps this block self-contained; the module-level import
    # section is not visible from here.
    from urllib.parse import quote

    text = "" if query is None else str(query)
    if not text.strip():
        raise ValueError("query must be a non-empty, non-blank string")

    # Percent-encode the query so characters such as '&', '#', '+' and '?'
    # are sent as part of the search text instead of altering the URL.
    response = requests.get(SEARCH_URL + quote(text, safe=""), timeout=timeout)
    soup = BeautifulSoup(markup=response.text, features="lxml")

    # The title check alone is only a heuristic: an article whose own title
    # contains "search" would match as well. The results list is the
    # definitive marker, so require both before scraping.
    result_ul = None
    if "search" in str(soup.title).lower():
        result_ul = soup.find(name="ul", attrs={"class": "mw-search-results"})
    if result_ul is None:
        return wikipedia.summary(query)

    pages = []
    for li in result_ul.find_all("li"):
        li_div = li.find(name="div", attrs={"class": "mw-search-result-heading"})
        a = li_div.find("a") if li_div is not None else None
        # Skip items without a usable heading link instead of crashing.
        if a is None or not a.get("href"):
            continue
        link = "https://en.wikipedia.org" + a["href"]
        heading = str(a.text)
        pages.append((link, heading))
    return pages
评论列表
文章目录