import requests
from bs4 import BeautifulSoup
# Module-level accumulator shared by the functions below: fillunivlist()
# appends one list of cell values per table row, printunivlist() reads it.
alluniv = []
def getHTMLText(url):
    """Fetch ``url`` with an HTTP GET and return the body decoded as UTF-8.

    This is a best-effort helper: a failure reported by ``requests``
    (connection error, timeout, 4xx/5xx status, malformed URL) yields an
    empty string instead of an exception.

    Args:
        url: Address of the page to download.

    Returns:
        The page text, or ``''`` when the request fails.
    """
    try:
        r = requests.get(url, timeout=30)
        # Convert 4xx/5xx responses into an HTTPError so they reach the
        # handler below instead of being returned as page content.
        r.raise_for_status()
        # Decode as UTF-8 regardless of the encoding requests inferred.
        r.encoding = 'utf-8'
        return r.text
    except requests.RequestException:
        # Only request-level failures are swallowed; programming errors and
        # KeyboardInterrupt propagate instead of being silently hidden.
        return ''
def fillunivlist(soup):
    """Append the cell texts of every data row in ``soup`` to ``alluniv``.

    Each ``<tr>`` that contains at least one ``<td>`` contributes one list
    holding the text of its cells, in document order. Rows without ``<td>``
    cells are skipped.

    Args:
        soup: Parsed document (or tag) exposing ``find_all``.

    Returns:
        None. The module-level ``alluniv`` list is extended in place.
    """
    for tr in soup.find_all('tr'):
        cells = tr.find_all('td')
        if not cells:
            continue
        row = []
        for td in cells:
            text = td.string
            if text is None:
                # ``.string`` is None for empty cells and for cells with
                # several children; fall back to the concatenated text so
                # later formatting never receives None.
                text = td.get_text(strip=True)
            row.append(text)
        alluniv.append(row)
def printunivlist(num):
    """Print a header line followed by up to ``num`` rows from ``alluniv``.

    Columns 0, 1, 2, 3 and 6 of each stored row are printed, centred with
    the same field widths as the header.

    Args:
        num: Maximum number of rows to consider, counted from the start of
            ``alluniv``. Values of zero or less print only the header.

    Returns:
        None. Output goes to standard output.
    """
    row_format = "{:^4}{:^10}{:^5}{:^8}{:^10}"
    print(row_format.format("排名","学校名称","省市","总分","培养规模"))
    # Slice instead of indexing 0..num-1 so a short (or empty) ``alluniv``
    # no longer raises IndexError; max() keeps a negative ``num`` from
    # turning into a "all but the last N" slice.
    for u in alluniv[:max(num, 0)]:
        if len(u) < 7:
            # Row lacks the column at index 6; skip it rather than crash.
            continue
        # None cannot be formatted with a width spec, so show it as empty.
        cells = ['' if u[i] is None else u[i] for i in (0, 1, 2, 3, 6)]
        print(row_format.format(*cells))
def main(num):
    """Download the ranking page, collect its table rows and print them.

    Args:
        num: Number of rows to print, forwarded to ``printunivlist``.

    Returns:
        None.
    """
    # The original literal contained a stray backslash ("/\zuihao..."),
    # which is an invalid escape sequence and put a literal backslash into
    # the request path.
    url = 'http://www.zuihaodaxue.cn/zuihaodaxuepaiming2016.html'
    html = getHTMLText(url)
    soup = BeautifulSoup(html, 'html.parser')
    fillunivlist(soup)
    printunivlist(num)
# Script entry: executed whenever this module is run or imported; asks
# main() to print the first 10 collected rows.
main(10)
抓取大学排名

相关文章:

  • 2021-04-30
  • 2022-12-23
  • 2022-12-23
  • 2022-01-02
  • 2022-02-08
  • 2021-12-12
  • 2021-04-07
  • 2022-01-16
猜你喜欢
  • 2022-02-07
  • 2021-10-12
  • 2021-08-07
  • 2021-12-01
  • 2022-12-23
  • 2022-01-11
相关资源
相似解决方案