|

楼主 |
发表于 2020-1-18 15:08:17
|
显示全部楼层
以下是源代码:
- import requests
- from bs4 import BeautifulSoup
- import os
- import bs4
def getHTMLText(url):
    """Download *url* and return the response body as text.

    Args:
        url: Address of the page to fetch.

    Returns:
        The decoded page text on success. If the request fails or the
        server answers with an error status, the fixed message
        "产生错误:url调用" is returned instead of raising.
    """
    try:
        # The second positional parameter of requests.get() is ``params``,
        # so the timeout must be passed by keyword to actually take effect.
        r = requests.get(url, timeout=30)
        r.raise_for_status()
        # Decode using the encoding detected from the body rather than the
        # one declared in the response headers.
        r.encoding = r.apparent_encoding
        return r.text
    except requests.RequestException:
        # Only network/HTTP failures are turned into the error message;
        # unrelated exceptions (e.g. KeyboardInterrupt) propagate.
        return "产生错误:url调用"
def fillUnivList(ulist, html):
    """Parse the first ``<tbody>`` in *html* and append its rows to *ulist*.

    For every element child of the table body that has at least three
    ``<td>`` cells, a three-item list holding the ``.string`` of the first
    three cells is appended to *ulist*.

    Args:
        ulist: List that is extended in place.
        html: HTML source text to parse.

    Returns:
        None. *ulist* is left untouched when *html* contains no ``<tbody>``.
    """
    soup = BeautifulSoup(html, "html.parser")
    tbody = soup.find("tbody")
    if tbody is None:
        # No table in the document (for example the download failed and
        # *html* is not the expected page): nothing to collect.
        return
    for tr in tbody.children:
        # .children also yields whitespace text nodes between rows.
        if not isinstance(tr, bs4.element.Tag):
            continue
        tds = tr("td")
        if len(tds) < 3:
            # Skip rows that do not carry the three expected cells.
            continue
        ulist.append([td.string for td in tds[:3]])
def output(ulist, num):
    """Print a header line followed by at most *num* rows of *ulist*.

    Each row is printed as three centred, tab-separated columns
    (widths 10, 6 and 10).

    Args:
        ulist: Sequence of rows; the first three items of each row are
            printed. A ``None`` item is printed as an empty column.
        num: Maximum number of rows to print. Fewer rows are printed when
            *ulist* is shorter; nothing but the header is printed when
            *num* is zero or negative.
    """
    # Format specs must be closed with '}', not ']'.
    tplt = "{:^10}\t{:^6}\t{:^10}"
    print(tplt.format("排名", "学校名称", "总分"))
    # Slicing (instead of indexing range(num)) tolerates short lists.
    for u in ulist[:max(num, 0)]:
        cells = ["" if v is None else str(v) for v in u[:3]]
        print(tplt.format(*cells))
def main():
    """Fetch the ranking page, collect its table rows and print the first 20."""
    ranking_url = "http://www.zuihaodaxue.com/zuihaodaxuepaiming2016.html"
    rows = []
    page = getHTMLText(ranking_url)
    fillUnivList(rows, page)
    output(rows, 20)


main()
复制代码 |
|