2015年最好大学排名爬取

import requests
from bs4 import BeautifulSoup
# Module-level accumulator: fillUnivList() appends one list of cell values
# per table row here, and printUnivList() reads rows back from it.
allU=[]
def getHTMLText(ur1):
    """Download a page and return its body decoded as UTF-8.

    Args:
        ur1: URL of the page to fetch.

    Returns:
        The response text, or an empty string if the request fails
        (connection error, timeout, invalid URL, or a 4xx/5xx status).
    """
    try:
        r = requests.get(ur1, timeout=30)
        # Turn HTTP error statuses into exceptions so they share the
        # failure path below.
        r.raise_for_status()
    except requests.RequestException:
        # Only request-level failures are swallowed; KeyboardInterrupt and
        # programming errors propagate instead of being hidden.
        return ""
    # Force UTF-8 rather than relying on the encoding guessed from headers.
    r.encoding = 'utf-8'
    return r.text
def fillUnivList(soup):
    """Collect the cell contents of every data row into the global ``allU``.

    Each ``<tr>`` that contains at least one ``<td>`` contributes one list
    to ``allU``, holding the ``.string`` of each cell in document order.
    Rows without ``<td>`` cells (for example header rows) are skipped.

    Args:
        soup: Parsed document exposing ``find_all``.

    Returns:
        None. Rows are appended to the module-level ``allU`` list.
    """
    for tr in soup.find_all('tr'):
        cells = tr.find_all('td')
        if not cells:
            continue
        # NOTE: with BeautifulSoup, ``.string`` is None for a cell that has
        # more than one child node; such values are stored as-is.
        allU.append([td.string for td in cells])
def printUnivList(num):
    """Print a header and up to ``num`` rows from the global ``allU``.

    The printed columns are rank, school name, province, total score and
    training scale, read from row indices 0, 1, 2, 3 and 6.

    Args:
        num: Maximum number of rows to print. If fewer rows are available,
            only those are printed; a non-positive value prints the header
            only.

    Raises:
        IndexError: If a printed row has fewer than seven cells.
    """
    # U+3000 (full-width space) is the fill character for the Chinese-text
    # columns so they stay aligned; it is passed as format argument 5 and
    # referenced from inside the format specs.
    fill = chr(12288)
    template = "{0:^4}{1:{5}^10}{2:{5}^5}{3:^8}{4:^10}"
    print(template.format("排名", "学校名称", "省市", "总分", "培养规模", fill))
    # Slicing avoids an IndexError when fewer than ``num`` rows were scraped.
    for u in allU[:max(num, 0)]:
        # A cell may be None (no single string in the <td>); render it as
        # empty text instead of failing inside format().
        cells = ["" if u[i] is None else str(u[i]) for i in (0, 1, 2, 3, 6)]
        print(template.format(cells[0], cells[1], cells[2], cells[3], cells[4], fill))

# Driver: fetch the 2015 ranking page, parse its table, print the top rows.
url = 'http://www.zuihaodaxue.cn/zuihaodaxuepaiming2015_0.html'
html = getHTMLText(url)
if html:
    soup = BeautifulSoup(html, "html.parser")
    fillUnivList(soup)
    # Never ask for more rows than were actually scraped.
    printUnivList(min(30, len(allU)))
else:
    # getHTMLText returns "" on any request failure; say so instead of
    # parsing an empty document and printing nothing useful.
    print("Failed to download ranking page: " + url)

 

posted @ 2020-05-13 15:59  Lysim  阅读(127)  评论(0)    收藏  举报