python 【BeautifulSoup【新】】

 

# Key topics: output formatting, BeautifulSoup, requests
 2 import requests
 3 
 4 import requests,bs4
 5 from bs4 import BeautifulSoup
 6 
 7 def getHtml(url):
 8     try:
 9         r = requests.get(url,timeout=20)
10         r.raise_for_status()
11         r.encoding = r.apparent_encoding
12         return r.text
13     except:
14         return "失败"
15 
16 
def fillUnivList(ulist, html):
    """Parse the table body in *html* and append its rows to *ulist*.

    For every tag that is a direct child of the first ``<tbody>``, the
    ``.string`` of its first four ``<td>`` cells is appended to *ulist* as a
    four-element list. ``printUnivList`` prints those four values under the
    headers rank, school name, address and score.

    Args:
        ulist: List that receives one ``[td0, td1, td2, td3]`` entry per
            table row; it is modified in place.
        html: HTML text of the page to parse.

    Returns:
        None. When the document has no ``<tbody>`` (for example when the
        download failed and *html* is not a real page) *ulist* is left
        unchanged. Rows with fewer than four cells are skipped.
    """
    soup = BeautifulSoup(html, "html.parser")

    tbody = soup.find("tbody")
    if tbody is None:
        # No table in the document: nothing to collect.
        return

    for tr in tbody.children:
        # .children also yields text nodes between rows; keep tags only.
        if not isinstance(tr, bs4.element.Tag):
            continue
        tds = tr("td")  # calling a tag is shorthand for find_all
        if len(tds) < 4:
            # Not a full data row; indexing tds[3] would fail.
            continue
        ulist.append([td.string for td in tds[:4]])
24 
25 
def printUnivList(ulist, num):
    """Print a header line and up to *num* rows of *ulist* as centred columns.

    Each row is printed as four tab-separated, centred fields of width
    10, 15, 15 and 5. The two middle columns are padded with the full-width
    space ``chr(12288)`` instead of the ASCII space, so that Chinese text
    lines up across rows.

    Args:
        ulist: Sequence of rows; the first four items of each row are
            printed. An item that is ``None`` is printed as an empty field.
        num: Maximum number of rows to print. If *ulist* holds fewer rows,
            all of them are printed; a value of zero or less prints only
            the header.

    Raises:
        IndexError: If a row has fewer than four items.
    """
    fill = chr(12288)  # full-width (ideographic) space
    # {4} injects the fill character into the format spec of columns 1 and 2.
    splt = "{0:^10}\t{1:{4}^15}\t{2:{4}^15}\t{3:^5}"
    print(splt.format("排名", "学校名称", "地址", "分数", fill))
    # Slicing, unlike indexing with range(num), tolerates a short list.
    for u in ulist[:max(num, 0)]:
        # None cannot be formatted with an alignment spec, so render it as "".
        cells = ["" if u[i] is None else str(u[i]) for i in range(4)]
        print(splt.format(cells[0], cells[1], cells[2], cells[3], fill))
32         
33 
def main():
    """Download the ranking page, parse its table and print up to 100 rows.

    The page address is hard-coded. If the download fails, the failure
    sentinel and the address are printed and nothing is parsed.
    """
    uinfo = []
    url = "http://www.zuihaodaxue.cn/shengyuanzhiliangpaiming2018.html"

    html = getHtml(url)
    if html == "失败":
        # getHtml reports a failed download with this sentinel string;
        # it is not a page, so there is no table to parse.
        print(html, url)
        return

    fillUnivList(uinfo, html)
    # Never ask for more rows than were actually parsed.
    printUnivList(uinfo, min(100, len(uinfo)))
# Run the scraper only when this file is executed as a script, so that
# importing it does not trigger a network request.
if __name__ == "__main__":
    main()
中国大学排名

 

 

 

 

 

 

 

 

 

 

 

 

 

 

 

 

 

 

 

posted @ 2018-08-03 15:33  Justice-V  阅读(88)  评论(0)    收藏  举报