爬虫练习【知乎热榜】
def ut_zhihu_rank(limit: int = 10) -> str:
    """Return the leading Zhihu hot-list entries as a numbered Markdown list.

    Downloads the page at ``url``, reads the JSON text stored in the
    ``#js-initialData`` element, and formats the first ``limit`` items of
    ``initialState.topstory.hotList`` as ``N. [title](link)`` lines, each
    followed by a blank line.

    Args:
        limit: Maximum number of entries to include. Defaults to 10;
            values below zero are treated as zero.

    Returns:
        The Markdown text, or an empty string when there are no entries.

    Raises:
        IndexError: If the page has no ``#js-initialData`` element.
        KeyError: If the embedded JSON lacks one of the expected keys.
    """
    # NOTE(review): the URL is empty and the user-agent is a placeholder in
    # this source (presumably redacted) -- set real values before running.
    url = ''
    headers = {
        'user-agent': 'ua',
    }
    # A timeout keeps the call from blocking forever on an unresponsive server.
    res = requests.get(url, headers=headers, timeout=10)
    soup = BeautifulSoup(res.content, 'lxml')
    # The page state is embedded as JSON text inside the #js-initialData element.
    text = soup.select('#js-initialData')[0].string
    hot_list = json.loads(text)['initialState']['topstory']['hotList']

    entries = []
    for rank, item in enumerate(hot_list[:max(limit, 0)], start=1):
        target = item['target']
        title = target['titleArea']['text']
        link = target['link']['url']
        entries.append(f'{rank}. [{title}]({link})\n\n')
    return ''.join(entries)
仅作学习交流用途,侵权立删

浙公网安备 33010602011771号