爬虫练习【知乎热榜】

def ut_zhihu_rank(url='', limit=10):
    """Fetch a Zhihu hot-list page and render its top entries as Markdown.

    The page is downloaded with ``requests``, parsed with ``BeautifulSoup``
    (``lxml`` parser), and the JSON text held by the element with id
    ``js-initialData`` is decoded. Entries are read from
    ``initialState -> topstory -> hotList``.

    This function relies on ``requests``, ``BeautifulSoup`` and ``json``
    being available in the enclosing module's namespace.

    Args:
        url: Address of the page to fetch. The default is the empty
            placeholder used by the original snippet; callers are expected
            to supply the real address.
        limit: Maximum number of entries to include (default 10). Values
            below zero are treated as zero.

    Returns:
        A string with one numbered Markdown link per entry, in the form
        ``"<rank>. [<title>](<link>)"`` followed by a blank line. Empty if
        the hot list is empty or ``limit`` is not positive.

    Raises:
        IndexError: If the page has no ``#js-initialData`` element.
        KeyError: If the decoded JSON lacks one of the expected keys.
        requests.exceptions.RequestException: If the request fails or
            times out.
    """
    headers = {
        'user-agent': 'ua'
    }
    # A timeout keeps a stalled connection from blocking the caller forever.
    res = requests.get(url, headers=headers, timeout=10)
    soup = BeautifulSoup(res.content, 'lxml')

    # The hot-list data is read from the JSON text of #js-initialData.
    text = soup.select('#js-initialData')[0].string
    initial_data = json.loads(text)
    hot_list = initial_data['initialState']['topstory']['hotList']

    entries = []
    for rank, item in enumerate(hot_list[:max(limit, 0)], start=1):
        title = item['target']['titleArea']['text']
        link = item['target']['link']['url']
        entries.append(f'{rank}. [{title}]({link})\n\n')
    return ''.join(entries)

仅作学习交流用途，侵权立删。

posted @ 2021-09-11 21:08  Timor88  阅读(52)  评论(0)    收藏  举报