# python之requests

'''
&name : xiaowen
&time : 2021/8/19
&content : 获取段子
'''

import requests
from lxml import etree
import re
import time

def _fetch_html(url, headers):
    """Download ``url`` and return the response body decoded as UTF-8.

    The response is closed before returning, even if reading the body fails.
    """
    # A timeout keeps an unresponsive server from hanging the script forever.
    response = requests.get(url=url, headers=headers, timeout=10)
    try:
        response.encoding = 'utf-8'
        return response.text
    finally:
        response.close()


def get_content(url):
    """Print the content of every entry linked from the listing page at ``url``.

    The listing page is parsed with lxml; for each entry ``div`` the first
    link is followed, and every ``<div class="content">`` section found on
    the linked page is printed to stdout.

    Args:
        url: Address of the listing page. Links found on it are resolved
            relative to this address.

    Returns:
        None. Output is printed, with a one-second pause before each item.
    """
    # Function-scope import so this block does not depend on the file's
    # top-level import list.
    from urllib.parse import urljoin

    headers = {"User-Agent":"Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/7.36 (KHTML, like Gecko) Chrome/3.0.3.61 Safari/7.36"}
    # Compiled once, outside the loop. re.S lets '.' span line breaks, and the
    # named group matches the group("content") lookup below.
    content_pattern = re.compile(r'<div class="content">(?P<content>.*?)</div>', re.S)

    listing = etree.HTML(_fetch_html(url, headers))
    if listing is None:
        # Nothing parseable came back, so there are no entries to follow.
        return

    for entry in listing.xpath('/html/body/div[1]/div/div[2]/div'):
        hrefs = entry.xpath('./a[1]/@href')
        if not hrefs:
            # Entry without a link (e.g. a spacer or ad block): skip it
            # instead of failing on an empty result list.
            continue
        # Resolve the href against the listing URL rather than hard-coding
        # the site's host.
        detail_url = urljoin(url, hrefs[0])
        detail_html = _fetch_html(detail_url, headers)
        for match in content_pattern.finditer(detail_html):
            time.sleep(1)
            print('\n', match.group("content"))
# Script entry point: ask for a page number and print that page's entries.
if __name__ == '__main__':
    print('欢迎使用本程序🙃')
    time.sleep(0.5)
    try:
        a = int(input('请输入页数(1-14):'))
    except ValueError:
        # Non-numeric input is reported through the same error branch below.
        a = None
    # The prompt advertises 1-14, so reject zero and negatives as well.
    if a is not None and 1 <= a <= 14:
        print('正在加载')
        time.sleep(0.5)
        # NOTE(review): the host name is redacted ("**") in the source this
        # script was copied from; fill in the real site before running.
        url = 'https://www.**.com/text/page/{}/'.format(a)
        get_content(url)
    else:
        print('输入错误')

# posted @ 2021-09-07 22:53  _温  阅读(59)  评论(0)    收藏  举报

" ┆♡┆ ┆,┆人┆善┆,┆今┆在┆生┆ ┆娘┆匿┆意┆此┆姑┆ ┆扰┆得┆ ┆小┆ ┆♡┆"
" ┆♡┆ ┆暖┆予┆其┆望┆生┆打┆往┆ ┆往┆与┆止┆所┆娘┆ ┆姑┆姑┆ ┆生┆ ┆♡┆"
" ┆♡┆ ┆色┆君┆身┆姑┆就┆扰┆北┆ ┆南┆年┆于┆有┆勿┆ ┆娘┆娘┆ ┆不┆ ┆♡┆"
" ┆♡┆ ┆浮┆欢┆,┆娘┆此┆姑┆瞧┆ ┆走┆华┆唇┆爱┆怪┆ ┆良┆青┆ ┆才┆ ┆♡┆"
" ┆♡┆ ┆余┆喜┆遇┆日┆别┆娘┆,┆ ┆,┆,┆齿┆慕┆,┆ ┆久┆睐┆ ┆,┆ ┆♡┆"
" ┆♡┆ ┆生┆城┆良┆后┆过┆,┆不┆ ┆小┆姑┆,┆之┆自┆ ┆,┆,┆ ┆未┆ ┆♡┆"