爬虫实例(8)
import requests
import re
# Fetch one listing page, print the raw HTML and the extracted entries, then
# write each extracted entry to ``xiaohua.txt``.
url = 'https://www.qiushibaike.com/text/'

# Send a desktop-browser User-Agent instead of the default requests one
# (presumably so the site does not reject the request as a bot -- confirm).
header = {
    'User-Agent': 'Mozilla/5.0(Windows;U;WindowsNT6.1;en-us)AppleWebKit/534.50(KHTML,likeGecko)Version/5.1Safari/534.50'
}

# Always pass a timeout: without one, requests can wait forever on a server
# that accepts the connection but never answers.
response = requests.get(url, headers=header, timeout=10)
# Stop on 4xx/5xx responses rather than parsing an error page and overwriting
# the output file with nothing useful.
response.raise_for_status()

info = response.text
print(info)

# Capture the text inside each <div class="content"><span>...</span>.
# No re.S flag is used, so ``.`` stops at a newline: only entries whose text
# sits on a single line (surrounded by optional whitespace) are matched.
f1 = re.findall(r'<div class="content">\s*<span>\s*(.+)\s*</span>', info)

# Visual separator between the raw HTML dump and the extracted list.
print('-' * 1000)
print(f1)

# Overwrite the output file; entries are separated by three newlines.
with open('xiaohua.txt', 'w', encoding='utf-8') as f:
    for fs in f1:
        f.write(fs + '\n\n\n')

浙公网安备 33010602011771号