# 爬虫实例(8) — web crawler example (8)


import requests
import re
# Fetch the text listing page, pull the text inside each
# <div class="content"><span>…</span> element out of the HTML with a regex,
# and write the results to xiaohua.txt.
url = 'https://www.qiushibaike.com/text/'
# Browser-style User-Agent header sent with the request.
header = {
    'User-Agent':'Mozilla/5.0(Windows;U;WindowsNT6.1;en-us)AppleWebKit/534.50(KHTML,likeGecko)Version/5.1Safari/534.50'
}
# requests has no default timeout; bound the wait so a stalled server
# cannot hang the script forever.
response = requests.get(url, headers=header, timeout=10)
# Fail loudly on a 4xx/5xx response instead of parsing an error page and
# overwriting the output file with nothing.
response.raise_for_status()
info = response.text
print(info)
# NOTE: without re.S the `.` in `(.+)` does not match newlines, so only the
# single line of text immediately preceding the closing </span> is captured.
f1 = re.findall(r'<div class="content">\s*<span>\s*(.+)\s*</span>', info)


print('-' * 1000)
print(f1)
# Each captured entry is followed by three newlines in the output file.
with open('xiaohua.txt', 'w', encoding='utf-8') as f:
    f.writelines(fs + '\n\n\n' for fs in f1)
# posted @ 2020-07-09 17:07  kuanleung  阅读(6)  评论(0)    收藏  举报  来源