07.糗事百科图片(正则)

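'''
Regex used to pull every image URL out of a listing page; the capture
group is the src of the <img> inside each "thumb" div:
<div class="thumb">.*?<img src="(.*?)" alt.*?</div>
'''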
import requests
import re
import os
# Directory the downloaded images are written to (created on demand).
SAVE_DIR = './糗事百科图片'
# A listing page URL is this prefix followed by the page number.
PAGE_URL_PREFIX = 'https://www.qiushibaike.com/imgrank/page/'
# Seconds to wait for the server before giving up on a request; without a
# timeout a stalled connection would block the script forever.
REQUEST_TIMEOUT = 10

headers = {
    'User-Agent': 'Mozilla/5.0 (Macintosh; Intel Mac OS X 10.15; rv:82.0) Gecko/20100101 Firefox/82.0'
}
# Captures the src attribute of the <img> inside each <div class="thumb">.
ex = r'<div class="thumb">.*?<img src="(.*?)" alt.*?</div>'
# Compiled once; re.S lets '.' span the newlines between the tags.
IMG_SRC_PATTERN = re.compile(ex, re.S)


def extract_image_srcs(page_text):
    """Return the image src values found in *page_text*, in page order.

    Each value is the raw attribute text captured by ``ex``; an empty list
    is returned when the page contains no matching thumb block.
    """
    return IMG_SRC_PATTERN.findall(page_text)


def build_image_url(img_src):
    """Turn a captured src value into a URL that can be requested.

    A src that already starts with ``http://`` or ``https://`` is returned
    unchanged; anything else (the pattern captures scheme-less ``//host/...``
    values) gets ``https:`` prepended.
    """
    if img_src.startswith(('http://', 'https://')):
        return img_src
    return 'https:' + img_src


def image_file_name(img_src):
    """Return the last path segment of *img_src*, without query or fragment.

    The result is an empty string when the src ends with ``/``.
    """
    path = img_src.split('?', 1)[0].split('#', 1)[0]
    return path.split('/')[-1]


def main(first_page=1, last_page=5):
    """Download every thumb image from the listing pages into SAVE_DIR.

    Pages *first_page* through *last_page* (inclusive) are fetched. A page
    or image whose request fails or returns an HTTP error status is reported
    with ``print`` and skipped, so one bad response neither aborts the run
    nor gets written to disk as if it were an image.
    """
    # exist_ok avoids the check-then-create race of exists() + mkdir().
    os.makedirs(SAVE_DIR, exist_ok=True)

    # One session reuses connections across the page and image requests.
    with requests.Session() as session:
        for i in range(first_page, last_page + 1):
            url = PAGE_URL_PREFIX + str(i)
            try:
                response = session.get(url, headers=headers,
                                       timeout=REQUEST_TIMEOUT)
                response.raise_for_status()
            except requests.RequestException as err:
                print('skipping page', url, '-', err)
                continue

            for img_src in extract_image_srcs(response.text):
                file_name = image_file_name(img_src)
                if not file_name:
                    # Nothing usable to name the file after.
                    continue

                img_url = build_image_url(img_src)
                try:
                    img_response = session.get(img_url, headers=headers,
                                               timeout=REQUEST_TIMEOUT)
                    img_response.raise_for_status()
                except requests.RequestException as err:
                    print('skipping image', img_url, '-', err)
                    continue

                # Written only after a successful download, so a failed
                # request never leaves an empty or bogus file behind.
                file_path = os.path.join(SAVE_DIR, file_name)
                with open(file_path, 'wb') as fp:
                    fp.write(img_response.content)


if __name__ == '__main__':
    main()



posted @ 2020-12-08 15:32  nan4457  阅读(642)  评论(0)    收藏  举报