# Python 爬虫学习(一):requests + bs4 爬取图片

import re
import time
from urllib.parse import urljoin

import requests
from bs4 import BeautifulSoup

# Listing page whose first <ul> holds the links to the wallpaper detail pages.
url = "http://www.bizhi360.com/meinv/"

# Seconds to wait for any single HTTP request; without a timeout `requests`
# blocks indefinitely when the server stops responding.
REQUEST_TIMEOUT = 10


def sanitize_filename(title):
    """Return *title* turned into a name that is safe to use as a file name.

    Surrounding whitespace is dropped, path separators, characters reserved
    on Windows and control characters are replaced with ``_``, and trailing
    dots/spaces are removed. ``"untitled"`` is returned when nothing is left.
    """
    cleaned = re.sub(r'[\\/:*?"<>|\x00-\x1f]', "_", str(title).strip())
    cleaned = cleaned.rstrip(". ")
    return cleaned or "untitled"


def fetch_soup(page_url):
    """Download *page_url* and return it parsed with ``html.parser``.

    Raises:
        requests.RequestException: on connection errors, timeouts, or a
            non-2xx HTTP status.
    """
    resp = requests.get(page_url, timeout=REQUEST_TIMEOUT)
    resp.raise_for_status()
    # Decode explicitly as UTF-8, as the original script did.
    resp.encoding = "utf-8"
    return BeautifulSoup(resp.text, "html.parser")


def download_wallpaper(detail_url):
    """Save the image linked from the detail page at *detail_url*.

    The image is written to the current working directory as
    ``<sanitized page title>.jpg``.

    Returns:
        The file name written, or ``None`` when the page lacks the expected
        download link or title.

    Raises:
        requests.RequestException: if a request fails.
        OSError: if the file cannot be written.
    """
    detail_page = fetch_soup(detail_url)

    content = detail_page.find("div", class_="content")
    download_link = content.find("a", class_="download") if content else None
    heading = detail_page.find("h1", class_="title")
    href = download_link.get("href") if download_link else None
    if not href or heading is None:
        # The page does not have the layout this script expects; skip it
        # rather than crash with AttributeError on a None lookup.
        print(f"skipped (unexpected page layout): {detail_url}")
        return None

    title = heading.text
    print(title)

    # Resolve against the detail page so relative hrefs work too.
    img_url = urljoin(detail_url, href)
    img_resp = requests.get(img_url, timeout=REQUEST_TIMEOUT)
    img_resp.raise_for_status()
    print(img_url)

    img_name = sanitize_filename(title) + ".jpg"
    # Binary mode: `content` is the raw response bytes.
    with open(img_name, mode="wb") as f:
        f.write(img_resp.content)
    return img_name


def main():
    """Crawl the listing page and download every wallpaper it links to."""
    main_page = fetch_soup(url)

    ul = main_page.find("ul")
    if ul is None:
        print(f"no <ul> found on {url}")
        return

    for anchor in ul.find_all("a"):
        href = anchor.get("href")
        if not href:
            # Anchor without a target; nothing to follow.
            continue
        try:
            download_wallpaper(urljoin(url, href))
        except (requests.RequestException, OSError) as exc:
            # One bad page or image should not abort the whole crawl.
            print(f"failed: {href}: {exc}")
        # Pause between pages to avoid hammering the server.
        time.sleep(1)


if __name__ == "__main__":
    main()
 

 

# posted @ 2021-06-24 16:33  YuyuFishSmile  阅读(325)  评论(0)  收藏  举报