from bs4 import BeautifulSoup
import urllib.request
# Download a single image over HTTPS and save it as first_down.jpg in the
# current working directory.
IMAGE_URL = 'https://ss3.bdstatic.com/70cFv8Sh_Q1YnxGkpoWK1HF6hhy/it/u=3193006289,3802606706&fm=26&gp=0.jpg'

request = urllib.request.Request(IMAGE_URL)
# The response wraps an open network connection; the with-block guarantees it
# is closed once the body has been read, even if read() raises.
with urllib.request.urlopen(request) as response:
    data = response.read()
print(data)

# 'wb' because the payload is raw image bytes, not text.
with open('first_down.jpg', 'wb') as fp:
    fp.write(data)
print("download finished")

  在看书的时候有点迷糊。尝试自己弄下。大概步骤是先找到图片的网

from bs4 import BeautifulSoup
import re
import urllib.request
# Fetch a forum page, extract every http://...jpg URL found in its HTML, and
# save each image that downloads successfully as 1.jpg, 2.jpg, ... in the
# current working directory.
PAGE_URL = 'http://bbs.tianya.cn/post-tianyamyself-331739-1.shtml'
# urlopen() takes its timeout in seconds. The earlier value of 3000 meant a
# stalled connection could block for 50 minutes; 30 seconds is ample here.
TIMEOUT_SECONDS = 30

request = urllib.request.Request(PAGE_URL)
print(request)
# Close the connection as soon as the page body has been read.
with urllib.request.urlopen(request, timeout=TIMEOUT_SECONDS) as response:
    data = response.read()
print(data)

# Search the decoded text rather than repr(data): in the repr, newlines and
# tabs appear as the literal characters "\n" / "\t", which are not whitespace,
# so a match could run across several lines of HTML.
# NOTE(review): assumes the page is UTF-8 compatible; undecodable bytes are
# replaced, and a URL containing one simply fails to download and is skipped.
html = data.decode('utf-8', errors='replace')
# Stop at whitespace, quotes and angle brackets so that one match cannot
# swallow the markup between two separate image URLs.
regex = r'''http://[^\s"'<>]*?\.jpg'''
pattern = re.compile(regex)
get_img = pattern.findall(html)
print(get_img)
print(type(get_img))

num = 1
for i in get_img:
    try:
        with urllib.request.urlopen(i, timeout=TIMEOUT_SECONDS) as img_response:
            request2 = img_response.read()
        with open('%s.jpg' % num, 'wb') as fp:
            fp.write(request2)
    except Exception as exc:
        # Best-effort download: one bad link must not abort the whole run, but
        # report it instead of hiding it. Ctrl-C still interrupts the script
        # because KeyboardInterrupt is not an Exception subclass.
        print('skipped %s: %s' % (i, exc))
    else:
        # Advance the counter only after a successful save so that the output
        # files are numbered without gaps.
        num = num + 1

print("done")

 

址。通过urllib请求该网址之后得到data数据，然后通过open函数写到first_down.jpg文件中。这个是最关键的步骤。

posted on 2017-08-17 22:42  uxiuxi  阅读(130)  评论(0)    收藏  举报