from bs4 import BeautifulSoup
import urllib.request
# Download one image from a fixed URL and save it as first_down.jpg in the
# current working directory.
request = urllib.request.Request(
    'https://ss3.bdstatic.com/70cFv8Sh_Q1YnxGkpoWK1HF6hhy/it/u=3193006289,3802606706&fm=26&gp=0.jpg'
)

# Use the response as a context manager so the connection is closed as soon
# as the body has been read.
with urllib.request.urlopen(request) as response:
    data = response.read()

# Debug output: dumps the raw image bytes to stdout.
print(data)

# Binary mode is required: the payload is image data, not text.
with open('first_down.jpg', 'wb') as fp:
    fp.write(data)

print("download finished")
在看书的时候有点迷糊。尝试自己弄下。大概步骤是先找到图片的网
import http.client
import re
import urllib.request

from bs4 import BeautifulSoup

# Fetch a forum page, collect every http://...jpg URL found in its raw HTML,
# and save each image that downloads successfully as 1.jpg, 2.jpg, ... in the
# current working directory.
request = urllib.request.Request('http://bbs.tianya.cn/post-tianyamyself-331739-1.shtml')
print(request)

# NOTE(review): urlopen's timeout is expressed in seconds, so 3000 is
# 50 minutes -- confirm this is intended (it may have been meant as ms).
with urllib.request.urlopen(request, timeout=3000) as response:
    data = response.read()
print(data)

# Non-greedy, and stops at whitespace, quotes and angle brackets, so two URLs
# that appear back to back in the markup are not merged into a single match.
regex = r'http://[^\s"\'<>]*?\.jpg'
pattern = re.compile(regex)

# repr() gives a str view of the bytes payload without assuming a page
# encoding; the URLs of interest are plain ASCII and come through unchanged.
get_img = re.findall(pattern, repr(data))
print(get_img)
print(type(get_img))

num = 1
for img_url in get_img:
    try:
        with urllib.request.urlopen(img_url, timeout=3000) as img_response:
            img_data = img_response.read()
        with open('%s.jpg' % num, 'wb') as fp:
            fp.write(img_data)
    except (OSError, ValueError, http.client.HTTPException) as exc:
        # Best effort: a broken link or failed write must not abort the whole
        # run, but report it instead of swallowing it silently.
        # URLError/HTTPError and socket timeouts are OSError subclasses.
        print("skipped %s: %s" % (img_url, exc))
    else:
        # Only advance the counter after a successful save, so the output
        # file names stay consecutive.
        num = num + 1

print("done")
址。通过urllib请求该网址之后得到data数据，然后通过open函数写到first_down.jpg文件中。这个是最关键的步骤。
浙公网安备 33010602011771号