簡單的靜態網頁的圖片獲取:html
# Download every <img src="http://..."> image referenced by a static HTML page.
import urllib.request  # the submodule must be imported explicitly; bare `import urllib` does not load it
import re
import os

# Page to scrape and directory the images are written to.
url = 'http://www.toutiao.com/a6467889113046450702/'
path = 'D:\\pic\\'


def getHTML(url):
    """Fetch *url* and return the raw response body as bytes.

    The response object is closed as soon as the body has been read.
    Any error raised by ``urllib.request.urlopen`` propagates to the caller.
    """
    with urllib.request.urlopen(url) as response:
        return response.read()


def getIMG(html):
    """Return the list of image URLs found in *html* (a ``str``).

    Only ``img src="http://..."`` attributes are matched; the match is
    non-greedy so each URL stops at its closing double quote.  An input
    without any match yields an empty list.
    """
    s = r'img src="(http://.+?)"'
    pat = re.compile(s)
    return pat.findall(html)


def main():
    """Download all images of the configured page into ``path`` as N.jpg."""
    html = getHTML(url).decode('UTF-8')
    imglist = getIMG(html)

    if not os.path.isdir(path):
        os.mkdir(path)
        print('建立文件夾%s' % path)

    # A dedicated loop variable keeps the module-level `url` intact.
    for imgname, img_url in enumerate(imglist):
        filepath = path + '%d.jpg' % imgname
        print('正在下載第%d張照片...' % (imgname + 1))
        urllib.request.urlretrieve(img_url, filepath)

    print('下載完成!')


if __name__ == '__main__':
    main()
動態網頁圖片獲取url