天天看點

Python 圖檔抓取並儲存到本地

首先安裝包:

# HTML 的解析庫
pip install beautifulsoup4
# 圖檔處理的庫
pip install pillow
# HTTP 請求的庫
pip install requests
           
import requests
from bs4 import BeautifulSoup
from PIL import Image
import os 
from io import BytesIO
import time
 
# Scrape every matching <img> from a gallery page and save each one as a PNG
# file under ./photo, numbered by its position in the page.

# Gallery page to scrape, and the browser-like User-Agent sent with every request.
url = "http://www.yestone.com/gallery/1501754333627"
headers = {"User-Agent": "Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/55.0.2883.87 Safari/537.36"}
# Seconds to wait on any single HTTP request; without a timeout a stalled
# server would block the script indefinitely.
REQUEST_TIMEOUT = 10

r = requests.get(url, headers=headers, timeout=REQUEST_TIMEOUT)
# Fail loudly on 4xx/5xx instead of parsing an error page as if it were the gallery.
r.raise_for_status()
soup = BeautifulSoup(r.content, 'html.parser')
# Select the gallery images by their data-v-* attribute.
# NOTE(review): this attribute looks build-generated and may change when the
# site is redeployed -- confirm; selecting by class_='img-responsive' is a
# possible alternative.
items = soup.find_all('img', attrs={'data-v-32e60122': ''})

folder_path = './photo'
# exist_ok avoids the separate exists() check and the race it implies.
os.makedirs(folder_path, exist_ok=True)

for index, item in enumerate(items):
    turl = item.get('src')
    # Skip tags with no src, and anything that is not an absolute HTTP(S) URL
    # (relative paths, data: URIs, ...).
    if not turl or not turl.startswith(('http://', 'https://')):
        continue
    # File names keep the image's position in the page, so skipped entries
    # leave gaps in the numbering.
    img_name = str(index + 1) + '.png'
    try:
        html = requests.get(turl, headers=headers, timeout=REQUEST_TIMEOUT)
        html.raise_for_status()
        # Decode with Pillow and re-encode, so the file really is a PNG
        # regardless of the format the server delivered.
        image = Image.open(BytesIO(html.content))
        image.save(os.path.join(folder_path, img_name))
    except (requests.RequestException, OSError) as exc:
        # One broken image (network failure, undecodable data, unsupported
        # mode for PNG) must not abort the remaining downloads.
        print('Skipping image %d (%s): %s' % (index + 1, turl, exc))
        continue
    print('第%d張圖檔下載下傳完成' % (index + 1))
    time.sleep(1)  # Throttle requests to be polite to the server.
print('抓取完成')