# Python爬取圖片並存儲

'''
思路: 從縮略圖頁面開始爬取
1) 先爬取所有縮略圖的a標籤
2) 從每個a標籤取出title(作為檔名)和href(拼接成完整的下載地址)
3) 用urlretrieve下載,並以「title.jpg」保存到「男神圖集」目錄
'''
import requests
from bs4 import BeautifulSoup
import os
# Create the download directory up front. exist_ok=True avoids the
# check-then-create race of testing os.path.exists() first.
os.makedirs("男神圖集", exist_ok=True)
import lxml
from urllib import request

# First listing page; retained as a module-level name for compatibility.
url = "http://www.shuaia.net/index_50.html"

# Host that links found on the listing pages are resolved against.
BASE_URL = "http://www.shuaia.net"
# Seconds to wait for a listing page before giving up on it.
REQUEST_TIMEOUT = 10


def safe_filename(title):
    """Return *title* with characters that are unsafe in file names replaced by '_'."""
    unsafe = '\\/:*?"<>|'
    cleaned = "".join(
        "_" if ch in unsafe or ord(ch) < 32 else ch for ch in title
    )
    return cleaned.strip()


def resolve_link(href):
    """Return an absolute URL for *href*, resolved against BASE_URL.

    Root-relative links ("/a/b.html") give the same result as prefixing the
    host; relative and already-absolute links are handled correctly as well.
    """
    from urllib.parse import urljoin

    return urljoin(BASE_URL + "/", href)


if __name__ == '__main__':
    # Walk listing pages index_50.html .. index_54.html.
    for i in range(5):
        page_url = "http://www.shuaia.net/index_5%d.html" % i
        try:
            req = requests.get(url=page_url, timeout=REQUEST_TIMEOUT)
        except requests.RequestException as err:
            # A single unreachable page should not abort the whole crawl.
            print("請求失敗: %s (%s)" % (page_url, err))
            continue
        req.encoding = 'utf-8'
        print("響應碼: ", req.status_code)
        if req.status_code != 200:
            # Error pages do not contain the thumbnail list; skip them.
            continue

        bf2 = BeautifulSoup(req.text, 'lxml')
        a_list = bf2.find_all("a", class_="itemimg-view")
        for item in a_list:
            print(item)
            href = item.get("href")
            title = item.get("title")
            if not href or not title:
                # Without both attributes there is nothing to fetch or name.
                continue
            name = safe_filename(title)
            if not name:
                continue
            # NOTE(review): href is the anchor's link target. If it is a
            # detail page rather than an image file, the saved .jpg will
            # contain HTML -- confirm against the site.
            down_url = resolve_link(href)
            try:
                request.urlretrieve(url=down_url, filename="男神圖集/%s.jpg" % name)
            except OSError as err:
                # URLError/HTTPError are OSError subclasses; keep going with
                # the remaining items instead of crashing.
                print("%s下載失敗: %s" % (name, err))
                continue
            print("%s下載成功" % name + '>' * 10)

 

# 發表評論
# 所有評論
# 還沒有人評論,想成為第一個評論的人麼? 請在上方評論欄輸入並且點擊發布.
# 相關文章