Python 3 抓取百度首頁皮膚

import sys, importlib, os, urllib.request
# NOTE(review): this looks like a holdover from the Python 2 idiom
# `reload(sys); sys.setdefaultencoding(...)`. Nothing visible in this file
# relies on `sys` having been reloaded -- confirm before removing.
importlib.reload(sys)

def download_pic(url, save_dir=None):
    """Download the image at *url* into a local directory, skipping existing files.

    The local file name is the last path segment of *url* (everything after
    the final ``/``). If a file with that name already exists in the target
    directory, nothing is fetched and a notice is printed instead.

    Args:
        url: Address of the image to fetch.
        save_dir: Directory to save into. When omitted, the
            ``baidu_background`` desktop folder this script has always used
            is taken. The directory is not created here.

    Returns:
        ``None`` in the normal case (including when the file already existed
        or a ``URLError`` was reported), or the string ``"UNKNOWN ERROR"``
        when any other exception interrupted the download or the write.
    """
    if save_dir is None:
        save_dir = 'C:\\Users\\user\\Desktop\\baidu_background\\'

    # Derive the name from the URL itself rather than from a fixed character
    # offset, so a URL prefix of a different length still yields "<n>.jpg".
    file_name = url.rsplit('/', 1)[-1]
    name = os.path.join(save_dir, file_name)

    if os.path.exists(name):
        print("this pic exit error...")
        return

    headers = {'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/66.0.3359.181 Safari/537.36'}
    try:
        req = urllib.request.Request(url=url, headers=headers)
        # Close the response deterministically instead of leaving it to the
        # garbage collector.
        with urllib.request.urlopen(req, timeout=5) as response:
            pic_tmp = response.read()
        with open(name, "wb") as out:
            out.write(pic_tmp)
    except urllib.request.URLError as e:
        print("error", e)
    except Exception as e:
        # `Exception` rather than a bare `except` so that Ctrl-C and
        # SystemExit still propagate; the cause is printed instead of hidden.
        print("error", e)
        return "UNKNOWN ERROR"

def main():
    """Request skins 1-999 from the skin_zoom URL and discard 15821-byte files.

    For each index ``i`` the image ``<i>.jpg`` is requested through
    ``download_pic``. If the saved file is exactly 15821 bytes it is deleted
    again and a message is printed. Indexes for which no file exists after
    the download attempt are skipped.
    """
    preurl = "https://ss1.bdstatic.com/kvoZeXSm1A5BphGlnYG/skin_zoom/"
    # Must be the directory download_pic() saves into. It used to be spelled
    # "Users\\users\\" here, so the size check never found the saved file.
    pic_dir = 'C:\\Users\\user\\Desktop\\baidu_background\\'
    # NOTE(review): presumably the byte size of the placeholder image served
    # for skins that do not exist -- confirm.
    placeholder_size = 15821

    for i in range(1, 1000):
        file_name = str(i) + ".jpg"
        download_pic(preurl + file_name)
        pic_path = pic_dir + file_name
        try:
            pic_size = os.path.getsize(pic_path)
        except OSError:
            # The download left no file behind; carry on with the next index
            # instead of aborting the whole run.
            continue
        if pic_size == placeholder_size:
            os.remove(pic_path)
            print(pic_path + "  finished!")

# Run the download pass only when this file is executed as a script (not when
# imported), then report completion.
if __name__ == '__main__':
    main()
    print("Done!")

發表評論
所有評論
還沒有人評論，想成為第一個評論的人麼？請在上方評論欄輸入並且點擊發布。
相關文章