Python 爬取並下載網易雲歌單歌曲

```python
import requests, os, time, sys, re
from urllib import request
from scrapy.selector import Selector


class wangyiyun():
    """Download every song of a NetEase Cloud Music (music.163.com) playlist.

    Typical use is ``wangyiyun().work(playlist_id)``: the playlist page is
    scraped for its song links, each song page is scraped for the title and
    artists, and the audio is saved as ``<artists>-<title>.mp3``.
    """

    # Directory used by work() when the caller does not pass one.
    DEFAULT_DIR = r'C:\Users\HP\Desktop\Music'
    # Seconds to wait for a page request before giving up; without a timeout
    # a stalled connection would block the whole run forever.
    REQUEST_TIMEOUT = 10

    def __init__(self):
        self.headers = {
            'User-Agent': 'Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/55.0.2883.87 Safari/537.36',
            'Referer': 'http://music.163.com/'}
        self.main_url = 'https://music.163.com/'
        self.session = requests.Session()
        # update() keeps the session's default headers and its
        # case-insensitive header mapping instead of replacing them.
        self.session.headers.update(self.headers)

    @staticmethod
    def _safe_filename(name):
        """Return *name* with characters that are illegal in file names replaced by '_'."""
        # Path separators, Windows-reserved punctuation and control characters.
        cleaned = re.sub(r'[\\/:*?"<>|\x00-\x1f]', '_', name).strip().rstrip('.')
        return cleaned or 'untitled'

    @staticmethod
    def _song_id(songurl):
        """Extract the numeric song id from a link such as '/song?id=64006'."""
        match = re.search(r'[?&]id=(\d+)', songurl)
        if match:
            return match.group(1)
        # Unusual link shape: fall back to the plain "text after the first '='" rule.
        return songurl.split('=')[1]

    def _absolute_url(self, path):
        """Join *path* onto main_url with exactly one '/' between them."""
        return self.main_url.rstrip('/') + '/' + path.lstrip('/')

    def get_songurls(self, playlist):
        """Open the playlist page and return the relative link of every song.

        Args:
            playlist: integer playlist id.

        Returns:
            A list of hrefs taken from the page's ``ul.f-hide`` list, e.g.
            ['/song?id=64006', '/song?id=63959', '/song?id=25642714'].
        """
        url = self._absolute_url('playlist?id=%d' % playlist)
        resp = self.session.get(url, timeout=self.REQUEST_TIMEOUT)
        sel = Selector(text=resp.text)
        return sel.xpath('//ul[@class="f-hide"]/li/a/@href').extract()

    def get_songinfo(self, songurl):
        """Open a song page and return its id and display name.

        Args:
            songurl: relative song link as returned by get_songurls().

        Returns:
            A ``(song_id, songname)`` tuple of strings where songname is
            '<artist>&<artist>-<title>', e.g. ('64006', '陳小春-失戀王').
            When the page has no title node the song id is used as the title.
        """
        song_id = str(self._song_id(songurl))
        resp = self.session.get(self._absolute_url(songurl),
                                timeout=self.REQUEST_TIMEOUT)
        sel = Selector(text=resp.text)
        # extract_first() yields None when the node is absent; fall back to
        # the id so the name can still be built.
        song_name = sel.xpath("//em[@class='f-ff2']/text()").extract_first() or song_id
        singer = '&'.join(sel.xpath("//p[@class='des s-fc4']/span/a/text()").extract())
        return song_id, singer + '-' + song_name

    def download_song(self, songurl, dir_path):
        """Download the mp3 for one song link into *dir_path*.

        Args:
            songurl: relative song link as returned by get_songurls().
            dir_path: target directory; created if it does not exist.

        Returns:
            The path of the file that was written.
        """
        song_id, songname = self.get_songinfo(songurl)
        song_url = 'http://music.163.com/song/media/outer/url?id=%s.mp3' % song_id
        os.makedirs(dir_path, exist_ok=True)
        # The name comes from scraped page text, so it must be sanitised
        # before it is used as a file name.
        path = os.path.join(dir_path, self._safe_filename(songname) + '.mp3')
        request.urlretrieve(song_url, path)
        return path

    def work(self, playlist, dir_path=None):
        """Download every song of *playlist*.

        Args:
            playlist: integer playlist id.
            dir_path: directory to save into; defaults to DEFAULT_DIR.
        """
        if dir_path is None:
            dir_path = self.DEFAULT_DIR
        for songurl in self.get_songurls(playlist):
            self.download_song(songurl, dir_path)


if __name__ == '__main__':
    # Id of the playlist to download when the file is run as a script.
    playlist_id = 2895575219
    wangyiyun().work(playlist_id)
    ```
發表評論
所有評論
還沒有人評論,想成為第一個評論的人麼? 請在上方評論欄輸入並且點擊發布.
相關文章