python爬蟲執行個體--網易雲音樂排行榜爬蟲
進過各種努力, 終于找到了個大神寫的部落格,3.6版本的python
python 代碼下載下傳位址: https://github.com/imyxuan/Netease
from Crypto.Cipher import AES
第一次錯誤: 提示沒有安裝Visual Studio 2015 Microsoft Build Tools 14.0
下載下傳位址: https://www.microsoft.com/en-us/download/details.aspx?id=48130
運作修複工具修複完了後提示c++有異常 ,需要擴充修複.....然後工具-->選項-->擴充-->開始擴充.然後再修複一遍,提示c++修複成功!!
隻能百度了: ,安裝這個弄的:
1.設定Microsoft Visual Studio 14.0的環境變量 VCINSTALLDIR 變量值 C:\Program Files (x86)\Microsoft Visual Studio 14.0\VC(預設安裝位置,請根據自己的安裝位置确定)如圖:

3.在指令行(cmd)中執行 set CL=-FI"%VCINSTALLDIR%\INCLUDE\stdint.h"
終于安裝成功了, 然後信心滿滿的重新開機了我的PyCharm, 結果運作的時候還是找不到那個Crypto子產品,這是已經過去好幾個小時了沒辦法, 隻能百度了..
python 的Crypto 安裝目錄: C:\Users\Administrator\AppData\Local\Programs\Python\Python36\Lib\site-packages
# coding: utf-8
# 聲明: 是這個大神寫的, 和沒啥關系,我隻是改了改
from Crypto.Cipher import AES
import base64
import requests
import sys
headers = {
'Cookie': 'appver=1.5.0.75771;',
'Referer': 'http://music.163.com/',
'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/63.0.3239.132 Safari/537.36'
}
first_param = "{\"ids\":\"[%d]\",\"br\":128000,\"csrf_token\":\"\"}"
second_param = "010001"
third_param = "00e0b509f6259df8642dbc35662901477df22677ec152b5ff68ace615bb7b725152b3ab17a876aea8a5aa76d2e417629ec4ee341f56135fccf695280104e0312ecbda92557c93870114af6c9d05c4f7f0c3685b7a46bee255932575cce10b424d813cfe4875d3e82047b97ddef52741d546b8e289dc6935b3ece0462db0a22b8e7"
forth_param = "0CoJUm6Qyw8W8jud"
def get_params():
iv = "0102030405060708"
first_key = forth_param
second_key = 16 * 'F'
h_encText = AES_encrypt(first_param, first_key, iv)
h_encText = AES_encrypt(h_encText, second_key, iv)
return h_encText
def get_encSecKey():
encSecKey = "257348aecb5e556c066de214e531faadd1c55d814f9be95fd06d6bff9f4c7a41f831f6394d5a3fd2e3881736d94a02ca919d952872e7d0a50ebfa1769a7a62d512f5f1ca21aec60bc3819a9c3ffca5eca9a0dba6d6f7249b06f5965ecfff3695b54e1c28f3f624750ed39e7de08fc8493242e26dbc4484a01c76f739e135637c"
return encSecKey
def AES_encrypt(text, key, iv):
pad = 16 - len(text) % 16
if isinstance(text, str):
text = text + pad * chr(pad)
else:
text = text.decode('utf-8') + pad * chr(pad)
encryptor = AES.new(key, AES.MODE_CBC, iv)
encrypt_text = encryptor.encrypt(text)
encrypt_text = base64.b64encode(encrypt_text)
return encrypt_text
def get_json(url, params, encSecKey):
data = {
"params": params,
"encSecKey": encSecKey
}
response = requests.post(url, headers=headers, data=data).json()
return response['data']
# 榜單歌曲批量下載下傳
# r = requests.get('http://music.163.com/api/playlist/detail?id=2884035') # 網易原創歌曲榜
# r = requests.get('http://music.163.com/api/playlist/detail?id=19723756') # 雲音樂飙升榜
# r = requests.get('http://music.163.com/api/playlist/detail?id=3778678') # 雲音樂熱歌榜
#r = requests.get('http://music.163.com/api/playlist/detail?id=3779629') # 雲音樂新歌榜
# 歌單歌曲批量下載下傳
# r = requests.get('http://music.163.com/api/playlist/detail?id=123415635') # 雲音樂歌單——【華語】中國風的韻律,中國人的印記
# r = requests.get('http://music.163.com/api/playlist/detail?id=122732380') # 雲音樂歌單——那不是愛,隻是寂寞說的謊
r=requests.get("http://music.163.com/api/playlist/detail?id=2884035",headers=headers)
arr=r.json()['result']['tracks']
for i in range(100):
toplistMP3ID =str(arr[i]['id'])
toplistMP3Title = str(arr[i]['name'])
music_id = toplistMP3ID
first_param = "{\"ids\":\"[%d]\",\"br\":128000,\"csrf_token\":\"\"}" % int(music_id)
url = 'https://music.163.com/weapi/song/enhance/player/url?csrf_token='
params = get_params()
encSecKey = get_encSecKey()
"""
rsp:{
'data': [{
'gain': 2.3073,
'type': 'mp3',
'url': 'http://m10.music.126.net/20180111133509/24c79548414f7aa7407985818cb16a39/ymusic/333c/66b1/e5ec/
72aeb13aca24c989295e58e8384e3f97.mp3',
'md5': '72aeb13aca24c989295e58e8384e3f97',
'flag': 0, 'code': 200, 'payed': 0, 'id': 151619, 'expi': 1200, 'size': 3868307,
'uf': None, 'br': 128000, 'fee': 0, 'canExtend': False}], 'code': 200}
"""
rsp = get_json(url, params, encSecKey)
music_url = rsp[0].get('url')
if music_url:
music = requests.get(music_url)
name = sys.path[0] + "/mp3/%s.mp3" % toplistMP3Title
print(name)
with open(name, "wb") as code:
code.write(music.content)
# music_id = input('請輸入歌曲ID:')