当前位置: 首页 > 工具软件 > 163music > 使用案例 >

PHP爬虫音乐缓存,爬取网易云音乐热评[附上音乐下载]

楮乐邦
2023-12-01

[Python] 纯文本查看 复制代码import requests

import time,os

from bs4 import BeautifulSoup

class Music_down:

def __init__(self):

self.headers = {

"User-Agent": "Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/73.0.3683.86 Safari/537.36",

}

self.url = "http://music.163.com/song/media/outer/url?id="

def get_name_byId(self, id):

base_url = "https://music.163.com/song?id={}".format(id)

response = requests.get(base_url, headers=self.headers)

html = BeautifulSoup(response.text, 'lxml')

self.name = html.select('.f-ff2')[0].text

response.close()

self.download(self.name,id)

def download(self, name, id):

#这里出现了下载错误 关于歌的名字问题 不能存在/

# name = name.replace('\xa0', '')

name = name.replace('/', '')

# name = "".join(name.split().remove(" "))

if not os.path.exists('./music'):

os.mkdir('./music')

print("music文件夹创建成功,在当前目录下")

res = requests.get(self.url + id, headers=self.headers)

with open('./music/'+name+'.mp3', 'ab+') as f:

f.write(res.content)

print("*********"+name+"*****下载完成")

def get_music_id(self, urls):

try:

html = requests.get(urls,headers=self.headers).text

except:

print("请输入正确的网址!!!")

return

text = BeautifulSoup(html, 'lxml')

ids = text.select('.f-hide li a')

print("总共%d个文件" % len(ids))

for id in ids:

music_id = id.get('href').split('=')[1]

name = id.text

self.download(name, music_id)

time.sleep(1)

if __name__ == '__main__':

music = Music_down()

while True:

print("""

网易云获取热评:

1. 通过歌曲的id

2. 通过歌单的连接

0. 退出

""")

number = 0

try:

number = int(input("请输入: "))

except:

input("请输入数字")

if number == 2:

song_url = input("请输入歌单的网址: ")

song_url = song_url.replace('/#','')

# print(song_url)

music.get_music_id(song_url)

elif number == 1:

id = input("请输入歌曲的id: ")

music.get_name_byId(id)

elif number == 0:

exit()

else:

print("没有该选项")

 类似资料: