Python学习之路-网易云音乐评论爬取-工具盒子

爬取指定歌单内所有歌曲的热评。代码写得比较粗糙, 暂时不打算修改。
import csv
import json
import time
import urllib.request
code = 'utf-8'  # Text encoding passed to http_r()/getContent() to decode every HTTP response body
def http_r(url, c):
    """Fetch *url* with a browser-like User-Agent and return the decoded body.

    Args:
        url: Absolute URL to request.
        c: Name of the text encoding used to decode the response bytes.

    Returns:
        The response body decoded to ``str``.

    Raises:
        urllib.error.URLError: Propagated from ``urlopen`` when the request
            fails.
        UnicodeDecodeError: If the body cannot be decoded with *c*.
    """
    # Set the User-Agent header so the request looks like a desktop browser.
    headers = {
        'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) '
                      'Chrome/90.0.4430.212 Safari/537.36'
    }
    request = urllib.request.Request(url=url, headers=headers)
    # The context manager closes the connection even if read()/decode() raises.
    with urllib.request.urlopen(request) as response:
        return response.read().decode(c)
def getUrls(playListID):
    """Return the song IDs contained in a playlist.

    The playlist is fetched from the third-party API, whose response is
    iterated as a JSON list of entries that each carry a ``url`` field.
    The song ID is what remains after stripping the fixed
    ``...?type=url&id=`` prefix from that field.

    Args:
        playListID: Playlist ID as a string (it is concatenated into the URL).

    Returns:
        A list of song-ID strings, in playlist order.
    """
    # These literals must contain a plain '&'. An HTML-escaped '&amp;' would
    # corrupt the query string and prevent the prefix from matching.
    playlist_url = 'https://api.fczbl.vip/163/?type=playlist&id=' + playListID
    song_url_prefix = 'https://api.fczbl.vip/163/?type=url&id='

    print('开始获取歌曲列表')
    playlist = json.loads(http_r(playlist_url, code))
    s = [entry['url'].replace(song_url_prefix, '') for entry in playlist]
    print('已获取 ' + str(len(s)) + ' 首歌曲')
    return s
def _response_failed(body):
    """Return True when *body* is not a JSON object or reports a negative ``code``."""
    if not body.startswith('{'):
        return True
    try:
        payload = json.loads(body)
    except ValueError:  # json.JSONDecodeError is a ValueError subclass
        return True
    status = payload.get("code", 0)  # a missing "code" is treated as success
    return isinstance(status, (int, float)) and status < 0


def getContent(url, c, max_retries=3):
    """Fetch *url* and retry while the response looks like a failure.

    A response counts as failed when it is not a JSON object, or when it is
    one whose ``code`` field is negative. The check combines the two
    conditions with OR: combining them with AND would parse non-JSON bodies
    (and crash) and would never retry a JSON body with a negative code.

    Args:
        url: URL to request.
        c: Text encoding used to decode the response.
        max_retries: Maximum number of extra attempts after the first one.
            ``None`` retries without limit.

    Returns:
        The last response body as ``str``. After the retries are exhausted
        this may still be a failed response, so the caller must be ready for
        parsing to fail.
    """
    back = http_r(url, c)
    attempts = 0
    while _response_failed(back) and (max_retries is None or attempts < max_retries):
        print('获取失败, 重试中')
        time.sleep(1)  # brief pause before retrying
        back = http_r(url, c)
        attempts += 1
    return back
def getComment(urls):
    """Fetch details and hot comments for every song ID and save them to CSV.

    For each ID this requests the song details from the third-party API and
    the comment list from the NetEase Cloud Music comment API, extracts the
    ``hotComments`` entries, and hands the result to ``writeOut``. The CSV
    file is recreated (with its header row) via ``newCsv`` before the loop.

    Args:
        urls: Sequence of song-ID strings (each is concatenated into URLs).
    """
    n = str(len(urls))
    url_1 = 'https://api.fczbl.vip/163/?type=single&id='  # third-party API (song details)
    url_2 = 'https://music.163.com/api/v1/resource/comments/R_SO_4_'  # NetEase Cloud Music comment API
    print("开始获取歌曲详情")
    newCsv()
    for i, mID in enumerate(urls, start=1):
        prefix = mID + ' (' + str(i) + '/' + n + '): '  # progress tag shared by every log line

        print(prefix + '正在获取歌曲详情')
        info_m = json.loads(getContent(url_1 + mID, code))

        print(prefix + '正在获取评论列表')
        raw_comments = getContent(url_2 + mID, code)
        try:
            hotCommentsList = json.loads(raw_comments)["hotComments"]  # hot-comment list
        except (ValueError, KeyError, TypeError):
            # Invalid JSON, a missing "hotComments" key, or a non-object payload:
            # skip this song rather than abort the whole run.
            print(prefix + '获取失败已跳过')
            continue
        print(prefix + '已获取到 ' + str(len(hotCommentsList)) + ' 条热评')

        print(prefix + '正在解析热评列表')
        # Keyed by nickname, so a later comment from the same nickname
        # replaces an earlier one.
        hotComments = {val["user"]["nickname"]: val["content"] for val in hotCommentsList}

        info = {"title": info_m["name"], "author": info_m["artist"], "comment": hotComments}
        print(prefix + str(info))
        writeOut(info)
        time.sleep(2)  # pause between songs to avoid hammering the APIs


def writeOut(info):
    """Append one song's hot comments to ``infos.csv`` in the working directory.

    One row is written per comment: song title, song author, commenter
    nickname, comment text.

    Args:
        info: Dict with keys ``'title'``, ``'author'`` and ``'comment'``,
            where ``'comment'`` maps commenter nickname to comment text.
    """
    name = info['title']
    author = info['author']
    commentList = info['comment']
    # newline='' is required by the csv module: it lets the writer control
    # line endings, avoiding blank rows on Windows and keeping embedded
    # newlines inside quoted fields intact.
    with open('infos.csv', 'a', encoding='utf-8', newline='') as file_obj:
        f_csv = csv.writer(file_obj)
        for key in commentList:
            f_csv.writerow([name, author, key, commentList[key]])

def newCsv():
    """Create (or truncate) ``infos.csv`` and write the header row.

    The header columns are: song title, song author, commenter, comment.
    """
    # newline='' lets the csv writer control line endings, as the csv module
    # requires; without it Windows output gets an extra blank line per row.
    with open('infos.csv', 'w', encoding='utf-8', newline='') as f:
        f_csv = csv.writer(f)
        f_csv.writerow(['歌曲名', '歌曲作者', '评论者', '评论'])
# Script entry: collect the song IDs of the playlist, then scrape their hot comments.
musicIDList = getUrls("926056136")  # playlist ID
getComment(musicIDList)
51工具盒子

Python学习之路-网易云音乐评论爬取

设置UA

厉飞雨

相关推荐

最新文章

猜你喜欢

快捷分类