[已解决]程序报错，论坛的大佬的，复制了跑不出来

颂风侯 · 发表于 2024-10-11 12:44:36

马上注册，结交更多好友，享用更多功能^_^

您需要登录才可以下载或查看，没有账号？立即注册

x

import requests
import re
import json
import os
def get_name(singer):
    """Look up the QQ Music singer ``mid`` for a search keyword.

    Queries the ``client_search_cp`` search endpoint, unwraps the
    ``callback(...)`` envelope around the JSON payload and returns the
    ``mid`` of the first listed singer of the first song in the results.

    Args:
        singer: Search keyword, sent as the ``w`` query parameter.

    Returns:
        The ``mid`` value of the first singer of the first song hit.

    Raises:
        IndexError: If the response is not wrapped in ``callback(...)`` or
            the song list in the payload is empty.
    """
    url = 'https://c.y.qq.com/soso/fcgi-bin/client_search_cp'
    params = {
        'catZhida': '1',
        'w': singer,
    }
    headers = {
        'referer': 'https://y.qq.com/portal/search.html',
        'user-agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/66.0.3359.139 Safari/537.36'
    }
    html = requests.get(url, headers=headers, params=params).text

    # Raw string: a backslash-paren inside a normal string literal is an
    # invalid escape sequence and makes the interpreter emit a SyntaxWarning.
    matches = re.findall(r'callback\((.*)\)', html)
    if not matches:
        raise IndexError('search response is not wrapped in callback(...)')

    songs = json.loads(matches[0]).get('data').get('song').get('list')
    if not songs:
        raise IndexError('no songs found for %r' % (singer,))

    # Only the first hit is ever used, so there is no need to collect the
    # mid of every song before picking one.
    return songs[0].get('singer')[0].get('mid')
def get_html(name,singer):
    """Fetch the raw track-list response for one singer.

    Args:
        name: Singer ``mid``, sent as the ``singermid`` query parameter.
        singer: Not used by this function; kept so the call signature
            stays the same for existing callers.

    Returns:
        The response body as text, exactly as returned by the endpoint.
    """
    endpoint = 'https://c.y.qq.com/v8/fcg-bin/fcg_v8_singer_track_cp.fcg'
    # Ask for the first 30 tracks, ordered by the 'listen' key.
    query = {'singermid': name, 'order': 'listen', 'begin': '0', 'num': '30'}
    request_headers = {
        'referer': 'https://y.qq.com/n/yqq/singer/003aQYLo2x8izP.html',
        'user-agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/66.0.3359.139 Safari/537.36',
    }
    response = requests.get(endpoint, headers=request_headers, params=query)
    return response.text
def get_music(vkey,songname,filename,singer):
    """Download one track and store it as ``<singer>/<songname>.m4a``.

    Does nothing when ``vkey`` or ``songname`` is empty.

    Args:
        vkey: Access key appended to the stream URL.
        songname: Song title; used for the output file name and the
            progress line printed after saving.
        filename: Remote media file name placed in the stream URL path.
        singer: Name of the output directory (created when missing).

    Returns:
        None.
    """
    if not (vkey and songname):
        return

    url3 = 'http://dl.stream.qqmusic.qq.com/' + filename + '?vkey=' + vkey + '&guid=7133372870&uin=0&fromtag=66'
    headers = {
        'referer': 'https://y.qq.com/n/yqq/singer/003aQYLo2x8izP.html',
        'user-agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/66.0.3359.139 Safari/537.36'
    }
    music = requests.get(url3, headers=headers).content

    # exist_ok=True replaces the exists()/mkdir() pair, which could fail if
    # the directory appeared between the check and the creation.
    os.makedirs(singer, exist_ok=True)

    # Song titles can contain path separators or other characters that are
    # not allowed in file names; replace them so open() cannot fail or write
    # outside the singer directory.
    safe_name = re.sub(r'[\\/:*?"<>|]', '_', songname)
    with open(os.path.join(singer, safe_name + '.m4a'), 'wb') as f:
        f.write(music)
    print(songname,'__',singer)
def get_vkey(strMediaMid,songmid,songname,singer):
    """Request the ``vkey`` for one track and hand it to ``get_music``.

    Does nothing when any of ``strMediaMid``, ``songmid`` or ``songname``
    is empty.

    Args:
        strMediaMid: Media id; the remote file name is built as
            ``'C400' + strMediaMid + '.m4a'``.
        songmid: Song id, sent as the ``songmid`` query parameter.
        songname: Song title, passed through to ``get_music``.
        singer: Singer name, passed through to ``get_music``.

    Returns:
        None.

    Raises:
        IndexError: If the response is not wrapped in the expected
            callback call, or its ``items`` list is empty.
    """
    if not (strMediaMid and songmid and songname):
        return

    # Both values are needed in several places below; define them once so
    # the request parameters and the parsing/download code cannot drift.
    callback = 'MusicJsonCallback8571665793949388'
    filename = 'C400' + strMediaMid + '.m4a'

    url2 = 'https://c.y.qq.com/base/fcgi-bin/fcg_music_express_mobile3.fcg'
    params = {
        'g_tk': '5381',
        'jsonpCallback': callback,
        'loginUin': '0',
        'hostUin': '0',
        'format': 'json',
        'inCharset': 'utf8',
        'outCharset': 'utf-8',
        'notice': '0',
        'platform': 'yqq',
        'needNewCode': '0',
        'cid': '205361747',
        'callback': callback,
        'uin': '0',
        'songmid': songmid,
        'filename': filename,
        'guid': '7133372870'
    }
    headers = {
        'referer': 'https://y.qq.com/portal/player.html',
        'user-agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/66.0.3359.139 Safari/537.36'
    }
    detail_html = requests.get(url2, headers=headers, params=params).text

    # Raw string for the escaped parentheses: in a normal string literal the
    # backslash-paren is an invalid escape sequence (SyntaxWarning).
    pattern = re.escape(callback) + r'\((.*?)\)'
    vkey_disc = json.loads(re.findall(pattern, detail_html)[0])

    items = vkey_disc['data'].get('items')[0]
    get_music(items.get('vkey'), songname, filename, singer)
def get_list(detail_html,singer):
    """Extract the track list from a singer response and process each track.

    Does nothing when ``detail_html`` is empty.

    Args:
        detail_html: Raw response text containing a ``"list"`` JSON array
            followed by a ``"singer_id"`` key.
        singer: Singer name, forwarded to ``get_vkey`` for every track.

    Returns:
        None.
    """
    if not detail_html:
        return

    # Cut the JSON array out of the surrounding text, then decode it.
    list_pattern = re.compile('data":{"list":(.*?),"singer_id',re.S)
    raw_list = list_pattern.findall(detail_html)[0]

    for entry in json.loads(raw_list):
        music_data = entry.get('musicData')
        media_mid = music_data.get('strMediaMid')
        song_mid = music_data.get('songmid')
        title = music_data.get('songname')
        get_vkey(media_mid, song_mid, title, singer)
def main():
    """Prompt for a singer name and download that singer's track list."""
    singer = input('请输入您想要下载的歌手：')
    # Pipeline: keyword -> singer mid -> raw track list -> per-track download.
    get_list(get_html(get_name(singer), singer), singer)
# Start the downloader only when this file is run as a script, not on import.
if __name__ == '__main__':
    main()

复制代码

这段代码是从论坛大神那里复制的，但跑不出来。
报错如下：
D:\PYTHON_NEW\pack20240926\pythonProject1\.venv\Scripts\python.exe D:\PYTHON_NEW\pack20240926\pythonProject1\tkinter练习\爬虫测试\测试qq音乐爬虫.py
D:\PYTHON_NEW\pack20240926\pythonProject1\tkinter练习\爬虫测试\测试qq音乐爬虫.py:37: SyntaxWarning: invalid escape sequence '\('
  content = re.compile('callback\((.*)\)').findall(html)[0]
D:\PYTHON_NEW\pack20240926\pythonProject1\tkinter练习\爬虫测试\测试qq音乐爬虫.py:177: SyntaxWarning: invalid escape sequence '\('
  vkey_disc = re.compile('MusicJsonCallback8571665793949388\((.*?)\)').findall(detail_html)[0]

最佳答案

月排行榜 / 总排行榜

Stubborn

2024-10-14 18:01:24

爬虫是有时效性的。

出现这种报错，一般是网站返回的数据与预期不符，导致后续清洗数据时出错。

跳转到最佳答案楼层

Stubborn · 发表于 2024-10-14 18:01:24

这个最佳答案由 Stubborn 给出，感谢 Stubborn 的回答。

单击隐藏图章

爬虫是有时效性的。

出现这种报错，一般是网站返回的数据与预期不符，导致后续清洗数据时出错。

账号		自动登录	找回密码
密码			立即注册

[已解决]程序报错，论坛的大佬的，复制了跑不出来

马上注册，结交更多好友，享用更多功能^_^

浏览过的版块