Python 每日爬虫案例:某音乐网站(泡椒音乐)的搜索接口


import re
import sys

import requests
from lxml import etree


# Request headers sent with every call. The values mimic a desktop Chrome
# browser (see the user-agent string); presumably copied from a real browser
# session -- verify whether the site actually requires all of them.
headers = {
    "accept": "text/html,application/xhtml+xml,application/xml;q=0.9,image/avif,image/webp,image/apng,*/*;q=0.8,application/signed-exchange;v=b3;q=0.7",
    "accept-language": "zh-CN,zh;q=0.9",
    "cache-control": "no-cache",
    "pragma": "no-cache",
    "priority": "u=0, i",
    "sec-ch-ua": "\"Not;A=Brand\";v=\"99\", \"Google Chrome\";v=\"139\", \"Chromium\";v=\"139\"",
    "sec-ch-ua-mobile": "?0",
    "sec-ch-ua-platform": "\"Windows\"",
    "sec-fetch-dest": "document",
    "sec-fetch-mode": "navigate",
    "sec-fetch-site": "same-origin",
    "sec-fetch-user": "?1",
    "upgrade-insecure-requests": "1",
    "user-agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/139.0.0.0 Safari/537.36"
}
# Cookies sent with every request.
# NOTE(review): these look like captured session values and may expire --
# confirm whether the endpoints work without them.
cookies = {
    "Hm_tf_jfee1h5kk8a": "1754279868",
    "sl-session": "3Fl/W554pmgUv0WaqyjrLw==",
    "Hm_lvt_jfee1h5kk8a": "1754279868,1755653950",
    "Hm_lpvt_jfee1h5kk8a": "1755653950"
}

SEARCH_URL = "https://pjmp3.com/search.php"
SONG_URL = "https://pjmp3.com/song.php"

# Seconds to wait for the server before giving up; without a timeout a
# stalled connection would block the script indefinitely.
REQUEST_TIMEOUT = 10

# Patterns for the fields embedded in the song page, compiled once because
# they are reused for every song. Raw strings avoid invalid-escape warnings.
SONG_FIELD_PATTERNS = (
    re.compile(r"name: '(.*?)'"),
    re.compile(r"artist: '(.*?)'"),
    re.compile(r"url: '(.*?)'"),
)


def extract_song_id(href):
    """Return the text after the last ``=`` in *href* (the song id)."""
    return href.split("=")[-1]


def parse_song_page(page_text):
    """Extract ``(name, artist, audio_url)`` from a song page.

    For each field the last match in *page_text* is used. Returns ``None``
    when any of the three fields is missing, so callers can skip the song
    instead of failing on an empty match list.
    """
    values = []
    for pattern in SONG_FIELD_PATTERNS:
        matches = pattern.findall(page_text)
        if not matches:
            return None
        values.append(matches[-1])
    return tuple(values)


def search_song_links(keyword):
    """Query the search page for *keyword* and return the result hrefs.

    Raises ``requests.HTTPError`` if the search request itself fails.
    """
    response = requests.get(
        SEARCH_URL,
        headers=headers,
        cookies=cookies,
        params={"keyword": keyword},
        timeout=REQUEST_TIMEOUT,
    )
    response.raise_for_status()
    tree = etree.HTML(response.text)
    if tree is None:
        # Defensive: nothing parseable came back, so there are no results.
        return []
    return tree.xpath('//div[@class="search-result-list-content"]/a/@href')


def fetch_song(song_id):
    """Download the song page for *song_id* and parse its fields.

    Returns ``(name, artist, audio_url)`` or ``None`` if the page does not
    contain the expected fields.
    """
    response = requests.get(
        SONG_URL,
        headers=headers,
        cookies=cookies,
        params={"id": song_id},
        timeout=REQUEST_TIMEOUT,
    )
    return parse_song_page(response.text)


def main(keyword="方大同"):
    """Search for *keyword* and print name, artist and audio URL per song."""
    for href in search_song_links(keyword):
        song_id = extract_song_id(href)
        song = fetch_song(song_id)
        if song is None:
            # One malformed page should not abort the remaining results.
            print("skipping song id=%s: fields not found" % song_id,
                  file=sys.stderr)
            continue
        name, artist, audio = song
        print(name, artist, audio)


if __name__ == "__main__":
    main()

image

目标网址

posted @ 2025-08-20 09:46  我不是萧海哇~~~  阅读(32)  评论(0)    收藏  举报