import requests,re,csv
# Script overview: download one Kugou rank page, pull the song entries out of
# the HTML with regular expressions, and write them to a CSV file.
#
# NOTE(review): this listing looks damaged. String literals are delimited with
# typographic quotes instead of ASCII quotes, the bodies of the `for` loop and
# the `with` block carry no indentation, and the three regex literals below are
# cut off mid-string. The original pattern text cannot be recovered from this
# file; restore it from the author's working copy before running.

# Address of the rank page that is fetched.
url = ‘https://www.kugou.com/yy/rank/home/1-6666.html?from=rank‘
# Request headers sent with the GET: a hard-coded cookie string, a referer and
# a desktop Chrome user-agent.
# NOTE(review): the referer names rank page 1-8888 while `url` requests 1-6666;
# confirm whether that difference is intentional.
headers = {
‘cookie’: ‘kg_mid=f1758fea893ad2cb5692e0594f568d24; kg_dfid=0R8fRo1RCwT4031R1L35tHo4; kg_dfid_collect=d41d8cd98f00b204e9800998ecf8427e; ACK_SERVER_10016=%7B%22list%22%3A%5B%5B%22bjreg-user.kugou.com%22%5D%5D%7D; ACK_SERVER_10017=%7B%22list%22%3A%5B%5B%22bjverifycode.service.kugou.com%22%5D%5D%7D; ACK_SERVER_10015=%7B%22list%22%3A%5B%5B%22bjlogin-user.kugou.com%22%5D%5D%7D; Hm_lvt_aedee6983d4cfc62f509129360d6bb3d=1645503860; kg_mid_temp=f1758fea893ad2cb5692e0594f568d24; Hm_lpvt_aedee6983d4cfc62f509129360d6bb3d=1645503922’,
‘referer’: ‘https://www.kugou.com/yy/rank/home/1-8888.html?from=rank‘,
‘user-agent’: ‘Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/98.0.4758.102 Safari/537.36’,
}
# Issue the GET request with the headers above and a proxy mapping.
# NOTE(review): the mapping only has an 'http' entry while `url` is https, so
# the proxy is presumably not applied to this request - confirm against the
# requests proxy documentation. No timeout is passed and the status code is
# not checked.
res = requests.get(url=url,headers=headers,proxies={‘http’:’http://111.59.199.58:8118'})
# Decode the raw response bytes as UTF-8 text.
html = res.content.decode(‘utf-8’)
# print(html)
# Pattern whose first capture group is meant to isolate the part of the page
# that holds the song list (it is passed to re.search below and group(1) is
# kept).
# NOTE(review): the literal is truncated and spills onto the following line;
# the original text is not visible here.
pattern = ‘.?
- (.?)
# Keep capture group 1 of the first match; re.S lets '.' span newlines.
# re.search returns None when nothing matches, in which case .group(1) raises
# AttributeError.
data = re.search(pattern=pattern,string=html,flags=re.S).group(1)
# print(data)
# Collect the per-song fragments into a list via re.findall.
# NOTE(review): the pattern literal and the rest of this call are cut off
# after the opening parenthesis.
li_list = re.findall(‘(
# print(li_list)
# Accumulates one dict per song for csv.DictWriter.
data_list = []
# For every fragment: match `data_pattern` from the start of the fragment and
# build a row from its capture groups.
# NOTE(review): the loop body below is not indented in this listing.
for li in li_list:
# print(li)
# NOTE(review): truncated literal; from its use below it must define at least
# three capture groups.
data_pattern = ‘.?
# Row layout: group(2) with all whitespace removed -> '歌名', group(3) -> '歌手',
# group(1) -> '详情链接'. The same re.match call is evaluated three times; a
# non-matching fragment makes re.match return None and .group raise
# AttributeError.
data_list.append({‘歌名’:re.sub(‘\s’,’’,re.match(pattern=data_pattern,string=li,flags=re.S).group(2)),’歌手’:re.match(pattern=data_pattern,string=li,flags=re.S).group(3),’详情链接’:re.match(pattern=data_pattern,string=li,flags=re.S).group(1)})
# Column names, in output order; they equal the keys of the row dicts above.
Csv_header = (‘歌名’,’歌手’,’详情链接’)
# Open the target CSV for writing; newline='' leaves line-ending handling to
# the csv module. No encoding is passed, so the platform default is used.
# NOTE(review): the path is a hard-coded Windows location written with
# backslashes in a non-raw string literal.
with open(‘D:\桌面\新建文件夹\酷狗飙升榜.csv’,’w’,newline=’’) as f:
# Write the header row followed by every collected song row.
# NOTE(review): these three statements are the `with` body but are not
# indented in this listing.
writer = csv.DictWriter(f,Csv_header)
writer.writeheader()
writer.writerows(data_list)
# Report completion on stdout.
print(“保存成功”)
