python爬虫 爬取mp3
import requests
from lxml import etree
import os
if __name__=='__main__':
if not os.path.exists('xiaofang'):
os.mkdir('xiaofang')
url='https://www.yespik.com/search-sound/77822.html'
headers = {
'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/96.0.4664.93 Safari/537.36'
}
resp = requests.get(url=url, headers=headers).text
# fp=open('a.html','w',encoding='utf-8')
# fp.write(resp)
# fp.close()
#数据解析
tree=etree.HTML(resp)
ul_list=tree.xpath('/html/body/div[4]/div[1]/div')
# print(ul_list)
for li in ul_list:
wang_url = li.xpath('div/div[3]/audio/source/@src')[0]
wang_url='http:'+ wang_url
print(wang_url)
name= li.xpath('div/div[2]/a/text()')[0]+'.mp3'
print(name)
data1 = requests.get(url=wang_url, headers=headers)
data2=data1.content
# # 压缩包路径
page3_path = 'xiaofang/' + name
with open(page3_path, mode='wb') as fp:
fp.write(data2)
print(name, "下载完成!!!")