使用BeautifulSoup4修改的百度新歌榜下载脚本


# Download every song listed on the Baidu "new songs" chart as an MP3 file
# into the current working directory, named "<song name>-<author>.mp3".
#
# NOTE: this script uses the Python 2 urllib API (urllib.urlopen and
# urllib.urlretrieve live at the top level of the module there).
#
# Snippet originally from http://byrx.net
import contextlib
import json
import sys
import urllib

from bs4 import BeautifulSoup

CHART_URL = 'http://music.baidu.com/top/new'
DOWNLOAD_PAGE_URL = 'http://music.baidu.com/song/%s/download'
# The href of the download anchor starts with this 22-character prefix;
# everything after it is passed to urlretrieve as the file URL.
DOWNLOAD_LINK_PREFIX = '/data/music/file?link='


def _fetch(url):
    """Return the raw body of *url*, closing the connection afterwards."""
    with contextlib.closing(urllib.urlopen(url)) as response:
        return response.read()


chart = BeautifulSoup(_fetch(CHART_URL))
for item in chart.select("#songListWrapper li"):
    # Each chart entry carries its metadata as JSON in a data attribute.
    song = json.loads(item['data-songitem'])['songItem']
    sid = song['sid']
    sname = song['sname']
    author = song['author']

    download_page = BeautifulSoup(_fetch(DOWNLOAD_PAGE_URL % str(sid)))
    anchors = download_page.select("a#download")
    href = anchors[0].get('href') if anchors else None
    if not href:
        # One song without a download link should not abort the whole run.
        sys.stderr.write(
            'no download link for song %s, skipping\n' % str(sid))
        continue

    # Strip the leading "/data/music/file?link=" to get the file URL.
    dlink = href[len(DOWNLOAD_LINK_PREFIX):]
    urllib.urlretrieve(dlink, sname + '-' + author + '.mp3')

评论关闭