1. 程式人生 > 其它 > 爬蟲 豆瓣音樂 top250

爬蟲 豆瓣音樂 top250

技術標籤:python爬蟲

爬取豆瓣音樂 Top 250 榜單,並將每張專輯的歌名、歌手、時間、型別與評分寫入 Excel 檔案(yinyue.xls)。

from urllib.request import Request, urlopen
import bs4
import requests
import re
import json
import xlwt

# Listing URL; the ``start`` query parameter selects the offset of the first
# entry on the page.
BASE_URL = 'https://music.douban.com/top250?start={}'
# A browser-like User-Agent is sent with every request.
HEADERS = {'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/84.0.4147.105 Safari/537.36'}
# NOTE(review): assumes the chart shows 25 entries per page — confirm
# against the live site before relying on the paging below.
PAGE_SIZE = 25
TOTAL_ITEMS = 250
# Header row of the sheet: name, singer, time, type, score.
COLUMN_LABELS = ('歌名', '歌手', '時間', '型別', '評分')
OUTPUT_FILE = 'yinyue.xls'


def clean_text(text):
    """Return *text* with leading/trailing whitespace removed and every
    internal run of whitespace (including newlines) collapsed to one space.
    """
    return ' '.join(text.split())


def split_info(info):
    """Split an info line into ``(singer, release, category)``.

    The line is split on ``'/ '`` (the separator the page text uses between
    fields) and every field is stripped.  The first field is the singer, the
    second the release time and the last one the category.  Fields that are
    missing come back as empty strings instead of raising ``IndexError``.
    """
    parts = [part.strip() for part in info.split('/ ')]
    singer = parts[0]
    if len(parts) < 2:
        return singer, '', ''
    return singer, parts[1], parts[-1]


def fetch_page(start):
    """Download the listing page beginning at offset *start* and parse it.

    Returns a ``bs4.BeautifulSoup`` tree.  The HTTP response is closed as
    soon as its body has been read.
    """
    request = Request(url=BASE_URL.format(start), headers=HEADERS)
    with urlopen(request) as response:
        return bs4.BeautifulSoup(response.read(), 'html.parser')


def parse_items(soup):
    """Extract one ``(name, singer, release, category, score)`` tuple per
    ``<div class="pl2">`` element found in *soup*.

    A sub-element that is absent yields an empty string for its column
    rather than an ``AttributeError``.
    """
    rows = []
    for item in soup.find_all('div', {'class': 'pl2'}):
        link = item.find('a')
        info = item.find('p')
        rating = item.find('span', {'class': 'rating_nums'})

        name = clean_text(link.get_text()) if link is not None else ''
        singer, release, category = split_info(
            info.get_text() if info is not None else ''
        )
        score = rating.get_text().strip() if rating is not None else ''
        rows.append((name, singer, release, category, score))
    return rows


def main():
    """Scrape every page of the chart and save the rows to ``yinyue.xls``."""
    workbook = xlwt.Workbook(encoding='utf-8')
    worksheet = workbook.add_sheet('sheet1', cell_overwrite_ok=True)
    for column, label in enumerate(COLUMN_LABELS):
        worksheet.write(0, column, label=label)

    row_index = 1  # row 0 holds the header
    # Walk every page offset instead of fetching only ``start=0``.
    for start in range(0, TOTAL_ITEMS, PAGE_SIZE):
        for row in parse_items(fetch_page(start)):
            for column, value in enumerate(row):
                worksheet.write(row_index, column, value)
            row_index += 1

    workbook.save(OUTPUT_FILE)


if __name__ == '__main__':
    main()