Python 爬虫爬取豆瓣音乐 Top250

286 阅读1分钟

`

import requests
import re

# Browser-like User-Agent sent with every request.
headers = {
    'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/102.0.5005.63 Safari/537.36 Edg/102.0.1245.33'}

# The chart is requested in pages of 25 via the ``start`` query parameter;
# 250 entries means start = 0, 25, ..., 225.
PAGE_SIZE = 25
TOTAL_ENTRIES = 250

# Patterns are compiled once instead of on every page.
# Captures the field that precedes the last three "/"-separated fields of
# the <p class="pl"> line (presumably the release date -- confirm against
# the live markup).
_RELEASE_RE = re.compile(r'<p class="pl">.+/(.+)/.+/.+/.+</p>')
_RATING_RE = re.compile(r'<span class="rating_nums">(.+)</span>')
_VOTES_RE = re.compile(r'\w+人评价')
# Captures the part of the title attribute after the last "- " separator.
_TITLE_RE = re.compile(r'<a.+music_subject_search.+title=".+- (.+)".+>')


def parse_page(html):
    """Extract the chart entries found in one page of HTML.

    Args:
        html: Raw HTML text of a single chart page.

    Returns:
        A list of ``(released, rating, votes, title)`` string tuples, in
        page order. The four fields are matched independently and paired
        by position, so the result is truncated to the shortest match list
        rather than raising ``IndexError`` when a page yields fewer matches
        than expected. An empty or non-matching page gives ``[]``.
    """
    return list(zip(
        _RELEASE_RE.findall(html),
        _RATING_RE.findall(html),
        _VOTES_RE.findall(html),
        _TITLE_RE.findall(html),
    ))


def main():
    """Fetch every page of the chart and print each entry's details.

    Raises:
        requests.RequestException: If a request times out, fails, or the
            server answers with an HTTP error status.
    """
    for start in range(0, TOTAL_ENTRIES, PAGE_SIZE):
        url = f'https://music.douban.com/top250?start={start}'
        print(url)
        # A timeout keeps a stalled connection from hanging the script.
        response = requests.get(url, headers=headers, timeout=10)
        # Fail loudly on an error page instead of parsing it as chart data.
        response.raise_for_status()

        for released, rating, votes, title in parse_page(response.text):
            print('该歌曲时间为:' + released)
            print('该歌曲评价为:' + rating)
            print('评价人数为:' + votes)
            print('歌曲名称为:' + title)
            print('---------')


if __name__ == '__main__':
    main()

`