You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.
102201518/爬取单个视频弹幕并以文档形式输出.py

16 lines
782 B

This file contains ambiguous Unicode characters!

This file contains ambiguous Unicode characters that may be confused with others in your current locale. If your use case is intentional and legitimate, you can safely ignore this warning. Use the Escape button to highlight these characters.

import requests#爬取网页源码
import re#对解析后的文件进行弹幕匹配
# Fetch the danmaku (bullet-comment) XML for a single video and append every
# comment to a text file, one comment per line, echoing each to stdout.
url = 'https://api.bilibili.com/x/v1/dm/list.so?oid=1663877514'
headers = {
    'user-agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/128.0.0.0 Safari/537.36 Edg/128.0.0.0'
}  # Send a browser-like User-Agent with the request.

# A timeout keeps the script from hanging forever on a stalled connection.
response = requests.get(url=url, headers=headers, timeout=10)
# Fail loudly on an HTTP error instead of parsing an error page as danmaku.
response.raise_for_status()
# Decode the body using the encoding detected from its content.
response.encoding = response.apparent_encoding
print(response.text)  # Dump the raw response for inspection.

# Each danmaku is the text of a <d p="...">...</d> element.
data_list = re.findall(r'<d p=".*?">(.*?)</d>', response.text)

# Open the output file once (append mode) rather than once per danmaku.
with open('弹幕.txt', mode='a', encoding='utf-8') as f:
    for index in data_list:
        f.write(index)
        f.write('\n')  # One danmaku per line.
        print(index)