1 Star 0 Fork 0

Jeremy / bilibili_wordcloud

加入 Gitee
与超过 1200万 开发者一起发现、参与优秀开源项目,私有仓库也完全免费 :)
免费加入
该仓库未声明开源许可证文件(LICENSE),使用请关注具体项目描述及其代码上游依赖。
克隆/下载
get_danmu.py 1.97 KB
一键复制 编辑 原始数据 按行查看 历史
yanjunjie 提交于 2020-05-02 19:19 . update
import html
import re
import sys
import traceback

import requests
def req_url(url, timeout=10):
    """Send a GET request with a desktop-browser User-Agent header.

    :param url: URL to request
    :param timeout: seconds to wait for the server before giving up;
        without one, ``requests`` may wait on a stalled server indefinitely
    :return: the ``requests.Response`` object, returned as-is (the HTTP
        status code is not checked here)
    :raises requests.exceptions.Timeout: if the server does not answer
        within ``timeout`` seconds
    """
    headers = {
        'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/80.0.3987.100 Safari/537.36',
    }
    return requests.get(url, headers=headers, timeout=timeout)
# 根据BV号获取CID
def get_cid(number):
    """Look up the CIDs that belong to a Bilibili video.

    :param number: BV id of the video
    :return: list holding the ``cid`` value of every entry under ``data``
        in the pagelist API response, in response order
    """
    pagelist_url = f'https://api.bilibili.com/x/player/pagelist?bvid={number}&jsonp=jsonp'
    payload = req_url(pagelist_url).json()
    return [page['cid'] for page in payload['data']]
# 根据CID获取弹幕
def get_danmu_by_cid(cid_list):
    """Download the danmu (bullet comments) for each CID.

    :param cid_list: iterable of CIDs, e.g. as returned by ``get_cid``
    :return: list with one entry per CID, in input order; each entry is
        the list of danmu texts extracted from that CID's response
    """
    # Compiled once, outside the loop: the pattern is the same for every CID.
    pattern = re.compile(r'<d.*?>(.*?)</d>')
    all_danmu_list = []
    for cid in cid_list:
        url = f'https://api.bilibili.com/x/v1/dm/list.so?oid={cid}'
        res_xml = req_url(url).content.decode(encoding='utf8')
        # The response is treated as XML, where characters such as & and <
        # are carried as entities (&amp;, &lt;); decode them so the saved
        # text contains the characters the viewer actually typed.
        all_danmu_list.append(
            [html.unescape(text) for text in pattern.findall(res_xml)]
        )
    return all_danmu_list
# 保存弹幕
def save_danmu_to_file(all_danmu_list, bv):
    """Write every danmu to ``<bv>.txt``, one per line, and print the total.

    :param all_danmu_list: iterable of lists of danmu strings
    :param bv: used as the output file name without the ``.txt`` suffix;
        an existing file with that name is overwritten
    :return: None
    """
    written = 0
    with open(f'{bv}.txt', mode='w', encoding='utf8') as out:
        for batch in all_danmu_list:
            for text in batch:
                out.write(text + '\n')
                written += 1
    print(f'获取到弹幕{written}条')
def main(bv_number):
    """Fetch every danmu of a video and save them to ``<BV id>.txt``.

    Exceptions raised while downloading or saving are caught here and
    their traceback is printed instead of propagating.

    :param bv_number: BV id of the video as a string; surrounding
        whitespace is ignored
    :return: None
    :raises SystemExit: with status 1 when ``bv_number`` is not a string
        or is blank
    """
    if not isinstance(bv_number, str):
        print('格式有误')
        sys.exit(1)

    # Input typed at a prompt often carries stray spaces; they would end up
    # in both the API query and the output file name.
    bv_number = bv_number.strip()
    if not bv_number:
        print('输入为空')
        sys.exit(1)

    try:
        cid_list = get_cid(bv_number)
        all_danmu_list = get_danmu_by_cid(cid_list)
        save_danmu_to_file(all_danmu_list, bv_number)
    except Exception:
        # Top-level boundary: report the failure rather than crash.
        print(traceback.format_exc())
if __name__ == '__main__':
    # The value is sent to the API as a BV id (bvid=...), so the prompt
    # shows the BV format rather than the older av format.
    bv = input('请输入要查询弹幕列表的BV号,格式:BVXXXXXXXXXX:')
    main(bv)
Python
1
https://gitee.com/HashJeremy/bilibili_wordcloud.git
git@gitee.com:HashJeremy/bilibili_wordcloud.git
HashJeremy
bilibili_wordcloud
bilibili_wordcloud
master

搜索帮助