写了一个下载 bilibili 字幕的脚本, 分享一下 ...

作者：master9 发布时间：2024-4-17 21:14:51

想下载一个视频教程,发现字幕没有下载. 网上也没有工具,就自己写了一个
[Python] 纯文本查看复制代码
"""下载哔哩哔哩字幕
"""
import math
import os
import time
import requests
import json
def _format_srt_timestamp(total_ms):
    """Render a millisecond count as an SRT ``HH:MM:SS,mmm`` timestamp."""
    total_ms = max(0, int(total_ms))
    seconds, millis = divmod(total_ms, 1000)
    minutes, seconds = divmod(seconds, 60)
    hours, minutes = divmod(minutes, 60)
    return f'{hours:02d}:{minutes:02d}:{seconds:02d},{millis:03d}'


def convert_json_to_srt(json_files_path):
    """Convert every JSON subtitle file in a directory to SRT.

    Each ``*.json`` file directly inside ``json_files_path`` is read as a
    document with a ``body`` list whose items carry ``from`` / ``to`` (seconds,
    possibly fractional) and ``content`` (the subtitle text).  The converted
    file is written to ``<json_files_path>/srt/<same base name>.srt``.

    Adapted from https://www.jianshu.com/p/66450e9554f8

    Args:
        json_files_path: Directory containing the JSON subtitle files.

    Raises:
        KeyError: If a JSON file lacks ``body`` or a cue lacks ``from``,
            ``to`` or ``content``.
    """
    srt_files_path = os.path.join(json_files_path, 'srt')
    os.makedirs(srt_files_path, exist_ok=True)

    for json_file in sorted(os.listdir(json_files_path)):
        source_path = os.path.join(json_files_path, json_file)
        # The listing also contains the ``srt`` output directory and possibly
        # unrelated files; only regular ``.json`` files are subtitle inputs.
        if not json_file.lower().endswith('.json'):
            continue
        if not os.path.isfile(source_path):
            continue

        # Explicit utf-8 so non-ASCII subtitle text is decoded correctly
        # regardless of the platform default encoding.
        with open(source_path, encoding='utf-8') as f:
            datas = json.load(f)

        entries = []
        for index, data in enumerate(datas['body'], start=1):
            start_ms = round(data['from'] * 1000)
            # End each cue 1 ms early so it does not overlap a following cue
            # that starts at the same instant, but never before its own start.
            stop_ms = max(start_ms, round(data['to'] * 1000) - 1)
            entries.append(
                f'{index}\n'
                f'{_format_srt_timestamp(start_ms)} --> '
                f'{_format_srt_timestamp(stop_ms)}\n'
                f"{data['content']}\n\n"
            )

        # Swap only the extension; the rest of the name is kept untouched.
        file_name = os.path.splitext(json_file)[0] + '.srt'
        with open(os.path.join(srt_files_path, file_name), 'w', encoding='utf-8') as f:
            f.write(''.join(entries))
def _safe_filename(name, fallback):
    """Replace characters that are invalid in file names; use fallback if empty."""
    cleaned = ''.join('_' if ch in '\\/:*?"<>|' else ch for ch in name).strip()
    return cleaned or str(fallback)


def download_subtitle_json(bvid: str):
    """Download the first subtitle track of every part of a Bilibili video.

    The video page is fetched to read the ``aid``, the part list is fetched to
    get each part's ``cid`` and title, and for every part that reports
    subtitles the first one is saved as ``./<bvid>/<part title>.json``.
    Failures are reported with ``print`` and the affected step is skipped.

    Args:
        bvid: The video's BV id, e.g. ``'BV1s8411v7nE'``.
    """
    sub_dir = f'./{bvid}'
    os.makedirs(sub_dir, exist_ok=True)

    headers = {
        'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64; rv:125.0) Gecko/20100101 Firefox/125.0',
        'Accept': 'application/json, text/plain, */*',
        'Accept-Language': 'en-US,en;q=0.5',
        # 'Accept-Encoding': 'gzip, deflate, br',
        'Referer': f'https://www.bilibili.com/video/{bvid}/?p=1',
        'Origin': 'https://www.bilibili.com',
        'Connection': 'keep-alive',
        # TODO: paste your own cookie here (copy it from the browser's
        # Network tab).
        'Cookie': "",
        'Sec-Fetch-Dest': 'empty',
        'Sec-Fetch-Mode': 'cors',
        'Sec-Fetch-Site': 'same-site',
    }
    # Without a timeout a stalled connection would block the script forever.
    timeout = 10

    # The aid is scraped from the first '"aid":<value>,' occurrence in the
    # video page HTML.
    resp = requests.get(f'https://www.bilibili.com/video/{bvid}/', headers=headers, timeout=timeout)
    text = resp.text
    marker_pos = text.find('"aid"')
    if marker_pos == -1:
        print('获取 aid 失败')
        return
    aid = text[marker_pos + 6:].partition(',')[0].strip()

    # https, so the Cookie header is not sent in clear text.
    cid_back = requests.get(
        f'https://api.bilibili.com/x/player/pagelist?bvid={bvid}',
        headers=headers,
        timeout=timeout,
    )
    if cid_back.status_code != 200:
        print('获取 playlist 失败')
        return
    pages = json.loads(cid_back.content).get('data')
    if not pages:
        print('获取 playlist 失败')
        return

    for item in pages:
        cid = item['cid']
        # Part titles are free text and may contain path separators.
        title = _safe_filename(item['part'], cid) + '.json'
        params = {
            'aid': aid,
            'cid': cid,
            'isGaiaAvoided': 'false',
            'web_location': '1315873',
            # NOTE(review): w_rid is a fixed value while wts changes on every
            # call; if the server validates the signature against wts this
            # needs to be computed per request - confirm.
            'w_rid': '364cdf378b75ef6a0cee77484ce29dbb',
            'wts': int(time.time()),
        }
        wbi_resp = requests.get(
            'https://api.bilibili.com/x/player/wbi/v2',
            params=params,
            headers=headers,
            timeout=timeout,
        )
        if wbi_resp.status_code != 200:
            print('获取字幕链接失败')
            continue

        player_data = wbi_resp.json().get('data') or {}
        subtitle_links = (player_data.get('subtitle') or {}).get('subtitles')
        if not subtitle_links:
            continue

        # Only the first listed subtitle track is downloaded.
        subtitle_url = subtitle_links[0].get('subtitle_url')
        if not subtitle_url:
            print('获取字幕链接失败')
            continue
        # The original code assumed scheme-less URLs and always prefixed
        # 'https:'; skip the prefix if a scheme is already present.
        if not subtitle_url.startswith(('http://', 'https://')):
            subtitle_url = 'https:' + subtitle_url

        subtitle_resp = requests.get(subtitle_url, headers=headers, timeout=timeout)
        if subtitle_resp.status_code != 200:
            print('获取字幕链接失败')
            continue
        with open(os.path.join(sub_dir, title), 'w', encoding='utf-8') as f:
            f.write(subtitle_resp.text)
if __name__ == '__main__':
    # TODO: set this to the BV id of the video to download, i.e. the last
    # path segment of https://www.bilibili.com/video/<bvid>
    BVID = 'BV1s8411v7nE'
    download_subtitle_json(BVID)
    # Optional: uncomment to also convert the downloaded JSON files to SRT.
    # convert_json_to_srt(f'./{BVID}')

字幕, 写了

写了一个下载 bilibili 字幕的脚本, 分享一下

相关帖子

热门主题

最近收BA的人很多交易了要立刻取消BA 教训

刚看了一个视频，让我又清醒了一下

小小农民新开中转站，欢迎来踩

港版安卓机是满血的国际版安卓机吗？

我 ThreeJSON 又回来了： V 友们批评得对！

继之前 5.4 的 “收口”之后， 5.6 Sol 好

折腾 homelab 挺长时间了建了一个群想不

codex 打开风扇狂转怎么办

Vibe 的一个中文起名小工具

你们明天要去看周星驰的电影么？

热门板块

公告

网站帮助 - Yoo趣儿

我们的愿景

在 Yoo趣儿投放广告

Yoo趣儿网站用户应遵守规则