mirror of
https://github.com/JefferyHcool/BiliNote.git
synced 2026-06-04 07:10:07 +08:00
- whisper: model.bin 截断/损坏时删目录重下重试一次,修「Unable to
open file model.bin」死循环;mlx 同样按 config.json 判完整性
- /generate_note 加就绪门禁:本地转写引擎模型没下好直接拦截,返回
reason=transcriber_model_not_ready,不让任务静默卡在首次下载
- 全局代理:新增 ProxyConfigManager(JSON 配置 + HTTP_PROXY env 兜底)
+ build_openai_client,统一注入代理到 LLM/Groq 客户端;yt-dlp 与
youtube-transcript-api 也走代理
- build_openai_client 校验 api_key 非空,空 key 给「xxx 的 API Key
未配置」而不是天书般的 Illegal header value b'Bearer '
- universal_gpt: 模型拒绝自定义 temperature(o1/o3/gpt-5 系列)时
就地去掉参数重试,不消耗重试预算
- connect_test 改用真实 chat completion 而非 /v1/models 探测
- main.py: lifespan 拆 [startup 1/5..5/5] 分段日志 + 异常清晰定位
- /sys_health 重构为结构化返回 {backend,ffmpeg,db,whisper_model}
Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
115 lines
4.2 KiB
Python
115 lines
4.2 KiB
Python
import json
|
||
import os
|
||
from pathlib import Path
|
||
from typing import Optional, Dict, Any
|
||
|
||
|
||
class TranscriberConfigManager:
|
||
"""管理转写器配置,存储在 JSON 文件中,支持前端动态修改。"""
|
||
|
||
def __init__(self, filepath: str = "config/transcriber.json"):
|
||
self.path = Path(filepath)
|
||
self.path.parent.mkdir(parents=True, exist_ok=True)
|
||
|
||
def _read(self) -> Dict[str, Any]:
|
||
if not self.path.exists():
|
||
return {}
|
||
try:
|
||
with self.path.open("r", encoding="utf-8") as f:
|
||
return json.load(f)
|
||
except Exception:
|
||
return {}
|
||
|
||
def _write(self, data: Dict[str, Any]):
|
||
with self.path.open("w", encoding="utf-8") as f:
|
||
json.dump(data, f, ensure_ascii=False, indent=2)
|
||
|
||
def get_config(self) -> Dict[str, Any]:
|
||
"""获取当前转写器配置,fallback 到环境变量默认值。
|
||
|
||
whisper 默认 size 从 'medium' (~1.5GB) 改为 'tiny' (~75MB):
|
||
新装用户没主动设置时不应该被首次下载卡住。想要更高精度可在「音频转写配置」
|
||
页主动切换。
|
||
"""
|
||
data = self._read()
|
||
return {
|
||
"transcriber_type": data.get(
|
||
"transcriber_type",
|
||
os.getenv("TRANSCRIBER_TYPE", "fast-whisper"),
|
||
),
|
||
"whisper_model_size": data.get(
|
||
"whisper_model_size",
|
||
os.getenv("WHISPER_MODEL_SIZE", "tiny"),
|
||
),
|
||
}
|
||
|
||
def update_config(
|
||
self,
|
||
transcriber_type: str,
|
||
whisper_model_size: Optional[str] = None,
|
||
) -> Dict[str, Any]:
|
||
"""更新转写器配置并持久化。"""
|
||
data = self._read()
|
||
data["transcriber_type"] = transcriber_type
|
||
if whisper_model_size is not None:
|
||
data["whisper_model_size"] = whisper_model_size
|
||
self._write(data)
|
||
return self.get_config()
|
||
|
||
def get_transcriber_type(self) -> str:
|
||
return self.get_config()["transcriber_type"]
|
||
|
||
def get_whisper_model_size(self) -> str:
|
||
return self.get_config()["whisper_model_size"]
|
||
|
||
def is_model_ready(self) -> Dict[str, Any]:
|
||
"""当前转写器是否就绪可用。
|
||
|
||
返回 {ready, transcriber_type, model_size, downloading, reason}:
|
||
- 在线引擎 (groq/bcut/kuaishou):永远 ready(不需要本地模型)
|
||
- fast-whisper:检查 whisper-{size}/model.bin 落盘
|
||
- mlx-whisper:检查 {repo_id}/config.json 落盘
|
||
给 /generate_note 入口做「开始视频前先确认模型下载好」的门禁用。
|
||
"""
|
||
cfg = self.get_config()
|
||
ttype = cfg["transcriber_type"]
|
||
size = cfg["whisper_model_size"]
|
||
result = {
|
||
"ready": True,
|
||
"transcriber_type": ttype,
|
||
"model_size": size,
|
||
"downloading": False,
|
||
"reason": "",
|
||
}
|
||
if ttype not in ("fast-whisper", "mlx-whisper"):
|
||
return result # 在线引擎无需本地模型
|
||
|
||
# 延迟 import 避免与 routers.config 的循环依赖;只取纯函数,不触发路由副作用
|
||
try:
|
||
from app.routers.config import (
|
||
_check_whisper_model_exists,
|
||
_check_mlx_whisper_model_exists,
|
||
_downloading,
|
||
)
|
||
except Exception as e:
|
||
# 拿不到检查函数时保守放行,不要把用户卡死
|
||
result["reason"] = f"无法检查模型状态: {e}"
|
||
return result
|
||
|
||
if ttype == "fast-whisper":
|
||
downloaded = _check_whisper_model_exists(size, "whisper")
|
||
downloading = _downloading.get(size) == "downloading"
|
||
else: # mlx-whisper
|
||
downloaded = _check_mlx_whisper_model_exists(size)
|
||
downloading = _downloading.get(f"mlx-{size}") == "downloading"
|
||
|
||
result["downloading"] = downloading
|
||
if downloaded:
|
||
return result
|
||
result["ready"] = False
|
||
result["reason"] = (
|
||
f"转写模型 {ttype} / {size} 尚未下载就绪"
|
||
+ (",正在下载中,请稍候" if downloading else ",请先在「设置 → 音频转写配置」页下载")
|
||
)
|
||
return result
|