mirror of
https://github.com/JefferyHcool/BiliNote.git
synced 2026-05-11 18:10:06 +08:00
### v1.1.0 - #### Added - 新增 AI 笔记风格选择 - 新增 AI 笔记返回格式选择 - 添加 AI 自定义笔记备注 Prompt - 添加任务失败重试 - 添加全局设置页,可在设置页进行模型设置 - #### Optimize - 优化前端样式,优化用户体验 - 增加生成中间产物,可用于失败后加快生成速度 - #### Fix - 修复视频截图视频过早删除错误
115 lines
3.9 KiB
Python
115 lines
3.9 KiB
Python
import requests
|
||
import logging
|
||
import os
|
||
from typing import Union, List, Dict, Optional
|
||
|
||
from app.decorators.timeit import timeit
|
||
from app.models.transcriber_model import TranscriptSegment, TranscriptResult
|
||
from app.transcriber.base import Transcriber
|
||
from app.utils.logger import get_logger
|
||
from events import transcription_finished
|
||
|
||
logger = get_logger(__name__)
|
||
|
||
class KuaishouTranscriber(Transcriber):
|
||
"""快手语音识别实现"""
|
||
|
||
API_URL = "https://ai.kuaishou.com/api/effects/subtitle_generate"
|
||
|
||
def __init__(self):
|
||
pass
|
||
|
||
def _load_file(self, file_path: str) -> bytes:
|
||
"""读取文件内容"""
|
||
with open(file_path, 'rb') as f:
|
||
return f.read()
|
||
|
||
def _submit(self, file_path: str) -> dict:
|
||
"""提交识别请求"""
|
||
try:
|
||
file_binary = self._load_file(file_path)
|
||
|
||
payload = {
|
||
"typeId": "1"
|
||
}
|
||
|
||
# 使用文件名作为上传文件名
|
||
file_name = os.path.basename(file_path)
|
||
files = [('file', (file_name, file_binary, 'audio/mpeg'))]
|
||
|
||
logger.info(f"开始向快手API提交请求,文件: {file_name}")
|
||
response = requests.post(self.API_URL, data=payload, files=files, timeout=300)
|
||
response.raise_for_status() # 检查HTTP错误
|
||
|
||
result = response.json()
|
||
print('result',result)
|
||
# 检查快手API返回是否包含错误
|
||
if "data" not in result or result.get("code", 0) != 0:
|
||
error_msg = f"快手API返回错误: {result.get('message', '未知错误')}"
|
||
logger.error(error_msg)
|
||
raise Exception(error_msg)
|
||
|
||
return result
|
||
|
||
except requests.exceptions.RequestException as e:
|
||
error_msg = f"快手ASR请求网络错误: {str(e)}"
|
||
logger.error(error_msg)
|
||
raise
|
||
except Exception as e:
|
||
error_msg = f"快手ASR请求处理错误: {str(e)}"
|
||
logger.error(error_msg)
|
||
raise
|
||
|
||
@timeit
|
||
def transcript(self, file_path: str) -> TranscriptResult:
|
||
"""执行转录过程,符合 Transcriber 接口"""
|
||
try:
|
||
logger.info(f"开始处理文件: {file_path}")
|
||
|
||
# 提交请求并获取结果
|
||
logger.info("向快手API提交识别请求...")
|
||
result_data = self._submit(file_path)
|
||
|
||
logger.info("请求成功,处理结果...")
|
||
|
||
# 提取分段数据
|
||
segments = []
|
||
full_text = ""
|
||
|
||
# 解析快手API返回的文本段
|
||
texts = result_data.get('data', {}).get('text', [])
|
||
for u in texts:
|
||
text = u.get('text', '').strip()
|
||
start_time = float(u.get('start_time', 0))
|
||
end_time = float(u.get('end_time', 0))
|
||
|
||
full_text += text + " "
|
||
segments.append(TranscriptSegment(
|
||
start=start_time,
|
||
end=end_time,
|
||
text=text
|
||
))
|
||
|
||
# 创建结果对象
|
||
result = TranscriptResult(
|
||
language="zh", # 快手API可能不返回语言信息,默认为中文
|
||
full_text=full_text.strip(),
|
||
segments=segments,
|
||
raw=result_data
|
||
)
|
||
|
||
# 触发完成事件
|
||
# self.on_finish(file_path, result)
|
||
|
||
return result
|
||
|
||
except Exception as e:
|
||
logger.error(f"快手ASR处理失败: {str(e)}")
|
||
raise
|
||
|
||
def on_finish(self, video_path: str, result: TranscriptResult) -> None:
|
||
"""转录完成的回调"""
|
||
logger.info(f"快手ASR转写完成: {video_path}")
|
||
transcription_finished.send({
|
||
"file_path": video_path,
|
||
}) |