From f4801d5be7238537dd84ba103dca605ac02d09c3 Mon Sep 17 00:00:00 2001 From: huangjianwu Date: Mon, 23 Mar 2026 17:31:30 +0800 Subject: [PATCH 1/2] =?UTF-8?q?feat(youtube):=20=E4=BD=BF=E7=94=A8=20youtu?= =?UTF-8?q?be-transcript-api=20=E4=BC=98=E5=85=88=E8=8E=B7=E5=8F=96?= =?UTF-8?q?=E5=AD=97=E5=B9=95=EF=BC=8C=E6=9C=89=E5=AD=97=E5=B9=95=E6=97=B6?= =?UTF-8?q?=E8=B7=B3=E8=BF=87=E9=9F=B3=E9=A2=91=E4=B8=8B=E8=BD=BD?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit - 新增 YouTubeSubtitleFetcher 模块,通过 youtube-transcript-api 获取字幕 - 重构笔记生成流程:缓存 → 平台字幕 → 按需下载 → 转写 fallback - 有字幕时仅提取视频元信息,不下载音视频文件 - 添加 youtube-transcript-api 依赖 Co-Authored-By: Claude Opus 4.6 --- backend/app/downloaders/base.py | 3 +- backend/app/downloaders/youtube_downloader.py | 134 +++--------------- backend/app/downloaders/youtube_subtitle.py | 98 +++++++++++++ backend/app/services/note.py | 105 ++++++++++---- backend/requirements.txt | 1 + 5 files changed, 203 insertions(+), 138 deletions(-) create mode 100644 backend/app/downloaders/youtube_subtitle.py diff --git a/backend/app/downloaders/base.py b/backend/app/downloaders/base.py index a4dfb07..d1e71ad 100644 --- a/backend/app/downloaders/base.py +++ b/backend/app/downloaders/base.py @@ -22,7 +22,8 @@ class Downloader(ABC): @abstractmethod def download(self, video_url: str, output_dir: str = None, - quality: DownloadQuality = "fast", need_video: Optional[bool] = False) -> AudioDownloadResult: + quality: DownloadQuality = "fast", need_video: Optional[bool] = False, + skip_download: bool = False) -> AudioDownloadResult: ''' :param need_video: diff --git a/backend/app/downloaders/youtube_downloader.py b/backend/app/downloaders/youtube_downloader.py index 2a081bb..bb8ed8a 100644 --- a/backend/app/downloaders/youtube_downloader.py +++ b/backend/app/downloaders/youtube_downloader.py @@ -1,5 +1,4 @@ import os -import json import logging from abc import ABC from typing import Union, Optional, List @@ -7,8 +6,9 @@ from typing import Union, Optional, List import yt_dlp from app.downloaders.base import Downloader, DownloadQuality +from app.downloaders.youtube_subtitle import YouTubeSubtitleFetcher from app.models.notes_model import AudioDownloadResult -from app.models.transcriber_model import TranscriptResult, TranscriptSegment +from app.models.transcriber_model import TranscriptResult from app.utils.path_helper import get_data_dir from app.utils.url_parser import extract_video_id @@ -25,12 +25,13 @@ class YoutubeDownloader(Downloader, ABC): video_url: str, output_dir: Union[str, None] = None, quality: DownloadQuality = "fast", - need_video:Optional[bool]=False + need_video: Optional[bool] = False, + skip_download: bool = False, ) -> AudioDownloadResult: if output_dir is None: output_dir = get_data_dir() if not output_dir: - output_dir=self.cache_data + output_dir = self.cache_data os.makedirs(output_dir, exist_ok=True) output_path = os.path.join(output_dir, "%(id)s.%(ext)s") @@ -42,15 +43,17 @@ class YoutubeDownloader(Downloader, ABC): 'quiet': False, } + if skip_download: + ydl_opts['skip_download'] = True + with yt_dlp.YoutubeDL(ydl_opts) as ydl: - info = ydl.extract_info(video_url, download=True) + info = ydl.extract_info(video_url, download=not skip_download) video_id = info.get("id") title = info.get("title") duration = info.get("duration", 0) cover_url = info.get("thumbnail") - ext = info.get("ext", "m4a") # 兜底用 m4a + ext = info.get("ext", "m4a") audio_path = os.path.join(output_dir, f"{video_id}.{ext}") - print('os.path.join(output_dir, f"{video_id}.{ext}")',os.path.join(output_dir, f"{video_id}.{ext}")) return AudioDownloadResult( file_path=audio_path, @@ -59,8 +62,8 @@ class YoutubeDownloader(Downloader, ABC): cover_url=cover_url, platform="youtube", video_id=video_id, - raw_info={'tags':info.get('tags')}, #全部返回会报错 - video_path=None # ❗音频下载不包含视频路径 + raw_info={'tags': info.get('tags')}, + video_path=None, ) def download_video( @@ -101,115 +104,20 @@ class YoutubeDownloader(Downloader, ABC): def download_subtitles(self, video_url: str, output_dir: str = None, langs: List[str] = None) -> Optional[TranscriptResult]: """ - 尝试获取YouTube视频字幕(优先人工字幕,其次自动生成) + 通过 YouTube InnerTube API 直接获取字幕(优先人工字幕,其次自动生成)。 + 比 yt_dlp 方式更轻量,无需写临时文件到磁盘。 :param video_url: 视频链接 - :param output_dir: 输出路径 + :param output_dir: 未使用(保留接口兼容) :param langs: 优先语言列表 :return: TranscriptResult 或 None """ - if output_dir is None: - output_dir = get_data_dir() - if not output_dir: - output_dir = self.cache_data - os.makedirs(output_dir, exist_ok=True) - if langs is None: - langs = ['zh-Hans', 'zh', 'zh-CN', 'zh-TW', 'en', 'en-US'] + langs = ['zh-Hans', 'zh', 'zh-CN', 'zh-TW', 'en', 'en-US', 'ja'] video_id = extract_video_id(video_url, "youtube") - - ydl_opts = { - 'writesubtitles': True, - 'writeautomaticsub': True, - 'subtitleslangs': langs, - 'subtitlesformat': 'json3', - 'skip_download': True, - 'outtmpl': os.path.join(output_dir, f'{video_id}.%(ext)s'), - 'quiet': True, - } - - try: - with yt_dlp.YoutubeDL(ydl_opts) as ydl: - info = ydl.extract_info(video_url, download=True) - - # 查找下载的字幕文件 - subtitles = info.get('requested_subtitles') or {} - if not subtitles: - logger.info(f"YouTube视频 {video_id} 没有可用字幕") - return None - - # 按优先级查找字幕文件 - subtitle_file = None - detected_lang = None - for lang in langs: - if lang in subtitles: - subtitle_file = os.path.join(output_dir, f"{video_id}.{lang}.json3") - detected_lang = lang - break - - # 如果按优先级没找到,取第一个可用的 - if not subtitle_file: - for lang, sub_info in subtitles.items(): - subtitle_file = os.path.join(output_dir, f"{video_id}.{lang}.json3") - detected_lang = lang - break - - if not subtitle_file or not os.path.exists(subtitle_file): - logger.info(f"字幕文件不存在: {subtitle_file}") - return None - - # 解析字幕文件 - return self._parse_json3_subtitle(subtitle_file, detected_lang) - - except Exception as e: - logger.warning(f"获取YouTube字幕失败: {e}") - return None - - def _parse_json3_subtitle(self, subtitle_file: str, language: str) -> Optional[TranscriptResult]: - """ - 解析 json3 格式字幕文件 - - :param subtitle_file: 字幕文件路径 - :param language: 语言代码 - :return: TranscriptResult - """ - try: - with open(subtitle_file, 'r', encoding='utf-8') as f: - data = json.load(f) - - segments = [] - events = data.get('events', []) - - for event in events: - # json3 格式中时间单位是毫秒 - start_ms = event.get('tStartMs', 0) - duration_ms = event.get('dDurationMs', 0) - - # 提取文本 - segs = event.get('segs', []) - text = ''.join(seg.get('utf8', '') for seg in segs).strip() - - if text: # 只添加非空文本 - segments.append(TranscriptSegment( - start=start_ms / 1000.0, - end=(start_ms + duration_ms) / 1000.0, - text=text - )) - - if not segments: - return None - - full_text = ' '.join(seg.text for seg in segments) - - logger.info(f"成功解析YouTube字幕,共 {len(segments)} 段") - return TranscriptResult( - language=language, - full_text=full_text, - segments=segments, - raw={'source': 'youtube_subtitle', 'file': subtitle_file} - ) - - except Exception as e: - logger.warning(f"解析字幕文件失败: {e}") - return None + fetcher = YouTubeSubtitleFetcher() + print( + f"尝试获取字幕,video_id={video_id}, langs={langs}" + ) + return fetcher.fetch_subtitles(video_id, langs) diff --git a/backend/app/downloaders/youtube_subtitle.py b/backend/app/downloaders/youtube_subtitle.py new file mode 100644 index 0000000..d59a871 --- /dev/null +++ b/backend/app/downloaders/youtube_subtitle.py @@ -0,0 +1,98 @@ +""" +通过 youtube-transcript-api 获取 YouTube 字幕。 +优先人工字幕,其次自动生成字幕。不依赖 yt_dlp,无需下载任何文件。 +""" + +from typing import Optional, List + +from youtube_transcript_api import YouTubeTranscriptApi + +from app.models.transcriber_model import TranscriptResult, TranscriptSegment +from app.utils.logger import get_logger + +logger = get_logger(__name__) + + +class YouTubeSubtitleFetcher: + """通过 youtube-transcript-api 获取 YouTube 字幕。""" + + def __init__(self): + self._api = YouTubeTranscriptApi() + + def fetch_subtitles( + self, + video_id: str, + langs: Optional[List[str]] = None, + ) -> Optional[TranscriptResult]: + if langs is None: + langs = ["zh-Hans", "zh", "zh-CN", "zh-TW", "en", "en-US", "ja"] + + try: + # 1. 列出所有可用字幕 + transcript_list = self._api.list(video_id) + + available = [] + for t in transcript_list: + available.append( + f"{t.language_code}({'auto' if t.is_generated else 'manual'})" + ) + logger.info(f"可用字幕轨道: {', '.join(available)}") + + # 2. 按优先级查找:先人工字幕,再自动字幕 + transcript = None + try: + transcript = transcript_list.find_manually_created_transcript(langs) + logger.info(f"选中人工字幕: {transcript.language_code} ({transcript.language})") + except Exception: + try: + transcript = transcript_list.find_generated_transcript(langs) + logger.info(f"选中自动字幕: {transcript.language_code} ({transcript.language})") + except Exception: + # 都没匹配,取第一个可用的 + for t in transcript_list: + transcript = t + source = "auto" if t.is_generated else "manual" + logger.info(f"使用首个可用字幕: {t.language_code} ({source})") + break + + if not transcript: + logger.info(f"YouTube 视频 {video_id} 没有任何可用字幕") + return None + + # 3. 获取字幕内容 + fetched = transcript.fetch() + segments = [] + for snippet in fetched: + text = snippet.get("text", "").strip() if isinstance(snippet, dict) else str(snippet).strip() + if not text: + continue + start = snippet.get("start", 0) if isinstance(snippet, dict) else 0 + duration = snippet.get("duration", 0) if isinstance(snippet, dict) else 0 + segments.append(TranscriptSegment( + start=float(start), + end=float(start) + float(duration), + text=text, + )) + + if not segments: + logger.warning(f"YouTube 字幕内容为空: {video_id}") + return None + + full_text = " ".join(seg.text for seg in segments) + logger.info(f"成功获取 YouTube 字幕,共 {len(segments)} 段") + + return TranscriptResult( + language=transcript.language_code, + full_text=full_text, + segments=segments, + raw={ + "source": "youtube_transcript_api", + "language": transcript.language, + "language_code": transcript.language_code, + "is_generated": transcript.is_generated, + }, + ) + + except Exception as e: + logger.warning(f"YouTube 字幕获取失败: {e}") + return None diff --git a/backend/app/services/note.py b/backend/app/services/note.py index 81d35c0..ebbe83a 100644 --- a/backend/app/services/note.py +++ b/backend/app/services/note.py @@ -133,8 +133,46 @@ class NoteGenerator: audio_cache_file = NOTE_OUTPUT_DIR / f"{task_id}_audio.json" transcript_cache_file = NOTE_OUTPUT_DIR / f"{task_id}_transcript.json" markdown_cache_file = NOTE_OUTPUT_DIR / f"{task_id}_markdown.md" - print(audio_cache_file) - # 1. 下载音频/视频 + # 1. 获取字幕/转写:优先缓存 → 平台字幕 → 音频转写 + transcript = None + + # 尝试读取缓存 + if transcript_cache_file.exists(): + logger.info(f"检测到转写缓存 ({transcript_cache_file}),尝试读取") + try: + data = json.loads(transcript_cache_file.read_text(encoding="utf-8")) + segments = [TranscriptSegment(**seg) for seg in data.get("segments", [])] + transcript = TranscriptResult( + language=data.get("language"), + full_text=data["full_text"], + segments=segments, + ) + logger.info(f"已从缓存加载转写结果,共 {len(segments)} 段") + except Exception as e: + logger.warning(f"加载转写缓存失败: {e}") + + # 缓存没有,尝试获取平台字幕 + if transcript is None: + logger.info("尝试获取平台字幕(优先于音频下载)...") + try: + transcript = downloader.download_subtitles(video_url) + if transcript and transcript.segments: + logger.info(f"成功获取平台字幕,共 {len(transcript.segments)} 段") + transcript_cache_file.write_text( + json.dumps(asdict(transcript), ensure_ascii=False, indent=2), + encoding="utf-8", + ) + else: + transcript = None + logger.info("平台无可用字幕,将下载音频后转写") + except Exception as e: + logger.warning(f"获取平台字幕失败: {e},将下载音频后转写") + transcript = None + + # 2. 下载音频/视频 + # 有字幕时只提取元信息,不下载音视频文件(除非需要截图/视频理解) + has_transcript = transcript is not None + need_full_download = not has_transcript or screenshot or video_understanding audio_meta = self._download_media( downloader=downloader, video_url=video_url, @@ -147,18 +185,19 @@ class NoteGenerator: video_understanding=video_understanding, video_interval=video_interval, grid_size=grid_size, + skip_download=not need_full_download, ) - # 2. 获取字幕/转写文字 - # 优先尝试获取平台字幕,没有再 fallback 到音频转写 - transcript = self._get_transcript( - downloader=downloader, - video_url=video_url, - audio_file=audio_meta.file_path, - transcript_cache_file=transcript_cache_file, - status_phase=TaskStatus.TRANSCRIBING, - task_id=task_id, - ) + # 3. 如果前面没拿到字幕,走转写流程 + if transcript is None: + transcript = self._get_transcript( + downloader=downloader, + video_url=video_url, + audio_file=audio_meta.file_path, + transcript_cache_file=transcript_cache_file, + status_phase=TaskStatus.TRANSCRIBING, + task_id=task_id, + ) # 3. GPT 总结 markdown = self._summarize_text( @@ -331,6 +370,7 @@ class NoteGenerator: video_understanding: bool, video_interval: int, grid_size: List[int], + skip_download: bool = False, ) -> AudioDownloadResult | None: """ 1. 检查音频缓存;若不存在,则根据需要下载音频或视频(若需截图/可视化)。 @@ -353,7 +393,34 @@ class NoteGenerator: task_id = audio_cache_file.stem.split("_")[0] self._update_status(task_id, status_phase) + # 已有缓存,尝试加载 + if audio_cache_file.exists(): + logger.info(f"检测到音频缓存 ({audio_cache_file}),直接读取") + try: + data = json.loads(audio_cache_file.read_text(encoding="utf-8")) + return AudioDownloadResult(**data) + except Exception as e: + logger.warning(f"读取音频缓存失败,将重新下载:{e}") + # 有字幕且不需要截图/视频理解时,只提取元信息不下载文件 + if skip_download: + logger.info("已有字幕,仅提取视频元信息(不下载音视频)") + try: + audio = downloader.download( + video_url=video_url, + quality=quality, + output_dir=output_path, + need_video=False, + skip_download=True, + ) + audio_cache_file.write_text( + json.dumps(asdict(audio), ensure_ascii=False, indent=2), + encoding="utf-8", + ) + logger.info(f"元信息提取完成 ({audio_cache_file})") + return audio + except Exception as exc: + logger.warning(f"元信息提取失败,将尝试完整下载: {exc}") # 判断是否需要下载视频 need_video = screenshot or video_understanding @@ -368,9 +435,8 @@ class NoteGenerator: self.video_path = Path(video_path_str) logger.info(f"视频下载完成:{self.video_path}") - # 若指定了 grid_size,则生成缩略图 if grid_size: - self.video_img_urls=VideoReader( + self.video_img_urls = VideoReader( video_path=str(self.video_path), grid_size=tuple(grid_size), frame_interval=frame_interval, @@ -382,17 +448,9 @@ class NoteGenerator: logger.info("未指定 grid_size,跳过缩略图生成") except Exception as exc: logger.error(f"视频下载失败:{exc}") - self._handle_exception(task_id, exc) raise - # 已有缓存,尝试加载 - if audio_cache_file.exists(): - logger.info(f"检测到音频缓存 ({audio_cache_file}),直接读取") - try: - data = json.loads(audio_cache_file.read_text(encoding="utf-8")) - return AudioDownloadResult(**data) - except Exception as e: - logger.warning(f"读取音频缓存失败,将重新下载:{e}") + # 下载音频 try: logger.info("开始下载音频") @@ -402,7 +460,6 @@ class NoteGenerator: output_dir=output_path, need_video=need_video, ) - # 缓存 audio 元信息到本地 JSON audio_cache_file.write_text(json.dumps(asdict(audio), ensure_ascii=False, indent=2), encoding="utf-8") logger.info(f"音频下载并缓存成功 ({audio_cache_file})") return audio diff --git a/backend/requirements.txt b/backend/requirements.txt index b3afa64..b29b0ab 100644 --- a/backend/requirements.txt +++ b/backend/requirements.txt @@ -124,5 +124,6 @@ weasyprint==65.1 webencodings==0.5.1 websockets==15.0.1 yarl==1.19.0 +youtube-transcript-api>=1.0.0 yt-dlp==2025.3.31 zopfli==0.2.3.post1 From 60909822610619cfec0c4a243146289e0a12da0a Mon Sep 17 00:00:00 2001 From: huangjianwu Date: Mon, 23 Mar 2026 17:52:30 +0800 Subject: [PATCH 2/2] =?UTF-8?q?docs:=20=E6=9B=B4=E6=96=B0=20README=20?= =?UTF-8?q?=E8=87=B3=20v2.0.0=EF=BC=8C=E8=A1=A5=E5=85=85=E6=96=B0=E5=8A=9F?= =?UTF-8?q?=E8=83=BD=E8=AF=B4=E6=98=8E=E5=92=8C=20Docker=20=E9=83=A8?= =?UTF-8?q?=E7=BD=B2=E6=96=B9=E5=BC=8F?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit - 版本号升级为 2.0.0(README、tauri.conf.json、about 页面) - 新增 v2.0.0 功能说明:RAG 问答、Function Calling、封面 Banner、面板折叠等 - Docker 部署改为推荐方式,支持 docker pull 预构建镜像 - 补充源码部署为方式二,修正前端访问端口为 3015 - 更新功能特性列表,补充快手、AI 问答等新功能 - TODO 标记 RAG 问答为已完成 Co-Authored-By: Claude Opus 4.6 --- BillNote_frontend/src-tauri/tauri.conf.json | 2 +- .../src/pages/SettingPage/about.tsx | 2 +- README.md | 85 ++++++++++++++----- 3 files changed, 66 insertions(+), 23 deletions(-) diff --git a/BillNote_frontend/src-tauri/tauri.conf.json b/BillNote_frontend/src-tauri/tauri.conf.json index 0609150..79bf8e2 100644 --- a/BillNote_frontend/src-tauri/tauri.conf.json +++ b/BillNote_frontend/src-tauri/tauri.conf.json @@ -1,7 +1,7 @@ { "$schema": "../node_modules/@tauri-apps/cli/config.schema.json", "productName": "BiliNote", - "version": "1.8.1", + "version": "2.0.0", "identifier": "com.jefferyhuang.bilinote", "build": { "frontendDist": "../dist", diff --git a/BillNote_frontend/src/pages/SettingPage/about.tsx b/BillNote_frontend/src/pages/SettingPage/about.tsx index 5ef3c11..c4c1ce0 100644 --- a/BillNote_frontend/src/pages/SettingPage/about.tsx +++ b/BillNote_frontend/src/pages/SettingPage/about.tsx @@ -26,7 +26,7 @@ export default function AboutPage() { height={50} className="rounded-lg" /> -

BiliNote v1.8.1

+

BiliNote v2.0.0

AI 视频笔记生成工具 让 AI 为你的视频做笔记 diff --git a/README.md b/README.md index 22402a1..6759c9f 100644 --- a/README.md +++ b/README.md @@ -3,17 +3,17 @@

BiliNote Banner

-

BiliNote v1.8.1

+

BiliNote v2.0.0

AI 视频笔记生成工具 让 AI 为你的视频做笔记

- + - +

@@ -22,30 +22,48 @@ ## ✨ 项目简介 -BiliNote 是一个开源的 AI 视频笔记助手,支持通过哔哩哔哩、YouTube、抖音等视频链接,自动提取内容并生成结构清晰、重点明确的 Markdown 格式笔记。支持插入截图、原片跳转等功能。 +BiliNote 是一个开源的 AI 视频笔记助手,支持通过哔哩哔哩、YouTube、抖音等视频链接,自动提取内容并生成结构清晰、重点明确的 Markdown 格式笔记。支持插入截图、原片跳转、AI 问答等功能。 + ## 📝 使用文档 详细文档可以查看[这里](https://docs.bilinote.app/) ## 体验地址 可以通过访问 [这里](https://www.bilinote.app/) 进行体验,速度略慢,不支持长视频。 -## 📦 Windows 打包版 -本项目提供了 Windows 系统的 exe 文件,可在[release](https://github.com/JefferyHcool/BiliNote/releases/tag/v1.1.1)进行下载。**注意一定要在没有中文路径的环境下运行。** +## 📦 桌面版下载 +本项目提供了 Windows 和 macOS 桌面客户端,可在 [Releases](https://github.com/JefferyHcool/BiliNote/releases) 页面下载最新版本。 + +> Windows 用户请注意:一定要在没有中文路径的环境下运行。 ## 🔧 功能特性 -- 支持多平台:Bilibili、YouTube、本地视频、抖音(后续会加入更多平台) +- 支持多平台:Bilibili、YouTube、本地视频、抖音、快手 - 支持返回笔记格式选择 - 支持笔记风格选择 - 支持多模态视频理解 - 支持多版本记录保留 -- 支持自行配置 GPT 大模型 -- 本地模型音频转写(支持 Fast-Whisper) +- 支持自行配置 GPT 大模型(OpenAI、DeepSeek、Qwen 等) +- 本地模型音频转写(支持 Fast-Whisper、MLX-Whisper、Groq、BCut) - GPT 大模型总结视频内容 - 自动生成结构化 Markdown 笔记 - 可选插入截图(自动截取) - 可选内容跳转链接(关联原视频) - 任务记录与历史回看 +- 基于 RAG 的笔记内容 AI 问答(支持 Function Calling) +- 笔记顶部视频封面 Banner 展示 +- 工作区和生成历史面板支持折叠/展开 + +### v2.0.0 新增 + +- 基于 RAG 的笔记内容 AI 问答功能,支持半屏/全屏模式 +- AI 问答支持 Function Calling,模型可主动查询原文数据 +- RAG 索引支持视频元信息(标题、作者、简介、标签等) +- AI 回复支持 Markdown 渲染 +- 笔记顶部新增视频封面 Banner +- 工作区和生成历史面板支持折叠/展开 +- 笔记开头添加来源链接功能 +- YouTube 字幕优先获取,有字幕时跳过音频下载 +- 性能优化与转写器配置改进 ## 📸 截图预览 ![screenshot](./doc/image1.png) @@ -56,7 +74,34 @@ BiliNote 是一个开源的 AI 视频笔记助手,支持通过哔哩哔哩、Y ## 🚀 快速开始 -### 1. 克隆仓库 +### 方式一:Docker 部署(推荐) + +确保已安装 Docker,直接拉取预构建镜像运行: + +```bash +docker pull ghcr.io/jefferyhcool/bilinote:latest + +docker run -d -p 80:80 \ + -v bilinote-data:/app/backend/data \ + --name bilinote \ + ghcr.io/jefferyhcool/bilinote:latest +``` + +访问:`http://localhost` + +也可以使用 docker-compose 本地构建: + +```bash +# 标准部署 +docker-compose up -d + +# GPU 加速部署(需要 NVIDIA GPU) +docker-compose -f docker-compose.gpu.yml up -d +``` + +### 方式二:源码部署 + +#### 1. 克隆仓库 ```bash git clone https://github.com/JefferyHcool/BiliNote.git @@ -64,7 +109,7 @@ cd BiliNote mv .env.example .env ``` -### 2. 启动后端(FastAPI) +#### 2. 启动后端(FastAPI) ```bash cd backend @@ -72,7 +117,7 @@ pip install -r requirements.txt python main.py ``` -### 3. 启动前端(Vite + React) +#### 3. 启动前端(Vite + React) ```bash cd BillNote_frontend @@ -80,11 +125,12 @@ pnpm install pnpm dev ``` -访问:`http://localhost:5173` +访问:`http://localhost:3015` ## ⚙️ 依赖说明 + ### 🎬 FFmpeg -本项目依赖 ffmpeg 用于音频处理与转码,必须安装: +本项目依赖 ffmpeg 用于音频处理与转码,源码部署时必须安装: ```bash # Mac (brew) brew install ffmpeg @@ -96,26 +142,23 @@ sudo apt install ffmpeg # 请从官网下载安装:https://ffmpeg.org/download.html ``` > ⚠️ 若系统无法识别 ffmpeg,请将其加入系统环境变量 PATH +> +> Docker 部署已内置 FFmpeg,无需额外安装。 ### 🚀 CUDA 加速(可选) 若你希望更快地执行音频转写任务,可使用具备 NVIDIA GPU 的机器,并启用 fast-whisper + CUDA 加速版本: 具体 `fast-whisper` 配置方法,请参考:[fast-whisper 项目地址](http://github.com/SYSTRAN/faster-whisper#requirements) -### 🐳 使用 Docker 一键部署 - -确保你已安装 Docker 和 Docker Compose: - -[docker 部署](https://github.com/JefferyHcool/bilinote-deploy/blob/master/README.md) - ## 🧠 TODO - [x] 支持抖音及快手等视频平台 - [x] 支持前端设置切换 AI 模型切换、语音转文字模型 - [x] AI 摘要风格自定义(学术风、口语风、重点提取等) -- [ ] 笔记导出为 PDF / Word / Notion - [x] 加入更多模型支持 - [x] 加入更多音频转文本模型支持 +- [x] 基于 RAG 的笔记内容 AI 问答 +- [ ] 笔记导出为 PDF / Word / Notion ### Contact and Join-联系和加入社区 年会恢复更新以后放出最新社区地址