mirror of
https://github.com/snailyp/gemini-balance.git
synced 2026-06-07 00:29:36 +08:00
- 统一 add_error_log 的 request_time:优先使用 request_datetime, 否则使用 datetime.now(),去除 timezone.utc,避免与请求日志时区不一致 - 在 Gemini/OpenAI/Vertex/Embedding 等服务的异常处理处补充传入 request_datetime,使错误日志与请求日志可一一对应 - stats: 移除失败记录的错误日志时间窗匹配与 error_log_id 附带,降低查询开销 与误关联风险;建议通过统一时间戳(key + request_time)或独立错误日志 查询接口完成关联 - 调整部分导入顺序与长行换行等代码风格,无功能改动 BREAKING CHANGE: 统计详情接口不再返回 error_log_id 字段。需要关联错误日志的 客户端请改为基于 key 与 request_time 在错误日志接口中检索。
88 lines
3.0 KiB
Python
88 lines
3.0 KiB
Python
import datetime
|
|
import re
|
|
import time
|
|
from typing import List, Union
|
|
|
|
import openai
|
|
from openai import APIStatusError
|
|
from openai.types import CreateEmbeddingResponse
|
|
|
|
from app.config.config import settings
|
|
from app.database.services import add_error_log, add_request_log
|
|
from app.log.logger import get_embeddings_logger
|
|
|
|
logger = get_embeddings_logger()
|
|
|
|
|
|
class EmbeddingService:
|
|
|
|
async def create_embedding(
|
|
self, input_text: Union[str, List[str]], model: str, api_key: str
|
|
) -> CreateEmbeddingResponse:
|
|
"""Create embeddings using OpenAI API with database logging"""
|
|
start_time = time.perf_counter()
|
|
request_datetime = datetime.datetime.now()
|
|
is_success = False
|
|
status_code = None
|
|
response = None
|
|
error_log_msg = ""
|
|
if isinstance(input_text, list):
|
|
request_msg_log = {
|
|
"input_truncated": [
|
|
str(item)[:100] + "..." if len(str(item)) > 100 else str(item)
|
|
for item in input_text[:5]
|
|
]
|
|
}
|
|
if len(input_text) > 5:
|
|
request_msg_log["input_truncated"].append("...")
|
|
else:
|
|
request_msg_log = {
|
|
"input_truncated": (
|
|
input_text[:1000] + "..." if len(input_text) > 1000 else input_text
|
|
)
|
|
}
|
|
|
|
try:
|
|
client = openai.OpenAI(api_key=api_key, base_url=settings.BASE_URL)
|
|
response = client.embeddings.create(input=input_text, model=model)
|
|
is_success = True
|
|
status_code = 200
|
|
return response
|
|
except APIStatusError as e:
|
|
is_success = False
|
|
status_code = e.status_code
|
|
error_log_msg = f"OpenAI API error: {e}"
|
|
logger.error(f"Error creating embedding (APIStatusError): {error_log_msg}")
|
|
raise e
|
|
except Exception as e:
|
|
is_success = False
|
|
error_log_msg = f"Generic error: {e}"
|
|
logger.error(f"Error creating embedding (Exception): {error_log_msg}")
|
|
match = re.search(r"status code (\d+)", str(e))
|
|
if match:
|
|
status_code = int(match.group(1))
|
|
else:
|
|
status_code = 500
|
|
raise e
|
|
finally:
|
|
end_time = time.perf_counter()
|
|
latency_ms = int((end_time - start_time) * 1000)
|
|
if not is_success:
|
|
await add_error_log(
|
|
gemini_key=api_key,
|
|
model_name=model,
|
|
error_type="openai-embedding",
|
|
error_log=error_log_msg,
|
|
error_code=status_code,
|
|
request_msg=request_msg_log,
|
|
request_datetime=request_datetime,
|
|
)
|
|
await add_request_log(
|
|
model_name=model,
|
|
api_key=api_key,
|
|
is_success=is_success,
|
|
status_code=status_code,
|
|
latency_ms=latency_ms,
|
|
request_time=request_datetime,
|
|
)
|