2025-12-10 20:52:44 +08:00
|
|
|
|
"""
|
|
|
|
|
|
Claude Chat Handler - 基于通用 Chat Handler 基类的简化实现
|
|
|
|
|
|
|
|
|
|
|
|
继承 ChatHandlerBase,只需覆盖格式特定的方法。
|
|
|
|
|
|
代码量从原来的 ~1470 行减少到 ~120 行。
|
|
|
|
|
|
"""
|
|
|
|
|
|
|
|
|
|
|
|
from typing import Any, Dict, Optional
|
|
|
|
|
|
|
|
|
|
|
|
from src.api.handlers.base.chat_handler_base import ChatHandlerBase
|
2025-12-16 00:02:49 +08:00
|
|
|
|
from src.api.handlers.base.utils import extract_cache_creation_tokens
|
2025-12-10 20:52:44 +08:00
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class ClaudeChatHandler(ChatHandlerBase):
|
|
|
|
|
|
"""
|
|
|
|
|
|
Claude Chat Handler - 处理 Claude Chat/CLI API 格式的请求
|
|
|
|
|
|
|
|
|
|
|
|
格式特点:
|
|
|
|
|
|
- 使用 input_tokens/output_tokens
|
|
|
|
|
|
- 支持 cache_creation_input_tokens/cache_read_input_tokens
|
|
|
|
|
|
- 请求格式:ClaudeMessagesRequest
|
|
|
|
|
|
"""
|
|
|
|
|
|
|
|
|
|
|
|
FORMAT_ID = "CLAUDE"
|
|
|
|
|
|
|
|
|
|
|
|
def extract_model_from_request(
|
|
|
|
|
|
self,
|
|
|
|
|
|
request_body: Dict[str, Any],
|
|
|
|
|
|
path_params: Optional[Dict[str, Any]] = None, # noqa: ARG002
|
|
|
|
|
|
) -> str:
|
|
|
|
|
|
"""
|
|
|
|
|
|
从请求中提取模型名 - Claude 格式实现
|
|
|
|
|
|
|
|
|
|
|
|
Claude API 的 model 在请求体顶级字段。
|
|
|
|
|
|
|
|
|
|
|
|
Args:
|
|
|
|
|
|
request_body: 请求体
|
|
|
|
|
|
path_params: URL 路径参数(Claude 不使用)
|
|
|
|
|
|
|
|
|
|
|
|
Returns:
|
|
|
|
|
|
模型名
|
|
|
|
|
|
"""
|
|
|
|
|
|
model = request_body.get("model")
|
|
|
|
|
|
return str(model) if model else "unknown"
|
|
|
|
|
|
|
|
|
|
|
|
def apply_mapped_model(
|
|
|
|
|
|
self,
|
|
|
|
|
|
request_body: Dict[str, Any],
|
|
|
|
|
|
mapped_model: str,
|
|
|
|
|
|
) -> Dict[str, Any]:
|
|
|
|
|
|
"""
|
|
|
|
|
|
将映射后的模型名应用到请求体
|
|
|
|
|
|
|
|
|
|
|
|
Claude API 的 model 在请求体顶级字段。
|
|
|
|
|
|
|
|
|
|
|
|
Args:
|
|
|
|
|
|
request_body: 原始请求体
|
|
|
|
|
|
mapped_model: 映射后的模型名
|
|
|
|
|
|
|
|
|
|
|
|
Returns:
|
|
|
|
|
|
更新了 model 字段的请求体
|
|
|
|
|
|
"""
|
|
|
|
|
|
result = dict(request_body)
|
|
|
|
|
|
result["model"] = mapped_model
|
|
|
|
|
|
return result
|
|
|
|
|
|
|
2025-12-16 00:02:49 +08:00
|
|
|
|
async def _convert_request(self, request: Any) -> Any:
|
2025-12-10 20:52:44 +08:00
|
|
|
|
"""
|
|
|
|
|
|
将请求转换为 Claude 格式
|
|
|
|
|
|
|
|
|
|
|
|
Args:
|
|
|
|
|
|
request: 原始请求对象
|
|
|
|
|
|
|
|
|
|
|
|
Returns:
|
|
|
|
|
|
ClaudeMessagesRequest 对象
|
|
|
|
|
|
"""
|
|
|
|
|
|
from src.api.handlers.claude.converter import OpenAIToClaudeConverter
|
|
|
|
|
|
from src.models.claude import ClaudeMessagesRequest
|
|
|
|
|
|
from src.models.openai import OpenAIRequest
|
|
|
|
|
|
|
|
|
|
|
|
# 如果已经是 Claude 格式,直接返回
|
|
|
|
|
|
if isinstance(request, ClaudeMessagesRequest):
|
|
|
|
|
|
return request
|
|
|
|
|
|
|
|
|
|
|
|
# 如果是 OpenAI 格式,转换为 Claude 格式
|
|
|
|
|
|
if isinstance(request, OpenAIRequest):
|
|
|
|
|
|
converter = OpenAIToClaudeConverter()
|
|
|
|
|
|
claude_dict = converter.convert_request(request.dict())
|
|
|
|
|
|
return ClaudeMessagesRequest(**claude_dict)
|
|
|
|
|
|
|
|
|
|
|
|
# 如果是字典,根据内容判断格式
|
|
|
|
|
|
if isinstance(request, dict):
|
|
|
|
|
|
if "messages" in request and len(request["messages"]) > 0:
|
|
|
|
|
|
first_msg = request["messages"][0]
|
|
|
|
|
|
if "role" in first_msg and "content" in first_msg:
|
|
|
|
|
|
# 可能是 OpenAI 格式
|
|
|
|
|
|
converter = OpenAIToClaudeConverter()
|
|
|
|
|
|
claude_dict = converter.convert_request(request)
|
|
|
|
|
|
return ClaudeMessagesRequest(**claude_dict)
|
|
|
|
|
|
|
|
|
|
|
|
# 否则假设已经是 Claude 格式
|
|
|
|
|
|
return ClaudeMessagesRequest(**request)
|
|
|
|
|
|
|
|
|
|
|
|
return request
|
|
|
|
|
|
|
|
|
|
|
|
def _extract_usage(self, response: Dict) -> Dict[str, int]:
|
|
|
|
|
|
"""
|
|
|
|
|
|
从 Claude 响应中提取 token 使用情况
|
|
|
|
|
|
|
|
|
|
|
|
Claude 格式使用:
|
|
|
|
|
|
- input_tokens / output_tokens
|
|
|
|
|
|
- cache_creation_input_tokens / cache_read_input_tokens
|
2025-12-16 00:02:49 +08:00
|
|
|
|
- 新格式:claude_cache_creation_5_m_tokens / claude_cache_creation_1_h_tokens
|
2025-12-10 20:52:44 +08:00
|
|
|
|
"""
|
|
|
|
|
|
usage = response.get("usage", {})
|
|
|
|
|
|
|
|
|
|
|
|
return {
|
2025-12-16 00:02:49 +08:00
|
|
|
|
"input_tokens": usage.get("input_tokens", 0),
|
|
|
|
|
|
"output_tokens": usage.get("output_tokens", 0),
|
|
|
|
|
|
"cache_creation_input_tokens": extract_cache_creation_tokens(usage),
|
|
|
|
|
|
"cache_read_input_tokens": usage.get("cache_read_input_tokens", 0),
|
2025-12-10 20:52:44 +08:00
|
|
|
|
}
|
|
|
|
|
|
|
2025-12-16 00:02:49 +08:00
|
|
|
|
def _normalize_response(self, response: Dict[str, Any]) -> Dict[str, Any]:
|
2025-12-10 20:52:44 +08:00
|
|
|
|
"""
|
|
|
|
|
|
规范化 Claude 响应
|
|
|
|
|
|
|
|
|
|
|
|
Args:
|
|
|
|
|
|
response: 原始响应
|
|
|
|
|
|
|
|
|
|
|
|
Returns:
|
|
|
|
|
|
规范化后的响应
|
|
|
|
|
|
"""
|
2025-12-19 01:20:30 +08:00
|
|
|
|
# 作为中转站,直接透传响应,不做标准化处理
|
2025-12-10 20:52:44 +08:00
|
|
|
|
return response
|