diff --git a/relay/channel/ali/adaptor.go b/relay/channel/ali/adaptor.go index f3cc4b6c..faf70981 100644 --- a/relay/channel/ali/adaptor.go +++ b/relay/channel/ali/adaptor.go @@ -223,11 +223,8 @@ func (a *Adaptor) DoResponse(c *gin.Context, resp *http.Response, info *relaycom switch info.RelayFormat { case types.RelayFormatClaude: if supportsAliAnthropicMessages(info.UpstreamModelName) { - if info.IsStream { - return claude.ClaudeStreamHandler(c, resp, info) - } - - return claude.ClaudeHandler(c, resp, info) + adaptor := claude.Adaptor{} + return adaptor.DoResponse(c, resp, info) } adaptor := openai.Adaptor{} diff --git a/relay/channel/claude/adaptor.go b/relay/channel/claude/adaptor.go index 29595391..a713c17d 100644 --- a/relay/channel/claude/adaptor.go +++ b/relay/channel/claude/adaptor.go @@ -95,6 +95,7 @@ func (a *Adaptor) DoRequest(c *gin.Context, info *relaycommon.RelayInfo, request } func (a *Adaptor) DoResponse(c *gin.Context, resp *http.Response, info *relaycommon.RelayInfo) (usage any, err *types.NewAPIError) { + info.FinalRequestRelayFormat = types.RelayFormatClaude if info.IsStream { return ClaudeStreamHandler(c, resp, info) } else { diff --git a/relay/channel/codex/adaptor.go b/relay/channel/codex/adaptor.go index d8a4e866..42f3b8e4 100644 --- a/relay/channel/codex/adaptor.go +++ b/relay/channel/codex/adaptor.go @@ -26,7 +26,7 @@ func (a *Adaptor) ConvertGeminiRequest(c *gin.Context, info *relaycommon.RelayIn } func (a *Adaptor) ConvertClaudeRequest(*gin.Context, *relaycommon.RelayInfo, *dto.ClaudeRequest) (any, error) { - return nil, errors.New("codex channel: endpoint not supported") + return nil, errors.New("codex channel: /v1/messages endpoint not supported") } func (a *Adaptor) ConvertAudioRequest(c *gin.Context, info *relaycommon.RelayInfo, request dto.AudioRequest) (io.Reader, error) { @@ -41,15 +41,15 @@ func (a *Adaptor) Init(info *relaycommon.RelayInfo) { } func (a *Adaptor) ConvertOpenAIRequest(c *gin.Context, info *relaycommon.RelayInfo, request *dto.GeneralOpenAIRequest) (any, error) { - return nil, errors.New("codex channel: endpoint not supported") + return nil, errors.New("codex channel: /v1/chat/completions endpoint not supported") } func (a *Adaptor) ConvertRerankRequest(c *gin.Context, relayMode int, request dto.RerankRequest) (any, error) { - return nil, errors.New("codex channel: endpoint not supported") + return nil, errors.New("codex channel: /v1/rerank endpoint not supported") } func (a *Adaptor) ConvertEmbeddingRequest(c *gin.Context, info *relaycommon.RelayInfo, request dto.EmbeddingRequest) (any, error) { - return nil, errors.New("codex channel: endpoint not supported") + return nil, errors.New("codex channel: /v1/embeddings endpoint not supported") } func (a *Adaptor) ConvertOpenAIResponsesRequest(c *gin.Context, info *relaycommon.RelayInfo, request dto.OpenAIResponsesRequest) (any, error) { diff --git a/relay/channel/deepseek/adaptor.go b/relay/channel/deepseek/adaptor.go index 6de2653b..57fcf3d0 100644 --- a/relay/channel/deepseek/adaptor.go +++ b/relay/channel/deepseek/adaptor.go @@ -95,11 +95,8 @@ func (a *Adaptor) DoRequest(c *gin.Context, info *relaycommon.RelayInfo, request func (a *Adaptor) DoResponse(c *gin.Context, resp *http.Response, info *relaycommon.RelayInfo) (usage any, err *types.NewAPIError) { switch info.RelayFormat { case types.RelayFormatClaude: - if info.IsStream { - return claude.ClaudeStreamHandler(c, resp, info) - } else { - return claude.ClaudeHandler(c, resp, info) - } + adaptor := claude.Adaptor{} + return adaptor.DoResponse(c, resp, info) default: adaptor := openai.Adaptor{} return adaptor.DoResponse(c, resp, info) diff --git a/relay/channel/moonshot/adaptor.go b/relay/channel/moonshot/adaptor.go index 25a6e2a3..c2f6ee4a 100644 --- a/relay/channel/moonshot/adaptor.go +++ b/relay/channel/moonshot/adaptor.go @@ -102,11 +102,8 @@ func (a *Adaptor) ConvertEmbeddingRequest(c *gin.Context, info *relaycommon.Rela func (a *Adaptor) DoResponse(c *gin.Context, resp *http.Response, info *relaycommon.RelayInfo) (usage any, err *types.NewAPIError) { switch info.RelayFormat { case types.RelayFormatClaude: - if info.IsStream { - return claude.ClaudeStreamHandler(c, resp, info) - } else { - return claude.ClaudeHandler(c, resp, info) - } + adaptor := claude.Adaptor{} + return adaptor.DoResponse(c, resp, info) default: adaptor := openai.Adaptor{} return adaptor.DoResponse(c, resp, info) diff --git a/relay/channel/vertex/adaptor.go b/relay/channel/vertex/adaptor.go index 7c48907e..c8d27276 100644 --- a/relay/channel/vertex/adaptor.go +++ b/relay/channel/vertex/adaptor.go @@ -365,10 +365,11 @@ func (a *Adaptor) DoRequest(c *gin.Context, info *relaycommon.RelayInfo, request } func (a *Adaptor) DoResponse(c *gin.Context, resp *http.Response, info *relaycommon.RelayInfo) (usage any, err *types.NewAPIError) { + claudeAdaptor := claude.Adaptor{} if info.IsStream { switch a.RequestMode { case RequestModeClaude: - return claude.ClaudeStreamHandler(c, resp, info) + return claudeAdaptor.DoResponse(c, resp, info) case RequestModeGemini: if info.RelayMode == constant.RelayModeGemini { return gemini.GeminiTextGenerationStreamHandler(c, info, resp) @@ -381,7 +382,7 @@ func (a *Adaptor) DoResponse(c *gin.Context, resp *http.Response, info *relaycom } else { switch a.RequestMode { case RequestModeClaude: - return claude.ClaudeHandler(c, resp, info) + return claudeAdaptor.DoResponse(c, resp, info) case RequestModeGemini: if info.RelayMode == constant.RelayModeGemini { return gemini.GeminiTextGenerationHandler(c, info, resp) diff --git a/relay/channel/volcengine/adaptor.go b/relay/channel/volcengine/adaptor.go index 22caa6b9..9f2b8e80 100644 --- a/relay/channel/volcengine/adaptor.go +++ b/relay/channel/volcengine/adaptor.go @@ -347,10 +347,8 @@ func (a *Adaptor) DoRequest(c *gin.Context, info *relaycommon.RelayInfo, request func (a *Adaptor) DoResponse(c *gin.Context, resp *http.Response, info *relaycommon.RelayInfo) (usage any, err *types.NewAPIError) { if info.RelayFormat == types.RelayFormatClaude { if _, ok := channelconstant.ChannelSpecialBases[info.ChannelBaseUrl]; ok { - if info.IsStream { - return claude.ClaudeStreamHandler(c, resp, info) - } - return claude.ClaudeHandler(c, resp, info) + adaptor := claude.Adaptor{} + return adaptor.DoResponse(c, resp, info) } } diff --git a/relay/channel/zhipu_4v/adaptor.go b/relay/channel/zhipu_4v/adaptor.go index 7e25c7ca..597c4859 100644 --- a/relay/channel/zhipu_4v/adaptor.go +++ b/relay/channel/zhipu_4v/adaptor.go @@ -109,11 +109,8 @@ func (a *Adaptor) DoRequest(c *gin.Context, info *relaycommon.RelayInfo, request func (a *Adaptor) DoResponse(c *gin.Context, resp *http.Response, info *relaycommon.RelayInfo) (usage any, err *types.NewAPIError) { switch info.RelayFormat { case types.RelayFormatClaude: - if info.IsStream { - return claude.ClaudeStreamHandler(c, resp, info) - } else { - return claude.ClaudeHandler(c, resp, info) - } + adaptor := claude.Adaptor{} + return adaptor.DoResponse(c, resp, info) default: if info.RelayMode == relayconstant.RelayModeImagesGenerations { return zhipu4vImageHandler(c, resp, info) diff --git a/relay/common/relay_info.go b/relay/common/relay_info.go index 5b25ebf0..a30e4867 100644 --- a/relay/common/relay_info.go +++ b/relay/common/relay_info.go @@ -148,6 +148,8 @@ type RelayInfo struct { // RequestConversionChain records request format conversions in order, e.g. // ["openai", "openai_responses"] or ["openai", "claude"]. RequestConversionChain []types.RelayFormat + // 最终请求到上游的格式 TODO: 当前仅设置了Claude + FinalRequestRelayFormat types.RelayFormat ThinkingContentInfo TokenCountMeta diff --git a/relay/compatible_handler.go b/relay/compatible_handler.go index 21180d8d..eeb7b7aa 100644 --- a/relay/compatible_handler.go +++ b/relay/compatible_handler.go @@ -334,7 +334,7 @@ func postConsumeQuota(ctx *gin.Context, relayInfo *relaycommon.RelayInfo, usage var audioInputQuota decimal.Decimal var audioInputPrice float64 - isClaudeUsageSemantic := relayInfo.ChannelType == constant.ChannelTypeAnthropic + isClaudeUsageSemantic := relayInfo.FinalRequestRelayFormat == types.RelayFormatClaude if !relayInfo.PriceData.UsePrice { baseTokens := dPromptTokens // 减去 cached tokens