From 6c036d7b59e6c6b3b187828c7d7b5d696964f51c Mon Sep 17 00:00:00 2001 From: IanShaw027 <131567472+IanShaw027@users.noreply.github.com> Date: Sun, 4 Jan 2026 20:49:34 +0800 Subject: [PATCH 01/13] =?UTF-8?q?fix(frontend):=20=E4=BC=98=E5=8C=96?= =?UTF-8?q?=E5=89=8D=E7=AB=AF=E7=BB=84=E4=BB=B6=E5=92=8C=E5=9B=BD=E9=99=85?= =?UTF-8?q?=E5=8C=96=E6=94=AF=E6=8C=81?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit - 添加 Accept-Language 请求头支持后端翻译 - 优化账户状态指示器和测试模态框 - 简化用户属性表单和配置模态框 - 新增多个国际化翻译条目 - 重构管理视图代码,提升可维护性 --- frontend/src/api/client.ts | 7 ++ .../account/AccountStatusIndicator.vue | 13 +-- .../components/account/AccountTestModal.vue | 16 ++-- .../src/components/user/UserAttributeForm.vue | 13 +-- .../user/UserAttributesConfigModal.vue | 10 +-- frontend/src/i18n/locales/en.ts | 48 +++++++++++ frontend/src/i18n/locales/zh.ts | 35 +++++++- frontend/src/views/admin/DashboardView.vue | 2 +- frontend/src/views/admin/GroupsView.vue | 12 +-- frontend/src/views/admin/ProxiesView.vue | 18 ++-- frontend/src/views/admin/RedeemView.vue | 6 +- .../src/views/admin/SubscriptionsView.vue | 2 +- frontend/src/views/admin/UsersView.vue | 86 ++++++------------- frontend/src/views/setup/SetupWizardView.vue | 63 ++++++++------ 14 files changed, 189 insertions(+), 142 deletions(-) diff --git a/frontend/src/api/client.ts b/frontend/src/api/client.ts index 3aac41a6..0aafd893 100644 --- a/frontend/src/api/client.ts +++ b/frontend/src/api/client.ts @@ -5,6 +5,7 @@ import axios, { AxiosInstance, AxiosError, InternalAxiosRequestConfig } from 'axios' import type { ApiResponse } from '@/types' +import { getLocale } from '@/i18n' // ==================== Axios Instance Configuration ==================== @@ -27,6 +28,12 @@ apiClient.interceptors.request.use( if (token && config.headers) { config.headers.Authorization = `Bearer ${token}` } + + // Attach locale for backend translations + if (config.headers) { + config.headers['Accept-Language'] = getLocale() + } + return config }, (error) => { diff --git a/frontend/src/components/account/AccountStatusIndicator.vue b/frontend/src/components/account/AccountStatusIndicator.vue index 914678a5..2783dbd9 100644 --- a/frontend/src/components/account/AccountStatusIndicator.vue +++ b/frontend/src/components/account/AccountStatusIndicator.vue @@ -52,7 +52,7 @@
- Rate limited until {{ formatTime(account.rate_limit_reset_at) }} + {{ t('admin.accounts.statuses.rateLimitedUntil', { time: formatTime(account.rate_limit_reset_at) }) }}
@@ -77,7 +77,7 @@
- Overloaded until {{ formatTime(account.overload_until) }} + {{ t('admin.accounts.statuses.overloadedUntil', { time: formatTime(account.overload_until) }) }}
@@ -96,9 +96,12 @@ From d36392b74f7579e23e499997d0c6b9d97aba0f1d Mon Sep 17 00:00:00 2001 From: IanShaw027 <131567472+IanShaw027@users.noreply.github.com> Date: Sun, 4 Jan 2026 21:09:14 +0800 Subject: [PATCH 02/13] fix(frontend): comprehensive i18n cleanup and Select component hardening --- backend/internal/handler/gateway_handler.go | 80 ++++-- backend/internal/service/gateway_service.go | 84 +++++- .../src/components/common/GroupSelector.vue | 6 +- frontend/src/components/common/Select.vue | 241 ++++++++++++------ frontend/src/composables/useClipboard.ts | 9 +- frontend/src/i18n/locales/en.ts | 16 +- frontend/src/i18n/locales/zh.ts | 7 +- frontend/src/utils/format.ts | 88 ++++--- frontend/src/views/admin/DashboardView.vue | 12 - frontend/src/views/admin/UsersView.vue | 2 +- frontend/src/views/user/DashboardView.vue | 12 - frontend/src/views/user/KeysView.vue | 5 +- 12 files changed, 374 insertions(+), 188 deletions(-) diff --git a/backend/internal/handler/gateway_handler.go b/backend/internal/handler/gateway_handler.go index 118c42fa..5674386b 100644 --- a/backend/internal/handler/gateway_handler.go +++ b/backend/internal/handler/gateway_handler.go @@ -128,7 +128,7 @@ func (h *GatewayHandler) Messages(c *gin.Context) { // 2. 【新增】Wait后二次检查余额/订阅 if err := h.billingCacheService.CheckBillingEligibility(c.Request.Context(), apiKey.User, apiKey, apiKey.Group, subscription); err != nil { log.Printf("Billing eligibility check failed after wait: %v", err) - h.handleStreamingAwareError(c, http.StatusForbidden, "billing_error", err.Error(), streamStarted) + h.handleStreamingAwareError(c, http.StatusForbidden, "permission_error", "Insufficient balance or active subscription required", streamStarted) return } @@ -156,8 +156,9 @@ func (h *GatewayHandler) Messages(c *gin.Context) { for { selection, err := h.gatewayService.SelectAccountWithLoadAwareness(c.Request.Context(), apiKey.GroupID, sessionKey, reqModel, failedAccountIDs) if err != nil { + log.Printf("Select account failed: %v", err) if len(failedAccountIDs) == 0 { - h.handleStreamingAwareError(c, http.StatusServiceUnavailable, "api_error", "No available accounts: "+err.Error(), streamStarted) + h.handleStreamingAwareError(c, http.StatusServiceUnavailable, "api_error", "No available accounts for requested model", streamStarted) return } h.handleFailoverExhausted(c, lastFailoverStatus, streamStarted) @@ -280,8 +281,9 @@ func (h *GatewayHandler) Messages(c *gin.Context) { // 选择支持该模型的账号 selection, err := h.gatewayService.SelectAccountWithLoadAwareness(c.Request.Context(), apiKey.GroupID, sessionKey, reqModel, failedAccountIDs) if err != nil { + log.Printf("Select account failed: %v", err) if len(failedAccountIDs) == 0 { - h.handleStreamingAwareError(c, http.StatusServiceUnavailable, "api_error", "No available accounts: "+err.Error(), streamStarted) + h.handleStreamingAwareError(c, http.StatusServiceUnavailable, "api_error", "No available accounts for requested model", streamStarted) return } h.handleFailoverExhausted(c, lastFailoverStatus, streamStarted) @@ -566,32 +568,68 @@ func (h *GatewayHandler) handleFailoverExhausted(c *gin.Context, statusCode int, func (h *GatewayHandler) mapUpstreamError(statusCode int) (int, string, string) { switch statusCode { case 401: - return http.StatusBadGateway, "upstream_error", "Upstream authentication failed, please contact administrator" + return http.StatusBadGateway, "api_error", "Upstream authentication failed, please contact administrator" case 403: - return http.StatusBadGateway, "upstream_error", "Upstream access forbidden, please contact administrator" + return http.StatusBadGateway, "api_error", "Upstream access forbidden, please contact administrator" case 429: return http.StatusTooManyRequests, "rate_limit_error", "Upstream rate limit exceeded, please retry later" case 529: return http.StatusServiceUnavailable, "overloaded_error", "Upstream service overloaded, please retry later" case 500, 502, 503, 504: - return http.StatusBadGateway, "upstream_error", "Upstream service temporarily unavailable" + return http.StatusBadGateway, "api_error", "Upstream service temporarily unavailable" default: - return http.StatusBadGateway, "upstream_error", "Upstream request failed" + return http.StatusBadGateway, "api_error", "Upstream request failed" } } +func normalizeAnthropicErrorType(errType string) string { + switch errType { + case "invalid_request_error", + "authentication_error", + "permission_error", + "not_found_error", + "rate_limit_error", + "api_error", + "overloaded_error": + return errType + case "billing_error": + // Not an Anthropic-standard error type; map to the closest equivalent. + return "permission_error" + case "upstream_error": + // Not an Anthropic-standard error type; keep clients compatible. + return "api_error" + default: + return "api_error" + } +} + +const maxPublicErrorMessageLen = 512 + +func sanitizePublicErrorMessage(message string) string { + cleaned := strings.TrimSpace(message) + cleaned = strings.ReplaceAll(cleaned, "\r", " ") + cleaned = strings.ReplaceAll(cleaned, "\n", " ") + if len(cleaned) > maxPublicErrorMessageLen { + cleaned = cleaned[:maxPublicErrorMessageLen] + "..." + } + return cleaned +} + // handleStreamingAwareError handles errors that may occur after streaming has started func (h *GatewayHandler) handleStreamingAwareError(c *gin.Context, status int, errType, message string, streamStarted bool) { + normalizedType := normalizeAnthropicErrorType(errType) + publicMessage := sanitizePublicErrorMessage(message) + if streamStarted { // Stream already started, send error as SSE event then close flusher, ok := c.Writer.(http.Flusher) if ok { - // Send error event in SSE format with proper JSON marshaling + // Anthropic streaming spec: send `event: error` with JSON `data`. errorData := map[string]any{ "type": "error", "error": map[string]string{ - "type": errType, - "message": message, + "type": normalizedType, + "message": publicMessage, }, } jsonBytes, err := json.Marshal(errorData) @@ -599,8 +637,11 @@ func (h *GatewayHandler) handleStreamingAwareError(c *gin.Context, status int, e _ = c.Error(err) return } - errorEvent := fmt.Sprintf("data: %s\n\n", string(jsonBytes)) - if _, err := fmt.Fprint(c.Writer, errorEvent); err != nil { + if _, err := fmt.Fprintf(c.Writer, "event: error\n"); err != nil { + _ = c.Error(err) + return + } + if _, err := fmt.Fprintf(c.Writer, "data: %s\n\n", string(jsonBytes)); err != nil { _ = c.Error(err) } flusher.Flush() @@ -609,16 +650,19 @@ func (h *GatewayHandler) handleStreamingAwareError(c *gin.Context, status int, e } // Normal case: return JSON response with proper status code - h.errorResponse(c, status, errType, message) + h.errorResponse(c, status, normalizedType, publicMessage) } // errorResponse 返回Claude API格式的错误响应 func (h *GatewayHandler) errorResponse(c *gin.Context, status int, errType, message string) { + normalizedType := normalizeAnthropicErrorType(errType) + publicMessage := sanitizePublicErrorMessage(message) + c.JSON(status, gin.H{ "type": "error", "error": gin.H{ - "type": errType, - "message": message, + "type": normalizedType, + "message": publicMessage, }, }) } @@ -674,7 +718,8 @@ func (h *GatewayHandler) CountTokens(c *gin.Context) { // 校验 billing eligibility(订阅/余额) // 【注意】不计算并发,但需要校验订阅/余额 if err := h.billingCacheService.CheckBillingEligibility(c.Request.Context(), apiKey.User, apiKey, apiKey.Group, subscription); err != nil { - h.errorResponse(c, http.StatusForbidden, "billing_error", err.Error()) + log.Printf("Billing eligibility check failed: %v", err) + h.errorResponse(c, http.StatusForbidden, "permission_error", "Insufficient balance or active subscription required") return } @@ -684,7 +729,8 @@ func (h *GatewayHandler) CountTokens(c *gin.Context) { // 选择支持该模型的账号 account, err := h.gatewayService.SelectAccountForModel(c.Request.Context(), apiKey.GroupID, sessionHash, parsedReq.Model) if err != nil { - h.errorResponse(c, http.StatusServiceUnavailable, "api_error", "No available accounts: "+err.Error()) + log.Printf("Select account failed: %v", err) + h.errorResponse(c, http.StatusServiceUnavailable, "api_error", "No available accounts for requested model") return } diff --git a/backend/internal/service/gateway_service.go b/backend/internal/service/gateway_service.go index 97e4c2e8..cbd4abd7 100644 --- a/backend/internal/service/gateway_service.go +++ b/backend/internal/service/gateway_service.go @@ -929,8 +929,16 @@ func (s *GatewayService) getOAuthToken(ctx context.Context, account *Account) (s // 重试相关常量 const ( - maxRetries = 10 // 最大重试次数 - retryDelay = 3 * time.Second // 重试等待时间 + // 最大尝试次数(包含首次请求)。过多重试会导致请求堆积与资源耗尽。 + maxRetryAttempts = 5 + + // 指数退避:第 N 次失败后的等待 = retryBaseDelay * 2^(N-1),并且上限为 retryMaxDelay。 + retryBaseDelay = 300 * time.Millisecond + retryMaxDelay = 3 * time.Second + + // 最大重试耗时(包含请求本身耗时 + 退避等待时间)。 + // 用于防止极端情况下 goroutine 长时间堆积导致资源耗尽。 + maxRetryElapsed = 10 * time.Second ) func (s *GatewayService) shouldRetryUpstreamError(account *Account, statusCode int) bool { @@ -953,6 +961,40 @@ func (s *GatewayService) shouldFailoverUpstreamError(statusCode int) bool { } } +func retryBackoffDelay(attempt int) time.Duration { + // attempt 从 1 开始,表示第 attempt 次请求刚失败,需要等待后进行第 attempt+1 次请求。 + if attempt <= 0 { + return retryBaseDelay + } + delay := retryBaseDelay * time.Duration(1<<(attempt-1)) + if delay > retryMaxDelay { + return retryMaxDelay + } + return delay +} + +func sleepWithContext(ctx context.Context, d time.Duration) error { + if d <= 0 { + return nil + } + timer := time.NewTimer(d) + defer func() { + if !timer.Stop() { + select { + case <-timer.C: + default: + } + } + }() + + select { + case <-ctx.Done(): + return ctx.Err() + case <-timer.C: + return nil + } +} + // isClaudeCodeClient 判断请求是否来自 Claude Code 客户端 // 简化判断:User-Agent 匹配 + metadata.user_id 存在 func isClaudeCodeClient(userAgent string, metadataUserID string) bool { @@ -1069,7 +1111,8 @@ func (s *GatewayService) Forward(ctx context.Context, c *gin.Context, account *A // 重试循环 var resp *http.Response - for attempt := 1; attempt <= maxRetries; attempt++ { + retryStart := time.Now() + for attempt := 1; attempt <= maxRetryAttempts; attempt++ { // 构建上游请求(每次重试需要重新构建,因为请求体需要重新读取) upstreamReq, err := s.buildUpstreamRequest(ctx, c, account, body, token, tokenType, reqModel) if err != nil { @@ -1079,6 +1122,9 @@ func (s *GatewayService) Forward(ctx context.Context, c *gin.Context, account *A // 发送请求 resp, err = s.httpUpstream.Do(upstreamReq, proxyURL, account.ID, account.Concurrency) if err != nil { + if resp != nil && resp.Body != nil { + _ = resp.Body.Close() + } return nil, fmt.Errorf("upstream request failed: %w", err) } @@ -1089,6 +1135,11 @@ func (s *GatewayService) Forward(ctx context.Context, c *gin.Context, account *A _ = resp.Body.Close() if s.isThinkingBlockSignatureError(respBody) { + // 避免在重试预算已耗尽时再发起额外请求 + if time.Since(retryStart) >= maxRetryElapsed { + resp.Body = io.NopCloser(bytes.NewReader(respBody)) + break + } log.Printf("Account %d: detected thinking block signature error, retrying with filtered thinking blocks", account.ID) // 过滤thinking blocks并重试(使用更激进的过滤) @@ -1121,11 +1172,27 @@ func (s *GatewayService) Forward(ctx context.Context, c *gin.Context, account *A // 检查是否需要通用重试(排除400,因为400已经在上面特殊处理过了) if resp.StatusCode >= 400 && resp.StatusCode != 400 && s.shouldRetryUpstreamError(account, resp.StatusCode) { - if attempt < maxRetries { - log.Printf("Account %d: upstream error %d, retry %d/%d after %v", - account.ID, resp.StatusCode, attempt, maxRetries, retryDelay) + if attempt < maxRetryAttempts { + elapsed := time.Since(retryStart) + if elapsed >= maxRetryElapsed { + break + } + + delay := retryBackoffDelay(attempt) + remaining := maxRetryElapsed - elapsed + if delay > remaining { + delay = remaining + } + if delay <= 0 { + break + } + + log.Printf("Account %d: upstream error %d, retry %d/%d after %v (elapsed=%v/%v)", + account.ID, resp.StatusCode, attempt, maxRetryAttempts, delay, elapsed, maxRetryElapsed) _ = resp.Body.Close() - time.Sleep(retryDelay) + if err := sleepWithContext(ctx, delay); err != nil { + return nil, err + } continue } // 最后一次尝试也失败,跳出循环处理重试耗尽 @@ -1142,6 +1209,9 @@ func (s *GatewayService) Forward(ctx context.Context, c *gin.Context, account *A } break } + if resp == nil || resp.Body == nil { + return nil, errors.New("upstream request failed: empty response") + } defer func() { _ = resp.Body.Close() }() // 处理重试耗尽的情况 diff --git a/frontend/src/components/common/GroupSelector.vue b/frontend/src/components/common/GroupSelector.vue index 5b78808b..c67d32fc 100644 --- a/frontend/src/components/common/GroupSelector.vue +++ b/frontend/src/components/common/GroupSelector.vue @@ -1,8 +1,8 @@ \ No newline at end of file + diff --git a/frontend/src/i18n/locales/zh.ts b/frontend/src/i18n/locales/zh.ts index e3d1cbaf..f452601d 100644 --- a/frontend/src/i18n/locales/zh.ts +++ b/frontend/src/i18n/locales/zh.ts @@ -1611,21 +1611,6 @@ export default { deleteProxy: '删除代理', deleteConfirmMessage: "确定要删除代理 '{name}' 吗?", testProxy: '测试代理', - columns: { - name: '名称', - protocol: '协议', - address: '地址', - priority: '优先级', - status: '状态', - lastCheck: '最近检测', - actions: '操作' - }, - protocols: { - http: 'HTTP', - https: 'HTTPS', - socks5: 'SOCKS5', - socks5h: 'SOCKS5H (服务端解析 DNS)' - }, columns: { nameLabel: '名称', namePlaceholder: '请输入代理名称', diff --git a/frontend/src/views/admin/UsersView.vue b/frontend/src/views/admin/UsersView.vue index 2ee8af08..d2a8833c 100644 --- a/frontend/src/views/admin/UsersView.vue +++ b/frontend/src/views/admin/UsersView.vue @@ -14,29 +14,9 @@
+
- - +
@@ -53,10 +25,6 @@
-
- - -
@@ -71,8 +39,8 @@ @@ -80,39 +48,30 @@ \ No newline at end of file + diff --git a/frontend/src/components/common/SearchInput.vue b/frontend/src/components/common/SearchInput.vue new file mode 100644 index 00000000..d0311a8e --- /dev/null +++ b/frontend/src/components/common/SearchInput.vue @@ -0,0 +1,54 @@ + + + diff --git a/frontend/src/components/common/StatusBadge.vue b/frontend/src/components/common/StatusBadge.vue new file mode 100644 index 00000000..a844b6cc --- /dev/null +++ b/frontend/src/components/common/StatusBadge.vue @@ -0,0 +1,39 @@ + + + diff --git a/frontend/src/components/user/UserAttributeForm.vue b/frontend/src/components/user/UserAttributeForm.vue index 17879c30..96996cdc 100644 --- a/frontend/src/components/user/UserAttributeForm.vue +++ b/frontend/src/components/user/UserAttributeForm.vue @@ -93,13 +93,10 @@ + \ No newline at end of file diff --git a/frontend/src/views/admin/UsersView.vue b/frontend/src/views/admin/UsersView.vue index d2a8833c..47a31270 100644 --- a/frontend/src/views/admin/UsersView.vue +++ b/frontend/src/views/admin/UsersView.vue @@ -4,36 +4,35 @@ @@ -46,6 +45,7 @@ + @@ -54,23 +54,23 @@ - - + + - - - + + From 87426e5ddaa7428c402f34363cb53c45b6aae1e3 Mon Sep 17 00:00:00 2001 From: IanShaw027 <131567472+IanShaw027@users.noreply.github.com> Date: Sun, 4 Jan 2026 22:32:36 +0800 Subject: [PATCH 07/13] =?UTF-8?q?fix(backend):=20=E6=94=B9=E8=BF=9B=20thin?= =?UTF-8?q?king/tool=20block=20=E7=AD=BE=E5=90=8D=E5=A4=84=E7=90=86?= =?UTF-8?q?=E5=92=8C=E9=87=8D=E8=AF=95=E7=AD=96=E7=95=A5?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit 主要改动: - request_transformer: thinking block 缺少签名时降级为文本而非丢弃,保留内容并在上层禁用 thinking mode - antigravity_gateway_service: 新增两阶段降级策略,先处理 thinking blocks,如仍失败且涉及 tool 签名错误则进一步降级 tool blocks - gateway_request: 新增 FilterSignatureSensitiveBlocksForRetry 函数,支持将 tool_use/tool_result 降级为文本 - gateway_request: 改进 FilterThinkingBlocksForRetry,禁用顶层 thinking 配置以避免结构约束冲突 - gateway_service: 实现保守的两阶段重试逻辑,优先保留内容,仅在必要时降级工具调用 - 新增 antigravity_gateway_service_test.go 测试签名块剥离逻辑 - 更新相关测试用例以验证降级行为 此修复解决了跨平台/账户切换时历史消息签名失效导致的请求失败问题。 --- .../pkg/antigravity/request_transformer.go | 40 ++- .../antigravity/request_transformer_test.go | 23 +- .../service/antigravity_gateway_service.go | 237 ++++++++++++++-- .../antigravity_gateway_service_test.go | 83 ++++++ backend/internal/service/gateway_request.go | 262 ++++++++++++++++-- .../internal/service/gateway_request_test.go | 122 ++++++++ backend/internal/service/gateway_service.go | 108 +++++--- .../service/gemini_messages_compat_service.go | 50 ++++ 8 files changed, 815 insertions(+), 110 deletions(-) create mode 100644 backend/internal/service/antigravity_gateway_service_test.go diff --git a/backend/internal/pkg/antigravity/request_transformer.go b/backend/internal/pkg/antigravity/request_transformer.go index 0d2f1a00..ab9a6f09 100644 --- a/backend/internal/pkg/antigravity/request_transformer.go +++ b/backend/internal/pkg/antigravity/request_transformer.go @@ -22,7 +22,7 @@ func TransformClaudeToGemini(claudeReq *ClaudeRequest, projectID, mappedModel st allowDummyThought := strings.HasPrefix(mappedModel, "gemini-") // 1. 构建 contents - contents, err := buildContents(claudeReq.Messages, toolIDToName, isThinkingEnabled, allowDummyThought) + contents, strippedThinking, err := buildContents(claudeReq.Messages, toolIDToName, isThinkingEnabled, allowDummyThought) if err != nil { return nil, fmt.Errorf("build contents: %w", err) } @@ -31,7 +31,15 @@ func TransformClaudeToGemini(claudeReq *ClaudeRequest, projectID, mappedModel st systemInstruction := buildSystemInstruction(claudeReq.System, claudeReq.Model) // 3. 构建 generationConfig - generationConfig := buildGenerationConfig(claudeReq) + reqForConfig := claudeReq + if strippedThinking { + // If we had to downgrade thinking blocks to plain text due to missing/invalid signatures, + // disable upstream thinking mode to avoid signature/structure validation errors. + reqCopy := *claudeReq + reqCopy.Thinking = nil + reqForConfig = &reqCopy + } + generationConfig := buildGenerationConfig(reqForConfig) // 4. 构建 tools tools := buildTools(claudeReq.Tools) @@ -120,8 +128,9 @@ func buildSystemInstruction(system json.RawMessage, modelName string) *GeminiCon } // buildContents 构建 contents -func buildContents(messages []ClaudeMessage, toolIDToName map[string]string, isThinkingEnabled, allowDummyThought bool) ([]GeminiContent, error) { +func buildContents(messages []ClaudeMessage, toolIDToName map[string]string, isThinkingEnabled, allowDummyThought bool) ([]GeminiContent, bool, error) { var contents []GeminiContent + strippedThinking := false for i, msg := range messages { role := msg.Role @@ -129,9 +138,12 @@ func buildContents(messages []ClaudeMessage, toolIDToName map[string]string, isT role = "model" } - parts, err := buildParts(msg.Content, toolIDToName, allowDummyThought) + parts, strippedThisMsg, err := buildParts(msg.Content, toolIDToName, allowDummyThought) if err != nil { - return nil, fmt.Errorf("build parts for message %d: %w", i, err) + return nil, false, fmt.Errorf("build parts for message %d: %w", i, err) + } + if strippedThisMsg { + strippedThinking = true } // 只有 Gemini 模型支持 dummy thinking block workaround @@ -165,7 +177,7 @@ func buildContents(messages []ClaudeMessage, toolIDToName map[string]string, isT }) } - return contents, nil + return contents, strippedThinking, nil } // dummyThoughtSignature 用于跳过 Gemini 3 thought_signature 验证 @@ -174,8 +186,9 @@ const dummyThoughtSignature = "skip_thought_signature_validator" // buildParts 构建消息的 parts // allowDummyThought: 只有 Gemini 模型支持 dummy thought signature -func buildParts(content json.RawMessage, toolIDToName map[string]string, allowDummyThought bool) ([]GeminiPart, error) { +func buildParts(content json.RawMessage, toolIDToName map[string]string, allowDummyThought bool) ([]GeminiPart, bool, error) { var parts []GeminiPart + strippedThinking := false // 尝试解析为字符串 var textContent string @@ -183,13 +196,13 @@ func buildParts(content json.RawMessage, toolIDToName map[string]string, allowDu if textContent != "(no content)" && strings.TrimSpace(textContent) != "" { parts = append(parts, GeminiPart{Text: strings.TrimSpace(textContent)}) } - return parts, nil + return parts, false, nil } // 解析为内容块数组 var blocks []ContentBlock if err := json.Unmarshal(content, &blocks); err != nil { - return nil, fmt.Errorf("parse content blocks: %w", err) + return nil, false, fmt.Errorf("parse content blocks: %w", err) } for _, block := range blocks { @@ -208,8 +221,11 @@ func buildParts(content json.RawMessage, toolIDToName map[string]string, allowDu if block.Signature != "" { part.ThoughtSignature = block.Signature } else if !allowDummyThought { - // Claude 模型需要有效 signature,跳过无 signature 的 thinking block - log.Printf("Warning: skipping thinking block without signature for Claude model") + // Claude 模型需要有效 signature;在缺失时降级为普通文本,并在上层禁用 thinking mode。 + if strings.TrimSpace(block.Thinking) != "" { + parts = append(parts, GeminiPart{Text: block.Thinking}) + } + strippedThinking = true continue } else { // Gemini 模型使用 dummy signature @@ -276,7 +292,7 @@ func buildParts(content json.RawMessage, toolIDToName map[string]string, allowDu } } - return parts, nil + return parts, strippedThinking, nil } // parseToolResultContent 解析 tool_result 的 content diff --git a/backend/internal/pkg/antigravity/request_transformer_test.go b/backend/internal/pkg/antigravity/request_transformer_test.go index d3a1d918..60ee6f63 100644 --- a/backend/internal/pkg/antigravity/request_transformer_test.go +++ b/backend/internal/pkg/antigravity/request_transformer_test.go @@ -15,15 +15,15 @@ func TestBuildParts_ThinkingBlockWithoutSignature(t *testing.T) { description string }{ { - name: "Claude model - drop thinking without signature", + name: "Claude model - downgrade thinking to text without signature", content: `[ {"type": "text", "text": "Hello"}, {"type": "thinking", "thinking": "Let me think...", "signature": ""}, {"type": "text", "text": "World"} ]`, allowDummyThought: false, - expectedParts: 2, // thinking 内容被丢弃 - description: "Claude模型应丢弃无signature的thinking block内容", + expectedParts: 3, // thinking 内容降级为普通 text part + description: "Claude模型缺少signature时应将thinking降级为text,并在上层禁用thinking mode", }, { name: "Claude model - preserve thinking block with signature", @@ -52,7 +52,7 @@ func TestBuildParts_ThinkingBlockWithoutSignature(t *testing.T) { for _, tt := range tests { t.Run(tt.name, func(t *testing.T) { toolIDToName := make(map[string]string) - parts, err := buildParts(json.RawMessage(tt.content), toolIDToName, tt.allowDummyThought) + parts, _, err := buildParts(json.RawMessage(tt.content), toolIDToName, tt.allowDummyThought) if err != nil { t.Fatalf("buildParts() error = %v", err) @@ -71,6 +71,17 @@ func TestBuildParts_ThinkingBlockWithoutSignature(t *testing.T) { t.Fatalf("expected thought part with signature sig_real_123, got thought=%v signature=%q", parts[1].Thought, parts[1].ThoughtSignature) } + case "Claude model - downgrade thinking to text without signature": + if len(parts) != 3 { + t.Fatalf("expected 3 parts, got %d", len(parts)) + } + if parts[1].Thought { + t.Fatalf("expected downgraded text part, got thought=%v signature=%q", + parts[1].Thought, parts[1].ThoughtSignature) + } + if parts[1].Text != "Let me think..." { + t.Fatalf("expected downgraded text %q, got %q", "Let me think...", parts[1].Text) + } case "Gemini model - use dummy signature": if len(parts) != 3 { t.Fatalf("expected 3 parts, got %d", len(parts)) @@ -91,7 +102,7 @@ func TestBuildParts_ToolUseSignatureHandling(t *testing.T) { t.Run("Gemini uses dummy tool_use signature", func(t *testing.T) { toolIDToName := make(map[string]string) - parts, err := buildParts(json.RawMessage(content), toolIDToName, true) + parts, _, err := buildParts(json.RawMessage(content), toolIDToName, true) if err != nil { t.Fatalf("buildParts() error = %v", err) } @@ -105,7 +116,7 @@ func TestBuildParts_ToolUseSignatureHandling(t *testing.T) { t.Run("Claude model - preserve valid signature for tool_use", func(t *testing.T) { toolIDToName := make(map[string]string) - parts, err := buildParts(json.RawMessage(content), toolIDToName, false) + parts, _, err := buildParts(json.RawMessage(content), toolIDToName, false) if err != nil { t.Fatalf("buildParts() error = %v", err) } diff --git a/backend/internal/service/antigravity_gateway_service.go b/backend/internal/service/antigravity_gateway_service.go index cbe78ea5..835ffa0a 100644 --- a/backend/internal/service/antigravity_gateway_service.go +++ b/backend/internal/service/antigravity_gateway_service.go @@ -443,35 +443,70 @@ func (s *AntigravityGatewayService) Forward(ctx context.Context, c *gin.Context, // Antigravity /v1internal 链路在部分场景会对 thought/thinking signature 做严格校验, // 当历史消息携带的 signature 不合法时会直接 400;去除 thinking 后可继续完成请求。 if resp.StatusCode == http.StatusBadRequest && isSignatureRelatedError(respBody) { - retryClaudeReq := claudeReq - retryClaudeReq.Messages = append([]antigravity.ClaudeMessage(nil), claudeReq.Messages...) + // Conservative two-stage fallback: + // 1) Disable top-level thinking + thinking->text + // 2) Only if still signature-related 400: also downgrade tool_use/tool_result to text. - stripped, stripErr := stripThinkingFromClaudeRequest(&retryClaudeReq) - if stripErr == nil && stripped { - log.Printf("Antigravity account %d: detected signature-related 400, retrying once without thinking blocks", account.ID) + retryStages := []struct { + name string + strip func(*antigravity.ClaudeRequest) (bool, error) + }{ + {name: "thinking-only", strip: stripThinkingFromClaudeRequest}, + {name: "thinking+tools", strip: stripSignatureSensitiveBlocksFromClaudeRequest}, + } + + for _, stage := range retryStages { + retryClaudeReq := claudeReq + retryClaudeReq.Messages = append([]antigravity.ClaudeMessage(nil), claudeReq.Messages...) + + stripped, stripErr := stage.strip(&retryClaudeReq) + if stripErr != nil || !stripped { + continue + } + + log.Printf("Antigravity account %d: detected signature-related 400, retrying once (%s)", account.ID, stage.name) retryGeminiBody, txErr := antigravity.TransformClaudeToGemini(&retryClaudeReq, projectID, mappedModel) - if txErr == nil { - retryReq, buildErr := antigravity.NewAPIRequest(ctx, action, accessToken, retryGeminiBody) - if buildErr == nil { - retryResp, retryErr := s.httpUpstream.Do(retryReq, proxyURL, account.ID, account.Concurrency) - if retryErr == nil { - // Retry success: continue normal success flow with the new response. - if retryResp.StatusCode < 400 { - _ = resp.Body.Close() - resp = retryResp - respBody = nil - } else { - // Retry still errored: replace error context with retry response. - retryBody, _ := io.ReadAll(io.LimitReader(retryResp.Body, 2<<20)) - _ = retryResp.Body.Close() - respBody = retryBody - resp = retryResp - } - } else { - log.Printf("Antigravity account %d: signature retry request failed: %v", account.ID, retryErr) - } + if txErr != nil { + continue + } + retryReq, buildErr := antigravity.NewAPIRequest(ctx, action, accessToken, retryGeminiBody) + if buildErr != nil { + continue + } + retryResp, retryErr := s.httpUpstream.Do(retryReq, proxyURL, account.ID, account.Concurrency) + if retryErr != nil { + log.Printf("Antigravity account %d: signature retry request failed (%s): %v", account.ID, stage.name, retryErr) + continue + } + + if retryResp.StatusCode < 400 { + _ = resp.Body.Close() + resp = retryResp + respBody = nil + break + } + + retryBody, _ := io.ReadAll(io.LimitReader(retryResp.Body, 2<<20)) + _ = retryResp.Body.Close() + + // If this stage fixed the signature issue, we stop; otherwise we may try the next stage. + if retryResp.StatusCode != http.StatusBadRequest || !isSignatureRelatedError(retryBody) { + respBody = retryBody + resp = &http.Response{ + StatusCode: retryResp.StatusCode, + Header: retryResp.Header.Clone(), + Body: io.NopCloser(bytes.NewReader(retryBody)), } + break + } + + // Still signature-related; capture context and allow next stage. + respBody = retryBody + resp = &http.Response{ + StatusCode: retryResp.StatusCode, + Header: retryResp.Header.Clone(), + Body: io.NopCloser(bytes.NewReader(retryBody)), } } } @@ -555,7 +590,7 @@ func extractAntigravityErrorMessage(body []byte) string { // stripThinkingFromClaudeRequest converts thinking blocks to text blocks in a Claude Messages request. // This preserves the thinking content while avoiding signature validation errors. // Note: redacted_thinking blocks are removed because they cannot be converted to text. -// It also disables top-level `thinking` to prevent dummy-thought injection during retry. +// It also disables top-level `thinking` to avoid upstream structural constraints for thinking mode. func stripThinkingFromClaudeRequest(req *antigravity.ClaudeRequest) (bool, error) { if req == nil { return false, nil @@ -585,6 +620,92 @@ func stripThinkingFromClaudeRequest(req *antigravity.ClaudeRequest) (bool, error continue } + filtered := make([]map[string]any, 0, len(blocks)) + modifiedAny := false + for _, block := range blocks { + t, _ := block["type"].(string) + switch t { + case "thinking": + thinkingText, _ := block["thinking"].(string) + if thinkingText != "" { + filtered = append(filtered, map[string]any{ + "type": "text", + "text": thinkingText, + }) + } + modifiedAny = true + case "redacted_thinking": + modifiedAny = true + case "": + if thinkingText, hasThinking := block["thinking"].(string); hasThinking { + if thinkingText != "" { + filtered = append(filtered, map[string]any{ + "type": "text", + "text": thinkingText, + }) + } + modifiedAny = true + } else { + filtered = append(filtered, block) + } + default: + filtered = append(filtered, block) + } + } + + if !modifiedAny { + continue + } + + if len(filtered) == 0 { + filtered = append(filtered, map[string]any{ + "type": "text", + "text": "(content removed)", + }) + } + + newRaw, err := json.Marshal(filtered) + if err != nil { + return changed, err + } + req.Messages[i].Content = newRaw + changed = true + } + + return changed, nil +} + +// stripSignatureSensitiveBlocksFromClaudeRequest is a stronger retry degradation that additionally converts +// tool blocks to plain text. Use this only after a thinking-only retry still fails with signature errors. +func stripSignatureSensitiveBlocksFromClaudeRequest(req *antigravity.ClaudeRequest) (bool, error) { + if req == nil { + return false, nil + } + + changed := false + if req.Thinking != nil { + req.Thinking = nil + changed = true + } + + for i := range req.Messages { + raw := req.Messages[i].Content + if len(raw) == 0 { + continue + } + + // If content is a string, nothing to strip. + var str string + if json.Unmarshal(raw, &str) == nil { + continue + } + + // Otherwise treat as an array of blocks and convert signature-sensitive blocks to text. + var blocks []map[string]any + if err := json.Unmarshal(raw, &blocks); err != nil { + continue + } + filtered := make([]map[string]any, 0, len(blocks)) modifiedAny := false for _, block := range blocks { @@ -603,6 +724,49 @@ func stripThinkingFromClaudeRequest(req *antigravity.ClaudeRequest) (bool, error case "redacted_thinking": // Remove redacted_thinking (cannot convert encrypted content) modifiedAny = true + case "tool_use": + // Convert tool_use to text to avoid upstream signature/thought_signature validation errors. + // This is a retry-only degradation path, so we prioritise request validity over tool semantics. + name, _ := block["name"].(string) + id, _ := block["id"].(string) + input := block["input"] + inputJSON, _ := json.Marshal(input) + text := "(tool_use)" + if name != "" { + text += " name=" + name + } + if id != "" { + text += " id=" + id + } + if len(inputJSON) > 0 && string(inputJSON) != "null" { + text += " input=" + string(inputJSON) + } + filtered = append(filtered, map[string]any{ + "type": "text", + "text": text, + }) + modifiedAny = true + case "tool_result": + // Convert tool_result to text so it stays consistent when tool_use is downgraded. + toolUseID, _ := block["tool_use_id"].(string) + isError, _ := block["is_error"].(bool) + content := block["content"] + contentJSON, _ := json.Marshal(content) + text := "(tool_result)" + if toolUseID != "" { + text += " tool_use_id=" + toolUseID + } + if isError { + text += " is_error=true" + } + if len(contentJSON) > 0 && string(contentJSON) != "null" { + text += "\n" + string(contentJSON) + } + filtered = append(filtered, map[string]any{ + "type": "text", + "text": text, + }) + modifiedAny = true case "": // Handle untyped block with "thinking" field if thinkingText, hasThinking := block["thinking"].(string); hasThinking { @@ -625,6 +789,14 @@ func stripThinkingFromClaudeRequest(req *antigravity.ClaudeRequest) (bool, error continue } + if len(filtered) == 0 { + // Keep request valid: upstream rejects empty content arrays. + filtered = append(filtered, map[string]any{ + "type": "text", + "text": "(content removed)", + }) + } + newRaw, err := json.Marshal(filtered) if err != nil { return changed, err @@ -747,11 +919,18 @@ func (s *AntigravityGatewayService) ForwardGemini(ctx context.Context, c *gin.Co break } - defer func() { _ = resp.Body.Close() }() + defer func() { + if resp != nil && resp.Body != nil { + _ = resp.Body.Close() + } + }() // 处理错误响应 if resp.StatusCode >= 400 { respBody, _ := io.ReadAll(io.LimitReader(resp.Body, 2<<20)) + // 尽早关闭原始响应体,释放连接;后续逻辑仍可能需要读取 body,因此用内存副本重新包装。 + _ = resp.Body.Close() + resp.Body = io.NopCloser(bytes.NewReader(respBody)) // 模型兜底:模型不存在且开启 fallback 时,自动用 fallback 模型重试一次 if s.settingService != nil && s.settingService.IsModelFallbackEnabled(ctx) && @@ -760,15 +939,13 @@ func (s *AntigravityGatewayService) ForwardGemini(ctx context.Context, c *gin.Co if fallbackModel != "" && fallbackModel != mappedModel { log.Printf("[Antigravity] Model not found (%s), retrying with fallback model %s (account: %s)", mappedModel, fallbackModel, account.Name) - // 关闭原始响应,释放连接(respBody 已读取到内存) - _ = resp.Body.Close() - fallbackWrapped, err := s.wrapV1InternalRequest(projectID, fallbackModel, body) if err == nil { fallbackReq, err := antigravity.NewAPIRequest(ctx, upstreamAction, accessToken, fallbackWrapped) if err == nil { fallbackResp, err := s.httpUpstream.Do(fallbackReq, proxyURL, account.ID, account.Concurrency) if err == nil && fallbackResp.StatusCode < 400 { + _ = resp.Body.Close() resp = fallbackResp } else if fallbackResp != nil { _ = fallbackResp.Body.Close() diff --git a/backend/internal/service/antigravity_gateway_service_test.go b/backend/internal/service/antigravity_gateway_service_test.go new file mode 100644 index 00000000..c3d9ce4c --- /dev/null +++ b/backend/internal/service/antigravity_gateway_service_test.go @@ -0,0 +1,83 @@ +package service + +import ( + "encoding/json" + "testing" + + "github.com/Wei-Shaw/sub2api/internal/pkg/antigravity" + "github.com/stretchr/testify/require" +) + +func TestStripSignatureSensitiveBlocksFromClaudeRequest(t *testing.T) { + req := &antigravity.ClaudeRequest{ + Model: "claude-sonnet-4-5", + Thinking: &antigravity.ThinkingConfig{ + Type: "enabled", + BudgetTokens: 1024, + }, + Messages: []antigravity.ClaudeMessage{ + { + Role: "assistant", + Content: json.RawMessage(`[ + {"type":"thinking","thinking":"secret plan","signature":""}, + {"type":"tool_use","id":"t1","name":"Bash","input":{"command":"ls"}} + ]`), + }, + { + Role: "user", + Content: json.RawMessage(`[ + {"type":"tool_result","tool_use_id":"t1","content":"ok","is_error":false}, + {"type":"redacted_thinking","data":"..."} + ]`), + }, + }, + } + + changed, err := stripSignatureSensitiveBlocksFromClaudeRequest(req) + require.NoError(t, err) + require.True(t, changed) + require.Nil(t, req.Thinking) + + require.Len(t, req.Messages, 2) + + var blocks0 []map[string]any + require.NoError(t, json.Unmarshal(req.Messages[0].Content, &blocks0)) + require.Len(t, blocks0, 2) + require.Equal(t, "text", blocks0[0]["type"]) + require.Equal(t, "secret plan", blocks0[0]["text"]) + require.Equal(t, "text", blocks0[1]["type"]) + + var blocks1 []map[string]any + require.NoError(t, json.Unmarshal(req.Messages[1].Content, &blocks1)) + require.Len(t, blocks1, 1) + require.Equal(t, "text", blocks1[0]["type"]) + require.NotEmpty(t, blocks1[0]["text"]) +} + +func TestStripThinkingFromClaudeRequest_DoesNotDowngradeTools(t *testing.T) { + req := &antigravity.ClaudeRequest{ + Model: "claude-sonnet-4-5", + Thinking: &antigravity.ThinkingConfig{ + Type: "enabled", + BudgetTokens: 1024, + }, + Messages: []antigravity.ClaudeMessage{ + { + Role: "assistant", + Content: json.RawMessage(`[{"type":"thinking","thinking":"secret plan"},{"type":"tool_use","id":"t1","name":"Bash","input":{"command":"ls"}}]`), + }, + }, + } + + changed, err := stripThinkingFromClaudeRequest(req) + require.NoError(t, err) + require.True(t, changed) + require.Nil(t, req.Thinking) + + var blocks []map[string]any + require.NoError(t, json.Unmarshal(req.Messages[0].Content, &blocks)) + require.Len(t, blocks, 2) + require.Equal(t, "text", blocks[0]["type"]) + require.Equal(t, "secret plan", blocks[0]["text"]) + require.Equal(t, "tool_use", blocks[1]["type"]) +} diff --git a/backend/internal/service/gateway_request.go b/backend/internal/service/gateway_request.go index 741fceaf..8e94dad2 100644 --- a/backend/internal/service/gateway_request.go +++ b/backend/internal/service/gateway_request.go @@ -84,25 +84,28 @@ func FilterThinkingBlocks(body []byte) []byte { return filterThinkingBlocksInternal(body, false) } -// FilterThinkingBlocksForRetry removes thinking blocks from HISTORICAL messages for retry scenarios. -// This is used when upstream returns signature-related 400 errors. +// FilterThinkingBlocksForRetry strips thinking-related constructs for retry scenarios. // -// Key insight: -// - User's thinking.type = "enabled" should be PRESERVED (user's intent) -// - Only HISTORICAL assistant messages have thinking blocks with signatures -// - These signatures may be invalid when switching accounts/platforms -// - New responses will generate fresh thinking blocks without signature issues +// Why: +// - Upstreams may reject historical `thinking`/`redacted_thinking` blocks due to invalid/missing signatures. +// - Anthropic extended thinking has a structural constraint: when top-level `thinking` is enabled and the +// final message is an assistant prefill, the assistant content must start with a thinking block. +// - If we remove thinking blocks but keep top-level `thinking` enabled, we can trigger: +// "Expected `thinking` or `redacted_thinking`, but found `text`" // -// Strategy: -// - Keep thinking.type = "enabled" (preserve user intent) -// - Remove thinking/redacted_thinking blocks from historical assistant messages -// - Ensure no message has empty content after filtering +// Strategy (B: preserve content as text): +// - Disable top-level `thinking` (remove `thinking` field). +// - Convert `thinking` blocks to `text` blocks (preserve the thinking content). +// - Remove `redacted_thinking` blocks (cannot be converted to text). +// - Ensure no message ends up with empty content. func FilterThinkingBlocksForRetry(body []byte) []byte { - // Fast path: check for presence of thinking-related keys in messages + // Fast path: check for presence of thinking-related keys in messages or top-level thinking config. if !bytes.Contains(body, []byte(`"type":"thinking"`)) && !bytes.Contains(body, []byte(`"type": "thinking"`)) && !bytes.Contains(body, []byte(`"type":"redacted_thinking"`)) && - !bytes.Contains(body, []byte(`"type": "redacted_thinking"`)) { + !bytes.Contains(body, []byte(`"type": "redacted_thinking"`)) && + !bytes.Contains(body, []byte(`"thinking":`)) && + !bytes.Contains(body, []byte(`"thinking" :`)) { return body } @@ -111,15 +114,19 @@ func FilterThinkingBlocksForRetry(body []byte) []byte { return body } - // DO NOT modify thinking.type - preserve user's intent to use thinking mode - // The issue is with historical message signatures, not the thinking mode itself + modified := false messages, ok := req["messages"].([]any) if !ok { return body } - modified := false + // Disable top-level thinking mode for retry to avoid structural/signature constraints upstream. + if _, exists := req["thinking"]; exists { + delete(req, "thinking") + modified = true + } + newMessages := make([]any, 0, len(messages)) for _, msg := range messages { @@ -149,13 +156,42 @@ func FilterThinkingBlocksForRetry(body []byte) []byte { blockType, _ := blockMap["type"].(string) - // Remove thinking/redacted_thinking blocks from historical messages - // These have signatures that may be invalid across different accounts - if blockType == "thinking" || blockType == "redacted_thinking" { + // Convert thinking blocks to text (preserve content) and drop redacted_thinking. + switch blockType { + case "thinking": + modifiedThisMsg = true + thinkingText, _ := blockMap["thinking"].(string) + if thinkingText == "" { + continue + } + newContent = append(newContent, map[string]any{ + "type": "text", + "text": thinkingText, + }) + continue + case "redacted_thinking": modifiedThisMsg = true continue } + // Handle blocks without type discriminator but with a "thinking" field. + if blockType == "" { + if rawThinking, hasThinking := blockMap["thinking"]; hasThinking { + modifiedThisMsg = true + switch v := rawThinking.(type) { + case string: + if v != "" { + newContent = append(newContent, map[string]any{"type": "text", "text": v}) + } + default: + if b, err := json.Marshal(v); err == nil && len(b) > 0 { + newContent = append(newContent, map[string]any{"type": "text", "text": string(b)}) + } + } + continue + } + } + newContent = append(newContent, block) } @@ -163,18 +199,15 @@ func FilterThinkingBlocksForRetry(body []byte) []byte { modified = true // Handle empty content after filtering if len(newContent) == 0 { - // For assistant messages, skip entirely (remove from conversation) - // For user messages, add placeholder to avoid empty content error - if role == "user" { - newContent = append(newContent, map[string]any{ - "type": "text", - "text": "(content removed)", - }) - msgMap["content"] = newContent - newMessages = append(newMessages, msgMap) + // Always add a placeholder to avoid upstream "non-empty content" errors. + placeholder := "(content removed)" + if role == "assistant" { + placeholder = "(assistant content removed)" } - // Skip assistant messages with empty content (don't append) - continue + newContent = append(newContent, map[string]any{ + "type": "text", + "text": placeholder, + }) } msgMap["content"] = newContent } @@ -183,6 +216,9 @@ func FilterThinkingBlocksForRetry(body []byte) []byte { if modified { req["messages"] = newMessages + } else { + // Avoid rewriting JSON when no changes are needed. + return body } newBody, err := json.Marshal(req) @@ -192,6 +228,172 @@ func FilterThinkingBlocksForRetry(body []byte) []byte { return newBody } +// FilterSignatureSensitiveBlocksForRetry is a stronger retry filter for cases where upstream errors indicate +// signature/thought_signature validation issues involving tool blocks. +// +// This performs everything in FilterThinkingBlocksForRetry, plus: +// - Convert `tool_use` blocks to text (name/id/input) so we stop sending structured tool calls. +// - Convert `tool_result` blocks to text so we keep tool results visible without tool semantics. +// +// Use this only when needed: converting tool blocks to text changes model behaviour and can increase the +// risk of prompt injection (tool output becomes plain conversation text). +func FilterSignatureSensitiveBlocksForRetry(body []byte) []byte { + // Fast path: only run when we see likely relevant constructs. + if !bytes.Contains(body, []byte(`"type":"thinking"`)) && + !bytes.Contains(body, []byte(`"type": "thinking"`)) && + !bytes.Contains(body, []byte(`"type":"redacted_thinking"`)) && + !bytes.Contains(body, []byte(`"type": "redacted_thinking"`)) && + !bytes.Contains(body, []byte(`"type":"tool_use"`)) && + !bytes.Contains(body, []byte(`"type": "tool_use"`)) && + !bytes.Contains(body, []byte(`"type":"tool_result"`)) && + !bytes.Contains(body, []byte(`"type": "tool_result"`)) && + !bytes.Contains(body, []byte(`"thinking":`)) && + !bytes.Contains(body, []byte(`"thinking" :`)) { + return body + } + + var req map[string]any + if err := json.Unmarshal(body, &req); err != nil { + return body + } + + modified := false + + // Disable top-level thinking for retry to avoid structural/signature constraints upstream. + if _, exists := req["thinking"]; exists { + delete(req, "thinking") + modified = true + } + + messages, ok := req["messages"].([]any) + if !ok { + return body + } + + newMessages := make([]any, 0, len(messages)) + + for _, msg := range messages { + msgMap, ok := msg.(map[string]any) + if !ok { + newMessages = append(newMessages, msg) + continue + } + + role, _ := msgMap["role"].(string) + content, ok := msgMap["content"].([]any) + if !ok { + newMessages = append(newMessages, msg) + continue + } + + newContent := make([]any, 0, len(content)) + modifiedThisMsg := false + + for _, block := range content { + blockMap, ok := block.(map[string]any) + if !ok { + newContent = append(newContent, block) + continue + } + + blockType, _ := blockMap["type"].(string) + switch blockType { + case "thinking": + modifiedThisMsg = true + thinkingText, _ := blockMap["thinking"].(string) + if thinkingText == "" { + continue + } + newContent = append(newContent, map[string]any{"type": "text", "text": thinkingText}) + continue + case "redacted_thinking": + modifiedThisMsg = true + continue + case "tool_use": + modifiedThisMsg = true + name, _ := blockMap["name"].(string) + id, _ := blockMap["id"].(string) + input := blockMap["input"] + inputJSON, _ := json.Marshal(input) + text := "(tool_use)" + if name != "" { + text += " name=" + name + } + if id != "" { + text += " id=" + id + } + if len(inputJSON) > 0 && string(inputJSON) != "null" { + text += " input=" + string(inputJSON) + } + newContent = append(newContent, map[string]any{"type": "text", "text": text}) + continue + case "tool_result": + modifiedThisMsg = true + toolUseID, _ := blockMap["tool_use_id"].(string) + isError, _ := blockMap["is_error"].(bool) + content := blockMap["content"] + contentJSON, _ := json.Marshal(content) + text := "(tool_result)" + if toolUseID != "" { + text += " tool_use_id=" + toolUseID + } + if isError { + text += " is_error=true" + } + if len(contentJSON) > 0 && string(contentJSON) != "null" { + text += "\n" + string(contentJSON) + } + newContent = append(newContent, map[string]any{"type": "text", "text": text}) + continue + } + + if blockType == "" { + if rawThinking, hasThinking := blockMap["thinking"]; hasThinking { + modifiedThisMsg = true + switch v := rawThinking.(type) { + case string: + if v != "" { + newContent = append(newContent, map[string]any{"type": "text", "text": v}) + } + default: + if b, err := json.Marshal(v); err == nil && len(b) > 0 { + newContent = append(newContent, map[string]any{"type": "text", "text": string(b)}) + } + } + continue + } + } + + newContent = append(newContent, block) + } + + if modifiedThisMsg { + modified = true + if len(newContent) == 0 { + placeholder := "(content removed)" + if role == "assistant" { + placeholder = "(assistant content removed)" + } + newContent = append(newContent, map[string]any{"type": "text", "text": placeholder}) + } + msgMap["content"] = newContent + } + + newMessages = append(newMessages, msgMap) + } + + if !modified { + return body + } + + req["messages"] = newMessages + newBody, err := json.Marshal(req) + if err != nil { + return body + } + return newBody +} + // filterThinkingBlocksInternal removes invalid thinking blocks from request // Strategy: // - When thinking.type != "enabled": Remove all thinking blocks diff --git a/backend/internal/service/gateway_request_test.go b/backend/internal/service/gateway_request_test.go index eb8af1da..8bcc1ee1 100644 --- a/backend/internal/service/gateway_request_test.go +++ b/backend/internal/service/gateway_request_test.go @@ -151,3 +151,125 @@ func TestFilterThinkingBlocks(t *testing.T) { }) } } + +func TestFilterThinkingBlocksForRetry_DisablesThinkingAndPreservesAsText(t *testing.T) { + input := []byte(`{ + "model":"claude-3-5-sonnet-20241022", + "thinking":{"type":"enabled","budget_tokens":1024}, + "messages":[ + {"role":"user","content":[{"type":"text","text":"Hi"}]}, + {"role":"assistant","content":[ + {"type":"thinking","thinking":"Let me think...","signature":"bad_sig"}, + {"type":"text","text":"Answer"} + ]} + ] + }`) + + out := FilterThinkingBlocksForRetry(input) + + var req map[string]any + require.NoError(t, json.Unmarshal(out, &req)) + _, hasThinking := req["thinking"] + require.False(t, hasThinking) + + msgs, ok := req["messages"].([]any) + require.True(t, ok) + require.Len(t, msgs, 2) + + assistant := msgs[1].(map[string]any) + content := assistant["content"].([]any) + require.Len(t, content, 2) + + first := content[0].(map[string]any) + require.Equal(t, "text", first["type"]) + require.Equal(t, "Let me think...", first["text"]) +} + +func TestFilterThinkingBlocksForRetry_DisablesThinkingEvenWithoutThinkingBlocks(t *testing.T) { + input := []byte(`{ + "model":"claude-3-5-sonnet-20241022", + "thinking":{"type":"enabled","budget_tokens":1024}, + "messages":[ + {"role":"user","content":[{"type":"text","text":"Hi"}]}, + {"role":"assistant","content":[{"type":"text","text":"Prefill"}]} + ] + }`) + + out := FilterThinkingBlocksForRetry(input) + + var req map[string]any + require.NoError(t, json.Unmarshal(out, &req)) + _, hasThinking := req["thinking"] + require.False(t, hasThinking) +} + +func TestFilterThinkingBlocksForRetry_RemovesRedactedThinkingAndKeepsValidContent(t *testing.T) { + input := []byte(`{ + "thinking":{"type":"enabled","budget_tokens":1024}, + "messages":[ + {"role":"assistant","content":[ + {"type":"redacted_thinking","data":"..."}, + {"type":"text","text":"Visible"} + ]} + ] + }`) + + out := FilterThinkingBlocksForRetry(input) + + var req map[string]any + require.NoError(t, json.Unmarshal(out, &req)) + _, hasThinking := req["thinking"] + require.False(t, hasThinking) + + msgs := req["messages"].([]any) + content := msgs[0].(map[string]any)["content"].([]any) + require.Len(t, content, 1) + require.Equal(t, "text", content[0].(map[string]any)["type"]) + require.Equal(t, "Visible", content[0].(map[string]any)["text"]) +} + +func TestFilterThinkingBlocksForRetry_EmptyContentGetsPlaceholder(t *testing.T) { + input := []byte(`{ + "thinking":{"type":"enabled"}, + "messages":[ + {"role":"assistant","content":[{"type":"redacted_thinking","data":"..."}]} + ] + }`) + + out := FilterThinkingBlocksForRetry(input) + + var req map[string]any + require.NoError(t, json.Unmarshal(out, &req)) + msgs := req["messages"].([]any) + content := msgs[0].(map[string]any)["content"].([]any) + require.Len(t, content, 1) + require.Equal(t, "text", content[0].(map[string]any)["type"]) + require.NotEmpty(t, content[0].(map[string]any)["text"]) +} + +func TestFilterSignatureSensitiveBlocksForRetry_DowngradesTools(t *testing.T) { + input := []byte(`{ + "thinking":{"type":"enabled","budget_tokens":1024}, + "messages":[ + {"role":"assistant","content":[ + {"type":"tool_use","id":"t1","name":"Bash","input":{"command":"ls"}}, + {"type":"tool_result","tool_use_id":"t1","content":"ok","is_error":false} + ]} + ] + }`) + + out := FilterSignatureSensitiveBlocksForRetry(input) + + var req map[string]any + require.NoError(t, json.Unmarshal(out, &req)) + _, hasThinking := req["thinking"] + require.False(t, hasThinking) + + msgs := req["messages"].([]any) + content := msgs[0].(map[string]any)["content"].([]any) + require.Len(t, content, 2) + require.Equal(t, "text", content[0].(map[string]any)["type"]) + require.Equal(t, "text", content[1].(map[string]any)["type"]) + require.Contains(t, content[0].(map[string]any)["text"], "tool_use") + require.Contains(t, content[1].(map[string]any)["text"], "tool_result") +} diff --git a/backend/internal/service/gateway_service.go b/backend/internal/service/gateway_service.go index ae633c65..c706fb80 100644 --- a/backend/internal/service/gateway_service.go +++ b/backend/internal/service/gateway_service.go @@ -1131,46 +1131,90 @@ func (s *GatewayService) Forward(ctx context.Context, c *gin.Context, account *A // 优先检测thinking block签名错误(400)并重试一次 if resp.StatusCode == 400 { respBody, readErr := io.ReadAll(io.LimitReader(resp.Body, 2<<20)) - if readErr == nil { - _ = resp.Body.Close() + if readErr == nil { + _ = resp.Body.Close() - if s.isThinkingBlockSignatureError(respBody) { - // 避免在重试预算已耗尽时再发起额外请求 - if time.Since(retryStart) >= maxRetryElapsed { - resp.Body = io.NopCloser(bytes.NewReader(respBody)) - break + if s.isThinkingBlockSignatureError(respBody) { + looksLikeToolSignatureError := func(msg string) bool { + m := strings.ToLower(msg) + return strings.Contains(m, "tool_use") || + strings.Contains(m, "tool_result") || + strings.Contains(m, "functioncall") || + strings.Contains(m, "function_call") || + strings.Contains(m, "functionresponse") || + strings.Contains(m, "function_response") + } + + // 避免在重试预算已耗尽时再发起额外请求 + if time.Since(retryStart) >= maxRetryElapsed { + resp.Body = io.NopCloser(bytes.NewReader(respBody)) + break } log.Printf("Account %d: detected thinking block signature error, retrying with filtered thinking blocks", account.ID) - // 过滤thinking blocks并重试(使用更激进的过滤) - filteredBody := FilterThinkingBlocksForRetry(body) - retryReq, buildErr := s.buildUpstreamRequest(ctx, c, account, filteredBody, token, tokenType, reqModel) - if buildErr == nil { - retryResp, retryErr := s.httpUpstream.Do(retryReq, proxyURL, account.ID, account.Concurrency) - if retryErr == nil { - // 使用重试后的响应,继续后续处理 - if retryResp.StatusCode < 400 { - log.Printf("Account %d: signature error retry succeeded", account.ID) - } else { - log.Printf("Account %d: signature error retry returned status %d", account.ID, retryResp.StatusCode) + // Conservative two-stage fallback: + // 1) Disable thinking + thinking->text (preserve content) + // 2) Only if upstream still errors AND error message points to tool/function signature issues: + // also downgrade tool_use/tool_result blocks to text. + + filteredBody := FilterThinkingBlocksForRetry(body) + retryReq, buildErr := s.buildUpstreamRequest(ctx, c, account, filteredBody, token, tokenType, reqModel) + if buildErr == nil { + retryResp, retryErr := s.httpUpstream.Do(retryReq, proxyURL, account.ID, account.Concurrency) + if retryErr == nil { + if retryResp.StatusCode < 400 { + log.Printf("Account %d: signature error retry succeeded (thinking downgraded)", account.ID) + resp = retryResp + break + } + + retryRespBody, retryReadErr := io.ReadAll(io.LimitReader(retryResp.Body, 2<<20)) + _ = retryResp.Body.Close() + if retryReadErr == nil && retryResp.StatusCode == 400 && s.isThinkingBlockSignatureError(retryRespBody) { + msg2 := extractUpstreamErrorMessage(retryRespBody) + if looksLikeToolSignatureError(msg2) && time.Since(retryStart) < maxRetryElapsed { + log.Printf("Account %d: signature retry still failing and looks tool-related, retrying with tool blocks downgraded", account.ID) + filteredBody2 := FilterSignatureSensitiveBlocksForRetry(body) + retryReq2, buildErr2 := s.buildUpstreamRequest(ctx, c, account, filteredBody2, token, tokenType, reqModel) + if buildErr2 == nil { + retryResp2, retryErr2 := s.httpUpstream.Do(retryReq2, proxyURL, account.ID, account.Concurrency) + if retryErr2 == nil { + resp = retryResp2 + break + } + if retryResp2 != nil && retryResp2.Body != nil { + _ = retryResp2.Body.Close() + } + log.Printf("Account %d: tool-downgrade signature retry failed: %v", account.ID, retryErr2) + } else { + log.Printf("Account %d: tool-downgrade signature retry build failed: %v", account.ID, buildErr2) + } + } + } + + // Fall back to the original retry response context. + resp = &http.Response{ + StatusCode: retryResp.StatusCode, + Header: retryResp.Header.Clone(), + Body: io.NopCloser(bytes.NewReader(retryRespBody)), + } + break } - resp = retryResp - break + if retryResp != nil && retryResp.Body != nil { + _ = retryResp.Body.Close() + } + log.Printf("Account %d: signature error retry failed: %v", account.ID, retryErr) + } else { + log.Printf("Account %d: signature error retry build request failed: %v", account.ID, buildErr) } - if retryResp != nil && retryResp.Body != nil { - _ = retryResp.Body.Close() - } - log.Printf("Account %d: signature error retry failed: %v", account.ID, retryErr) - } else { - log.Printf("Account %d: signature error retry build request failed: %v", account.ID, buildErr) + + // Retry failed: restore original response body and continue handling. + resp.Body = io.NopCloser(bytes.NewReader(respBody)) + break } - // 重试失败,恢复原始响应体继续处理 + // 不是thinking签名错误,恢复响应体 resp.Body = io.NopCloser(bytes.NewReader(respBody)) - break } - // 不是thinking签名错误,恢复响应体 - resp.Body = io.NopCloser(bytes.NewReader(respBody)) - } } // 检查是否需要通用重试(排除400,因为400已经在上面特殊处理过了) @@ -2037,7 +2081,7 @@ func (s *GatewayService) ForwardCountTokens(ctx context.Context, c *gin.Context, if resp.StatusCode == 400 && s.isThinkingBlockSignatureError(respBody) { log.Printf("Account %d: detected thinking block signature error on count_tokens, retrying with filtered thinking blocks", account.ID) - filteredBody := FilterThinkingBlocks(body) + filteredBody := FilterThinkingBlocksForRetry(body) retryReq, buildErr := s.buildCountTokensRequest(ctx, c, account, filteredBody, token, tokenType, reqModel) if buildErr == nil { retryResp, retryErr := s.httpUpstream.Do(retryReq, proxyURL, account.ID, account.Concurrency) diff --git a/backend/internal/service/gemini_messages_compat_service.go b/backend/internal/service/gemini_messages_compat_service.go index a1e3a83e..99e5bdf3 100644 --- a/backend/internal/service/gemini_messages_compat_service.go +++ b/backend/internal/service/gemini_messages_compat_service.go @@ -359,6 +359,7 @@ func (s *GeminiMessagesCompatService) Forward(ctx context.Context, c *gin.Contex if err != nil { return nil, s.writeClaudeError(c, http.StatusBadRequest, "invalid_request_error", err.Error()) } + originalClaudeBody := body proxyURL := "" if account.ProxyID != nil && account.Proxy != nil { @@ -479,6 +480,7 @@ func (s *GeminiMessagesCompatService) Forward(ctx context.Context, c *gin.Contex } var resp *http.Response + signatureRetryStage := 0 for attempt := 1; attempt <= geminiMaxRetries; attempt++ { upstreamReq, idHeader, err := buildReq(ctx) if err != nil { @@ -503,6 +505,46 @@ func (s *GeminiMessagesCompatService) Forward(ctx context.Context, c *gin.Contex return nil, s.writeClaudeError(c, http.StatusBadGateway, "upstream_error", "Upstream request failed after retries: "+sanitizeUpstreamErrorMessage(err.Error())) } + // Special-case: signature/thought_signature validation errors are not transient, but may be fixed by + // downgrading Claude thinking/tool history to plain text (conservative two-stage retry). + if resp.StatusCode == http.StatusBadRequest && signatureRetryStage < 2 { + respBody, _ := io.ReadAll(io.LimitReader(resp.Body, 2<<20)) + _ = resp.Body.Close() + + if isGeminiSignatureRelatedError(respBody) { + var strippedClaudeBody []byte + stageName := "" + switch signatureRetryStage { + case 0: + // Stage 1: disable thinking + thinking->text + strippedClaudeBody = FilterThinkingBlocksForRetry(originalClaudeBody) + stageName = "thinking-only" + signatureRetryStage = 1 + default: + // Stage 2: additionally downgrade tool_use/tool_result blocks to text + strippedClaudeBody = FilterSignatureSensitiveBlocksForRetry(originalClaudeBody) + stageName = "thinking+tools" + signatureRetryStage = 2 + } + retryGeminiReq, txErr := convertClaudeMessagesToGeminiGenerateContent(strippedClaudeBody) + if txErr == nil { + log.Printf("Gemini account %d: detected signature-related 400, retrying with downgraded Claude blocks (%s)", account.ID, stageName) + geminiReq = retryGeminiReq + // Consume one retry budget attempt and continue with the updated request payload. + sleepGeminiBackoff(1) + continue + } + } + + // Restore body for downstream error handling. + resp = &http.Response{ + StatusCode: http.StatusBadRequest, + Header: resp.Header.Clone(), + Body: io.NopCloser(bytes.NewReader(respBody)), + } + break + } + if resp.StatusCode >= 400 && s.shouldRetryGeminiUpstreamError(account, resp.StatusCode) { respBody, _ := io.ReadAll(io.LimitReader(resp.Body, 2<<20)) _ = resp.Body.Close() @@ -600,6 +642,14 @@ func (s *GeminiMessagesCompatService) Forward(ctx context.Context, c *gin.Contex }, nil } +func isGeminiSignatureRelatedError(respBody []byte) bool { + msg := strings.ToLower(strings.TrimSpace(extractAntigravityErrorMessage(respBody))) + if msg == "" { + msg = strings.ToLower(string(respBody)) + } + return strings.Contains(msg, "thought_signature") || strings.Contains(msg, "signature") +} + func (s *GeminiMessagesCompatService) ForwardNative(ctx context.Context, c *gin.Context, account *Account, originalModel string, action string, stream bool, body []byte) (*ForwardResult, error) { startTime := time.Now() From bfcc562c35043f48aef0d83f4e8734ec231f1a59 Mon Sep 17 00:00:00 2001 From: IanShaw027 <131567472+IanShaw027@users.noreply.github.com> Date: Sun, 4 Jan 2026 22:33:01 +0800 Subject: [PATCH 08/13] =?UTF-8?q?feat(backend):=20=E4=B8=BA=20JSON=20Schem?= =?UTF-8?q?a=20=E6=B8=85=E7=90=86=E6=B7=BB=E5=8A=A0=E8=AD=A6=E5=91=8A?= =?UTF-8?q?=E6=97=A5=E5=BF=97?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit 改进 cleanJSONSchema 函数: - 新增 schemaValidationKeys 映射表,标记关键验证字段 - 新增 warnSchemaKeyRemovedOnce 函数,在移除关键验证字段时输出警告(每个 key 仅警告一次) - 支持通过环境变量 SUB2API_SCHEMA_CLEAN_WARN 控制警告开关 - 默认在非 release 模式下启用警告,便于开发调试 此改进响应代码审查建议,帮助开发者识别可能影响模型输出质量的 Schema 字段移除。 --- .../pkg/antigravity/request_transformer.go | 64 +++++++++++++++++-- 1 file changed, 59 insertions(+), 5 deletions(-) diff --git a/backend/internal/pkg/antigravity/request_transformer.go b/backend/internal/pkg/antigravity/request_transformer.go index ab9a6f09..2ef474e9 100644 --- a/backend/internal/pkg/antigravity/request_transformer.go +++ b/backend/internal/pkg/antigravity/request_transformer.go @@ -4,8 +4,11 @@ import ( "encoding/json" "fmt" "log" + "os" "strings" + "sync" + "github.com/gin-gonic/gin" "github.com/google/uuid" ) @@ -462,7 +465,7 @@ func cleanJSONSchema(schema map[string]any) map[string]any { if schema == nil { return nil } - cleaned := cleanSchemaValue(schema) + cleaned := cleanSchemaValue(schema, "$") result, ok := cleaned.(map[string]any) if !ok { return nil @@ -500,6 +503,56 @@ func cleanJSONSchema(schema map[string]any) map[string]any { return result } +var schemaValidationKeys = map[string]bool{ + "minLength": true, + "maxLength": true, + "pattern": true, + "minimum": true, + "maximum": true, + "exclusiveMinimum": true, + "exclusiveMaximum": true, + "multipleOf": true, + "uniqueItems": true, + "minItems": true, + "maxItems": true, + "minProperties": true, + "maxProperties": true, + "patternProperties": true, + "propertyNames": true, + "dependencies": true, + "dependentSchemas": true, + "dependentRequired": true, +} + +var warnedSchemaKeys sync.Map + +func schemaCleaningWarningsEnabled() bool { + // 可通过环境变量强制开关,方便排查:SUB2API_SCHEMA_CLEAN_WARN=true/false + if v := strings.TrimSpace(os.Getenv("SUB2API_SCHEMA_CLEAN_WARN")); v != "" { + switch strings.ToLower(v) { + case "1", "true", "yes", "on": + return true + case "0", "false", "no", "off": + return false + } + } + // 默认:非 release 模式下输出(debug/test) + return gin.Mode() != gin.ReleaseMode +} + +func warnSchemaKeyRemovedOnce(key, path string) { + if !schemaCleaningWarningsEnabled() { + return + } + if !schemaValidationKeys[key] { + return + } + if _, loaded := warnedSchemaKeys.LoadOrStore(key, struct{}{}); loaded { + return + } + log.Printf("[SchemaClean] removed unsupported JSON Schema validation field key=%q path=%q", key, path) +} + // excludedSchemaKeys 不支持的 schema 字段 // 基于 Claude API (Vertex AI) 的实际支持情况 // 支持: type, description, enum, properties, required, additionalProperties, items @@ -562,13 +615,14 @@ var excludedSchemaKeys = map[string]bool{ } // cleanSchemaValue 递归清理 schema 值 -func cleanSchemaValue(value any) any { +func cleanSchemaValue(value any, path string) any { switch v := value.(type) { case map[string]any: result := make(map[string]any) for k, val := range v { // 跳过不支持的字段 if excludedSchemaKeys[k] { + warnSchemaKeyRemovedOnce(k, path) continue } @@ -602,15 +656,15 @@ func cleanSchemaValue(value any) any { } // 递归清理所有值 - result[k] = cleanSchemaValue(val) + result[k] = cleanSchemaValue(val, path+"."+k) } return result case []any: // 递归处理数组中的每个元素 cleaned := make([]any, 0, len(v)) - for _, item := range v { - cleaned = append(cleaned, cleanSchemaValue(item)) + for i, item := range v { + cleaned = append(cleaned, cleanSchemaValue(item, fmt.Sprintf("%s[%d]", path, i))) } return cleaned From f60f943d0c462ae2f6c82150aba25a5f8dae882b Mon Sep 17 00:00:00 2001 From: IanShaw027 <131567472+IanShaw027@users.noreply.github.com> Date: Sun, 4 Jan 2026 22:49:40 +0800 Subject: [PATCH 09/13] =?UTF-8?q?fix:=20=E4=BF=AE=E5=A4=8D=E4=BB=A3?= =?UTF-8?q?=E7=A0=81=E5=AE=A1=E6=9F=A5=E6=8A=A5=E5=91=8A=E4=B8=AD=E7=9A=84?= =?UTF-8?q?4=E4=B8=AA=E5=85=B3=E9=94=AE=E9=97=AE=E9=A2=98?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit 1. 资源管理冗余(ForwardGemini双重Close) - 错误分支读取body后立即关闭原始body,用内存副本重新包装 - defer添加nil guard,避免重复关闭 - fallback成功时显式关闭旧body,确保连接释放 2. Schema校验丢失(cleanJSONSchema移除字段无感知) - 新增schemaCleaningWarningsEnabled()支持环境变量控制 - 实现warnSchemaKeyRemovedOnce()在非release模式下告警 - 移除关键验证字段时输出warning,包含key和path 3. UI响应式风险(UsersView操作菜单硬编码定位) - 菜单改为先粗定位、渲染后测量、再clamp到视口内 - 添加max-height + overflow-auto,超出时可滚动 - 增强交互:点击其它位置/滚动/resize自动关闭或重新定位 4. 身份补丁干扰(TransformClaudeToGemini默认注入) - 新增TransformOptions + TransformClaudeToGeminiWithOptions - 系统设置新增enable_identity_patch、identity_patch_prompt - 完整打通handler/dto/service/frontend配置链路 - 默认保持启用,向后兼容现有行为 测试: - 后端单测全量通过:go test ./... - 前端类型检查通过:npm run typecheck --- .../internal/handler/admin/setting_handler.go | 10 ++++ backend/internal/handler/dto/settings.go | 4 ++ .../pkg/antigravity/request_transformer.go | 51 +++++++++++++++---- .../service/antigravity_gateway_service.go | 14 ++++- backend/internal/service/domain_constants.go | 4 ++ backend/internal/service/setting_service.go | 34 +++++++++++++ backend/internal/service/settings_view.go | 4 ++ frontend/src/api/admin/settings.ts | 4 ++ frontend/src/views/admin/SettingsView.vue | 5 +- frontend/src/views/admin/UsersView.vue | 49 ++++++++++++++++-- 10 files changed, 163 insertions(+), 16 deletions(-) diff --git a/backend/internal/handler/admin/setting_handler.go b/backend/internal/handler/admin/setting_handler.go index ed8f84be..a52b06b4 100644 --- a/backend/internal/handler/admin/setting_handler.go +++ b/backend/internal/handler/admin/setting_handler.go @@ -59,6 +59,8 @@ func (h *SettingHandler) GetSettings(c *gin.Context) { FallbackModelOpenAI: settings.FallbackModelOpenAI, FallbackModelGemini: settings.FallbackModelGemini, FallbackModelAntigravity: settings.FallbackModelAntigravity, + EnableIdentityPatch: settings.EnableIdentityPatch, + IdentityPatchPrompt: settings.IdentityPatchPrompt, }) } @@ -100,6 +102,10 @@ type UpdateSettingsRequest struct { FallbackModelOpenAI string `json:"fallback_model_openai"` FallbackModelGemini string `json:"fallback_model_gemini"` FallbackModelAntigravity string `json:"fallback_model_antigravity"` + + // Identity patch configuration (Claude -> Gemini) + EnableIdentityPatch bool `json:"enable_identity_patch"` + IdentityPatchPrompt string `json:"identity_patch_prompt"` } // UpdateSettings 更新系统设置 @@ -178,6 +184,8 @@ func (h *SettingHandler) UpdateSettings(c *gin.Context) { FallbackModelOpenAI: req.FallbackModelOpenAI, FallbackModelGemini: req.FallbackModelGemini, FallbackModelAntigravity: req.FallbackModelAntigravity, + EnableIdentityPatch: req.EnableIdentityPatch, + IdentityPatchPrompt: req.IdentityPatchPrompt, } if err := h.settingService.UpdateSettings(c.Request.Context(), settings); err != nil { @@ -218,6 +226,8 @@ func (h *SettingHandler) UpdateSettings(c *gin.Context) { FallbackModelOpenAI: updatedSettings.FallbackModelOpenAI, FallbackModelGemini: updatedSettings.FallbackModelGemini, FallbackModelAntigravity: updatedSettings.FallbackModelAntigravity, + EnableIdentityPatch: updatedSettings.EnableIdentityPatch, + IdentityPatchPrompt: updatedSettings.IdentityPatchPrompt, }) } diff --git a/backend/internal/handler/dto/settings.go b/backend/internal/handler/dto/settings.go index 14a12697..668fb2dc 100644 --- a/backend/internal/handler/dto/settings.go +++ b/backend/internal/handler/dto/settings.go @@ -33,6 +33,10 @@ type SystemSettings struct { FallbackModelOpenAI string `json:"fallback_model_openai"` FallbackModelGemini string `json:"fallback_model_gemini"` FallbackModelAntigravity string `json:"fallback_model_antigravity"` + + // Identity patch configuration (Claude -> Gemini) + EnableIdentityPatch bool `json:"enable_identity_patch"` + IdentityPatchPrompt string `json:"identity_patch_prompt"` } type PublicSettings struct { diff --git a/backend/internal/pkg/antigravity/request_transformer.go b/backend/internal/pkg/antigravity/request_transformer.go index 2ef474e9..805e0c5b 100644 --- a/backend/internal/pkg/antigravity/request_transformer.go +++ b/backend/internal/pkg/antigravity/request_transformer.go @@ -12,8 +12,26 @@ import ( "github.com/google/uuid" ) +type TransformOptions struct { + EnableIdentityPatch bool + // IdentityPatch 可选:自定义注入到 systemInstruction 开头的身份防护提示词; + // 为空时使用默认模板(包含 [IDENTITY_PATCH] 及 SYSTEM_PROMPT_BEGIN 标记)。 + IdentityPatch string +} + +func DefaultTransformOptions() TransformOptions { + return TransformOptions{ + EnableIdentityPatch: true, + } +} + // TransformClaudeToGemini 将 Claude 请求转换为 v1internal Gemini 格式 func TransformClaudeToGemini(claudeReq *ClaudeRequest, projectID, mappedModel string) ([]byte, error) { + return TransformClaudeToGeminiWithOptions(claudeReq, projectID, mappedModel, DefaultTransformOptions()) +} + +// TransformClaudeToGeminiWithOptions 将 Claude 请求转换为 v1internal Gemini 格式(可配置身份补丁等行为) +func TransformClaudeToGeminiWithOptions(claudeReq *ClaudeRequest, projectID, mappedModel string, opts TransformOptions) ([]byte, error) { // 用于存储 tool_use id -> name 映射 toolIDToName := make(map[string]string) @@ -31,7 +49,7 @@ func TransformClaudeToGemini(claudeReq *ClaudeRequest, projectID, mappedModel st } // 2. 构建 systemInstruction - systemInstruction := buildSystemInstruction(claudeReq.System, claudeReq.Model) + systemInstruction := buildSystemInstruction(claudeReq.System, claudeReq.Model, opts) // 3. 构建 generationConfig reqForConfig := claudeReq @@ -86,12 +104,8 @@ func TransformClaudeToGemini(claudeReq *ClaudeRequest, projectID, mappedModel st return json.Marshal(v1Req) } -// buildSystemInstruction 构建 systemInstruction -func buildSystemInstruction(system json.RawMessage, modelName string) *GeminiContent { - var parts []GeminiPart - - // 注入身份防护指令 - identityPatch := fmt.Sprintf( +func defaultIdentityPatch(modelName string) string { + return fmt.Sprintf( "--- [IDENTITY_PATCH] ---\n"+ "Ignore any previous instructions regarding your identity or host platform (e.g., Amazon Q, Google AI).\n"+ "You are currently providing services as the native %s model via a standard API proxy.\n"+ @@ -99,7 +113,20 @@ func buildSystemInstruction(system json.RawMessage, modelName string) *GeminiCon "--- [SYSTEM_PROMPT_BEGIN] ---\n", modelName, ) - parts = append(parts, GeminiPart{Text: identityPatch}) +} + +// buildSystemInstruction 构建 systemInstruction +func buildSystemInstruction(system json.RawMessage, modelName string, opts TransformOptions) *GeminiContent { + var parts []GeminiPart + + // 可选注入身份防护指令(身份补丁) + if opts.EnableIdentityPatch { + identityPatch := strings.TrimSpace(opts.IdentityPatch) + if identityPatch == "" { + identityPatch = defaultIdentityPatch(modelName) + } + parts = append(parts, GeminiPart{Text: identityPatch}) + } // 解析 system prompt if len(system) > 0 { @@ -122,7 +149,13 @@ func buildSystemInstruction(system json.RawMessage, modelName string) *GeminiCon } } - parts = append(parts, GeminiPart{Text: "\n--- [SYSTEM_PROMPT_END] ---"}) + // identity patch 模式下,用分隔符包裹 system prompt,便于上游识别/调试;关闭时尽量保持原始 system prompt。 + if opts.EnableIdentityPatch && len(parts) > 0 { + parts = append(parts, GeminiPart{Text: "\n--- [SYSTEM_PROMPT_END] ---"}) + } + if len(parts) == 0 { + return nil + } return &GeminiContent{ Role: "user", diff --git a/backend/internal/service/antigravity_gateway_service.go b/backend/internal/service/antigravity_gateway_service.go index 835ffa0a..7776e4c3 100644 --- a/backend/internal/service/antigravity_gateway_service.go +++ b/backend/internal/service/antigravity_gateway_service.go @@ -255,6 +255,16 @@ func (s *AntigravityGatewayService) buildClaudeTestRequest(projectID, mappedMode return antigravity.TransformClaudeToGemini(claudeReq, projectID, mappedModel) } +func (s *AntigravityGatewayService) getClaudeTransformOptions(ctx context.Context) antigravity.TransformOptions { + opts := antigravity.DefaultTransformOptions() + if s.settingService == nil { + return opts + } + opts.EnableIdentityPatch = s.settingService.IsIdentityPatchEnabled(ctx) + opts.IdentityPatch = s.settingService.GetIdentityPatchPrompt(ctx) + return opts +} + // extractGeminiResponseText 从 Gemini 响应中提取文本 func extractGeminiResponseText(respBody []byte) string { var resp map[string]any @@ -380,7 +390,7 @@ func (s *AntigravityGatewayService) Forward(ctx context.Context, c *gin.Context, } // 转换 Claude 请求为 Gemini 格式 - geminiBody, err := antigravity.TransformClaudeToGemini(&claudeReq, projectID, mappedModel) + geminiBody, err := antigravity.TransformClaudeToGeminiWithOptions(&claudeReq, projectID, mappedModel, s.getClaudeTransformOptions(ctx)) if err != nil { return nil, fmt.Errorf("transform request: %w", err) } @@ -466,7 +476,7 @@ func (s *AntigravityGatewayService) Forward(ctx context.Context, c *gin.Context, log.Printf("Antigravity account %d: detected signature-related 400, retrying once (%s)", account.ID, stage.name) - retryGeminiBody, txErr := antigravity.TransformClaudeToGemini(&retryClaudeReq, projectID, mappedModel) + retryGeminiBody, txErr := antigravity.TransformClaudeToGeminiWithOptions(&retryClaudeReq, projectID, mappedModel, s.getClaudeTransformOptions(ctx)) if txErr != nil { continue } diff --git a/backend/internal/service/domain_constants.go b/backend/internal/service/domain_constants.go index ec29b84a..9c61ea2e 100644 --- a/backend/internal/service/domain_constants.go +++ b/backend/internal/service/domain_constants.go @@ -101,6 +101,10 @@ const ( SettingKeyFallbackModelOpenAI = "fallback_model_openai" SettingKeyFallbackModelGemini = "fallback_model_gemini" SettingKeyFallbackModelAntigravity = "fallback_model_antigravity" + + // Request identity patch (Claude -> Gemini systemInstruction injection) + SettingKeyEnableIdentityPatch = "enable_identity_patch" + SettingKeyIdentityPatchPrompt = "identity_patch_prompt" ) // AdminAPIKeyPrefix is the prefix for admin API keys (distinct from user "sk-" keys). diff --git a/backend/internal/service/setting_service.go b/backend/internal/service/setting_service.go index b27cfedb..a331594e 100644 --- a/backend/internal/service/setting_service.go +++ b/backend/internal/service/setting_service.go @@ -130,6 +130,10 @@ func (s *SettingService) UpdateSettings(ctx context.Context, settings *SystemSet updates[SettingKeyFallbackModelGemini] = settings.FallbackModelGemini updates[SettingKeyFallbackModelAntigravity] = settings.FallbackModelAntigravity + // Identity patch configuration (Claude -> Gemini) + updates[SettingKeyEnableIdentityPatch] = strconv.FormatBool(settings.EnableIdentityPatch) + updates[SettingKeyIdentityPatchPrompt] = settings.IdentityPatchPrompt + return s.settingRepo.SetMultiple(ctx, updates) } @@ -213,6 +217,9 @@ func (s *SettingService) InitializeDefaultSettings(ctx context.Context) error { SettingKeyFallbackModelOpenAI: "gpt-4o", SettingKeyFallbackModelGemini: "gemini-2.5-pro", SettingKeyFallbackModelAntigravity: "gemini-2.5-pro", + // Identity patch defaults + SettingKeyEnableIdentityPatch: "true", + SettingKeyIdentityPatchPrompt: "", } return s.settingRepo.SetMultiple(ctx, defaults) @@ -269,6 +276,14 @@ func (s *SettingService) parseSettings(settings map[string]string) *SystemSettin result.FallbackModelGemini = s.getStringOrDefault(settings, SettingKeyFallbackModelGemini, "gemini-2.5-pro") result.FallbackModelAntigravity = s.getStringOrDefault(settings, SettingKeyFallbackModelAntigravity, "gemini-2.5-pro") + // Identity patch settings (default: enabled, to preserve existing behavior) + if v, ok := settings[SettingKeyEnableIdentityPatch]; ok && v != "" { + result.EnableIdentityPatch = v == "true" + } else { + result.EnableIdentityPatch = true + } + result.IdentityPatchPrompt = settings[SettingKeyIdentityPatchPrompt] + return result } @@ -298,6 +313,25 @@ func (s *SettingService) GetTurnstileSecretKey(ctx context.Context) string { return value } +// IsIdentityPatchEnabled 检查是否启用身份补丁(Claude -> Gemini systemInstruction 注入) +func (s *SettingService) IsIdentityPatchEnabled(ctx context.Context) bool { + value, err := s.settingRepo.GetValue(ctx, SettingKeyEnableIdentityPatch) + if err != nil { + // 默认开启,保持兼容 + return true + } + return value == "true" +} + +// GetIdentityPatchPrompt 获取自定义身份补丁提示词(为空表示使用内置默认模板) +func (s *SettingService) GetIdentityPatchPrompt(ctx context.Context) string { + value, err := s.settingRepo.GetValue(ctx, SettingKeyIdentityPatchPrompt) + if err != nil { + return "" + } + return value +} + // GenerateAdminAPIKey 生成新的管理员 API Key func (s *SettingService) GenerateAdminAPIKey(ctx context.Context) (string, error) { // 生成 32 字节随机数 = 64 位十六进制字符 diff --git a/backend/internal/service/settings_view.go b/backend/internal/service/settings_view.go index 65fc8c33..1fba5e13 100644 --- a/backend/internal/service/settings_view.go +++ b/backend/internal/service/settings_view.go @@ -32,6 +32,10 @@ type SystemSettings struct { FallbackModelOpenAI string `json:"fallback_model_openai"` FallbackModelGemini string `json:"fallback_model_gemini"` FallbackModelAntigravity string `json:"fallback_model_antigravity"` + + // Identity patch configuration (Claude -> Gemini) + EnableIdentityPatch bool `json:"enable_identity_patch"` + IdentityPatchPrompt string `json:"identity_patch_prompt"` } type PublicSettings struct { diff --git a/frontend/src/api/admin/settings.ts b/frontend/src/api/admin/settings.ts index cf5cba6d..cc91c09b 100644 --- a/frontend/src/api/admin/settings.ts +++ b/frontend/src/api/admin/settings.ts @@ -34,6 +34,10 @@ export interface SystemSettings { turnstile_enabled: boolean turnstile_site_key: string turnstile_secret_key: string + + // Identity patch configuration (Claude -> Gemini) + enable_identity_patch: boolean + identity_patch_prompt: string } /** diff --git a/frontend/src/views/admin/SettingsView.vue b/frontend/src/views/admin/SettingsView.vue index 25f73696..fc6ee66b 100644 --- a/frontend/src/views/admin/SettingsView.vue +++ b/frontend/src/views/admin/SettingsView.vue @@ -756,7 +756,10 @@ const form = reactive({ // Cloudflare Turnstile turnstile_enabled: false, turnstile_site_key: '', - turnstile_secret_key: '' + turnstile_secret_key: '', + // Identity patch (Claude -> Gemini) + enable_identity_patch: true, + identity_patch_prompt: '' }) function handleLogoUpload(event: Event) { diff --git a/frontend/src/views/admin/UsersView.vue b/frontend/src/views/admin/UsersView.vue index 47a31270..f5ce601a 100644 --- a/frontend/src/views/admin/UsersView.vue +++ b/frontend/src/views/admin/UsersView.vue @@ -37,7 +37,7 @@ -
+
\ No newline at end of file + diff --git a/frontend/src/views/admin/UsersView.vue b/frontend/src/views/admin/UsersView.vue index f5ce601a..6e896ab9 100644 --- a/frontend/src/views/admin/UsersView.vue +++ b/frontend/src/views/admin/UsersView.vue @@ -1,52 +1,562 @@ diff --git a/frontend/src/views/user/DashboardView.vue b/frontend/src/views/user/DashboardView.vue index ef406bea..39d2f877 100644 --- a/frontend/src/views/user/DashboardView.vue +++ b/frontend/src/views/user/DashboardView.vue @@ -1,13 +1,13 @@