backend/internal/service/gateway_request.go

package service

import (
	"bytes"
	"encoding/json"
	"fmt"
)

// ParsedRequest holds the pre-parsed result of a gateway request.
//
// Performance notes:
// The previous implementation parsed the request body repeatedly in several places
// (once in the Handler and once more in the Service):
// 1. gateway_handler.go parsed it to obtain model and stream
// 2. gateway_service.go parsed it again to obtain system, messages and metadata
// 3. GenerateSessionHash parsed it yet again to obtain the fields needed for the session hash
//
// The new implementation parses once and reuses the result everywhere:
// 1. The Handler layer calls ParseGatewayRequest a single time
// 2. The resulting ParsedRequest is handed to the Service layer
// 3. Repeated json.Unmarshal calls are avoided, reducing CPU and memory overhead
type ParsedRequest struct {
	Body           []byte // raw request body (kept for forwarding)
	Model          string // requested model name
	Stream         bool   // whether this is a streaming request
	MetadataUserID string // metadata.user_id (used for session affinity)
	System         any    // content of the system field
	Messages       []any  // messages array
	HasSystem      bool   // whether a system field is present (an explicit null also counts as present)
}

// ParseGatewayRequest decodes the gateway request body exactly once and returns
// the fields the gateway cares about in structured form, so that later stages
// do not have to call json.Unmarshal again.
//
// Field handling:
//   - model / stream: optional, but when the key is present the value must be a
//     string / bool respectively, otherwise an error is returned.
//   - metadata.user_id, messages: copied only when they have the expected shape;
//     any other shape is silently ignored.
//   - system: recorded whenever the key is present, even when its value is null.
//
// The returned ParsedRequest keeps a reference to body (it is not copied).
func ParseGatewayRequest(body []byte) (*ParsedRequest, error) {
	var fields map[string]any
	if decodeErr := json.Unmarshal(body, &fields); decodeErr != nil {
		return nil, decodeErr
	}

	result := new(ParsedRequest)
	result.Body = body

	// model is validated first, so its error wins when several fields are malformed.
	if value, present := fields["model"]; present {
		name, isString := value.(string)
		if !isString {
			return nil, fmt.Errorf("invalid model field type")
		}
		result.Model = name
	}

	if value, present := fields["stream"]; present {
		flag, isBool := value.(bool)
		if !isBool {
			return nil, fmt.Errorf("invalid stream field type")
		}
		result.Stream = flag
	}

	// Indexing a nil map is safe, so a missing or non-object metadata simply yields no user id.
	metadata, _ := fields["metadata"].(map[string]any)
	if userID, isString := metadata["user_id"].(string); isString {
		result.MetadataUserID = userID
	}

	// Presence of the key alone marks system as explicitly provided (null included),
	// so that a client sending null does not get a default system prompt injected.
	result.System, result.HasSystem = fields["system"]

	// A failed assertion leaves Messages nil.
	result.Messages, _ = fields["messages"].([]any)

	return result, nil
}

// FilterThinkingBlocks removes thinking blocks from the request body.
// It is a thin wrapper that calls filterThinkingBlocksInternal with false as the
// second argument (a parameter that function currently ignores).
//
// Returns the filtered body, or the original body if filtering fails (fail-safe).
// This prevents 400 errors from invalid thinking block signatures.
//
// Strategy:
//   - When thinking.type != "enabled": Remove all thinking blocks
//   - When thinking.type == "enabled": Only remove thinking blocks without valid signatures
//     (blocks with missing/empty/dummy signatures that would cause 400 errors); signed blocks
//     are kept only inside assistant messages
func FilterThinkingBlocks(body []byte) []byte {
	return filterThinkingBlocksInternal(body, false)
}

// FilterThinkingBlocksForRetry rewrites a request body for a retry attempt so that it no
// longer carries thinking-related constructs.
//
// Background (carried over from the original notes on upstream behaviour):
//   - Upstreams may reject historical `thinking`/`redacted_thinking` blocks whose signatures
//     are invalid or missing.
//   - With top-level `thinking` enabled and an assistant prefill as the final message, the
//     assistant content must start with a thinking block. Stripping the blocks while leaving
//     `thinking` enabled can therefore trigger:
//     "Expected `thinking` or `redacted_thinking`, but found `text`"
//
// What the rewrite does (strategy B: preserve content as text):
//   - Removes the top-level `thinking` field.
//   - Replaces each `thinking` block by a `text` block holding the same text; blocks whose
//     text is empty or not a string are dropped.
//   - Drops `redacted_thinking` blocks (they cannot be converted to text).
//   - Treats blocks without a string `type` but with a `thinking` key the same way; a
//     non-string value is JSON-encoded into the text.
//   - Gives every content array that ends up empty, or already was empty, a placeholder
//     text block.
//
// The input slice is returned untouched when nothing needs changing, when it cannot be
// decoded into a JSON object, when `messages` is not an array, or when re-encoding fails.
func FilterThinkingBlocksForRetry(body []byte) []byte {
	// Cheap byte-level probes: thinking constructs first, then empty content arrays.
	// They are heuristics only; the real decisions are taken on the decoded structure.
	probes := [...]string{
		`"type":"thinking"`,
		`"type": "thinking"`,
		`"type":"redacted_thinking"`,
		`"type": "redacted_thinking"`,
		`"thinking":`,
		`"thinking" :`,
		`"content":[]`,
		`"content": []`,
		`"content" : []`,
		`"content" :[]`,
	}
	worthParsing := false
	for _, probe := range probes {
		if bytes.Contains(body, []byte(probe)) {
			worthParsing = true
			break
		}
	}
	if !worthParsing {
		return body
	}

	var payload map[string]any
	if json.Unmarshal(body, &payload) != nil {
		return body
	}
	conversation, isList := payload["messages"].([]any)
	if !isList {
		return body
	}

	changed := false

	// Turn off top-level thinking so the retry is not bound by structural/signature constraints.
	if _, present := payload["thinking"]; present {
		delete(payload, "thinking")
		changed = true
	}

	// Messages are decoded as maps, so updating them in place is reflected in payload.
	for _, entry := range conversation {
		message, isObject := entry.(map[string]any)
		if !isObject {
			continue
		}
		blocks, isArray := message["content"].([]any)
		if !isArray {
			// Plain string content (or any other shape) is forwarded as is.
			continue
		}

		kept := make([]any, 0, len(blocks))
		touched := false

		for _, raw := range blocks {
			block, isMap := raw.(map[string]any)
			if !isMap {
				kept = append(kept, raw)
				continue
			}

			kind, _ := block["type"].(string)
			reasoning, hasReasoning := block["thinking"]

			switch {
			case kind == "thinking":
				touched = true
				if text, _ := reasoning.(string); text != "" {
					kept = append(kept, map[string]any{"type": "text", "text": text})
				}
			case kind == "redacted_thinking":
				touched = true
			case kind == "" && hasReasoning:
				// No type discriminator, but the block still carries a thinking payload.
				touched = true
				if text, isString := reasoning.(string); isString {
					if text != "" {
						kept = append(kept, map[string]any{"type": "text", "text": text})
					}
				} else if encoded, err := json.Marshal(reasoning); err == nil && len(encoded) > 0 {
					kept = append(kept, map[string]any{"type": "text", "text": string(encoded)})
				}
			default:
				kept = append(kept, raw)
			}
		}

		switch {
		case len(kept) == 0:
			// Empty either because everything was filtered out or because it arrived empty.
			changed = true
			placeholder := "(content removed)"
			if role, _ := message["role"].(string); role == "assistant" {
				placeholder = "(assistant content removed)"
			}
			message["content"] = append(kept, map[string]any{
				"type": "text",
				"text": placeholder,
			})
		case touched:
			changed = true
			message["content"] = kept
		}
	}

	// Do not re-encode the JSON when nothing was changed.
	if !changed {
		return body
	}

	rewritten, err := json.Marshal(payload)
	if err != nil {
		return body
	}
	return rewritten
}

// FilterSignatureSensitiveBlocksForRetry is a stronger retry filter for cases where upstream errors
// indicate signature/thought_signature validation issues involving tool blocks.
//
// It applies the same rewrites as FilterThinkingBlocksForRetry:
//   - Remove the top-level `thinking` field.
//   - Convert `thinking` blocks to `text` blocks (blocks with empty or non-string text are dropped).
//   - Remove `redacted_thinking` blocks.
//   - Convert untyped blocks that carry a `thinking` key to text.
//   - Replace every empty content array with a placeholder text block, whether it became empty
//     through filtering or arrived empty.
//
// plus:
//   - Convert `tool_use` blocks to text (name/id/input) so we stop sending structured tool calls.
//   - Convert `tool_result` blocks to text so we keep tool results visible without tool semantics.
//
// Use this only when needed: converting tool blocks to text changes model behaviour and can increase
// the risk of prompt injection (tool output becomes plain conversation text).
//
// The original body is returned unchanged when nothing needs rewriting, when it cannot be decoded
// into a JSON object, when `messages` is not an array, or when re-encoding fails.
func FilterSignatureSensitiveBlocksForRetry(body []byte) []byte {
	// Fast path: only parse when we see likely relevant constructs. These are byte-level
	// heuristics; the authoritative checks run on the decoded structure below.
	markers := []string{
		`"type":"thinking"`,
		`"type": "thinking"`,
		`"type":"redacted_thinking"`,
		`"type": "redacted_thinking"`,
		`"type":"tool_use"`,
		`"type": "tool_use"`,
		`"type":"tool_result"`,
		`"type": "tool_result"`,
		`"thinking":`,
		`"thinking" :`,
		// Empty content arrays must be repaired as well, as in FilterThinkingBlocksForRetry.
		`"content":[]`,
		`"content": []`,
		`"content" : []`,
		`"content" :[]`,
	}
	relevant := false
	for _, marker := range markers {
		if bytes.Contains(body, []byte(marker)) {
			relevant = true
			break
		}
	}
	if !relevant {
		return body
	}

	var req map[string]any
	if err := json.Unmarshal(body, &req); err != nil {
		return body
	}

	messages, ok := req["messages"].([]any)
	if !ok {
		return body
	}

	modified := false

	// Disable top-level thinking for retry to avoid structural/signature constraints upstream.
	if _, exists := req["thinking"]; exists {
		delete(req, "thinking")
		modified = true
	}

	// Messages decode to maps, so in-place updates are visible through req["messages"].
	for _, msg := range messages {
		msgMap, ok := msg.(map[string]any)
		if !ok {
			continue
		}
		content, ok := msgMap["content"].([]any)
		if !ok {
			// String content or another shape: nothing to rewrite.
			continue
		}

		newContent := make([]any, 0, len(content))
		modifiedThisMsg := false

		for _, block := range content {
			blockMap, ok := block.(map[string]any)
			if !ok {
				newContent = append(newContent, block)
				continue
			}

			blockType, _ := blockMap["type"].(string)
			switch blockType {
			case "thinking":
				modifiedThisMsg = true
				if thinkingText, _ := blockMap["thinking"].(string); thinkingText != "" {
					newContent = append(newContent, map[string]any{"type": "text", "text": thinkingText})
				}

			case "redacted_thinking":
				// Cannot be represented as text; drop it.
				modifiedThisMsg = true

			case "tool_use":
				modifiedThisMsg = true
				name, _ := blockMap["name"].(string)
				id, _ := blockMap["id"].(string)
				text := "(tool_use)"
				if name != "" {
					text += " name=" + name
				}
				if id != "" {
					text += " id=" + id
				}
				// A missing/null input, or one that cannot be encoded, is simply left out.
				if inputJSON, err := json.Marshal(blockMap["input"]); err == nil && len(inputJSON) > 0 && string(inputJSON) != "null" {
					text += " input=" + string(inputJSON)
				}
				newContent = append(newContent, map[string]any{"type": "text", "text": text})

			case "tool_result":
				modifiedThisMsg = true
				toolUseID, _ := blockMap["tool_use_id"].(string)
				isError, _ := blockMap["is_error"].(bool)
				text := "(tool_result)"
				if toolUseID != "" {
					text += " tool_use_id=" + toolUseID
				}
				if isError {
					text += " is_error=true"
				}
				// The result payload goes on its own line, JSON-encoded.
				if resultJSON, err := json.Marshal(blockMap["content"]); err == nil && len(resultJSON) > 0 && string(resultJSON) != "null" {
					text += "\n" + string(resultJSON)
				}
				newContent = append(newContent, map[string]any{"type": "text", "text": text})

			case "":
				// No type discriminator: treat it as a thinking block if it has a "thinking" key.
				rawThinking, hasThinking := blockMap["thinking"]
				if !hasThinking {
					newContent = append(newContent, block)
					continue
				}
				modifiedThisMsg = true
				switch v := rawThinking.(type) {
				case string:
					if v != "" {
						newContent = append(newContent, map[string]any{"type": "text", "text": v})
					}
				default:
					if b, err := json.Marshal(v); err == nil && len(b) > 0 {
						newContent = append(newContent, map[string]any{"type": "text", "text": string(b)})
					}
				}

			default:
				newContent = append(newContent, block)
			}
		}

		// Never forward an empty content array, whether filtering emptied it or it arrived empty.
		if len(newContent) == 0 {
			modifiedThisMsg = true
			placeholder := "(content removed)"
			if role, _ := msgMap["role"].(string); role == "assistant" {
				placeholder = "(assistant content removed)"
			}
			newContent = append(newContent, map[string]any{"type": "text", "text": placeholder})
		}

		if modifiedThisMsg {
			modified = true
			msgMap["content"] = newContent
		}
	}

	// Avoid rewriting JSON when no changes are needed.
	if !modified {
		return body
	}

	newBody, err := json.Marshal(req)
	if err != nil {
		return body
	}
	return newBody
}

// filterThinkingBlocksInternal strips thinking blocks that should not be forwarded upstream.
// The second parameter is accepted for signature compatibility and is not used.
//
// Rules applied to every block of every array-valued `content`:
//   - `thinking` / `redacted_thinking` blocks are removed, unless top-level thinking.type is
//     "enabled", the message role is "assistant", and the block carries a non-empty signature
//     other than the dummy "skip_thought_signature_validator".
//   - Blocks without a string `type` that have a `thinking` key are always removed.
//   - Everything else is kept.
//
// The original body is returned when nothing was removed, when it cannot be decoded into a
// JSON object, when `messages` is not an array, or when re-encoding fails.
//
// NOTE(review): `redacted_thinking` blocks are judged by the same `signature` key; confirm that
// such blocks actually carry one upstream, otherwise they are always removed.
func filterThinkingBlocksInternal(body []byte, _ bool) []byte {
	// Fast path: skip JSON parsing unless the raw bytes hint at a thinking construct.
	probes := [...]string{
		`"type":"thinking"`,
		`"type": "thinking"`,
		`"type":"redacted_thinking"`,
		`"type": "redacted_thinking"`,
		`"thinking":`,
		`"thinking" :`,
	}
	suspicious := false
	for _, probe := range probes {
		if bytes.Contains(body, []byte(probe)) {
			suspicious = true
			break
		}
	}
	if !suspicious {
		return body
	}

	var payload map[string]any
	if json.Unmarshal(body, &payload) != nil {
		return body
	}

	// Thinking counts as enabled only for {"thinking": {"type": "enabled", ...}}.
	enabled := false
	if cfg, isObject := payload["thinking"].(map[string]any); isObject {
		mode, _ := cfg["type"].(string)
		enabled = mode == "enabled"
	}

	conversation, isList := payload["messages"].([]any)
	if !isList {
		return body
	}

	removedAny := false
	for _, entry := range conversation {
		message, isObject := entry.(map[string]any)
		if !isObject {
			continue
		}
		blocks, isArray := message["content"].([]any)
		if !isArray {
			continue
		}

		role, _ := message["role"].(string)
		// Signed thinking blocks survive only in assistant turns while thinking is enabled.
		keepSigned := enabled && role == "assistant"

		kept := make([]any, 0, len(blocks))
		for _, raw := range blocks {
			block, isMap := raw.(map[string]any)
			if !isMap {
				kept = append(kept, raw)
				continue
			}

			drop := false
			kind, _ := block["type"].(string)
			switch kind {
			case "thinking", "redacted_thinking":
				signature, _ := block["signature"].(string)
				valid := signature != "" && signature != "skip_thought_signature_validator"
				drop = !(keepSigned && valid)
			case "":
				// No type discriminator: the mere presence of a "thinking" key marks it for removal.
				_, drop = block["thinking"]
			}

			if !drop {
				kept = append(kept, raw)
			}
		}

		// Every block is either kept or dropped, so a shorter slice means something was filtered.
		if len(kept) != len(blocks) {
			message["content"] = kept
			removedAny = true
		}
	}

	if !removedAny {
		return body
	}

	rewritten, err := json.Marshal(payload)
	if err != nil {
		return body
	}
	return rewritten
}
-												perf(后端): 完成性能优化与连接池配置

新增 DB/Redis 连接池配置与校验，并补充单测

网关请求体大小限制与 413 处理

HTTP/req 客户端池化并调整上游连接池默认值

并发槽位改为 ZSET+Lua 与指数退避

用量统计改 SQL 聚合并新增索引迁移

计费缓存写入改工作池并补测试/基准

测试: 在 backend/ 下运行 go test ./...

											
										
										
											2025-12-31 08:50:12 +08:00
+								package service
 								import (
-												Fix/multiple issues (#24)

* fix(gemini): 修复 google_one OAuth 配置和 scopes 问题

- 修复 google_one 类型在 ExchangeCode 和 RefreshToken 中使用内置客户端
- 添加 DefaultGoogleOneScopes，包含 generative-language 和 drive.readonly 权限
- 在 EffectiveOAuthConfig 中为 google_one 类型使用专门的 scopes
- 将 docker-compose.override.yml 重命名为 .example 并添加到 .gitignore
- 完善 docker-compose.override.yml.example 示例文档

解决问题：
1. google_one OAuth 授权后 API 调用返回 403 权限不足
2. 缺少访问 Gemini API 所需的 generative-language scope
3. 缺少获取 Drive 存储配额所需的 drive.readonly scope

* fix(antigravity): 完全跳过 Claude 模型的所有 thinking 块

问题分析：
- 当前代码尝试保留有 signature 的 thinking 块
- 但 Vertex AI 的 signature 是完整性令牌，无法在本地验证
- 导致 400 错误：Invalid signature in thinking block

根本原因：
1. thinking 功能已对非 Gemini 模型禁用 (isThinkingEnabled=false)
2. Vertex AI 要求原样重放 (thinking, signature) 对或完全不发送
3. 本地无法复制 Vertex 的加密验证逻辑

修复方案：
- 对 Claude 模型完全跳过所有 thinking 块（无论是否有 signature）
- 保持 Gemini 模型使用 dummy signature 的行为不变
- 更新测试用例以反映新的预期行为

影响：
- 消除 thinking 相关的 400 错误
- 与现有的 thinking 禁用策略保持一致
- 不影响 Gemini 模型的 thinking 功能

测试：
- ✅ TestBuildParts_ThinkingBlockWithoutSignature 全部通过
- ✅ TestBuildTools_CustomTypeTools 全部通过

参考：Codex review 建议

* fix(gateway): 修复 count_tokens 端点 400 错误

问题分析：
- count_tokens 请求包含 thinking 块时返回 400 错误
- 原因：thinking 块未被过滤，直接转发到上游 API
- 上游 API 拒绝无效的 thinking signature

根本原因：
1. /v1/messages 请求通过 TransformClaudeToGemini 过滤 thinking 块
2. count_tokens 请求绕过转换，直接转发原始请求体
3. 导致包含无效 signature 的 thinking 块被发送到上游

修复方案：
- 创建 FilterThinkingBlocks 工具函数
- 在 buildCountTokensRequest 中应用过滤（1 行修改）
- 与 /v1/messages 行为保持一致

实现细节：
- FilterThinkingBlocks: 解析 JSON，过滤 thinking 块，重新序列化
- 失败安全：解析/序列化失败时返回原始请求体
- 性能优化：仅在发现 thinking 块时重新序列化

测试：
- ✅ 6 个单元测试全部通过
- ✅ 覆盖正常过滤、无 thinking 块、无效 JSON 等场景
- ✅ 现有测试不受影响

影响：
- 消除 count_tokens 的 400 错误
- 不影响 Antigravity 账号（仍返回模拟响应）
- 适用于所有账号类型（OAuth、API Key）

文件修改：
- backend/internal/service/gateway_request.go: +62 行（新函数）
- backend/internal/service/gateway_service.go: +2 行（应用过滤）
- backend/internal/service/gateway_request_test.go: +62 行（测试）

* fix(gateway): 增强 thinking 块过滤逻辑

基于 Codex 分析和建议的改进：

问题分析：
- 新错误：signature: Field required（signature 字段缺失）
- 旧错误：Invalid signature（signature 存在但无效）
- 两者都说明 thinking 块在请求中是危险的

Codex 建议：
- 保持 Option A：完全跳过所有 thinking 块
- 原因：thinking 块应该是只输出的，除非有服务端来源证明
- 在无状态代理中，无法安全区分上游来源 vs 客户端注入

改进内容：

1. 增强 FilterThinkingBlocks 函数
   - 过滤显式的 thinking 块：{"type":"thinking", ...}
   - 过滤无 type 的 thinking 对象：{"thinking": {...}}
   - 保留 tool_use 等其他类型块中的 thinking 字段
   - 修复：只在实际过滤时更新 content 数组

2. 扩展过滤范围
   - 将 FilterThinkingBlocks 应用到 /v1/messages 主路径
   - 之前只应用于 count_tokens，现在两个端点都过滤
   - 防止所有端点的 thinking 相关 400 错误

3. 改进测试
   - 新增：过滤无 type discriminator 的 thinking 块
   - 新增：不过滤 tool_use 中的 thinking 字段
   - 使用 containsThinkingBlock 辅助函数验证

测试：
- ✅ 8 个测试用例全部通过
- ✅ 覆盖各种 thinking 块格式
- ✅ 确保不误伤其他类型的块

影响：
- 消除 signature required 和 invalid signature 错误
- 统一 /v1/messages 和 count_tokens 的行为
- 更健壮的 thinking 块检测逻辑

参考：Codex review 和代码改进

* refactor: 根据 Codex 审查建议进行代码优化

基于 Codex 代码审查的 P1 和 P2 改进：

P1 改进（重要问题）：

1. 优化日志输出
   - 移除 thinking 块跳过时的 log.Printf
   - 避免高频请求下的日志噪音
   - 添加注释说明可通过指标监控

2. 清理遗留代码
   - 删除未使用的 isValidThoughtSignature 函数（27行）
   - 该函数在改为完全跳过 thinking 块后不再需要

P2 改进（性能优化）：

3. 添加快速路径检查
   - 在 FilterThinkingBlocks 中添加 bytes.Contains 预检查
   - 如果请求体不包含 "thinking" 字符串，直接返回
   - 避免不必要的 JSON 解析，提升性能

技术细节：
- request_transformer.go: -27行（删除函数），+1行（优化注释）
- gateway_request.go: +5行（快速路径 + bytes 导入）

测试：
- ✅ TestBuildParts_ThinkingBlockWithoutSignature 全部通过
- ✅ TestFilterThinkingBlocks 全部通过（8个测试用例）

影响：
- 减少日志噪音
- 提升性能（快速路径）
- 代码更简洁（删除未使用代码）

参考：Codex 代码审查建议

* fix: 修复 golangci-lint 检查问题

- 格式化 gateway_request_test.go
- 使用 switch 语句替代 if-else 链（staticcheck QF1003）

* fix(antigravity): 修复 thinking signature 处理并实现 Auto 模式降级

问题分析：
1. 原先代码错误地禁用了 Claude via Vertex 的 thinkingConfig
2. 历史 thinking 块的 signature 被完全跳过，导致验证失败
3. 跨模型混用时 dummy signature 会导致 400 错误

修复内容：

**request_transformer.go**：
- 删除第 38-43 行的错误逻辑（禁用 thinkingConfig）
- 引入 thoughtSignatureMode（Preserve/Dummy）策略
- Claude 模式：透传真实 signature，过滤空/dummy
- Gemini 模式：使用 dummy signature
- 支持 signature-only thinking 块
- tool_use 的 signature 也透传

**antigravity_gateway_service.go**：
- 新增 isSignatureRelatedError() 检测 signature 相关错误
- 新增 stripThinkingFromClaudeRequest() 移除 thinking 块
- 实现 Auto 模式：检测 400 + signature 关键词时自动降级重试
- 重试时完全移除 thinking 配置和消息中的 thinking 块
- 最多重试一次，避免循环

**测试**：
- 更新并新增测试覆盖 Claude preserve/Gemini dummy 模式
- 新增 tool_use signature 处理测试
- 所有测试通过（6/6）

影响：
- ✅ Claude via Vertex 可以正常使用 thinking 功能
- ✅ 历史 signature 正确透传，避免验证失败
- ✅ 跨模型混用时自动过滤无效 signature
- ✅ 错误驱动降级，自动修复 signature 问题
- ✅ 不影响纯 Claude API 和其他渠道

参考：Codex 深度分析和实现建议

* fix(lint): 修复 gofmt 格式问题

* fix(antigravity): 修复 stripThinkingFromClaudeRequest 遗漏 untyped thinking blocks

问题：
- Codex 审查指出 stripThinkingFromClaudeRequest 只移除了 type="thinking" 的块
- 没有处理没有 type 字段的 thinking 对象（如 {"thinking": "...", "signature": "..."}）
- 导致重试时仍包含无效 thinking 块，上游 400 错误持续

修复：
- 添加检查：跳过没有 type 但有 thinking 字段的块
- 现在会移除两种格式：
  1. {"type": "thinking", "thinking": "...", "signature": "..."}
  2. {"thinking": "...", "signature": "..."}（untyped）

测试：所有测试通过

参考：Codex P1 审查意见
											
										
										
											2026-01-02 17:47:49 +08:00
+									"bytes"
-												perf(后端): 完成性能优化与连接池配置

新增 DB/Redis 连接池配置与校验，并补充单测

网关请求体大小限制与 413 处理

HTTP/req 客户端池化并调整上游连接池默认值

并发槽位改为 ZSET+Lua 与指数退避

用量统计改 SQL 聚合并新增索引迁移

计费缓存写入改工作池并补测试/基准

测试: 在 backend/ 下运行 go test ./...

											
										
										
											2025-12-31 08:50:12 +08:00
+									"encoding/json"
 									"fmt"
 								)
 								// ParsedRequest 保存网关请求的预解析结果
 								//
 								// 性能优化说明：
 								// 原实现在多个位置重复解析请求体（Handler、Service 各解析一次）：
 								// 1. gateway_handler.go 解析获取 model 和 stream
 								// 2. gateway_service.go 再次解析获取 system、messages、metadata
 								// 3. GenerateSessionHash 又一次解析获取会话哈希所需字段
 								//
 								// 新实现一次解析，多处复用：
 								// 1. 在 Handler 层统一调用 ParseGatewayRequest 一次性解析
 								// 2. 将解析结果 ParsedRequest 传递给 Service 层
 								// 3. 避免重复 json.Unmarshal，减少 CPU 和内存开销
 								type ParsedRequest struct {
 									Body           []byte // 原始请求体（保留用于转发）
 									Model          string // 请求的模型名称
 									Stream         bool   // 是否为流式请求
 									MetadataUserID string // metadata.user_id（用于会话亲和）
 									System         any    // system 字段内容
 									Messages       []any  // messages 数组
-												fix(服务): 修复system判定、统计时区与缓存日志

- system 字段存在即视为显式提供，避免 null 触发默认注入
- 日统计分组显式使用应用时区，缺失时从 TZ 回退到 UTC
- 缓存写入队列丢弃日志节流汇总，关键任务同步回退

测试: go test ./internal/service -run TestBillingCacheServiceQueueHighLoad

											
										
										
											2025-12-31 10:17:38 +08:00
+									HasSystem      bool   // 是否包含 system 字段（包含 null 也视为显式传入）
-												perf(后端): 完成性能优化与连接池配置

新增 DB/Redis 连接池配置与校验，并补充单测

网关请求体大小限制与 413 处理

HTTP/req 客户端池化并调整上游连接池默认值

并发槽位改为 ZSET+Lua 与指数退避

用量统计改 SQL 聚合并新增索引迁移

计费缓存写入改工作池并补测试/基准

测试: 在 backend/ 下运行 go test ./...

											
										
										
											2025-12-31 08:50:12 +08:00
+								}
 								// ParseGatewayRequest 解析网关请求体并返回结构化结果
 								// 性能优化：一次解析提取所有需要的字段，避免重复 Unmarshal
 								func ParseGatewayRequest(body []byte) (*ParsedRequest, error) {
 									var req map[string]any
 									if err := json.Unmarshal(body, &req); err != nil {
 										return nil, err
 									}
 									parsed := &ParsedRequest{
 										Body: body,
 									}
 									if rawModel, exists := req["model"]; exists {
 										model, ok := rawModel.(string)
 										if !ok {
 											return nil, fmt.Errorf("invalid model field type")
 										}
 										parsed.Model = model
 									}
 									if rawStream, exists := req["stream"]; exists {
 										stream, ok := rawStream.(bool)
 										if !ok {
 											return nil, fmt.Errorf("invalid stream field type")
 										}
 										parsed.Stream = stream
 									}
 									if metadata, ok := req["metadata"].(map[string]any); ok {
 										if userID, ok := metadata["user_id"].(string); ok {
 											parsed.MetadataUserID = userID
 										}
 									}
-												fix(服务): 修复system判定、统计时区与缓存日志

- system 字段存在即视为显式提供，避免 null 触发默认注入
- 日统计分组显式使用应用时区，缺失时从 TZ 回退到 UTC
- 缓存写入队列丢弃日志节流汇总，关键任务同步回退

测试: go test ./internal/service -run TestBillingCacheServiceQueueHighLoad

											
										
										
											2025-12-31 10:17:38 +08:00
+									// system 字段只要存在就视为显式提供（即使为 null），
 									// 以避免客户端传 null 时被默认 system 误注入。
 									if system, ok := req["system"]; ok {
-												perf(后端): 完成性能优化与连接池配置

新增 DB/Redis 连接池配置与校验，并补充单测

网关请求体大小限制与 413 处理

HTTP/req 客户端池化并调整上游连接池默认值

并发槽位改为 ZSET+Lua 与指数退避

用量统计改 SQL 聚合并新增索引迁移

计费缓存写入改工作池并补测试/基准

测试: 在 backend/ 下运行 go test ./...

											
										
										
											2025-12-31 08:50:12 +08:00
+										parsed.HasSystem = true
 										parsed.System = system
 									}
 									if messages, ok := req["messages"].([]any); ok {
 										parsed.Messages = messages
 									}
 									return parsed, nil
 								}
-												Fix/multiple issues (#24)

* fix(gemini): 修复 google_one OAuth 配置和 scopes 问题

- 修复 google_one 类型在 ExchangeCode 和 RefreshToken 中使用内置客户端
- 添加 DefaultGoogleOneScopes，包含 generative-language 和 drive.readonly 权限
- 在 EffectiveOAuthConfig 中为 google_one 类型使用专门的 scopes
- 将 docker-compose.override.yml 重命名为 .example 并添加到 .gitignore
- 完善 docker-compose.override.yml.example 示例文档

解决问题：
1. google_one OAuth 授权后 API 调用返回 403 权限不足
2. 缺少访问 Gemini API 所需的 generative-language scope
3. 缺少获取 Drive 存储配额所需的 drive.readonly scope

* fix(antigravity): 完全跳过 Claude 模型的所有 thinking 块

问题分析：
- 当前代码尝试保留有 signature 的 thinking 块
- 但 Vertex AI 的 signature 是完整性令牌，无法在本地验证
- 导致 400 错误：Invalid signature in thinking block

根本原因：
1. thinking 功能已对非 Gemini 模型禁用 (isThinkingEnabled=false)
2. Vertex AI 要求原样重放 (thinking, signature) 对或完全不发送
3. 本地无法复制 Vertex 的加密验证逻辑

修复方案：
- 对 Claude 模型完全跳过所有 thinking 块（无论是否有 signature）
- 保持 Gemini 模型使用 dummy signature 的行为不变
- 更新测试用例以反映新的预期行为

影响：
- 消除 thinking 相关的 400 错误
- 与现有的 thinking 禁用策略保持一致
- 不影响 Gemini 模型的 thinking 功能

测试：
- ✅ TestBuildParts_ThinkingBlockWithoutSignature 全部通过
- ✅ TestBuildTools_CustomTypeTools 全部通过

参考：Codex review 建议

* fix(gateway): 修复 count_tokens 端点 400 错误

问题分析：
- count_tokens 请求包含 thinking 块时返回 400 错误
- 原因：thinking 块未被过滤，直接转发到上游 API
- 上游 API 拒绝无效的 thinking signature

根本原因：
1. /v1/messages 请求通过 TransformClaudeToGemini 过滤 thinking 块
2. count_tokens 请求绕过转换，直接转发原始请求体
3. 导致包含无效 signature 的 thinking 块被发送到上游

修复方案：
- 创建 FilterThinkingBlocks 工具函数
- 在 buildCountTokensRequest 中应用过滤（1 行修改）
- 与 /v1/messages 行为保持一致

实现细节：
- FilterThinkingBlocks: 解析 JSON，过滤 thinking 块，重新序列化
- 失败安全：解析/序列化失败时返回原始请求体
- 性能优化：仅在发现 thinking 块时重新序列化

测试：
- ✅ 6 个单元测试全部通过
- ✅ 覆盖正常过滤、无 thinking 块、无效 JSON 等场景
- ✅ 现有测试不受影响

影响：
- 消除 count_tokens 的 400 错误
- 不影响 Antigravity 账号（仍返回模拟响应）
- 适用于所有账号类型（OAuth、API Key）

文件修改：
- backend/internal/service/gateway_request.go: +62 行（新函数）
- backend/internal/service/gateway_service.go: +2 行（应用过滤）
- backend/internal/service/gateway_request_test.go: +62 行（测试）

* fix(gateway): 增强 thinking 块过滤逻辑

基于 Codex 分析和建议的改进：

问题分析：
- 新错误：signature: Field required（signature 字段缺失）
- 旧错误：Invalid signature（signature 存在但无效）
- 两者都说明 thinking 块在请求中是危险的

Codex 建议：
- 保持 Option A：完全跳过所有 thinking 块
- 原因：thinking 块应该是只输出的，除非有服务端来源证明
- 在无状态代理中，无法安全区分上游来源 vs 客户端注入

改进内容：

1. 增强 FilterThinkingBlocks 函数
   - 过滤显式的 thinking 块：{"type":"thinking", ...}
   - 过滤无 type 的 thinking 对象：{"thinking": {...}}
   - 保留 tool_use 等其他类型块中的 thinking 字段
   - 修复：只在实际过滤时更新 content 数组

2. 扩展过滤范围
   - 将 FilterThinkingBlocks 应用到 /v1/messages 主路径
   - 之前只应用于 count_tokens，现在两个端点都过滤
   - 防止所有端点的 thinking 相关 400 错误

3. 改进测试
   - 新增：过滤无 type discriminator 的 thinking 块
   - 新增：不过滤 tool_use 中的 thinking 字段
   - 使用 containsThinkingBlock 辅助函数验证

测试：
- ✅ 8 个测试用例全部通过
- ✅ 覆盖各种 thinking 块格式
- ✅ 确保不误伤其他类型的块

影响：
- 消除 signature required 和 invalid signature 错误
- 统一 /v1/messages 和 count_tokens 的行为
- 更健壮的 thinking 块检测逻辑

参考：Codex review 和代码改进

* refactor: 根据 Codex 审查建议进行代码优化

基于 Codex 代码审查的 P1 和 P2 改进：

P1 改进（重要问题）：

1. 优化日志输出
   - 移除 thinking 块跳过时的 log.Printf
   - 避免高频请求下的日志噪音
   - 添加注释说明可通过指标监控

2. 清理遗留代码
   - 删除未使用的 isValidThoughtSignature 函数（27行）
   - 该函数在改为完全跳过 thinking 块后不再需要

P2 改进（性能优化）：

3. 添加快速路径检查
   - 在 FilterThinkingBlocks 中添加 bytes.Contains 预检查
   - 如果请求体不包含 "thinking" 字符串，直接返回
   - 避免不必要的 JSON 解析，提升性能

技术细节：
- request_transformer.go: -27行（删除函数），+1行（优化注释）
- gateway_request.go: +5行（快速路径 + bytes 导入）

测试：
- ✅ TestBuildParts_ThinkingBlockWithoutSignature 全部通过
- ✅ TestFilterThinkingBlocks 全部通过（8个测试用例）

影响：
- 减少日志噪音
- 提升性能（快速路径）
- 代码更简洁（删除未使用代码）

参考：Codex 代码审查建议

* fix: 修复 golangci-lint 检查问题

- 格式化 gateway_request_test.go
- 使用 switch 语句替代 if-else 链（staticcheck QF1003）

* fix(antigravity): 修复 thinking signature 处理并实现 Auto 模式降级

问题分析：
1. 原先代码错误地禁用了 Claude via Vertex 的 thinkingConfig
2. 历史 thinking 块的 signature 被完全跳过，导致验证失败
3. 跨模型混用时 dummy signature 会导致 400 错误

修复内容：

**request_transformer.go**：
- 删除第 38-43 行的错误逻辑（禁用 thinkingConfig）
- 引入 thoughtSignatureMode（Preserve/Dummy）策略
- Claude 模式：透传真实 signature，过滤空/dummy
- Gemini 模式：使用 dummy signature
- 支持 signature-only thinking 块
- tool_use 的 signature 也透传

**antigravity_gateway_service.go**：
- 新增 isSignatureRelatedError() 检测 signature 相关错误
- 新增 stripThinkingFromClaudeRequest() 移除 thinking 块
- 实现 Auto 模式：检测 400 + signature 关键词时自动降级重试
- 重试时完全移除 thinking 配置和消息中的 thinking 块
- 最多重试一次，避免循环

**测试**：
- 更新并新增测试覆盖 Claude preserve/Gemini dummy 模式
- 新增 tool_use signature 处理测试
- 所有测试通过（6/6）

影响：
- ✅ Claude via Vertex 可以正常使用 thinking 功能
- ✅ 历史 signature 正确透传，避免验证失败
- ✅ 跨模型混用时自动过滤无效 signature
- ✅ 错误驱动降级，自动修复 signature 问题
- ✅ 不影响纯 Claude API 和其他渠道

参考：Codex 深度分析和实现建议

* fix(lint): 修复 gofmt 格式问题

* fix(antigravity): 修复 stripThinkingFromClaudeRequest 遗漏 untyped thinking blocks

问题：
- Codex 审查指出 stripThinkingFromClaudeRequest 只移除了 type="thinking" 的块
- 没有处理没有 type 字段的 thinking 对象（如 {"thinking": "...", "signature": "..."}）
- 导致重试时仍包含无效 thinking 块，上游 400 错误持续

修复：
- 添加检查：跳过没有 type 但有 thinking 字段的块
- 现在会移除两种格式：
  1. {"type": "thinking", "thinking": "...", "signature": "..."}
  2. {"thinking": "...", "signature": "..."}（untyped）

测试：所有测试通过

参考：Codex P1 审查意见
											
										
										
											2026-01-02 17:47:49 +08:00
 								// FilterThinkingBlocks removes thinking blocks from request body
 								// Returns filtered body or original body if filtering fails (fail-safe)
 								// This prevents 400 errors from invalid thinking block signatures
-												perf(gateway): 优化负载感知调度

主要改进：
- 优化负载感知调度的准确性和响应速度
- 将 AccountUsageService 的包级缓存改为依赖注入
- 修复 SSE/JSON 转义和 nil 安全问题
- 恢复 Google One 功能兼容性

											
										
										
											2026-01-03 06:32:51 -08:00
+								//
 								// Strategy:
 								//   - When thinking.type != "enabled": Remove all thinking blocks
 								//   - When thinking.type == "enabled": Only remove thinking blocks without valid signatures
 								//     (blocks with missing/empty/dummy signatures that would cause 400 errors)
-												Fix/multiple issues (#24)

* fix(gemini): 修复 google_one OAuth 配置和 scopes 问题

- 修复 google_one 类型在 ExchangeCode 和 RefreshToken 中使用内置客户端
- 添加 DefaultGoogleOneScopes，包含 generative-language 和 drive.readonly 权限
- 在 EffectiveOAuthConfig 中为 google_one 类型使用专门的 scopes
- 将 docker-compose.override.yml 重命名为 .example 并添加到 .gitignore
- 完善 docker-compose.override.yml.example 示例文档

解决问题：
1. google_one OAuth 授权后 API 调用返回 403 权限不足
2. 缺少访问 Gemini API 所需的 generative-language scope
3. 缺少获取 Drive 存储配额所需的 drive.readonly scope

* fix(antigravity): 完全跳过 Claude 模型的所有 thinking 块

问题分析：
- 当前代码尝试保留有 signature 的 thinking 块
- 但 Vertex AI 的 signature 是完整性令牌，无法在本地验证
- 导致 400 错误：Invalid signature in thinking block

根本原因：
1. thinking 功能已对非 Gemini 模型禁用 (isThinkingEnabled=false)
2. Vertex AI 要求原样重放 (thinking, signature) 对或完全不发送
3. 本地无法复制 Vertex 的加密验证逻辑

修复方案：
- 对 Claude 模型完全跳过所有 thinking 块（无论是否有 signature）
- 保持 Gemini 模型使用 dummy signature 的行为不变
- 更新测试用例以反映新的预期行为

影响：
- 消除 thinking 相关的 400 错误
- 与现有的 thinking 禁用策略保持一致
- 不影响 Gemini 模型的 thinking 功能

测试：
- ✅ TestBuildParts_ThinkingBlockWithoutSignature 全部通过
- ✅ TestBuildTools_CustomTypeTools 全部通过

参考：Codex review 建议

* fix(gateway): 修复 count_tokens 端点 400 错误

问题分析：
- count_tokens 请求包含 thinking 块时返回 400 错误
- 原因：thinking 块未被过滤，直接转发到上游 API
- 上游 API 拒绝无效的 thinking signature

根本原因：
1. /v1/messages 请求通过 TransformClaudeToGemini 过滤 thinking 块
2. count_tokens 请求绕过转换，直接转发原始请求体
3. 导致包含无效 signature 的 thinking 块被发送到上游

修复方案：
- 创建 FilterThinkingBlocks 工具函数
- 在 buildCountTokensRequest 中应用过滤（1 行修改）
- 与 /v1/messages 行为保持一致

实现细节：
- FilterThinkingBlocks: 解析 JSON，过滤 thinking 块，重新序列化
- 失败安全：解析/序列化失败时返回原始请求体
- 性能优化：仅在发现 thinking 块时重新序列化

测试：
- ✅ 6 个单元测试全部通过
- ✅ 覆盖正常过滤、无 thinking 块、无效 JSON 等场景
- ✅ 现有测试不受影响

影响：
- 消除 count_tokens 的 400 错误
- 不影响 Antigravity 账号（仍返回模拟响应）
- 适用于所有账号类型（OAuth、API Key）

文件修改：
- backend/internal/service/gateway_request.go: +62 行（新函数）
- backend/internal/service/gateway_service.go: +2 行（应用过滤）
- backend/internal/service/gateway_request_test.go: +62 行（测试）

* fix(gateway): 增强 thinking 块过滤逻辑

基于 Codex 分析和建议的改进：

问题分析：
- 新错误：signature: Field required（signature 字段缺失）
- 旧错误：Invalid signature（signature 存在但无效）
- 两者都说明 thinking 块在请求中是危险的

Codex 建议：
- 保持 Option A：完全跳过所有 thinking 块
- 原因：thinking 块应该是只输出的，除非有服务端来源证明
- 在无状态代理中，无法安全区分上游来源 vs 客户端注入

改进内容：

1. 增强 FilterThinkingBlocks 函数
   - 过滤显式的 thinking 块：{"type":"thinking", ...}
   - 过滤无 type 的 thinking 对象：{"thinking": {...}}
   - 保留 tool_use 等其他类型块中的 thinking 字段
   - 修复：只在实际过滤时更新 content 数组

2. 扩展过滤范围
   - 将 FilterThinkingBlocks 应用到 /v1/messages 主路径
   - 之前只应用于 count_tokens，现在两个端点都过滤
   - 防止所有端点的 thinking 相关 400 错误

3. 改进测试
   - 新增：过滤无 type discriminator 的 thinking 块
   - 新增：不过滤 tool_use 中的 thinking 字段
   - 使用 containsThinkingBlock 辅助函数验证

测试：
- ✅ 8 个测试用例全部通过
- ✅ 覆盖各种 thinking 块格式
- ✅ 确保不误伤其他类型的块

影响：
- 消除 signature required 和 invalid signature 错误
- 统一 /v1/messages 和 count_tokens 的行为
- 更健壮的 thinking 块检测逻辑

参考：Codex review 和代码改进

* refactor: 根据 Codex 审查建议进行代码优化

基于 Codex 代码审查的 P1 和 P2 改进：

P1 改进（重要问题）：

1. 优化日志输出
   - 移除 thinking 块跳过时的 log.Printf
   - 避免高频请求下的日志噪音
   - 添加注释说明可通过指标监控

2. 清理遗留代码
   - 删除未使用的 isValidThoughtSignature 函数（27行）
   - 该函数在改为完全跳过 thinking 块后不再需要

P2 改进（性能优化）：

3. 添加快速路径检查
   - 在 FilterThinkingBlocks 中添加 bytes.Contains 预检查
   - 如果请求体不包含 "thinking" 字符串，直接返回
   - 避免不必要的 JSON 解析，提升性能

技术细节：
- request_transformer.go: -27行（删除函数），+1行（优化注释）
- gateway_request.go: +5行（快速路径 + bytes 导入）

测试：
- ✅ TestBuildParts_ThinkingBlockWithoutSignature 全部通过
- ✅ TestFilterThinkingBlocks 全部通过（8个测试用例）

影响：
- 减少日志噪音
- 提升性能（快速路径）
- 代码更简洁（删除未使用代码）

参考：Codex 代码审查建议

* fix: 修复 golangci-lint 检查问题

- 格式化 gateway_request_test.go
- 使用 switch 语句替代 if-else 链（staticcheck QF1003）

* fix(antigravity): 修复 thinking signature 处理并实现 Auto 模式降级

问题分析：
1. 原先代码错误地禁用了 Claude via Vertex 的 thinkingConfig
2. 历史 thinking 块的 signature 被完全跳过，导致验证失败
3. 跨模型混用时 dummy signature 会导致 400 错误

修复内容：

**request_transformer.go**：
- 删除第 38-43 行的错误逻辑（禁用 thinkingConfig）
- 引入 thoughtSignatureMode（Preserve/Dummy）策略
- Claude 模式：透传真实 signature，过滤空/dummy
- Gemini 模式：使用 dummy signature
- 支持 signature-only thinking 块
- tool_use 的 signature 也透传

**antigravity_gateway_service.go**：
- 新增 isSignatureRelatedError() 检测 signature 相关错误
- 新增 stripThinkingFromClaudeRequest() 移除 thinking 块
- 实现 Auto 模式：检测 400 + signature 关键词时自动降级重试
- 重试时完全移除 thinking 配置和消息中的 thinking 块
- 最多重试一次，避免循环

**测试**：
- 更新并新增测试覆盖 Claude preserve/Gemini dummy 模式
- 新增 tool_use signature 处理测试
- 所有测试通过（6/6）

影响：
- ✅ Claude via Vertex 可以正常使用 thinking 功能
- ✅ 历史 signature 正确透传，避免验证失败
- ✅ 跨模型混用时自动过滤无效 signature
- ✅ 错误驱动降级，自动修复 signature 问题
- ✅ 不影响纯 Claude API 和其他渠道

参考：Codex 深度分析和实现建议

* fix(lint): 修复 gofmt 格式问题

* fix(antigravity): 修复 stripThinkingFromClaudeRequest 遗漏 untyped thinking blocks

问题：
- Codex 审查指出 stripThinkingFromClaudeRequest 只移除了 type="thinking" 的块
- 没有处理没有 type 字段的 thinking 对象（如 {"thinking": "...", "signature": "..."}）
- 导致重试时仍包含无效 thinking 块，上游 400 错误持续

修复：
- 添加检查：跳过没有 type 但有 thinking 字段的块
- 现在会移除两种格式：
  1. {"type": "thinking", "thinking": "...", "signature": "..."}
  2. {"thinking": "...", "signature": "..."}（untyped）

测试：所有测试通过

参考：Codex P1 审查意见
											
										
										
											2026-01-02 17:47:49 +08:00
+								func FilterThinkingBlocks(body []byte) []byte {
-												fix(thinking): 优化 thinking block 签名错误重试逻辑

- FilterThinkingBlocksForRetry: 将 thinking block 转换为 text block 而非直接删除
- stripThinkingFromClaudeRequest: Antigravity 网关同步采用转换策略
- 统一处理 thinking/redacted_thinking/无 type 字段的 thinking block
- 保留 thinking 内容，避免上下文丢失

											
										
										
											2026-01-03 17:07:54 -08:00
+									return filterThinkingBlocksInternal(body, false)
 								}
-												fix(backend): 改进 thinking/tool block 签名处理和重试策略

主要改动：
- request_transformer: thinking block 缺少签名时降级为文本而非丢弃，保留内容并在上层禁用 thinking mode
- antigravity_gateway_service: 新增两阶段降级策略，先处理 thinking blocks，如仍失败且涉及 tool 签名错误则进一步降级 tool blocks
- gateway_request: 新增 FilterSignatureSensitiveBlocksForRetry 函数，支持将 tool_use/tool_result 降级为文本
- gateway_request: 改进 FilterThinkingBlocksForRetry，禁用顶层 thinking 配置以避免结构约束冲突
- gateway_service: 实现保守的两阶段重试逻辑，优先保留内容，仅在必要时降级工具调用
- 新增 antigravity_gateway_service_test.go 测试签名块剥离逻辑
- 更新相关测试用例以验证降级行为

此修复解决了跨平台/账户切换时历史消息签名失效导致的请求失败问题。

											
										
										
											2026-01-04 22:32:36 +08:00
// FilterThinkingBlocksForRetry strips thinking-related constructs for retry scenarios.
//
// Why:
//   - Upstreams may reject historical `thinking`/`redacted_thinking` blocks due to invalid/missing signatures.
//   - Anthropic extended thinking has a structural constraint: when top-level `thinking` is enabled and the
//     final message is an assistant prefill, the assistant content must start with a thinking block.
//   - If we remove thinking blocks but keep top-level `thinking` enabled, we can trigger:
//     "Expected `thinking` or `redacted_thinking`, but found `text`"
//
// Strategy (B: preserve content as text):
//   - Disable top-level `thinking` (remove `thinking` field).
//   - Convert `thinking` blocks to `text` blocks (preserve the thinking content).
//   - Convert untyped blocks that carry a `thinking` field to `text` blocks as well; a non-string value is
//     kept as its JSON encoding, and a null/empty value is dropped.
//   - Remove `redacted_thinking` blocks (cannot be converted to text).
//   - Ensure no message ends up with empty content: an empty content array (emptied by filtering or sent
//     empty by the client) is replaced by a single placeholder text block.
//
// The original body is returned untouched when it is not valid JSON, has no `messages` array, needs no
// rewriting, or cannot be re-serialized. A rewritten body is produced by json.Marshal on a map, so object
// keys come out in sorted order rather than in the client's original order.
func FilterThinkingBlocksForRetry(body []byte) []byte {
	// Fast path: nothing to process. Plain substring probes are independent of how the client spaced
	// `"key" : value`, so no thinking block or empty array can slip past them. A false positive only
	// costs one JSON parse, because an unmodified request is still returned as the original bytes.
	if !bytes.Contains(body, []byte("thinking")) && !bytes.Contains(body, []byte("[]")) {
		return body
	}

	var req map[string]any
	if err := json.Unmarshal(body, &req); err != nil {
		return body
	}
	messages, ok := req["messages"].([]any)
	if !ok {
		return body
	}

	modified := false

	// Disable top-level thinking mode for retry to avoid structural/signature constraints upstream.
	if _, exists := req["thinking"]; exists {
		delete(req, "thinking")
		modified = true
	}

	newMessages := make([]any, 0, len(messages))
	for _, msg := range messages {
		msgMap, ok := msg.(map[string]any)
		if !ok {
			newMessages = append(newMessages, msg)
			continue
		}
		role, _ := msgMap["role"].(string)
		content, ok := msgMap["content"].([]any)
		if !ok {
			// String content or other format - keep as is.
			newMessages = append(newMessages, msg)
			continue
		}

		newContent := make([]any, 0, len(content))
		modifiedThisMsg := false
		for _, block := range content {
			blockMap, ok := block.(map[string]any)
			if !ok {
				newContent = append(newContent, block)
				continue
			}

			// A missing or non-string "type" yields "", which is handled as the untyped case below.
			blockType, _ := blockMap["type"].(string)
			switch blockType {
			case "thinking":
				// Keep the reasoning text as an ordinary text block; drop the block if it has none.
				modifiedThisMsg = true
				if thinkingText, _ := blockMap["thinking"].(string); thinkingText != "" {
					newContent = append(newContent, map[string]any{
						"type": "text",
						"text": thinkingText,
					})
				}
				continue
			case "redacted_thinking":
				modifiedThisMsg = true
				continue
			case "":
				// Blocks without a type discriminator but with a "thinking" field.
				if rawThinking, hasThinking := blockMap["thinking"]; hasThinking {
					modifiedThisMsg = true
					switch v := rawThinking.(type) {
					case string:
						if v != "" {
							newContent = append(newContent, map[string]any{"type": "text", "text": v})
						}
					default:
						// Skip JSON null so we never emit a text block that just says "null".
						if b, err := json.Marshal(v); err == nil && string(b) != "null" {
							newContent = append(newContent, map[string]any{"type": "text", "text": string(b)})
						}
					}
					continue
				}
			}
			newContent = append(newContent, block)
		}

		// Handle empty content: either from filtering or originally empty.
		if len(newContent) == 0 {
			placeholder := "(content removed)"
			if role == "assistant" {
				placeholder = "(assistant content removed)"
			}
			newContent = append(newContent, map[string]any{
				"type": "text",
				"text": placeholder,
			})
			modifiedThisMsg = true
		}
		if modifiedThisMsg {
			modified = true
			msgMap["content"] = newContent
		}
		newMessages = append(newMessages, msgMap)
	}

	// Avoid rewriting JSON when no changes are needed.
	if !modified {
		return body
	}
	req["messages"] = newMessages

	newBody, err := json.Marshal(req)
	if err != nil {
		return body
	}
	return newBody
}
 								// FilterSignatureSensitiveBlocksForRetry is a stronger retry filter for cases where upstream errors indicate
 								// signature/thought_signature validation issues involving tool blocks.
 								//
 								// It applies the same rewrites as FilterThinkingBlocksForRetry:
 								//   - Remove the top-level `thinking` field.
 								//   - Convert `thinking` blocks (typed, or untyped objects carrying a `thinking` field) to `text` blocks.
 								//   - Remove `redacted_thinking` blocks.
 								//   - Replace an empty content array (emptied by filtering or sent empty) with a placeholder text block.
 								//
 								// plus:
 								//   - Convert `tool_use` blocks to text (name/id/input) so we stop sending structured tool calls.
 								//   - Convert `tool_result` blocks to text so we keep tool results visible without tool semantics.
 								//
 								// Use this only when needed: converting tool blocks to text changes model behaviour and can increase the
 								// risk of prompt injection (tool output becomes plain conversation text).
 								//
 								// The original body is returned untouched when it is not valid JSON, has no `messages` array, needs no
 								// rewriting, or cannot be re-serialized. A rewritten body is produced by json.Marshal on a map, so object
 								// keys come out in sorted order rather than in the client's original order.
 								func FilterSignatureSensitiveBlocksForRetry(body []byte) []byte {
 									// Fast path: only run when we see likely relevant constructs. Plain substring probes do not depend
 									// on how the client spaced `"key" : value`; a false positive only costs one JSON parse because an
 									// unmodified request is still returned as the original bytes.
 									if !bytes.Contains(body, []byte("thinking")) &&
 										!bytes.Contains(body, []byte("tool_use")) &&
 										!bytes.Contains(body, []byte("tool_result")) &&
 										!bytes.Contains(body, []byte("[]")) {
 										return body
 									}
 									var req map[string]any
 									if err := json.Unmarshal(body, &req); err != nil {
 										return body
 									}
 									messages, ok := req["messages"].([]any)
 									if !ok {
 										return body
 									}
 									modified := false
 									// Disable top-level thinking for retry to avoid structural/signature constraints upstream.
 									if _, exists := req["thinking"]; exists {
 										delete(req, "thinking")
 										modified = true
 									}
 									newMessages := make([]any, 0, len(messages))
 									for _, msg := range messages {
 										msgMap, ok := msg.(map[string]any)
 										if !ok {
 											newMessages = append(newMessages, msg)
 											continue
 										}
 										role, _ := msgMap["role"].(string)
 										content, ok := msgMap["content"].([]any)
 										if !ok {
 											// String content or other format - keep as is.
 											newMessages = append(newMessages, msg)
 											continue
 										}
 										newContent := make([]any, 0, len(content))
 										modifiedThisMsg := false
 										for _, block := range content {
 											blockMap, ok := block.(map[string]any)
 											if !ok {
 												newContent = append(newContent, block)
 												continue
 											}
 											// A missing or non-string "type" yields "", which is handled as the untyped case below.
 											blockType, _ := blockMap["type"].(string)
 											switch blockType {
 											case "thinking":
 												// Keep the reasoning text as an ordinary text block; drop the block if it has none.
 												modifiedThisMsg = true
 												if thinkingText, _ := blockMap["thinking"].(string); thinkingText != "" {
 													newContent = append(newContent, map[string]any{"type": "text", "text": thinkingText})
 												}
 												continue
 											case "redacted_thinking":
 												modifiedThisMsg = true
 												continue
 											case "tool_use":
 												modifiedThisMsg = true
 												text := "(tool_use)"
 												if name, _ := blockMap["name"].(string); name != "" {
 													text += " name=" + name
 												}
 												if id, _ := blockMap["id"].(string); id != "" {
 													text += " id=" + id
 												}
 												// The input was decoded from JSON, so re-encoding is not expected to fail;
 												// if it does, or the input is absent/null, the input part is simply omitted.
 												if inputJSON, err := json.Marshal(blockMap["input"]); err == nil && string(inputJSON) != "null" {
 													text += " input=" + string(inputJSON)
 												}
 												newContent = append(newContent, map[string]any{"type": "text", "text": text})
 												continue
 											case "tool_result":
 												modifiedThisMsg = true
 												text := "(tool_result)"
 												if toolUseID, _ := blockMap["tool_use_id"].(string); toolUseID != "" {
 													text += " tool_use_id=" + toolUseID
 												}
 												if isError, _ := blockMap["is_error"].(bool); isError {
 													text += " is_error=true"
 												}
 												// The result payload is appended as its JSON encoding on a new line.
 												if resultJSON, err := json.Marshal(blockMap["content"]); err == nil && string(resultJSON) != "null" {
 													text += "\n" + string(resultJSON)
 												}
 												newContent = append(newContent, map[string]any{"type": "text", "text": text})
 												continue
 											case "":
 												// Blocks without a type discriminator but with a "thinking" field.
 												if rawThinking, hasThinking := blockMap["thinking"]; hasThinking {
 													modifiedThisMsg = true
 													switch v := rawThinking.(type) {
 													case string:
 														if v != "" {
 															newContent = append(newContent, map[string]any{"type": "text", "text": v})
 														}
 													default:
 														// Skip JSON null so we never emit a text block that just says "null".
 														if b, err := json.Marshal(v); err == nil && string(b) != "null" {
 															newContent = append(newContent, map[string]any{"type": "text", "text": string(b)})
 														}
 													}
 													continue
 												}
 											}
 											newContent = append(newContent, block)
 										}
 										// Handle empty content: either from filtering or originally empty.
 										if len(newContent) == 0 {
 											placeholder := "(content removed)"
 											if role == "assistant" {
 												placeholder = "(assistant content removed)"
 											}
 											newContent = append(newContent, map[string]any{"type": "text", "text": placeholder})
 											modifiedThisMsg = true
 										}
 										if modifiedThisMsg {
 											modified = true
 											msgMap["content"] = newContent
 										}
 										newMessages = append(newMessages, msgMap)
 									}
 									// Avoid rewriting JSON when no changes are needed.
 									if !modified {
 										return body
 									}
 									req["messages"] = newMessages
 									newBody, err := json.Marshal(req)
 									if err != nil {
 										return body
 									}
 									return newBody
 								}
 								// filterThinkingBlocksInternal removes invalid thinking blocks from request
 								// Strategy:
 								//   - When thinking.type != "enabled": Remove all thinking blocks
 								//   - When thinking.type == "enabled": Only remove thinking blocks without valid signatures
 								func filterThinkingBlocksInternal(body []byte, _ bool) []byte {
-												Fix/multiple issues (#24)

* fix(gemini): 修复 google_one OAuth 配置和 scopes 问题

- 修复 google_one 类型在 ExchangeCode 和 RefreshToken 中使用内置客户端
- 添加 DefaultGoogleOneScopes，包含 generative-language 和 drive.readonly 权限
- 在 EffectiveOAuthConfig 中为 google_one 类型使用专门的 scopes
- 将 docker-compose.override.yml 重命名为 .example 并添加到 .gitignore
- 完善 docker-compose.override.yml.example 示例文档

解决问题：
1. google_one OAuth 授权后 API 调用返回 403 权限不足
2. 缺少访问 Gemini API 所需的 generative-language scope
3. 缺少获取 Drive 存储配额所需的 drive.readonly scope

* fix(antigravity): 完全跳过 Claude 模型的所有 thinking 块

问题分析：
- 当前代码尝试保留有 signature 的 thinking 块
- 但 Vertex AI 的 signature 是完整性令牌，无法在本地验证
- 导致 400 错误：Invalid signature in thinking block

根本原因：
1. thinking 功能已对非 Gemini 模型禁用 (isThinkingEnabled=false)
2. Vertex AI 要求原样重放 (thinking, signature) 对或完全不发送
3. 本地无法复制 Vertex 的加密验证逻辑

修复方案：
- 对 Claude 模型完全跳过所有 thinking 块（无论是否有 signature）
- 保持 Gemini 模型使用 dummy signature 的行为不变
- 更新测试用例以反映新的预期行为

影响：
- 消除 thinking 相关的 400 错误
- 与现有的 thinking 禁用策略保持一致
- 不影响 Gemini 模型的 thinking 功能

测试：
- ✅ TestBuildParts_ThinkingBlockWithoutSignature 全部通过
- ✅ TestBuildTools_CustomTypeTools 全部通过

参考：Codex review 建议

* fix(gateway): 修复 count_tokens 端点 400 错误

问题分析：
- count_tokens 请求包含 thinking 块时返回 400 错误
- 原因：thinking 块未被过滤，直接转发到上游 API
- 上游 API 拒绝无效的 thinking signature

根本原因：
1. /v1/messages 请求通过 TransformClaudeToGemini 过滤 thinking 块
2. count_tokens 请求绕过转换，直接转发原始请求体
3. 导致包含无效 signature 的 thinking 块被发送到上游

修复方案：
- 创建 FilterThinkingBlocks 工具函数
- 在 buildCountTokensRequest 中应用过滤（1 行修改）
- 与 /v1/messages 行为保持一致

实现细节：
- FilterThinkingBlocks: 解析 JSON，过滤 thinking 块，重新序列化
- 失败安全：解析/序列化失败时返回原始请求体
- 性能优化：仅在发现 thinking 块时重新序列化

测试：
- ✅ 6 个单元测试全部通过
- ✅ 覆盖正常过滤、无 thinking 块、无效 JSON 等场景
- ✅ 现有测试不受影响

影响：
- 消除 count_tokens 的 400 错误
- 不影响 Antigravity 账号（仍返回模拟响应）
- 适用于所有账号类型（OAuth、API Key）

文件修改：
- backend/internal/service/gateway_request.go: +62 行（新函数）
- backend/internal/service/gateway_service.go: +2 行（应用过滤）
- backend/internal/service/gateway_request_test.go: +62 行（测试）

* fix(gateway): 增强 thinking 块过滤逻辑

基于 Codex 分析和建议的改进：

问题分析：
- 新错误：signature: Field required（signature 字段缺失）
- 旧错误：Invalid signature（signature 存在但无效）
- 两者都说明 thinking 块在请求中是危险的

Codex 建议：
- 保持 Option A：完全跳过所有 thinking 块
- 原因：thinking 块应该是只输出的，除非有服务端来源证明
- 在无状态代理中，无法安全区分上游来源 vs 客户端注入

改进内容：

1. 增强 FilterThinkingBlocks 函数
   - 过滤显式的 thinking 块：{"type":"thinking", ...}
   - 过滤无 type 的 thinking 对象：{"thinking": {...}}
   - 保留 tool_use 等其他类型块中的 thinking 字段
   - 修复：只在实际过滤时更新 content 数组

2. 扩展过滤范围
   - 将 FilterThinkingBlocks 应用到 /v1/messages 主路径
   - 之前只应用于 count_tokens，现在两个端点都过滤
   - 防止所有端点的 thinking 相关 400 错误

3. 改进测试
   - 新增：过滤无 type discriminator 的 thinking 块
   - 新增：不过滤 tool_use 中的 thinking 字段
   - 使用 containsThinkingBlock 辅助函数验证

测试：
- ✅ 8 个测试用例全部通过
- ✅ 覆盖各种 thinking 块格式
- ✅ 确保不误伤其他类型的块

影响：
- 消除 signature required 和 invalid signature 错误
- 统一 /v1/messages 和 count_tokens 的行为
- 更健壮的 thinking 块检测逻辑

参考：Codex review 和代码改进

* refactor: 根据 Codex 审查建议进行代码优化

基于 Codex 代码审查的 P1 和 P2 改进：

P1 改进（重要问题）：

1. 优化日志输出
   - 移除 thinking 块跳过时的 log.Printf
   - 避免高频请求下的日志噪音
   - 添加注释说明可通过指标监控

2. 清理遗留代码
   - 删除未使用的 isValidThoughtSignature 函数（27行）
   - 该函数在改为完全跳过 thinking 块后不再需要

P2 改进（性能优化）：

3. 添加快速路径检查
   - 在 FilterThinkingBlocks 中添加 bytes.Contains 预检查
   - 如果请求体不包含 "thinking" 字符串，直接返回
   - 避免不必要的 JSON 解析，提升性能

技术细节：
- request_transformer.go: -27行（删除函数），+1行（优化注释）
- gateway_request.go: +5行（快速路径 + bytes 导入）

测试：
- ✅ TestBuildParts_ThinkingBlockWithoutSignature 全部通过
- ✅ TestFilterThinkingBlocks 全部通过（8个测试用例）

影响：
- 减少日志噪音
- 提升性能（快速路径）
- 代码更简洁（删除未使用代码）

参考：Codex 代码审查建议

* fix: 修复 golangci-lint 检查问题

- 格式化 gateway_request_test.go
- 使用 switch 语句替代 if-else 链（staticcheck QF1003）

* fix(antigravity): 修复 thinking signature 处理并实现 Auto 模式降级

问题分析：
1. 原先代码错误地禁用了 Claude via Vertex 的 thinkingConfig
2. 历史 thinking 块的 signature 被完全跳过，导致验证失败
3. 跨模型混用时 dummy signature 会导致 400 错误

修复内容：

**request_transformer.go**：
- 删除第 38-43 行的错误逻辑（禁用 thinkingConfig）
- 引入 thoughtSignatureMode（Preserve/Dummy）策略
- Claude 模式：透传真实 signature，过滤空/dummy
- Gemini 模式：使用 dummy signature
- 支持 signature-only thinking 块
- tool_use 的 signature 也透传

**antigravity_gateway_service.go**：
- 新增 isSignatureRelatedError() 检测 signature 相关错误
- 新增 stripThinkingFromClaudeRequest() 移除 thinking 块
- 实现 Auto 模式：检测 400 + signature 关键词时自动降级重试
- 重试时完全移除 thinking 配置和消息中的 thinking 块
- 最多重试一次，避免循环

**测试**：
- 更新并新增测试覆盖 Claude preserve/Gemini dummy 模式
- 新增 tool_use signature 处理测试
- 所有测试通过（6/6）

影响：
- ✅ Claude via Vertex 可以正常使用 thinking 功能
- ✅ 历史 signature 正确透传，避免验证失败
- ✅ 跨模型混用时自动过滤无效 signature
- ✅ 错误驱动降级，自动修复 signature 问题
- ✅ 不影响纯 Claude API 和其他渠道

参考：Codex 深度分析和实现建议

* fix(lint): 修复 gofmt 格式问题

* fix(antigravity): 修复 stripThinkingFromClaudeRequest 遗漏 untyped thinking blocks

问题：
- Codex 审查指出 stripThinkingFromClaudeRequest 只移除了 type="thinking" 的块
- 没有处理没有 type 字段的 thinking 对象（如 {"thinking": "...", "signature": "..."}）
- 导致重试时仍包含无效 thinking 块，上游 400 错误持续

修复：
- 添加检查：跳过没有 type 但有 thinking 字段的块
- 现在会移除两种格式：
  1. {"type": "thinking", "thinking": "...", "signature": "..."}
  2. {"thinking": "...", "signature": "..."}（untyped）

测试：所有测试通过

参考：Codex P1 审查意见
											
										
										
											2026-01-02 17:47:49 +08:00
+									// Fast path: if body doesn't contain "thinking", skip parsing
-												perf(gateway): 优化负载感知调度

主要改进：
- 优化负载感知调度的准确性和响应速度
- 将 AccountUsageService 的包级缓存改为依赖注入
- 修复 SSE/JSON 转义和 nil 安全问题
- 恢复 Google One 功能兼容性

											
										
										
											2026-01-03 06:32:51 -08:00
+									if !bytes.Contains(body, []byte(`"type":"thinking"`)) &&
 										!bytes.Contains(body, []byte(`"type": "thinking"`)) &&
 										!bytes.Contains(body, []byte(`"type":"redacted_thinking"`)) &&
 										!bytes.Contains(body, []byte(`"type": "redacted_thinking"`)) &&
 										!bytes.Contains(body, []byte(`"thinking":`)) &&
 										!bytes.Contains(body, []byte(`"thinking" :`)) {
-												Fix/multiple issues (#24)

* fix(gemini): 修复 google_one OAuth 配置和 scopes 问题

- 修复 google_one 类型在 ExchangeCode 和 RefreshToken 中使用内置客户端
- 添加 DefaultGoogleOneScopes，包含 generative-language 和 drive.readonly 权限
- 在 EffectiveOAuthConfig 中为 google_one 类型使用专门的 scopes
- 将 docker-compose.override.yml 重命名为 .example 并添加到 .gitignore
- 完善 docker-compose.override.yml.example 示例文档

解决问题：
1. google_one OAuth 授权后 API 调用返回 403 权限不足
2. 缺少访问 Gemini API 所需的 generative-language scope
3. 缺少获取 Drive 存储配额所需的 drive.readonly scope

* fix(antigravity): 完全跳过 Claude 模型的所有 thinking 块

问题分析：
- 当前代码尝试保留有 signature 的 thinking 块
- 但 Vertex AI 的 signature 是完整性令牌，无法在本地验证
- 导致 400 错误：Invalid signature in thinking block

根本原因：
1. thinking 功能已对非 Gemini 模型禁用 (isThinkingEnabled=false)
2. Vertex AI 要求原样重放 (thinking, signature) 对或完全不发送
3. 本地无法复制 Vertex 的加密验证逻辑

修复方案：
- 对 Claude 模型完全跳过所有 thinking 块（无论是否有 signature）
- 保持 Gemini 模型使用 dummy signature 的行为不变
- 更新测试用例以反映新的预期行为

影响：
- 消除 thinking 相关的 400 错误
- 与现有的 thinking 禁用策略保持一致
- 不影响 Gemini 模型的 thinking 功能

测试：
- ✅ TestBuildParts_ThinkingBlockWithoutSignature 全部通过
- ✅ TestBuildTools_CustomTypeTools 全部通过

参考：Codex review 建议

* fix(gateway): 修复 count_tokens 端点 400 错误

问题分析：
- count_tokens 请求包含 thinking 块时返回 400 错误
- 原因：thinking 块未被过滤，直接转发到上游 API
- 上游 API 拒绝无效的 thinking signature

根本原因：
1. /v1/messages 请求通过 TransformClaudeToGemini 过滤 thinking 块
2. count_tokens 请求绕过转换，直接转发原始请求体
3. 导致包含无效 signature 的 thinking 块被发送到上游

修复方案：
- 创建 FilterThinkingBlocks 工具函数
- 在 buildCountTokensRequest 中应用过滤（1 行修改）
- 与 /v1/messages 行为保持一致

实现细节：
- FilterThinkingBlocks: 解析 JSON，过滤 thinking 块，重新序列化
- 失败安全：解析/序列化失败时返回原始请求体
- 性能优化：仅在发现 thinking 块时重新序列化

测试：
- ✅ 6 个单元测试全部通过
- ✅ 覆盖正常过滤、无 thinking 块、无效 JSON 等场景
- ✅ 现有测试不受影响

影响：
- 消除 count_tokens 的 400 错误
- 不影响 Antigravity 账号（仍返回模拟响应）
- 适用于所有账号类型（OAuth、API Key）

文件修改：
- backend/internal/service/gateway_request.go: +62 行（新函数）
- backend/internal/service/gateway_service.go: +2 行（应用过滤）
- backend/internal/service/gateway_request_test.go: +62 行（测试）

* fix(gateway): 增强 thinking 块过滤逻辑

基于 Codex 分析和建议的改进：

问题分析：
- 新错误：signature: Field required（signature 字段缺失）
- 旧错误：Invalid signature（signature 存在但无效）
- 两者都说明 thinking 块在请求中是危险的

Codex 建议：
- 保持 Option A：完全跳过所有 thinking 块
- 原因：thinking 块应该是只输出的，除非有服务端来源证明
- 在无状态代理中，无法安全区分上游来源 vs 客户端注入

改进内容：

1. 增强 FilterThinkingBlocks 函数
   - 过滤显式的 thinking 块：{"type":"thinking", ...}
   - 过滤无 type 的 thinking 对象：{"thinking": {...}}
   - 保留 tool_use 等其他类型块中的 thinking 字段
   - 修复：只在实际过滤时更新 content 数组

2. 扩展过滤范围
   - 将 FilterThinkingBlocks 应用到 /v1/messages 主路径
   - 之前只应用于 count_tokens，现在两个端点都过滤
   - 防止所有端点的 thinking 相关 400 错误

3. 改进测试
   - 新增：过滤无 type discriminator 的 thinking 块
   - 新增：不过滤 tool_use 中的 thinking 字段
   - 使用 containsThinkingBlock 辅助函数验证

测试：
- ✅ 8 个测试用例全部通过
- ✅ 覆盖各种 thinking 块格式
- ✅ 确保不误伤其他类型的块

影响：
- 消除 signature required 和 invalid signature 错误
- 统一 /v1/messages 和 count_tokens 的行为
- 更健壮的 thinking 块检测逻辑

参考：Codex review 和代码改进

* refactor: 根据 Codex 审查建议进行代码优化

基于 Codex 代码审查的 P1 和 P2 改进：

P1 改进（重要问题）：

1. 优化日志输出
   - 移除 thinking 块跳过时的 log.Printf
   - 避免高频请求下的日志噪音
   - 添加注释说明可通过指标监控

2. 清理遗留代码
   - 删除未使用的 isValidThoughtSignature 函数（27行）
   - 该函数在改为完全跳过 thinking 块后不再需要

P2 改进（性能优化）：

3. 添加快速路径检查
   - 在 FilterThinkingBlocks 中添加 bytes.Contains 预检查
   - 如果请求体不包含 "thinking" 字符串，直接返回
   - 避免不必要的 JSON 解析，提升性能

技术细节：
- request_transformer.go: -27行（删除函数），+1行（优化注释）
- gateway_request.go: +5行（快速路径 + bytes 导入）

测试：
- ✅ TestBuildParts_ThinkingBlockWithoutSignature 全部通过
- ✅ TestFilterThinkingBlocks 全部通过（8个测试用例）

影响：
- 减少日志噪音
- 提升性能（快速路径）
- 代码更简洁（删除未使用代码）

参考：Codex 代码审查建议

* fix: 修复 golangci-lint 检查问题

- 格式化 gateway_request_test.go
- 使用 switch 语句替代 if-else 链（staticcheck QF1003）

* fix(antigravity): 修复 thinking signature 处理并实现 Auto 模式降级

问题分析：
1. 原先代码错误地禁用了 Claude via Vertex 的 thinkingConfig
2. 历史 thinking 块的 signature 被完全跳过，导致验证失败
3. 跨模型混用时 dummy signature 会导致 400 错误

修复内容：

**request_transformer.go**：
- 删除第 38-43 行的错误逻辑（禁用 thinkingConfig）
- 引入 thoughtSignatureMode（Preserve/Dummy）策略
- Claude 模式：透传真实 signature，过滤空/dummy
- Gemini 模式：使用 dummy signature
- 支持 signature-only thinking 块
- tool_use 的 signature 也透传

**antigravity_gateway_service.go**：
- 新增 isSignatureRelatedError() 检测 signature 相关错误
- 新增 stripThinkingFromClaudeRequest() 移除 thinking 块
- 实现 Auto 模式：检测 400 + signature 关键词时自动降级重试
- 重试时完全移除 thinking 配置和消息中的 thinking 块
- 最多重试一次，避免循环

**测试**：
- 更新并新增测试覆盖 Claude preserve/Gemini dummy 模式
- 新增 tool_use signature 处理测试
- 所有测试通过（6/6）

影响：
- ✅ Claude via Vertex 可以正常使用 thinking 功能
- ✅ 历史 signature 正确透传，避免验证失败
- ✅ 跨模型混用时自动过滤无效 signature
- ✅ 错误驱动降级，自动修复 signature 问题
- ✅ 不影响纯 Claude API 和其他渠道

参考：Codex 深度分析和实现建议

* fix(lint): 修复 gofmt 格式问题

* fix(antigravity): 修复 stripThinkingFromClaudeRequest 遗漏 untyped thinking blocks

问题：
- Codex 审查指出 stripThinkingFromClaudeRequest 只移除了 type="thinking" 的块
- 没有处理没有 type 字段的 thinking 对象（如 {"thinking": "...", "signature": "..."}）
- 导致重试时仍包含无效 thinking 块，上游 400 错误持续

修复：
- 添加检查：跳过没有 type 但有 thinking 字段的块
- 现在会移除两种格式：
  1. {"type": "thinking", "thinking": "...", "signature": "..."}
  2. {"thinking": "...", "signature": "..."}（untyped）

测试：所有测试通过

参考：Codex P1 审查意见
											
										
										
											2026-01-02 17:47:49 +08:00
+										return body
 									}
 									var req map[string]any
 									if err := json.Unmarshal(body, &req); err != nil {
-												fix(thinking): 优化 thinking block 签名错误重试逻辑

- FilterThinkingBlocksForRetry: 将 thinking block 转换为 text block 而非直接删除
- stripThinkingFromClaudeRequest: Antigravity 网关同步采用转换策略
- 统一处理 thinking/redacted_thinking/无 type 字段的 thinking block
- 保留 thinking 内容，避免上下文丢失

											
										
										
											2026-01-03 17:07:54 -08:00
+										return body
-												Fix/multiple issues (#24)

* fix(gemini): 修复 google_one OAuth 配置和 scopes 问题

- 修复 google_one 类型在 ExchangeCode 和 RefreshToken 中使用内置客户端
- 添加 DefaultGoogleOneScopes，包含 generative-language 和 drive.readonly 权限
- 在 EffectiveOAuthConfig 中为 google_one 类型使用专门的 scopes
- 将 docker-compose.override.yml 重命名为 .example 并添加到 .gitignore
- 完善 docker-compose.override.yml.example 示例文档

解决问题：
1. google_one OAuth 授权后 API 调用返回 403 权限不足
2. 缺少访问 Gemini API 所需的 generative-language scope
3. 缺少获取 Drive 存储配额所需的 drive.readonly scope

* fix(antigravity): 完全跳过 Claude 模型的所有 thinking 块

问题分析：
- 当前代码尝试保留有 signature 的 thinking 块
- 但 Vertex AI 的 signature 是完整性令牌，无法在本地验证
- 导致 400 错误：Invalid signature in thinking block

根本原因：
1. thinking 功能已对非 Gemini 模型禁用 (isThinkingEnabled=false)
2. Vertex AI 要求原样重放 (thinking, signature) 对或完全不发送
3. 本地无法复制 Vertex 的加密验证逻辑

修复方案：
- 对 Claude 模型完全跳过所有 thinking 块（无论是否有 signature）
- 保持 Gemini 模型使用 dummy signature 的行为不变
- 更新测试用例以反映新的预期行为

影响：
- 消除 thinking 相关的 400 错误
- 与现有的 thinking 禁用策略保持一致
- 不影响 Gemini 模型的 thinking 功能

测试：
- ✅ TestBuildParts_ThinkingBlockWithoutSignature 全部通过
- ✅ TestBuildTools_CustomTypeTools 全部通过

参考：Codex review 建议

* fix(gateway): 修复 count_tokens 端点 400 错误

问题分析：
- count_tokens 请求包含 thinking 块时返回 400 错误
- 原因：thinking 块未被过滤，直接转发到上游 API
- 上游 API 拒绝无效的 thinking signature

根本原因：
1. /v1/messages 请求通过 TransformClaudeToGemini 过滤 thinking 块
2. count_tokens 请求绕过转换，直接转发原始请求体
3. 导致包含无效 signature 的 thinking 块被发送到上游

修复方案：
- 创建 FilterThinkingBlocks 工具函数
- 在 buildCountTokensRequest 中应用过滤（1 行修改）
- 与 /v1/messages 行为保持一致

实现细节：
- FilterThinkingBlocks: 解析 JSON，过滤 thinking 块，重新序列化
- 失败安全：解析/序列化失败时返回原始请求体
- 性能优化：仅在发现 thinking 块时重新序列化

测试：
- ✅ 6 个单元测试全部通过
- ✅ 覆盖正常过滤、无 thinking 块、无效 JSON 等场景
- ✅ 现有测试不受影响

影响：
- 消除 count_tokens 的 400 错误
- 不影响 Antigravity 账号（仍返回模拟响应）
- 适用于所有账号类型（OAuth、API Key）

文件修改：
- backend/internal/service/gateway_request.go: +62 行（新函数）
- backend/internal/service/gateway_service.go: +2 行（应用过滤）
- backend/internal/service/gateway_request_test.go: +62 行（测试）

* fix(gateway): 增强 thinking 块过滤逻辑

基于 Codex 分析和建议的改进：

问题分析：
- 新错误：signature: Field required（signature 字段缺失）
- 旧错误：Invalid signature（signature 存在但无效）
- 两者都说明 thinking 块在请求中是危险的

Codex 建议：
- 保持 Option A：完全跳过所有 thinking 块
- 原因：thinking 块应该是只输出的，除非有服务端来源证明
- 在无状态代理中，无法安全区分上游来源 vs 客户端注入

改进内容：

1. 增强 FilterThinkingBlocks 函数
   - 过滤显式的 thinking 块：{"type":"thinking", ...}
   - 过滤无 type 的 thinking 对象：{"thinking": {...}}
   - 保留 tool_use 等其他类型块中的 thinking 字段
   - 修复：只在实际过滤时更新 content 数组

2. 扩展过滤范围
   - 将 FilterThinkingBlocks 应用到 /v1/messages 主路径
   - 之前只应用于 count_tokens，现在两个端点都过滤
   - 防止所有端点的 thinking 相关 400 错误

3. 改进测试
   - 新增：过滤无 type discriminator 的 thinking 块
   - 新增：不过滤 tool_use 中的 thinking 字段
   - 使用 containsThinkingBlock 辅助函数验证

测试：
- ✅ 8 个测试用例全部通过
- ✅ 覆盖各种 thinking 块格式
- ✅ 确保不误伤其他类型的块

影响：
- 消除 signature required 和 invalid signature 错误
- 统一 /v1/messages 和 count_tokens 的行为
- 更健壮的 thinking 块检测逻辑

参考：Codex review 和代码改进

* refactor: 根据 Codex 审查建议进行代码优化

基于 Codex 代码审查的 P1 和 P2 改进：

P1 改进（重要问题）：

1. 优化日志输出
   - 移除 thinking 块跳过时的 log.Printf
   - 避免高频请求下的日志噪音
   - 添加注释说明可通过指标监控

2. 清理遗留代码
   - 删除未使用的 isValidThoughtSignature 函数（27行）
   - 该函数在改为完全跳过 thinking 块后不再需要

P2 改进（性能优化）：

3. 添加快速路径检查
   - 在 FilterThinkingBlocks 中添加 bytes.Contains 预检查
   - 如果请求体不包含 "thinking" 字符串，直接返回
   - 避免不必要的 JSON 解析，提升性能

技术细节：
- request_transformer.go: -27行（删除函数），+1行（优化注释）
- gateway_request.go: +5行（快速路径 + bytes 导入）

测试：
- ✅ TestBuildParts_ThinkingBlockWithoutSignature 全部通过
- ✅ TestFilterThinkingBlocks 全部通过（8个测试用例）

影响：
- 减少日志噪音
- 提升性能（快速路径）
- 代码更简洁（删除未使用代码）

参考：Codex 代码审查建议

* fix: 修复 golangci-lint 检查问题

- 格式化 gateway_request_test.go
- 使用 switch 语句替代 if-else 链（staticcheck QF1003）

* fix(antigravity): 修复 thinking signature 处理并实现 Auto 模式降级

问题分析：
1. 原先代码错误地禁用了 Claude via Vertex 的 thinkingConfig
2. 历史 thinking 块的 signature 被完全跳过，导致验证失败
3. 跨模型混用时 dummy signature 会导致 400 错误

修复内容：

**request_transformer.go**：
- 删除第 38-43 行的错误逻辑（禁用 thinkingConfig）
- 引入 thoughtSignatureMode（Preserve/Dummy）策略
- Claude 模式：透传真实 signature，过滤空/dummy
- Gemini 模式：使用 dummy signature
- 支持 signature-only thinking 块
- tool_use 的 signature 也透传

**antigravity_gateway_service.go**：
- 新增 isSignatureRelatedError() 检测 signature 相关错误
- 新增 stripThinkingFromClaudeRequest() 移除 thinking 块
- 实现 Auto 模式：检测 400 + signature 关键词时自动降级重试
- 重试时完全移除 thinking 配置和消息中的 thinking 块
- 最多重试一次，避免循环

**测试**：
- 更新并新增测试覆盖 Claude preserve/Gemini dummy 模式
- 新增 tool_use signature 处理测试
- 所有测试通过（6/6）

影响：
- ✅ Claude via Vertex 可以正常使用 thinking 功能
- ✅ 历史 signature 正确透传，避免验证失败
- ✅ 跨模型混用时自动过滤无效 signature
- ✅ 错误驱动降级，自动修复 signature 问题
- ✅ 不影响纯 Claude API 和其他渠道

参考：Codex 深度分析和实现建议

* fix(lint): 修复 gofmt 格式问题

* fix(antigravity): 修复 stripThinkingFromClaudeRequest 遗漏 untyped thinking blocks

问题：
- Codex 审查指出 stripThinkingFromClaudeRequest 只移除了 type="thinking" 的块
- 没有处理没有 type 字段的 thinking 对象（如 {"thinking": "...", "signature": "..."}）
- 导致重试时仍包含无效 thinking 块，上游 400 错误持续

修复：
- 添加检查：跳过没有 type 但有 thinking 字段的块
- 现在会移除两种格式：
  1. {"type": "thinking", "thinking": "...", "signature": "..."}
  2. {"thinking": "...", "signature": "..."}（untyped）

测试：所有测试通过

参考：Codex P1 审查意见
											
										
										
											2026-01-02 17:47:49 +08:00
+									}
-												perf(gateway): 优化负载感知调度

主要改进：
- 优化负载感知调度的准确性和响应速度
- 将 AccountUsageService 的包级缓存改为依赖注入
- 修复 SSE/JSON 转义和 nil 安全问题
- 恢复 Google One 功能兼容性

											
										
										
											2026-01-03 06:32:51 -08:00
+									// Check if thinking is enabled
 									thinkingEnabled := false
 									if thinking, ok := req["thinking"].(map[string]any); ok {
 										if thinkType, ok := thinking["type"].(string); ok && thinkType == "enabled" {
 											thinkingEnabled = true
 										}
 									}
-												Fix/multiple issues (#24)

* fix(gemini): 修复 google_one OAuth 配置和 scopes 问题

- 修复 google_one 类型在 ExchangeCode 和 RefreshToken 中使用内置客户端
- 添加 DefaultGoogleOneScopes，包含 generative-language 和 drive.readonly 权限
- 在 EffectiveOAuthConfig 中为 google_one 类型使用专门的 scopes
- 将 docker-compose.override.yml 重命名为 .example 并添加到 .gitignore
- 完善 docker-compose.override.yml.example 示例文档

解决问题：
1. google_one OAuth 授权后 API 调用返回 403 权限不足
2. 缺少访问 Gemini API 所需的 generative-language scope
3. 缺少获取 Drive 存储配额所需的 drive.readonly scope

* fix(antigravity): 完全跳过 Claude 模型的所有 thinking 块

问题分析：
- 当前代码尝试保留有 signature 的 thinking 块
- 但 Vertex AI 的 signature 是完整性令牌，无法在本地验证
- 导致 400 错误：Invalid signature in thinking block

根本原因：
1. thinking 功能已对非 Gemini 模型禁用 (isThinkingEnabled=false)
2. Vertex AI 要求原样重放 (thinking, signature) 对或完全不发送
3. 本地无法复制 Vertex 的加密验证逻辑

修复方案：
- 对 Claude 模型完全跳过所有 thinking 块（无论是否有 signature）
- 保持 Gemini 模型使用 dummy signature 的行为不变
- 更新测试用例以反映新的预期行为

影响：
- 消除 thinking 相关的 400 错误
- 与现有的 thinking 禁用策略保持一致
- 不影响 Gemini 模型的 thinking 功能

测试：
- ✅ TestBuildParts_ThinkingBlockWithoutSignature 全部通过
- ✅ TestBuildTools_CustomTypeTools 全部通过

参考：Codex review 建议

* fix(gateway): 修复 count_tokens 端点 400 错误

问题分析：
- count_tokens 请求包含 thinking 块时返回 400 错误
- 原因：thinking 块未被过滤，直接转发到上游 API
- 上游 API 拒绝无效的 thinking signature

根本原因：
1. /v1/messages 请求通过 TransformClaudeToGemini 过滤 thinking 块
2. count_tokens 请求绕过转换，直接转发原始请求体
3. 导致包含无效 signature 的 thinking 块被发送到上游

修复方案：
- 创建 FilterThinkingBlocks 工具函数
- 在 buildCountTokensRequest 中应用过滤（1 行修改）
- 与 /v1/messages 行为保持一致

实现细节：
- FilterThinkingBlocks: 解析 JSON，过滤 thinking 块，重新序列化
- 失败安全：解析/序列化失败时返回原始请求体
- 性能优化：仅在发现 thinking 块时重新序列化

测试：
- ✅ 6 个单元测试全部通过
- ✅ 覆盖正常过滤、无 thinking 块、无效 JSON 等场景
- ✅ 现有测试不受影响

影响：
- 消除 count_tokens 的 400 错误
- 不影响 Antigravity 账号（仍返回模拟响应）
- 适用于所有账号类型（OAuth、API Key）

文件修改：
- backend/internal/service/gateway_request.go: +62 行（新函数）
- backend/internal/service/gateway_service.go: +2 行（应用过滤）
- backend/internal/service/gateway_request_test.go: +62 行（测试）

* fix(gateway): 增强 thinking 块过滤逻辑

基于 Codex 分析和建议的改进：

问题分析：
- 新错误：signature: Field required（signature 字段缺失）
- 旧错误：Invalid signature（signature 存在但无效）
- 两者都说明 thinking 块在请求中是危险的

Codex 建议：
- 保持 Option A：完全跳过所有 thinking 块
- 原因：thinking 块应该是只输出的，除非有服务端来源证明
- 在无状态代理中，无法安全区分上游来源 vs 客户端注入

改进内容：

1. 增强 FilterThinkingBlocks 函数
   - 过滤显式的 thinking 块：{"type":"thinking", ...}
   - 过滤无 type 的 thinking 对象：{"thinking": {...}}
   - 保留 tool_use 等其他类型块中的 thinking 字段
   - 修复：只在实际过滤时更新 content 数组

2. 扩展过滤范围
   - 将 FilterThinkingBlocks 应用到 /v1/messages 主路径
   - 之前只应用于 count_tokens，现在两个端点都过滤
   - 防止所有端点的 thinking 相关 400 错误

3. 改进测试
   - 新增：过滤无 type discriminator 的 thinking 块
   - 新增：不过滤 tool_use 中的 thinking 字段
   - 使用 containsThinkingBlock 辅助函数验证

测试：
- ✅ 8 个测试用例全部通过
- ✅ 覆盖各种 thinking 块格式
- ✅ 确保不误伤其他类型的块

影响：
- 消除 signature required 和 invalid signature 错误
- 统一 /v1/messages 和 count_tokens 的行为
- 更健壮的 thinking 块检测逻辑

参考：Codex review 和代码改进

* refactor: 根据 Codex 审查建议进行代码优化

基于 Codex 代码审查的 P1 和 P2 改进：

P1 改进（重要问题）：

1. 优化日志输出
   - 移除 thinking 块跳过时的 log.Printf
   - 避免高频请求下的日志噪音
   - 添加注释说明可通过指标监控

2. 清理遗留代码
   - 删除未使用的 isValidThoughtSignature 函数（27行）
   - 该函数在改为完全跳过 thinking 块后不再需要

P2 改进（性能优化）：

3. 添加快速路径检查
   - 在 FilterThinkingBlocks 中添加 bytes.Contains 预检查
   - 如果请求体不包含 "thinking" 字符串，直接返回
   - 避免不必要的 JSON 解析，提升性能

技术细节：
- request_transformer.go: -27行（删除函数），+1行（优化注释）
- gateway_request.go: +5行（快速路径 + bytes 导入）

测试：
- ✅ TestBuildParts_ThinkingBlockWithoutSignature 全部通过
- ✅ TestFilterThinkingBlocks 全部通过（8个测试用例）

影响：
- 减少日志噪音
- 提升性能（快速路径）
- 代码更简洁（删除未使用代码）

参考：Codex 代码审查建议

* fix: 修复 golangci-lint 检查问题

- 格式化 gateway_request_test.go
- 使用 switch 语句替代 if-else 链（staticcheck QF1003）

* fix(antigravity): 修复 thinking signature 处理并实现 Auto 模式降级

问题分析：
1. 原先代码错误地禁用了 Claude via Vertex 的 thinkingConfig
2. 历史 thinking 块的 signature 被完全跳过，导致验证失败
3. 跨模型混用时 dummy signature 会导致 400 错误

修复内容：

**request_transformer.go**：
- 删除第 38-43 行的错误逻辑（禁用 thinkingConfig）
- 引入 thoughtSignatureMode（Preserve/Dummy）策略
- Claude 模式：透传真实 signature，过滤空/dummy
- Gemini 模式：使用 dummy signature
- 支持 signature-only thinking 块
- tool_use 的 signature 也透传

**antigravity_gateway_service.go**：
- 新增 isSignatureRelatedError() 检测 signature 相关错误
- 新增 stripThinkingFromClaudeRequest() 移除 thinking 块
- 实现 Auto 模式：检测 400 + signature 关键词时自动降级重试
- 重试时完全移除 thinking 配置和消息中的 thinking 块
- 最多重试一次，避免循环

**测试**：
- 更新并新增测试覆盖 Claude preserve/Gemini dummy 模式
- 新增 tool_use signature 处理测试
- 所有测试通过（6/6）

影响：
- ✅ Claude via Vertex 可以正常使用 thinking 功能
- ✅ 历史 signature 正确透传，避免验证失败
- ✅ 跨模型混用时自动过滤无效 signature
- ✅ 错误驱动降级，自动修复 signature 问题
- ✅ 不影响纯 Claude API 和其他渠道

参考：Codex 深度分析和实现建议

* fix(lint): 修复 gofmt 格式问题

* fix(antigravity): 修复 stripThinkingFromClaudeRequest 遗漏 untyped thinking blocks

问题：
- Codex 审查指出 stripThinkingFromClaudeRequest 只移除了 type="thinking" 的块
- 没有处理没有 type 字段的 thinking 对象（如 {"thinking": "...", "signature": "..."}）
- 导致重试时仍包含无效 thinking 块，上游 400 错误持续

修复：
- 添加检查：跳过没有 type 但有 thinking 字段的块
- 现在会移除两种格式：
  1. {"type": "thinking", "thinking": "...", "signature": "..."}
  2. {"thinking": "...", "signature": "..."}（untyped）

测试：所有测试通过

参考：Codex P1 审查意见
											
										
										
											2026-01-02 17:47:49 +08:00
+									messages, ok := req["messages"].([]any)
 									if !ok {
-												fix(thinking): 优化 thinking block 签名错误重试逻辑

- FilterThinkingBlocksForRetry: 将 thinking block 转换为 text block 而非直接删除
- stripThinkingFromClaudeRequest: Antigravity 网关同步采用转换策略
- 统一处理 thinking/redacted_thinking/无 type 字段的 thinking block
- 保留 thinking 内容，避免上下文丢失

											
										
										
											2026-01-03 17:07:54 -08:00
+										return body
-												Fix/multiple issues (#24)

* fix(gemini): 修复 google_one OAuth 配置和 scopes 问题

- 修复 google_one 类型在 ExchangeCode 和 RefreshToken 中使用内置客户端
- 添加 DefaultGoogleOneScopes，包含 generative-language 和 drive.readonly 权限
- 在 EffectiveOAuthConfig 中为 google_one 类型使用专门的 scopes
- 将 docker-compose.override.yml 重命名为 .example 并添加到 .gitignore
- 完善 docker-compose.override.yml.example 示例文档

解决问题：
1. google_one OAuth 授权后 API 调用返回 403 权限不足
2. 缺少访问 Gemini API 所需的 generative-language scope
3. 缺少获取 Drive 存储配额所需的 drive.readonly scope

* fix(antigravity): 完全跳过 Claude 模型的所有 thinking 块

问题分析：
- 当前代码尝试保留有 signature 的 thinking 块
- 但 Vertex AI 的 signature 是完整性令牌，无法在本地验证
- 导致 400 错误：Invalid signature in thinking block

根本原因：
1. thinking 功能已对非 Gemini 模型禁用 (isThinkingEnabled=false)
2. Vertex AI 要求原样重放 (thinking, signature) 对或完全不发送
3. 本地无法复制 Vertex 的加密验证逻辑

修复方案：
- 对 Claude 模型完全跳过所有 thinking 块（无论是否有 signature）
- 保持 Gemini 模型使用 dummy signature 的行为不变
- 更新测试用例以反映新的预期行为

影响：
- 消除 thinking 相关的 400 错误
- 与现有的 thinking 禁用策略保持一致
- 不影响 Gemini 模型的 thinking 功能

测试：
- ✅ TestBuildParts_ThinkingBlockWithoutSignature 全部通过
- ✅ TestBuildTools_CustomTypeTools 全部通过

参考：Codex review 建议

* fix(gateway): 修复 count_tokens 端点 400 错误

问题分析：
- count_tokens 请求包含 thinking 块时返回 400 错误
- 原因：thinking 块未被过滤，直接转发到上游 API
- 上游 API 拒绝无效的 thinking signature

根本原因：
1. /v1/messages 请求通过 TransformClaudeToGemini 过滤 thinking 块
2. count_tokens 请求绕过转换，直接转发原始请求体
3. 导致包含无效 signature 的 thinking 块被发送到上游

修复方案：
- 创建 FilterThinkingBlocks 工具函数
- 在 buildCountTokensRequest 中应用过滤（1 行修改）
- 与 /v1/messages 行为保持一致

实现细节：
- FilterThinkingBlocks: 解析 JSON，过滤 thinking 块，重新序列化
- 失败安全：解析/序列化失败时返回原始请求体
- 性能优化：仅在发现 thinking 块时重新序列化

测试：
- ✅ 6 个单元测试全部通过
- ✅ 覆盖正常过滤、无 thinking 块、无效 JSON 等场景
- ✅ 现有测试不受影响

影响：
- 消除 count_tokens 的 400 错误
- 不影响 Antigravity 账号（仍返回模拟响应）
- 适用于所有账号类型（OAuth、API Key）

文件修改：
- backend/internal/service/gateway_request.go: +62 行（新函数）
- backend/internal/service/gateway_service.go: +2 行（应用过滤）
- backend/internal/service/gateway_request_test.go: +62 行（测试）

* fix(gateway): 增强 thinking 块过滤逻辑

基于 Codex 分析和建议的改进：

问题分析：
- 新错误：signature: Field required（signature 字段缺失）
- 旧错误：Invalid signature（signature 存在但无效）
- 两者都说明 thinking 块在请求中是危险的

Codex 建议：
- 保持 Option A：完全跳过所有 thinking 块
- 原因：thinking 块应该是只输出的，除非有服务端来源证明
- 在无状态代理中，无法安全区分上游来源 vs 客户端注入

改进内容：

1. 增强 FilterThinkingBlocks 函数
   - 过滤显式的 thinking 块：{"type":"thinking", ...}
   - 过滤无 type 的 thinking 对象：{"thinking": {...}}
   - 保留 tool_use 等其他类型块中的 thinking 字段
   - 修复：只在实际过滤时更新 content 数组

2. 扩展过滤范围
   - 将 FilterThinkingBlocks 应用到 /v1/messages 主路径
   - 之前只应用于 count_tokens，现在两个端点都过滤
   - 防止所有端点的 thinking 相关 400 错误

3. 改进测试
   - 新增：过滤无 type discriminator 的 thinking 块
   - 新增：不过滤 tool_use 中的 thinking 字段
   - 使用 containsThinkingBlock 辅助函数验证

测试：
- ✅ 8 个测试用例全部通过
- ✅ 覆盖各种 thinking 块格式
- ✅ 确保不误伤其他类型的块

影响：
- 消除 signature required 和 invalid signature 错误
- 统一 /v1/messages 和 count_tokens 的行为
- 更健壮的 thinking 块检测逻辑

参考：Codex review 和代码改进

* refactor: 根据 Codex 审查建议进行代码优化

基于 Codex 代码审查的 P1 和 P2 改进：

P1 改进（重要问题）：

1. 优化日志输出
   - 移除 thinking 块跳过时的 log.Printf
   - 避免高频请求下的日志噪音
   - 添加注释说明可通过指标监控

2. 清理遗留代码
   - 删除未使用的 isValidThoughtSignature 函数（27行）
   - 该函数在改为完全跳过 thinking 块后不再需要

P2 改进（性能优化）：

3. 添加快速路径检查
   - 在 FilterThinkingBlocks 中添加 bytes.Contains 预检查
   - 如果请求体不包含 "thinking" 字符串，直接返回
   - 避免不必要的 JSON 解析，提升性能

技术细节：
- request_transformer.go: -27行（删除函数），+1行（优化注释）
- gateway_request.go: +5行（快速路径 + bytes 导入）

测试：
- ✅ TestBuildParts_ThinkingBlockWithoutSignature 全部通过
- ✅ TestFilterThinkingBlocks 全部通过（8个测试用例）

影响：
- 减少日志噪音
- 提升性能（快速路径）
- 代码更简洁（删除未使用代码）

参考：Codex 代码审查建议

* fix: 修复 golangci-lint 检查问题

- 格式化 gateway_request_test.go
- 使用 switch 语句替代 if-else 链（staticcheck QF1003）

* fix(antigravity): 修复 thinking signature 处理并实现 Auto 模式降级

问题分析：
1. 原先代码错误地禁用了 Claude via Vertex 的 thinkingConfig
2. 历史 thinking 块的 signature 被完全跳过，导致验证失败
3. 跨模型混用时 dummy signature 会导致 400 错误

修复内容：

**request_transformer.go**：
- 删除第 38-43 行的错误逻辑（禁用 thinkingConfig）
- 引入 thoughtSignatureMode（Preserve/Dummy）策略
- Claude 模式：透传真实 signature，过滤空/dummy
- Gemini 模式：使用 dummy signature
- 支持 signature-only thinking 块
- tool_use 的 signature 也透传

**antigravity_gateway_service.go**：
- 新增 isSignatureRelatedError() 检测 signature 相关错误
- 新增 stripThinkingFromClaudeRequest() 移除 thinking 块
- 实现 Auto 模式：检测 400 + signature 关键词时自动降级重试
- 重试时完全移除 thinking 配置和消息中的 thinking 块
- 最多重试一次，避免循环

**测试**：
- 更新并新增测试覆盖 Claude preserve/Gemini dummy 模式
- 新增 tool_use signature 处理测试
- 所有测试通过（6/6）

影响：
- ✅ Claude via Vertex 可以正常使用 thinking 功能
- ✅ 历史 signature 正确透传，避免验证失败
- ✅ 跨模型混用时自动过滤无效 signature
- ✅ 错误驱动降级，自动修复 signature 问题
- ✅ 不影响纯 Claude API 和其他渠道

参考：Codex 深度分析和实现建议

* fix(lint): 修复 gofmt 格式问题

* fix(antigravity): 修复 stripThinkingFromClaudeRequest 遗漏 untyped thinking blocks

问题：
- Codex 审查指出 stripThinkingFromClaudeRequest 只移除了 type="thinking" 的块
- 没有处理没有 type 字段的 thinking 对象（如 {"thinking": "...", "signature": "..."}）
- 导致重试时仍包含无效 thinking 块，上游 400 错误持续

修复：
- 添加检查：跳过没有 type 但有 thinking 字段的块
- 现在会移除两种格式：
  1. {"type": "thinking", "thinking": "...", "signature": "..."}
  2. {"thinking": "...", "signature": "..."}（untyped）

测试：所有测试通过

参考：Codex P1 审查意见
											
										
										
											2026-01-02 17:47:49 +08:00
+									}
 									filtered := false
 									for _, msg := range messages {
 										msgMap, ok := msg.(map[string]any)
 										if !ok {
 											continue
 										}
-												perf(gateway): 优化负载感知调度

主要改进：
- 优化负载感知调度的准确性和响应速度
- 将 AccountUsageService 的包级缓存改为依赖注入
- 修复 SSE/JSON 转义和 nil 安全问题
- 恢复 Google One 功能兼容性

											
										
										
											2026-01-03 06:32:51 -08:00
+										role, _ := msgMap["role"].(string)
-												Fix/multiple issues (#24)

* fix(gemini): 修复 google_one OAuth 配置和 scopes 问题

- 修复 google_one 类型在 ExchangeCode 和 RefreshToken 中使用内置客户端
- 添加 DefaultGoogleOneScopes，包含 generative-language 和 drive.readonly 权限
- 在 EffectiveOAuthConfig 中为 google_one 类型使用专门的 scopes
- 将 docker-compose.override.yml 重命名为 .example 并添加到 .gitignore
- 完善 docker-compose.override.yml.example 示例文档

解决问题：
1. google_one OAuth 授权后 API 调用返回 403 权限不足
2. 缺少访问 Gemini API 所需的 generative-language scope
3. 缺少获取 Drive 存储配额所需的 drive.readonly scope

* fix(antigravity): 完全跳过 Claude 模型的所有 thinking 块

问题分析：
- 当前代码尝试保留有 signature 的 thinking 块
- 但 Vertex AI 的 signature 是完整性令牌，无法在本地验证
- 导致 400 错误：Invalid signature in thinking block

根本原因：
1. thinking 功能已对非 Gemini 模型禁用 (isThinkingEnabled=false)
2. Vertex AI 要求原样重放 (thinking, signature) 对或完全不发送
3. 本地无法复制 Vertex 的加密验证逻辑

修复方案：
- 对 Claude 模型完全跳过所有 thinking 块（无论是否有 signature）
- 保持 Gemini 模型使用 dummy signature 的行为不变
- 更新测试用例以反映新的预期行为

影响：
- 消除 thinking 相关的 400 错误
- 与现有的 thinking 禁用策略保持一致
- 不影响 Gemini 模型的 thinking 功能

测试：
- ✅ TestBuildParts_ThinkingBlockWithoutSignature 全部通过
- ✅ TestBuildTools_CustomTypeTools 全部通过

参考：Codex review 建议

* fix(gateway): 修复 count_tokens 端点 400 错误

问题分析：
- count_tokens 请求包含 thinking 块时返回 400 错误
- 原因：thinking 块未被过滤，直接转发到上游 API
- 上游 API 拒绝无效的 thinking signature

根本原因：
1. /v1/messages 请求通过 TransformClaudeToGemini 过滤 thinking 块
2. count_tokens 请求绕过转换，直接转发原始请求体
3. 导致包含无效 signature 的 thinking 块被发送到上游

修复方案：
- 创建 FilterThinkingBlocks 工具函数
- 在 buildCountTokensRequest 中应用过滤（1 行修改）
- 与 /v1/messages 行为保持一致

实现细节：
- FilterThinkingBlocks: 解析 JSON，过滤 thinking 块，重新序列化
- 失败安全：解析/序列化失败时返回原始请求体
- 性能优化：仅在发现 thinking 块时重新序列化

测试：
- ✅ 6 个单元测试全部通过
- ✅ 覆盖正常过滤、无 thinking 块、无效 JSON 等场景
- ✅ 现有测试不受影响

影响：
- 消除 count_tokens 的 400 错误
- 不影响 Antigravity 账号（仍返回模拟响应）
- 适用于所有账号类型（OAuth、API Key）

文件修改：
- backend/internal/service/gateway_request.go: +62 行（新函数）
- backend/internal/service/gateway_service.go: +2 行（应用过滤）
- backend/internal/service/gateway_request_test.go: +62 行（测试）

* fix(gateway): 增强 thinking 块过滤逻辑

基于 Codex 分析和建议的改进：

问题分析：
- 新错误：signature: Field required（signature 字段缺失）
- 旧错误：Invalid signature（signature 存在但无效）
- 两者都说明 thinking 块在请求中是危险的

Codex 建议：
- 保持 Option A：完全跳过所有 thinking 块
- 原因：thinking 块应该是只输出的，除非有服务端来源证明
- 在无状态代理中，无法安全区分上游来源 vs 客户端注入

改进内容：

1. 增强 FilterThinkingBlocks 函数
   - 过滤显式的 thinking 块：{"type":"thinking", ...}
   - 过滤无 type 的 thinking 对象：{"thinking": {...}}
   - 保留 tool_use 等其他类型块中的 thinking 字段
   - 修复：只在实际过滤时更新 content 数组

2. 扩展过滤范围
   - 将 FilterThinkingBlocks 应用到 /v1/messages 主路径
   - 之前只应用于 count_tokens，现在两个端点都过滤
   - 防止所有端点的 thinking 相关 400 错误

3. 改进测试
   - 新增：过滤无 type discriminator 的 thinking 块
   - 新增：不过滤 tool_use 中的 thinking 字段
   - 使用 containsThinkingBlock 辅助函数验证

测试：
- ✅ 8 个测试用例全部通过
- ✅ 覆盖各种 thinking 块格式
- ✅ 确保不误伤其他类型的块

影响：
- 消除 signature required 和 invalid signature 错误
- 统一 /v1/messages 和 count_tokens 的行为
- 更健壮的 thinking 块检测逻辑

参考：Codex review 和代码改进

* refactor: 根据 Codex 审查建议进行代码优化

基于 Codex 代码审查的 P1 和 P2 改进：

P1 改进（重要问题）：

1. 优化日志输出
   - 移除 thinking 块跳过时的 log.Printf
   - 避免高频请求下的日志噪音
   - 添加注释说明可通过指标监控

2. 清理遗留代码
   - 删除未使用的 isValidThoughtSignature 函数（27行）
   - 该函数在改为完全跳过 thinking 块后不再需要

P2 改进（性能优化）：

3. 添加快速路径检查
   - 在 FilterThinkingBlocks 中添加 bytes.Contains 预检查
   - 如果请求体不包含 "thinking" 字符串，直接返回
   - 避免不必要的 JSON 解析，提升性能

技术细节：
- request_transformer.go: -27行（删除函数），+1行（优化注释）
- gateway_request.go: +5行（快速路径 + bytes 导入）

测试：
- ✅ TestBuildParts_ThinkingBlockWithoutSignature 全部通过
- ✅ TestFilterThinkingBlocks 全部通过（8个测试用例）

影响：
- 减少日志噪音
- 提升性能（快速路径）
- 代码更简洁（删除未使用代码）

参考：Codex 代码审查建议

* fix: 修复 golangci-lint 检查问题

- 格式化 gateway_request_test.go
- 使用 switch 语句替代 if-else 链（staticcheck QF1003）

* fix(antigravity): 修复 thinking signature 处理并实现 Auto 模式降级

问题分析：
1. 原先代码错误地禁用了 Claude via Vertex 的 thinkingConfig
2. 历史 thinking 块的 signature 被完全跳过，导致验证失败
3. 跨模型混用时 dummy signature 会导致 400 错误

修复内容：

**request_transformer.go**：
- 删除第 38-43 行的错误逻辑（禁用 thinkingConfig）
- 引入 thoughtSignatureMode（Preserve/Dummy）策略
- Claude 模式：透传真实 signature，过滤空/dummy
- Gemini 模式：使用 dummy signature
- 支持 signature-only thinking 块
- tool_use 的 signature 也透传

**antigravity_gateway_service.go**：
- 新增 isSignatureRelatedError() 检测 signature 相关错误
- 新增 stripThinkingFromClaudeRequest() 移除 thinking 块
- 实现 Auto 模式：检测 400 + signature 关键词时自动降级重试
- 重试时完全移除 thinking 配置和消息中的 thinking 块
- 最多重试一次，避免循环

**测试**：
- 更新并新增测试覆盖 Claude preserve/Gemini dummy 模式
- 新增 tool_use signature 处理测试
- 所有测试通过（6/6）

影响：
- ✅ Claude via Vertex 可以正常使用 thinking 功能
- ✅ 历史 signature 正确透传，避免验证失败
- ✅ 跨模型混用时自动过滤无效 signature
- ✅ 错误驱动降级，自动修复 signature 问题
- ✅ 不影响纯 Claude API 和其他渠道

参考：Codex 深度分析和实现建议

* fix(lint): 修复 gofmt 格式问题

* fix(antigravity): 修复 stripThinkingFromClaudeRequest 遗漏 untyped thinking blocks

问题：
- Codex 审查指出 stripThinkingFromClaudeRequest 只移除了 type="thinking" 的块
- 没有处理没有 type 字段的 thinking 对象（如 {"thinking": "...", "signature": "..."}）
- 导致重试时仍包含无效 thinking 块，上游 400 错误持续

修复：
- 添加检查：跳过没有 type 但有 thinking 字段的块
- 现在会移除两种格式：
  1. {"type": "thinking", "thinking": "...", "signature": "..."}
  2. {"thinking": "...", "signature": "..."}（untyped）

测试：所有测试通过

参考：Codex P1 审查意见
											
										
										
											2026-01-02 17:47:49 +08:00
+										content, ok := msgMap["content"].([]any)
 										if !ok {
 											continue
 										}
 										newContent := make([]any, 0, len(content))
 										filteredThisMessage := false
-												perf(gateway): 优化负载感知调度

主要改进：
- 优化负载感知调度的准确性和响应速度
- 将 AccountUsageService 的包级缓存改为依赖注入
- 修复 SSE/JSON 转义和 nil 安全问题
- 恢复 Google One 功能兼容性

											
										
										
											2026-01-03 06:32:51 -08:00
-												Fix/multiple issues (#24)

* fix(gemini): 修复 google_one OAuth 配置和 scopes 问题

- 修复 google_one 类型在 ExchangeCode 和 RefreshToken 中使用内置客户端
- 添加 DefaultGoogleOneScopes，包含 generative-language 和 drive.readonly 权限
- 在 EffectiveOAuthConfig 中为 google_one 类型使用专门的 scopes
- 将 docker-compose.override.yml 重命名为 .example 并添加到 .gitignore
- 完善 docker-compose.override.yml.example 示例文档

解决问题：
1. google_one OAuth 授权后 API 调用返回 403 权限不足
2. 缺少访问 Gemini API 所需的 generative-language scope
3. 缺少获取 Drive 存储配额所需的 drive.readonly scope

* fix(antigravity): 完全跳过 Claude 模型的所有 thinking 块

问题分析：
- 当前代码尝试保留有 signature 的 thinking 块
- 但 Vertex AI 的 signature 是完整性令牌，无法在本地验证
- 导致 400 错误：Invalid signature in thinking block

根本原因：
1. thinking 功能已对非 Gemini 模型禁用 (isThinkingEnabled=false)
2. Vertex AI 要求原样重放 (thinking, signature) 对或完全不发送
3. 本地无法复制 Vertex 的加密验证逻辑

修复方案：
- 对 Claude 模型完全跳过所有 thinking 块（无论是否有 signature）
- 保持 Gemini 模型使用 dummy signature 的行为不变
- 更新测试用例以反映新的预期行为

影响：
- 消除 thinking 相关的 400 错误
- 与现有的 thinking 禁用策略保持一致
- 不影响 Gemini 模型的 thinking 功能

测试：
- ✅ TestBuildParts_ThinkingBlockWithoutSignature 全部通过
- ✅ TestBuildTools_CustomTypeTools 全部通过

参考：Codex review 建议

* fix(gateway): 修复 count_tokens 端点 400 错误

问题分析：
- count_tokens 请求包含 thinking 块时返回 400 错误
- 原因：thinking 块未被过滤，直接转发到上游 API
- 上游 API 拒绝无效的 thinking signature

根本原因：
1. /v1/messages 请求通过 TransformClaudeToGemini 过滤 thinking 块
2. count_tokens 请求绕过转换，直接转发原始请求体
3. 导致包含无效 signature 的 thinking 块被发送到上游

修复方案：
- 创建 FilterThinkingBlocks 工具函数
- 在 buildCountTokensRequest 中应用过滤（1 行修改）
- 与 /v1/messages 行为保持一致

实现细节：
- FilterThinkingBlocks: 解析 JSON，过滤 thinking 块，重新序列化
- 失败安全：解析/序列化失败时返回原始请求体
- 性能优化：仅在发现 thinking 块时重新序列化

测试：
- ✅ 6 个单元测试全部通过
- ✅ 覆盖正常过滤、无 thinking 块、无效 JSON 等场景
- ✅ 现有测试不受影响

影响：
- 消除 count_tokens 的 400 错误
- 不影响 Antigravity 账号（仍返回模拟响应）
- 适用于所有账号类型（OAuth、API Key）

文件修改：
- backend/internal/service/gateway_request.go: +62 行（新函数）
- backend/internal/service/gateway_service.go: +2 行（应用过滤）
- backend/internal/service/gateway_request_test.go: +62 行（测试）

* fix(gateway): 增强 thinking 块过滤逻辑

基于 Codex 分析和建议的改进：

问题分析：
- 新错误：signature: Field required（signature 字段缺失）
- 旧错误：Invalid signature（signature 存在但无效）
- 两者都说明 thinking 块在请求中是危险的

Codex 建议：
- 保持 Option A：完全跳过所有 thinking 块
- 原因：thinking 块应该是只输出的，除非有服务端来源证明
- 在无状态代理中，无法安全区分上游来源 vs 客户端注入

改进内容：

1. 增强 FilterThinkingBlocks 函数
   - 过滤显式的 thinking 块：{"type":"thinking", ...}
   - 过滤无 type 的 thinking 对象：{"thinking": {...}}
   - 保留 tool_use 等其他类型块中的 thinking 字段
   - 修复：只在实际过滤时更新 content 数组

2. 扩展过滤范围
   - 将 FilterThinkingBlocks 应用到 /v1/messages 主路径
   - 之前只应用于 count_tokens，现在两个端点都过滤
   - 防止所有端点的 thinking 相关 400 错误

3. 改进测试
   - 新增：过滤无 type discriminator 的 thinking 块
   - 新增：不过滤 tool_use 中的 thinking 字段
   - 使用 containsThinkingBlock 辅助函数验证

测试：
- ✅ 8 个测试用例全部通过
- ✅ 覆盖各种 thinking 块格式
- ✅ 确保不误伤其他类型的块

影响：
- 消除 signature required 和 invalid signature 错误
- 统一 /v1/messages 和 count_tokens 的行为
- 更健壮的 thinking 块检测逻辑

参考：Codex review 和代码改进

* refactor: 根据 Codex 审查建议进行代码优化

基于 Codex 代码审查的 P1 和 P2 改进：

P1 改进（重要问题）：

1. 优化日志输出
   - 移除 thinking 块跳过时的 log.Printf
   - 避免高频请求下的日志噪音
   - 添加注释说明可通过指标监控

2. 清理遗留代码
   - 删除未使用的 isValidThoughtSignature 函数（27行）
   - 该函数在改为完全跳过 thinking 块后不再需要

P2 改进（性能优化）：

3. 添加快速路径检查
   - 在 FilterThinkingBlocks 中添加 bytes.Contains 预检查
   - 如果请求体不包含 "thinking" 字符串，直接返回
   - 避免不必要的 JSON 解析，提升性能

技术细节：
- request_transformer.go: -27行（删除函数），+1行（优化注释）
- gateway_request.go: +5行（快速路径 + bytes 导入）

测试：
- ✅ TestBuildParts_ThinkingBlockWithoutSignature 全部通过
- ✅ TestFilterThinkingBlocks 全部通过（8个测试用例）

影响：
- 减少日志噪音
- 提升性能（快速路径）
- 代码更简洁（删除未使用代码）

参考：Codex 代码审查建议

* fix: 修复 golangci-lint 检查问题

- 格式化 gateway_request_test.go
- 使用 switch 语句替代 if-else 链（staticcheck QF1003）

* fix(antigravity): 修复 thinking signature 处理并实现 Auto 模式降级

问题分析：
1. 原先代码错误地禁用了 Claude via Vertex 的 thinkingConfig
2. 历史 thinking 块的 signature 被完全跳过，导致验证失败
3. 跨模型混用时 dummy signature 会导致 400 错误

修复内容：

**request_transformer.go**：
- 删除第 38-43 行的错误逻辑（禁用 thinkingConfig）
- 引入 thoughtSignatureMode（Preserve/Dummy）策略
- Claude 模式：透传真实 signature，过滤空/dummy
- Gemini 模式：使用 dummy signature
- 支持 signature-only thinking 块
- tool_use 的 signature 也透传

**antigravity_gateway_service.go**：
- 新增 isSignatureRelatedError() 检测 signature 相关错误
- 新增 stripThinkingFromClaudeRequest() 移除 thinking 块
- 实现 Auto 模式：检测 400 + signature 关键词时自动降级重试
- 重试时完全移除 thinking 配置和消息中的 thinking 块
- 最多重试一次，避免循环

**测试**：
- 更新并新增测试覆盖 Claude preserve/Gemini dummy 模式
- 新增 tool_use signature 处理测试
- 所有测试通过（6/6）

影响：
- ✅ Claude via Vertex 可以正常使用 thinking 功能
- ✅ 历史 signature 正确透传，避免验证失败
- ✅ 跨模型混用时自动过滤无效 signature
- ✅ 错误驱动降级，自动修复 signature 问题
- ✅ 不影响纯 Claude API 和其他渠道

参考：Codex 深度分析和实现建议

* fix(lint): 修复 gofmt 格式问题

* fix(antigravity): 修复 stripThinkingFromClaudeRequest 遗漏 untyped thinking blocks

问题：
- Codex 审查指出 stripThinkingFromClaudeRequest 只移除了 type="thinking" 的块
- 没有处理没有 type 字段的 thinking 对象（如 {"thinking": "...", "signature": "..."}）
- 导致重试时仍包含无效 thinking 块，上游 400 错误持续

修复：
- 添加检查：跳过没有 type 但有 thinking 字段的块
- 现在会移除两种格式：
  1. {"type": "thinking", "thinking": "...", "signature": "..."}
  2. {"thinking": "...", "signature": "..."}（untyped）

测试：所有测试通过

参考：Codex P1 审查意见
											
										
										
											2026-01-02 17:47:49 +08:00
+										for _, block := range content {
 											blockMap, ok := block.(map[string]any)
 											if !ok {
 												newContent = append(newContent, block)
 												continue
 											}
 											blockType, _ := blockMap["type"].(string)
-												perf(gateway): 优化负载感知调度

主要改进：
- 优化负载感知调度的准确性和响应速度
- 将 AccountUsageService 的包级缓存改为依赖注入
- 修复 SSE/JSON 转义和 nil 安全问题
- 恢复 Google One 功能兼容性

											
										
										
											2026-01-03 06:32:51 -08:00
 											if blockType == "thinking" || blockType == "redacted_thinking" {
 												// When thinking is enabled and this is an assistant message,
-												fix(thinking): 优化 thinking block 签名错误重试逻辑

- FilterThinkingBlocksForRetry: 将 thinking block 转换为 text block 而非直接删除
- stripThinkingFromClaudeRequest: Antigravity 网关同步采用转换策略
- 统一处理 thinking/redacted_thinking/无 type 字段的 thinking block
- 保留 thinking 内容，避免上下文丢失

											
										
										
											2026-01-03 17:07:54 -08:00
+												// only keep thinking blocks with valid signatures
-												perf(gateway): 优化负载感知调度

主要改进：
- 优化负载感知调度的准确性和响应速度
- 将 AccountUsageService 的包级缓存改为依赖注入
- 修复 SSE/JSON 转义和 nil 安全问题
- 恢复 Google One 功能兼容性

											
										
										
											2026-01-03 06:32:51 -08:00
+												if thinkingEnabled && role == "assistant" {
 													signature, _ := blockMap["signature"].(string)
 													if signature != "" && signature != "skip_thought_signature_validator" {
 														newContent = append(newContent, block)
 														continue
 													}
 												}
-												Fix/multiple issues (#24)

* fix(gemini): 修复 google_one OAuth 配置和 scopes 问题

- 修复 google_one 类型在 ExchangeCode 和 RefreshToken 中使用内置客户端
- 添加 DefaultGoogleOneScopes，包含 generative-language 和 drive.readonly 权限
- 在 EffectiveOAuthConfig 中为 google_one 类型使用专门的 scopes
- 将 docker-compose.override.yml 重命名为 .example 并添加到 .gitignore
- 完善 docker-compose.override.yml.example 示例文档

解决问题：
1. google_one OAuth 授权后 API 调用返回 403 权限不足
2. 缺少访问 Gemini API 所需的 generative-language scope
3. 缺少获取 Drive 存储配额所需的 drive.readonly scope

* fix(antigravity): 完全跳过 Claude 模型的所有 thinking 块

问题分析：
- 当前代码尝试保留有 signature 的 thinking 块
- 但 Vertex AI 的 signature 是完整性令牌，无法在本地验证
- 导致 400 错误：Invalid signature in thinking block

根本原因：
1. thinking 功能已对非 Gemini 模型禁用 (isThinkingEnabled=false)
2. Vertex AI 要求原样重放 (thinking, signature) 对或完全不发送
3. 本地无法复制 Vertex 的加密验证逻辑

修复方案：
- 对 Claude 模型完全跳过所有 thinking 块（无论是否有 signature）
- 保持 Gemini 模型使用 dummy signature 的行为不变
- 更新测试用例以反映新的预期行为

影响：
- 消除 thinking 相关的 400 错误
- 与现有的 thinking 禁用策略保持一致
- 不影响 Gemini 模型的 thinking 功能

测试：
- ✅ TestBuildParts_ThinkingBlockWithoutSignature 全部通过
- ✅ TestBuildTools_CustomTypeTools 全部通过

参考：Codex review 建议

* fix(gateway): 修复 count_tokens 端点 400 错误

问题分析：
- count_tokens 请求包含 thinking 块时返回 400 错误
- 原因：thinking 块未被过滤，直接转发到上游 API
- 上游 API 拒绝无效的 thinking signature

根本原因：
1. /v1/messages 请求通过 TransformClaudeToGemini 过滤 thinking 块
2. count_tokens 请求绕过转换，直接转发原始请求体
3. 导致包含无效 signature 的 thinking 块被发送到上游

修复方案：
- 创建 FilterThinkingBlocks 工具函数
- 在 buildCountTokensRequest 中应用过滤（1 行修改）
- 与 /v1/messages 行为保持一致

实现细节：
- FilterThinkingBlocks: 解析 JSON，过滤 thinking 块，重新序列化
- 失败安全：解析/序列化失败时返回原始请求体
- 性能优化：仅在发现 thinking 块时重新序列化

测试：
- ✅ 6 个单元测试全部通过
- ✅ 覆盖正常过滤、无 thinking 块、无效 JSON 等场景
- ✅ 现有测试不受影响

影响：
- 消除 count_tokens 的 400 错误
- 不影响 Antigravity 账号（仍返回模拟响应）
- 适用于所有账号类型（OAuth、API Key）

文件修改：
- backend/internal/service/gateway_request.go: +62 行（新函数）
- backend/internal/service/gateway_service.go: +2 行（应用过滤）
- backend/internal/service/gateway_request_test.go: +62 行（测试）

* fix(gateway): 增强 thinking 块过滤逻辑

基于 Codex 分析和建议的改进：

问题分析：
- 新错误：signature: Field required（signature 字段缺失）
- 旧错误：Invalid signature（signature 存在但无效）
- 两者都说明 thinking 块在请求中是危险的

Codex 建议：
- 保持 Option A：完全跳过所有 thinking 块
- 原因：thinking 块应该是只输出的，除非有服务端来源证明
- 在无状态代理中，无法安全区分上游来源 vs 客户端注入

改进内容：

1. 增强 FilterThinkingBlocks 函数
   - 过滤显式的 thinking 块：{"type":"thinking", ...}
   - 过滤无 type 的 thinking 对象：{"thinking": {...}}
   - 保留 tool_use 等其他类型块中的 thinking 字段
   - 修复：只在实际过滤时更新 content 数组

2. 扩展过滤范围
   - 将 FilterThinkingBlocks 应用到 /v1/messages 主路径
   - 之前只应用于 count_tokens，现在两个端点都过滤
   - 防止所有端点的 thinking 相关 400 错误

3. 改进测试
   - 新增：过滤无 type discriminator 的 thinking 块
   - 新增：不过滤 tool_use 中的 thinking 字段
   - 使用 containsThinkingBlock 辅助函数验证

测试：
- ✅ 8 个测试用例全部通过
- ✅ 覆盖各种 thinking 块格式
- ✅ 确保不误伤其他类型的块

影响：
- 消除 signature required 和 invalid signature 错误
- 统一 /v1/messages 和 count_tokens 的行为
- 更健壮的 thinking 块检测逻辑

参考：Codex review 和代码改进

* refactor: 根据 Codex 审查建议进行代码优化

基于 Codex 代码审查的 P1 和 P2 改进：

P1 改进（重要问题）：

1. 优化日志输出
   - 移除 thinking 块跳过时的 log.Printf
   - 避免高频请求下的日志噪音
   - 添加注释说明可通过指标监控

2. 清理遗留代码
   - 删除未使用的 isValidThoughtSignature 函数（27行）
   - 该函数在改为完全跳过 thinking 块后不再需要

P2 改进（性能优化）：

3. 添加快速路径检查
   - 在 FilterThinkingBlocks 中添加 bytes.Contains 预检查
   - 如果请求体不包含 "thinking" 字符串，直接返回
   - 避免不必要的 JSON 解析，提升性能

技术细节：
- request_transformer.go: -27行（删除函数），+1行（优化注释）
- gateway_request.go: +5行（快速路径 + bytes 导入）

测试：
- ✅ TestBuildParts_ThinkingBlockWithoutSignature 全部通过
- ✅ TestFilterThinkingBlocks 全部通过（8个测试用例）

影响：
- 减少日志噪音
- 提升性能（快速路径）
- 代码更简洁（删除未使用代码）

参考：Codex 代码审查建议

* fix: 修复 golangci-lint 检查问题

- 格式化 gateway_request_test.go
- 使用 switch 语句替代 if-else 链（staticcheck QF1003）

* fix(antigravity): 修复 thinking signature 处理并实现 Auto 模式降级

问题分析：
1. 原先代码错误地禁用了 Claude via Vertex 的 thinkingConfig
2. 历史 thinking 块的 signature 被完全跳过，导致验证失败
3. 跨模型混用时 dummy signature 会导致 400 错误

修复内容：

**request_transformer.go**：
- 删除第 38-43 行的错误逻辑（禁用 thinkingConfig）
- 引入 thoughtSignatureMode（Preserve/Dummy）策略
- Claude 模式：透传真实 signature，过滤空/dummy
- Gemini 模式：使用 dummy signature
- 支持 signature-only thinking 块
- tool_use 的 signature 也透传

**antigravity_gateway_service.go**：
- 新增 isSignatureRelatedError() 检测 signature 相关错误
- 新增 stripThinkingFromClaudeRequest() 移除 thinking 块
- 实现 Auto 模式：检测 400 + signature 关键词时自动降级重试
- 重试时完全移除 thinking 配置和消息中的 thinking 块
- 最多重试一次，避免循环

**测试**：
- 更新并新增测试覆盖 Claude preserve/Gemini dummy 模式
- 新增 tool_use signature 处理测试
- 所有测试通过（6/6）

影响：
- ✅ Claude via Vertex 可以正常使用 thinking 功能
- ✅ 历史 signature 正确透传，避免验证失败
- ✅ 跨模型混用时自动过滤无效 signature
- ✅ 错误驱动降级，自动修复 signature 问题
- ✅ 不影响纯 Claude API 和其他渠道

参考：Codex 深度分析和实现建议

* fix(lint): 修复 gofmt 格式问题

* fix(antigravity): 修复 stripThinkingFromClaudeRequest 遗漏 untyped thinking blocks

问题：
- Codex 审查指出 stripThinkingFromClaudeRequest 只移除了 type="thinking" 的块
- 没有处理没有 type 字段的 thinking 对象（如 {"thinking": "...", "signature": "..."}）
- 导致重试时仍包含无效 thinking 块，上游 400 错误持续

修复：
- 添加检查：跳过没有 type 但有 thinking 字段的块
- 现在会移除两种格式：
  1. {"type": "thinking", "thinking": "...", "signature": "..."}
  2. {"thinking": "...", "signature": "..."}（untyped）

测试：所有测试通过

参考：Codex P1 审查意见
											
										
										
											2026-01-02 17:47:49 +08:00
+												filtered = true
 												filteredThisMessage = true
-												perf(gateway): 优化负载感知调度

主要改进：
- 优化负载感知调度的准确性和响应速度
- 将 AccountUsageService 的包级缓存改为依赖注入
- 修复 SSE/JSON 转义和 nil 安全问题
- 恢复 Google One 功能兼容性

											
										
										
											2026-01-03 06:32:51 -08:00
+												continue
-												Fix/multiple issues (#24)

* fix(gemini): 修复 google_one OAuth 配置和 scopes 问题

- 修复 google_one 类型在 ExchangeCode 和 RefreshToken 中使用内置客户端
- 添加 DefaultGoogleOneScopes，包含 generative-language 和 drive.readonly 权限
- 在 EffectiveOAuthConfig 中为 google_one 类型使用专门的 scopes
- 将 docker-compose.override.yml 重命名为 .example 并添加到 .gitignore
- 完善 docker-compose.override.yml.example 示例文档

解决问题：
1. google_one OAuth 授权后 API 调用返回 403 权限不足
2. 缺少访问 Gemini API 所需的 generative-language scope
3. 缺少获取 Drive 存储配额所需的 drive.readonly scope

* fix(antigravity): 完全跳过 Claude 模型的所有 thinking 块

问题分析：
- 当前代码尝试保留有 signature 的 thinking 块
- 但 Vertex AI 的 signature 是完整性令牌，无法在本地验证
- 导致 400 错误：Invalid signature in thinking block

根本原因：
1. thinking 功能已对非 Gemini 模型禁用 (isThinkingEnabled=false)
2. Vertex AI 要求原样重放 (thinking, signature) 对或完全不发送
3. 本地无法复制 Vertex 的加密验证逻辑

修复方案：
- 对 Claude 模型完全跳过所有 thinking 块（无论是否有 signature）
- 保持 Gemini 模型使用 dummy signature 的行为不变
- 更新测试用例以反映新的预期行为

影响：
- 消除 thinking 相关的 400 错误
- 与现有的 thinking 禁用策略保持一致
- 不影响 Gemini 模型的 thinking 功能

测试：
- ✅ TestBuildParts_ThinkingBlockWithoutSignature 全部通过
- ✅ TestBuildTools_CustomTypeTools 全部通过

参考：Codex review 建议

* fix(gateway): 修复 count_tokens 端点 400 错误

问题分析：
- count_tokens 请求包含 thinking 块时返回 400 错误
- 原因：thinking 块未被过滤，直接转发到上游 API
- 上游 API 拒绝无效的 thinking signature

根本原因：
1. /v1/messages 请求通过 TransformClaudeToGemini 过滤 thinking 块
2. count_tokens 请求绕过转换，直接转发原始请求体
3. 导致包含无效 signature 的 thinking 块被发送到上游

修复方案：
- 创建 FilterThinkingBlocks 工具函数
- 在 buildCountTokensRequest 中应用过滤（1 行修改）
- 与 /v1/messages 行为保持一致

实现细节：
- FilterThinkingBlocks: 解析 JSON，过滤 thinking 块，重新序列化
- 失败安全：解析/序列化失败时返回原始请求体
- 性能优化：仅在发现 thinking 块时重新序列化

测试：
- ✅ 6 个单元测试全部通过
- ✅ 覆盖正常过滤、无 thinking 块、无效 JSON 等场景
- ✅ 现有测试不受影响

影响：
- 消除 count_tokens 的 400 错误
- 不影响 Antigravity 账号（仍返回模拟响应）
- 适用于所有账号类型（OAuth、API Key）

文件修改：
- backend/internal/service/gateway_request.go: +62 行（新函数）
- backend/internal/service/gateway_service.go: +2 行（应用过滤）
- backend/internal/service/gateway_request_test.go: +62 行（测试）

* fix(gateway): 增强 thinking 块过滤逻辑

基于 Codex 分析和建议的改进：

问题分析：
- 新错误：signature: Field required（signature 字段缺失）
- 旧错误：Invalid signature（signature 存在但无效）
- 两者都说明 thinking 块在请求中是危险的

Codex 建议：
- 保持 Option A：完全跳过所有 thinking 块
- 原因：thinking 块应该是只输出的，除非有服务端来源证明
- 在无状态代理中，无法安全区分上游来源 vs 客户端注入

改进内容：

1. 增强 FilterThinkingBlocks 函数
   - 过滤显式的 thinking 块：{"type":"thinking", ...}
   - 过滤无 type 的 thinking 对象：{"thinking": {...}}
   - 保留 tool_use 等其他类型块中的 thinking 字段
   - 修复：只在实际过滤时更新 content 数组

2. 扩展过滤范围
   - 将 FilterThinkingBlocks 应用到 /v1/messages 主路径
   - 之前只应用于 count_tokens，现在两个端点都过滤
   - 防止所有端点的 thinking 相关 400 错误

3. 改进测试
   - 新增：过滤无 type discriminator 的 thinking 块
   - 新增：不过滤 tool_use 中的 thinking 字段
   - 使用 containsThinkingBlock 辅助函数验证

测试：
- ✅ 8 个测试用例全部通过
- ✅ 覆盖各种 thinking 块格式
- ✅ 确保不误伤其他类型的块

影响：
- 消除 signature required 和 invalid signature 错误
- 统一 /v1/messages 和 count_tokens 的行为
- 更健壮的 thinking 块检测逻辑

参考：Codex review 和代码改进

* refactor: 根据 Codex 审查建议进行代码优化

基于 Codex 代码审查的 P1 和 P2 改进：

P1 改进（重要问题）：

1. 优化日志输出
   - 移除 thinking 块跳过时的 log.Printf
   - 避免高频请求下的日志噪音
   - 添加注释说明可通过指标监控

2. 清理遗留代码
   - 删除未使用的 isValidThoughtSignature 函数（27行）
   - 该函数在改为完全跳过 thinking 块后不再需要

P2 改进（性能优化）：

3. 添加快速路径检查
   - 在 FilterThinkingBlocks 中添加 bytes.Contains 预检查
   - 如果请求体不包含 "thinking" 字符串，直接返回
   - 避免不必要的 JSON 解析，提升性能

技术细节：
- request_transformer.go: -27行（删除函数），+1行（优化注释）
- gateway_request.go: +5行（快速路径 + bytes 导入）

测试：
- ✅ TestBuildParts_ThinkingBlockWithoutSignature 全部通过
- ✅ TestFilterThinkingBlocks 全部通过（8个测试用例）

影响：
- 减少日志噪音
- 提升性能（快速路径）
- 代码更简洁（删除未使用代码）

参考：Codex 代码审查建议

* fix: 修复 golangci-lint 检查问题

- 格式化 gateway_request_test.go
- 使用 switch 语句替代 if-else 链（staticcheck QF1003）

* fix(antigravity): 修复 thinking signature 处理并实现 Auto 模式降级

问题分析：
1. 原先代码错误地禁用了 Claude via Vertex 的 thinkingConfig
2. 历史 thinking 块的 signature 被完全跳过，导致验证失败
3. 跨模型混用时 dummy signature 会导致 400 错误

修复内容：

**request_transformer.go**：
- 删除第 38-43 行的错误逻辑（禁用 thinkingConfig）
- 引入 thoughtSignatureMode（Preserve/Dummy）策略
- Claude 模式：透传真实 signature，过滤空/dummy
- Gemini 模式：使用 dummy signature
- 支持 signature-only thinking 块
- tool_use 的 signature 也透传

**antigravity_gateway_service.go**：
- 新增 isSignatureRelatedError() 检测 signature 相关错误
- 新增 stripThinkingFromClaudeRequest() 移除 thinking 块
- 实现 Auto 模式：检测 400 + signature 关键词时自动降级重试
- 重试时完全移除 thinking 配置和消息中的 thinking 块
- 最多重试一次，避免循环

**测试**：
- 更新并新增测试覆盖 Claude preserve/Gemini dummy 模式
- 新增 tool_use signature 处理测试
- 所有测试通过（6/6）

影响：
- ✅ Claude via Vertex 可以正常使用 thinking 功能
- ✅ 历史 signature 正确透传，避免验证失败
- ✅ 跨模型混用时自动过滤无效 signature
- ✅ 错误驱动降级，自动修复 signature 问题
- ✅ 不影响纯 Claude API 和其他渠道

参考：Codex 深度分析和实现建议

* fix(lint): 修复 gofmt 格式问题

* fix(antigravity): 修复 stripThinkingFromClaudeRequest 遗漏 untyped thinking blocks

问题：
- Codex 审查指出 stripThinkingFromClaudeRequest 只移除了 type="thinking" 的块
- 没有处理没有 type 字段的 thinking 对象（如 {"thinking": "...", "signature": "..."}）
- 导致重试时仍包含无效 thinking 块，上游 400 错误持续

修复：
- 添加检查：跳过没有 type 但有 thinking 字段的块
- 现在会移除两种格式：
  1. {"type": "thinking", "thinking": "...", "signature": "..."}
  2. {"thinking": "...", "signature": "..."}（untyped）

测试：所有测试通过

参考：Codex P1 审查意见
											
										
										
											2026-01-02 17:47:49 +08:00
+											}
-												fix(thinking): 优化 thinking block 签名错误重试逻辑

- FilterThinkingBlocksForRetry: 将 thinking block 转换为 text block 而非直接删除
- stripThinkingFromClaudeRequest: Antigravity 网关同步采用转换策略
- 统一处理 thinking/redacted_thinking/无 type 字段的 thinking block
- 保留 thinking 内容，避免上下文丢失

											
										
										
											2026-01-03 17:07:54 -08:00
+											// Handle blocks without type discriminator but with "thinking" key
-												Fix/multiple issues (#24)

* fix(gemini): 修复 google_one OAuth 配置和 scopes 问题

- 修复 google_one 类型在 ExchangeCode 和 RefreshToken 中使用内置客户端
- 添加 DefaultGoogleOneScopes，包含 generative-language 和 drive.readonly 权限
- 在 EffectiveOAuthConfig 中为 google_one 类型使用专门的 scopes
- 将 docker-compose.override.yml 重命名为 .example 并添加到 .gitignore
- 完善 docker-compose.override.yml.example 示例文档

解决问题：
1. google_one OAuth 授权后 API 调用返回 403 权限不足
2. 缺少访问 Gemini API 所需的 generative-language scope
3. 缺少获取 Drive 存储配额所需的 drive.readonly scope

* fix(antigravity): 完全跳过 Claude 模型的所有 thinking 块

问题分析：
- 当前代码尝试保留有 signature 的 thinking 块
- 但 Vertex AI 的 signature 是完整性令牌，无法在本地验证
- 导致 400 错误：Invalid signature in thinking block

根本原因：
1. thinking 功能已对非 Gemini 模型禁用 (isThinkingEnabled=false)
2. Vertex AI 要求原样重放 (thinking, signature) 对或完全不发送
3. 本地无法复制 Vertex 的加密验证逻辑

修复方案：
- 对 Claude 模型完全跳过所有 thinking 块（无论是否有 signature）
- 保持 Gemini 模型使用 dummy signature 的行为不变
- 更新测试用例以反映新的预期行为

影响：
- 消除 thinking 相关的 400 错误
- 与现有的 thinking 禁用策略保持一致
- 不影响 Gemini 模型的 thinking 功能

测试：
- ✅ TestBuildParts_ThinkingBlockWithoutSignature 全部通过
- ✅ TestBuildTools_CustomTypeTools 全部通过

参考：Codex review 建议

* fix(gateway): 修复 count_tokens 端点 400 错误

问题分析：
- count_tokens 请求包含 thinking 块时返回 400 错误
- 原因：thinking 块未被过滤，直接转发到上游 API
- 上游 API 拒绝无效的 thinking signature

根本原因：
1. /v1/messages 请求通过 TransformClaudeToGemini 过滤 thinking 块
2. count_tokens 请求绕过转换，直接转发原始请求体
3. 导致包含无效 signature 的 thinking 块被发送到上游

修复方案：
- 创建 FilterThinkingBlocks 工具函数
- 在 buildCountTokensRequest 中应用过滤（1 行修改）
- 与 /v1/messages 行为保持一致

实现细节：
- FilterThinkingBlocks: 解析 JSON，过滤 thinking 块，重新序列化
- 失败安全：解析/序列化失败时返回原始请求体
- 性能优化：仅在发现 thinking 块时重新序列化

测试：
- ✅ 6 个单元测试全部通过
- ✅ 覆盖正常过滤、无 thinking 块、无效 JSON 等场景
- ✅ 现有测试不受影响

影响：
- 消除 count_tokens 的 400 错误
- 不影响 Antigravity 账号（仍返回模拟响应）
- 适用于所有账号类型（OAuth、API Key）

文件修改：
- backend/internal/service/gateway_request.go: +62 行（新函数）
- backend/internal/service/gateway_service.go: +2 行（应用过滤）
- backend/internal/service/gateway_request_test.go: +62 行（测试）

* fix(gateway): 增强 thinking 块过滤逻辑

基于 Codex 分析和建议的改进：

问题分析：
- 新错误：signature: Field required（signature 字段缺失）
- 旧错误：Invalid signature（signature 存在但无效）
- 两者都说明 thinking 块在请求中是危险的

Codex 建议：
- 保持 Option A：完全跳过所有 thinking 块
- 原因：thinking 块应该是只输出的，除非有服务端来源证明
- 在无状态代理中，无法安全区分上游来源 vs 客户端注入

改进内容：

1. 增强 FilterThinkingBlocks 函数
   - 过滤显式的 thinking 块：{"type":"thinking", ...}
   - 过滤无 type 的 thinking 对象：{"thinking": {...}}
   - 保留 tool_use 等其他类型块中的 thinking 字段
   - 修复：只在实际过滤时更新 content 数组

2. 扩展过滤范围
   - 将 FilterThinkingBlocks 应用到 /v1/messages 主路径
   - 之前只应用于 count_tokens，现在两个端点都过滤
   - 防止所有端点的 thinking 相关 400 错误

3. 改进测试
   - 新增：过滤无 type discriminator 的 thinking 块
   - 新增：不过滤 tool_use 中的 thinking 字段
   - 使用 containsThinkingBlock 辅助函数验证

测试：
- ✅ 8 个测试用例全部通过
- ✅ 覆盖各种 thinking 块格式
- ✅ 确保不误伤其他类型的块

影响：
- 消除 signature required 和 invalid signature 错误
- 统一 /v1/messages 和 count_tokens 的行为
- 更健壮的 thinking 块检测逻辑

参考：Codex review 和代码改进

* refactor: 根据 Codex 审查建议进行代码优化

基于 Codex 代码审查的 P1 和 P2 改进：

P1 改进（重要问题）：

1. 优化日志输出
   - 移除 thinking 块跳过时的 log.Printf
   - 避免高频请求下的日志噪音
   - 添加注释说明可通过指标监控

2. 清理遗留代码
   - 删除未使用的 isValidThoughtSignature 函数（27行）
   - 该函数在改为完全跳过 thinking 块后不再需要

P2 改进（性能优化）：

3. 添加快速路径检查
   - 在 FilterThinkingBlocks 中添加 bytes.Contains 预检查
   - 如果请求体不包含 "thinking" 字符串，直接返回
   - 避免不必要的 JSON 解析，提升性能

技术细节：
- request_transformer.go: -27行（删除函数），+1行（优化注释）
- gateway_request.go: +5行（快速路径 + bytes 导入）

测试：
- ✅ TestBuildParts_ThinkingBlockWithoutSignature 全部通过
- ✅ TestFilterThinkingBlocks 全部通过（8个测试用例）

影响：
- 减少日志噪音
- 提升性能（快速路径）
- 代码更简洁（删除未使用代码）

参考：Codex 代码审查建议

* fix: 修复 golangci-lint 检查问题

- 格式化 gateway_request_test.go
- 使用 switch 语句替代 if-else 链（staticcheck QF1003）

* fix(antigravity): 修复 thinking signature 处理并实现 Auto 模式降级

问题分析：
1. 原先代码错误地禁用了 Claude via Vertex 的 thinkingConfig
2. 历史 thinking 块的 signature 被完全跳过，导致验证失败
3. 跨模型混用时 dummy signature 会导致 400 错误

修复内容：

**request_transformer.go**：
- 删除第 38-43 行的错误逻辑（禁用 thinkingConfig）
- 引入 thoughtSignatureMode（Preserve/Dummy）策略
- Claude 模式：透传真实 signature，过滤空/dummy
- Gemini 模式：使用 dummy signature
- 支持 signature-only thinking 块
- tool_use 的 signature 也透传

**antigravity_gateway_service.go**：
- 新增 isSignatureRelatedError() 检测 signature 相关错误
- 新增 stripThinkingFromClaudeRequest() 移除 thinking 块
- 实现 Auto 模式：检测 400 + signature 关键词时自动降级重试
- 重试时完全移除 thinking 配置和消息中的 thinking 块
- 最多重试一次，避免循环

**测试**：
- 更新并新增测试覆盖 Claude preserve/Gemini dummy 模式
- 新增 tool_use signature 处理测试
- 所有测试通过（6/6）

影响：
- ✅ Claude via Vertex 可以正常使用 thinking 功能
- ✅ 历史 signature 正确透传，避免验证失败
- ✅ 跨模型混用时自动过滤无效 signature
- ✅ 错误驱动降级，自动修复 signature 问题
- ✅ 不影响纯 Claude API 和其他渠道

参考：Codex 深度分析和实现建议

* fix(lint): 修复 gofmt 格式问题

* fix(antigravity): 修复 stripThinkingFromClaudeRequest 遗漏 untyped thinking blocks

问题：
- Codex 审查指出 stripThinkingFromClaudeRequest 只移除了 type="thinking" 的块
- 没有处理没有 type 字段的 thinking 对象（如 {"thinking": "...", "signature": "..."}）
- 导致重试时仍包含无效 thinking 块，上游 400 错误持续

修复：
- 添加检查：跳过没有 type 但有 thinking 字段的块
- 现在会移除两种格式：
  1. {"type": "thinking", "thinking": "...", "signature": "..."}
  2. {"thinking": "...", "signature": "..."}（untyped）

测试：所有测试通过

参考：Codex P1 审查意见
											
										
										
											2026-01-02 17:47:49 +08:00
+											if blockType == "" {
-												fix(thinking): 优化 thinking block 签名错误重试逻辑

- FilterThinkingBlocksForRetry: 将 thinking block 转换为 text block 而非直接删除
- stripThinkingFromClaudeRequest: Antigravity 网关同步采用转换策略
- 统一处理 thinking/redacted_thinking/无 type 字段的 thinking block
- 保留 thinking 内容，避免上下文丢失

											
										
										
											2026-01-03 17:07:54 -08:00
+												if _, hasThinking := blockMap["thinking"]; hasThinking {
-												Fix/multiple issues (#24)

* fix(gemini): 修复 google_one OAuth 配置和 scopes 问题

- 修复 google_one 类型在 ExchangeCode 和 RefreshToken 中使用内置客户端
- 添加 DefaultGoogleOneScopes，包含 generative-language 和 drive.readonly 权限
- 在 EffectiveOAuthConfig 中为 google_one 类型使用专门的 scopes
- 将 docker-compose.override.yml 重命名为 .example 并添加到 .gitignore
- 完善 docker-compose.override.yml.example 示例文档

解决问题：
1. google_one OAuth 授权后 API 调用返回 403 权限不足
2. 缺少访问 Gemini API 所需的 generative-language scope
3. 缺少获取 Drive 存储配额所需的 drive.readonly scope

* fix(antigravity): 完全跳过 Claude 模型的所有 thinking 块

问题分析：
- 当前代码尝试保留有 signature 的 thinking 块
- 但 Vertex AI 的 signature 是完整性令牌，无法在本地验证
- 导致 400 错误：Invalid signature in thinking block

根本原因：
1. thinking 功能已对非 Gemini 模型禁用 (isThinkingEnabled=false)
2. Vertex AI 要求原样重放 (thinking, signature) 对或完全不发送
3. 本地无法复制 Vertex 的加密验证逻辑

修复方案：
- 对 Claude 模型完全跳过所有 thinking 块（无论是否有 signature）
- 保持 Gemini 模型使用 dummy signature 的行为不变
- 更新测试用例以反映新的预期行为

影响：
- 消除 thinking 相关的 400 错误
- 与现有的 thinking 禁用策略保持一致
- 不影响 Gemini 模型的 thinking 功能

测试：
- ✅ TestBuildParts_ThinkingBlockWithoutSignature 全部通过
- ✅ TestBuildTools_CustomTypeTools 全部通过

参考：Codex review 建议

* fix(gateway): 修复 count_tokens 端点 400 错误

问题分析：
- count_tokens 请求包含 thinking 块时返回 400 错误
- 原因：thinking 块未被过滤，直接转发到上游 API
- 上游 API 拒绝无效的 thinking signature

根本原因：
1. /v1/messages 请求通过 TransformClaudeToGemini 过滤 thinking 块
2. count_tokens 请求绕过转换，直接转发原始请求体
3. 导致包含无效 signature 的 thinking 块被发送到上游

修复方案：
- 创建 FilterThinkingBlocks 工具函数
- 在 buildCountTokensRequest 中应用过滤（1 行修改）
- 与 /v1/messages 行为保持一致

实现细节：
- FilterThinkingBlocks: 解析 JSON，过滤 thinking 块，重新序列化
- 失败安全：解析/序列化失败时返回原始请求体
- 性能优化：仅在发现 thinking 块时重新序列化

测试：
- ✅ 6 个单元测试全部通过
- ✅ 覆盖正常过滤、无 thinking 块、无效 JSON 等场景
- ✅ 现有测试不受影响

影响：
- 消除 count_tokens 的 400 错误
- 不影响 Antigravity 账号（仍返回模拟响应）
- 适用于所有账号类型（OAuth、API Key）

文件修改：
- backend/internal/service/gateway_request.go: +62 行（新函数）
- backend/internal/service/gateway_service.go: +2 行（应用过滤）
- backend/internal/service/gateway_request_test.go: +62 行（测试）

* fix(gateway): 增强 thinking 块过滤逻辑

基于 Codex 分析和建议的改进：

问题分析：
- 新错误：signature: Field required（signature 字段缺失）
- 旧错误：Invalid signature（signature 存在但无效）
- 两者都说明 thinking 块在请求中是危险的

Codex 建议：
- 保持 Option A：完全跳过所有 thinking 块
- 原因：thinking 块应该是只输出的，除非有服务端来源证明
- 在无状态代理中，无法安全区分上游来源 vs 客户端注入

改进内容：

1. 增强 FilterThinkingBlocks 函数
   - 过滤显式的 thinking 块：{"type":"thinking", ...}
   - 过滤无 type 的 thinking 对象：{"thinking": {...}}
   - 保留 tool_use 等其他类型块中的 thinking 字段
   - 修复：只在实际过滤时更新 content 数组

2. 扩展过滤范围
   - 将 FilterThinkingBlocks 应用到 /v1/messages 主路径
   - 之前只应用于 count_tokens，现在两个端点都过滤
   - 防止所有端点的 thinking 相关 400 错误

3. 改进测试
   - 新增：过滤无 type discriminator 的 thinking 块
   - 新增：不过滤 tool_use 中的 thinking 字段
   - 使用 containsThinkingBlock 辅助函数验证

测试：
- ✅ 8 个测试用例全部通过
- ✅ 覆盖各种 thinking 块格式
- ✅ 确保不误伤其他类型的块

影响：
- 消除 signature required 和 invalid signature 错误
- 统一 /v1/messages 和 count_tokens 的行为
- 更健壮的 thinking 块检测逻辑

参考：Codex review 和代码改进

* refactor: 根据 Codex 审查建议进行代码优化

基于 Codex 代码审查的 P1 和 P2 改进：

P1 改进（重要问题）：

1. 优化日志输出
   - 移除 thinking 块跳过时的 log.Printf
   - 避免高频请求下的日志噪音
   - 添加注释说明可通过指标监控

2. 清理遗留代码
   - 删除未使用的 isValidThoughtSignature 函数（27行）
   - 该函数在改为完全跳过 thinking 块后不再需要

P2 改进（性能优化）：

3. 添加快速路径检查
   - 在 FilterThinkingBlocks 中添加 bytes.Contains 预检查
   - 如果请求体不包含 "thinking" 字符串，直接返回
   - 避免不必要的 JSON 解析，提升性能

技术细节：
- request_transformer.go: -27行（删除函数），+1行（优化注释）
- gateway_request.go: +5行（快速路径 + bytes 导入）

测试：
- ✅ TestBuildParts_ThinkingBlockWithoutSignature 全部通过
- ✅ TestFilterThinkingBlocks 全部通过（8个测试用例）

影响：
- 减少日志噪音
- 提升性能（快速路径）
- 代码更简洁（删除未使用代码）

参考：Codex 代码审查建议

* fix: 修复 golangci-lint 检查问题

- 格式化 gateway_request_test.go
- 使用 switch 语句替代 if-else 链（staticcheck QF1003）

* fix(antigravity): 修复 thinking signature 处理并实现 Auto 模式降级

问题分析：
1. 原先代码错误地禁用了 Claude via Vertex 的 thinkingConfig
2. 历史 thinking 块的 signature 被完全跳过，导致验证失败
3. 跨模型混用时 dummy signature 会导致 400 错误

修复内容：

**request_transformer.go**：
- 删除第 38-43 行的错误逻辑（禁用 thinkingConfig）
- 引入 thoughtSignatureMode（Preserve/Dummy）策略
- Claude 模式：透传真实 signature，过滤空/dummy
- Gemini 模式：使用 dummy signature
- 支持 signature-only thinking 块
- tool_use 的 signature 也透传

**antigravity_gateway_service.go**：
- 新增 isSignatureRelatedError() 检测 signature 相关错误
- 新增 stripThinkingFromClaudeRequest() 移除 thinking 块
- 实现 Auto 模式：检测 400 + signature 关键词时自动降级重试
- 重试时完全移除 thinking 配置和消息中的 thinking 块
- 最多重试一次，避免循环

**测试**：
- 更新并新增测试覆盖 Claude preserve/Gemini dummy 模式
- 新增 tool_use signature 处理测试
- 所有测试通过（6/6）

影响：
- ✅ Claude via Vertex 可以正常使用 thinking 功能
- ✅ 历史 signature 正确透传，避免验证失败
- ✅ 跨模型混用时自动过滤无效 signature
- ✅ 错误驱动降级，自动修复 signature 问题
- ✅ 不影响纯 Claude API 和其他渠道

参考：Codex 深度分析和实现建议

* fix(lint): 修复 gofmt 格式问题

* fix(antigravity): 修复 stripThinkingFromClaudeRequest 遗漏 untyped thinking blocks

问题：
- Codex 审查指出 stripThinkingFromClaudeRequest 只移除了 type="thinking" 的块
- 没有处理没有 type 字段的 thinking 对象（如 {"thinking": "...", "signature": "..."}）
- 导致重试时仍包含无效 thinking 块，上游 400 错误持续

修复：
- 添加检查：跳过没有 type 但有 thinking 字段的块
- 现在会移除两种格式：
  1. {"type": "thinking", "thinking": "...", "signature": "..."}
  2. {"thinking": "...", "signature": "..."}（untyped）

测试：所有测试通过

参考：Codex P1 审查意见
											
										
										
											2026-01-02 17:47:49 +08:00
+													filtered = true
 													filteredThisMessage = true
-												perf(gateway): 优化负载感知调度

主要改进：
- 优化负载感知调度的准确性和响应速度
- 将 AccountUsageService 的包级缓存改为依赖注入
- 修复 SSE/JSON 转义和 nil 安全问题
- 恢复 Google One 功能兼容性

											
										
										
											2026-01-03 06:32:51 -08:00
+													continue
-												Fix/multiple issues (#24)

* fix(gemini): 修复 google_one OAuth 配置和 scopes 问题

- 修复 google_one 类型在 ExchangeCode 和 RefreshToken 中使用内置客户端
- 添加 DefaultGoogleOneScopes，包含 generative-language 和 drive.readonly 权限
- 在 EffectiveOAuthConfig 中为 google_one 类型使用专门的 scopes
- 将 docker-compose.override.yml 重命名为 .example 并添加到 .gitignore
- 完善 docker-compose.override.yml.example 示例文档

解决问题：
1. google_one OAuth 授权后 API 调用返回 403 权限不足
2. 缺少访问 Gemini API 所需的 generative-language scope
3. 缺少获取 Drive 存储配额所需的 drive.readonly scope

* fix(antigravity): 完全跳过 Claude 模型的所有 thinking 块

问题分析：
- 当前代码尝试保留有 signature 的 thinking 块
- 但 Vertex AI 的 signature 是完整性令牌，无法在本地验证
- 导致 400 错误：Invalid signature in thinking block

根本原因：
1. thinking 功能已对非 Gemini 模型禁用 (isThinkingEnabled=false)
2. Vertex AI 要求原样重放 (thinking, signature) 对或完全不发送
3. 本地无法复制 Vertex 的加密验证逻辑

修复方案：
- 对 Claude 模型完全跳过所有 thinking 块（无论是否有 signature）
- 保持 Gemini 模型使用 dummy signature 的行为不变
- 更新测试用例以反映新的预期行为

影响：
- 消除 thinking 相关的 400 错误
- 与现有的 thinking 禁用策略保持一致
- 不影响 Gemini 模型的 thinking 功能

测试：
- ✅ TestBuildParts_ThinkingBlockWithoutSignature 全部通过
- ✅ TestBuildTools_CustomTypeTools 全部通过

参考：Codex review 建议

* fix(gateway): 修复 count_tokens 端点 400 错误

问题分析：
- count_tokens 请求包含 thinking 块时返回 400 错误
- 原因：thinking 块未被过滤，直接转发到上游 API
- 上游 API 拒绝无效的 thinking signature

根本原因：
1. /v1/messages 请求通过 TransformClaudeToGemini 过滤 thinking 块
2. count_tokens 请求绕过转换，直接转发原始请求体
3. 导致包含无效 signature 的 thinking 块被发送到上游

修复方案：
- 创建 FilterThinkingBlocks 工具函数
- 在 buildCountTokensRequest 中应用过滤（1 行修改）
- 与 /v1/messages 行为保持一致

实现细节：
- FilterThinkingBlocks: 解析 JSON，过滤 thinking 块，重新序列化
- 失败安全：解析/序列化失败时返回原始请求体
- 性能优化：仅在发现 thinking 块时重新序列化

测试：
- ✅ 6 个单元测试全部通过
- ✅ 覆盖正常过滤、无 thinking 块、无效 JSON 等场景
- ✅ 现有测试不受影响

影响：
- 消除 count_tokens 的 400 错误
- 不影响 Antigravity 账号（仍返回模拟响应）
- 适用于所有账号类型（OAuth、API Key）

文件修改：
- backend/internal/service/gateway_request.go: +62 行（新函数）
- backend/internal/service/gateway_service.go: +2 行（应用过滤）
- backend/internal/service/gateway_request_test.go: +62 行（测试）

* fix(gateway): 增强 thinking 块过滤逻辑

基于 Codex 分析和建议的改进：

问题分析：
- 新错误：signature: Field required（signature 字段缺失）
- 旧错误：Invalid signature（signature 存在但无效）
- 两者都说明 thinking 块在请求中是危险的

Codex 建议：
- 保持 Option A：完全跳过所有 thinking 块
- 原因：thinking 块应该是只输出的，除非有服务端来源证明
- 在无状态代理中，无法安全区分上游来源 vs 客户端注入

改进内容：

1. 增强 FilterThinkingBlocks 函数
   - 过滤显式的 thinking 块：{"type":"thinking", ...}
   - 过滤无 type 的 thinking 对象：{"thinking": {...}}
   - 保留 tool_use 等其他类型块中的 thinking 字段
   - 修复：只在实际过滤时更新 content 数组

2. 扩展过滤范围
   - 将 FilterThinkingBlocks 应用到 /v1/messages 主路径
   - 之前只应用于 count_tokens，现在两个端点都过滤
   - 防止所有端点的 thinking 相关 400 错误

3. 改进测试
   - 新增：过滤无 type discriminator 的 thinking 块
   - 新增：不过滤 tool_use 中的 thinking 字段
   - 使用 containsThinkingBlock 辅助函数验证

测试：
- ✅ 8 个测试用例全部通过
- ✅ 覆盖各种 thinking 块格式
- ✅ 确保不误伤其他类型的块

影响：
- 消除 signature required 和 invalid signature 错误
- 统一 /v1/messages 和 count_tokens 的行为
- 更健壮的 thinking 块检测逻辑

参考：Codex review 和代码改进

* refactor: 根据 Codex 审查建议进行代码优化

基于 Codex 代码审查的 P1 和 P2 改进：

P1 改进（重要问题）：

1. 优化日志输出
   - 移除 thinking 块跳过时的 log.Printf
   - 避免高频请求下的日志噪音
   - 添加注释说明可通过指标监控

2. 清理遗留代码
   - 删除未使用的 isValidThoughtSignature 函数（27行）
   - 该函数在改为完全跳过 thinking 块后不再需要

P2 改进（性能优化）：

3. 添加快速路径检查
   - 在 FilterThinkingBlocks 中添加 bytes.Contains 预检查
   - 如果请求体不包含 "thinking" 字符串，直接返回
   - 避免不必要的 JSON 解析，提升性能

技术细节：
- request_transformer.go: -27行（删除函数），+1行（优化注释）
- gateway_request.go: +5行（快速路径 + bytes 导入）

测试：
- ✅ TestBuildParts_ThinkingBlockWithoutSignature 全部通过
- ✅ TestFilterThinkingBlocks 全部通过（8个测试用例）

影响：
- 减少日志噪音
- 提升性能（快速路径）
- 代码更简洁（删除未使用代码）

参考：Codex 代码审查建议

* fix: 修复 golangci-lint 检查问题

- 格式化 gateway_request_test.go
- 使用 switch 语句替代 if-else 链（staticcheck QF1003）

* fix(antigravity): 修复 thinking signature 处理并实现 Auto 模式降级

问题分析：
1. 原先代码错误地禁用了 Claude via Vertex 的 thinkingConfig
2. 历史 thinking 块的 signature 被完全跳过，导致验证失败
3. 跨模型混用时 dummy signature 会导致 400 错误

修复内容：

**request_transformer.go**：
- 删除第 38-43 行的错误逻辑（禁用 thinkingConfig）
- 引入 thoughtSignatureMode（Preserve/Dummy）策略
- Claude 模式：透传真实 signature，过滤空/dummy
- Gemini 模式：使用 dummy signature
- 支持 signature-only thinking 块
- tool_use 的 signature 也透传

**antigravity_gateway_service.go**：
- 新增 isSignatureRelatedError() 检测 signature 相关错误
- 新增 stripThinkingFromClaudeRequest() 移除 thinking 块
- 实现 Auto 模式：检测 400 + signature 关键词时自动降级重试
- 重试时完全移除 thinking 配置和消息中的 thinking 块
- 最多重试一次，避免循环

**测试**：
- 更新并新增测试覆盖 Claude preserve/Gemini dummy 模式
- 新增 tool_use signature 处理测试
- 所有测试通过（6/6）

影响：
- ✅ Claude via Vertex 可以正常使用 thinking 功能
- ✅ 历史 signature 正确透传，避免验证失败
- ✅ 跨模型混用时自动过滤无效 signature
- ✅ 错误驱动降级，自动修复 signature 问题
- ✅ 不影响纯 Claude API 和其他渠道

参考：Codex 深度分析和实现建议

* fix(lint): 修复 gofmt 格式问题

* fix(antigravity): 修复 stripThinkingFromClaudeRequest 遗漏 untyped thinking blocks

问题：
- Codex 审查指出 stripThinkingFromClaudeRequest 只移除了 type="thinking" 的块
- 没有处理没有 type 字段的 thinking 对象（如 {"thinking": "...", "signature": "..."}）
- 导致重试时仍包含无效 thinking 块，上游 400 错误持续

修复：
- 添加检查：跳过没有 type 但有 thinking 字段的块
- 现在会移除两种格式：
  1. {"type": "thinking", "thinking": "...", "signature": "..."}
  2. {"thinking": "...", "signature": "..."}（untyped）

测试：所有测试通过

参考：Codex P1 审查意见
											
										
										
											2026-01-02 17:47:49 +08:00
+												}
 											}
 											newContent = append(newContent, block)
 										}
 										if filteredThisMessage {
 											msgMap["content"] = newContent
 										}
 									}
 									if !filtered {
-												fix(thinking): 优化 thinking block 签名错误重试逻辑

- FilterThinkingBlocksForRetry: 将 thinking block 转换为 text block 而非直接删除
- stripThinkingFromClaudeRequest: Antigravity 网关同步采用转换策略
- 统一处理 thinking/redacted_thinking/无 type 字段的 thinking block
- 保留 thinking 内容，避免上下文丢失

											
										
										
											2026-01-03 17:07:54 -08:00
+										return body
-												Fix/multiple issues (#24)

* fix(gemini): 修复 google_one OAuth 配置和 scopes 问题

- 修复 google_one 类型在 ExchangeCode 和 RefreshToken 中使用内置客户端
- 添加 DefaultGoogleOneScopes，包含 generative-language 和 drive.readonly 权限
- 在 EffectiveOAuthConfig 中为 google_one 类型使用专门的 scopes
- 将 docker-compose.override.yml 重命名为 .example 并添加到 .gitignore
- 完善 docker-compose.override.yml.example 示例文档

解决问题：
1. google_one OAuth 授权后 API 调用返回 403 权限不足
2. 缺少访问 Gemini API 所需的 generative-language scope
3. 缺少获取 Drive 存储配额所需的 drive.readonly scope

* fix(antigravity): 完全跳过 Claude 模型的所有 thinking 块

问题分析：
- 当前代码尝试保留有 signature 的 thinking 块
- 但 Vertex AI 的 signature 是完整性令牌，无法在本地验证
- 导致 400 错误：Invalid signature in thinking block

根本原因：
1. thinking 功能已对非 Gemini 模型禁用 (isThinkingEnabled=false)
2. Vertex AI 要求原样重放 (thinking, signature) 对或完全不发送
3. 本地无法复制 Vertex 的加密验证逻辑

修复方案：
- 对 Claude 模型完全跳过所有 thinking 块（无论是否有 signature）
- 保持 Gemini 模型使用 dummy signature 的行为不变
- 更新测试用例以反映新的预期行为

影响：
- 消除 thinking 相关的 400 错误
- 与现有的 thinking 禁用策略保持一致
- 不影响 Gemini 模型的 thinking 功能

测试：
- ✅ TestBuildParts_ThinkingBlockWithoutSignature 全部通过
- ✅ TestBuildTools_CustomTypeTools 全部通过

参考：Codex review 建议

* fix(gateway): 修复 count_tokens 端点 400 错误

问题分析：
- count_tokens 请求包含 thinking 块时返回 400 错误
- 原因：thinking 块未被过滤，直接转发到上游 API
- 上游 API 拒绝无效的 thinking signature

根本原因：
1. /v1/messages 请求通过 TransformClaudeToGemini 过滤 thinking 块
2. count_tokens 请求绕过转换，直接转发原始请求体
3. 导致包含无效 signature 的 thinking 块被发送到上游

修复方案：
- 创建 FilterThinkingBlocks 工具函数
- 在 buildCountTokensRequest 中应用过滤（1 行修改）
- 与 /v1/messages 行为保持一致

实现细节：
- FilterThinkingBlocks: 解析 JSON，过滤 thinking 块，重新序列化
- 失败安全：解析/序列化失败时返回原始请求体
- 性能优化：仅在发现 thinking 块时重新序列化

测试：
- ✅ 6 个单元测试全部通过
- ✅ 覆盖正常过滤、无 thinking 块、无效 JSON 等场景
- ✅ 现有测试不受影响

影响：
- 消除 count_tokens 的 400 错误
- 不影响 Antigravity 账号（仍返回模拟响应）
- 适用于所有账号类型（OAuth、API Key）

文件修改：
- backend/internal/service/gateway_request.go: +62 行（新函数）
- backend/internal/service/gateway_service.go: +2 行（应用过滤）
- backend/internal/service/gateway_request_test.go: +62 行（测试）

* fix(gateway): 增强 thinking 块过滤逻辑

基于 Codex 分析和建议的改进：

问题分析：
- 新错误：signature: Field required（signature 字段缺失）
- 旧错误：Invalid signature（signature 存在但无效）
- 两者都说明 thinking 块在请求中是危险的

Codex 建议：
- 保持 Option A：完全跳过所有 thinking 块
- 原因：thinking 块应该是只输出的，除非有服务端来源证明
- 在无状态代理中，无法安全区分上游来源 vs 客户端注入

改进内容：

1. 增强 FilterThinkingBlocks 函数
   - 过滤显式的 thinking 块：{"type":"thinking", ...}
   - 过滤无 type 的 thinking 对象：{"thinking": {...}}
   - 保留 tool_use 等其他类型块中的 thinking 字段
   - 修复：只在实际过滤时更新 content 数组

2. 扩展过滤范围
   - 将 FilterThinkingBlocks 应用到 /v1/messages 主路径
   - 之前只应用于 count_tokens，现在两个端点都过滤
   - 防止所有端点的 thinking 相关 400 错误

3. 改进测试
   - 新增：过滤无 type discriminator 的 thinking 块
   - 新增：不过滤 tool_use 中的 thinking 字段
   - 使用 containsThinkingBlock 辅助函数验证

测试：
- ✅ 8 个测试用例全部通过
- ✅ 覆盖各种 thinking 块格式
- ✅ 确保不误伤其他类型的块

影响：
- 消除 signature required 和 invalid signature 错误
- 统一 /v1/messages 和 count_tokens 的行为
- 更健壮的 thinking 块检测逻辑

参考：Codex review 和代码改进

* refactor: 根据 Codex 审查建议进行代码优化

基于 Codex 代码审查的 P1 和 P2 改进：

P1 改进（重要问题）：

1. 优化日志输出
   - 移除 thinking 块跳过时的 log.Printf
   - 避免高频请求下的日志噪音
   - 添加注释说明可通过指标监控

2. 清理遗留代码
   - 删除未使用的 isValidThoughtSignature 函数（27行）
   - 该函数在改为完全跳过 thinking 块后不再需要

P2 改进（性能优化）：

3. 添加快速路径检查
   - 在 FilterThinkingBlocks 中添加 bytes.Contains 预检查
   - 如果请求体不包含 "thinking" 字符串，直接返回
   - 避免不必要的 JSON 解析，提升性能

技术细节：
- request_transformer.go: -27行（删除函数），+1行（优化注释）
- gateway_request.go: +5行（快速路径 + bytes 导入）

测试：
- ✅ TestBuildParts_ThinkingBlockWithoutSignature 全部通过
- ✅ TestFilterThinkingBlocks 全部通过（8个测试用例）

影响：
- 减少日志噪音
- 提升性能（快速路径）
- 代码更简洁（删除未使用代码）

参考：Codex 代码审查建议

* fix: 修复 golangci-lint 检查问题

- 格式化 gateway_request_test.go
- 使用 switch 语句替代 if-else 链（staticcheck QF1003）

* fix(antigravity): 修复 thinking signature 处理并实现 Auto 模式降级

问题分析：
1. 原先代码错误地禁用了 Claude via Vertex 的 thinkingConfig
2. 历史 thinking 块的 signature 被完全跳过，导致验证失败
3. 跨模型混用时 dummy signature 会导致 400 错误

修复内容：

**request_transformer.go**：
- 删除第 38-43 行的错误逻辑（禁用 thinkingConfig）
- 引入 thoughtSignatureMode（Preserve/Dummy）策略
- Claude 模式：透传真实 signature，过滤空/dummy
- Gemini 模式：使用 dummy signature
- 支持 signature-only thinking 块
- tool_use 的 signature 也透传

**antigravity_gateway_service.go**：
- 新增 isSignatureRelatedError() 检测 signature 相关错误
- 新增 stripThinkingFromClaudeRequest() 移除 thinking 块
- 实现 Auto 模式：检测 400 + signature 关键词时自动降级重试
- 重试时完全移除 thinking 配置和消息中的 thinking 块
- 最多重试一次，避免循环

**测试**：
- 更新并新增测试覆盖 Claude preserve/Gemini dummy 模式
- 新增 tool_use signature 处理测试
- 所有测试通过（6/6）

影响：
- ✅ Claude via Vertex 可以正常使用 thinking 功能
- ✅ 历史 signature 正确透传，避免验证失败
- ✅ 跨模型混用时自动过滤无效 signature
- ✅ 错误驱动降级，自动修复 signature 问题
- ✅ 不影响纯 Claude API 和其他渠道

参考：Codex 深度分析和实现建议

* fix(lint): 修复 gofmt 格式问题

* fix(antigravity): 修复 stripThinkingFromClaudeRequest 遗漏 untyped thinking blocks

问题：
- Codex 审查指出 stripThinkingFromClaudeRequest 只移除了 type="thinking" 的块
- 没有处理没有 type 字段的 thinking 对象（如 {"thinking": "...", "signature": "..."}）
- 导致重试时仍包含无效 thinking 块，上游 400 错误持续

修复：
- 添加检查：跳过没有 type 但有 thinking 字段的块
- 现在会移除两种格式：
  1. {"type": "thinking", "thinking": "...", "signature": "..."}
  2. {"thinking": "...", "signature": "..."}（untyped）

测试：所有测试通过

参考：Codex P1 审查意见
											
										
										
											2026-01-02 17:47:49 +08:00
+									}
 									newBody, err := json.Marshal(req)
 									if err != nil {
-												fix(thinking): 优化 thinking block 签名错误重试逻辑

- FilterThinkingBlocksForRetry: 将 thinking block 转换为 text block 而非直接删除
- stripThinkingFromClaudeRequest: Antigravity 网关同步采用转换策略
- 统一处理 thinking/redacted_thinking/无 type 字段的 thinking block
- 保留 thinking 内容，避免上下文丢失

											
										
										
											2026-01-03 17:07:54 -08:00
+										return body
-												Fix/multiple issues (#24)

* fix(gemini): 修复 google_one OAuth 配置和 scopes 问题

- 修复 google_one 类型在 ExchangeCode 和 RefreshToken 中使用内置客户端
- 添加 DefaultGoogleOneScopes，包含 generative-language 和 drive.readonly 权限
- 在 EffectiveOAuthConfig 中为 google_one 类型使用专门的 scopes
- 将 docker-compose.override.yml 重命名为 .example 并添加到 .gitignore
- 完善 docker-compose.override.yml.example 示例文档

解决问题：
1. google_one OAuth 授权后 API 调用返回 403 权限不足
2. 缺少访问 Gemini API 所需的 generative-language scope
3. 缺少获取 Drive 存储配额所需的 drive.readonly scope

* fix(antigravity): 完全跳过 Claude 模型的所有 thinking 块

问题分析：
- 当前代码尝试保留有 signature 的 thinking 块
- 但 Vertex AI 的 signature 是完整性令牌，无法在本地验证
- 导致 400 错误：Invalid signature in thinking block

根本原因：
1. thinking 功能已对非 Gemini 模型禁用 (isThinkingEnabled=false)
2. Vertex AI 要求原样重放 (thinking, signature) 对或完全不发送
3. 本地无法复制 Vertex 的加密验证逻辑

修复方案：
- 对 Claude 模型完全跳过所有 thinking 块（无论是否有 signature）
- 保持 Gemini 模型使用 dummy signature 的行为不变
- 更新测试用例以反映新的预期行为

影响：
- 消除 thinking 相关的 400 错误
- 与现有的 thinking 禁用策略保持一致
- 不影响 Gemini 模型的 thinking 功能

测试：
- ✅ TestBuildParts_ThinkingBlockWithoutSignature 全部通过
- ✅ TestBuildTools_CustomTypeTools 全部通过

参考：Codex review 建议

* fix(gateway): 修复 count_tokens 端点 400 错误

问题分析：
- count_tokens 请求包含 thinking 块时返回 400 错误
- 原因：thinking 块未被过滤，直接转发到上游 API
- 上游 API 拒绝无效的 thinking signature

根本原因：
1. /v1/messages 请求通过 TransformClaudeToGemini 过滤 thinking 块
2. count_tokens 请求绕过转换，直接转发原始请求体
3. 导致包含无效 signature 的 thinking 块被发送到上游

修复方案：
- 创建 FilterThinkingBlocks 工具函数
- 在 buildCountTokensRequest 中应用过滤（1 行修改）
- 与 /v1/messages 行为保持一致

实现细节：
- FilterThinkingBlocks: 解析 JSON，过滤 thinking 块，重新序列化
- 失败安全：解析/序列化失败时返回原始请求体
- 性能优化：仅在发现 thinking 块时重新序列化

测试：
- ✅ 6 个单元测试全部通过
- ✅ 覆盖正常过滤、无 thinking 块、无效 JSON 等场景
- ✅ 现有测试不受影响

影响：
- 消除 count_tokens 的 400 错误
- 不影响 Antigravity 账号（仍返回模拟响应）
- 适用于所有账号类型（OAuth、API Key）

文件修改：
- backend/internal/service/gateway_request.go: +62 行（新函数）
- backend/internal/service/gateway_service.go: +2 行（应用过滤）
- backend/internal/service/gateway_request_test.go: +62 行（测试）

* fix(gateway): 增强 thinking 块过滤逻辑

基于 Codex 分析和建议的改进：

问题分析：
- 新错误：signature: Field required（signature 字段缺失）
- 旧错误：Invalid signature（signature 存在但无效）
- 两者都说明 thinking 块在请求中是危险的

Codex 建议：
- 保持 Option A：完全跳过所有 thinking 块
- 原因：thinking 块应该是只输出的，除非有服务端来源证明
- 在无状态代理中，无法安全区分上游来源 vs 客户端注入

改进内容：

1. 增强 FilterThinkingBlocks 函数
   - 过滤显式的 thinking 块：{"type":"thinking", ...}
   - 过滤无 type 的 thinking 对象：{"thinking": {...}}
   - 保留 tool_use 等其他类型块中的 thinking 字段
   - 修复：只在实际过滤时更新 content 数组

2. 扩展过滤范围
   - 将 FilterThinkingBlocks 应用到 /v1/messages 主路径
   - 之前只应用于 count_tokens，现在两个端点都过滤
   - 防止所有端点的 thinking 相关 400 错误

3. 改进测试
   - 新增：过滤无 type discriminator 的 thinking 块
   - 新增：不过滤 tool_use 中的 thinking 字段
   - 使用 containsThinkingBlock 辅助函数验证

测试：
- ✅ 8 个测试用例全部通过
- ✅ 覆盖各种 thinking 块格式
- ✅ 确保不误伤其他类型的块

影响：
- 消除 signature required 和 invalid signature 错误
- 统一 /v1/messages 和 count_tokens 的行为
- 更健壮的 thinking 块检测逻辑

参考：Codex review 和代码改进

* refactor: 根据 Codex 审查建议进行代码优化

基于 Codex 代码审查的 P1 和 P2 改进：

P1 改进（重要问题）：

1. 优化日志输出
   - 移除 thinking 块跳过时的 log.Printf
   - 避免高频请求下的日志噪音
   - 添加注释说明可通过指标监控

2. 清理遗留代码
   - 删除未使用的 isValidThoughtSignature 函数（27行）
   - 该函数在改为完全跳过 thinking 块后不再需要

P2 改进（性能优化）：

3. 添加快速路径检查
   - 在 FilterThinkingBlocks 中添加 bytes.Contains 预检查
   - 如果请求体不包含 "thinking" 字符串，直接返回
   - 避免不必要的 JSON 解析，提升性能

技术细节：
- request_transformer.go: -27行（删除函数），+1行（优化注释）
- gateway_request.go: +5行（快速路径 + bytes 导入）

测试：
- ✅ TestBuildParts_ThinkingBlockWithoutSignature 全部通过
- ✅ TestFilterThinkingBlocks 全部通过（8个测试用例）

影响：
- 减少日志噪音
- 提升性能（快速路径）
- 代码更简洁（删除未使用代码）

参考：Codex 代码审查建议

* fix: 修复 golangci-lint 检查问题

- 格式化 gateway_request_test.go
- 使用 switch 语句替代 if-else 链（staticcheck QF1003）

* fix(antigravity): 修复 thinking signature 处理并实现 Auto 模式降级

问题分析：
1. 原先代码错误地禁用了 Claude via Vertex 的 thinkingConfig
2. 历史 thinking 块的 signature 被完全跳过，导致验证失败
3. 跨模型混用时 dummy signature 会导致 400 错误

修复内容：

**request_transformer.go**：
- 删除第 38-43 行的错误逻辑（禁用 thinkingConfig）
- 引入 thoughtSignatureMode（Preserve/Dummy）策略
- Claude 模式：透传真实 signature，过滤空/dummy
- Gemini 模式：使用 dummy signature
- 支持 signature-only thinking 块
- tool_use 的 signature 也透传

**antigravity_gateway_service.go**：
- 新增 isSignatureRelatedError() 检测 signature 相关错误
- 新增 stripThinkingFromClaudeRequest() 移除 thinking 块
- 实现 Auto 模式：检测 400 + signature 关键词时自动降级重试
- 重试时完全移除 thinking 配置和消息中的 thinking 块
- 最多重试一次，避免循环

**测试**：
- 更新并新增测试覆盖 Claude preserve/Gemini dummy 模式
- 新增 tool_use signature 处理测试
- 所有测试通过（6/6）

影响：
- ✅ Claude via Vertex 可以正常使用 thinking 功能
- ✅ 历史 signature 正确透传，避免验证失败
- ✅ 跨模型混用时自动过滤无效 signature
- ✅ 错误驱动降级，自动修复 signature 问题
- ✅ 不影响纯 Claude API 和其他渠道

参考：Codex 深度分析和实现建议

* fix(lint): 修复 gofmt 格式问题

* fix(antigravity): 修复 stripThinkingFromClaudeRequest 遗漏 untyped thinking blocks

问题：
- Codex 审查指出 stripThinkingFromClaudeRequest 只移除了 type="thinking" 的块
- 没有处理没有 type 字段的 thinking 对象（如 {"thinking": "...", "signature": "..."}）
- 导致重试时仍包含无效 thinking 块，上游 400 错误持续

修复：
- 添加检查：跳过没有 type 但有 thinking 字段的块
- 现在会移除两种格式：
  1. {"type": "thinking", "thinking": "...", "signature": "..."}
  2. {"thinking": "...", "signature": "..."}（untyped）

测试：所有测试通过

参考：Codex P1 审查意见
											
										
										
											2026-01-02 17:47:49 +08:00
+									}
 									return newBody
 								}