backend/internal/service/gateway_service.go

package service

import (
	"bufio"
	"bytes"
	"context"
	"crypto/sha256"
	"encoding/hex"
	"encoding/json"
	"errors"
	"fmt"
	"io"
	"log"
	"log/slog"
	mathrand "math/rand"
	"net/http"
	"os"
	"regexp"
	"sort"
	"strings"
	"sync/atomic"
	"time"
	"unicode"

	"github.com/Wei-Shaw/sub2api/internal/config"
	"github.com/Wei-Shaw/sub2api/internal/pkg/claude"
	"github.com/Wei-Shaw/sub2api/internal/pkg/ctxkey"
	"github.com/Wei-Shaw/sub2api/internal/util/responseheaders"
	"github.com/Wei-Shaw/sub2api/internal/util/urlvalidator"
	"github.com/google/uuid"
	"github.com/tidwall/gjson"
	"github.com/tidwall/sjson"

	"github.com/gin-gonic/gin"
)

const (
	claudeAPIURL            = "https://api.anthropic.com/v1/messages?beta=true"
	claudeAPICountTokensURL = "https://api.anthropic.com/v1/messages/count_tokens?beta=true"
	stickySessionTTL        = time.Hour // 粘性会话TTL
	defaultMaxLineSize      = 40 * 1024 * 1024
	// Canonical Claude Code banner. Keep it EXACT (no trailing whitespace/newlines)
	// to match real Claude CLI traffic as closely as possible. When we need a visual
	// separator between system blocks, we add "\n\n" at concatenation time.
	claudeCodeSystemPrompt = "You are Claude Code, Anthropic's official CLI for Claude."
	maxCacheControlBlocks  = 4 // Anthropic API 允许的最大 cache_control 块数量
)

const (
	claudeMimicDebugInfoKey = "claude_mimic_debug_info"
)

func (s *GatewayService) debugModelRoutingEnabled() bool {
	v := strings.ToLower(strings.TrimSpace(os.Getenv("SUB2API_DEBUG_MODEL_ROUTING")))
	return v == "1" || v == "true" || v == "yes" || v == "on"
}

func (s *GatewayService) debugClaudeMimicEnabled() bool {
	v := strings.ToLower(strings.TrimSpace(os.Getenv("SUB2API_DEBUG_CLAUDE_MIMIC")))
	return v == "1" || v == "true" || v == "yes" || v == "on"
}

func shortSessionHash(sessionHash string) string {
	if sessionHash == "" {
		return ""
	}
	if len(sessionHash) <= 8 {
		return sessionHash
	}
	return sessionHash[:8]
}

func normalizeClaudeModelForAnthropic(requestedModel string) string {
	for _, prefix := range anthropicPrefixMappings {
		if strings.HasPrefix(requestedModel, prefix) {
			return prefix
		}
	}
	return requestedModel
}

func redactAuthHeaderValue(v string) string {
	v = strings.TrimSpace(v)
	if v == "" {
		return ""
	}
	// Keep scheme for debugging, redact secret.
	if strings.HasPrefix(strings.ToLower(v), "bearer ") {
		return "Bearer [redacted]"
	}
	return "[redacted]"
}

func safeHeaderValueForLog(key string, v string) string {
	key = strings.ToLower(strings.TrimSpace(key))
	switch key {
	case "authorization", "x-api-key":
		return redactAuthHeaderValue(v)
	default:
		return strings.TrimSpace(v)
	}
}

func extractSystemPreviewFromBody(body []byte) string {
	if len(body) == 0 {
		return ""
	}
	sys := gjson.GetBytes(body, "system")
	if !sys.Exists() {
		return ""
	}

	switch {
	case sys.IsArray():
		for _, item := range sys.Array() {
			if !item.IsObject() {
				continue
			}
			if strings.EqualFold(item.Get("type").String(), "text") {
				if t := item.Get("text").String(); strings.TrimSpace(t) != "" {
					return t
				}
			}
		}
		return ""
	case sys.Type == gjson.String:
		return sys.String()
	default:
		return ""
	}
}

func buildClaudeMimicDebugLine(req *http.Request, body []byte, account *Account, tokenType string, mimicClaudeCode bool) string {
	if req == nil {
		return ""
	}

	// Only log a minimal fingerprint to avoid leaking user content.
	interesting := []string{
		"user-agent",
		"x-app",
		"anthropic-dangerous-direct-browser-access",
		"anthropic-version",
		"anthropic-beta",
		"x-stainless-lang",
		"x-stainless-package-version",
		"x-stainless-os",
		"x-stainless-arch",
		"x-stainless-runtime",
		"x-stainless-runtime-version",
		"x-stainless-retry-count",
		"x-stainless-timeout",
		"authorization",
		"x-api-key",
		"content-type",
		"accept",
		"x-stainless-helper-method",
	}

	h := make([]string, 0, len(interesting))
	for _, k := range interesting {
		if v := req.Header.Get(k); v != "" {
			h = append(h, fmt.Sprintf("%s=%q", k, safeHeaderValueForLog(k, v)))
		}
	}

	metaUserID := strings.TrimSpace(gjson.GetBytes(body, "metadata.user_id").String())
	sysPreview := strings.TrimSpace(extractSystemPreviewFromBody(body))

	// Truncate preview to keep logs sane.
	if len(sysPreview) > 300 {
		sysPreview = sysPreview[:300] + "..."
	}
	sysPreview = strings.ReplaceAll(sysPreview, "\n", "\\n")
	sysPreview = strings.ReplaceAll(sysPreview, "\r", "\\r")

	aid := int64(0)
	aname := ""
	if account != nil {
		aid = account.ID
		aname = account.Name
	}

	return fmt.Sprintf(
		"url=%s account=%d(%s) tokenType=%s mimic=%t meta.user_id=%q system.preview=%q headers={%s}",
		req.URL.String(),
		aid,
		aname,
		tokenType,
		mimicClaudeCode,
		metaUserID,
		sysPreview,
		strings.Join(h, " "),
	)
}

func logClaudeMimicDebug(req *http.Request, body []byte, account *Account, tokenType string, mimicClaudeCode bool) {
	line := buildClaudeMimicDebugLine(req, body, account, tokenType, mimicClaudeCode)
	if line == "" {
		return
	}
	log.Printf("[ClaudeMimicDebug] %s", line)
}

func isClaudeCodeCredentialScopeError(msg string) bool {
	m := strings.ToLower(strings.TrimSpace(msg))
	if m == "" {
		return false
	}
	return strings.Contains(m, "only authorized for use with claude code") &&
		strings.Contains(m, "cannot be used for other api requests")
}

// sseDataRe matches SSE data lines with optional whitespace after colon.
// Some upstream APIs return non-standard "data:" without space (should be "data: ").
var (
	sseDataRe            = regexp.MustCompile(`^data:\s*`)
	sessionIDRegex       = regexp.MustCompile(`session_([a-f0-9-]{36})`)
	claudeCliUserAgentRe = regexp.MustCompile(`^claude-cli/\d+\.\d+\.\d+`)
	toolPrefixRe         = regexp.MustCompile(`(?i)^(?:oc_|mcp_)`)
	toolNameBoundaryRe   = regexp.MustCompile(`[^a-zA-Z0-9]+`)
	toolNameCamelRe      = regexp.MustCompile(`([a-z0-9])([A-Z])`)
	toolNameFieldRe      = regexp.MustCompile(`"name"\s*:\s*"([^"]+)"`)
	modelFieldRe         = regexp.MustCompile(`"model"\s*:\s*"([^"]+)"`)
	toolDescAbsPathRe    = regexp.MustCompile(`/\/?(?:home|Users|tmp|var|opt|usr|etc)\/[^\s,\)"'\]]+`)
	toolDescWinPathRe    = regexp.MustCompile(`(?i)[A-Z]:\\[^\s,\)"'\]]+`)

	claudeToolNameOverrides = map[string]string{
		"bash":      "Bash",
		"read":      "Read",
		"edit":      "Edit",
		"write":     "Write",
		"task":      "Task",
		"glob":      "Glob",
		"grep":      "Grep",
		"webfetch":  "WebFetch",
		"websearch": "WebSearch",
		"todowrite": "TodoWrite",
		"question":  "AskUserQuestion",
	}
	openCodeToolOverrides = map[string]string{
		"Bash":            "bash",
		"Read":            "read",
		"Edit":            "edit",
		"Write":           "write",
		"Task":            "task",
		"Glob":            "glob",
		"Grep":            "grep",
		"WebFetch":        "webfetch",
		"WebSearch":       "websearch",
		"TodoWrite":       "todowrite",
		"AskUserQuestion": "question",
	}

	// claudeCodePromptPrefixes 用于检测 Claude Code 系统提示词的前缀列表
	// 支持多种变体：标准版、Agent SDK 版、Explore Agent 版、Compact 版等
	// 注意：前缀之间不应存在包含关系，否则会导致冗余匹配
	claudeCodePromptPrefixes = []string{
		"You are Claude Code, Anthropic's official CLI for Claude",             // 标准版 & Agent SDK 版（含 running within...）
		"You are a Claude agent, built on Anthropic's Claude Agent SDK",        // Agent SDK 变体
		"You are a file search specialist for Claude Code",                     // Explore Agent 版
		"You are a helpful AI assistant tasked with summarizing conversations", // Compact 版
	}

	anthropicPrefixMappings = []string{
		"claude-opus-4-5",
		"claude-haiku-4-5",
		"claude-sonnet-4-5",
	}
)

// ErrClaudeCodeOnly 表示分组仅允许 Claude Code 客户端访问
var ErrClaudeCodeOnly = errors.New("this group only allows Claude Code clients")

// ErrModelScopeNotSupported 表示请求的模型系列不在分组支持的范围内
var ErrModelScopeNotSupported = errors.New("model scope not supported by this group")

// allowedHeaders 白名单headers（参考CRS项目）
var allowedHeaders = map[string]bool{
	"accept":                                    true,
	"x-stainless-retry-count":                   true,
	"x-stainless-timeout":                       true,
	"x-stainless-lang":                          true,
	"x-stainless-package-version":               true,
	"x-stainless-os":                            true,
	"x-stainless-arch":                          true,
	"x-stainless-runtime":                       true,
	"x-stainless-runtime-version":               true,
	"x-stainless-helper-method":                 true,
	"anthropic-dangerous-direct-browser-access": true,
	"anthropic-version":                         true,
	"x-app":                                     true,
	"anthropic-beta":                            true,
	"accept-language":                           true,
	"sec-fetch-mode":                            true,
	"user-agent":                                true,
	"content-type":                              true,
}

// GatewayCache 定义网关服务的缓存操作接口。
// 提供粘性会话（Sticky Session）的存储、查询、刷新和删除功能。
//
// GatewayCache defines cache operations for gateway service.
// Provides sticky session storage, retrieval, refresh and deletion capabilities.
type GatewayCache interface {
	// GetSessionAccountID 获取粘性会话绑定的账号 ID
	// Get the account ID bound to a sticky session
	GetSessionAccountID(ctx context.Context, groupID int64, sessionHash string) (int64, error)
	// SetSessionAccountID 设置粘性会话与账号的绑定关系
	// Set the binding between sticky session and account
	SetSessionAccountID(ctx context.Context, groupID int64, sessionHash string, accountID int64, ttl time.Duration) error
	// RefreshSessionTTL 刷新粘性会话的过期时间
	// Refresh the expiration time of a sticky session
	RefreshSessionTTL(ctx context.Context, groupID int64, sessionHash string, ttl time.Duration) error
	// DeleteSessionAccountID 删除粘性会话绑定，用于账号不可用时主动清理
	// Delete sticky session binding, used to proactively clean up when account becomes unavailable
	DeleteSessionAccountID(ctx context.Context, groupID int64, sessionHash string) error
}

// derefGroupID safely dereferences *int64 to int64, returning 0 if nil
func derefGroupID(groupID *int64) int64 {
	if groupID == nil {
		return 0
	}
	return *groupID
}

// shouldClearStickySession 检查账号是否处于不可调度状态，需要清理粘性会话绑定。
// 当账号状态为错误、禁用、不可调度，或处于临时不可调度期间时，返回 true。
// 这确保后续请求不会继续使用不可用的账号。
//
// shouldClearStickySession checks if an account is in an unschedulable state
// and the sticky session binding should be cleared.
// Returns true when account status is error/disabled, schedulable is false,
// or within temporary unschedulable period.
// This ensures subsequent requests won't continue using unavailable accounts.
func shouldClearStickySession(account *Account) bool {
	if account == nil {
		return false
	}
	if account.Status == StatusError || account.Status == StatusDisabled || !account.Schedulable {
		return true
	}
	if account.TempUnschedulableUntil != nil && time.Now().Before(*account.TempUnschedulableUntil) {
		return true
	}
	return false
}

type AccountWaitPlan struct {
	AccountID      int64
	MaxConcurrency int
	Timeout        time.Duration
	MaxWaiting     int
}

type AccountSelectionResult struct {
	Account     *Account
	Acquired    bool
	ReleaseFunc func()
	WaitPlan    *AccountWaitPlan // nil means no wait allowed
}

// ClaudeUsage 表示Claude API返回的usage信息
type ClaudeUsage struct {
	InputTokens              int `json:"input_tokens"`
	OutputTokens             int `json:"output_tokens"`
	CacheCreationInputTokens int `json:"cache_creation_input_tokens"`
	CacheReadInputTokens     int `json:"cache_read_input_tokens"`
}

// ForwardResult 转发结果
type ForwardResult struct {
	RequestID        string
	Usage            ClaudeUsage
	Model            string
	Stream           bool
	Duration         time.Duration
	FirstTokenMs     *int // 首字时间（流式请求）
	ClientDisconnect bool // 客户端是否在流式传输过程中断开

	// 图片生成计费字段（仅 gemini-3-pro-image 使用）
	ImageCount int    // 生成的图片数量
	ImageSize  string // 图片尺寸 "1K", "2K", "4K"
}

// UpstreamFailoverError indicates an upstream error that should trigger account failover.
type UpstreamFailoverError struct {
	StatusCode int
}

func (e *UpstreamFailoverError) Error() string {
	return fmt.Sprintf("upstream error: %d (failover)", e.StatusCode)
}

// GatewayService handles API gateway operations
type GatewayService struct {
	accountRepo         AccountRepository
	groupRepo           GroupRepository
	usageLogRepo        UsageLogRepository
	userRepo            UserRepository
	userSubRepo         UserSubscriptionRepository
	cache               GatewayCache
	cfg                 *config.Config
	schedulerSnapshot   *SchedulerSnapshotService
	billingService      *BillingService
	rateLimitService    *RateLimitService
	billingCacheService *BillingCacheService
	identityService     *IdentityService
	httpUpstream        HTTPUpstream
	deferredService     *DeferredService
	concurrencyService  *ConcurrencyService
	claudeTokenProvider *ClaudeTokenProvider
	sessionLimitCache   SessionLimitCache // 会话数量限制缓存（仅 Anthropic OAuth/SetupToken）
}

// NewGatewayService creates a new GatewayService
func NewGatewayService(
	accountRepo AccountRepository,
	groupRepo GroupRepository,
	usageLogRepo UsageLogRepository,
	userRepo UserRepository,
	userSubRepo UserSubscriptionRepository,
	cache GatewayCache,
	cfg *config.Config,
	schedulerSnapshot *SchedulerSnapshotService,
	concurrencyService *ConcurrencyService,
	billingService *BillingService,
	rateLimitService *RateLimitService,
	billingCacheService *BillingCacheService,
	identityService *IdentityService,
	httpUpstream HTTPUpstream,
	deferredService *DeferredService,
	claudeTokenProvider *ClaudeTokenProvider,
	sessionLimitCache SessionLimitCache,
) *GatewayService {
	return &GatewayService{
		accountRepo:         accountRepo,
		groupRepo:           groupRepo,
		usageLogRepo:        usageLogRepo,
		userRepo:            userRepo,
		userSubRepo:         userSubRepo,
		cache:               cache,
		cfg:                 cfg,
		schedulerSnapshot:   schedulerSnapshot,
		concurrencyService:  concurrencyService,
		billingService:      billingService,
		rateLimitService:    rateLimitService,
		billingCacheService: billingCacheService,
		identityService:     identityService,
		httpUpstream:        httpUpstream,
		deferredService:     deferredService,
		claudeTokenProvider: claudeTokenProvider,
		sessionLimitCache:   sessionLimitCache,
	}
}

// GenerateSessionHash 从预解析请求计算粘性会话 hash
func (s *GatewayService) GenerateSessionHash(parsed *ParsedRequest) string {
	if parsed == nil {
		return ""
	}

	// 1. 最高优先级：从 metadata.user_id 提取 session_xxx
	if parsed.MetadataUserID != "" {
		if match := sessionIDRegex.FindStringSubmatch(parsed.MetadataUserID); len(match) > 1 {
			return match[1]
		}
	}

	// 2. 提取带 cache_control: {type: "ephemeral"} 的内容
	cacheableContent := s.extractCacheableContent(parsed)
	if cacheableContent != "" {
		return s.hashContent(cacheableContent)
	}

	// 3. Fallback: 使用 system 内容
	if parsed.System != nil {
		systemText := s.extractTextFromSystem(parsed.System)
		if systemText != "" {
			return s.hashContent(systemText)
		}
	}

	// 4. 最后 fallback: 使用第一条消息
	if len(parsed.Messages) > 0 {
		if firstMsg, ok := parsed.Messages[0].(map[string]any); ok {
			msgText := s.extractTextFromContent(firstMsg["content"])
			if msgText != "" {
				return s.hashContent(msgText)
			}
		}
	}

	return ""
}

// BindStickySession sets session -> account binding with standard TTL.
func (s *GatewayService) BindStickySession(ctx context.Context, groupID *int64, sessionHash string, accountID int64) error {
	if sessionHash == "" || accountID <= 0 || s.cache == nil {
		return nil
	}
	return s.cache.SetSessionAccountID(ctx, derefGroupID(groupID), sessionHash, accountID, stickySessionTTL)
}

// GetCachedSessionAccountID retrieves the account ID bound to a sticky session.
// Returns 0 if no binding exists or on error.
func (s *GatewayService) GetCachedSessionAccountID(ctx context.Context, groupID *int64, sessionHash string) (int64, error) {
	if sessionHash == "" || s.cache == nil {
		return 0, nil
	}
	accountID, err := s.cache.GetSessionAccountID(ctx, derefGroupID(groupID), sessionHash)
	if err != nil {
		return 0, err
	}
	return accountID, nil
}

func (s *GatewayService) extractCacheableContent(parsed *ParsedRequest) string {
	if parsed == nil {
		return ""
	}

	var builder strings.Builder

	// 检查 system 中的 cacheable 内容
	if system, ok := parsed.System.([]any); ok {
		for _, part := range system {
			if partMap, ok := part.(map[string]any); ok {
				if cc, ok := partMap["cache_control"].(map[string]any); ok {
					if cc["type"] == "ephemeral" {
						if text, ok := partMap["text"].(string); ok {
							_, _ = builder.WriteString(text)
						}
					}
				}
			}
		}
	}
	systemText := builder.String()

	// 检查 messages 中的 cacheable 内容
	for _, msg := range parsed.Messages {
		if msgMap, ok := msg.(map[string]any); ok {
			if msgContent, ok := msgMap["content"].([]any); ok {
				for _, part := range msgContent {
					if partMap, ok := part.(map[string]any); ok {
						if cc, ok := partMap["cache_control"].(map[string]any); ok {
							if cc["type"] == "ephemeral" {
								return s.extractTextFromContent(msgMap["content"])
							}
						}
					}
				}
			}
		}
	}

	return systemText
}

func (s *GatewayService) extractTextFromSystem(system any) string {
	switch v := system.(type) {
	case string:
		return v
	case []any:
		var texts []string
		for _, part := range v {
			if partMap, ok := part.(map[string]any); ok {
				if text, ok := partMap["text"].(string); ok {
					texts = append(texts, text)
				}
			}
		}
		return strings.Join(texts, "")
	}
	return ""
}

func (s *GatewayService) extractTextFromContent(content any) string {
	switch v := content.(type) {
	case string:
		return v
	case []any:
		var texts []string
		for _, part := range v {
			if partMap, ok := part.(map[string]any); ok {
				if partMap["type"] == "text" {
					if text, ok := partMap["text"].(string); ok {
						texts = append(texts, text)
					}
				}
			}
		}
		return strings.Join(texts, "")
	}
	return ""
}

func (s *GatewayService) hashContent(content string) string {
	hash := sha256.Sum256([]byte(content))
	return hex.EncodeToString(hash[:16]) // 32字符
}

// replaceModelInBody 替换请求体中的model字段
func (s *GatewayService) replaceModelInBody(body []byte, newModel string) []byte {
	var req map[string]any
	if err := json.Unmarshal(body, &req); err != nil {
		return body
	}
	req["model"] = newModel
	newBody, err := json.Marshal(req)
	if err != nil {
		return body
	}
	return newBody
}

type claudeOAuthNormalizeOptions struct {
	injectMetadata          bool
	metadataUserID          string
	stripSystemCacheControl bool
}

func stripToolPrefix(value string) string {
	if value == "" {
		return value
	}
	return toolPrefixRe.ReplaceAllString(value, "")
}

func toPascalCase(value string) string {
	if value == "" {
		return value
	}
	normalized := toolNameBoundaryRe.ReplaceAllString(value, " ")
	tokens := make([]string, 0)
	for _, token := range strings.Fields(normalized) {
		expanded := toolNameCamelRe.ReplaceAllString(token, "$1 $2")
		parts := strings.Fields(expanded)
		if len(parts) > 0 {
			tokens = append(tokens, parts...)
		}
	}
	if len(tokens) == 0 {
		return value
	}
	var builder strings.Builder
	for _, token := range tokens {
		lower := strings.ToLower(token)
		if lower == "" {
			continue
		}
		runes := []rune(lower)
		runes[0] = unicode.ToUpper(runes[0])
		_, _ = builder.WriteString(string(runes))
	}
	return builder.String()
}

func toSnakeCase(value string) string {
	if value == "" {
		return value
	}
	output := toolNameCamelRe.ReplaceAllString(value, "$1_$2")
	output = toolNameBoundaryRe.ReplaceAllString(output, "_")
	output = strings.Trim(output, "_")
	return strings.ToLower(output)
}

func normalizeToolNameForClaude(name string, cache map[string]string) string {
	if name == "" {
		return name
	}
	stripped := stripToolPrefix(name)
	mapped, ok := claudeToolNameOverrides[strings.ToLower(stripped)]
	if !ok {
		mapped = toPascalCase(stripped)
	}
	if mapped != "" && cache != nil && mapped != stripped {
		cache[mapped] = stripped
	}
	if mapped == "" {
		return stripped
	}
	return mapped
}

func normalizeToolNameForOpenCode(name string, cache map[string]string) string {
	if name == "" {
		return name
	}
	stripped := stripToolPrefix(name)
	if cache != nil {
		if mapped, ok := cache[stripped]; ok {
			return mapped
		}
	}
	if mapped, ok := openCodeToolOverrides[stripped]; ok {
		return mapped
	}
	return toSnakeCase(stripped)
}

func normalizeParamNameForOpenCode(name string, cache map[string]string) string {
	if name == "" {
		return name
	}
	if cache != nil {
		if mapped, ok := cache[name]; ok {
			return mapped
		}
	}
	return name
}

// sanitizeSystemText rewrites only the fixed OpenCode identity sentence (if present).
// We intentionally avoid broad keyword replacement in system prompts to prevent
// accidentally changing user-provided instructions.
func sanitizeSystemText(text string) string {
	if text == "" {
		return text
	}
	// Some clients include a fixed OpenCode identity sentence. Anthropic may treat
	// this as a non-Claude-Code fingerprint, so rewrite it to the canonical
	// Claude Code banner before generic "OpenCode"/"opencode" replacements.
	text = strings.ReplaceAll(
		text,
		"You are OpenCode, the best coding agent on the planet.",
		strings.TrimSpace(claudeCodeSystemPrompt),
	)
	return text
}

func sanitizeToolDescription(description string) string {
	if description == "" {
		return description
	}
	description = toolDescAbsPathRe.ReplaceAllString(description, "[path]")
	description = toolDescWinPathRe.ReplaceAllString(description, "[path]")
	// Intentionally do NOT rewrite tool descriptions (OpenCode/Claude strings).
	// Tool names/skill names may rely on exact wording, and rewriting can be misleading.
	return description
}

func normalizeToolInputSchema(inputSchema any, cache map[string]string) {
	schema, ok := inputSchema.(map[string]any)
	if !ok {
		return
	}
	properties, ok := schema["properties"].(map[string]any)
	if !ok {
		return
	}

	newProperties := make(map[string]any, len(properties))
	for key, value := range properties {
		snakeKey := toSnakeCase(key)
		newProperties[snakeKey] = value
		if snakeKey != key && cache != nil {
			cache[snakeKey] = key
		}
	}
	schema["properties"] = newProperties

	if required, ok := schema["required"].([]any); ok {
		newRequired := make([]any, 0, len(required))
		for _, item := range required {
			name, ok := item.(string)
			if !ok {
				newRequired = append(newRequired, item)
				continue
			}
			snakeName := toSnakeCase(name)
			newRequired = append(newRequired, snakeName)
			if snakeName != name && cache != nil {
				cache[snakeName] = name
			}
		}
		schema["required"] = newRequired
	}
}

func stripCacheControlFromSystemBlocks(system any) bool {
	blocks, ok := system.([]any)
	if !ok {
		return false
	}
	changed := false
	for _, item := range blocks {
		block, ok := item.(map[string]any)
		if !ok {
			continue
		}
		if _, exists := block["cache_control"]; !exists {
			continue
		}
		delete(block, "cache_control")
		changed = true
	}
	return changed
}

func normalizeClaudeOAuthRequestBody(body []byte, modelID string, opts claudeOAuthNormalizeOptions) ([]byte, string, map[string]string) {
	if len(body) == 0 {
		return body, modelID, nil
	}
	var req map[string]any
	if err := json.Unmarshal(body, &req); err != nil {
		return body, modelID, nil
	}

	toolNameMap := make(map[string]string)

	if system, ok := req["system"]; ok {
		switch v := system.(type) {
		case string:
			sanitized := sanitizeSystemText(v)
			if sanitized != v {
				req["system"] = sanitized
			}
		case []any:
			for _, item := range v {
				block, ok := item.(map[string]any)
				if !ok {
					continue
				}
				if blockType, _ := block["type"].(string); blockType != "text" {
					continue
				}
				text, ok := block["text"].(string)
				if !ok || text == "" {
					continue
				}
				sanitized := sanitizeSystemText(text)
				if sanitized != text {
					block["text"] = sanitized
				}
			}
		}
	}

	if rawModel, ok := req["model"].(string); ok {
		normalized := claude.NormalizeModelID(rawModel)
		if normalized != rawModel {
			req["model"] = normalized
			modelID = normalized
		}
	}

	if rawTools, exists := req["tools"]; exists {
		switch tools := rawTools.(type) {
		case []any:
			for idx, tool := range tools {
				toolMap, ok := tool.(map[string]any)
				if !ok {
					continue
				}
				if name, ok := toolMap["name"].(string); ok {
					normalized := normalizeToolNameForClaude(name, toolNameMap)
					if normalized != "" && normalized != name {
						toolMap["name"] = normalized
					}
				}
				if desc, ok := toolMap["description"].(string); ok {
					sanitized := sanitizeToolDescription(desc)
					if sanitized != desc {
						toolMap["description"] = sanitized
					}
				}
				if schema, ok := toolMap["input_schema"]; ok {
					normalizeToolInputSchema(schema, toolNameMap)
				}
				tools[idx] = toolMap
			}
			req["tools"] = tools
		case map[string]any:
			normalizedTools := make(map[string]any, len(tools))
			for name, value := range tools {
				normalized := normalizeToolNameForClaude(name, toolNameMap)
				if normalized == "" {
					normalized = name
				}
				if toolMap, ok := value.(map[string]any); ok {
					toolMap["name"] = normalized
					if desc, ok := toolMap["description"].(string); ok {
						sanitized := sanitizeToolDescription(desc)
						if sanitized != desc {
							toolMap["description"] = sanitized
						}
					}
					if schema, ok := toolMap["input_schema"]; ok {
						normalizeToolInputSchema(schema, toolNameMap)
					}
					normalizedTools[normalized] = toolMap
					continue
				}
				normalizedTools[normalized] = value
			}
			req["tools"] = normalizedTools
		}
	} else {
		req["tools"] = []any{}
	}

	if messages, ok := req["messages"].([]any); ok {
		for _, msg := range messages {
			msgMap, ok := msg.(map[string]any)
			if !ok {
				continue
			}
			content, ok := msgMap["content"].([]any)
			if !ok {
				continue
			}
			for _, block := range content {
				blockMap, ok := block.(map[string]any)
				if !ok {
					continue
				}
				if blockType, _ := blockMap["type"].(string); blockType != "tool_use" {
					continue
				}
				if name, ok := blockMap["name"].(string); ok {
					normalized := normalizeToolNameForClaude(name, toolNameMap)
					if normalized != "" && normalized != name {
						blockMap["name"] = normalized
					}
				}
			}
		}
	}

	if opts.stripSystemCacheControl {
		if system, ok := req["system"]; ok {
			_ = stripCacheControlFromSystemBlocks(system)
		}
	}

	if opts.injectMetadata && opts.metadataUserID != "" {
		metadata, ok := req["metadata"].(map[string]any)
		if !ok {
			metadata = map[string]any{}
			req["metadata"] = metadata
		}
		if existing, ok := metadata["user_id"].(string); !ok || existing == "" {
			metadata["user_id"] = opts.metadataUserID
		}
	}

	delete(req, "temperature")
	delete(req, "tool_choice")

	newBody, err := json.Marshal(req)
	if err != nil {
		return body, modelID, toolNameMap
	}
	return newBody, modelID, toolNameMap
}

func (s *GatewayService) buildOAuthMetadataUserID(parsed *ParsedRequest, account *Account, fp *Fingerprint) string {
	if parsed == nil || account == nil {
		return ""
	}
	if parsed.MetadataUserID != "" {
		return ""
	}

	userID := strings.TrimSpace(account.GetClaudeUserID())
	if userID == "" && fp != nil {
		userID = fp.ClientID
	}
	if userID == "" {
		// Fall back to a random, well-formed client id so we can still satisfy
		// Claude Code OAuth requirements when account metadata is incomplete.
		userID = generateClientID()
	}

	sessionHash := s.GenerateSessionHash(parsed)
	sessionID := uuid.NewString()
	if sessionHash != "" {
		seed := fmt.Sprintf("%d::%s", account.ID, sessionHash)
		sessionID = generateSessionUUID(seed)
	}

	// Prefer the newer format that includes account_uuid (if present),
	// otherwise fall back to the legacy Claude Code format.
	accountUUID := strings.TrimSpace(account.GetExtraString("account_uuid"))
	if accountUUID != "" {
		return fmt.Sprintf("user_%s_account_%s_session_%s", userID, accountUUID, sessionID)
	}
	return fmt.Sprintf("user_%s_account__session_%s", userID, sessionID)
}

func generateSessionUUID(seed string) string {
	if seed == "" {
		return uuid.NewString()
	}
	hash := sha256.Sum256([]byte(seed))
	bytes := hash[:16]
	bytes[6] = (bytes[6] & 0x0f) | 0x40
	bytes[8] = (bytes[8] & 0x3f) | 0x80
	return fmt.Sprintf("%x-%x-%x-%x-%x",
		bytes[0:4], bytes[4:6], bytes[6:8], bytes[8:10], bytes[10:16])
}

// SelectAccount 选择账号（粘性会话+优先级）
func (s *GatewayService) SelectAccount(ctx context.Context, groupID *int64, sessionHash string) (*Account, error) {
	return s.SelectAccountForModel(ctx, groupID, sessionHash, "")
}

// SelectAccountForModel 选择支持指定模型的账号（粘性会话+优先级+模型映射）
func (s *GatewayService) SelectAccountForModel(ctx context.Context, groupID *int64, sessionHash string, requestedModel string) (*Account, error) {
	return s.SelectAccountForModelWithExclusions(ctx, groupID, sessionHash, requestedModel, nil)
}

// SelectAccountForModelWithExclusions selects an account supporting the requested model while excluding specified accounts.
func (s *GatewayService) SelectAccountForModelWithExclusions(ctx context.Context, groupID *int64, sessionHash string, requestedModel string, excludedIDs map[int64]struct{}) (*Account, error) {
	// 优先检查 context 中的强制平台（/antigravity 路由）
	var platform string
	forcePlatform, hasForcePlatform := ctx.Value(ctxkey.ForcePlatform).(string)
	if hasForcePlatform && forcePlatform != "" {
		platform = forcePlatform
	} else if groupID != nil {
		group, resolvedGroupID, err := s.resolveGatewayGroup(ctx, groupID)
		if err != nil {
			return nil, err
		}
		groupID = resolvedGroupID
		ctx = s.withGroupContext(ctx, group)
		platform = group.Platform
	} else {
		// 无分组时只使用原生 anthropic 平台
		platform = PlatformAnthropic
	}

	// anthropic/gemini 分组支持混合调度（包含启用了 mixed_scheduling 的 antigravity 账户）
	// 注意：强制平台模式不走混合调度
	if (platform == PlatformAnthropic || platform == PlatformGemini) && !hasForcePlatform {
		return s.selectAccountWithMixedScheduling(ctx, groupID, sessionHash, requestedModel, excludedIDs, platform)
	}

	// antigravity 分组、强制平台模式或无分组使用单平台选择
	// 注意：强制平台模式也必须遵守分组限制，不再回退到全平台查询
	return s.selectAccountForModelWithPlatform(ctx, groupID, sessionHash, requestedModel, excludedIDs, platform)
}

// SelectAccountWithLoadAwareness selects account with load-awareness and wait plan.
// metadataUserID: 已废弃参数，会话限制现在统一使用 sessionHash
func (s *GatewayService) SelectAccountWithLoadAwareness(ctx context.Context, groupID *int64, sessionHash string, requestedModel string, excludedIDs map[int64]struct{}, metadataUserID string) (*AccountSelectionResult, error) {
	// 调试日志：记录调度入口参数
	excludedIDsList := make([]int64, 0, len(excludedIDs))
	for id := range excludedIDs {
		excludedIDsList = append(excludedIDsList, id)
	}
	slog.Debug("account_scheduling_starting",
		"group_id", derefGroupID(groupID),
		"model", requestedModel,
		"session", shortSessionHash(sessionHash),
		"excluded_ids", excludedIDsList)

	cfg := s.schedulingConfig()

	var stickyAccountID int64
	if sessionHash != "" && s.cache != nil {
		if accountID, err := s.cache.GetSessionAccountID(ctx, derefGroupID(groupID), sessionHash); err == nil {
			stickyAccountID = accountID
		}
	}

	// 检查 Claude Code 客户端限制（可能会替换 groupID 为降级分组）
	group, groupID, err := s.checkClaudeCodeRestriction(ctx, groupID)
	if err != nil {
		return nil, err
	}
	ctx = s.withGroupContext(ctx, group)

	if s.debugModelRoutingEnabled() && requestedModel != "" {
		groupPlatform := ""
		if group != nil {
			groupPlatform = group.Platform
		}
		log.Printf("[ModelRoutingDebug] select entry: group_id=%v group_platform=%s model=%s session=%s sticky_account=%d load_batch=%v concurrency=%v",
			derefGroupID(groupID), groupPlatform, requestedModel, shortSessionHash(sessionHash), stickyAccountID, cfg.LoadBatchEnabled, s.concurrencyService != nil)
	}

	if s.concurrencyService == nil || !cfg.LoadBatchEnabled {
		// 复制排除列表，用于会话限制拒绝时的重试
		localExcluded := make(map[int64]struct{})
		for k, v := range excludedIDs {
			localExcluded[k] = v
		}

		for {
			account, err := s.SelectAccountForModelWithExclusions(ctx, groupID, sessionHash, requestedModel, localExcluded)
			if err != nil {
				return nil, err
			}

			result, err := s.tryAcquireAccountSlot(ctx, account.ID, account.Concurrency)
			if err == nil && result.Acquired {
				// 获取槽位后检查会话限制（使用 sessionHash 作为会话标识符）
				if !s.checkAndRegisterSession(ctx, account, sessionHash) {
					result.ReleaseFunc()                   // 释放槽位
					localExcluded[account.ID] = struct{}{} // 排除此账号
					continue                               // 重新选择
				}
				return &AccountSelectionResult{
					Account:     account,
					Acquired:    true,
					ReleaseFunc: result.ReleaseFunc,
				}, nil
			}

			// 对于等待计划的情况，也需要先检查会话限制
			if !s.checkAndRegisterSession(ctx, account, sessionHash) {
				localExcluded[account.ID] = struct{}{}
				continue
			}

			if stickyAccountID > 0 && stickyAccountID == account.ID && s.concurrencyService != nil {
				waitingCount, _ := s.concurrencyService.GetAccountWaitingCount(ctx, account.ID)
				if waitingCount < cfg.StickySessionMaxWaiting {
					return &AccountSelectionResult{
						Account: account,
						WaitPlan: &AccountWaitPlan{
							AccountID:      account.ID,
							MaxConcurrency: account.Concurrency,
							Timeout:        cfg.StickySessionWaitTimeout,
							MaxWaiting:     cfg.StickySessionMaxWaiting,
						},
					}, nil
				}
			}
			return &AccountSelectionResult{
				Account: account,
				WaitPlan: &AccountWaitPlan{
					AccountID:      account.ID,
					MaxConcurrency: account.Concurrency,
					Timeout:        cfg.FallbackWaitTimeout,
					MaxWaiting:     cfg.FallbackMaxWaiting,
				},
			}, nil
		}
	}

	platform, hasForcePlatform, err := s.resolvePlatform(ctx, groupID, group)
	if err != nil {
		return nil, err
	}
	preferOAuth := platform == PlatformGemini
	if s.debugModelRoutingEnabled() && platform == PlatformAnthropic && requestedModel != "" {
		log.Printf("[ModelRoutingDebug] load-aware enabled: group_id=%v model=%s session=%s platform=%s", derefGroupID(groupID), requestedModel, shortSessionHash(sessionHash), platform)
	}

	// Antigravity 模型系列检查（在账号选择前检查，确保所有代码路径都经过此检查）
	if platform == PlatformAntigravity && groupID != nil && requestedModel != "" {
		if err := s.checkAntigravityModelScope(ctx, *groupID, requestedModel); err != nil {
			return nil, err
		}
	}

	accounts, useMixed, err := s.listSchedulableAccounts(ctx, groupID, platform, hasForcePlatform)
	if err != nil {
		return nil, err
	}
	if len(accounts) == 0 {
		return nil, errors.New("no available accounts")
	}

	isExcluded := func(accountID int64) bool {
		if excludedIDs == nil {
			return false
		}
		_, excluded := excludedIDs[accountID]
		return excluded
	}

	// 提前构建 accountByID（供 Layer 1 和 Layer 1.5 使用）
	accountByID := make(map[int64]*Account, len(accounts))
	for i := range accounts {
		accountByID[accounts[i].ID] = &accounts[i]
	}

	// 获取模型路由配置（仅 anthropic 平台）
	var routingAccountIDs []int64
	if group != nil && requestedModel != "" && group.Platform == PlatformAnthropic {
		routingAccountIDs = group.GetRoutingAccountIDs(requestedModel)
		if s.debugModelRoutingEnabled() {
			log.Printf("[ModelRoutingDebug] context group routing: group_id=%d model=%s enabled=%v rules=%d matched_ids=%v session=%s sticky_account=%d",
				group.ID, requestedModel, group.ModelRoutingEnabled, len(group.ModelRouting), routingAccountIDs, shortSessionHash(sessionHash), stickyAccountID)
			if len(routingAccountIDs) == 0 && group.ModelRoutingEnabled && len(group.ModelRouting) > 0 {
				keys := make([]string, 0, len(group.ModelRouting))
				for k := range group.ModelRouting {
					keys = append(keys, k)
				}
				sort.Strings(keys)
				const maxKeys = 20
				if len(keys) > maxKeys {
					keys = keys[:maxKeys]
				}
				log.Printf("[ModelRoutingDebug] context group routing miss: group_id=%d model=%s patterns(sample)=%v", group.ID, requestedModel, keys)
			}
		}
	}

	// ============ Layer 1: 模型路由优先选择（优先级高于粘性会话） ============
	if len(routingAccountIDs) > 0 && s.concurrencyService != nil {
		// 1. 过滤出路由列表中可调度的账号
		var routingCandidates []*Account
		var filteredExcluded, filteredMissing, filteredUnsched, filteredPlatform, filteredModelScope, filteredModelMapping, filteredWindowCost int
		for _, routingAccountID := range routingAccountIDs {
			if isExcluded(routingAccountID) {
				filteredExcluded++
				continue
			}
			account, ok := accountByID[routingAccountID]
			if !ok || !account.IsSchedulable() {
				if !ok {
					filteredMissing++
				} else {
					filteredUnsched++
				}
				continue
			}
			if !s.isAccountAllowedForPlatform(account, platform, useMixed) {
				filteredPlatform++
				continue
			}
			if !account.IsSchedulableForModel(requestedModel) {
				filteredModelScope++
				continue
			}
			if requestedModel != "" && !s.isModelSupportedByAccount(account, requestedModel) {
				filteredModelMapping++
				continue
			}
			// 窗口费用检查（非粘性会话路径）
			if !s.isAccountSchedulableForWindowCost(ctx, account, false) {
				filteredWindowCost++
				continue
			}
			routingCandidates = append(routingCandidates, account)
		}

		if s.debugModelRoutingEnabled() {
			log.Printf("[ModelRoutingDebug] routed candidates: group_id=%v model=%s routed=%d candidates=%d filtered(excluded=%d missing=%d unsched=%d platform=%d model_scope=%d model_mapping=%d window_cost=%d)",
				derefGroupID(groupID), requestedModel, len(routingAccountIDs), len(routingCandidates),
				filteredExcluded, filteredMissing, filteredUnsched, filteredPlatform, filteredModelScope, filteredModelMapping, filteredWindowCost)
		}

		if len(routingCandidates) > 0 {
			// 1.5. 在路由账号范围内检查粘性会话
			if sessionHash != "" && s.cache != nil {
				stickyAccountID, err := s.cache.GetSessionAccountID(ctx, derefGroupID(groupID), sessionHash)
				if err == nil && stickyAccountID > 0 && containsInt64(routingAccountIDs, stickyAccountID) && !isExcluded(stickyAccountID) {
					// 粘性账号在路由列表中，优先使用
					if stickyAccount, ok := accountByID[stickyAccountID]; ok {
						if stickyAccount.IsSchedulable() &&
							s.isAccountAllowedForPlatform(stickyAccount, platform, useMixed) &&
							stickyAccount.IsSchedulableForModel(requestedModel) &&
							(requestedModel == "" || s.isModelSupportedByAccount(stickyAccount, requestedModel)) &&
							s.isAccountSchedulableForWindowCost(ctx, stickyAccount, true) { // 粘性会话窗口费用检查
							result, err := s.tryAcquireAccountSlot(ctx, stickyAccountID, stickyAccount.Concurrency)
							if err == nil && result.Acquired {
								// 会话数量限制检查
								if !s.checkAndRegisterSession(ctx, stickyAccount, sessionHash) {
									result.ReleaseFunc() // 释放槽位
									// 继续到负载感知选择
								} else {
									_ = s.cache.RefreshSessionTTL(ctx, derefGroupID(groupID), sessionHash, stickySessionTTL)
									if s.debugModelRoutingEnabled() {
										log.Printf("[ModelRoutingDebug] routed sticky hit: group_id=%v model=%s session=%s account=%d", derefGroupID(groupID), requestedModel, shortSessionHash(sessionHash), stickyAccountID)
									}
									return &AccountSelectionResult{
										Account:     stickyAccount,
										Acquired:    true,
										ReleaseFunc: result.ReleaseFunc,
									}, nil
								}
							}

							waitingCount, _ := s.concurrencyService.GetAccountWaitingCount(ctx, stickyAccountID)
							if waitingCount < cfg.StickySessionMaxWaiting {
								// 会话数量限制检查（等待计划也需要占用会话配额）
								if !s.checkAndRegisterSession(ctx, stickyAccount, sessionHash) {
									// 会话限制已满，继续到负载感知选择
								} else {
									return &AccountSelectionResult{
										Account: stickyAccount,
										WaitPlan: &AccountWaitPlan{
											AccountID:      stickyAccountID,
											MaxConcurrency: stickyAccount.Concurrency,
											Timeout:        cfg.StickySessionWaitTimeout,
											MaxWaiting:     cfg.StickySessionMaxWaiting,
										},
									}, nil
								}
							}
							// 粘性账号槽位满且等待队列已满，继续使用负载感知选择
						}
					} else {
						_ = s.cache.DeleteSessionAccountID(ctx, derefGroupID(groupID), sessionHash)
					}
				}
			}

			// 2. 批量获取负载信息
			routingLoads := make([]AccountWithConcurrency, 0, len(routingCandidates))
			for _, acc := range routingCandidates {
				routingLoads = append(routingLoads, AccountWithConcurrency{
					ID:             acc.ID,
					MaxConcurrency: acc.Concurrency,
				})
			}
			routingLoadMap, _ := s.concurrencyService.GetAccountsLoadBatch(ctx, routingLoads)

			// 3. 按负载感知排序
			type accountWithLoad struct {
				account  *Account
				loadInfo *AccountLoadInfo
			}
			var routingAvailable []accountWithLoad
			for _, acc := range routingCandidates {
				loadInfo := routingLoadMap[acc.ID]
				if loadInfo == nil {
					loadInfo = &AccountLoadInfo{AccountID: acc.ID}
				}
				if loadInfo.LoadRate < 100 {
					routingAvailable = append(routingAvailable, accountWithLoad{account: acc, loadInfo: loadInfo})
				}
			}

			if len(routingAvailable) > 0 {
				// 排序：优先级 > 负载率 > 最后使用时间
				sort.SliceStable(routingAvailable, func(i, j int) bool {
					a, b := routingAvailable[i], routingAvailable[j]
					if a.account.Priority != b.account.Priority {
						return a.account.Priority < b.account.Priority
					}
					if a.loadInfo.LoadRate != b.loadInfo.LoadRate {
						return a.loadInfo.LoadRate < b.loadInfo.LoadRate
					}
					switch {
					case a.account.LastUsedAt == nil && b.account.LastUsedAt != nil:
						return true
					case a.account.LastUsedAt != nil && b.account.LastUsedAt == nil:
						return false
					case a.account.LastUsedAt == nil && b.account.LastUsedAt == nil:
						return false
					default:
						return a.account.LastUsedAt.Before(*b.account.LastUsedAt)
					}
				})

				// 4. 尝试获取槽位
				for _, item := range routingAvailable {
					result, err := s.tryAcquireAccountSlot(ctx, item.account.ID, item.account.Concurrency)
					if err == nil && result.Acquired {
						// 会话数量限制检查
						if !s.checkAndRegisterSession(ctx, item.account, sessionHash) {
							result.ReleaseFunc() // 释放槽位，继续尝试下一个账号
							continue
						}
						if sessionHash != "" && s.cache != nil {
							_ = s.cache.SetSessionAccountID(ctx, derefGroupID(groupID), sessionHash, item.account.ID, stickySessionTTL)
						}
						if s.debugModelRoutingEnabled() {
							log.Printf("[ModelRoutingDebug] routed select: group_id=%v model=%s session=%s account=%d", derefGroupID(groupID), requestedModel, shortSessionHash(sessionHash), item.account.ID)
						}
						return &AccountSelectionResult{
							Account:     item.account,
							Acquired:    true,
							ReleaseFunc: result.ReleaseFunc,
						}, nil
					}
				}

				// 5. 所有路由账号槽位满，尝试返回等待计划（选择负载最低的）
				// 遍历找到第一个满足会话限制的账号
				for _, item := range routingAvailable {
					if !s.checkAndRegisterSession(ctx, item.account, sessionHash) {
						continue // 会话限制已满，尝试下一个
					}
					if s.debugModelRoutingEnabled() {
						log.Printf("[ModelRoutingDebug] routed wait: group_id=%v model=%s session=%s account=%d", derefGroupID(groupID), requestedModel, shortSessionHash(sessionHash), item.account.ID)
					}
					return &AccountSelectionResult{
						Account: item.account,
						WaitPlan: &AccountWaitPlan{
							AccountID:      item.account.ID,
							MaxConcurrency: item.account.Concurrency,
							Timeout:        cfg.StickySessionWaitTimeout,
							MaxWaiting:     cfg.StickySessionMaxWaiting,
						},
					}, nil
				}
				// 所有路由账号会话限制都已满，继续到 Layer 2 回退
			}
			// 路由列表中的账号都不可用（负载率 >= 100），继续到 Layer 2 回退
			log.Printf("[ModelRouting] All routed accounts unavailable for model=%s, falling back to normal selection", requestedModel)
		}
	}

	// ============ Layer 1.5: 粘性会话（仅在无模型路由配置时生效） ============
	if len(routingAccountIDs) == 0 && sessionHash != "" && s.cache != nil {
		accountID, err := s.cache.GetSessionAccountID(ctx, derefGroupID(groupID), sessionHash)
		if err == nil && accountID > 0 && !isExcluded(accountID) {
			account, ok := accountByID[accountID]
			if ok {
				// 检查账户是否需要清理粘性会话绑定
				// Check if the account needs sticky session cleanup
				clearSticky := shouldClearStickySession(account)
				if clearSticky {
					_ = s.cache.DeleteSessionAccountID(ctx, derefGroupID(groupID), sessionHash)
				}
				if !clearSticky && s.isAccountInGroup(account, groupID) &&
					s.isAccountAllowedForPlatform(account, platform, useMixed) &&
					account.IsSchedulableForModel(requestedModel) &&
					(requestedModel == "" || s.isModelSupportedByAccount(account, requestedModel)) &&
					s.isAccountSchedulableForWindowCost(ctx, account, true) { // 粘性会话窗口费用检查
					result, err := s.tryAcquireAccountSlot(ctx, accountID, account.Concurrency)
					if err == nil && result.Acquired {
						// 会话数量限制检查
						// Session count limit check
						if !s.checkAndRegisterSession(ctx, account, sessionHash) {
							result.ReleaseFunc() // 释放槽位，继续到 Layer 2
						} else {
							_ = s.cache.RefreshSessionTTL(ctx, derefGroupID(groupID), sessionHash, stickySessionTTL)
							return &AccountSelectionResult{
								Account:     account,
								Acquired:    true,
								ReleaseFunc: result.ReleaseFunc,
							}, nil
						}
					}

					waitingCount, _ := s.concurrencyService.GetAccountWaitingCount(ctx, accountID)
					if waitingCount < cfg.StickySessionMaxWaiting {
						// 会话数量限制检查（等待计划也需要占用会话配额）
						// Session count limit check (wait plan also requires session quota)
						if !s.checkAndRegisterSession(ctx, account, sessionHash) {
							// 会话限制已满，继续到 Layer 2
							// Session limit full, continue to Layer 2
						} else {
							return &AccountSelectionResult{
								Account: account,
								WaitPlan: &AccountWaitPlan{
									AccountID:      accountID,
									MaxConcurrency: account.Concurrency,
									Timeout:        cfg.StickySessionWaitTimeout,
									MaxWaiting:     cfg.StickySessionMaxWaiting,
								},
							}, nil
						}
					}
				}
			}
		}
	}

	// ============ Layer 2: 负载感知选择 ============
	candidates := make([]*Account, 0, len(accounts))
	for i := range accounts {
		acc := &accounts[i]
		if isExcluded(acc.ID) {
			continue
		}
		// Scheduler snapshots can be temporarily stale (bucket rebuild is throttled);
		// re-check schedulability here so recently rate-limited/overloaded accounts
		// are not selected again before the bucket is rebuilt.
		if !acc.IsSchedulable() {
			continue
		}
		if !s.isAccountAllowedForPlatform(acc, platform, useMixed) {
			continue
		}
		if !acc.IsSchedulableForModel(requestedModel) {
			continue
		}
		if requestedModel != "" && !s.isModelSupportedByAccount(acc, requestedModel) {
			continue
		}
		// 窗口费用检查（非粘性会话路径）
		if !s.isAccountSchedulableForWindowCost(ctx, acc, false) {
			continue
		}
		candidates = append(candidates, acc)
	}

	if len(candidates) == 0 {
		return nil, errors.New("no available accounts")
	}

	accountLoads := make([]AccountWithConcurrency, 0, len(candidates))
	for _, acc := range candidates {
		accountLoads = append(accountLoads, AccountWithConcurrency{
			ID:             acc.ID,
			MaxConcurrency: acc.Concurrency,
		})
	}

	loadMap, err := s.concurrencyService.GetAccountsLoadBatch(ctx, accountLoads)
	if err != nil {
		if result, ok := s.tryAcquireByLegacyOrder(ctx, candidates, groupID, sessionHash, preferOAuth); ok {
			return result, nil
		}
	} else {
		type accountWithLoad struct {
			account  *Account
			loadInfo *AccountLoadInfo
		}
		var available []accountWithLoad
		for _, acc := range candidates {
			loadInfo := loadMap[acc.ID]
			if loadInfo == nil {
				loadInfo = &AccountLoadInfo{AccountID: acc.ID}
			}
			if loadInfo.LoadRate < 100 {
				available = append(available, accountWithLoad{
					account:  acc,
					loadInfo: loadInfo,
				})
			}
		}

		if len(available) > 0 {
			sort.SliceStable(available, func(i, j int) bool {
				a, b := available[i], available[j]
				if a.account.Priority != b.account.Priority {
					return a.account.Priority < b.account.Priority
				}
				if a.loadInfo.LoadRate != b.loadInfo.LoadRate {
					return a.loadInfo.LoadRate < b.loadInfo.LoadRate
				}
				switch {
				case a.account.LastUsedAt == nil && b.account.LastUsedAt != nil:
					return true
				case a.account.LastUsedAt != nil && b.account.LastUsedAt == nil:
					return false
				case a.account.LastUsedAt == nil && b.account.LastUsedAt == nil:
					if preferOAuth && a.account.Type != b.account.Type {
						return a.account.Type == AccountTypeOAuth
					}
					return false
				default:
					return a.account.LastUsedAt.Before(*b.account.LastUsedAt)
				}
			})

			for _, item := range available {
				result, err := s.tryAcquireAccountSlot(ctx, item.account.ID, item.account.Concurrency)
				if err == nil && result.Acquired {
					// 会话数量限制检查
					if !s.checkAndRegisterSession(ctx, item.account, sessionHash) {
						result.ReleaseFunc() // 释放槽位，继续尝试下一个账号
						continue
					}
					if sessionHash != "" && s.cache != nil {
						_ = s.cache.SetSessionAccountID(ctx, derefGroupID(groupID), sessionHash, item.account.ID, stickySessionTTL)
					}
					return &AccountSelectionResult{
						Account:     item.account,
						Acquired:    true,
						ReleaseFunc: result.ReleaseFunc,
					}, nil
				}
			}
		}
	}

	// ============ Layer 3: 兜底排队 ============
	s.sortCandidatesForFallback(candidates, preferOAuth, cfg.FallbackSelectionMode)
	for _, acc := range candidates {
		// 会话数量限制检查（等待计划也需要占用会话配额）
		if !s.checkAndRegisterSession(ctx, acc, sessionHash) {
			continue // 会话限制已满，尝试下一个账号
		}
		return &AccountSelectionResult{
			Account: acc,
			WaitPlan: &AccountWaitPlan{
				AccountID:      acc.ID,
				MaxConcurrency: acc.Concurrency,
				Timeout:        cfg.FallbackWaitTimeout,
				MaxWaiting:     cfg.FallbackMaxWaiting,
			},
		}, nil
	}
	return nil, errors.New("no available accounts")
}

func (s *GatewayService) tryAcquireByLegacyOrder(ctx context.Context, candidates []*Account, groupID *int64, sessionHash string, preferOAuth bool) (*AccountSelectionResult, bool) {
	ordered := append([]*Account(nil), candidates...)
	sortAccountsByPriorityAndLastUsed(ordered, preferOAuth)

	for _, acc := range ordered {
		result, err := s.tryAcquireAccountSlot(ctx, acc.ID, acc.Concurrency)
		if err == nil && result.Acquired {
			// 会话数量限制检查
			if !s.checkAndRegisterSession(ctx, acc, sessionHash) {
				result.ReleaseFunc() // 释放槽位，继续尝试下一个账号
				continue
			}
			if sessionHash != "" && s.cache != nil {
				_ = s.cache.SetSessionAccountID(ctx, derefGroupID(groupID), sessionHash, acc.ID, stickySessionTTL)
			}
			return &AccountSelectionResult{
				Account:     acc,
				Acquired:    true,
				ReleaseFunc: result.ReleaseFunc,
			}, true
		}
	}

	return nil, false
}

func (s *GatewayService) schedulingConfig() config.GatewaySchedulingConfig {
	if s.cfg != nil {
		return s.cfg.Gateway.Scheduling
	}
	return config.GatewaySchedulingConfig{
		StickySessionMaxWaiting:  3,
		StickySessionWaitTimeout: 45 * time.Second,
		FallbackWaitTimeout:      30 * time.Second,
		FallbackMaxWaiting:       100,
		LoadBatchEnabled:         true,
		SlotCleanupInterval:      30 * time.Second,
	}
}

func (s *GatewayService) withGroupContext(ctx context.Context, group *Group) context.Context {
	if !IsGroupContextValid(group) {
		return ctx
	}
	if existing, ok := ctx.Value(ctxkey.Group).(*Group); ok && existing != nil && existing.ID == group.ID && IsGroupContextValid(existing) {
		return ctx
	}
	return context.WithValue(ctx, ctxkey.Group, group)
}

func (s *GatewayService) groupFromContext(ctx context.Context, groupID int64) *Group {
	if group, ok := ctx.Value(ctxkey.Group).(*Group); ok && IsGroupContextValid(group) && group.ID == groupID {
		return group
	}
	return nil
}

func (s *GatewayService) resolveGroupByID(ctx context.Context, groupID int64) (*Group, error) {
	if group := s.groupFromContext(ctx, groupID); group != nil {
		return group, nil
	}
	group, err := s.groupRepo.GetByIDLite(ctx, groupID)
	if err != nil {
		return nil, fmt.Errorf("get group failed: %w", err)
	}
	return group, nil
}

func (s *GatewayService) ResolveGroupByID(ctx context.Context, groupID int64) (*Group, error) {
	return s.resolveGroupByID(ctx, groupID)
}

func (s *GatewayService) routingAccountIDsForRequest(ctx context.Context, groupID *int64, requestedModel string, platform string) []int64 {
	if groupID == nil || requestedModel == "" || platform != PlatformAnthropic {
		return nil
	}
	group, err := s.resolveGroupByID(ctx, *groupID)
	if err != nil || group == nil {
		if s.debugModelRoutingEnabled() {
			log.Printf("[ModelRoutingDebug] resolve group failed: group_id=%v model=%s platform=%s err=%v", derefGroupID(groupID), requestedModel, platform, err)
		}
		return nil
	}
	// Preserve existing behavior: model routing only applies to anthropic groups.
	if group.Platform != PlatformAnthropic {
		if s.debugModelRoutingEnabled() {
			log.Printf("[ModelRoutingDebug] skip: non-anthropic group platform: group_id=%d group_platform=%s model=%s", group.ID, group.Platform, requestedModel)
		}
		return nil
	}
	ids := group.GetRoutingAccountIDs(requestedModel)
	if s.debugModelRoutingEnabled() {
		log.Printf("[ModelRoutingDebug] routing lookup: group_id=%d model=%s enabled=%v rules=%d matched_ids=%v",
			group.ID, requestedModel, group.ModelRoutingEnabled, len(group.ModelRouting), ids)
	}
	return ids
}

func (s *GatewayService) resolveGatewayGroup(ctx context.Context, groupID *int64) (*Group, *int64, error) {
	if groupID == nil {
		return nil, nil, nil
	}

	currentID := *groupID
	visited := map[int64]struct{}{}
	for {
		if _, seen := visited[currentID]; seen {
			return nil, nil, fmt.Errorf("fallback group cycle detected")
		}
		visited[currentID] = struct{}{}

		group, err := s.resolveGroupByID(ctx, currentID)
		if err != nil {
			return nil, nil, err
		}

		if !group.ClaudeCodeOnly || IsClaudeCodeClient(ctx) {
			return group, &currentID, nil
		}

		if group.FallbackGroupID == nil {
			return nil, nil, ErrClaudeCodeOnly
		}
		currentID = *group.FallbackGroupID
	}
}

// checkClaudeCodeRestriction 检查分组的 Claude Code 客户端限制
// 如果分组启用了 claude_code_only 且请求不是来自 Claude Code 客户端：
//   - 有降级分组：返回降级分组的 ID
//   - 无降级分组：返回 ErrClaudeCodeOnly 错误
func (s *GatewayService) checkClaudeCodeRestriction(ctx context.Context, groupID *int64) (*Group, *int64, error) {
	if groupID == nil {
		return nil, groupID, nil
	}

	// 强制平台模式不检查 Claude Code 限制
	if forcePlatform, hasForcePlatform := ctx.Value(ctxkey.ForcePlatform).(string); hasForcePlatform && forcePlatform != "" {
		return nil, groupID, nil
	}

	group, resolvedID, err := s.resolveGatewayGroup(ctx, groupID)
	if err != nil {
		return nil, nil, err
	}

	return group, resolvedID, nil
}

func (s *GatewayService) resolvePlatform(ctx context.Context, groupID *int64, group *Group) (string, bool, error) {
	forcePlatform, hasForcePlatform := ctx.Value(ctxkey.ForcePlatform).(string)
	if hasForcePlatform && forcePlatform != "" {
		return forcePlatform, true, nil
	}
	if group != nil {
		return group.Platform, false, nil
	}
	if groupID != nil {
		group, err := s.resolveGroupByID(ctx, *groupID)
		if err != nil {
			return "", false, err
		}
		return group.Platform, false, nil
	}
	return PlatformAnthropic, false, nil
}

func (s *GatewayService) listSchedulableAccounts(ctx context.Context, groupID *int64, platform string, hasForcePlatform bool) ([]Account, bool, error) {
	if s.schedulerSnapshot != nil {
		accounts, useMixed, err := s.schedulerSnapshot.ListSchedulableAccounts(ctx, groupID, platform, hasForcePlatform)
		if err == nil {
			slog.Debug("account_scheduling_list_snapshot",
				"group_id", derefGroupID(groupID),
				"platform", platform,
				"use_mixed", useMixed,
				"count", len(accounts))
			for _, acc := range accounts {
				slog.Debug("account_scheduling_account_detail",
					"account_id", acc.ID,
					"name", acc.Name,
					"platform", acc.Platform,
					"type", acc.Type,
					"status", acc.Status,
					"tls_fingerprint", acc.IsTLSFingerprintEnabled())
			}
		}
		return accounts, useMixed, err
	}
	useMixed := (platform == PlatformAnthropic || platform == PlatformGemini) && !hasForcePlatform
	if useMixed {
		platforms := []string{platform, PlatformAntigravity}
		var accounts []Account
		var err error
		if groupID != nil {
			accounts, err = s.accountRepo.ListSchedulableByGroupIDAndPlatforms(ctx, *groupID, platforms)
		} else {
			accounts, err = s.accountRepo.ListSchedulableByPlatforms(ctx, platforms)
		}
		if err != nil {
			slog.Debug("account_scheduling_list_failed",
				"group_id", derefGroupID(groupID),
				"platform", platform,
				"error", err)
			return nil, useMixed, err
		}
		filtered := make([]Account, 0, len(accounts))
		for _, acc := range accounts {
			if acc.Platform == PlatformAntigravity && !acc.IsMixedSchedulingEnabled() {
				continue
			}
			filtered = append(filtered, acc)
		}
		slog.Debug("account_scheduling_list_mixed",
			"group_id", derefGroupID(groupID),
			"platform", platform,
			"raw_count", len(accounts),
			"filtered_count", len(filtered))
		for _, acc := range filtered {
			slog.Debug("account_scheduling_account_detail",
				"account_id", acc.ID,
				"name", acc.Name,
				"platform", acc.Platform,
				"type", acc.Type,
				"status", acc.Status,
				"tls_fingerprint", acc.IsTLSFingerprintEnabled())
		}
		return filtered, useMixed, nil
	}

	var accounts []Account
	var err error
	if s.cfg != nil && s.cfg.RunMode == config.RunModeSimple {
		accounts, err = s.accountRepo.ListSchedulableByPlatform(ctx, platform)
	} else if groupID != nil {
		accounts, err = s.accountRepo.ListSchedulableByGroupIDAndPlatform(ctx, *groupID, platform)
		// 分组内无账号则返回空列表，由上层处理错误，不再回退到全平台查询
	} else {
		accounts, err = s.accountRepo.ListSchedulableByPlatform(ctx, platform)
	}
	if err != nil {
		slog.Debug("account_scheduling_list_failed",
			"group_id", derefGroupID(groupID),
			"platform", platform,
			"error", err)
		return nil, useMixed, err
	}
	slog.Debug("account_scheduling_list_single",
		"group_id", derefGroupID(groupID),
		"platform", platform,
		"count", len(accounts))
	for _, acc := range accounts {
		slog.Debug("account_scheduling_account_detail",
			"account_id", acc.ID,
			"name", acc.Name,
			"platform", acc.Platform,
			"type", acc.Type,
			"status", acc.Status,
			"tls_fingerprint", acc.IsTLSFingerprintEnabled())
	}
	return accounts, useMixed, nil
}

func (s *GatewayService) isAccountAllowedForPlatform(account *Account, platform string, useMixed bool) bool {
	if account == nil {
		return false
	}
	if useMixed {
		if account.Platform == platform {
			return true
		}
		return account.Platform == PlatformAntigravity && account.IsMixedSchedulingEnabled()
	}
	return account.Platform == platform
}

// isAccountInGroup checks if the account belongs to the specified group.
// Returns true if groupID is nil (no group restriction) or account belongs to the group.
func (s *GatewayService) isAccountInGroup(account *Account, groupID *int64) bool {
	if groupID == nil {
		return true // 无分组限制
	}
	if account == nil {
		return false
	}
	for _, ag := range account.AccountGroups {
		if ag.GroupID == *groupID {
			return true
		}
	}
	return false
}

func (s *GatewayService) tryAcquireAccountSlot(ctx context.Context, accountID int64, maxConcurrency int) (*AcquireResult, error) {
	if s.concurrencyService == nil {
		return &AcquireResult{Acquired: true, ReleaseFunc: func() {}}, nil
	}
	return s.concurrencyService.AcquireAccountSlot(ctx, accountID, maxConcurrency)
}

// isAccountSchedulableForWindowCost 检查账号是否可根据窗口费用进行调度
// 仅适用于 Anthropic OAuth/SetupToken 账号
// 返回 true 表示可调度，false 表示不可调度
func (s *GatewayService) isAccountSchedulableForWindowCost(ctx context.Context, account *Account, isSticky bool) bool {
	// 只检查 Anthropic OAuth/SetupToken 账号
	if !account.IsAnthropicOAuthOrSetupToken() {
		return true
	}

	limit := account.GetWindowCostLimit()
	if limit <= 0 {
		return true // 未启用窗口费用限制
	}

	// 尝试从缓存获取窗口费用
	var currentCost float64
	if s.sessionLimitCache != nil {
		if cost, hit, err := s.sessionLimitCache.GetWindowCost(ctx, account.ID); err == nil && hit {
			currentCost = cost
			goto checkSchedulability
		}
	}

	// 缓存未命中，从数据库查询
	{
		// 使用统一的窗口开始时间计算逻辑（考虑窗口过期情况）
		startTime := account.GetCurrentWindowStartTime()

		stats, err := s.usageLogRepo.GetAccountWindowStats(ctx, account.ID, startTime)
		if err != nil {
			// 失败开放：查询失败时允许调度
			return true
		}

		// 使用标准费用（不含账号倍率）
		currentCost = stats.StandardCost

		// 设置缓存（忽略错误）
		if s.sessionLimitCache != nil {
			_ = s.sessionLimitCache.SetWindowCost(ctx, account.ID, currentCost)
		}
	}

checkSchedulability:
	schedulability := account.CheckWindowCostSchedulability(currentCost)

	switch schedulability {
	case WindowCostSchedulable:
		return true
	case WindowCostStickyOnly:
		return isSticky
	case WindowCostNotSchedulable:
		return false
	}
	return true
}

// checkAndRegisterSession 检查并注册会话，用于会话数量限制
// 仅适用于 Anthropic OAuth/SetupToken 账号
// sessionID: 会话标识符（使用粘性会话的 hash）
// 返回 true 表示允许（在限制内或会话已存在），false 表示拒绝（超出限制且是新会话）
func (s *GatewayService) checkAndRegisterSession(ctx context.Context, account *Account, sessionID string) bool {
	// 只检查 Anthropic OAuth/SetupToken 账号
	if !account.IsAnthropicOAuthOrSetupToken() {
		return true
	}

	maxSessions := account.GetMaxSessions()
	if maxSessions <= 0 || sessionID == "" {
		return true // 未启用会话限制或无会话ID
	}

	if s.sessionLimitCache == nil {
		return true // 缓存不可用时允许通过
	}

	idleTimeout := time.Duration(account.GetSessionIdleTimeoutMinutes()) * time.Minute

	allowed, err := s.sessionLimitCache.RegisterSession(ctx, account.ID, sessionID, maxSessions, idleTimeout)
	if err != nil {
		// 失败开放：缓存错误时允许通过
		return true
	}
	return allowed
}

func (s *GatewayService) getSchedulableAccount(ctx context.Context, accountID int64) (*Account, error) {
	if s.schedulerSnapshot != nil {
		return s.schedulerSnapshot.GetAccount(ctx, accountID)
	}
	return s.accountRepo.GetByID(ctx, accountID)
}

func sortAccountsByPriorityAndLastUsed(accounts []*Account, preferOAuth bool) {
	sort.SliceStable(accounts, func(i, j int) bool {
		a, b := accounts[i], accounts[j]
		if a.Priority != b.Priority {
			return a.Priority < b.Priority
		}
		switch {
		case a.LastUsedAt == nil && b.LastUsedAt != nil:
			return true
		case a.LastUsedAt != nil && b.LastUsedAt == nil:
			return false
		case a.LastUsedAt == nil && b.LastUsedAt == nil:
			if preferOAuth && a.Type != b.Type {
				return a.Type == AccountTypeOAuth
			}
			return false
		default:
			return a.LastUsedAt.Before(*b.LastUsedAt)
		}
	})
}

// sortCandidatesForFallback 根据配置选择排序策略
// mode: "last_used"(按最后使用时间) 或 "random"(随机)
func (s *GatewayService) sortCandidatesForFallback(accounts []*Account, preferOAuth bool, mode string) {
	if mode == "random" {
		// 先按优先级排序，然后在同优先级内随机打乱
		sortAccountsByPriorityOnly(accounts, preferOAuth)
		shuffleWithinPriority(accounts)
	} else {
		// 默认按最后使用时间排序
		sortAccountsByPriorityAndLastUsed(accounts, preferOAuth)
	}
}

// sortAccountsByPriorityOnly 仅按优先级排序
func sortAccountsByPriorityOnly(accounts []*Account, preferOAuth bool) {
	sort.SliceStable(accounts, func(i, j int) bool {
		a, b := accounts[i], accounts[j]
		if a.Priority != b.Priority {
			return a.Priority < b.Priority
		}
		if preferOAuth && a.Type != b.Type {
			return a.Type == AccountTypeOAuth
		}
		return false
	})
}

// shuffleWithinPriority 在同优先级内随机打乱顺序
func shuffleWithinPriority(accounts []*Account) {
	if len(accounts) <= 1 {
		return
	}
	r := mathrand.New(mathrand.NewSource(time.Now().UnixNano()))
	start := 0
	for start < len(accounts) {
		priority := accounts[start].Priority
		end := start + 1
		for end < len(accounts) && accounts[end].Priority == priority {
			end++
		}
		// 对 [start, end) 范围内的账户随机打乱
		if end-start > 1 {
			r.Shuffle(end-start, func(i, j int) {
				accounts[start+i], accounts[start+j] = accounts[start+j], accounts[start+i]
			})
		}
		start = end
	}
}

// selectAccountForModelWithPlatform 选择单平台账户（完全隔离）
func (s *GatewayService) selectAccountForModelWithPlatform(ctx context.Context, groupID *int64, sessionHash string, requestedModel string, excludedIDs map[int64]struct{}, platform string) (*Account, error) {
	// 对 Antigravity 平台，检查请求的模型系列是否在分组支持范围内
	if platform == PlatformAntigravity && groupID != nil && requestedModel != "" {
		if err := s.checkAntigravityModelScope(ctx, *groupID, requestedModel); err != nil {
			return nil, err
		}
	}

	preferOAuth := platform == PlatformGemini
	routingAccountIDs := s.routingAccountIDsForRequest(ctx, groupID, requestedModel, platform)

	var accounts []Account
	accountsLoaded := false

	// ============ Model Routing (legacy path): apply before sticky session ============
	// When load-awareness is disabled (e.g. concurrency service not configured), we still honor model routing
	// so switching model can switch upstream account within the same sticky session.
	if len(routingAccountIDs) > 0 {
		if s.debugModelRoutingEnabled() {
			log.Printf("[ModelRoutingDebug] legacy routed begin: group_id=%v model=%s platform=%s session=%s routed_ids=%v",
				derefGroupID(groupID), requestedModel, platform, shortSessionHash(sessionHash), routingAccountIDs)
		}
		// 1) Sticky session only applies if the bound account is within the routing set.
		if sessionHash != "" && s.cache != nil {
			accountID, err := s.cache.GetSessionAccountID(ctx, derefGroupID(groupID), sessionHash)
			if err == nil && accountID > 0 && containsInt64(routingAccountIDs, accountID) {
				if _, excluded := excludedIDs[accountID]; !excluded {
					account, err := s.getSchedulableAccount(ctx, accountID)
					// 检查账号分组归属和平台匹配（确保粘性会话不会跨分组或跨平台）
					if err == nil {
						clearSticky := shouldClearStickySession(account)
						if clearSticky {
							_ = s.cache.DeleteSessionAccountID(ctx, derefGroupID(groupID), sessionHash)
						}
						if !clearSticky && s.isAccountInGroup(account, groupID) && account.Platform == platform && account.IsSchedulableForModel(requestedModel) && (requestedModel == "" || s.isModelSupportedByAccount(account, requestedModel)) {
							if err := s.cache.RefreshSessionTTL(ctx, derefGroupID(groupID), sessionHash, stickySessionTTL); err != nil {
								log.Printf("refresh session ttl failed: session=%s err=%v", sessionHash, err)
							}
							if s.debugModelRoutingEnabled() {
								log.Printf("[ModelRoutingDebug] legacy routed sticky hit: group_id=%v model=%s session=%s account=%d", derefGroupID(groupID), requestedModel, shortSessionHash(sessionHash), accountID)
							}
							return account, nil
						}
					}
				}
			}
		}

		// 2) Select an account from the routed candidates.
		forcePlatform, hasForcePlatform := ctx.Value(ctxkey.ForcePlatform).(string)
		if hasForcePlatform && forcePlatform == "" {
			hasForcePlatform = false
		}
		var err error
		accounts, _, err = s.listSchedulableAccounts(ctx, groupID, platform, hasForcePlatform)
		if err != nil {
			return nil, fmt.Errorf("query accounts failed: %w", err)
		}
		accountsLoaded = true

		routingSet := make(map[int64]struct{}, len(routingAccountIDs))
		for _, id := range routingAccountIDs {
			if id > 0 {
				routingSet[id] = struct{}{}
			}
		}

		var selected *Account
		for i := range accounts {
			acc := &accounts[i]
			if _, ok := routingSet[acc.ID]; !ok {
				continue
			}
			if _, excluded := excludedIDs[acc.ID]; excluded {
				continue
			}
			// Scheduler snapshots can be temporarily stale; re-check schedulability here to
			// avoid selecting accounts that were recently rate-limited/overloaded.
			if !acc.IsSchedulable() {
				continue
			}
			if !acc.IsSchedulableForModel(requestedModel) {
				continue
			}
			if requestedModel != "" && !s.isModelSupportedByAccount(acc, requestedModel) {
				continue
			}
			if selected == nil {
				selected = acc
				continue
			}
			if acc.Priority < selected.Priority {
				selected = acc
			} else if acc.Priority == selected.Priority {
				switch {
				case acc.LastUsedAt == nil && selected.LastUsedAt != nil:
					selected = acc
				case acc.LastUsedAt != nil && selected.LastUsedAt == nil:
					// keep selected (never used is preferred)
				case acc.LastUsedAt == nil && selected.LastUsedAt == nil:
					if preferOAuth && acc.Type != selected.Type && acc.Type == AccountTypeOAuth {
						selected = acc
					}
				default:
					if acc.LastUsedAt.Before(*selected.LastUsedAt) {
						selected = acc
					}
				}
			}
		}

		if selected != nil {
			if sessionHash != "" && s.cache != nil {
				if err := s.cache.SetSessionAccountID(ctx, derefGroupID(groupID), sessionHash, selected.ID, stickySessionTTL); err != nil {
					log.Printf("set session account failed: session=%s account_id=%d err=%v", sessionHash, selected.ID, err)
				}
			}
			if s.debugModelRoutingEnabled() {
				log.Printf("[ModelRoutingDebug] legacy routed select: group_id=%v model=%s session=%s account=%d", derefGroupID(groupID), requestedModel, shortSessionHash(sessionHash), selected.ID)
			}
			return selected, nil
		}
		log.Printf("[ModelRouting] No routed accounts available for model=%s, falling back to normal selection", requestedModel)
	}

	// 1. 查询粘性会话
	if sessionHash != "" && s.cache != nil {
		accountID, err := s.cache.GetSessionAccountID(ctx, derefGroupID(groupID), sessionHash)
		if err == nil && accountID > 0 {
			if _, excluded := excludedIDs[accountID]; !excluded {
				account, err := s.getSchedulableAccount(ctx, accountID)
				// 检查账号分组归属和平台匹配（确保粘性会话不会跨分组或跨平台）
				if err == nil {
					clearSticky := shouldClearStickySession(account)
					if clearSticky {
						_ = s.cache.DeleteSessionAccountID(ctx, derefGroupID(groupID), sessionHash)
					}
					if !clearSticky && s.isAccountInGroup(account, groupID) && account.Platform == platform && account.IsSchedulableForModel(requestedModel) && (requestedModel == "" || s.isModelSupportedByAccount(account, requestedModel)) {
						if err := s.cache.RefreshSessionTTL(ctx, derefGroupID(groupID), sessionHash, stickySessionTTL); err != nil {
							log.Printf("refresh session ttl failed: session=%s err=%v", sessionHash, err)
						}
						return account, nil
					}
				}
			}
		}
	}

	// 2. 获取可调度账号列表（单平台）
	if !accountsLoaded {
		forcePlatform, hasForcePlatform := ctx.Value(ctxkey.ForcePlatform).(string)
		if hasForcePlatform && forcePlatform == "" {
			hasForcePlatform = false
		}
		var err error
		accounts, _, err = s.listSchedulableAccounts(ctx, groupID, platform, hasForcePlatform)
		if err != nil {
			return nil, fmt.Errorf("query accounts failed: %w", err)
		}
	}

	// 3. 按优先级+最久未用选择（考虑模型支持）
	var selected *Account
	for i := range accounts {
		acc := &accounts[i]
		if _, excluded := excludedIDs[acc.ID]; excluded {
			continue
		}
		// Scheduler snapshots can be temporarily stale; re-check schedulability here to
		// avoid selecting accounts that were recently rate-limited/overloaded.
		if !acc.IsSchedulable() {
			continue
		}
		if !acc.IsSchedulableForModel(requestedModel) {
			continue
		}
		if requestedModel != "" && !s.isModelSupportedByAccount(acc, requestedModel) {
			continue
		}
		if selected == nil {
			selected = acc
			continue
		}
		if acc.Priority < selected.Priority {
			selected = acc
		} else if acc.Priority == selected.Priority {
			switch {
			case acc.LastUsedAt == nil && selected.LastUsedAt != nil:
				selected = acc
			case acc.LastUsedAt != nil && selected.LastUsedAt == nil:
				// keep selected (never used is preferred)
			case acc.LastUsedAt == nil && selected.LastUsedAt == nil:
				if preferOAuth && acc.Type != selected.Type && acc.Type == AccountTypeOAuth {
					selected = acc
				}
			default:
				if acc.LastUsedAt.Before(*selected.LastUsedAt) {
					selected = acc
				}
			}
		}
	}

	if selected == nil {
		if requestedModel != "" {
			return nil, fmt.Errorf("no available accounts supporting model: %s", requestedModel)
		}
		return nil, errors.New("no available accounts")
	}

	// 4. 建立粘性绑定
	if sessionHash != "" && s.cache != nil {
		if err := s.cache.SetSessionAccountID(ctx, derefGroupID(groupID), sessionHash, selected.ID, stickySessionTTL); err != nil {
			log.Printf("set session account failed: session=%s account_id=%d err=%v", sessionHash, selected.ID, err)
		}
	}

	return selected, nil
}

// selectAccountWithMixedScheduling 选择账户（支持混合调度）
// 查询原生平台账户 + 启用 mixed_scheduling 的 antigravity 账户
func (s *GatewayService) selectAccountWithMixedScheduling(ctx context.Context, groupID *int64, sessionHash string, requestedModel string, excludedIDs map[int64]struct{}, nativePlatform string) (*Account, error) {
	preferOAuth := nativePlatform == PlatformGemini
	routingAccountIDs := s.routingAccountIDsForRequest(ctx, groupID, requestedModel, nativePlatform)

	var accounts []Account
	accountsLoaded := false

	// ============ Model Routing (legacy path): apply before sticky session ============
	if len(routingAccountIDs) > 0 {
		if s.debugModelRoutingEnabled() {
			log.Printf("[ModelRoutingDebug] legacy mixed routed begin: group_id=%v model=%s platform=%s session=%s routed_ids=%v",
				derefGroupID(groupID), requestedModel, nativePlatform, shortSessionHash(sessionHash), routingAccountIDs)
		}
		// 1) Sticky session only applies if the bound account is within the routing set.
		if sessionHash != "" && s.cache != nil {
			accountID, err := s.cache.GetSessionAccountID(ctx, derefGroupID(groupID), sessionHash)
			if err == nil && accountID > 0 && containsInt64(routingAccountIDs, accountID) {
				if _, excluded := excludedIDs[accountID]; !excluded {
					account, err := s.getSchedulableAccount(ctx, accountID)
					// 检查账号分组归属和有效性：原生平台直接匹配，antigravity 需要启用混合调度
					if err == nil {
						clearSticky := shouldClearStickySession(account)
						if clearSticky {
							_ = s.cache.DeleteSessionAccountID(ctx, derefGroupID(groupID), sessionHash)
						}
						if !clearSticky && s.isAccountInGroup(account, groupID) && account.IsSchedulableForModel(requestedModel) && (requestedModel == "" || s.isModelSupportedByAccount(account, requestedModel)) {
							if account.Platform == nativePlatform || (account.Platform == PlatformAntigravity && account.IsMixedSchedulingEnabled()) {
								if err := s.cache.RefreshSessionTTL(ctx, derefGroupID(groupID), sessionHash, stickySessionTTL); err != nil {
									log.Printf("refresh session ttl failed: session=%s err=%v", sessionHash, err)
								}
								if s.debugModelRoutingEnabled() {
									log.Printf("[ModelRoutingDebug] legacy mixed routed sticky hit: group_id=%v model=%s session=%s account=%d", derefGroupID(groupID), requestedModel, shortSessionHash(sessionHash), accountID)
								}
								return account, nil
							}
						}
					}
				}
			}
		}

		// 2) Select an account from the routed candidates.
		var err error
		accounts, _, err = s.listSchedulableAccounts(ctx, groupID, nativePlatform, false)
		if err != nil {
			return nil, fmt.Errorf("query accounts failed: %w", err)
		}
		accountsLoaded = true

		routingSet := make(map[int64]struct{}, len(routingAccountIDs))
		for _, id := range routingAccountIDs {
			if id > 0 {
				routingSet[id] = struct{}{}
			}
		}

		var selected *Account
		for i := range accounts {
			acc := &accounts[i]
			if _, ok := routingSet[acc.ID]; !ok {
				continue
			}
			if _, excluded := excludedIDs[acc.ID]; excluded {
				continue
			}
			// Scheduler snapshots can be temporarily stale; re-check schedulability here to
			// avoid selecting accounts that were recently rate-limited/overloaded.
			if !acc.IsSchedulable() {
				continue
			}
			// 过滤：原生平台直接通过，antigravity 需要启用混合调度
			if acc.Platform == PlatformAntigravity && !acc.IsMixedSchedulingEnabled() {
				continue
			}
			if !acc.IsSchedulableForModel(requestedModel) {
				continue
			}
			if requestedModel != "" && !s.isModelSupportedByAccount(acc, requestedModel) {
				continue
			}
			if selected == nil {
				selected = acc
				continue
			}
			if acc.Priority < selected.Priority {
				selected = acc
			} else if acc.Priority == selected.Priority {
				switch {
				case acc.LastUsedAt == nil && selected.LastUsedAt != nil:
					selected = acc
				case acc.LastUsedAt != nil && selected.LastUsedAt == nil:
					// keep selected (never used is preferred)
				case acc.LastUsedAt == nil && selected.LastUsedAt == nil:
					if preferOAuth && acc.Platform == PlatformGemini && selected.Platform == PlatformGemini && acc.Type != selected.Type && acc.Type == AccountTypeOAuth {
						selected = acc
					}
				default:
					if acc.LastUsedAt.Before(*selected.LastUsedAt) {
						selected = acc
					}
				}
			}
		}

		if selected != nil {
			if sessionHash != "" && s.cache != nil {
				if err := s.cache.SetSessionAccountID(ctx, derefGroupID(groupID), sessionHash, selected.ID, stickySessionTTL); err != nil {
					log.Printf("set session account failed: session=%s account_id=%d err=%v", sessionHash, selected.ID, err)
				}
			}
			if s.debugModelRoutingEnabled() {
				log.Printf("[ModelRoutingDebug] legacy mixed routed select: group_id=%v model=%s session=%s account=%d", derefGroupID(groupID), requestedModel, shortSessionHash(sessionHash), selected.ID)
			}
			return selected, nil
		}
		log.Printf("[ModelRouting] No routed accounts available for model=%s, falling back to normal selection", requestedModel)
	}

	// 1. 查询粘性会话
	if sessionHash != "" && s.cache != nil {
		accountID, err := s.cache.GetSessionAccountID(ctx, derefGroupID(groupID), sessionHash)
		if err == nil && accountID > 0 {
			if _, excluded := excludedIDs[accountID]; !excluded {
				account, err := s.getSchedulableAccount(ctx, accountID)
				// 检查账号分组归属和有效性：原生平台直接匹配，antigravity 需要启用混合调度
				if err == nil {
					clearSticky := shouldClearStickySession(account)
					if clearSticky {
						_ = s.cache.DeleteSessionAccountID(ctx, derefGroupID(groupID), sessionHash)
					}
					if !clearSticky && s.isAccountInGroup(account, groupID) && account.IsSchedulableForModel(requestedModel) && (requestedModel == "" || s.isModelSupportedByAccount(account, requestedModel)) {
						if account.Platform == nativePlatform || (account.Platform == PlatformAntigravity && account.IsMixedSchedulingEnabled()) {
							if err := s.cache.RefreshSessionTTL(ctx, derefGroupID(groupID), sessionHash, stickySessionTTL); err != nil {
								log.Printf("refresh session ttl failed: session=%s err=%v", sessionHash, err)
							}
							return account, nil
						}
					}
				}
			}
		}
	}

	// 2. 获取可调度账号列表
	if !accountsLoaded {
		var err error
		accounts, _, err = s.listSchedulableAccounts(ctx, groupID, nativePlatform, false)
		if err != nil {
			return nil, fmt.Errorf("query accounts failed: %w", err)
		}
	}

	// 3. 按优先级+最久未用选择（考虑模型支持和混合调度）
	var selected *Account
	for i := range accounts {
		acc := &accounts[i]
		if _, excluded := excludedIDs[acc.ID]; excluded {
			continue
		}
		// Scheduler snapshots can be temporarily stale; re-check schedulability here to
		// avoid selecting accounts that were recently rate-limited/overloaded.
		if !acc.IsSchedulable() {
			continue
		}
		// 过滤：原生平台直接通过，antigravity 需要启用混合调度
		if acc.Platform == PlatformAntigravity && !acc.IsMixedSchedulingEnabled() {
			continue
		}
		if !acc.IsSchedulableForModel(requestedModel) {
			continue
		}
		if requestedModel != "" && !s.isModelSupportedByAccount(acc, requestedModel) {
			continue
		}
		if selected == nil {
			selected = acc
			continue
		}
		if acc.Priority < selected.Priority {
			selected = acc
		} else if acc.Priority == selected.Priority {
			switch {
			case acc.LastUsedAt == nil && selected.LastUsedAt != nil:
				selected = acc
			case acc.LastUsedAt != nil && selected.LastUsedAt == nil:
				// keep selected (never used is preferred)
			case acc.LastUsedAt == nil && selected.LastUsedAt == nil:
				if preferOAuth && acc.Platform == PlatformGemini && selected.Platform == PlatformGemini && acc.Type != selected.Type && acc.Type == AccountTypeOAuth {
					selected = acc
				}
			default:
				if acc.LastUsedAt.Before(*selected.LastUsedAt) {
					selected = acc
				}
			}
		}
	}

	if selected == nil {
		if requestedModel != "" {
			return nil, fmt.Errorf("no available accounts supporting model: %s", requestedModel)
		}
		return nil, errors.New("no available accounts")
	}

	// 4. 建立粘性绑定
	if sessionHash != "" && s.cache != nil {
		if err := s.cache.SetSessionAccountID(ctx, derefGroupID(groupID), sessionHash, selected.ID, stickySessionTTL); err != nil {
			log.Printf("set session account failed: session=%s account_id=%d err=%v", sessionHash, selected.ID, err)
		}
	}

	return selected, nil
}

// isModelSupportedByAccount 根据账户平台检查模型支持
func (s *GatewayService) isModelSupportedByAccount(account *Account, requestedModel string) bool {
	if account.Platform == PlatformAntigravity {
		// Antigravity 平台使用专门的模型支持检查
		return IsAntigravityModelSupported(requestedModel)
	}
	if account.Platform == PlatformAnthropic {
		requestedModel = normalizeClaudeModelForAnthropic(requestedModel)
	}
	// Gemini API Key 账户直接透传，由上游判断模型是否支持
	if account.Platform == PlatformGemini && account.Type == AccountTypeAPIKey {
		return true
	}
	// 其他平台使用账户的模型支持检查
	return account.IsModelSupported(requestedModel)
}

// IsAntigravityModelSupported 检查 Antigravity 平台是否支持指定模型
// 所有 claude- 和 gemini- 前缀的模型都能通过映射或透传支持
func IsAntigravityModelSupported(requestedModel string) bool {
	return strings.HasPrefix(requestedModel, "claude-") ||
		strings.HasPrefix(requestedModel, "gemini-")
}

// GetAccessToken 获取账号凭证
func (s *GatewayService) GetAccessToken(ctx context.Context, account *Account) (string, string, error) {
	switch account.Type {
	case AccountTypeOAuth, AccountTypeSetupToken:
		// Both oauth and setup-token use OAuth token flow
		return s.getOAuthToken(ctx, account)
	case AccountTypeAPIKey:
		apiKey := account.GetCredential("api_key")
		if apiKey == "" {
			return "", "", errors.New("api_key not found in credentials")
		}
		return apiKey, "apikey", nil
	default:
		return "", "", fmt.Errorf("unsupported account type: %s", account.Type)
	}
}

func (s *GatewayService) getOAuthToken(ctx context.Context, account *Account) (string, string, error) {
	// 对于 Anthropic OAuth 账号，使用 ClaudeTokenProvider 获取缓存的 token
	if account.Platform == PlatformAnthropic && account.Type == AccountTypeOAuth && s.claudeTokenProvider != nil {
		accessToken, err := s.claudeTokenProvider.GetAccessToken(ctx, account)
		if err != nil {
			return "", "", err
		}
		return accessToken, "oauth", nil
	}

	// 其他情况（Gemini 有自己的 TokenProvider，setup-token 类型等）直接从账号读取
	accessToken := account.GetCredential("access_token")
	if accessToken == "" {
		return "", "", errors.New("access_token not found in credentials")
	}
	// Token刷新由后台 TokenRefreshService 处理，此处只返回当前token
	return accessToken, "oauth", nil
}

// 重试相关常量
const (
	// 最大尝试次数（包含首次请求）。过多重试会导致请求堆积与资源耗尽。
	maxRetryAttempts = 5

	// 指数退避：第 N 次失败后的等待 = retryBaseDelay * 2^(N-1)，并且上限为 retryMaxDelay。
	retryBaseDelay = 300 * time.Millisecond
	retryMaxDelay  = 3 * time.Second

	// 最大重试耗时（包含请求本身耗时 + 退避等待时间）。
	// 用于防止极端情况下 goroutine 长时间堆积导致资源耗尽。
	maxRetryElapsed = 10 * time.Second
)

func (s *GatewayService) shouldRetryUpstreamError(account *Account, statusCode int) bool {
	// OAuth/Setup Token 账号：仅 403 重试
	if account.IsOAuth() {
		return statusCode == 403
	}

	// API Key 账号：未配置的错误码重试
	return !account.ShouldHandleErrorCode(statusCode)
}

// shouldFailoverUpstreamError determines whether an upstream error should trigger account failover.
func (s *GatewayService) shouldFailoverUpstreamError(statusCode int) bool {
	switch statusCode {
	case 401, 403, 429, 529:
		return true
	default:
		return statusCode >= 500
	}
}

func retryBackoffDelay(attempt int) time.Duration {
	// attempt 从 1 开始，表示第 attempt 次请求刚失败，需要等待后进行第 attempt+1 次请求。
	if attempt <= 0 {
		return retryBaseDelay
	}
	delay := retryBaseDelay * time.Duration(1<<(attempt-1))
	if delay > retryMaxDelay {
		return retryMaxDelay
	}
	return delay
}

func sleepWithContext(ctx context.Context, d time.Duration) error {
	if d <= 0 {
		return nil
	}
	timer := time.NewTimer(d)
	defer func() {
		if !timer.Stop() {
			select {
			case <-timer.C:
			default:
			}
		}
	}()

	select {
	case <-ctx.Done():
		return ctx.Err()
	case <-timer.C:
		return nil
	}
}

// isClaudeCodeClient 判断请求是否来自 Claude Code 客户端
// 简化判断：User-Agent 匹配 + metadata.user_id 存在
func isClaudeCodeClient(userAgent string, metadataUserID string) bool {
	if metadataUserID == "" {
		return false
	}
	return claudeCliUserAgentRe.MatchString(userAgent)
}

func isClaudeCodeRequest(ctx context.Context, c *gin.Context, parsed *ParsedRequest) bool {
	if IsClaudeCodeClient(ctx) {
		return true
	}
	if parsed == nil || c == nil {
		return false
	}
	return isClaudeCodeClient(c.GetHeader("User-Agent"), parsed.MetadataUserID)
}

// systemIncludesClaudeCodePrompt 检查 system 中是否已包含 Claude Code 提示词
// 使用前缀匹配支持多种变体（标准版、Agent SDK 版等）
func systemIncludesClaudeCodePrompt(system any) bool {
	switch v := system.(type) {
	case string:
		return hasClaudeCodePrefix(v)
	case []any:
		for _, item := range v {
			if m, ok := item.(map[string]any); ok {
				if text, ok := m["text"].(string); ok && hasClaudeCodePrefix(text) {
					return true
				}
			}
		}
	}
	return false
}

// hasClaudeCodePrefix 检查文本是否以 Claude Code 提示词的特征前缀开头
func hasClaudeCodePrefix(text string) bool {
	for _, prefix := range claudeCodePromptPrefixes {
		if strings.HasPrefix(text, prefix) {
			return true
		}
	}
	return false
}

// injectClaudeCodePrompt 在 system 开头注入 Claude Code 提示词
// 处理 null、字符串、数组三种格式
func injectClaudeCodePrompt(body []byte, system any) []byte {
	claudeCodeBlock := map[string]any{
		"type":          "text",
		"text":          claudeCodeSystemPrompt,
		"cache_control": map[string]string{"type": "ephemeral"},
	}
	// Opencode plugin applies an extra safeguard: it not only prepends the Claude Code
	// banner, it also prefixes the next system instruction with the same banner plus
	// a blank line. This helps when upstream concatenates system instructions.
	claudeCodePrefix := strings.TrimSpace(claudeCodeSystemPrompt)

	var newSystem []any

	switch v := system.(type) {
	case nil:
		newSystem = []any{claudeCodeBlock}
	case string:
		// Be tolerant of older/newer clients that may differ only by trailing whitespace/newlines.
		if strings.TrimSpace(v) == "" || strings.TrimSpace(v) == strings.TrimSpace(claudeCodeSystemPrompt) {
			newSystem = []any{claudeCodeBlock}
		} else {
			// Mirror opencode behavior: keep the banner as a separate system entry,
			// but also prefix the next system text with the banner.
			merged := v
			if !strings.HasPrefix(v, claudeCodePrefix) {
				merged = claudeCodePrefix + "\n\n" + v
			}
			newSystem = []any{claudeCodeBlock, map[string]any{"type": "text", "text": merged}}
		}
	case []any:
		newSystem = make([]any, 0, len(v)+1)
		newSystem = append(newSystem, claudeCodeBlock)
		prefixedNext := false
		for _, item := range v {
			if m, ok := item.(map[string]any); ok {
				if text, ok := m["text"].(string); ok && strings.TrimSpace(text) == strings.TrimSpace(claudeCodeSystemPrompt) {
					continue
				}
				// Prefix the first subsequent text system block once.
				if !prefixedNext {
					if blockType, _ := m["type"].(string); blockType == "text" {
						if text, ok := m["text"].(string); ok && strings.TrimSpace(text) != "" && !strings.HasPrefix(text, claudeCodePrefix) {
							m["text"] = claudeCodePrefix + "\n\n" + text
							prefixedNext = true
						}
					}
				}
			}
			newSystem = append(newSystem, item)
		}
	default:
		newSystem = []any{claudeCodeBlock}
	}

	result, err := sjson.SetBytes(body, "system", newSystem)
	if err != nil {
		log.Printf("Warning: failed to inject Claude Code prompt: %v", err)
		return body
	}
	return result
}

// enforceCacheControlLimit 强制执行 cache_control 块数量限制（最多 4 个）
// 超限时优先从 messages 中移除 cache_control，保护 system 中的缓存控制
func enforceCacheControlLimit(body []byte) []byte {
	var data map[string]any
	if err := json.Unmarshal(body, &data); err != nil {
		return body
	}

	// 清理 thinking 块中的非法 cache_control（thinking 块不支持该字段）
	removeCacheControlFromThinkingBlocks(data)

	// 计算当前 cache_control 块数量
	count := countCacheControlBlocks(data)
	if count <= maxCacheControlBlocks {
		return body
	}

	// 超限：优先从 messages 中移除，再从 system 中移除
	for count > maxCacheControlBlocks {
		if removeCacheControlFromMessages(data) {
			count--
			continue
		}
		if removeCacheControlFromSystem(data) {
			count--
			continue
		}
		break
	}

	result, err := json.Marshal(data)
	if err != nil {
		return body
	}
	return result
}

// countCacheControlBlocks 统计 system 和 messages 中的 cache_control 块数量
// 注意：thinking 块不支持 cache_control，统计时跳过
func countCacheControlBlocks(data map[string]any) int {
	count := 0

	// 统计 system 中的块
	if system, ok := data["system"].([]any); ok {
		for _, item := range system {
			if m, ok := item.(map[string]any); ok {
				// thinking 块不支持 cache_control，跳过
				if blockType, _ := m["type"].(string); blockType == "thinking" {
					continue
				}
				if _, has := m["cache_control"]; has {
					count++
				}
			}
		}
	}

	// 统计 messages 中的块
	if messages, ok := data["messages"].([]any); ok {
		for _, msg := range messages {
			if msgMap, ok := msg.(map[string]any); ok {
				if content, ok := msgMap["content"].([]any); ok {
					for _, item := range content {
						if m, ok := item.(map[string]any); ok {
							// thinking 块不支持 cache_control，跳过
							if blockType, _ := m["type"].(string); blockType == "thinking" {
								continue
							}
							if _, has := m["cache_control"]; has {
								count++
							}
						}
					}
				}
			}
		}
	}

	return count
}

// removeCacheControlFromMessages 从 messages 中移除一个 cache_control（从头开始）
// 返回 true 表示成功移除，false 表示没有可移除的
// 注意：跳过 thinking 块（它不支持 cache_control）
func removeCacheControlFromMessages(data map[string]any) bool {
	messages, ok := data["messages"].([]any)
	if !ok {
		return false
	}

	for _, msg := range messages {
		msgMap, ok := msg.(map[string]any)
		if !ok {
			continue
		}
		content, ok := msgMap["content"].([]any)
		if !ok {
			continue
		}
		for _, item := range content {
			if m, ok := item.(map[string]any); ok {
				// thinking 块不支持 cache_control，跳过
				if blockType, _ := m["type"].(string); blockType == "thinking" {
					continue
				}
				if _, has := m["cache_control"]; has {
					delete(m, "cache_control")
					return true
				}
			}
		}
	}
	return false
}

// removeCacheControlFromSystem 从 system 中移除一个 cache_control（从尾部开始，保护注入的 prompt）
// 返回 true 表示成功移除，false 表示没有可移除的
// 注意：跳过 thinking 块（它不支持 cache_control）
func removeCacheControlFromSystem(data map[string]any) bool {
	system, ok := data["system"].([]any)
	if !ok {
		return false
	}

	// 从尾部开始移除，保护开头注入的 Claude Code prompt
	for i := len(system) - 1; i >= 0; i-- {
		if m, ok := system[i].(map[string]any); ok {
			// thinking 块不支持 cache_control，跳过
			if blockType, _ := m["type"].(string); blockType == "thinking" {
				continue
			}
			if _, has := m["cache_control"]; has {
				delete(m, "cache_control")
				return true
			}
		}
	}
	return false
}

// removeCacheControlFromThinkingBlocks 强制清理所有 thinking 块中的非法 cache_control
// thinking 块不支持 cache_control 字段，这个函数确保所有 thinking 块都不含该字段
func removeCacheControlFromThinkingBlocks(data map[string]any) {
	// 清理 system 中的 thinking 块
	if system, ok := data["system"].([]any); ok {
		for _, item := range system {
			if m, ok := item.(map[string]any); ok {
				if blockType, _ := m["type"].(string); blockType == "thinking" {
					if _, has := m["cache_control"]; has {
						delete(m, "cache_control")
						log.Printf("[Warning] Removed illegal cache_control from thinking block in system")
					}
				}
			}
		}
	}

	// 清理 messages 中的 thinking 块
	if messages, ok := data["messages"].([]any); ok {
		for msgIdx, msg := range messages {
			if msgMap, ok := msg.(map[string]any); ok {
				if content, ok := msgMap["content"].([]any); ok {
					for contentIdx, item := range content {
						if m, ok := item.(map[string]any); ok {
							if blockType, _ := m["type"].(string); blockType == "thinking" {
								if _, has := m["cache_control"]; has {
									delete(m, "cache_control")
									log.Printf("[Warning] Removed illegal cache_control from thinking block in messages[%d].content[%d]", msgIdx, contentIdx)
								}
							}
						}
					}
				}
			}
		}
	}
}

// Forward 转发请求到Claude API
func (s *GatewayService) Forward(ctx context.Context, c *gin.Context, account *Account, parsed *ParsedRequest) (*ForwardResult, error) {
	startTime := time.Now()
	if parsed == nil {
		return nil, fmt.Errorf("parse request: empty request")
	}

	body := parsed.Body
	reqModel := parsed.Model
	reqStream := parsed.Stream
	originalModel := reqModel
	var toolNameMap map[string]string

	isClaudeCode := isClaudeCodeRequest(ctx, c, parsed)
	shouldMimicClaudeCode := account.IsOAuth() && !isClaudeCode

	if shouldMimicClaudeCode {
		// 智能注入 Claude Code 系统提示词（仅 OAuth/SetupToken 账号需要）
		// 条件：1) OAuth/SetupToken 账号  2) 不是 Claude Code 客户端  3) 不是 Haiku 模型  4) system 中还没有 Claude Code 提示词
		if !strings.Contains(strings.ToLower(reqModel), "haiku") &&
			!systemIncludesClaudeCodePrompt(parsed.System) {
			body = injectClaudeCodePrompt(body, parsed.System)
		}

		normalizeOpts := claudeOAuthNormalizeOptions{stripSystemCacheControl: true}
		if s.identityService != nil {
			fp, err := s.identityService.GetOrCreateFingerprint(ctx, account.ID, c.Request.Header)
			if err == nil && fp != nil {
				if metadataUserID := s.buildOAuthMetadataUserID(parsed, account, fp); metadataUserID != "" {
					normalizeOpts.injectMetadata = true
					normalizeOpts.metadataUserID = metadataUserID
				}
			}
		}

		body, reqModel, toolNameMap = normalizeClaudeOAuthRequestBody(body, reqModel, normalizeOpts)
	}

	// 强制执行 cache_control 块数量限制（最多 4 个）
	body = enforceCacheControlLimit(body)

	// 应用模型映射（APIKey 明确映射优先，其次使用 Anthropic 前缀映射）
	mappedModel := reqModel
	mappingSource := ""
	if account.Type == AccountTypeAPIKey {
		mappedModel = account.GetMappedModel(reqModel)
		if mappedModel != reqModel {
			mappingSource = "account"
		}
	}
	if mappingSource == "" && account.Platform == PlatformAnthropic {
		normalized := normalizeClaudeModelForAnthropic(reqModel)
		if normalized != reqModel {
			mappedModel = normalized
			mappingSource = "prefix"
		}
	}
	if mappedModel != reqModel {
		// 替换请求体中的模型名
		body = s.replaceModelInBody(body, mappedModel)
		reqModel = mappedModel
		log.Printf("Model mapping applied: %s -> %s (account: %s, source=%s)", originalModel, mappedModel, account.Name, mappingSource)
	}

	// 获取凭证
	token, tokenType, err := s.GetAccessToken(ctx, account)
	if err != nil {
		return nil, err
	}

	// 获取代理URL
	proxyURL := ""
	if account.ProxyID != nil && account.Proxy != nil {
		proxyURL = account.Proxy.URL()
	}

	// 调试日志：记录即将转发的账号信息
	log.Printf("[Forward] Using account: ID=%d Name=%s Platform=%s Type=%s TLSFingerprint=%v Proxy=%s",
		account.ID, account.Name, account.Platform, account.Type, account.IsTLSFingerprintEnabled(), proxyURL)

	// 重试循环
	var resp *http.Response
	retryStart := time.Now()
	for attempt := 1; attempt <= maxRetryAttempts; attempt++ {
		// 构建上游请求（每次重试需要重新构建，因为请求体需要重新读取）
		// Capture upstream request body for ops retry of this attempt.
		c.Set(OpsUpstreamRequestBodyKey, string(body))
		upstreamReq, err := s.buildUpstreamRequest(ctx, c, account, body, token, tokenType, reqModel, reqStream, shouldMimicClaudeCode)
		if err != nil {
			return nil, err
		}

		// 发送请求
		resp, err = s.httpUpstream.DoWithTLS(upstreamReq, proxyURL, account.ID, account.Concurrency, account.IsTLSFingerprintEnabled())
		if err != nil {
			if resp != nil && resp.Body != nil {
				_ = resp.Body.Close()
			}
			// Ensure the client receives an error response (handlers assume Forward writes on non-failover errors).
			safeErr := sanitizeUpstreamErrorMessage(err.Error())
			setOpsUpstreamError(c, 0, safeErr, "")
			appendOpsUpstreamError(c, OpsUpstreamErrorEvent{
				Platform:           account.Platform,
				AccountID:          account.ID,
				AccountName:        account.Name,
				UpstreamStatusCode: 0,
				Kind:               "request_error",
				Message:            safeErr,
			})
			c.JSON(http.StatusBadGateway, gin.H{
				"type": "error",
				"error": gin.H{
					"type":    "upstream_error",
					"message": "Upstream request failed",
				},
			})
			return nil, fmt.Errorf("upstream request failed: %s", safeErr)
		}

		// 优先检测thinking block签名错误（400）并重试一次
		if resp.StatusCode == 400 {
			respBody, readErr := io.ReadAll(io.LimitReader(resp.Body, 2<<20))
			if readErr == nil {
				_ = resp.Body.Close()

				if s.isThinkingBlockSignatureError(respBody) {
					appendOpsUpstreamError(c, OpsUpstreamErrorEvent{
						Platform:           account.Platform,
						AccountID:          account.ID,
						AccountName:        account.Name,
						UpstreamStatusCode: resp.StatusCode,
						UpstreamRequestID:  resp.Header.Get("x-request-id"),
						Kind:               "signature_error",
						Message:            extractUpstreamErrorMessage(respBody),
						Detail: func() string {
							if s.cfg != nil && s.cfg.Gateway.LogUpstreamErrorBody {
								return truncateString(string(respBody), s.cfg.Gateway.LogUpstreamErrorBodyMaxBytes)
							}
							return ""
						}(),
					})

					looksLikeToolSignatureError := func(msg string) bool {
						m := strings.ToLower(msg)
						return strings.Contains(m, "tool_use") ||
							strings.Contains(m, "tool_result") ||
							strings.Contains(m, "functioncall") ||
							strings.Contains(m, "function_call") ||
							strings.Contains(m, "functionresponse") ||
							strings.Contains(m, "function_response")
					}

					// 避免在重试预算已耗尽时再发起额外请求
					if time.Since(retryStart) >= maxRetryElapsed {
						resp.Body = io.NopCloser(bytes.NewReader(respBody))
						break
					}
					log.Printf("Account %d: detected thinking block signature error, retrying with filtered thinking blocks", account.ID)

					// Conservative two-stage fallback:
					// 1) Disable thinking + thinking->text (preserve content)
					// 2) Only if upstream still errors AND error message points to tool/function signature issues:
					//    also downgrade tool_use/tool_result blocks to text.

					filteredBody := FilterThinkingBlocksForRetry(body)
					retryReq, buildErr := s.buildUpstreamRequest(ctx, c, account, filteredBody, token, tokenType, reqModel, reqStream, shouldMimicClaudeCode)
					if buildErr == nil {
						retryResp, retryErr := s.httpUpstream.DoWithTLS(retryReq, proxyURL, account.ID, account.Concurrency, account.IsTLSFingerprintEnabled())
						if retryErr == nil {
							if retryResp.StatusCode < 400 {
								log.Printf("Account %d: signature error retry succeeded (thinking downgraded)", account.ID)
								resp = retryResp
								break
							}

							retryRespBody, retryReadErr := io.ReadAll(io.LimitReader(retryResp.Body, 2<<20))
							_ = retryResp.Body.Close()
							if retryReadErr == nil && retryResp.StatusCode == 400 && s.isThinkingBlockSignatureError(retryRespBody) {
								appendOpsUpstreamError(c, OpsUpstreamErrorEvent{
									Platform:           account.Platform,
									AccountID:          account.ID,
									AccountName:        account.Name,
									UpstreamStatusCode: retryResp.StatusCode,
									UpstreamRequestID:  retryResp.Header.Get("x-request-id"),
									Kind:               "signature_retry_thinking",
									Message:            extractUpstreamErrorMessage(retryRespBody),
									Detail: func() string {
										if s.cfg != nil && s.cfg.Gateway.LogUpstreamErrorBody {
											return truncateString(string(retryRespBody), s.cfg.Gateway.LogUpstreamErrorBodyMaxBytes)
										}
										return ""
									}(),
								})
								msg2 := extractUpstreamErrorMessage(retryRespBody)
								if looksLikeToolSignatureError(msg2) && time.Since(retryStart) < maxRetryElapsed {
									log.Printf("Account %d: signature retry still failing and looks tool-related, retrying with tool blocks downgraded", account.ID)
									filteredBody2 := FilterSignatureSensitiveBlocksForRetry(body)
									retryReq2, buildErr2 := s.buildUpstreamRequest(ctx, c, account, filteredBody2, token, tokenType, reqModel, reqStream, shouldMimicClaudeCode)
									if buildErr2 == nil {
										retryResp2, retryErr2 := s.httpUpstream.DoWithTLS(retryReq2, proxyURL, account.ID, account.Concurrency, account.IsTLSFingerprintEnabled())
										if retryErr2 == nil {
											resp = retryResp2
											break
										}
										if retryResp2 != nil && retryResp2.Body != nil {
											_ = retryResp2.Body.Close()
										}
										appendOpsUpstreamError(c, OpsUpstreamErrorEvent{
											Platform:           account.Platform,
											AccountID:          account.ID,
											AccountName:        account.Name,
											UpstreamStatusCode: 0,
											Kind:               "signature_retry_tools_request_error",
											Message:            sanitizeUpstreamErrorMessage(retryErr2.Error()),
										})
										log.Printf("Account %d: tool-downgrade signature retry failed: %v", account.ID, retryErr2)
									} else {
										log.Printf("Account %d: tool-downgrade signature retry build failed: %v", account.ID, buildErr2)
									}
								}
							}

							// Fall back to the original retry response context.
							resp = &http.Response{
								StatusCode: retryResp.StatusCode,
								Header:     retryResp.Header.Clone(),
								Body:       io.NopCloser(bytes.NewReader(retryRespBody)),
							}
							break
						}
						if retryResp != nil && retryResp.Body != nil {
							_ = retryResp.Body.Close()
						}
						log.Printf("Account %d: signature error retry failed: %v", account.ID, retryErr)
					} else {
						log.Printf("Account %d: signature error retry build request failed: %v", account.ID, buildErr)
					}

					// Retry failed: restore original response body and continue handling.
					resp.Body = io.NopCloser(bytes.NewReader(respBody))
					break
				}
				// 不是thinking签名错误，恢复响应体
				resp.Body = io.NopCloser(bytes.NewReader(respBody))
			}
		}

		// 检查是否需要通用重试（排除400，因为400已经在上面特殊处理过了）
		if resp.StatusCode >= 400 && resp.StatusCode != 400 && s.shouldRetryUpstreamError(account, resp.StatusCode) {
			if attempt < maxRetryAttempts {
				elapsed := time.Since(retryStart)
				if elapsed >= maxRetryElapsed {
					break
				}

				delay := retryBackoffDelay(attempt)
				remaining := maxRetryElapsed - elapsed
				if delay > remaining {
					delay = remaining
				}
				if delay <= 0 {
					break
				}

				respBody, _ := io.ReadAll(io.LimitReader(resp.Body, 2<<20))
				_ = resp.Body.Close()
				appendOpsUpstreamError(c, OpsUpstreamErrorEvent{
					Platform:           account.Platform,
					AccountID:          account.ID,
					AccountName:        account.Name,
					UpstreamStatusCode: resp.StatusCode,
					UpstreamRequestID:  resp.Header.Get("x-request-id"),
					Kind:               "retry",
					Message:            extractUpstreamErrorMessage(respBody),
					Detail: func() string {
						if s.cfg != nil && s.cfg.Gateway.LogUpstreamErrorBody {
							return truncateString(string(respBody), s.cfg.Gateway.LogUpstreamErrorBodyMaxBytes)
						}
						return ""
					}(),
				})
				log.Printf("Account %d: upstream error %d, retry %d/%d after %v (elapsed=%v/%v)",
					account.ID, resp.StatusCode, attempt, maxRetryAttempts, delay, elapsed, maxRetryElapsed)
				if err := sleepWithContext(ctx, delay); err != nil {
					return nil, err
				}
				continue
			}
			// 最后一次尝试也失败，跳出循环处理重试耗尽
			break
		}

		// 不需要重试（成功或不可重试的错误），跳出循环
		// DEBUG: 输出响应 headers（用于检测 rate limit 信息）
		if account.Platform == PlatformGemini && resp.StatusCode < 400 {
			log.Printf("[DEBUG] Gemini API Response Headers for account %d:", account.ID)
			for k, v := range resp.Header {
				log.Printf("[DEBUG]   %s: %v", k, v)
			}
		}
		break
	}
	if resp == nil || resp.Body == nil {
		return nil, errors.New("upstream request failed: empty response")
	}
	defer func() { _ = resp.Body.Close() }()

	// 处理重试耗尽的情况
	if resp.StatusCode >= 400 && s.shouldRetryUpstreamError(account, resp.StatusCode) {
		if s.shouldFailoverUpstreamError(resp.StatusCode) {
			respBody, _ := io.ReadAll(io.LimitReader(resp.Body, 2<<20))
			_ = resp.Body.Close()
			resp.Body = io.NopCloser(bytes.NewReader(respBody))

			// 调试日志：打印重试耗尽后的错误响应
			log.Printf("[Forward] Upstream error (retry exhausted, failover): Account=%d(%s) Status=%d RequestID=%s Body=%s",
				account.ID, account.Name, resp.StatusCode, resp.Header.Get("x-request-id"), truncateString(string(respBody), 1000))

			s.handleRetryExhaustedSideEffects(ctx, resp, account)
			appendOpsUpstreamError(c, OpsUpstreamErrorEvent{
				Platform:           account.Platform,
				AccountID:          account.ID,
				AccountName:        account.Name,
				UpstreamStatusCode: resp.StatusCode,
				UpstreamRequestID:  resp.Header.Get("x-request-id"),
				Kind:               "retry_exhausted_failover",
				Message:            extractUpstreamErrorMessage(respBody),
				Detail: func() string {
					if s.cfg != nil && s.cfg.Gateway.LogUpstreamErrorBody {
						return truncateString(string(respBody), s.cfg.Gateway.LogUpstreamErrorBodyMaxBytes)
					}
					return ""
				}(),
			})
			return nil, &UpstreamFailoverError{StatusCode: resp.StatusCode}
		}
		return s.handleRetryExhaustedError(ctx, resp, c, account)
	}

	// 处理可切换账号的错误
	if resp.StatusCode >= 400 && s.shouldFailoverUpstreamError(resp.StatusCode) {
		respBody, _ := io.ReadAll(io.LimitReader(resp.Body, 2<<20))
		_ = resp.Body.Close()
		resp.Body = io.NopCloser(bytes.NewReader(respBody))

		// 调试日志：打印上游错误响应
		log.Printf("[Forward] Upstream error (failover): Account=%d(%s) Status=%d RequestID=%s Body=%s",
			account.ID, account.Name, resp.StatusCode, resp.Header.Get("x-request-id"), truncateString(string(respBody), 1000))

		s.handleFailoverSideEffects(ctx, resp, account)
		appendOpsUpstreamError(c, OpsUpstreamErrorEvent{
			Platform:           account.Platform,
			AccountID:          account.ID,
			UpstreamStatusCode: resp.StatusCode,
			UpstreamRequestID:  resp.Header.Get("x-request-id"),
			Kind:               "failover",
			Message:            extractUpstreamErrorMessage(respBody),
			Detail: func() string {
				if s.cfg != nil && s.cfg.Gateway.LogUpstreamErrorBody {
					return truncateString(string(respBody), s.cfg.Gateway.LogUpstreamErrorBodyMaxBytes)
				}
				return ""
			}(),
		})
		return nil, &UpstreamFailoverError{StatusCode: resp.StatusCode}
	}

	// 处理错误响应（不可重试的错误）
	if resp.StatusCode >= 400 {
		// 可选：对部分 400 触发 failover（默认关闭以保持语义）
		if resp.StatusCode == 400 && s.cfg != nil && s.cfg.Gateway.FailoverOn400 {
			respBody, readErr := io.ReadAll(io.LimitReader(resp.Body, 2<<20))
			if readErr != nil {
				// ReadAll failed, fall back to normal error handling without consuming the stream
				return s.handleErrorResponse(ctx, resp, c, account)
			}
			_ = resp.Body.Close()
			resp.Body = io.NopCloser(bytes.NewReader(respBody))

			if s.shouldFailoverOn400(respBody) {
				upstreamMsg := strings.TrimSpace(extractUpstreamErrorMessage(respBody))
				upstreamMsg = sanitizeUpstreamErrorMessage(upstreamMsg)
				upstreamDetail := ""
				if s.cfg != nil && s.cfg.Gateway.LogUpstreamErrorBody {
					maxBytes := s.cfg.Gateway.LogUpstreamErrorBodyMaxBytes
					if maxBytes <= 0 {
						maxBytes = 2048
					}
					upstreamDetail = truncateString(string(respBody), maxBytes)
				}
				appendOpsUpstreamError(c, OpsUpstreamErrorEvent{
					Platform:           account.Platform,
					AccountID:          account.ID,
					AccountName:        account.Name,
					UpstreamStatusCode: resp.StatusCode,
					UpstreamRequestID:  resp.Header.Get("x-request-id"),
					Kind:               "failover_on_400",
					Message:            upstreamMsg,
					Detail:             upstreamDetail,
				})

				if s.cfg.Gateway.LogUpstreamErrorBody {
					log.Printf(
						"Account %d: 400 error, attempting failover: %s",
						account.ID,
						truncateForLog(respBody, s.cfg.Gateway.LogUpstreamErrorBodyMaxBytes),
					)
				} else {
					log.Printf("Account %d: 400 error, attempting failover", account.ID)
				}
				s.handleFailoverSideEffects(ctx, resp, account)
				return nil, &UpstreamFailoverError{StatusCode: resp.StatusCode}
			}
		}
		return s.handleErrorResponse(ctx, resp, c, account)
	}

	// 处理正常响应
	var usage *ClaudeUsage
	var firstTokenMs *int
	var clientDisconnect bool
	if reqStream {
		streamResult, err := s.handleStreamingResponse(ctx, resp, c, account, startTime, originalModel, reqModel, toolNameMap, shouldMimicClaudeCode)
		if err != nil {
			if err.Error() == "have error in stream" {
				return nil, &UpstreamFailoverError{
					StatusCode: 403,
				}
			}
			return nil, err
		}
		usage = streamResult.usage
		firstTokenMs = streamResult.firstTokenMs
		clientDisconnect = streamResult.clientDisconnect
	} else {
		usage, err = s.handleNonStreamingResponse(ctx, resp, c, account, originalModel, reqModel, toolNameMap, shouldMimicClaudeCode)
		if err != nil {
			return nil, err
		}
	}

	return &ForwardResult{
		RequestID:        resp.Header.Get("x-request-id"),
		Usage:            *usage,
		Model:            originalModel, // 使用原始模型用于计费和日志
		Stream:           reqStream,
		Duration:         time.Since(startTime),
		FirstTokenMs:     firstTokenMs,
		ClientDisconnect: clientDisconnect,
	}, nil
}

func (s *GatewayService) buildUpstreamRequest(ctx context.Context, c *gin.Context, account *Account, body []byte, token, tokenType, modelID string, reqStream bool, mimicClaudeCode bool) (*http.Request, error) {
	// 确定目标URL
	targetURL := claudeAPIURL
	if account.Type == AccountTypeAPIKey {
		baseURL := account.GetBaseURL()
		if baseURL != "" {
			validatedURL, err := s.validateUpstreamBaseURL(baseURL)
			if err != nil {
				return nil, err
			}
			targetURL = validatedURL + "/v1/messages"
		}
	}

	clientHeaders := http.Header{}
	if c != nil && c.Request != nil {
		clientHeaders = c.Request.Header
	}

	// OAuth账号：应用统一指纹
	var fingerprint *Fingerprint
	if account.IsOAuth() && s.identityService != nil {
		// 1. 获取或创建指纹（包含随机生成的ClientID）
		fp, err := s.identityService.GetOrCreateFingerprint(ctx, account.ID, clientHeaders)
		if err != nil {
			log.Printf("Warning: failed to get fingerprint for account %d: %v", account.ID, err)
			// 失败时降级为透传原始headers
		} else {
			fingerprint = fp

			// 2. 重写metadata.user_id（需要指纹中的ClientID和账号的account_uuid）
			// 如果启用了会话ID伪装，会在重写后替换 session 部分为固定值
			accountUUID := account.GetExtraString("account_uuid")
			if accountUUID != "" && fp.ClientID != "" {
				if newBody, err := s.identityService.RewriteUserIDWithMasking(ctx, body, account, accountUUID, fp.ClientID); err == nil && len(newBody) > 0 {
					body = newBody
				}
			}
		}
	}

	req, err := http.NewRequestWithContext(ctx, "POST", targetURL, bytes.NewReader(body))
	if err != nil {
		return nil, err
	}

	// 设置认证头
	if tokenType == "oauth" {
		req.Header.Set("authorization", "Bearer "+token)
	} else {
		req.Header.Set("x-api-key", token)
	}

	// 白名单透传headers
	for key, values := range clientHeaders {
		lowerKey := strings.ToLower(key)
		if allowedHeaders[lowerKey] {
			for _, v := range values {
				req.Header.Add(key, v)
			}
		}
	}

	// OAuth账号：应用缓存的指纹到请求头（覆盖白名单透传的头）
	if fingerprint != nil {
		s.identityService.ApplyFingerprint(req, fingerprint)
	}

	// 确保必要的headers存在
	if req.Header.Get("content-type") == "" {
		req.Header.Set("content-type", "application/json")
	}
	if req.Header.Get("anthropic-version") == "" {
		req.Header.Set("anthropic-version", "2023-06-01")
	}
	if tokenType == "oauth" {
		applyClaudeOAuthHeaderDefaults(req, reqStream)
	}

	// 处理 anthropic-beta header（OAuth 账号需要包含 oauth beta）
	if tokenType == "oauth" {
		if mimicClaudeCode {
			// 非 Claude Code 客户端：按 opencode 的策略处理：
			// - 强制 Claude Code 指纹相关请求头（尤其是 user-agent/x-stainless/x-app）
			// - 保留 incoming beta 的同时，确保 OAuth 所需 beta 存在
			applyClaudeCodeMimicHeaders(req, reqStream)

			incomingBeta := req.Header.Get("anthropic-beta")
			// Match real Claude CLI traffic (per mitmproxy reports):
			// messages requests typically use only oauth + interleaved-thinking.
			// Also drop claude-code beta if a downstream client added it.
			requiredBetas := []string{claude.BetaOAuth, claude.BetaInterleavedThinking}
			drop := map[string]struct{}{claude.BetaClaudeCode: {}}
			req.Header.Set("anthropic-beta", mergeAnthropicBetaDropping(requiredBetas, incomingBeta, drop))
		} else {
			// Claude Code 客户端：尽量透传原始 header，仅补齐 oauth beta
			clientBetaHeader := req.Header.Get("anthropic-beta")
			req.Header.Set("anthropic-beta", s.getBetaHeader(modelID, clientBetaHeader))
		}
	} else if s.cfg != nil && s.cfg.Gateway.InjectBetaForAPIKey && req.Header.Get("anthropic-beta") == "" {
		// API-key：仅在请求显式使用 beta 特性且客户端未提供时，按需补齐（默认关闭）
		if requestNeedsBetaFeatures(body) {
			if beta := defaultAPIKeyBetaHeader(body); beta != "" {
				req.Header.Set("anthropic-beta", beta)
			}
		}
	}

	// Always capture a compact fingerprint line for later error diagnostics.
	// We only print it when needed (or when the explicit debug flag is enabled).
	if c != nil && tokenType == "oauth" {
		c.Set(claudeMimicDebugInfoKey, buildClaudeMimicDebugLine(req, body, account, tokenType, mimicClaudeCode))
	}
	if s.debugClaudeMimicEnabled() {
		logClaudeMimicDebug(req, body, account, tokenType, mimicClaudeCode)
	}

	return req, nil
}

// getBetaHeader 处理anthropic-beta header
// 对于OAuth账号，需要确保包含oauth-2025-04-20
func (s *GatewayService) getBetaHeader(modelID string, clientBetaHeader string) string {
	// 如果客户端传了anthropic-beta
	if clientBetaHeader != "" {
		// 已包含oauth beta则直接返回
		if strings.Contains(clientBetaHeader, claude.BetaOAuth) {
			return clientBetaHeader
		}

		// 需要添加oauth beta
		parts := strings.Split(clientBetaHeader, ",")
		for i, p := range parts {
			parts[i] = strings.TrimSpace(p)
		}

		// 在claude-code-20250219后面插入oauth beta
		claudeCodeIdx := -1
		for i, p := range parts {
			if p == claude.BetaClaudeCode {
				claudeCodeIdx = i
				break
			}
		}

		if claudeCodeIdx >= 0 {
			// 在claude-code后面插入
			newParts := make([]string, 0, len(parts)+1)
			newParts = append(newParts, parts[:claudeCodeIdx+1]...)
			newParts = append(newParts, claude.BetaOAuth)
			newParts = append(newParts, parts[claudeCodeIdx+1:]...)
			return strings.Join(newParts, ",")
		}

		// 没有claude-code，放在第一位
		return claude.BetaOAuth + "," + clientBetaHeader
	}

	// 客户端没传，根据模型生成
	// haiku 模型不需要 claude-code beta
	if strings.Contains(strings.ToLower(modelID), "haiku") {
		return claude.HaikuBetaHeader
	}

	return claude.DefaultBetaHeader
}

func requestNeedsBetaFeatures(body []byte) bool {
	tools := gjson.GetBytes(body, "tools")
	if tools.Exists() && tools.IsArray() && len(tools.Array()) > 0 {
		return true
	}
	if strings.EqualFold(gjson.GetBytes(body, "thinking.type").String(), "enabled") {
		return true
	}
	return false
}

func defaultAPIKeyBetaHeader(body []byte) string {
	modelID := gjson.GetBytes(body, "model").String()
	if strings.Contains(strings.ToLower(modelID), "haiku") {
		return claude.APIKeyHaikuBetaHeader
	}
	return claude.APIKeyBetaHeader
}

func applyClaudeOAuthHeaderDefaults(req *http.Request, isStream bool) {
	if req == nil {
		return
	}
	if req.Header.Get("accept") == "" {
		req.Header.Set("accept", "application/json")
	}
	for key, value := range claude.DefaultHeaders {
		if value == "" {
			continue
		}
		if req.Header.Get(key) == "" {
			req.Header.Set(key, value)
		}
	}
	if isStream && req.Header.Get("x-stainless-helper-method") == "" {
		req.Header.Set("x-stainless-helper-method", "stream")
	}
}

func mergeAnthropicBeta(required []string, incoming string) string {
	seen := make(map[string]struct{}, len(required)+8)
	out := make([]string, 0, len(required)+8)

	add := func(v string) {
		v = strings.TrimSpace(v)
		if v == "" {
			return
		}
		if _, ok := seen[v]; ok {
			return
		}
		seen[v] = struct{}{}
		out = append(out, v)
	}

	for _, r := range required {
		add(r)
	}
	for _, p := range strings.Split(incoming, ",") {
		add(p)
	}
	return strings.Join(out, ",")
}

func mergeAnthropicBetaDropping(required []string, incoming string, drop map[string]struct{}) string {
	merged := mergeAnthropicBeta(required, incoming)
	if merged == "" || len(drop) == 0 {
		return merged
	}
	out := make([]string, 0, 8)
	for _, p := range strings.Split(merged, ",") {
		p = strings.TrimSpace(p)
		if p == "" {
			continue
		}
		if _, ok := drop[p]; ok {
			continue
		}
		out = append(out, p)
	}
	return strings.Join(out, ",")
}

// applyClaudeCodeMimicHeaders forces "Claude Code-like" request headers.
// This mirrors opencode-anthropic-auth behavior: do not trust downstream
// headers when using Claude Code-scoped OAuth credentials.
func applyClaudeCodeMimicHeaders(req *http.Request, isStream bool) {
	if req == nil {
		return
	}
	// Start with the standard defaults (fill missing).
	applyClaudeOAuthHeaderDefaults(req, isStream)
	// Then force key headers to match Claude Code fingerprint regardless of what the client sent.
	for key, value := range claude.DefaultHeaders {
		if value == "" {
			continue
		}
		req.Header.Set(key, value)
	}
	// Real Claude CLI uses Accept: application/json (even for streaming).
	req.Header.Set("accept", "application/json")
	if isStream {
		req.Header.Set("x-stainless-helper-method", "stream")
	}
}

func truncateForLog(b []byte, maxBytes int) string {
	if maxBytes <= 0 {
		maxBytes = 2048
	}
	if len(b) > maxBytes {
		b = b[:maxBytes]
	}
	s := string(b)
	// 保持一行，避免污染日志格式
	s = strings.ReplaceAll(s, "\n", "\\n")
	s = strings.ReplaceAll(s, "\r", "\\r")
	return s
}

// isThinkingBlockSignatureError 检测是否是thinking block相关错误
// 这类错误可以通过过滤thinking blocks并重试来解决
func (s *GatewayService) isThinkingBlockSignatureError(respBody []byte) bool {
	msg := strings.ToLower(strings.TrimSpace(extractUpstreamErrorMessage(respBody)))
	if msg == "" {
		return false
	}

	// Log for debugging
	log.Printf("[SignatureCheck] Checking error message: %s", msg)

	// 检测signature相关的错误（更宽松的匹配）
	// 例如: "Invalid `signature` in `thinking` block", "***.signature" 等
	if strings.Contains(msg, "signature") {
		log.Printf("[SignatureCheck] Detected signature error")
		return true
	}

	// 检测 thinking block 顺序/类型错误
	// 例如: "Expected `thinking` or `redacted_thinking`, but found `text`"
	if strings.Contains(msg, "expected") && (strings.Contains(msg, "thinking") || strings.Contains(msg, "redacted_thinking")) {
		log.Printf("[SignatureCheck] Detected thinking block type error")
		return true
	}

	// 检测空消息内容错误（可能是过滤 thinking blocks 后导致的）
	// 例如: "all messages must have non-empty content"
	if strings.Contains(msg, "non-empty content") || strings.Contains(msg, "empty content") {
		log.Printf("[SignatureCheck] Detected empty content error")
		return true
	}

	return false
}

func (s *GatewayService) shouldFailoverOn400(respBody []byte) bool {
	// 只对“可能是兼容性差异导致”的 400 允许切换，避免无意义重试。
	// 默认保守：无法识别则不切换。
	msg := strings.ToLower(strings.TrimSpace(extractUpstreamErrorMessage(respBody)))
	if msg == "" {
		return false
	}

	// 缺少/错误的 beta header：换账号/链路可能成功（尤其是混合调度时）。
	// 更精确匹配 beta 相关的兼容性问题，避免误触发切换。
	if strings.Contains(msg, "anthropic-beta") ||
		strings.Contains(msg, "beta feature") ||
		strings.Contains(msg, "requires beta") {
		return true
	}

	// thinking/tool streaming 等兼容性约束（常见于中间转换链路）
	if strings.Contains(msg, "thinking") || strings.Contains(msg, "thought_signature") || strings.Contains(msg, "signature") {
		return true
	}
	if strings.Contains(msg, "tool_use") || strings.Contains(msg, "tool_result") || strings.Contains(msg, "tools") {
		return true
	}

	return false
}

func extractUpstreamErrorMessage(body []byte) string {
	// Claude 风格：{"type":"error","error":{"type":"...","message":"..."}}
	if m := gjson.GetBytes(body, "error.message").String(); strings.TrimSpace(m) != "" {
		inner := strings.TrimSpace(m)
		// 有些上游会把完整 JSON 作为字符串塞进 message
		if strings.HasPrefix(inner, "{") {
			if innerMsg := gjson.Get(inner, "error.message").String(); strings.TrimSpace(innerMsg) != "" {
				return innerMsg
			}
		}
		return m
	}

	// 兜底：尝试顶层 message
	return gjson.GetBytes(body, "message").String()
}

func (s *GatewayService) handleErrorResponse(ctx context.Context, resp *http.Response, c *gin.Context, account *Account) (*ForwardResult, error) {
	body, _ := io.ReadAll(io.LimitReader(resp.Body, 2<<20))

	// 调试日志：打印上游错误响应
	log.Printf("[Forward] Upstream error (non-retryable): Account=%d(%s) Status=%d RequestID=%s Body=%s",
		account.ID, account.Name, resp.StatusCode, resp.Header.Get("x-request-id"), truncateString(string(body), 1000))

	upstreamMsg := strings.TrimSpace(extractUpstreamErrorMessage(body))
	upstreamMsg = sanitizeUpstreamErrorMessage(upstreamMsg)

	// Print a compact upstream request fingerprint when we hit the Claude Code OAuth
	// credential scope error. This avoids requiring env-var tweaks in a fixed deploy.
	if isClaudeCodeCredentialScopeError(upstreamMsg) && c != nil {
		if v, ok := c.Get(claudeMimicDebugInfoKey); ok {
			if line, ok := v.(string); ok && strings.TrimSpace(line) != "" {
				log.Printf("[ClaudeMimicDebugOnError] status=%d request_id=%s %s",
					resp.StatusCode,
					resp.Header.Get("x-request-id"),
					line,
				)
			}
		}
	}

	// Enrich Ops error logs with upstream status + message, and optionally a truncated body snippet.
	upstreamDetail := ""
	if s.cfg != nil && s.cfg.Gateway.LogUpstreamErrorBody {
		maxBytes := s.cfg.Gateway.LogUpstreamErrorBodyMaxBytes
		if maxBytes <= 0 {
			maxBytes = 2048
		}
		upstreamDetail = truncateString(string(body), maxBytes)
	}
	setOpsUpstreamError(c, resp.StatusCode, upstreamMsg, upstreamDetail)
	appendOpsUpstreamError(c, OpsUpstreamErrorEvent{
		Platform:           account.Platform,
		AccountID:          account.ID,
		UpstreamStatusCode: resp.StatusCode,
		UpstreamRequestID:  resp.Header.Get("x-request-id"),
		Kind:               "http_error",
		Message:            upstreamMsg,
		Detail:             upstreamDetail,
	})

	// 处理上游错误，标记账号状态
	shouldDisable := false
	if s.rateLimitService != nil {
		shouldDisable = s.rateLimitService.HandleUpstreamError(ctx, account, resp.StatusCode, resp.Header, body)
	}
	if shouldDisable {
		return nil, &UpstreamFailoverError{StatusCode: resp.StatusCode}
	}

	// 记录上游错误响应体摘要便于排障（可选：由配置控制；不回显到客户端）
	if s.cfg != nil && s.cfg.Gateway.LogUpstreamErrorBody {
		log.Printf(
			"Upstream error %d (account=%d platform=%s type=%s): %s",
			resp.StatusCode,
			account.ID,
			account.Platform,
			account.Type,
			truncateForLog(body, s.cfg.Gateway.LogUpstreamErrorBodyMaxBytes),
		)
	}

	// 根据状态码返回适当的自定义错误响应（不透传上游详细信息）
	var errType, errMsg string
	var statusCode int

	switch resp.StatusCode {
	case 400:
		c.Data(http.StatusBadRequest, "application/json", body)
		summary := upstreamMsg
		if summary == "" {
			summary = truncateForLog(body, 512)
		}
		if summary == "" {
			return nil, fmt.Errorf("upstream error: %d", resp.StatusCode)
		}
		return nil, fmt.Errorf("upstream error: %d message=%s", resp.StatusCode, summary)
	case 401:
		statusCode = http.StatusBadGateway
		errType = "upstream_error"
		errMsg = "Upstream authentication failed, please contact administrator"
	case 403:
		statusCode = http.StatusBadGateway
		errType = "upstream_error"
		errMsg = "Upstream access forbidden, please contact administrator"
	case 429:
		statusCode = http.StatusTooManyRequests
		errType = "rate_limit_error"
		errMsg = "Upstream rate limit exceeded, please retry later"
	case 529:
		statusCode = http.StatusServiceUnavailable
		errType = "overloaded_error"
		errMsg = "Upstream service overloaded, please retry later"
	case 500, 502, 503, 504:
		statusCode = http.StatusBadGateway
		errType = "upstream_error"
		errMsg = "Upstream service temporarily unavailable"
	default:
		statusCode = http.StatusBadGateway
		errType = "upstream_error"
		errMsg = "Upstream request failed"
	}

	// 返回自定义错误响应
	c.JSON(statusCode, gin.H{
		"type": "error",
		"error": gin.H{
			"type":    errType,
			"message": errMsg,
		},
	})

	if upstreamMsg == "" {
		return nil, fmt.Errorf("upstream error: %d", resp.StatusCode)
	}
	return nil, fmt.Errorf("upstream error: %d message=%s", resp.StatusCode, upstreamMsg)
}

func (s *GatewayService) handleRetryExhaustedSideEffects(ctx context.Context, resp *http.Response, account *Account) {
	body, _ := io.ReadAll(io.LimitReader(resp.Body, 2<<20))
	statusCode := resp.StatusCode

	// OAuth/Setup Token 账号的 403：标记账号异常
	if account.IsOAuth() && statusCode == 403 {
		s.rateLimitService.HandleUpstreamError(ctx, account, statusCode, resp.Header, body)
		log.Printf("Account %d: marked as error after %d retries for status %d", account.ID, maxRetryAttempts, statusCode)
	} else {
		// API Key 未配置错误码：不标记账号状态
		log.Printf("Account %d: upstream error %d after %d retries (not marking account)", account.ID, statusCode, maxRetryAttempts)
	}
}

func (s *GatewayService) handleFailoverSideEffects(ctx context.Context, resp *http.Response, account *Account) {
	body, _ := io.ReadAll(io.LimitReader(resp.Body, 2<<20))
	s.rateLimitService.HandleUpstreamError(ctx, account, resp.StatusCode, resp.Header, body)
}

// handleRetryExhaustedError 处理重试耗尽后的错误
// OAuth 403：标记账号异常
// API Key 未配置错误码：仅返回错误，不标记账号
func (s *GatewayService) handleRetryExhaustedError(ctx context.Context, resp *http.Response, c *gin.Context, account *Account) (*ForwardResult, error) {
	// Capture upstream error body before side-effects consume the stream.
	respBody, _ := io.ReadAll(io.LimitReader(resp.Body, 2<<20))
	_ = resp.Body.Close()
	resp.Body = io.NopCloser(bytes.NewReader(respBody))

	s.handleRetryExhaustedSideEffects(ctx, resp, account)

	upstreamMsg := strings.TrimSpace(extractUpstreamErrorMessage(respBody))
	upstreamMsg = sanitizeUpstreamErrorMessage(upstreamMsg)

	if isClaudeCodeCredentialScopeError(upstreamMsg) && c != nil {
		if v, ok := c.Get(claudeMimicDebugInfoKey); ok {
			if line, ok := v.(string); ok && strings.TrimSpace(line) != "" {
				log.Printf("[ClaudeMimicDebugOnError] status=%d request_id=%s %s",
					resp.StatusCode,
					resp.Header.Get("x-request-id"),
					line,
				)
			}
		}
	}

	upstreamDetail := ""
	if s.cfg != nil && s.cfg.Gateway.LogUpstreamErrorBody {
		maxBytes := s.cfg.Gateway.LogUpstreamErrorBodyMaxBytes
		if maxBytes <= 0 {
			maxBytes = 2048
		}
		upstreamDetail = truncateString(string(respBody), maxBytes)
	}
	setOpsUpstreamError(c, resp.StatusCode, upstreamMsg, upstreamDetail)
	appendOpsUpstreamError(c, OpsUpstreamErrorEvent{
		Platform:           account.Platform,
		AccountID:          account.ID,
		UpstreamStatusCode: resp.StatusCode,
		UpstreamRequestID:  resp.Header.Get("x-request-id"),
		Kind:               "retry_exhausted",
		Message:            upstreamMsg,
		Detail:             upstreamDetail,
	})

	if s.cfg != nil && s.cfg.Gateway.LogUpstreamErrorBody {
		log.Printf(
			"Upstream error %d retries_exhausted (account=%d platform=%s type=%s): %s",
			resp.StatusCode,
			account.ID,
			account.Platform,
			account.Type,
			truncateForLog(respBody, s.cfg.Gateway.LogUpstreamErrorBodyMaxBytes),
		)
	}

	// 返回统一的重试耗尽错误响应
	c.JSON(http.StatusBadGateway, gin.H{
		"type": "error",
		"error": gin.H{
			"type":    "upstream_error",
			"message": "Upstream request failed after retries",
		},
	})

	if upstreamMsg == "" {
		return nil, fmt.Errorf("upstream error: %d (retries exhausted)", resp.StatusCode)
	}
	return nil, fmt.Errorf("upstream error: %d (retries exhausted) message=%s", resp.StatusCode, upstreamMsg)
}

// streamingResult 流式响应结果
type streamingResult struct {
	usage            *ClaudeUsage
	firstTokenMs     *int
	clientDisconnect bool // 客户端是否在流式传输过程中断开
}

func (s *GatewayService) handleStreamingResponse(ctx context.Context, resp *http.Response, c *gin.Context, account *Account, startTime time.Time, originalModel, mappedModel string, toolNameMap map[string]string, mimicClaudeCode bool) (*streamingResult, error) {
	// 更新5h窗口状态
	s.rateLimitService.UpdateSessionWindow(ctx, account, resp.Header)

	if s.cfg != nil {
		responseheaders.WriteFilteredHeaders(c.Writer.Header(), resp.Header, s.cfg.Security.ResponseHeaders)
	}

	// 设置SSE响应头
	c.Header("Content-Type", "text/event-stream")
	c.Header("Cache-Control", "no-cache")
	c.Header("Connection", "keep-alive")
	c.Header("X-Accel-Buffering", "no")

	// 透传其他响应头
	if v := resp.Header.Get("x-request-id"); v != "" {
		c.Header("x-request-id", v)
	}

	w := c.Writer
	flusher, ok := w.(http.Flusher)
	if !ok {
		return nil, errors.New("streaming not supported")
	}

	usage := &ClaudeUsage{}
	var firstTokenMs *int
	scanner := bufio.NewScanner(resp.Body)
	// 设置更大的buffer以处理长行
	maxLineSize := defaultMaxLineSize
	if s.cfg != nil && s.cfg.Gateway.MaxLineSize > 0 {
		maxLineSize = s.cfg.Gateway.MaxLineSize
	}
	scanner.Buffer(make([]byte, 64*1024), maxLineSize)

	type scanEvent struct {
		line string
		err  error
	}
	// 独立 goroutine 读取上游，避免读取阻塞导致超时/keepalive无法处理
	events := make(chan scanEvent, 16)
	done := make(chan struct{})
	sendEvent := func(ev scanEvent) bool {
		select {
		case events <- ev:
			return true
		case <-done:
			return false
		}
	}
	var lastReadAt int64
	atomic.StoreInt64(&lastReadAt, time.Now().UnixNano())
	go func() {
		defer close(events)
		for scanner.Scan() {
			atomic.StoreInt64(&lastReadAt, time.Now().UnixNano())
			if !sendEvent(scanEvent{line: scanner.Text()}) {
				return
			}
		}
		if err := scanner.Err(); err != nil {
			_ = sendEvent(scanEvent{err: err})
		}
	}()
	defer close(done)

	streamInterval := time.Duration(0)
	if s.cfg != nil && s.cfg.Gateway.StreamDataIntervalTimeout > 0 {
		streamInterval = time.Duration(s.cfg.Gateway.StreamDataIntervalTimeout) * time.Second
	}
	// 仅监控上游数据间隔超时，避免下游写入阻塞导致误判
	var intervalTicker *time.Ticker
	if streamInterval > 0 {
		intervalTicker = time.NewTicker(streamInterval)
		defer intervalTicker.Stop()
	}
	var intervalCh <-chan time.Time
	if intervalTicker != nil {
		intervalCh = intervalTicker.C
	}

	// 仅发送一次错误事件，避免多次写入导致协议混乱（写失败时尽力通知客户端）
	errorEventSent := false
	sendErrorEvent := func(reason string) {
		if errorEventSent {
			return
		}
		errorEventSent = true
		_, _ = fmt.Fprintf(w, "event: error\ndata: {\"error\":\"%s\"}\n\n", reason)
		flusher.Flush()
	}

	needModelReplace := originalModel != mappedModel
	clientDisconnected := false // 客户端断开标志，断开后继续读取上游以获取完整usage

	pendingEventLines := make([]string, 0, 4)
	var toolInputBuffers map[int]string
	if mimicClaudeCode {
		toolInputBuffers = make(map[int]string)
	}

	transformToolInputJSON := func(raw string) string {
		if !mimicClaudeCode {
			return raw
		}
		raw = strings.TrimSpace(raw)
		if raw == "" {
			return raw
		}

		var parsed any
		if err := json.Unmarshal([]byte(raw), &parsed); err != nil {
			return replaceToolNamesInText(raw, toolNameMap)
		}

		rewritten, changed := rewriteParamKeysInValue(parsed, toolNameMap)
		if changed {
			if bytes, err := json.Marshal(rewritten); err == nil {
				return string(bytes)
			}
		}
		return raw
	}

	processSSEEvent := func(lines []string) ([]string, string, error) {
		if len(lines) == 0 {
			return nil, "", nil
		}

		eventName := ""
		dataLine := ""
		for _, line := range lines {
			trimmed := strings.TrimSpace(line)
			if strings.HasPrefix(trimmed, "event:") {
				eventName = strings.TrimSpace(strings.TrimPrefix(trimmed, "event:"))
				continue
			}
			if dataLine == "" && sseDataRe.MatchString(trimmed) {
				dataLine = sseDataRe.ReplaceAllString(trimmed, "")
			}
		}

		if eventName == "error" {
			return nil, dataLine, errors.New("have error in stream")
		}

		if dataLine == "" {
			return []string{strings.Join(lines, "\n") + "\n\n"}, "", nil
		}

		if dataLine == "[DONE]" {
			block := ""
			if eventName != "" {
				block = "event: " + eventName + "\n"
			}
			block += "data: " + dataLine + "\n\n"
			return []string{block}, dataLine, nil
		}

		var event map[string]any
		if err := json.Unmarshal([]byte(dataLine), &event); err != nil {
			replaced := dataLine
			if mimicClaudeCode {
				replaced = replaceToolNamesInText(dataLine, toolNameMap)
			}
			block := ""
			if eventName != "" {
				block = "event: " + eventName + "\n"
			}
			block += "data: " + replaced + "\n\n"
			return []string{block}, replaced, nil
		}

		eventType, _ := event["type"].(string)
		if eventName == "" {
			eventName = eventType
		}

		if needModelReplace {
			if msg, ok := event["message"].(map[string]any); ok {
				if model, ok := msg["model"].(string); ok && model == mappedModel {
					msg["model"] = originalModel
				}
			}
		}

		if mimicClaudeCode && eventType == "content_block_delta" {
			if delta, ok := event["delta"].(map[string]any); ok {
				if deltaType, _ := delta["type"].(string); deltaType == "input_json_delta" {
					if indexVal, ok := event["index"].(float64); ok {
						index := int(indexVal)
						if partial, ok := delta["partial_json"].(string); ok {
							toolInputBuffers[index] += partial
						}
					}
					return nil, dataLine, nil
				}
			}
		}

		if mimicClaudeCode && eventType == "content_block_stop" {
			if indexVal, ok := event["index"].(float64); ok {
				index := int(indexVal)
				if buffered := toolInputBuffers[index]; buffered != "" {
					delete(toolInputBuffers, index)

					transformed := transformToolInputJSON(buffered)
					synthetic := map[string]any{
						"type":  "content_block_delta",
						"index": index,
						"delta": map[string]any{
							"type":         "input_json_delta",
							"partial_json": transformed,
						},
					}

					synthBytes, synthErr := json.Marshal(synthetic)
					if synthErr == nil {
						synthBlock := "event: content_block_delta\n" + "data: " + string(synthBytes) + "\n\n"

						rewriteToolNamesInValue(event, toolNameMap)
						stopBytes, stopErr := json.Marshal(event)
						if stopErr == nil {
							stopBlock := ""
							if eventName != "" {
								stopBlock = "event: " + eventName + "\n"
							}
							stopBlock += "data: " + string(stopBytes) + "\n\n"
							return []string{synthBlock, stopBlock}, string(stopBytes), nil
						}
					}
				}
			}
		}

		if mimicClaudeCode {
			rewriteToolNamesInValue(event, toolNameMap)
		}
		newData, err := json.Marshal(event)
		if err != nil {
			replaced := dataLine
			if mimicClaudeCode {
				replaced = replaceToolNamesInText(dataLine, toolNameMap)
			}
			block := ""
			if eventName != "" {
				block = "event: " + eventName + "\n"
			}
			block += "data: " + replaced + "\n\n"
			return []string{block}, replaced, nil
		}

		block := ""
		if eventName != "" {
			block = "event: " + eventName + "\n"
		}
		block += "data: " + string(newData) + "\n\n"
		return []string{block}, string(newData), nil
	}

	for {
		select {
		case ev, ok := <-events:
			if !ok {
				// 上游完成，返回结果
				return &streamingResult{usage: usage, firstTokenMs: firstTokenMs, clientDisconnect: clientDisconnected}, nil
			}
			if ev.err != nil {
				// 检测 context 取消（客户端断开会导致 context 取消，进而影响上游读取）
				if errors.Is(ev.err, context.Canceled) || errors.Is(ev.err, context.DeadlineExceeded) {
					log.Printf("Context canceled during streaming, returning collected usage")
					return &streamingResult{usage: usage, firstTokenMs: firstTokenMs, clientDisconnect: true}, nil
				}
				// 客户端已通过写入失败检测到断开，上游也出错了，返回已收集的 usage
				if clientDisconnected {
					log.Printf("Upstream read error after client disconnect: %v, returning collected usage", ev.err)
					return &streamingResult{usage: usage, firstTokenMs: firstTokenMs, clientDisconnect: true}, nil
				}
				// 客户端未断开，正常的错误处理
				if errors.Is(ev.err, bufio.ErrTooLong) {
					log.Printf("SSE line too long: account=%d max_size=%d error=%v", account.ID, maxLineSize, ev.err)
					sendErrorEvent("response_too_large")
					return &streamingResult{usage: usage, firstTokenMs: firstTokenMs}, ev.err
				}
				sendErrorEvent("stream_read_error")
				return &streamingResult{usage: usage, firstTokenMs: firstTokenMs}, fmt.Errorf("stream read error: %w", ev.err)
			}
			line := ev.line
			trimmed := strings.TrimSpace(line)

			if trimmed == "" {
				if len(pendingEventLines) == 0 {
					continue
				}

				outputBlocks, data, err := processSSEEvent(pendingEventLines)
				pendingEventLines = pendingEventLines[:0]
				if err != nil {
					if clientDisconnected {
						return &streamingResult{usage: usage, firstTokenMs: firstTokenMs, clientDisconnect: true}, nil
					}
					return nil, err
				}

				for _, block := range outputBlocks {
					if !clientDisconnected {
						if _, werr := fmt.Fprint(w, block); werr != nil {
							clientDisconnected = true
							log.Printf("Client disconnected during streaming, continuing to drain upstream for billing")
							break
						}
						flusher.Flush()
					}
					if data != "" {
						if firstTokenMs == nil && data != "[DONE]" {
							ms := int(time.Since(startTime).Milliseconds())
							firstTokenMs = &ms
						}
						s.parseSSEUsage(data, usage)
					}
				}
				continue
			}

			pendingEventLines = append(pendingEventLines, line)

		case <-intervalCh:
			lastRead := time.Unix(0, atomic.LoadInt64(&lastReadAt))
			if time.Since(lastRead) < streamInterval {
				continue
			}
			if clientDisconnected {
				// 客户端已断开，上游也超时了，返回已收集的 usage
				log.Printf("Upstream timeout after client disconnect, returning collected usage")
				return &streamingResult{usage: usage, firstTokenMs: firstTokenMs, clientDisconnect: true}, nil
			}
			log.Printf("Stream data interval timeout: account=%d model=%s interval=%s", account.ID, originalModel, streamInterval)
			// 处理流超时，可能标记账户为临时不可调度或错误状态
			if s.rateLimitService != nil {
				s.rateLimitService.HandleStreamTimeout(ctx, account, originalModel)
			}
			sendErrorEvent("stream_timeout")
			return &streamingResult{usage: usage, firstTokenMs: firstTokenMs}, fmt.Errorf("stream data interval timeout")
		}
	}

}

func rewriteParamKeysInValue(value any, cache map[string]string) (any, bool) {
	switch v := value.(type) {
	case map[string]any:
		changed := false
		rewritten := make(map[string]any, len(v))
		for key, item := range v {
			newKey := normalizeParamNameForOpenCode(key, cache)
			newItem, childChanged := rewriteParamKeysInValue(item, cache)
			if childChanged {
				changed = true
			}
			if newKey != key {
				changed = true
			}
			rewritten[newKey] = newItem
		}
		if !changed {
			return value, false
		}
		return rewritten, true
	case []any:
		changed := false
		rewritten := make([]any, len(v))
		for idx, item := range v {
			newItem, childChanged := rewriteParamKeysInValue(item, cache)
			if childChanged {
				changed = true
			}
			rewritten[idx] = newItem
		}
		if !changed {
			return value, false
		}
		return rewritten, true
	default:
		return value, false
	}
}

func rewriteToolNamesInValue(value any, toolNameMap map[string]string) bool {
	switch v := value.(type) {
	case map[string]any:
		changed := false
		if blockType, _ := v["type"].(string); blockType == "tool_use" {
			if name, ok := v["name"].(string); ok {
				mapped := normalizeToolNameForOpenCode(name, toolNameMap)
				if mapped != name {
					v["name"] = mapped
					changed = true
				}
			}
			if input, ok := v["input"].(map[string]any); ok {
				rewrittenInput, inputChanged := rewriteParamKeysInValue(input, toolNameMap)
				if inputChanged {
					if m, ok := rewrittenInput.(map[string]any); ok {
						v["input"] = m
						changed = true
					}
				}
			}
		}
		for _, item := range v {
			if rewriteToolNamesInValue(item, toolNameMap) {
				changed = true
			}
		}
		return changed
	case []any:
		changed := false
		for _, item := range v {
			if rewriteToolNamesInValue(item, toolNameMap) {
				changed = true
			}
		}
		return changed
	default:
		return false
	}
}

func replaceToolNamesInText(text string, toolNameMap map[string]string) string {
	if text == "" {
		return text
	}
	output := toolNameFieldRe.ReplaceAllStringFunc(text, func(match string) string {
		submatches := toolNameFieldRe.FindStringSubmatch(match)
		if len(submatches) < 2 {
			return match
		}
		name := submatches[1]
		mapped := normalizeToolNameForOpenCode(name, toolNameMap)
		if mapped == name {
			return match
		}
		return strings.Replace(match, name, mapped, 1)
	})
	output = modelFieldRe.ReplaceAllStringFunc(output, func(match string) string {
		submatches := modelFieldRe.FindStringSubmatch(match)
		if len(submatches) < 2 {
			return match
		}
		model := submatches[1]
		mapped := claude.DenormalizeModelID(model)
		if mapped == model {
			return match
		}
		return strings.Replace(match, model, mapped, 1)
	})

	for mapped, original := range toolNameMap {
		if mapped == "" || original == "" || mapped == original {
			continue
		}
		output = strings.ReplaceAll(output, "\""+mapped+"\":", "\""+original+"\":")
		output = strings.ReplaceAll(output, "\\\""+mapped+"\\\":", "\\\""+original+"\\\":")
	}

	return output
}

func (s *GatewayService) parseSSEUsage(data string, usage *ClaudeUsage) {
	// 解析message_start获取input tokens（标准Claude API格式）
	var msgStart struct {
		Type    string `json:"type"`
		Message struct {
			Usage ClaudeUsage `json:"usage"`
		} `json:"message"`
	}
	if json.Unmarshal([]byte(data), &msgStart) == nil && msgStart.Type == "message_start" {
		usage.InputTokens = msgStart.Message.Usage.InputTokens
		usage.CacheCreationInputTokens = msgStart.Message.Usage.CacheCreationInputTokens
		usage.CacheReadInputTokens = msgStart.Message.Usage.CacheReadInputTokens
	}

	// 解析message_delta获取tokens（兼容GLM等把所有usage放在delta中的API）
	var msgDelta struct {
		Type  string `json:"type"`
		Usage struct {
			InputTokens              int `json:"input_tokens"`
			OutputTokens             int `json:"output_tokens"`
			CacheCreationInputTokens int `json:"cache_creation_input_tokens"`
			CacheReadInputTokens     int `json:"cache_read_input_tokens"`
		} `json:"usage"`
	}
	if json.Unmarshal([]byte(data), &msgDelta) == nil && msgDelta.Type == "message_delta" {
		// message_delta 仅覆盖存在且非0的字段
		// 避免覆盖 message_start 中已有的值（如 input_tokens）
		// Claude API 的 message_delta 通常只包含 output_tokens
		if msgDelta.Usage.InputTokens > 0 {
			usage.InputTokens = msgDelta.Usage.InputTokens
		}
		if msgDelta.Usage.OutputTokens > 0 {
			usage.OutputTokens = msgDelta.Usage.OutputTokens
		}
		if msgDelta.Usage.CacheCreationInputTokens > 0 {
			usage.CacheCreationInputTokens = msgDelta.Usage.CacheCreationInputTokens
		}
		if msgDelta.Usage.CacheReadInputTokens > 0 {
			usage.CacheReadInputTokens = msgDelta.Usage.CacheReadInputTokens
		}
	}
}

func (s *GatewayService) handleNonStreamingResponse(ctx context.Context, resp *http.Response, c *gin.Context, account *Account, originalModel, mappedModel string, toolNameMap map[string]string, mimicClaudeCode bool) (*ClaudeUsage, error) {
	// 更新5h窗口状态
	s.rateLimitService.UpdateSessionWindow(ctx, account, resp.Header)

	body, err := io.ReadAll(resp.Body)
	if err != nil {
		return nil, err
	}

	// 解析usage
	var response struct {
		Usage ClaudeUsage `json:"usage"`
	}
	if err := json.Unmarshal(body, &response); err != nil {
		return nil, fmt.Errorf("parse response: %w", err)
	}

	// 如果有模型映射，替换响应中的model字段
	if originalModel != mappedModel {
		body = s.replaceModelInResponseBody(body, mappedModel, originalModel)
	}
	if mimicClaudeCode {
		body = s.replaceToolNamesInResponseBody(body, toolNameMap)
	}

	responseheaders.WriteFilteredHeaders(c.Writer.Header(), resp.Header, s.cfg.Security.ResponseHeaders)

	contentType := "application/json"
	if s.cfg != nil && !s.cfg.Security.ResponseHeaders.Enabled {
		if upstreamType := resp.Header.Get("Content-Type"); upstreamType != "" {
			contentType = upstreamType
		}
	}

	// 写入响应
	c.Data(resp.StatusCode, contentType, body)

	return &response.Usage, nil
}

// replaceModelInResponseBody 替换响应体中的model字段
func (s *GatewayService) replaceModelInResponseBody(body []byte, fromModel, toModel string) []byte {
	var resp map[string]any
	if err := json.Unmarshal(body, &resp); err != nil {
		return body
	}

	model, ok := resp["model"].(string)
	if !ok || model != fromModel {
		return body
	}

	resp["model"] = toModel
	newBody, err := json.Marshal(resp)
	if err != nil {
		return body
	}

	return newBody
}

func (s *GatewayService) replaceToolNamesInResponseBody(body []byte, toolNameMap map[string]string) []byte {
	if len(body) == 0 {
		return body
	}
	var resp map[string]any
	if err := json.Unmarshal(body, &resp); err != nil {
		replaced := replaceToolNamesInText(string(body), toolNameMap)
		if replaced == string(body) {
			return body
		}
		return []byte(replaced)
	}
	if !rewriteToolNamesInValue(resp, toolNameMap) {
		return body
	}
	newBody, err := json.Marshal(resp)
	if err != nil {
		return body
	}
	return newBody
}

// RecordUsageInput 记录使用量的输入参数
type RecordUsageInput struct {
	Result       *ForwardResult
	APIKey       *APIKey
	User         *User
	Account      *Account
	Subscription *UserSubscription // 可选：订阅信息
	UserAgent    string            // 请求的 User-Agent
	IPAddress    string            // 请求的客户端 IP 地址
}

// RecordUsage 记录使用量并扣费（或更新订阅用量）
func (s *GatewayService) RecordUsage(ctx context.Context, input *RecordUsageInput) error {
	result := input.Result
	apiKey := input.APIKey
	user := input.User
	account := input.Account
	subscription := input.Subscription

	// 获取费率倍数
	multiplier := s.cfg.Default.RateMultiplier
	if apiKey.GroupID != nil && apiKey.Group != nil {
		multiplier = apiKey.Group.RateMultiplier
	}

	var cost *CostBreakdown

	// 根据请求类型选择计费方式
	if result.ImageCount > 0 {
		// 图片生成计费
		var groupConfig *ImagePriceConfig
		if apiKey.Group != nil {
			groupConfig = &ImagePriceConfig{
				Price1K: apiKey.Group.ImagePrice1K,
				Price2K: apiKey.Group.ImagePrice2K,
				Price4K: apiKey.Group.ImagePrice4K,
			}
		}
		cost = s.billingService.CalculateImageCost(result.Model, result.ImageSize, result.ImageCount, groupConfig, multiplier)
	} else {
		// Token 计费
		tokens := UsageTokens{
			InputTokens:         result.Usage.InputTokens,
			OutputTokens:        result.Usage.OutputTokens,
			CacheCreationTokens: result.Usage.CacheCreationInputTokens,
			CacheReadTokens:     result.Usage.CacheReadInputTokens,
		}
		var err error
		cost, err = s.billingService.CalculateCost(result.Model, tokens, multiplier)
		if err != nil {
			log.Printf("Calculate cost failed: %v", err)
			cost = &CostBreakdown{ActualCost: 0}
		}
	}

	// 判断计费方式：订阅模式 vs 余额模式
	isSubscriptionBilling := subscription != nil && apiKey.Group != nil && apiKey.Group.IsSubscriptionType()
	billingType := BillingTypeBalance
	if isSubscriptionBilling {
		billingType = BillingTypeSubscription
	}

	// 创建使用日志
	durationMs := int(result.Duration.Milliseconds())
	var imageSize *string
	if result.ImageSize != "" {
		imageSize = &result.ImageSize
	}
	accountRateMultiplier := account.BillingRateMultiplier()
	usageLog := &UsageLog{
		UserID:                user.ID,
		APIKeyID:              apiKey.ID,
		AccountID:             account.ID,
		RequestID:             result.RequestID,
		Model:                 result.Model,
		InputTokens:           result.Usage.InputTokens,
		OutputTokens:          result.Usage.OutputTokens,
		CacheCreationTokens:   result.Usage.CacheCreationInputTokens,
		CacheReadTokens:       result.Usage.CacheReadInputTokens,
		InputCost:             cost.InputCost,
		OutputCost:            cost.OutputCost,
		CacheCreationCost:     cost.CacheCreationCost,
		CacheReadCost:         cost.CacheReadCost,
		TotalCost:             cost.TotalCost,
		ActualCost:            cost.ActualCost,
		RateMultiplier:        multiplier,
		AccountRateMultiplier: &accountRateMultiplier,
		BillingType:           billingType,
		Stream:                result.Stream,
		DurationMs:            &durationMs,
		FirstTokenMs:          result.FirstTokenMs,
		ImageCount:            result.ImageCount,
		ImageSize:             imageSize,
		CreatedAt:             time.Now(),
	}

	// 添加 UserAgent
	if input.UserAgent != "" {
		usageLog.UserAgent = &input.UserAgent
	}

	// 添加 IPAddress
	if input.IPAddress != "" {
		usageLog.IPAddress = &input.IPAddress
	}

	// 添加分组和订阅关联
	if apiKey.GroupID != nil {
		usageLog.GroupID = apiKey.GroupID
	}
	if subscription != nil {
		usageLog.SubscriptionID = &subscription.ID
	}

	inserted, err := s.usageLogRepo.Create(ctx, usageLog)
	if err != nil {
		log.Printf("Create usage log failed: %v", err)
	}

	if s.cfg != nil && s.cfg.RunMode == config.RunModeSimple {
		log.Printf("[SIMPLE MODE] Usage recorded (not billed): user=%d, tokens=%d", usageLog.UserID, usageLog.TotalTokens())
		s.deferredService.ScheduleLastUsedUpdate(account.ID)
		return nil
	}

	shouldBill := inserted || err != nil

	// 根据计费类型执行扣费
	if isSubscriptionBilling {
		// 订阅模式：更新订阅用量（使用 TotalCost 原始费用，不考虑倍率）
		if shouldBill && cost.TotalCost > 0 {
			if err := s.userSubRepo.IncrementUsage(ctx, subscription.ID, cost.TotalCost); err != nil {
				log.Printf("Increment subscription usage failed: %v", err)
			}
			// 异步更新订阅缓存
			s.billingCacheService.QueueUpdateSubscriptionUsage(user.ID, *apiKey.GroupID, cost.TotalCost)
		}
	} else {
		// 余额模式：扣除用户余额（使用 ActualCost 考虑倍率后的费用）
		if shouldBill && cost.ActualCost > 0 {
			if err := s.userRepo.DeductBalance(ctx, user.ID, cost.ActualCost); err != nil {
				log.Printf("Deduct balance failed: %v", err)
			}
			// 异步更新余额缓存
			s.billingCacheService.QueueDeductBalance(user.ID, cost.ActualCost)
		}
	}

	// Schedule batch update for account last_used_at
	s.deferredService.ScheduleLastUsedUpdate(account.ID)

	return nil
}

// RecordUsageLongContextInput 记录使用量的输入参数（支持长上下文双倍计费）
type RecordUsageLongContextInput struct {
	Result                *ForwardResult
	APIKey                *APIKey
	User                  *User
	Account               *Account
	Subscription          *UserSubscription // 可选：订阅信息
	UserAgent             string            // 请求的 User-Agent
	IPAddress             string            // 请求的客户端 IP 地址
	LongContextThreshold  int               // 长上下文阈值（如 200000）
	LongContextMultiplier float64           // 超出阈值部分的倍率（如 2.0）
}

// RecordUsageWithLongContext 记录使用量并扣费，支持长上下文双倍计费（用于 Gemini）
func (s *GatewayService) RecordUsageWithLongContext(ctx context.Context, input *RecordUsageLongContextInput) error {
	result := input.Result
	apiKey := input.APIKey
	user := input.User
	account := input.Account
	subscription := input.Subscription

	// 获取费率倍数
	multiplier := s.cfg.Default.RateMultiplier
	if apiKey.GroupID != nil && apiKey.Group != nil {
		multiplier = apiKey.Group.RateMultiplier
	}

	var cost *CostBreakdown

	// 根据请求类型选择计费方式
	if result.ImageCount > 0 {
		// 图片生成计费
		var groupConfig *ImagePriceConfig
		if apiKey.Group != nil {
			groupConfig = &ImagePriceConfig{
				Price1K: apiKey.Group.ImagePrice1K,
				Price2K: apiKey.Group.ImagePrice2K,
				Price4K: apiKey.Group.ImagePrice4K,
			}
		}
		cost = s.billingService.CalculateImageCost(result.Model, result.ImageSize, result.ImageCount, groupConfig, multiplier)
	} else {
		// Token 计费（使用长上下文计费方法）
		tokens := UsageTokens{
			InputTokens:         result.Usage.InputTokens,
			OutputTokens:        result.Usage.OutputTokens,
			CacheCreationTokens: result.Usage.CacheCreationInputTokens,
			CacheReadTokens:     result.Usage.CacheReadInputTokens,
		}
		var err error
		cost, err = s.billingService.CalculateCostWithLongContext(result.Model, tokens, multiplier, input.LongContextThreshold, input.LongContextMultiplier)
		if err != nil {
			log.Printf("Calculate cost failed: %v", err)
			cost = &CostBreakdown{ActualCost: 0}
		}
	}

	// 判断计费方式：订阅模式 vs 余额模式
	isSubscriptionBilling := subscription != nil && apiKey.Group != nil && apiKey.Group.IsSubscriptionType()
	billingType := BillingTypeBalance
	if isSubscriptionBilling {
		billingType = BillingTypeSubscription
	}

	// 创建使用日志
	durationMs := int(result.Duration.Milliseconds())
	var imageSize *string
	if result.ImageSize != "" {
		imageSize = &result.ImageSize
	}
	accountRateMultiplier := account.BillingRateMultiplier()
	usageLog := &UsageLog{
		UserID:                user.ID,
		APIKeyID:              apiKey.ID,
		AccountID:             account.ID,
		RequestID:             result.RequestID,
		Model:                 result.Model,
		InputTokens:           result.Usage.InputTokens,
		OutputTokens:          result.Usage.OutputTokens,
		CacheCreationTokens:   result.Usage.CacheCreationInputTokens,
		CacheReadTokens:       result.Usage.CacheReadInputTokens,
		InputCost:             cost.InputCost,
		OutputCost:            cost.OutputCost,
		CacheCreationCost:     cost.CacheCreationCost,
		CacheReadCost:         cost.CacheReadCost,
		TotalCost:             cost.TotalCost,
		ActualCost:            cost.ActualCost,
		RateMultiplier:        multiplier,
		AccountRateMultiplier: &accountRateMultiplier,
		BillingType:           billingType,
		Stream:                result.Stream,
		DurationMs:            &durationMs,
		FirstTokenMs:          result.FirstTokenMs,
		ImageCount:            result.ImageCount,
		ImageSize:             imageSize,
		CreatedAt:             time.Now(),
	}

	// 添加 UserAgent
	if input.UserAgent != "" {
		usageLog.UserAgent = &input.UserAgent
	}

	// 添加 IPAddress
	if input.IPAddress != "" {
		usageLog.IPAddress = &input.IPAddress
	}

	// 添加分组和订阅关联
	if apiKey.GroupID != nil {
		usageLog.GroupID = apiKey.GroupID
	}
	if subscription != nil {
		usageLog.SubscriptionID = &subscription.ID
	}

	inserted, err := s.usageLogRepo.Create(ctx, usageLog)
	if err != nil {
		log.Printf("Create usage log failed: %v", err)
	}

	if s.cfg != nil && s.cfg.RunMode == config.RunModeSimple {
		log.Printf("[SIMPLE MODE] Usage recorded (not billed): user=%d, tokens=%d", usageLog.UserID, usageLog.TotalTokens())
		s.deferredService.ScheduleLastUsedUpdate(account.ID)
		return nil
	}

	shouldBill := inserted || err != nil

	// 根据计费类型执行扣费
	if isSubscriptionBilling {
		// 订阅模式：更新订阅用量（使用 TotalCost 原始费用，不考虑倍率）
		if shouldBill && cost.TotalCost > 0 {
			if err := s.userSubRepo.IncrementUsage(ctx, subscription.ID, cost.TotalCost); err != nil {
				log.Printf("Increment subscription usage failed: %v", err)
			}
			// 异步更新订阅缓存
			s.billingCacheService.QueueUpdateSubscriptionUsage(user.ID, *apiKey.GroupID, cost.TotalCost)
		}
	} else {
		// 余额模式：扣除用户余额（使用 ActualCost 考虑倍率后的费用）
		if shouldBill && cost.ActualCost > 0 {
			if err := s.userRepo.DeductBalance(ctx, user.ID, cost.ActualCost); err != nil {
				log.Printf("Deduct balance failed: %v", err)
			}
			// 异步更新余额缓存
			s.billingCacheService.QueueDeductBalance(user.ID, cost.ActualCost)
		}
	}

	// Schedule batch update for account last_used_at
	s.deferredService.ScheduleLastUsedUpdate(account.ID)

	return nil
}

// ForwardCountTokens 转发 count_tokens 请求到上游 API
// 特点：不记录使用量、仅支持非流式响应
func (s *GatewayService) ForwardCountTokens(ctx context.Context, c *gin.Context, account *Account, parsed *ParsedRequest) error {
	if parsed == nil {
		s.countTokensError(c, http.StatusBadRequest, "invalid_request_error", "Request body is empty")
		return fmt.Errorf("parse request: empty request")
	}

	body := parsed.Body
	reqModel := parsed.Model

	isClaudeCode := isClaudeCodeRequest(ctx, c, parsed)
	shouldMimicClaudeCode := account.IsOAuth() && !isClaudeCode

	if shouldMimicClaudeCode {
		normalizeOpts := claudeOAuthNormalizeOptions{stripSystemCacheControl: true}
		body, reqModel, _ = normalizeClaudeOAuthRequestBody(body, reqModel, normalizeOpts)
	}

	// Antigravity 账户不支持 count_tokens 转发，直接返回空值
	if account.Platform == PlatformAntigravity {
		c.JSON(http.StatusOK, gin.H{"input_tokens": 0})
		return nil
	}

	// 应用模型映射（APIKey 明确映射优先，其次使用 Anthropic 前缀映射）
	if reqModel != "" {
		mappedModel := reqModel
		mappingSource := ""
		if account.Type == AccountTypeAPIKey {
			mappedModel = account.GetMappedModel(reqModel)
			if mappedModel != reqModel {
				mappingSource = "account"
			}
		}
		if mappingSource == "" && account.Platform == PlatformAnthropic {
			normalized := normalizeClaudeModelForAnthropic(reqModel)
			if normalized != reqModel {
				mappedModel = normalized
				mappingSource = "prefix"
			}
		}
		if mappedModel != reqModel {
			body = s.replaceModelInBody(body, mappedModel)
			reqModel = mappedModel
			log.Printf("CountTokens model mapping applied: %s -> %s (account: %s, source=%s)", parsed.Model, mappedModel, account.Name, mappingSource)
		}
	}

	// 获取凭证
	token, tokenType, err := s.GetAccessToken(ctx, account)
	if err != nil {
		s.countTokensError(c, http.StatusBadGateway, "upstream_error", "Failed to get access token")
		return err
	}

	// 构建上游请求
	upstreamReq, err := s.buildCountTokensRequest(ctx, c, account, body, token, tokenType, reqModel, shouldMimicClaudeCode)
	if err != nil {
		s.countTokensError(c, http.StatusInternalServerError, "api_error", "Failed to build request")
		return err
	}

	// 获取代理URL
	proxyURL := ""
	if account.ProxyID != nil && account.Proxy != nil {
		proxyURL = account.Proxy.URL()
	}

	// 发送请求
	resp, err := s.httpUpstream.DoWithTLS(upstreamReq, proxyURL, account.ID, account.Concurrency, account.IsTLSFingerprintEnabled())
	if err != nil {
		setOpsUpstreamError(c, 0, sanitizeUpstreamErrorMessage(err.Error()), "")
		s.countTokensError(c, http.StatusBadGateway, "upstream_error", "Request failed")
		return fmt.Errorf("upstream request failed: %w", err)
	}

	// 读取响应体
	respBody, err := io.ReadAll(resp.Body)
	_ = resp.Body.Close()
	if err != nil {
		s.countTokensError(c, http.StatusBadGateway, "upstream_error", "Failed to read response")
		return err
	}

	// 检测 thinking block 签名错误（400）并重试一次（过滤 thinking blocks）
	if resp.StatusCode == 400 && s.isThinkingBlockSignatureError(respBody) {
		log.Printf("Account %d: detected thinking block signature error on count_tokens, retrying with filtered thinking blocks", account.ID)

		filteredBody := FilterThinkingBlocksForRetry(body)
		retryReq, buildErr := s.buildCountTokensRequest(ctx, c, account, filteredBody, token, tokenType, reqModel, shouldMimicClaudeCode)
		if buildErr == nil {
			retryResp, retryErr := s.httpUpstream.DoWithTLS(retryReq, proxyURL, account.ID, account.Concurrency, account.IsTLSFingerprintEnabled())
			if retryErr == nil {
				resp = retryResp
				respBody, err = io.ReadAll(resp.Body)
				_ = resp.Body.Close()
				if err != nil {
					s.countTokensError(c, http.StatusBadGateway, "upstream_error", "Failed to read response")
					return err
				}
			}
		}
	}

	// 处理错误响应
	if resp.StatusCode >= 400 {
		// 标记账号状态（429/529等）
		s.rateLimitService.HandleUpstreamError(ctx, account, resp.StatusCode, resp.Header, respBody)

		upstreamMsg := strings.TrimSpace(extractUpstreamErrorMessage(respBody))
		upstreamMsg = sanitizeUpstreamErrorMessage(upstreamMsg)
		upstreamDetail := ""
		if s.cfg != nil && s.cfg.Gateway.LogUpstreamErrorBody {
			maxBytes := s.cfg.Gateway.LogUpstreamErrorBodyMaxBytes
			if maxBytes <= 0 {
				maxBytes = 2048
			}
			upstreamDetail = truncateString(string(respBody), maxBytes)
		}
		setOpsUpstreamError(c, resp.StatusCode, upstreamMsg, upstreamDetail)

		// 记录上游错误摘要便于排障（不回显请求内容）
		if s.cfg != nil && s.cfg.Gateway.LogUpstreamErrorBody {
			log.Printf(
				"count_tokens upstream error %d (account=%d platform=%s type=%s): %s",
				resp.StatusCode,
				account.ID,
				account.Platform,
				account.Type,
				truncateForLog(respBody, s.cfg.Gateway.LogUpstreamErrorBodyMaxBytes),
			)
		}

		// 返回简化的错误响应
		errMsg := "Upstream request failed"
		switch resp.StatusCode {
		case 429:
			errMsg = "Rate limit exceeded"
		case 529:
			errMsg = "Service overloaded"
		}
		s.countTokensError(c, resp.StatusCode, "upstream_error", errMsg)
		if upstreamMsg == "" {
			return fmt.Errorf("upstream error: %d", resp.StatusCode)
		}
		return fmt.Errorf("upstream error: %d message=%s", resp.StatusCode, upstreamMsg)
	}

	// 透传成功响应
	c.Data(resp.StatusCode, "application/json", respBody)
	return nil
}

// buildCountTokensRequest 构建 count_tokens 上游请求
func (s *GatewayService) buildCountTokensRequest(ctx context.Context, c *gin.Context, account *Account, body []byte, token, tokenType, modelID string, mimicClaudeCode bool) (*http.Request, error) {
	// 确定目标 URL
	targetURL := claudeAPICountTokensURL
	if account.Type == AccountTypeAPIKey {
		baseURL := account.GetBaseURL()
		if baseURL != "" {
			validatedURL, err := s.validateUpstreamBaseURL(baseURL)
			if err != nil {
				return nil, err
			}
			targetURL = validatedURL + "/v1/messages/count_tokens"
		}
	}

	clientHeaders := http.Header{}
	if c != nil && c.Request != nil {
		clientHeaders = c.Request.Header
	}

	// OAuth 账号：应用统一指纹和重写 userID
	// 如果启用了会话ID伪装，会在重写后替换 session 部分为固定值
	if account.IsOAuth() && s.identityService != nil {
		fp, err := s.identityService.GetOrCreateFingerprint(ctx, account.ID, clientHeaders)
		if err == nil {
			accountUUID := account.GetExtraString("account_uuid")
			if accountUUID != "" && fp.ClientID != "" {
				if newBody, err := s.identityService.RewriteUserIDWithMasking(ctx, body, account, accountUUID, fp.ClientID); err == nil && len(newBody) > 0 {
					body = newBody
				}
			}
		}
	}

	req, err := http.NewRequestWithContext(ctx, "POST", targetURL, bytes.NewReader(body))
	if err != nil {
		return nil, err
	}

	// 设置认证头
	if tokenType == "oauth" {
		req.Header.Set("authorization", "Bearer "+token)
	} else {
		req.Header.Set("x-api-key", token)
	}

	// 白名单透传 headers
	for key, values := range clientHeaders {
		lowerKey := strings.ToLower(key)
		if allowedHeaders[lowerKey] {
			for _, v := range values {
				req.Header.Add(key, v)
			}
		}
	}

	// OAuth 账号：应用指纹到请求头
	if account.IsOAuth() && s.identityService != nil {
		fp, _ := s.identityService.GetOrCreateFingerprint(ctx, account.ID, clientHeaders)
		if fp != nil {
			s.identityService.ApplyFingerprint(req, fp)
		}
	}

	// 确保必要的 headers 存在
	if req.Header.Get("content-type") == "" {
		req.Header.Set("content-type", "application/json")
	}
	if req.Header.Get("anthropic-version") == "" {
		req.Header.Set("anthropic-version", "2023-06-01")
	}
	if tokenType == "oauth" {
		applyClaudeOAuthHeaderDefaults(req, false)
	}

	// OAuth 账号：处理 anthropic-beta header
	if tokenType == "oauth" {
		if mimicClaudeCode {
			applyClaudeCodeMimicHeaders(req, false)

			incomingBeta := req.Header.Get("anthropic-beta")
			requiredBetas := []string{claude.BetaClaudeCode, claude.BetaOAuth, claude.BetaInterleavedThinking, claude.BetaTokenCounting}
			req.Header.Set("anthropic-beta", mergeAnthropicBeta(requiredBetas, incomingBeta))
		} else {
			clientBetaHeader := req.Header.Get("anthropic-beta")
			if clientBetaHeader == "" {
				req.Header.Set("anthropic-beta", claude.CountTokensBetaHeader)
			} else {
				beta := s.getBetaHeader(modelID, clientBetaHeader)
				if !strings.Contains(beta, claude.BetaTokenCounting) {
					beta = beta + "," + claude.BetaTokenCounting
				}
				req.Header.Set("anthropic-beta", beta)
			}
		}
	} else if s.cfg != nil && s.cfg.Gateway.InjectBetaForAPIKey && req.Header.Get("anthropic-beta") == "" {
		// API-key：与 messages 同步的按需 beta 注入（默认关闭）
		if requestNeedsBetaFeatures(body) {
			if beta := defaultAPIKeyBetaHeader(body); beta != "" {
				req.Header.Set("anthropic-beta", beta)
			}
		}
	}

	if c != nil && tokenType == "oauth" {
		c.Set(claudeMimicDebugInfoKey, buildClaudeMimicDebugLine(req, body, account, tokenType, mimicClaudeCode))
	}
	if s.debugClaudeMimicEnabled() {
		logClaudeMimicDebug(req, body, account, tokenType, mimicClaudeCode)
	}

	return req, nil
}

// countTokensError 返回 count_tokens 错误响应
func (s *GatewayService) countTokensError(c *gin.Context, status int, errType, message string) {
	c.JSON(status, gin.H{
		"type": "error",
		"error": gin.H{
			"type":    errType,
			"message": message,
		},
	})
}

func (s *GatewayService) validateUpstreamBaseURL(raw string) (string, error) {
	if s.cfg != nil && !s.cfg.Security.URLAllowlist.Enabled {
		normalized, err := urlvalidator.ValidateURLFormat(raw, s.cfg.Security.URLAllowlist.AllowInsecureHTTP)
		if err != nil {
			return "", fmt.Errorf("invalid base_url: %w", err)
		}
		return normalized, nil
	}
	normalized, err := urlvalidator.ValidateHTTPSURL(raw, urlvalidator.ValidationOptions{
		AllowedHosts:     s.cfg.Security.URLAllowlist.UpstreamHosts,
		RequireAllowlist: true,
		AllowPrivate:     s.cfg.Security.URLAllowlist.AllowPrivateHosts,
	})
	if err != nil {
		return "", fmt.Errorf("invalid base_url: %w", err)
	}
	return normalized, nil
}

// checkAntigravityModelScope 检查 Antigravity 平台的模型系列是否在分组支持范围内
func (s *GatewayService) checkAntigravityModelScope(ctx context.Context, groupID int64, requestedModel string) error {
	scope, ok := ResolveAntigravityQuotaScope(requestedModel)
	if !ok {
		return nil // 无法解析 scope，跳过检查
	}

	group, err := s.resolveGroupByID(ctx, groupID)
	if err != nil {
		return nil // 查询失败时放行
	}
	if group == nil {
		return nil // 分组不存在时放行
	}

	if !IsScopeSupported(group.SupportedModelScopes, scope) {
		return ErrModelScopeNotSupported
	}
	return nil
}

// GetAvailableModels returns the list of models available for a group
// It aggregates model_mapping keys from all schedulable accounts in the group
func (s *GatewayService) GetAvailableModels(ctx context.Context, groupID *int64, platform string) []string {
	var accounts []Account
	var err error

	if groupID != nil {
		accounts, err = s.accountRepo.ListSchedulableByGroupID(ctx, *groupID)
	} else {
		accounts, err = s.accountRepo.ListSchedulable(ctx)
	}

	if err != nil || len(accounts) == 0 {
		return nil
	}

	// Filter by platform if specified
	if platform != "" {
		filtered := make([]Account, 0)
		for _, acc := range accounts {
			if acc.Platform == platform {
				filtered = append(filtered, acc)
			}
		}
		accounts = filtered
	}

	// Collect unique models from all accounts
	modelSet := make(map[string]struct{})
	hasAnyMapping := false

	for _, acc := range accounts {
		mapping := acc.GetModelMapping()
		if len(mapping) > 0 {
			hasAnyMapping = true
			for model := range mapping {
				modelSet[model] = struct{}{}
			}
		}
	}

	// If no account has model_mapping, return nil (use default)
	if !hasAnyMapping {
		return nil
	}

	// Convert to slice
	models := make([]string, 0, len(modelSet))
	for model := range modelSet {
		models = append(models, model)
	}

	return models
}
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+								package service
 								import (
 									"bufio"
 									"bytes"
 									"context"
 									"crypto/sha256"
 									"encoding/hex"
 									"encoding/json"
 									"errors"
 									"fmt"
 									"io"
 									"log"
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+									"log/slog"
-												feat(scheduling): 兜底层账户选择策略可配置

- gateway.scheduling.fallback_selection_mode: "last_used"(默认) 或 "random"
- last_used: 按最后使用时间排序（轮询效果）
- random: 同优先级内随机选择

											
										
										
											2026-01-16 20:47:07 +08:00
+									mathrand "math/rand"
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									"net/http"
-												feat(group): 添加分组级别模型路由配置功能
  支持为分组配置模型路由规则，可以指定特定模型模式优先使用的账号列表。

  - 新增 model_routing 字段存储路由配置（JSONB格式，支持通配符匹配）

  - 新增 model_routing_enabled 字段控制是否启用路由

  - 更新后端 handler/service/repository 支持路由配置的增删改查

  - 更新前端 GroupsView 添加路由配置界面

  - 添加数据库迁移脚本 040/041

											
										
										
											2026-01-16 17:26:05 +08:00
+									"os"
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									"regexp"
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+									"sort"
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									"strings"
-												fix(流式): 以上游读取判定超时并调大事件缓冲

- 以读取时间戳判定流式间隔超时，避免下游阻塞误判
- antigravity 流式读取使用 MaxLineSize 配置
- 事件通道缓冲提升到 16

测试: go test ./...

											
										
										
											2026-01-04 20:19:07 +08:00
+									"sync/atomic"
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									"time"
-												fix(网关): 对齐 Claude OAuth 请求适配

											
										
										
											2026-01-15 18:54:42 +08:00
+									"unicode"
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
-												refactor: 重命名 go module

											
										
										
											2025-12-24 21:07:21 +08:00
+									"github.com/Wei-Shaw/sub2api/internal/config"
 									"github.com/Wei-Shaw/sub2api/internal/pkg/claude"
-												fix: 修复 golangci-lint 检查错误

- SA1029: 创建 ctxkey 包定义类型安全的 context key
- ST1005: 错误字符串首字母改小写
- errcheck: 显式忽略 bytes.Buffer.Write 返回值
- 修复单元测试中 GatewayService 缺少 cfg 字段的问题

											
										
										
											2025-12-29 17:46:52 +08:00
+									"github.com/Wei-Shaw/sub2api/internal/pkg/ctxkey"
-												feat(安全): 强化安全策略与配置校验

- 增加 CORS/CSP/安全响应头与代理信任配置

- 引入 URL 白名单与私网开关，校验上游与价格源

- 改善 API Key 处理与网关错误返回

- 管理端设置隐藏敏感字段并优化前端提示

- 增加计费熔断与相关配置示例

测试: go test ./...

											
										
										
											2026-01-02 17:40:57 +08:00
+									"github.com/Wei-Shaw/sub2api/internal/util/responseheaders"
 									"github.com/Wei-Shaw/sub2api/internal/util/urlvalidator"
-												fix(网关): 对齐 Claude OAuth 请求适配

											
										
										
											2026-01-15 18:54:42 +08:00
+									"github.com/google/uuid"
-												CC 400 返回具体错误信息 && 非 CC 请求时增加 system prompt (#26)

* feat: http 400 返回具体错误

* 更新 workflows

* 优化打包/docker 构建流程

* 400 是返回 原始错误 - json 格式

* feat: 非 cc请求时补充 system

* go mod tidy
											
										
										
											2025-12-25 14:47:19 +08:00
+									"github.com/tidwall/gjson"
 									"github.com/tidwall/sjson"
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
 									"github.com/gin-gonic/gin"
 								)
 								const (
-												feat(gateway): 添加 /v1/messages/count_tokens 端点

实现 Claude API 的 token 计数功能，支持 OAuth、SetupToken 和 ApiKey 三种账号类型。

特点：
- 校验订阅/余额（不扣费）
- 不计算用户和账号并发
- 不记录使用量
- 支持模型映射（ApiKey 账号）
- 支持 OAuth 账号的指纹管理和 401 重试

											
										
										
											2025-12-19 11:12:41 +08:00
+									claudeAPIURL            = "https://api.anthropic.com/v1/messages?beta=true"
 									claudeAPICountTokensURL = "https://api.anthropic.com/v1/messages/count_tokens?beta=true"
 									stickySessionTTL        = time.Hour // 粘性会话TTL
-												chore: 提升 SSE 单行上限到 40MB

											
										
										
											2026-01-09 20:57:06 +08:00
+									defaultMaxLineSize      = 40 * 1024 * 1024
-												fix: align Claude Code system banner with opencode latest

											
										
										
											2026-01-29 15:37:07 +08:00
+									// Canonical Claude Code banner. Keep it EXACT (no trailing whitespace/newlines)
 									// to match real Claude CLI traffic as closely as possible. When we need a visual
 									// separator between system blocks, we add "\n\n" at concatenation time.
 									claudeCodeSystemPrompt = "You are Claude Code, Anthropic's official CLI for Claude."
-												chore: gofmt

											
										
										
											2026-01-29 01:34:58 +08:00
+									maxCacheControlBlocks  = 4 // Anthropic API 允许的最大 cache_control 块数量
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+								)
-												chore(debug): emit Claude mimic fingerprint on credential-scope error

											
										
										
											2026-01-29 15:17:46 +08:00
+								const (
 									claudeMimicDebugInfoKey = "claude_mimic_debug_info"
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+								)
-												feat(group): 添加分组级别模型路由配置功能
  支持为分组配置模型路由规则，可以指定特定模型模式优先使用的账号列表。

  - 新增 model_routing 字段存储路由配置（JSONB格式，支持通配符匹配）

  - 新增 model_routing_enabled 字段控制是否启用路由

  - 更新后端 handler/service/repository 支持路由配置的增删改查

  - 更新前端 GroupsView 添加路由配置界面

  - 添加数据库迁移脚本 040/041

											
										
										
											2026-01-16 17:26:05 +08:00
+								func (s *GatewayService) debugModelRoutingEnabled() bool {
 									v := strings.ToLower(strings.TrimSpace(os.Getenv("SUB2API_DEBUG_MODEL_ROUTING")))
 									return v == "1" || v == "true" || v == "yes" || v == "on"
 								}
-												chore(debug): log Claude mimic fingerprint

											
										
										
											2026-01-29 03:13:14 +08:00
+								func (s *GatewayService) debugClaudeMimicEnabled() bool {
 									v := strings.ToLower(strings.TrimSpace(os.Getenv("SUB2API_DEBUG_CLAUDE_MIMIC")))
 									return v == "1" || v == "true" || v == "yes" || v == "on"
 								}
-												feat(group): 添加分组级别模型路由配置功能
  支持为分组配置模型路由规则，可以指定特定模型模式优先使用的账号列表。

  - 新增 model_routing 字段存储路由配置（JSONB格式，支持通配符匹配）

  - 新增 model_routing_enabled 字段控制是否启用路由

  - 更新后端 handler/service/repository 支持路由配置的增删改查

  - 更新前端 GroupsView 添加路由配置界面

  - 添加数据库迁移脚本 040/041

											
										
										
											2026-01-16 17:26:05 +08:00
+								func shortSessionHash(sessionHash string) string {
 									if sessionHash == "" {
 										return ""
 									}
 									if len(sessionHash) <= 8 {
 										return sessionHash
 									}
 									return sessionHash[:8]
 								}
-												Add invalid-request fallback routing

											
										
										
											2026-01-23 22:24:46 +08:00
+								func normalizeClaudeModelForAnthropic(requestedModel string) string {
 									for _, prefix := range anthropicPrefixMappings {
 										if strings.HasPrefix(requestedModel, prefix) {
 											return prefix
 										}
 									}
 									return requestedModel
 								}
-												chore(debug): log Claude mimic fingerprint

											
										
										
											2026-01-29 03:13:14 +08:00
+								func redactAuthHeaderValue(v string) string {
 									v = strings.TrimSpace(v)
 									if v == "" {
 										return ""
 									}
 									// Keep scheme for debugging, redact secret.
 									if strings.HasPrefix(strings.ToLower(v), "bearer ") {
 										return "Bearer [redacted]"
 									}
 									return "[redacted]"
 								}
 								func safeHeaderValueForLog(key string, v string) string {
 									key = strings.ToLower(strings.TrimSpace(key))
 									switch key {
 									case "authorization", "x-api-key":
 										return redactAuthHeaderValue(v)
 									default:
 										return strings.TrimSpace(v)
 									}
 								}
 								func extractSystemPreviewFromBody(body []byte) string {
 									if len(body) == 0 {
 										return ""
 									}
 									sys := gjson.GetBytes(body, "system")
 									if !sys.Exists() {
 										return ""
 									}
 									switch {
 									case sys.IsArray():
 										for _, item := range sys.Array() {
 											if !item.IsObject() {
 												continue
 											}
 											if strings.EqualFold(item.Get("type").String(), "text") {
 												if t := item.Get("text").String(); strings.TrimSpace(t) != "" {
 													return t
 												}
 											}
 										}
 										return ""
 									case sys.Type == gjson.String:
 										return sys.String()
 									default:
 										return ""
 									}
 								}
-												chore(debug): emit Claude mimic fingerprint on credential-scope error

											
										
										
											2026-01-29 15:17:46 +08:00
+								func buildClaudeMimicDebugLine(req *http.Request, body []byte, account *Account, tokenType string, mimicClaudeCode bool) string {
-												chore(debug): log Claude mimic fingerprint

											
										
										
											2026-01-29 03:13:14 +08:00
+									if req == nil {
-												chore(debug): emit Claude mimic fingerprint on credential-scope error

											
										
										
											2026-01-29 15:17:46 +08:00
+										return ""
-												chore(debug): log Claude mimic fingerprint

											
										
										
											2026-01-29 03:13:14 +08:00
+									}
 									// Only log a minimal fingerprint to avoid leaking user content.
 									interesting := []string{
 										"user-agent",
 										"x-app",
 										"anthropic-dangerous-direct-browser-access",
 										"anthropic-version",
 										"anthropic-beta",
 										"x-stainless-lang",
 										"x-stainless-package-version",
 										"x-stainless-os",
 										"x-stainless-arch",
 										"x-stainless-runtime",
 										"x-stainless-runtime-version",
 										"x-stainless-retry-count",
 										"x-stainless-timeout",
 										"authorization",
 										"x-api-key",
 										"content-type",
 										"accept",
 										"x-stainless-helper-method",
 									}
 									h := make([]string, 0, len(interesting))
 									for _, k := range interesting {
 										if v := req.Header.Get(k); v != "" {
 											h = append(h, fmt.Sprintf("%s=%q", k, safeHeaderValueForLog(k, v)))
 										}
 									}
 									metaUserID := strings.TrimSpace(gjson.GetBytes(body, "metadata.user_id").String())
 									sysPreview := strings.TrimSpace(extractSystemPreviewFromBody(body))
 									// Truncate preview to keep logs sane.
 									if len(sysPreview) > 300 {
 										sysPreview = sysPreview[:300] + "..."
 									}
 									sysPreview = strings.ReplaceAll(sysPreview, "\n", "\\n")
 									sysPreview = strings.ReplaceAll(sysPreview, "\r", "\\r")
 									aid := int64(0)
 									aname := ""
 									if account != nil {
 										aid = account.ID
 										aname = account.Name
 									}
-												chore(debug): emit Claude mimic fingerprint on credential-scope error

											
										
										
											2026-01-29 15:17:46 +08:00
+									return fmt.Sprintf(
 										"url=%s account=%d(%s) tokenType=%s mimic=%t meta.user_id=%q system.preview=%q headers={%s}",
-												chore(debug): log Claude mimic fingerprint

											
										
										
											2026-01-29 03:13:14 +08:00
+										req.URL.String(),
 										aid,
 										aname,
 										tokenType,
 										mimicClaudeCode,
 										metaUserID,
 										sysPreview,
 										strings.Join(h, " "),
 									)
 								}
-												chore(debug): emit Claude mimic fingerprint on credential-scope error

											
										
										
											2026-01-29 15:17:46 +08:00
+								func logClaudeMimicDebug(req *http.Request, body []byte, account *Account, tokenType string, mimicClaudeCode bool) {
 									line := buildClaudeMimicDebugLine(req, body, account, tokenType, mimicClaudeCode)
 									if line == "" {
 										return
 									}
 									log.Printf("[ClaudeMimicDebug] %s", line)
 								}
 								func isClaudeCodeCredentialScopeError(msg string) bool {
 									m := strings.ToLower(strings.TrimSpace(msg))
 									if m == "" {
 										return false
 									}
 									return strings.Contains(m, "only authorized for use with claude code") &&
 										strings.Contains(m, "cannot be used for other api requests")
 								}
-												fix(sse): 修复非标准 SSE 格式解析问题

部分上游 API 返回的 SSE 格式不符合标准规范：
- 标准格式: `data: {...}`（冒号后有空格）
- 非标准格式: `data:{...}`（冒号后无空格）

使用预编译正则 `^data:\s*` 统一处理两种格式。

											
										
										
											2025-12-26 03:49:55 -08:00
+								// sseDataRe matches SSE data lines with optional whitespace after colon.
 								// Some upstream APIs return non-standard "data:" without space (should be "data: ").
-												perf(后端): 完成性能优化与连接池配置

新增 DB/Redis 连接池配置与校验，并补充单测

网关请求体大小限制与 413 处理

HTTP/req 客户端池化并调整上游连接池默认值

并发槽位改为 ZSET+Lua 与指数退避

用量统计改 SQL 聚合并新增索引迁移

计费缓存写入改工作池并补测试/基准

测试: 在 backend/ 下运行 go test ./...

											
										
										
											2025-12-31 08:50:12 +08:00
+								var (
-												feat(gateway): 实现 Claude Code 系统提示词智能注入

											
										
										
											2026-01-04 10:38:13 +08:00
+									sseDataRe            = regexp.MustCompile(`^data:\s*`)
 									sessionIDRegex       = regexp.MustCompile(`session_([a-f0-9-]{36})`)
 									claudeCliUserAgentRe = regexp.MustCompile(`^claude-cli/\d+\.\d+\.\d+`)
-												fix(网关): 对齐 Claude OAuth 请求适配

											
										
										
											2026-01-15 18:54:42 +08:00
+									toolPrefixRe         = regexp.MustCompile(`(?i)^(?:oc_|mcp_)`)
 									toolNameBoundaryRe   = regexp.MustCompile(`[^a-zA-Z0-9]+`)
 									toolNameCamelRe      = regexp.MustCompile(`([a-z0-9])([A-Z])`)
-												fix(网关): 区分 Claude Code OAuth 适配

											
										
										
											2026-01-15 19:17:07 +08:00
+									toolNameFieldRe      = regexp.MustCompile(`"name"\s*:\s*"([^"]+)"`)
 									modelFieldRe         = regexp.MustCompile(`"model"\s*:\s*"([^"]+)"`)
-												fix(网关): 补齐非 Claude Code OAuth 兼容

											
										
										
											2026-01-16 00:41:29 +08:00
+									toolDescAbsPathRe    = regexp.MustCompile(`/\/?(?:home|Users|tmp|var|opt|usr|etc)\/[^\s,\)"'\]]+`)
 									toolDescWinPathRe    = regexp.MustCompile(`(?i)[A-Z]:\\[^\s,\)"'\]]+`)
-												fix(网关): 对齐 Claude OAuth 请求适配

											
										
										
											2026-01-15 18:54:42 +08:00
 									claudeToolNameOverrides = map[string]string{
 										"bash":      "Bash",
 										"read":      "Read",
 										"edit":      "Edit",
 										"write":     "Write",
 										"task":      "Task",
 										"glob":      "Glob",
 										"grep":      "Grep",
 										"webfetch":  "WebFetch",
 										"websearch": "WebSearch",
 										"todowrite": "TodoWrite",
 										"question":  "AskUserQuestion",
 									}
 									openCodeToolOverrides = map[string]string{
 										"Bash":            "bash",
 										"Read":            "read",
 										"Edit":            "edit",
 										"Write":           "write",
 										"Task":            "task",
 										"Glob":            "glob",
 										"Grep":            "grep",
 										"WebFetch":        "webfetch",
 										"WebSearch":       "websearch",
 										"TodoWrite":       "todowrite",
 										"AskUserQuestion": "question",
 									}
-												fix(gateway): 修复 cache_control 块超限问题并优化 Claude Code 检测

问题：
- OAuth/SetupToken 账号注入 system prompt 后可能导致 cache_control
  块超过 Anthropic API 的 4 个限制
- Claude Code 检测使用精确匹配，无法识别 Agent SDK 等变体

修复：
- 新增 enforceCacheControlLimit 函数，强制执行 4 个块限制
- 优先从 messages 移除，再从 system 尾部移除（保护注入的 prompt）
- 改用前缀匹配检测 Claude Code 系统提示词，支持多种变体：
  - 标准版、Agent SDK 版、Explore Agent 版、Compact 版

											
										
										
											2026-01-07 10:17:09 +08:00
 									// claudeCodePromptPrefixes 用于检测 Claude Code 系统提示词的前缀列表
 									// 支持多种变体：标准版、Agent SDK 版、Explore Agent 版、Compact 版等
 									// 注意：前缀之间不应存在包含关系，否则会导致冗余匹配
 									claudeCodePromptPrefixes = []string{
 										"You are Claude Code, Anthropic's official CLI for Claude",             // 标准版 & Agent SDK 版（含 running within...）
 										"You are a Claude agent, built on Anthropic's Claude Agent SDK",        // Agent SDK 变体
 										"You are a file search specialist for Claude Code",                     // Explore Agent 版
 										"You are a helpful AI assistant tasked with summarizing conversations", // Compact 版
 									}
-												Add invalid-request fallback routing

											
										
										
											2026-01-23 22:24:46 +08:00
 									anthropicPrefixMappings = []string{
 										"claude-opus-4-5",
 										"claude-haiku-4-5",
 										"claude-sonnet-4-5",
 									}
-												perf(后端): 完成性能优化与连接池配置

新增 DB/Redis 连接池配置与校验，并补充单测

网关请求体大小限制与 413 处理

HTTP/req 客户端池化并调整上游连接池默认值

并发槽位改为 ZSET+Lua 与指数退避

用量统计改 SQL 聚合并新增索引迁移

计费缓存写入改工作池并补测试/基准

测试: 在 backend/ 下运行 go test ./...

											
										
										
											2025-12-31 08:50:12 +08:00
+								)
-												fix(sse): 修复非标准 SSE 格式解析问题

部分上游 API 返回的 SSE 格式不符合标准规范：
- 标准格式: `data: {...}`（冒号后有空格）
- 非标准格式: `data:{...}`（冒号后无空格）

使用预编译正则 `^data:\s*` 统一处理两种格式。

											
										
										
											2025-12-26 03:49:55 -08:00
-												feat(groups): add Claude Code client restriction and session isolation

- Add claude_code_only field to restrict groups to Claude Code clients only
- Add fallback_group_id for non-Claude Code requests to use alternate group
- Implement ClaudeCodeValidator for User-Agent detection
- Add group-level session binding isolation (groupID in Redis key)
- Prevent cross-group sticky session pollution
- Update frontend with Claude Code restriction controls

											
										
										
											2026-01-08 23:07:00 +08:00
+								// ErrClaudeCodeOnly 表示分组仅允许 Claude Code 客户端访问
 								var ErrClaudeCodeOnly = errors.New("this group only allows Claude Code clients")
-												chore: apply stashed changes

											
										
										
											2026-02-02 22:20:08 +08:00
+								// ErrModelScopeNotSupported 表示请求的模型系列不在分组支持的范围内
 								var ErrModelScopeNotSupported = errors.New("model scope not supported by this group")
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+								// allowedHeaders 白名单headers（参考CRS项目）
 								var allowedHeaders = map[string]bool{
-												fix: 修复并发请求时共享httpClient.Transport导致的竞态条件

问题描述：
当多个请求并发执行且使用不同代理配置时，它们会同时修改共享的
s.httpClient.Transport，导致请求可能使用错误的代理（数据泄露风险）
或意外失败。

修复方案：
为需要代理的请求创建独立的http.Client，而不是修改共享的httpClient.Transport。

改动内容：
- 新增 buildUpstreamRequestResult 结构体，返回请求和可选的独立client
- 修改 buildUpstreamRequest 方法，配置代理时创建独立client
- 更新 Forward 方法，根据是否有代理选择合适的client

											
										
										
											2025-12-18 18:14:20 +08:00
+									"accept":                                    true,
 									"x-stainless-retry-count":                   true,
 									"x-stainless-timeout":                       true,
 									"x-stainless-lang":                          true,
 									"x-stainless-package-version":               true,
 									"x-stainless-os":                            true,
 									"x-stainless-arch":                          true,
 									"x-stainless-runtime":                       true,
 									"x-stainless-runtime-version":               true,
 									"x-stainless-helper-method":                 true,
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									"anthropic-dangerous-direct-browser-access": true,
-												fix: 修复并发请求时共享httpClient.Transport导致的竞态条件

问题描述：
当多个请求并发执行且使用不同代理配置时，它们会同时修改共享的
s.httpClient.Transport，导致请求可能使用错误的代理（数据泄露风险）
或意外失败。

修复方案：
为需要代理的请求创建独立的http.Client，而不是修改共享的httpClient.Transport。

改动内容：
- 新增 buildUpstreamRequestResult 结构体，返回请求和可选的独立client
- 修改 buildUpstreamRequest 方法，配置代理时创建独立client
- 更新 Forward 方法，根据是否有代理选择合适的client

											
										
										
											2025-12-18 18:14:20 +08:00
+									"anthropic-version":                         true,
 									"x-app":                                     true,
 									"anthropic-beta":                            true,
 									"accept-language":                           true,
 									"sec-fetch-mode":                            true,
 									"user-agent":                                true,
 									"content-type":                              true,
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+								}
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+								// GatewayCache 定义网关服务的缓存操作接口。
 								// 提供粘性会话（Sticky Session）的存储、查询、刷新和删除功能。
 								//
 								// GatewayCache defines cache operations for gateway service.
 								// Provides sticky session storage, retrieval, refresh and deletion capabilities.
-												refactor: 删除 ports 目录

											
										
										
											2025-12-25 17:15:01 +08:00
+								type GatewayCache interface {
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+									// GetSessionAccountID 获取粘性会话绑定的账号 ID
 									// Get the account ID bound to a sticky session
-												feat(groups): add Claude Code client restriction and session isolation

- Add claude_code_only field to restrict groups to Claude Code clients only
- Add fallback_group_id for non-Claude Code requests to use alternate group
- Implement ClaudeCodeValidator for User-Agent detection
- Add group-level session binding isolation (groupID in Redis key)
- Prevent cross-group sticky session pollution
- Update frontend with Claude Code restriction controls

											
										
										
											2026-01-08 23:07:00 +08:00
+									GetSessionAccountID(ctx context.Context, groupID int64, sessionHash string) (int64, error)
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+									// SetSessionAccountID 设置粘性会话与账号的绑定关系
 									// Set the binding between sticky session and account
-												feat(groups): add Claude Code client restriction and session isolation

- Add claude_code_only field to restrict groups to Claude Code clients only
- Add fallback_group_id for non-Claude Code requests to use alternate group
- Implement ClaudeCodeValidator for User-Agent detection
- Add group-level session binding isolation (groupID in Redis key)
- Prevent cross-group sticky session pollution
- Update frontend with Claude Code restriction controls

											
										
										
											2026-01-08 23:07:00 +08:00
+									SetSessionAccountID(ctx context.Context, groupID int64, sessionHash string, accountID int64, ttl time.Duration) error
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+									// RefreshSessionTTL 刷新粘性会话的过期时间
 									// Refresh the expiration time of a sticky session
-												feat(groups): add Claude Code client restriction and session isolation

- Add claude_code_only field to restrict groups to Claude Code clients only
- Add fallback_group_id for non-Claude Code requests to use alternate group
- Implement ClaudeCodeValidator for User-Agent detection
- Add group-level session binding isolation (groupID in Redis key)
- Prevent cross-group sticky session pollution
- Update frontend with Claude Code restriction controls

											
										
										
											2026-01-08 23:07:00 +08:00
+									RefreshSessionTTL(ctx context.Context, groupID int64, sessionHash string, ttl time.Duration) error
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+									// DeleteSessionAccountID 删除粘性会话绑定，用于账号不可用时主动清理
 									// Delete sticky session binding, used to proactively clean up when account becomes unavailable
 									DeleteSessionAccountID(ctx context.Context, groupID int64, sessionHash string) error
-												feat(groups): add Claude Code client restriction and session isolation

- Add claude_code_only field to restrict groups to Claude Code clients only
- Add fallback_group_id for non-Claude Code requests to use alternate group
- Implement ClaudeCodeValidator for User-Agent detection
- Add group-level session binding isolation (groupID in Redis key)
- Prevent cross-group sticky session pollution
- Update frontend with Claude Code restriction controls

											
										
										
											2026-01-08 23:07:00 +08:00
+								}
 								// derefGroupID safely dereferences *int64 to int64, returning 0 if nil
 								func derefGroupID(groupID *int64) int64 {
 									if groupID == nil {
 										return 0
 									}
 									return *groupID
-												refactor: 删除 ports 目录

											
										
										
											2025-12-25 17:15:01 +08:00
+								}
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+								// shouldClearStickySession 检查账号是否处于不可调度状态，需要清理粘性会话绑定。
 								// 当账号状态为错误、禁用、不可调度，或处于临时不可调度期间时，返回 true。
 								// 这确保后续请求不会继续使用不可用的账号。
 								//
 								// shouldClearStickySession checks if an account is in an unschedulable state
 								// and the sticky session binding should be cleared.
 								// Returns true when account status is error/disabled, schedulable is false,
 								// or within temporary unschedulable period.
 								// This ensures subsequent requests won't continue using unavailable accounts.
 								func shouldClearStickySession(account *Account) bool {
 									if account == nil {
 										return false
 									}
 									if account.Status == StatusError || account.Status == StatusDisabled || !account.Schedulable {
 										return true
 									}
 									if account.TempUnschedulableUntil != nil && time.Now().Before(*account.TempUnschedulableUntil) {
 										return true
 									}
 									return false
 								}
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+								type AccountWaitPlan struct {
 									AccountID      int64
 									MaxConcurrency int
 									Timeout        time.Duration
 									MaxWaiting     int
 								}
 								type AccountSelectionResult struct {
 									Account     *Account
 									Acquired    bool
 									ReleaseFunc func()
 									WaitPlan    *AccountWaitPlan // nil means no wait allowed
 								}
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+								// ClaudeUsage 表示Claude API返回的usage信息
 								type ClaudeUsage struct {
 									InputTokens              int `json:"input_tokens"`
 									OutputTokens             int `json:"output_tokens"`
 									CacheCreationInputTokens int `json:"cache_creation_input_tokens"`
 									CacheReadInputTokens     int `json:"cache_read_input_tokens"`
 								}
 								// ForwardResult 转发结果
 								type ForwardResult struct {
-												fix(billing): 修复客户端取消请求时计费丢失问题

检测 context.Canceled 作为客户端断开信号，返回已收集的 usage 而非错误

											
										
										
											2026-01-08 11:25:17 +08:00
+									RequestID        string
 									Usage            ClaudeUsage
 									Model            string
 									Stream           bool
 									Duration         time.Duration
 									FirstTokenMs     *int // 首字时间（流式请求）
 									ClientDisconnect bool // 客户端是否在流式传输过程中断开
-												feat: 图片生成计费功能

- 新增 Group 图片价格配置（image_price_1k/2k/4k）
- BillingService 新增 CalculateImageCost 方法
- AntigravityGatewayService 支持识别图片生成模型并按次计费
- UsageLog 新增 image_count 和 image_size 字段
- 前端分组管理支持配置图片价格（antigravity 和 gemini 平台）
- 图片计费复用通用计费能力（余额检查、扣费、倍率、订阅限额）

											
										
										
											2026-01-05 17:07:29 +08:00
 									// 图片生成计费字段（仅 gemini-3-pro-image 使用）
 									ImageCount int    // 生成的图片数量
 									ImageSize  string // 图片尺寸 "1K", "2K", "4K"
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+								}
-												feat: cc/codex support account retry

											
										
										
											2025-12-27 11:44:00 +08:00
+								// UpstreamFailoverError indicates an upstream error that should trigger account failover.
 								type UpstreamFailoverError struct {
 									StatusCode int
 								}
 								func (e *UpstreamFailoverError) Error() string {
 									return fmt.Sprintf("upstream error: %d (failover)", e.StatusCode)
 								}
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+								// GatewayService handles API gateway operations
 								type GatewayService struct {
-												refactor: 删除 ports 目录

											
										
										
											2025-12-25 17:15:01 +08:00
+									accountRepo         AccountRepository
-												feat(antigravity): 添加混合调度可选功能

- 后端：账户模型添加 IsMixedSchedulingEnabled() 方法，读取 extra.mixed_scheduling
- 后端：gateway_service 和 gemini_messages_compat_service 支持混合调度逻辑
- 后端：分组创建支持指定 platform 参数
- 前端：账户创建/编辑弹窗添加混合调度开关（仅 antigravity 账户显示）
- 前端：混合调度开关添加问号图标和 tooltip 说明
- 前端：GroupSelector 支持根据 mixedScheduling 属性过滤分组
- 前端：分组创建支持选择 platform
- 测试：e2e 测试添加 ENDPOINT_PREFIX 环境变量支持混合/隔离模式测试
- 测试：删除过时的 Claude signature 测试用例

											
										
										
											2025-12-29 09:44:39 +08:00
+									groupRepo           GroupRepository
-												refactor: 删除 ports 目录

											
										
										
											2025-12-25 17:15:01 +08:00
+									usageLogRepo        UsageLogRepository
 									userRepo            UserRepository
 									userSubRepo         UserSubscriptionRepository
 									cache               GatewayCache
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									cfg                 *config.Config
-												style: 修复 gofmt 格式化问题

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>

											
										
										
											2026-01-15 19:42:18 +08:00
+									schedulerSnapshot   *SchedulerSnapshotService
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									billingService      *BillingService
 									rateLimitService    *RateLimitService
 									billingCacheService *BillingCacheService
 									identityService     *IdentityService
-												refactor: 删除 ports 目录

											
										
										
											2025-12-25 17:15:01 +08:00
+									httpUpstream        HTTPUpstream
-												feat: Schedule batch update for account last_used_at

Implement deferred batch update mechanism to reduce database load:

- Add DeferredService for batching account last_used_at updates
- Add TimingWheelService for efficient recurring task scheduling
- Integrate with GatewayService and OpenAIGatewayService
- Implement BatchUpdateLastUsed repository method using CASE...WHEN SQL
- Fix golangci-lint error: Replace interface{} with any

Benefits:
- Reduces database writes by batching updates (10-second intervals)
- Improves request throughput by deferring non-critical updates
- Maintains accurate account usage tracking for scheduling

											
										
										
											2025-12-28 08:07:15 +08:00
+									deferredService     *DeferredService
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+									concurrencyService  *ConcurrencyService
-												style: 修复 gofmt 格式化问题

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>

											
										
										
											2026-01-15 19:42:18 +08:00
+									claudeTokenProvider *ClaudeTokenProvider
-												feat: 添加5h窗口费用控制和会话数量限制

- 支持Anthropic OAuth/SetupToken账号的5h窗口费用阈值控制
- 支持账号级别的并发会话数量限制
- 使用Redis缓存窗口费用(30秒TTL)减少数据库压力
- 费用计算基于标准费用(不含账号倍率)

											
										
										
											2026-01-16 23:36:52 +08:00
+									sessionLimitCache   SessionLimitCache // 会话数量限制缓存（仅 Anthropic OAuth/SetupToken）
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+								}
 								// NewGatewayService creates a new GatewayService
-												refactor(backend): 引入端口接口模式

											
										
										
											2025-12-19 21:26:19 +08:00
+								func NewGatewayService(
-												refactor: 删除 ports 目录

											
										
										
											2025-12-25 17:15:01 +08:00
+									accountRepo AccountRepository,
-												feat(antigravity): 添加混合调度可选功能

- 后端：账户模型添加 IsMixedSchedulingEnabled() 方法，读取 extra.mixed_scheduling
- 后端：gateway_service 和 gemini_messages_compat_service 支持混合调度逻辑
- 后端：分组创建支持指定 platform 参数
- 前端：账户创建/编辑弹窗添加混合调度开关（仅 antigravity 账户显示）
- 前端：混合调度开关添加问号图标和 tooltip 说明
- 前端：GroupSelector 支持根据 mixedScheduling 属性过滤分组
- 前端：分组创建支持选择 platform
- 测试：e2e 测试添加 ENDPOINT_PREFIX 环境变量支持混合/隔离模式测试
- 测试：删除过时的 Claude signature 测试用例

											
										
										
											2025-12-29 09:44:39 +08:00
+									groupRepo GroupRepository,
-												refactor: 删除 ports 目录

											
										
										
											2025-12-25 17:15:01 +08:00
+									usageLogRepo UsageLogRepository,
 									userRepo UserRepository,
 									userSubRepo UserSubscriptionRepository,
 									cache GatewayCache,
-												refactor(backend): 引入端口接口模式

											
										
										
											2025-12-19 21:26:19 +08:00
+									cfg *config.Config,
-												feat(scheduler): 引入调度快照缓存与 outbox 回放

- 调度热路径优先读 Redis 快照，保留分组排序语义
- outbox 回放 + 全量重建纠偏，失败重试不推进水位
- 自动 Atlas 基线对齐并同步调度配置示例

											
										
										
											2026-01-12 14:19:06 +08:00
+									schedulerSnapshot *SchedulerSnapshotService,
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+									concurrencyService *ConcurrencyService,
-												refactor(backend): 引入端口接口模式

											
										
										
											2025-12-19 21:26:19 +08:00
+									billingService *BillingService,
 									rateLimitService *RateLimitService,
 									billingCacheService *BillingCacheService,
 									identityService *IdentityService,
-												refactor: 删除 ports 目录

											
										
										
											2025-12-25 17:15:01 +08:00
+									httpUpstream HTTPUpstream,
-												feat: Schedule batch update for account last_used_at

Implement deferred batch update mechanism to reduce database load:

- Add DeferredService for batching account last_used_at updates
- Add TimingWheelService for efficient recurring task scheduling
- Integrate with GatewayService and OpenAIGatewayService
- Implement BatchUpdateLastUsed repository method using CASE...WHEN SQL
- Fix golangci-lint error: Replace interface{} with any

Benefits:
- Reduces database writes by batching updates (10-second intervals)
- Improves request throughput by deferring non-critical updates
- Maintains accurate account usage tracking for scheduling

											
										
										
											2025-12-28 08:07:15 +08:00
+									deferredService *DeferredService,
-												feat(网关): 引入 OpenAI/Claude OAuth token 缓存

新增 OpenAI/Claude TokenProvider 与缓存键生成
扩展 OAuth 缓存失效覆盖更多平台
统一 OAuth 缓存前缀与依赖注入

											
										
										
											2026-01-15 18:27:06 +08:00
+									claudeTokenProvider *ClaudeTokenProvider,
-												feat: 添加5h窗口费用控制和会话数量限制

- 支持Anthropic OAuth/SetupToken账号的5h窗口费用阈值控制
- 支持账号级别的并发会话数量限制
- 使用Redis缓存窗口费用(30秒TTL)减少数据库压力
- 费用计算基于标准费用(不含账号倍率)

											
										
										
											2026-01-16 23:36:52 +08:00
+									sessionLimitCache SessionLimitCache,
-												refactor(backend): 引入端口接口模式

											
										
										
											2025-12-19 21:26:19 +08:00
+								) *GatewayService {
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									return &GatewayService{
-												refactor(backend): 引入端口接口模式

											
										
										
											2025-12-19 21:26:19 +08:00
+										accountRepo:         accountRepo,
-												feat(antigravity): 添加混合调度可选功能

- 后端：账户模型添加 IsMixedSchedulingEnabled() 方法，读取 extra.mixed_scheduling
- 后端：gateway_service 和 gemini_messages_compat_service 支持混合调度逻辑
- 后端：分组创建支持指定 platform 参数
- 前端：账户创建/编辑弹窗添加混合调度开关（仅 antigravity 账户显示）
- 前端：混合调度开关添加问号图标和 tooltip 说明
- 前端：GroupSelector 支持根据 mixedScheduling 属性过滤分组
- 前端：分组创建支持选择 platform
- 测试：e2e 测试添加 ENDPOINT_PREFIX 环境变量支持混合/隔离模式测试
- 测试：删除过时的 Claude signature 测试用例

											
										
										
											2025-12-29 09:44:39 +08:00
+										groupRepo:           groupRepo,
-												refactor(backend): 引入端口接口模式

											
										
										
											2025-12-19 21:26:19 +08:00
+										usageLogRepo:        usageLogRepo,
 										userRepo:            userRepo,
 										userSubRepo:         userSubRepo,
-												refactor(backend): 添加 service 缓存端口

											
										
										
											2025-12-19 23:39:28 +08:00
+										cache:               cache,
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+										cfg:                 cfg,
-												style: 修复 gofmt 格式化问题

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>

											
										
										
											2026-01-15 19:42:18 +08:00
+										schedulerSnapshot:   schedulerSnapshot,
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+										concurrencyService:  concurrencyService,
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+										billingService:      billingService,
 										rateLimitService:    rateLimitService,
 										billingCacheService: billingCacheService,
 										identityService:     identityService,
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+										httpUpstream:        httpUpstream,
-												feat: Schedule batch update for account last_used_at

Implement deferred batch update mechanism to reduce database load:

- Add DeferredService for batching account last_used_at updates
- Add TimingWheelService for efficient recurring task scheduling
- Integrate with GatewayService and OpenAIGatewayService
- Implement BatchUpdateLastUsed repository method using CASE...WHEN SQL
- Fix golangci-lint error: Replace interface{} with any

Benefits:
- Reduces database writes by batching updates (10-second intervals)
- Improves request throughput by deferring non-critical updates
- Maintains accurate account usage tracking for scheduling

											
										
										
											2025-12-28 08:07:15 +08:00
+										deferredService:     deferredService,
-												style: 修复 gofmt 格式化问题

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>

											
										
										
											2026-01-15 19:42:18 +08:00
+										claudeTokenProvider: claudeTokenProvider,
-												feat: 添加5h窗口费用控制和会话数量限制

- 支持Anthropic OAuth/SetupToken账号的5h窗口费用阈值控制
- 支持账号级别的并发会话数量限制
- 使用Redis缓存窗口费用(30秒TTL)减少数据库压力
- 费用计算基于标准费用(不含账号倍率)

											
										
										
											2026-01-16 23:36:52 +08:00
+										sessionLimitCache:   sessionLimitCache,
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									}
 								}
-												perf(后端): 完成性能优化与连接池配置

新增 DB/Redis 连接池配置与校验，并补充单测

网关请求体大小限制与 413 处理

HTTP/req 客户端池化并调整上游连接池默认值

并发槽位改为 ZSET+Lua 与指数退避

用量统计改 SQL 聚合并新增索引迁移

计费缓存写入改工作池并补测试/基准

测试: 在 backend/ 下运行 go test ./...

											
										
										
											2025-12-31 08:50:12 +08:00
+								// GenerateSessionHash 从预解析请求计算粘性会话 hash
 								func (s *GatewayService) GenerateSessionHash(parsed *ParsedRequest) string {
 									if parsed == nil {
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+										return ""
 									}
-												perf(后端): 完成性能优化与连接池配置

新增 DB/Redis 连接池配置与校验，并补充单测

网关请求体大小限制与 413 处理

HTTP/req 客户端池化并调整上游连接池默认值

并发槽位改为 ZSET+Lua 与指数退避

用量统计改 SQL 聚合并新增索引迁移

计费缓存写入改工作池并补测试/基准

测试: 在 backend/ 下运行 go test ./...

											
										
										
											2025-12-31 08:50:12 +08:00
+									// 1. 最高优先级：从 metadata.user_id 提取 session_xxx
 									if parsed.MetadataUserID != "" {
 										if match := sessionIDRegex.FindStringSubmatch(parsed.MetadataUserID); len(match) > 1 {
 											return match[1]
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+										}
 									}
-												perf(后端): 完成性能优化与连接池配置

新增 DB/Redis 连接池配置与校验，并补充单测

网关请求体大小限制与 413 处理

HTTP/req 客户端池化并调整上游连接池默认值

并发槽位改为 ZSET+Lua 与指数退避

用量统计改 SQL 聚合并新增索引迁移

计费缓存写入改工作池并补测试/基准

测试: 在 backend/ 下运行 go test ./...

											
										
										
											2025-12-31 08:50:12 +08:00
+									// 2. 提取带 cache_control: {type: "ephemeral"} 的内容
 									cacheableContent := s.extractCacheableContent(parsed)
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									if cacheableContent != "" {
 										return s.hashContent(cacheableContent)
 									}
-												perf(后端): 完成性能优化与连接池配置

新增 DB/Redis 连接池配置与校验，并补充单测

网关请求体大小限制与 413 处理

HTTP/req 客户端池化并调整上游连接池默认值

并发槽位改为 ZSET+Lua 与指数退避

用量统计改 SQL 聚合并新增索引迁移

计费缓存写入改工作池并补测试/基准

测试: 在 backend/ 下运行 go test ./...

											
										
										
											2025-12-31 08:50:12 +08:00
+									// 3. Fallback: 使用 system 内容
 									if parsed.System != nil {
 										systemText := s.extractTextFromSystem(parsed.System)
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+										if systemText != "" {
 											return s.hashContent(systemText)
 										}
 									}
-												perf(后端): 完成性能优化与连接池配置

新增 DB/Redis 连接池配置与校验，并补充单测

网关请求体大小限制与 413 处理

HTTP/req 客户端池化并调整上游连接池默认值

并发槽位改为 ZSET+Lua 与指数退避

用量统计改 SQL 聚合并新增索引迁移

计费缓存写入改工作池并补测试/基准

测试: 在 backend/ 下运行 go test ./...

											
										
										
											2025-12-31 08:50:12 +08:00
+									// 4. 最后 fallback: 使用第一条消息
 									if len(parsed.Messages) > 0 {
 										if firstMsg, ok := parsed.Messages[0].(map[string]any); ok {
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+											msgText := s.extractTextFromContent(firstMsg["content"])
 											if msgText != "" {
 												return s.hashContent(msgText)
 											}
 										}
 									}
 									return ""
 								}
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+								// BindStickySession sets session -> account binding with standard TTL.
-												feat(groups): add Claude Code client restriction and session isolation

- Add claude_code_only field to restrict groups to Claude Code clients only
- Add fallback_group_id for non-Claude Code requests to use alternate group
- Implement ClaudeCodeValidator for User-Agent detection
- Add group-level session binding isolation (groupID in Redis key)
- Prevent cross-group sticky session pollution
- Update frontend with Claude Code restriction controls

											
										
										
											2026-01-08 23:07:00 +08:00
+								func (s *GatewayService) BindStickySession(ctx context.Context, groupID *int64, sessionHash string, accountID int64) error {
-												perf: 负载感知调度系统性能优化与稳定性增强 (#23)

* Reapply "feat(gateway): 实现负载感知的账号调度优化 (#114)" (#117)

This reverts commit c5c12d4c8b44cbfecf2ee22ae3fd7810f724c638.

* fix: 恢复 Google One 功能兼容性

恢复 main 分支的 gemini_oauth_service.go 以保持与 Google One 功能的兼容性。

变更：
- 添加 Google One tier 常量定义
- 添加存储空间 tier 阈值常量
- 支持 google_one OAuth 类型
- 包含 RefreshAccountGoogleOneTier 等 Google One 相关方法

原因：
- atomic-scheduling 恢复时使用了旧版本的文件
- 需要保持与 main 分支 Google One 功能（PR #118）的兼容性
- 避免编译错误（handler 代码依赖这些方法）

* fix: 修复 SSE/JSON 转义和 nil 安全问题

基于 Codex 审查建议修复关键安全问题。

SSE/JSON 转义修复：
- handleStreamingAwareError: 使用 json.Marshal 替代字符串拼接
- sendMockWarmupStream: 使用 json.Marshal 生成 message_start 事件
- 防止错误消息中的特殊字符导致无效 JSON

Nil 安全检查：
- SelectAccountWithLoadAwareness: 粘性会话层添加 s.cache != nil 检查
- BindStickySession: 添加 s.cache == nil 检查
- 防止 cache 未初始化时的运行时 panic

影响：
- 提升 SSE 错误处理的健壮性
- 避免客户端 JSON 解析失败
- 增强代码防御性编程

* perf: 优化负载感知调度的准确性和响应速度

基于 Codex 审查建议的性能优化。

负载批量查询优化：
- getAccountsLoadBatchScript 添加过期槽位清理
- 使用 ZREMRANGEBYSCORE 在计数前清理过期条目
- 防止过期槽位导致负载率计算偏高
- 提升负载感知调度的准确性

等待循环优化：
- waitForSlotWithPingTimeout 添加立即获取尝试
- 避免不必要的 initialBackoff 延迟
- 低负载场景下减少响应延迟

测试改进：
- 取消跳过 TestGetAccountsLoadBatch 集成测试
- 过期槽位清理应该修复了 CI 中的计数问题

影响：
- 更准确的负载感知调度决策
- 更快的槽位获取响应
- 更好的测试覆盖率

* test: 暂时跳过 TestGetAccountsLoadBatch 集成测试

该测试在 CI 环境中失败，需要进一步调试。
暂时跳过以让 CI 通过，后续在本地 Docker 环境中修复。
											
										
										
											2026-01-02 17:30:07 +08:00
+									if sessionHash == "" || accountID <= 0 || s.cache == nil {
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+										return nil
 									}
-												feat(groups): add Claude Code client restriction and session isolation

- Add claude_code_only field to restrict groups to Claude Code clients only
- Add fallback_group_id for non-Claude Code requests to use alternate group
- Implement ClaudeCodeValidator for User-Agent detection
- Add group-level session binding isolation (groupID in Redis key)
- Prevent cross-group sticky session pollution
- Update frontend with Claude Code restriction controls

											
										
										
											2026-01-08 23:07:00 +08:00
+									return s.cache.SetSessionAccountID(ctx, derefGroupID(groupID), sessionHash, accountID, stickySessionTTL)
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+								}
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+								// GetCachedSessionAccountID retrieves the account ID bound to a sticky session.
 								// Returns 0 if no binding exists or on error.
 								func (s *GatewayService) GetCachedSessionAccountID(ctx context.Context, groupID *int64, sessionHash string) (int64, error) {
 									if sessionHash == "" || s.cache == nil {
 										return 0, nil
 									}
 									accountID, err := s.cache.GetSessionAccountID(ctx, derefGroupID(groupID), sessionHash)
 									if err != nil {
 										return 0, err
 									}
 									return accountID, nil
 								}
-												perf(后端): 完成性能优化与连接池配置

新增 DB/Redis 连接池配置与校验，并补充单测

网关请求体大小限制与 413 处理

HTTP/req 客户端池化并调整上游连接池默认值

并发槽位改为 ZSET+Lua 与指数退避

用量统计改 SQL 聚合并新增索引迁移

计费缓存写入改工作池并补测试/基准

测试: 在 backend/ 下运行 go test ./...

											
										
										
											2025-12-31 08:50:12 +08:00
+								func (s *GatewayService) extractCacheableContent(parsed *ParsedRequest) string {
 									if parsed == nil {
 										return ""
 									}
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
-												perf(后端): 完成性能优化与连接池配置

新增 DB/Redis 连接池配置与校验，并补充单测

网关请求体大小限制与 413 处理

HTTP/req 客户端池化并调整上游连接池默认值

并发槽位改为 ZSET+Lua 与指数退避

用量统计改 SQL 聚合并新增索引迁移

计费缓存写入改工作池并补测试/基准

测试: 在 backend/ 下运行 go test ./...

											
										
										
											2025-12-31 08:50:12 +08:00
+									var builder strings.Builder
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
-												perf(后端): 完成性能优化与连接池配置

新增 DB/Redis 连接池配置与校验，并补充单测

网关请求体大小限制与 413 处理

HTTP/req 客户端池化并调整上游连接池默认值

并发槽位改为 ZSET+Lua 与指数退避

用量统计改 SQL 聚合并新增索引迁移

计费缓存写入改工作池并补测试/基准

测试: 在 backend/ 下运行 go test ./...

											
										
										
											2025-12-31 08:50:12 +08:00
+									// 检查 system 中的 cacheable 内容
 									if system, ok := parsed.System.([]any); ok {
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+										for _, part := range system {
-												ci(backend): 添加 gofmt 配置

											
										
										
											2025-12-20 16:19:40 +08:00
+											if partMap, ok := part.(map[string]any); ok {
 												if cc, ok := partMap["cache_control"].(map[string]any); ok {
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+													if cc["type"] == "ephemeral" {
 														if text, ok := partMap["text"].(string); ok {
-												fix(lint): 修复 golangci-lint 报告的代码问题

- errcheck: 修复类型断言未检查返回值的问题
  - pool.go: 添加 sync.Map 类型断言安全检查
  - req_client_pool.go: 添加 sync.Map 类型断言安全检查
  - concurrency_cache_benchmark_test.go: 显式忽略断言返回值
  - gateway_service.go: 显式忽略 WriteString 返回值

- gofmt: 修复代码格式问题
  - redis.go: 注释对齐
  - api_key_repo.go: 结构体字段对齐
  - concurrency_cache.go: 字段对齐
  - http_upstream.go: 注释对齐

- unused: 删除未使用的代码
  - user_repo.go: 删除未使用的 sql 字段
  - usage_service.go: 删除未使用的 calculateStats 函数

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>

											
										
										
											2025-12-31 14:51:58 +08:00
+															_, _ = builder.WriteString(text)
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+														}
 													}
 												}
 											}
 										}
 									}
-												perf(后端): 完成性能优化与连接池配置

新增 DB/Redis 连接池配置与校验，并补充单测

网关请求体大小限制与 413 处理

HTTP/req 客户端池化并调整上游连接池默认值

并发槽位改为 ZSET+Lua 与指数退避

用量统计改 SQL 聚合并新增索引迁移

计费缓存写入改工作池并补测试/基准

测试: 在 backend/ 下运行 go test ./...

											
										
										
											2025-12-31 08:50:12 +08:00
+									systemText := builder.String()
 									// 检查 messages 中的 cacheable 内容
 									for _, msg := range parsed.Messages {
 										if msgMap, ok := msg.(map[string]any); ok {
 											if msgContent, ok := msgMap["content"].([]any); ok {
 												for _, part := range msgContent {
 													if partMap, ok := part.(map[string]any); ok {
 														if cc, ok := partMap["cache_control"].(map[string]any); ok {
 															if cc["type"] == "ephemeral" {
 																return s.extractTextFromContent(msgMap["content"])
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+															}
 														}
 													}
 												}
 											}
 										}
 									}
-												perf(后端): 完成性能优化与连接池配置

新增 DB/Redis 连接池配置与校验，并补充单测

网关请求体大小限制与 413 处理

HTTP/req 客户端池化并调整上游连接池默认值

并发槽位改为 ZSET+Lua 与指数退避

用量统计改 SQL 聚合并新增索引迁移

计费缓存写入改工作池并补测试/基准

测试: 在 backend/ 下运行 go test ./...

											
										
										
											2025-12-31 08:50:12 +08:00
+									return systemText
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+								}
-												ci(backend): 添加 gofmt 配置

											
										
										
											2025-12-20 16:19:40 +08:00
+								func (s *GatewayService) extractTextFromSystem(system any) string {
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									switch v := system.(type) {
 									case string:
 										return v
-												ci(backend): 添加 gofmt 配置

											
										
										
											2025-12-20 16:19:40 +08:00
+									case []any:
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+										var texts []string
 										for _, part := range v {
-												ci(backend): 添加 gofmt 配置

											
										
										
											2025-12-20 16:19:40 +08:00
+											if partMap, ok := part.(map[string]any); ok {
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+												if text, ok := partMap["text"].(string); ok {
 													texts = append(texts, text)
 												}
 											}
 										}
 										return strings.Join(texts, "")
 									}
 									return ""
 								}
-												ci(backend): 添加 gofmt 配置

											
										
										
											2025-12-20 16:19:40 +08:00
+								func (s *GatewayService) extractTextFromContent(content any) string {
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									switch v := content.(type) {
 									case string:
 										return v
-												ci(backend): 添加 gofmt 配置

											
										
										
											2025-12-20 16:19:40 +08:00
+									case []any:
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+										var texts []string
 										for _, part := range v {
-												ci(backend): 添加 gofmt 配置

											
										
										
											2025-12-20 16:19:40 +08:00
+											if partMap, ok := part.(map[string]any); ok {
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+												if partMap["type"] == "text" {
 													if text, ok := partMap["text"].(string); ok {
 														texts = append(texts, text)
 													}
 												}
 											}
 										}
 										return strings.Join(texts, "")
 									}
 									return ""
 								}
 								func (s *GatewayService) hashContent(content string) string {
 									hash := sha256.Sum256([]byte(content))
 									return hex.EncodeToString(hash[:16]) // 32字符
 								}
 								// replaceModelInBody 替换请求体中的model字段
 								func (s *GatewayService) replaceModelInBody(body []byte, newModel string) []byte {
-												ci(backend): 添加 gofmt 配置

											
										
										
											2025-12-20 16:19:40 +08:00
+									var req map[string]any
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									if err := json.Unmarshal(body, &req); err != nil {
 										return body
 									}
 									req["model"] = newModel
 									newBody, err := json.Marshal(req)
 									if err != nil {
 										return body
 									}
 									return newBody
 								}
-												fix(网关): 对齐 Claude OAuth 请求适配

											
										
										
											2026-01-15 18:54:42 +08:00
+								type claudeOAuthNormalizeOptions struct {
 									injectMetadata          bool
 									metadataUserID          string
 									stripSystemCacheControl bool
 								}
 								func stripToolPrefix(value string) string {
 									if value == "" {
 										return value
 									}
 									return toolPrefixRe.ReplaceAllString(value, "")
 								}
 								func toPascalCase(value string) string {
 									if value == "" {
 										return value
 									}
 									normalized := toolNameBoundaryRe.ReplaceAllString(value, " ")
 									tokens := make([]string, 0)
 									for _, token := range strings.Fields(normalized) {
 										expanded := toolNameCamelRe.ReplaceAllString(token, "$1 $2")
 										parts := strings.Fields(expanded)
 										if len(parts) > 0 {
 											tokens = append(tokens, parts...)
 										}
 									}
 									if len(tokens) == 0 {
 										return value
 									}
 									var builder strings.Builder
 									for _, token := range tokens {
 										lower := strings.ToLower(token)
 										if lower == "" {
 											continue
 										}
 										runes := []rune(lower)
 										runes[0] = unicode.ToUpper(runes[0])
-												fix(gateway): satisfy golangci-lint checks

											
										
										
											2026-01-17 18:16:34 +08:00
+										_, _ = builder.WriteString(string(runes))
-												fix(网关): 对齐 Claude OAuth 请求适配

											
										
										
											2026-01-15 18:54:42 +08:00
+									}
 									return builder.String()
 								}
 								func toSnakeCase(value string) string {
 									if value == "" {
 										return value
 									}
 									output := toolNameCamelRe.ReplaceAllString(value, "$1_$2")
 									output = toolNameBoundaryRe.ReplaceAllString(output, "_")
 									output = strings.Trim(output, "_")
 									return strings.ToLower(output)
 								}
 								func normalizeToolNameForClaude(name string, cache map[string]string) string {
 									if name == "" {
 										return name
 									}
 									stripped := stripToolPrefix(name)
 									mapped, ok := claudeToolNameOverrides[strings.ToLower(stripped)]
 									if !ok {
 										mapped = toPascalCase(stripped)
 									}
 									if mapped != "" && cache != nil && mapped != stripped {
 										cache[mapped] = stripped
 									}
 									if mapped == "" {
 										return stripped
 									}
 									return mapped
 								}
 								func normalizeToolNameForOpenCode(name string, cache map[string]string) string {
 									if name == "" {
 										return name
 									}
-												fix(网关): 补齐非 Claude Code OAuth 兼容

											
										
										
											2026-01-16 00:41:29 +08:00
+									stripped := stripToolPrefix(name)
-												fix(网关): 对齐 Claude OAuth 请求适配

											
										
										
											2026-01-15 18:54:42 +08:00
+									if cache != nil {
-												fix(网关): 补齐非 Claude Code OAuth 兼容

											
										
										
											2026-01-16 00:41:29 +08:00
+										if mapped, ok := cache[stripped]; ok {
-												fix(网关): 对齐 Claude OAuth 请求适配

											
										
										
											2026-01-15 18:54:42 +08:00
+											return mapped
 										}
 									}
-												fix(网关): 补齐非 Claude Code OAuth 兼容

											
										
										
											2026-01-16 00:41:29 +08:00
+									if mapped, ok := openCodeToolOverrides[stripped]; ok {
-												fix(网关): 对齐 Claude OAuth 请求适配

											
										
										
											2026-01-15 18:54:42 +08:00
+										return mapped
 									}
-												fix(网关): 补齐非 Claude Code OAuth 兼容

											
										
										
											2026-01-16 00:41:29 +08:00
+									return toSnakeCase(stripped)
 								}
 								func normalizeParamNameForOpenCode(name string, cache map[string]string) string {
 									if name == "" {
 										return name
 									}
 									if cache != nil {
 										if mapped, ok := cache[name]; ok {
 											return mapped
 										}
 									}
 									return name
 								}
-												refactor: limit OpenCode keyword replacement to tool descriptions

											
										
										
											2026-01-31 01:40:38 +08:00
+								// sanitizeSystemText rewrites only the fixed OpenCode identity sentence (if present).
 								// We intentionally avoid broad keyword replacement in system prompts to prevent
 								// accidentally changing user-provided instructions.
 								func sanitizeSystemText(text string) string {
-												fix(网关): 补齐非 Claude Code OAuth 兼容

											
										
										
											2026-01-16 00:41:29 +08:00
+									if text == "" {
 										return text
 									}
-												fix: rewrite OpenCode identity sentence to Claude Code

											
										
										
											2026-01-29 03:03:40 +08:00
+									// Some clients include a fixed OpenCode identity sentence. Anthropic may treat
 									// this as a non-Claude-Code fingerprint, so rewrite it to the canonical
 									// Claude Code banner before generic "OpenCode"/"opencode" replacements.
 									text = strings.ReplaceAll(
 										text,
 										"You are OpenCode, the best coding agent on the planet.",
 										strings.TrimSpace(claudeCodeSystemPrompt),
 									)
-												refactor: limit OpenCode keyword replacement to tool descriptions

											
										
										
											2026-01-31 01:40:38 +08:00
+									return text
 								}
-												fix(网关): 补齐非 Claude Code OAuth 兼容

											
										
										
											2026-01-16 00:41:29 +08:00
+								func sanitizeToolDescription(description string) string {
 									if description == "" {
 										return description
 									}
 									description = toolDescAbsPathRe.ReplaceAllString(description, "[path]")
 									description = toolDescWinPathRe.ReplaceAllString(description, "[path]")
-												refactor: stop rewriting tool descriptions; keep only system sentence rewrite

											
										
										
											2026-01-31 02:01:51 +08:00
+									// Intentionally do NOT rewrite tool descriptions (OpenCode/Claude strings).
 									// Tool names/skill names may rely on exact wording, and rewriting can be misleading.
 									return description
-												fix(网关): 补齐非 Claude Code OAuth 兼容

											
										
										
											2026-01-16 00:41:29 +08:00
+								}
 								func normalizeToolInputSchema(inputSchema any, cache map[string]string) {
 									schema, ok := inputSchema.(map[string]any)
 									if !ok {
 										return
 									}
 									properties, ok := schema["properties"].(map[string]any)
 									if !ok {
 										return
 									}
 									newProperties := make(map[string]any, len(properties))
 									for key, value := range properties {
 										snakeKey := toSnakeCase(key)
 										newProperties[snakeKey] = value
 										if snakeKey != key && cache != nil {
 											cache[snakeKey] = key
 										}
 									}
 									schema["properties"] = newProperties
 									if required, ok := schema["required"].([]any); ok {
 										newRequired := make([]any, 0, len(required))
 										for _, item := range required {
 											name, ok := item.(string)
 											if !ok {
 												newRequired = append(newRequired, item)
 												continue
 											}
 											snakeName := toSnakeCase(name)
 											newRequired = append(newRequired, snakeName)
 											if snakeName != name && cache != nil {
 												cache[snakeName] = name
 											}
 										}
 										schema["required"] = newRequired
 									}
-												fix(网关): 对齐 Claude OAuth 请求适配

											
										
										
											2026-01-15 18:54:42 +08:00
+								}
 								func stripCacheControlFromSystemBlocks(system any) bool {
 									blocks, ok := system.([]any)
 									if !ok {
 										return false
 									}
 									changed := false
 									for _, item := range blocks {
 										block, ok := item.(map[string]any)
 										if !ok {
 											continue
 										}
 										if _, exists := block["cache_control"]; !exists {
 											continue
 										}
 										delete(block, "cache_control")
 										changed = true
 									}
 									return changed
 								}
 								func normalizeClaudeOAuthRequestBody(body []byte, modelID string, opts claudeOAuthNormalizeOptions) ([]byte, string, map[string]string) {
 									if len(body) == 0 {
 										return body, modelID, nil
 									}
 									var req map[string]any
 									if err := json.Unmarshal(body, &req); err != nil {
 										return body, modelID, nil
 									}
 									toolNameMap := make(map[string]string)
-												fix(网关): 补齐非 Claude Code OAuth 兼容

											
										
										
											2026-01-16 00:41:29 +08:00
+									if system, ok := req["system"]; ok {
 										switch v := system.(type) {
 										case string:
-												refactor: limit OpenCode keyword replacement to tool descriptions

											
										
										
											2026-01-31 01:40:38 +08:00
+											sanitized := sanitizeSystemText(v)
-												fix(网关): 补齐非 Claude Code OAuth 兼容

											
										
										
											2026-01-16 00:41:29 +08:00
+											if sanitized != v {
 												req["system"] = sanitized
 											}
 										case []any:
 											for _, item := range v {
 												block, ok := item.(map[string]any)
 												if !ok {
 													continue
 												}
 												if blockType, _ := block["type"].(string); blockType != "text" {
 													continue
 												}
 												text, ok := block["text"].(string)
 												if !ok || text == "" {
 													continue
 												}
-												refactor: limit OpenCode keyword replacement to tool descriptions

											
										
										
											2026-01-31 01:40:38 +08:00
+												sanitized := sanitizeSystemText(text)
-												fix(网关): 补齐非 Claude Code OAuth 兼容

											
										
										
											2026-01-16 00:41:29 +08:00
+												if sanitized != text {
 													block["text"] = sanitized
 												}
 											}
 										}
 									}
-												fix(网关): 对齐 Claude OAuth 请求适配

											
										
										
											2026-01-15 18:54:42 +08:00
+									if rawModel, ok := req["model"].(string); ok {
 										normalized := claude.NormalizeModelID(rawModel)
 										if normalized != rawModel {
 											req["model"] = normalized
 											modelID = normalized
 										}
 									}
 									if rawTools, exists := req["tools"]; exists {
 										switch tools := rawTools.(type) {
 										case []any:
 											for idx, tool := range tools {
 												toolMap, ok := tool.(map[string]any)
 												if !ok {
 													continue
 												}
 												if name, ok := toolMap["name"].(string); ok {
 													normalized := normalizeToolNameForClaude(name, toolNameMap)
 													if normalized != "" && normalized != name {
 														toolMap["name"] = normalized
 													}
 												}
-												fix(网关): 补齐非 Claude Code OAuth 兼容

											
										
										
											2026-01-16 00:41:29 +08:00
+												if desc, ok := toolMap["description"].(string); ok {
 													sanitized := sanitizeToolDescription(desc)
 													if sanitized != desc {
 														toolMap["description"] = sanitized
 													}
 												}
 												if schema, ok := toolMap["input_schema"]; ok {
 													normalizeToolInputSchema(schema, toolNameMap)
 												}
-												fix(网关): 对齐 Claude OAuth 请求适配

											
										
										
											2026-01-15 18:54:42 +08:00
+												tools[idx] = toolMap
 											}
 											req["tools"] = tools
 										case map[string]any:
 											normalizedTools := make(map[string]any, len(tools))
 											for name, value := range tools {
 												normalized := normalizeToolNameForClaude(name, toolNameMap)
 												if normalized == "" {
 													normalized = name
 												}
 												if toolMap, ok := value.(map[string]any); ok {
-												fix(网关): 补齐非 Claude Code OAuth 兼容

											
										
										
											2026-01-16 00:41:29 +08:00
+													toolMap["name"] = normalized
 													if desc, ok := toolMap["description"].(string); ok {
 														sanitized := sanitizeToolDescription(desc)
 														if sanitized != desc {
 															toolMap["description"] = sanitized
-												fix(网关): 对齐 Claude OAuth 请求适配

											
										
										
											2026-01-15 18:54:42 +08:00
+														}
-												fix(网关): 补齐非 Claude Code OAuth 兼容

											
										
										
											2026-01-16 00:41:29 +08:00
+													}
 													if schema, ok := toolMap["input_schema"]; ok {
 														normalizeToolInputSchema(schema, toolNameMap)
-												fix(网关): 对齐 Claude OAuth 请求适配

											
										
										
											2026-01-15 18:54:42 +08:00
+													}
 													normalizedTools[normalized] = toolMap
 													continue
 												}
 												normalizedTools[normalized] = value
 											}
 											req["tools"] = normalizedTools
 										}
 									} else {
 										req["tools"] = []any{}
 									}
 									if messages, ok := req["messages"].([]any); ok {
 										for _, msg := range messages {
 											msgMap, ok := msg.(map[string]any)
 											if !ok {
 												continue
 											}
 											content, ok := msgMap["content"].([]any)
 											if !ok {
 												continue
 											}
 											for _, block := range content {
 												blockMap, ok := block.(map[string]any)
 												if !ok {
 													continue
 												}
 												if blockType, _ := blockMap["type"].(string); blockType != "tool_use" {
 													continue
 												}
 												if name, ok := blockMap["name"].(string); ok {
 													normalized := normalizeToolNameForClaude(name, toolNameMap)
 													if normalized != "" && normalized != name {
 														blockMap["name"] = normalized
 													}
 												}
 											}
 										}
 									}
 									if opts.stripSystemCacheControl {
 										if system, ok := req["system"]; ok {
 											_ = stripCacheControlFromSystemBlocks(system)
 										}
 									}
 									if opts.injectMetadata && opts.metadataUserID != "" {
 										metadata, ok := req["metadata"].(map[string]any)
 										if !ok {
 											metadata = map[string]any{}
 											req["metadata"] = metadata
 										}
 										if existing, ok := metadata["user_id"].(string); !ok || existing == "" {
 											metadata["user_id"] = opts.metadataUserID
 										}
 									}
-												fix(gateway): satisfy golangci-lint checks

											
										
										
											2026-01-17 18:16:34 +08:00
+									delete(req, "temperature")
 									delete(req, "tool_choice")
-												fix(网关): 对齐 Claude OAuth 请求适配

											
										
										
											2026-01-15 18:54:42 +08:00
 									newBody, err := json.Marshal(req)
 									if err != nil {
 										return body, modelID, toolNameMap
 									}
 									return newBody, modelID, toolNameMap
 								}
 								func (s *GatewayService) buildOAuthMetadataUserID(parsed *ParsedRequest, account *Account, fp *Fingerprint) string {
-												fix(网关): 补齐非 Claude Code OAuth 兼容

											
										
										
											2026-01-16 00:41:29 +08:00
+									if parsed == nil || account == nil {
-												fix(网关): 对齐 Claude OAuth 请求适配

											
										
										
											2026-01-15 18:54:42 +08:00
+										return ""
 									}
 									if parsed.MetadataUserID != "" {
 										return ""
 									}
-												fix(网关): 补齐非 Claude Code OAuth 兼容

											
										
										
											2026-01-16 00:41:29 +08:00
 									userID := strings.TrimSpace(account.GetClaudeUserID())
 									if userID == "" && fp != nil {
 										userID = fp.ClientID
 									}
 									if userID == "" {
-												fix(oauth): mimic Claude Code metadata and beta headers

											
										
										
											2026-01-29 01:49:51 +08:00
+										// Fall back to a random, well-formed client id so we can still satisfy
 										// Claude Code OAuth requirements when account metadata is incomplete.
 										userID = generateClientID()
-												fix(网关): 补齐非 Claude Code OAuth 兼容

											
										
										
											2026-01-16 00:41:29 +08:00
+									}
-												fix(网关): 对齐 Claude OAuth 请求适配

											
										
										
											2026-01-15 18:54:42 +08:00
+									sessionHash := s.GenerateSessionHash(parsed)
 									sessionID := uuid.NewString()
 									if sessionHash != "" {
 										seed := fmt.Sprintf("%d::%s", account.ID, sessionHash)
 										sessionID = generateSessionUUID(seed)
 									}
-												fix(oauth): mimic Claude Code metadata and beta headers

											
										
										
											2026-01-29 01:49:51 +08:00
 									// Prefer the newer format that includes account_uuid (if present),
 									// otherwise fall back to the legacy Claude Code format.
 									accountUUID := strings.TrimSpace(account.GetExtraString("account_uuid"))
 									if accountUUID != "" {
 										return fmt.Sprintf("user_%s_account_%s_session_%s", userID, accountUUID, sessionID)
 									}
 									return fmt.Sprintf("user_%s_account__session_%s", userID, sessionID)
-												fix(网关): 对齐 Claude OAuth 请求适配

											
										
										
											2026-01-15 18:54:42 +08:00
+								}
 								func generateSessionUUID(seed string) string {
 									if seed == "" {
 										return uuid.NewString()
 									}
 									hash := sha256.Sum256([]byte(seed))
 									bytes := hash[:16]
 									bytes[6] = (bytes[6] & 0x0f) | 0x40
 									bytes[8] = (bytes[8] & 0x3f) | 0x80
 									return fmt.Sprintf("%x-%x-%x-%x-%x",
 										bytes[0:4], bytes[4:6], bytes[6:8], bytes[8:10], bytes[10:16])
 								}
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+								// SelectAccount 选择账号（粘性会话+优先级）
-												refactor: 调整项目结构为单向依赖

											
										
										
											2025-12-26 15:40:24 +08:00
+								func (s *GatewayService) SelectAccount(ctx context.Context, groupID *int64, sessionHash string) (*Account, error) {
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									return s.SelectAccountForModel(ctx, groupID, sessionHash, "")
 								}
 								// SelectAccountForModel 选择支持指定模型的账号（粘性会话+优先级+模型映射）
-												refactor: 调整项目结构为单向依赖

											
										
										
											2025-12-26 15:40:24 +08:00
+								func (s *GatewayService) SelectAccountForModel(ctx context.Context, groupID *int64, sessionHash string, requestedModel string) (*Account, error) {
-												feat: cc/codex support account retry

											
										
										
											2025-12-27 11:44:00 +08:00
+									return s.SelectAccountForModelWithExclusions(ctx, groupID, sessionHash, requestedModel, nil)
 								}
 								// SelectAccountForModelWithExclusions selects an account supporting the requested model while excluding specified accounts.
 								func (s *GatewayService) SelectAccountForModelWithExclusions(ctx context.Context, groupID *int64, sessionHash string, requestedModel string, excludedIDs map[int64]struct{}) (*Account, error) {
-												feat(antigravity): 添加专用路由，支持仅使用 antigravity 账户

添加 /antigravity/v1/* 和 /antigravity/v1beta/* 路由：
- 通过 ForcePlatform 中间件强制使用 antigravity 平台
- 跳过混合调度逻辑，仅调度 antigravity 账户
- 支持按分组优先查找，找不到时回退查询全部 antigravity 账户

修复 context key 类型不匹配问题：
- middleware 和 service 统一使用字符串常量 "ctx_force_platform"
- 解决 Go context.Value() 类型+值匹配导致的读取失败

其他改动：
- 嵌入式前端中间件白名单添加 /antigravity/ 路径
- e2e 测试 Gemini 端点 URL 添加 endpointPrefix 支持

											
										
										
											2025-12-29 16:52:55 +08:00
+									// 优先检查 context 中的强制平台（/antigravity 路由）
-												feat(antigravity): 添加混合调度可选功能

- 后端：账户模型添加 IsMixedSchedulingEnabled() 方法，读取 extra.mixed_scheduling
- 后端：gateway_service 和 gemini_messages_compat_service 支持混合调度逻辑
- 后端：分组创建支持指定 platform 参数
- 前端：账户创建/编辑弹窗添加混合调度开关（仅 antigravity 账户显示）
- 前端：混合调度开关添加问号图标和 tooltip 说明
- 前端：GroupSelector 支持根据 mixedScheduling 属性过滤分组
- 前端：分组创建支持选择 platform
- 测试：e2e 测试添加 ENDPOINT_PREFIX 环境变量支持混合/隔离模式测试
- 测试：删除过时的 Claude signature 测试用例

											
										
										
											2025-12-29 09:44:39 +08:00
+									var platform string
-												fix: 修复 golangci-lint 检查错误

- SA1029: 创建 ctxkey 包定义类型安全的 context key
- ST1005: 错误字符串首字母改小写
- errcheck: 显式忽略 bytes.Buffer.Write 返回值
- 修复单元测试中 GatewayService 缺少 cfg 字段的问题

											
										
										
											2025-12-29 17:46:52 +08:00
+									forcePlatform, hasForcePlatform := ctx.Value(ctxkey.ForcePlatform).(string)
-												feat(antigravity): 添加专用路由，支持仅使用 antigravity 账户

添加 /antigravity/v1/* 和 /antigravity/v1beta/* 路由：
- 通过 ForcePlatform 中间件强制使用 antigravity 平台
- 跳过混合调度逻辑，仅调度 antigravity 账户
- 支持按分组优先查找，找不到时回退查询全部 antigravity 账户

修复 context key 类型不匹配问题：
- middleware 和 service 统一使用字符串常量 "ctx_force_platform"
- 解决 Go context.Value() 类型+值匹配导致的读取失败

其他改动：
- 嵌入式前端中间件白名单添加 /antigravity/ 路径
- e2e 测试 Gemini 端点 URL 添加 endpointPrefix 支持

											
										
										
											2025-12-29 16:52:55 +08:00
+									if hasForcePlatform && forcePlatform != "" {
 										platform = forcePlatform
 									} else if groupID != nil {
-												perf(网关): 复用分组上下文减少热路径查询

新增 GetByIDLite 并在网关与 Gemini 选择流程复用上下文 group，避免 COUNT 触发
更新 API key 中间件注入 group 上下文，减少重复查库
补充 gateway/gemini 中间件与仓库层回归测试

测试: make test

											
										
										
											2026-01-09 23:01:42 +08:00
+										group, resolvedGroupID, err := s.resolveGatewayGroup(ctx, groupID)
-												feat(antigravity): 添加混合调度可选功能

- 后端：账户模型添加 IsMixedSchedulingEnabled() 方法，读取 extra.mixed_scheduling
- 后端：gateway_service 和 gemini_messages_compat_service 支持混合调度逻辑
- 后端：分组创建支持指定 platform 参数
- 前端：账户创建/编辑弹窗添加混合调度开关（仅 antigravity 账户显示）
- 前端：混合调度开关添加问号图标和 tooltip 说明
- 前端：GroupSelector 支持根据 mixedScheduling 属性过滤分组
- 前端：分组创建支持选择 platform
- 测试：e2e 测试添加 ENDPOINT_PREFIX 环境变量支持混合/隔离模式测试
- 测试：删除过时的 Claude signature 测试用例

											
										
										
											2025-12-29 09:44:39 +08:00
+										if err != nil {
-												perf(网关): 复用分组上下文减少热路径查询

新增 GetByIDLite 并在网关与 Gemini 选择流程复用上下文 group，避免 COUNT 触发
更新 API key 中间件注入 group 上下文，减少重复查库
补充 gateway/gemini 中间件与仓库层回归测试

测试: make test

											
										
										
											2026-01-09 23:01:42 +08:00
+											return nil, err
-												feat(antigravity): 添加混合调度可选功能

- 后端：账户模型添加 IsMixedSchedulingEnabled() 方法，读取 extra.mixed_scheduling
- 后端：gateway_service 和 gemini_messages_compat_service 支持混合调度逻辑
- 后端：分组创建支持指定 platform 参数
- 前端：账户创建/编辑弹窗添加混合调度开关（仅 antigravity 账户显示）
- 前端：混合调度开关添加问号图标和 tooltip 说明
- 前端：GroupSelector 支持根据 mixedScheduling 属性过滤分组
- 前端：分组创建支持选择 platform
- 测试：e2e 测试添加 ENDPOINT_PREFIX 环境变量支持混合/隔离模式测试
- 测试：删除过时的 Claude signature 测试用例

											
										
										
											2025-12-29 09:44:39 +08:00
+										}
-												perf(网关): 复用分组上下文减少热路径查询

新增 GetByIDLite 并在网关与 Gemini 选择流程复用上下文 group，避免 COUNT 触发
更新 API key 中间件注入 group 上下文，减少重复查库
补充 gateway/gemini 中间件与仓库层回归测试

测试: make test

											
										
										
											2026-01-09 23:01:42 +08:00
+										groupID = resolvedGroupID
 										ctx = s.withGroupContext(ctx, group)
-												feat(antigravity): 添加混合调度可选功能

- 后端：账户模型添加 IsMixedSchedulingEnabled() 方法，读取 extra.mixed_scheduling
- 后端：gateway_service 和 gemini_messages_compat_service 支持混合调度逻辑
- 后端：分组创建支持指定 platform 参数
- 前端：账户创建/编辑弹窗添加混合调度开关（仅 antigravity 账户显示）
- 前端：混合调度开关添加问号图标和 tooltip 说明
- 前端：GroupSelector 支持根据 mixedScheduling 属性过滤分组
- 前端：分组创建支持选择 platform
- 测试：e2e 测试添加 ENDPOINT_PREFIX 环境变量支持混合/隔离模式测试
- 测试：删除过时的 Claude signature 测试用例

											
										
										
											2025-12-29 09:44:39 +08:00
+										platform = group.Platform
 									} else {
 										// 无分组时只使用原生 anthropic 平台
 										platform = PlatformAnthropic
 									}
 									// anthropic/gemini 分组支持混合调度（包含启用了 mixed_scheduling 的 antigravity 账户）
-												feat(antigravity): 添加专用路由，支持仅使用 antigravity 账户

添加 /antigravity/v1/* 和 /antigravity/v1beta/* 路由：
- 通过 ForcePlatform 中间件强制使用 antigravity 平台
- 跳过混合调度逻辑，仅调度 antigravity 账户
- 支持按分组优先查找，找不到时回退查询全部 antigravity 账户

修复 context key 类型不匹配问题：
- middleware 和 service 统一使用字符串常量 "ctx_force_platform"
- 解决 Go context.Value() 类型+值匹配导致的读取失败

其他改动：
- 嵌入式前端中间件白名单添加 /antigravity/ 路径
- e2e 测试 Gemini 端点 URL 添加 endpointPrefix 支持

											
										
										
											2025-12-29 16:52:55 +08:00
+									// 注意：强制平台模式不走混合调度
 									if (platform == PlatformAnthropic || platform == PlatformGemini) && !hasForcePlatform {
-												feat(antigravity): 添加混合调度可选功能

- 后端：账户模型添加 IsMixedSchedulingEnabled() 方法，读取 extra.mixed_scheduling
- 后端：gateway_service 和 gemini_messages_compat_service 支持混合调度逻辑
- 后端：分组创建支持指定 platform 参数
- 前端：账户创建/编辑弹窗添加混合调度开关（仅 antigravity 账户显示）
- 前端：混合调度开关添加问号图标和 tooltip 说明
- 前端：GroupSelector 支持根据 mixedScheduling 属性过滤分组
- 前端：分组创建支持选择 platform
- 测试：e2e 测试添加 ENDPOINT_PREFIX 环境变量支持混合/隔离模式测试
- 测试：删除过时的 Claude signature 测试用例

											
										
										
											2025-12-29 09:44:39 +08:00
+										return s.selectAccountWithMixedScheduling(ctx, groupID, sessionHash, requestedModel, excludedIDs, platform)
 									}
-												feat(antigravity): 添加专用路由，支持仅使用 antigravity 账户

添加 /antigravity/v1/* 和 /antigravity/v1beta/* 路由：
- 通过 ForcePlatform 中间件强制使用 antigravity 平台
- 跳过混合调度逻辑，仅调度 antigravity 账户
- 支持按分组优先查找，找不到时回退查询全部 antigravity 账户

修复 context key 类型不匹配问题：
- middleware 和 service 统一使用字符串常量 "ctx_force_platform"
- 解决 Go context.Value() 类型+值匹配导致的读取失败

其他改动：
- 嵌入式前端中间件白名单添加 /antigravity/ 路径
- e2e 测试 Gemini 端点 URL 添加 endpointPrefix 支持

											
										
										
											2025-12-29 16:52:55 +08:00
+									// antigravity 分组、强制平台模式或无分组使用单平台选择
-												fix(gateway): 修复账号跨分组调度问题

问题：账号可能被调度到未分配的分组（如 simon 账号被调度到 claude_default）

根因：
- 强制平台模式下分组查询失败时回退到全平台查询
- listSchedulableAccounts 中分组为空时回退到无分组查询
- 粘性会话只检查平台匹配，未校验账号分组归属

修复：
- 移除强制平台模式的回退逻辑，分组内无账号时返回错误
- 移除 listSchedulableAccounts 的回退逻辑
- 新增 isAccountInGroup 方法用于分组校验
- 在三处粘性会话检查中增加分组归属验证

											
										
										
											2026-01-07 10:56:52 +08:00
+									// 注意：强制平台模式也必须遵守分组限制，不再回退到全平台查询
-												feat(antigravity): 添加混合调度可选功能

- 后端：账户模型添加 IsMixedSchedulingEnabled() 方法，读取 extra.mixed_scheduling
- 后端：gateway_service 和 gemini_messages_compat_service 支持混合调度逻辑
- 后端：分组创建支持指定 platform 参数
- 前端：账户创建/编辑弹窗添加混合调度开关（仅 antigravity 账户显示）
- 前端：混合调度开关添加问号图标和 tooltip 说明
- 前端：GroupSelector 支持根据 mixedScheduling 属性过滤分组
- 前端：分组创建支持选择 platform
- 测试：e2e 测试添加 ENDPOINT_PREFIX 环境变量支持混合/隔离模式测试
- 测试：删除过时的 Claude signature 测试用例

											
										
										
											2025-12-29 09:44:39 +08:00
+									return s.selectAccountForModelWithPlatform(ctx, groupID, sessionHash, requestedModel, excludedIDs, platform)
-												feat: 完善 Antigravity 多平台网关支持，修复 Gemini handler 分流逻辑

											
										
										
											2025-12-28 17:48:52 +08:00
+								}
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+								// SelectAccountWithLoadAwareness selects account with load-awareness and wait plan.
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+								// metadataUserID: 已废弃参数，会话限制现在统一使用 sessionHash
-												feat: 添加5h窗口费用控制和会话数量限制

- 支持Anthropic OAuth/SetupToken账号的5h窗口费用阈值控制
- 支持账号级别的并发会话数量限制
- 使用Redis缓存窗口费用(30秒TTL)减少数据库压力
- 费用计算基于标准费用(不含账号倍率)

											
										
										
											2026-01-16 23:36:52 +08:00
+								func (s *GatewayService) SelectAccountWithLoadAwareness(ctx context.Context, groupID *int64, sessionHash string, requestedModel string, excludedIDs map[int64]struct{}, metadataUserID string) (*AccountSelectionResult, error) {
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+									// 调试日志：记录调度入口参数
 									excludedIDsList := make([]int64, 0, len(excludedIDs))
 									for id := range excludedIDs {
 										excludedIDsList = append(excludedIDsList, id)
 									}
 									slog.Debug("account_scheduling_starting",
 										"group_id", derefGroupID(groupID),
 										"model", requestedModel,
 										"session", shortSessionHash(sessionHash),
 										"excluded_ids", excludedIDsList)
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+									cfg := s.schedulingConfig()
-												feat: 添加5h窗口费用控制和会话数量限制

- 支持Anthropic OAuth/SetupToken账号的5h窗口费用阈值控制
- 支持账号级别的并发会话数量限制
- 使用Redis缓存窗口费用(30秒TTL)减少数据库压力
- 费用计算基于标准费用(不含账号倍率)

											
										
										
											2026-01-16 23:36:52 +08:00
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+									var stickyAccountID int64
 									if sessionHash != "" && s.cache != nil {
-												feat(groups): add Claude Code client restriction and session isolation

- Add claude_code_only field to restrict groups to Claude Code clients only
- Add fallback_group_id for non-Claude Code requests to use alternate group
- Implement ClaudeCodeValidator for User-Agent detection
- Add group-level session binding isolation (groupID in Redis key)
- Prevent cross-group sticky session pollution
- Update frontend with Claude Code restriction controls

											
										
										
											2026-01-08 23:07:00 +08:00
+										if accountID, err := s.cache.GetSessionAccountID(ctx, derefGroupID(groupID), sessionHash); err == nil {
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+											stickyAccountID = accountID
 										}
 									}
-												feat(groups): add Claude Code client restriction and session isolation

- Add claude_code_only field to restrict groups to Claude Code clients only
- Add fallback_group_id for non-Claude Code requests to use alternate group
- Implement ClaudeCodeValidator for User-Agent detection
- Add group-level session binding isolation (groupID in Redis key)
- Prevent cross-group sticky session pollution
- Update frontend with Claude Code restriction controls

											
										
										
											2026-01-08 23:07:00 +08:00
 									// 检查 Claude Code 客户端限制（可能会替换 groupID 为降级分组）
-												perf(网关): 复用分组上下文减少热路径查询

新增 GetByIDLite 并在网关与 Gemini 选择流程复用上下文 group，避免 COUNT 触发
更新 API key 中间件注入 group 上下文，减少重复查库
补充 gateway/gemini 中间件与仓库层回归测试

测试: make test

											
										
										
											2026-01-09 23:01:42 +08:00
+									group, groupID, err := s.checkClaudeCodeRestriction(ctx, groupID)
-												feat(groups): add Claude Code client restriction and session isolation

- Add claude_code_only field to restrict groups to Claude Code clients only
- Add fallback_group_id for non-Claude Code requests to use alternate group
- Implement ClaudeCodeValidator for User-Agent detection
- Add group-level session binding isolation (groupID in Redis key)
- Prevent cross-group sticky session pollution
- Update frontend with Claude Code restriction controls

											
										
										
											2026-01-08 23:07:00 +08:00
+									if err != nil {
 										return nil, err
 									}
-												perf(网关): 复用分组上下文减少热路径查询

新增 GetByIDLite 并在网关与 Gemini 选择流程复用上下文 group，避免 COUNT 触发
更新 API key 中间件注入 group 上下文，减少重复查库
补充 gateway/gemini 中间件与仓库层回归测试

测试: make test

											
										
										
											2026-01-09 23:01:42 +08:00
+									ctx = s.withGroupContext(ctx, group)
-												feat(groups): add Claude Code client restriction and session isolation

- Add claude_code_only field to restrict groups to Claude Code clients only
- Add fallback_group_id for non-Claude Code requests to use alternate group
- Implement ClaudeCodeValidator for User-Agent detection
- Add group-level session binding isolation (groupID in Redis key)
- Prevent cross-group sticky session pollution
- Update frontend with Claude Code restriction controls

											
										
										
											2026-01-08 23:07:00 +08:00
-												feat(group): 添加分组级别模型路由配置功能
  支持为分组配置模型路由规则，可以指定特定模型模式优先使用的账号列表。

  - 新增 model_routing 字段存储路由配置（JSONB格式，支持通配符匹配）

  - 新增 model_routing_enabled 字段控制是否启用路由

  - 更新后端 handler/service/repository 支持路由配置的增删改查

  - 更新前端 GroupsView 添加路由配置界面

  - 添加数据库迁移脚本 040/041

											
										
										
											2026-01-16 17:26:05 +08:00
+									if s.debugModelRoutingEnabled() && requestedModel != "" {
 										groupPlatform := ""
 										if group != nil {
 											groupPlatform = group.Platform
 										}
 										log.Printf("[ModelRoutingDebug] select entry: group_id=%v group_platform=%s model=%s session=%s sticky_account=%d load_batch=%v concurrency=%v",
 											derefGroupID(groupID), groupPlatform, requestedModel, shortSessionHash(sessionHash), stickyAccountID, cfg.LoadBatchEnabled, s.concurrencyService != nil)
 									}
-												feat(groups): add Claude Code client restriction and session isolation

- Add claude_code_only field to restrict groups to Claude Code clients only
- Add fallback_group_id for non-Claude Code requests to use alternate group
- Implement ClaudeCodeValidator for User-Agent detection
- Add group-level session binding isolation (groupID in Redis key)
- Prevent cross-group sticky session pollution
- Update frontend with Claude Code restriction controls

											
										
										
											2026-01-08 23:07:00 +08:00
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+									if s.concurrencyService == nil || !cfg.LoadBatchEnabled {
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+										// 复制排除列表，用于会话限制拒绝时的重试
 										localExcluded := make(map[int64]struct{})
 										for k, v := range excludedIDs {
 											localExcluded[k] = v
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+										}
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
 										for {
 											account, err := s.SelectAccountForModelWithExclusions(ctx, groupID, sessionHash, requestedModel, localExcluded)
 											if err != nil {
 												return nil, err
 											}
 											result, err := s.tryAcquireAccountSlot(ctx, account.ID, account.Concurrency)
 											if err == nil && result.Acquired {
 												// 获取槽位后检查会话限制（使用 sessionHash 作为会话标识符）
 												if !s.checkAndRegisterSession(ctx, account, sessionHash) {
 													result.ReleaseFunc()                   // 释放槽位
 													localExcluded[account.ID] = struct{}{} // 排除此账号
 													continue                               // 重新选择
 												}
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+												return &AccountSelectionResult{
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+													Account:     account,
 													Acquired:    true,
 													ReleaseFunc: result.ReleaseFunc,
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+												}, nil
 											}
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
 											// 对于等待计划的情况，也需要先检查会话限制
 											if !s.checkAndRegisterSession(ctx, account, sessionHash) {
 												localExcluded[account.ID] = struct{}{}
 												continue
 											}
 											if stickyAccountID > 0 && stickyAccountID == account.ID && s.concurrencyService != nil {
 												waitingCount, _ := s.concurrencyService.GetAccountWaitingCount(ctx, account.ID)
 												if waitingCount < cfg.StickySessionMaxWaiting {
 													return &AccountSelectionResult{
 														Account: account,
 														WaitPlan: &AccountWaitPlan{
 															AccountID:      account.ID,
 															MaxConcurrency: account.Concurrency,
 															Timeout:        cfg.StickySessionWaitTimeout,
 															MaxWaiting:     cfg.StickySessionMaxWaiting,
 														},
 													}, nil
 												}
 											}
 											return &AccountSelectionResult{
 												Account: account,
 												WaitPlan: &AccountWaitPlan{
 													AccountID:      account.ID,
 													MaxConcurrency: account.Concurrency,
 													Timeout:        cfg.FallbackWaitTimeout,
 													MaxWaiting:     cfg.FallbackMaxWaiting,
 												},
 											}, nil
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+										}
 									}
-												perf(网关): 复用分组上下文减少热路径查询

新增 GetByIDLite 并在网关与 Gemini 选择流程复用上下文 group，避免 COUNT 触发
更新 API key 中间件注入 group 上下文，减少重复查库
补充 gateway/gemini 中间件与仓库层回归测试

测试: make test

											
										
										
											2026-01-09 23:01:42 +08:00
+									platform, hasForcePlatform, err := s.resolvePlatform(ctx, groupID, group)
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+									if err != nil {
 										return nil, err
 									}
 									preferOAuth := platform == PlatformGemini
-												feat(group): 添加分组级别模型路由配置功能
  支持为分组配置模型路由规则，可以指定特定模型模式优先使用的账号列表。

  - 新增 model_routing 字段存储路由配置（JSONB格式，支持通配符匹配）

  - 新增 model_routing_enabled 字段控制是否启用路由

  - 更新后端 handler/service/repository 支持路由配置的增删改查

  - 更新前端 GroupsView 添加路由配置界面

  - 添加数据库迁移脚本 040/041

											
										
										
											2026-01-16 17:26:05 +08:00
+									if s.debugModelRoutingEnabled() && platform == PlatformAnthropic && requestedModel != "" {
 										log.Printf("[ModelRoutingDebug] load-aware enabled: group_id=%v model=%s session=%s platform=%s", derefGroupID(groupID), requestedModel, shortSessionHash(sessionHash), platform)
 									}
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
-												chore: apply stashed changes

											
										
										
											2026-02-02 22:20:08 +08:00
+									// Antigravity 模型系列检查（在账号选择前检查，确保所有代码路径都经过此检查）
 									if platform == PlatformAntigravity && groupID != nil && requestedModel != "" {
 										if err := s.checkAntigravityModelScope(ctx, *groupID, requestedModel); err != nil {
 											return nil, err
 										}
 									}
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+									accounts, useMixed, err := s.listSchedulableAccounts(ctx, groupID, platform, hasForcePlatform)
 									if err != nil {
 										return nil, err
 									}
 									if len(accounts) == 0 {
 										return nil, errors.New("no available accounts")
 									}
 									isExcluded := func(accountID int64) bool {
 										if excludedIDs == nil {
 											return false
 										}
 										_, excluded := excludedIDs[accountID]
 										return excluded
 									}
-												feat(group): 添加分组级别模型路由配置功能
  支持为分组配置模型路由规则，可以指定特定模型模式优先使用的账号列表。

  - 新增 model_routing 字段存储路由配置（JSONB格式，支持通配符匹配）

  - 新增 model_routing_enabled 字段控制是否启用路由

  - 更新后端 handler/service/repository 支持路由配置的增删改查

  - 更新前端 GroupsView 添加路由配置界面

  - 添加数据库迁移脚本 040/041

											
										
										
											2026-01-16 17:26:05 +08:00
+									// 提前构建 accountByID（供 Layer 1 和 Layer 1.5 使用）
 									accountByID := make(map[int64]*Account, len(accounts))
 									for i := range accounts {
 										accountByID[accounts[i].ID] = &accounts[i]
 									}
 									// 获取模型路由配置（仅 anthropic 平台）
 									var routingAccountIDs []int64
 									if group != nil && requestedModel != "" && group.Platform == PlatformAnthropic {
 										routingAccountIDs = group.GetRoutingAccountIDs(requestedModel)
 										if s.debugModelRoutingEnabled() {
 											log.Printf("[ModelRoutingDebug] context group routing: group_id=%d model=%s enabled=%v rules=%d matched_ids=%v session=%s sticky_account=%d",
 												group.ID, requestedModel, group.ModelRoutingEnabled, len(group.ModelRouting), routingAccountIDs, shortSessionHash(sessionHash), stickyAccountID)
 											if len(routingAccountIDs) == 0 && group.ModelRoutingEnabled && len(group.ModelRouting) > 0 {
 												keys := make([]string, 0, len(group.ModelRouting))
 												for k := range group.ModelRouting {
 													keys = append(keys, k)
 												}
 												sort.Strings(keys)
 												const maxKeys = 20
 												if len(keys) > maxKeys {
 													keys = keys[:maxKeys]
 												}
 												log.Printf("[ModelRoutingDebug] context group routing miss: group_id=%d model=%s patterns(sample)=%v", group.ID, requestedModel, keys)
 											}
 										}
 									}
 									// ============ Layer 1: 模型路由优先选择（优先级高于粘性会话） ============
 									if len(routingAccountIDs) > 0 && s.concurrencyService != nil {
 										// 1. 过滤出路由列表中可调度的账号
 										var routingCandidates []*Account
-												feat: 添加5h窗口费用控制和会话数量限制

- 支持Anthropic OAuth/SetupToken账号的5h窗口费用阈值控制
- 支持账号级别的并发会话数量限制
- 使用Redis缓存窗口费用(30秒TTL)减少数据库压力
- 费用计算基于标准费用(不含账号倍率)

											
										
										
											2026-01-16 23:36:52 +08:00
+										var filteredExcluded, filteredMissing, filteredUnsched, filteredPlatform, filteredModelScope, filteredModelMapping, filteredWindowCost int
-												feat(group): 添加分组级别模型路由配置功能
  支持为分组配置模型路由规则，可以指定特定模型模式优先使用的账号列表。

  - 新增 model_routing 字段存储路由配置（JSONB格式，支持通配符匹配）

  - 新增 model_routing_enabled 字段控制是否启用路由

  - 更新后端 handler/service/repository 支持路由配置的增删改查

  - 更新前端 GroupsView 添加路由配置界面

  - 添加数据库迁移脚本 040/041

											
										
										
											2026-01-16 17:26:05 +08:00
+										for _, routingAccountID := range routingAccountIDs {
 											if isExcluded(routingAccountID) {
 												filteredExcluded++
 												continue
 											}
 											account, ok := accountByID[routingAccountID]
 											if !ok || !account.IsSchedulable() {
 												if !ok {
 													filteredMissing++
 												} else {
 													filteredUnsched++
 												}
 												continue
 											}
 											if !s.isAccountAllowedForPlatform(account, platform, useMixed) {
 												filteredPlatform++
 												continue
 											}
 											if !account.IsSchedulableForModel(requestedModel) {
 												filteredModelScope++
 												continue
 											}
 											if requestedModel != "" && !s.isModelSupportedByAccount(account, requestedModel) {
 												filteredModelMapping++
 												continue
 											}
-												feat: 添加5h窗口费用控制和会话数量限制

- 支持Anthropic OAuth/SetupToken账号的5h窗口费用阈值控制
- 支持账号级别的并发会话数量限制
- 使用Redis缓存窗口费用(30秒TTL)减少数据库压力
- 费用计算基于标准费用(不含账号倍率)

											
										
										
											2026-01-16 23:36:52 +08:00
+											// 窗口费用检查（非粘性会话路径）
 											if !s.isAccountSchedulableForWindowCost(ctx, account, false) {
 												filteredWindowCost++
 												continue
 											}
-												feat(group): 添加分组级别模型路由配置功能
  支持为分组配置模型路由规则，可以指定特定模型模式优先使用的账号列表。

  - 新增 model_routing 字段存储路由配置（JSONB格式，支持通配符匹配）

  - 新增 model_routing_enabled 字段控制是否启用路由

  - 更新后端 handler/service/repository 支持路由配置的增删改查

  - 更新前端 GroupsView 添加路由配置界面

  - 添加数据库迁移脚本 040/041

											
										
										
											2026-01-16 17:26:05 +08:00
+											routingCandidates = append(routingCandidates, account)
 										}
 										if s.debugModelRoutingEnabled() {
-												feat: 添加5h窗口费用控制和会话数量限制

- 支持Anthropic OAuth/SetupToken账号的5h窗口费用阈值控制
- 支持账号级别的并发会话数量限制
- 使用Redis缓存窗口费用(30秒TTL)减少数据库压力
- 费用计算基于标准费用(不含账号倍率)

											
										
										
											2026-01-16 23:36:52 +08:00
+											log.Printf("[ModelRoutingDebug] routed candidates: group_id=%v model=%s routed=%d candidates=%d filtered(excluded=%d missing=%d unsched=%d platform=%d model_scope=%d model_mapping=%d window_cost=%d)",
-												feat(group): 添加分组级别模型路由配置功能
  支持为分组配置模型路由规则，可以指定特定模型模式优先使用的账号列表。

  - 新增 model_routing 字段存储路由配置（JSONB格式，支持通配符匹配）

  - 新增 model_routing_enabled 字段控制是否启用路由

  - 更新后端 handler/service/repository 支持路由配置的增删改查

  - 更新前端 GroupsView 添加路由配置界面

  - 添加数据库迁移脚本 040/041

											
										
										
											2026-01-16 17:26:05 +08:00
+												derefGroupID(groupID), requestedModel, len(routingAccountIDs), len(routingCandidates),
-												feat: 添加5h窗口费用控制和会话数量限制

- 支持Anthropic OAuth/SetupToken账号的5h窗口费用阈值控制
- 支持账号级别的并发会话数量限制
- 使用Redis缓存窗口费用(30秒TTL)减少数据库压力
- 费用计算基于标准费用(不含账号倍率)

											
										
										
											2026-01-16 23:36:52 +08:00
+												filteredExcluded, filteredMissing, filteredUnsched, filteredPlatform, filteredModelScope, filteredModelMapping, filteredWindowCost)
-												feat(group): 添加分组级别模型路由配置功能
  支持为分组配置模型路由规则，可以指定特定模型模式优先使用的账号列表。

  - 新增 model_routing 字段存储路由配置（JSONB格式，支持通配符匹配）

  - 新增 model_routing_enabled 字段控制是否启用路由

  - 更新后端 handler/service/repository 支持路由配置的增删改查

  - 更新前端 GroupsView 添加路由配置界面

  - 添加数据库迁移脚本 040/041

											
										
										
											2026-01-16 17:26:05 +08:00
+										}
 										if len(routingCandidates) > 0 {
 											// 1.5. 在路由账号范围内检查粘性会话
 											if sessionHash != "" && s.cache != nil {
 												stickyAccountID, err := s.cache.GetSessionAccountID(ctx, derefGroupID(groupID), sessionHash)
 												if err == nil && stickyAccountID > 0 && containsInt64(routingAccountIDs, stickyAccountID) && !isExcluded(stickyAccountID) {
 													// 粘性账号在路由列表中，优先使用
 													if stickyAccount, ok := accountByID[stickyAccountID]; ok {
 														if stickyAccount.IsSchedulable() &&
 															s.isAccountAllowedForPlatform(stickyAccount, platform, useMixed) &&
 															stickyAccount.IsSchedulableForModel(requestedModel) &&
-												feat: 添加5h窗口费用控制和会话数量限制

- 支持Anthropic OAuth/SetupToken账号的5h窗口费用阈值控制
- 支持账号级别的并发会话数量限制
- 使用Redis缓存窗口费用(30秒TTL)减少数据库压力
- 费用计算基于标准费用(不含账号倍率)

											
										
										
											2026-01-16 23:36:52 +08:00
+															(requestedModel == "" || s.isModelSupportedByAccount(stickyAccount, requestedModel)) &&
 															s.isAccountSchedulableForWindowCost(ctx, stickyAccount, true) { // 粘性会话窗口费用检查
-												feat(group): 添加分组级别模型路由配置功能
  支持为分组配置模型路由规则，可以指定特定模型模式优先使用的账号列表。

  - 新增 model_routing 字段存储路由配置（JSONB格式，支持通配符匹配）

  - 新增 model_routing_enabled 字段控制是否启用路由

  - 更新后端 handler/service/repository 支持路由配置的增删改查

  - 更新前端 GroupsView 添加路由配置界面

  - 添加数据库迁移脚本 040/041

											
										
										
											2026-01-16 17:26:05 +08:00
+															result, err := s.tryAcquireAccountSlot(ctx, stickyAccountID, stickyAccount.Concurrency)
 															if err == nil && result.Acquired {
-												feat: 添加5h窗口费用控制和会话数量限制

- 支持Anthropic OAuth/SetupToken账号的5h窗口费用阈值控制
- 支持账号级别的并发会话数量限制
- 使用Redis缓存窗口费用(30秒TTL)减少数据库压力
- 费用计算基于标准费用(不含账号倍率)

											
										
										
											2026-01-16 23:36:52 +08:00
+																// 会话数量限制检查
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+																if !s.checkAndRegisterSession(ctx, stickyAccount, sessionHash) {
-												feat: 添加5h窗口费用控制和会话数量限制

- 支持Anthropic OAuth/SetupToken账号的5h窗口费用阈值控制
- 支持账号级别的并发会话数量限制
- 使用Redis缓存窗口费用(30秒TTL)减少数据库压力
- 费用计算基于标准费用(不含账号倍率)

											
										
										
											2026-01-16 23:36:52 +08:00
+																	result.ReleaseFunc() // 释放槽位
 																	// 继续到负载感知选择
 																} else {
 																	_ = s.cache.RefreshSessionTTL(ctx, derefGroupID(groupID), sessionHash, stickySessionTTL)
 																	if s.debugModelRoutingEnabled() {
 																		log.Printf("[ModelRoutingDebug] routed sticky hit: group_id=%v model=%s session=%s account=%d", derefGroupID(groupID), requestedModel, shortSessionHash(sessionHash), stickyAccountID)
 																	}
 																	return &AccountSelectionResult{
 																		Account:     stickyAccount,
 																		Acquired:    true,
 																		ReleaseFunc: result.ReleaseFunc,
 																	}, nil
-												feat(group): 添加分组级别模型路由配置功能
  支持为分组配置模型路由规则，可以指定特定模型模式优先使用的账号列表。

  - 新增 model_routing 字段存储路由配置（JSONB格式，支持通配符匹配）

  - 新增 model_routing_enabled 字段控制是否启用路由

  - 更新后端 handler/service/repository 支持路由配置的增删改查

  - 更新前端 GroupsView 添加路由配置界面

  - 添加数据库迁移脚本 040/041

											
										
										
											2026-01-16 17:26:05 +08:00
+																}
 															}
 															waitingCount, _ := s.concurrencyService.GetAccountWaitingCount(ctx, stickyAccountID)
 															if waitingCount < cfg.StickySessionMaxWaiting {
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+																// 会话数量限制检查（等待计划也需要占用会话配额）
 																if !s.checkAndRegisterSession(ctx, stickyAccount, sessionHash) {
 																	// 会话限制已满，继续到负载感知选择
 																} else {
 																	return &AccountSelectionResult{
 																		Account: stickyAccount,
 																		WaitPlan: &AccountWaitPlan{
 																			AccountID:      stickyAccountID,
 																			MaxConcurrency: stickyAccount.Concurrency,
 																			Timeout:        cfg.StickySessionWaitTimeout,
 																			MaxWaiting:     cfg.StickySessionMaxWaiting,
 																		},
 																	}, nil
 																}
-												feat(group): 添加分组级别模型路由配置功能
  支持为分组配置模型路由规则，可以指定特定模型模式优先使用的账号列表。

  - 新增 model_routing 字段存储路由配置（JSONB格式，支持通配符匹配）

  - 新增 model_routing_enabled 字段控制是否启用路由

  - 更新后端 handler/service/repository 支持路由配置的增删改查

  - 更新前端 GroupsView 添加路由配置界面

  - 添加数据库迁移脚本 040/041

											
										
										
											2026-01-16 17:26:05 +08:00
+															}
 															// 粘性账号槽位满且等待队列已满，继续使用负载感知选择
 														}
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+													} else {
 														_ = s.cache.DeleteSessionAccountID(ctx, derefGroupID(groupID), sessionHash)
-												feat(group): 添加分组级别模型路由配置功能
  支持为分组配置模型路由规则，可以指定特定模型模式优先使用的账号列表。

  - 新增 model_routing 字段存储路由配置（JSONB格式，支持通配符匹配）

  - 新增 model_routing_enabled 字段控制是否启用路由

  - 更新后端 handler/service/repository 支持路由配置的增删改查

  - 更新前端 GroupsView 添加路由配置界面

  - 添加数据库迁移脚本 040/041

											
										
										
											2026-01-16 17:26:05 +08:00
+													}
 												}
 											}
 											// 2. 批量获取负载信息
 											routingLoads := make([]AccountWithConcurrency, 0, len(routingCandidates))
 											for _, acc := range routingCandidates {
 												routingLoads = append(routingLoads, AccountWithConcurrency{
 													ID:             acc.ID,
 													MaxConcurrency: acc.Concurrency,
 												})
 											}
 											routingLoadMap, _ := s.concurrencyService.GetAccountsLoadBatch(ctx, routingLoads)
 											// 3. 按负载感知排序
 											type accountWithLoad struct {
 												account  *Account
 												loadInfo *AccountLoadInfo
 											}
 											var routingAvailable []accountWithLoad
 											for _, acc := range routingCandidates {
 												loadInfo := routingLoadMap[acc.ID]
 												if loadInfo == nil {
 													loadInfo = &AccountLoadInfo{AccountID: acc.ID}
 												}
 												if loadInfo.LoadRate < 100 {
 													routingAvailable = append(routingAvailable, accountWithLoad{account: acc, loadInfo: loadInfo})
 												}
 											}
 											if len(routingAvailable) > 0 {
 												// 排序：优先级 > 负载率 > 最后使用时间
 												sort.SliceStable(routingAvailable, func(i, j int) bool {
 													a, b := routingAvailable[i], routingAvailable[j]
 													if a.account.Priority != b.account.Priority {
 														return a.account.Priority < b.account.Priority
 													}
 													if a.loadInfo.LoadRate != b.loadInfo.LoadRate {
 														return a.loadInfo.LoadRate < b.loadInfo.LoadRate
 													}
 													switch {
 													case a.account.LastUsedAt == nil && b.account.LastUsedAt != nil:
 														return true
 													case a.account.LastUsedAt != nil && b.account.LastUsedAt == nil:
 														return false
 													case a.account.LastUsedAt == nil && b.account.LastUsedAt == nil:
 														return false
 													default:
 														return a.account.LastUsedAt.Before(*b.account.LastUsedAt)
 													}
 												})
 												// 4. 尝试获取槽位
 												for _, item := range routingAvailable {
 													result, err := s.tryAcquireAccountSlot(ctx, item.account.ID, item.account.Concurrency)
 													if err == nil && result.Acquired {
-												feat: 添加5h窗口费用控制和会话数量限制

- 支持Anthropic OAuth/SetupToken账号的5h窗口费用阈值控制
- 支持账号级别的并发会话数量限制
- 使用Redis缓存窗口费用(30秒TTL)减少数据库压力
- 费用计算基于标准费用(不含账号倍率)

											
										
										
											2026-01-16 23:36:52 +08:00
+														// 会话数量限制检查
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+														if !s.checkAndRegisterSession(ctx, item.account, sessionHash) {
-												feat: 添加5h窗口费用控制和会话数量限制

- 支持Anthropic OAuth/SetupToken账号的5h窗口费用阈值控制
- 支持账号级别的并发会话数量限制
- 使用Redis缓存窗口费用(30秒TTL)减少数据库压力
- 费用计算基于标准费用(不含账号倍率)

											
										
										
											2026-01-16 23:36:52 +08:00
+															result.ReleaseFunc() // 释放槽位，继续尝试下一个账号
 															continue
 														}
-												feat(group): 添加分组级别模型路由配置功能
  支持为分组配置模型路由规则，可以指定特定模型模式优先使用的账号列表。

  - 新增 model_routing 字段存储路由配置（JSONB格式，支持通配符匹配）

  - 新增 model_routing_enabled 字段控制是否启用路由

  - 更新后端 handler/service/repository 支持路由配置的增删改查

  - 更新前端 GroupsView 添加路由配置界面

  - 添加数据库迁移脚本 040/041

											
										
										
											2026-01-16 17:26:05 +08:00
+														if sessionHash != "" && s.cache != nil {
 															_ = s.cache.SetSessionAccountID(ctx, derefGroupID(groupID), sessionHash, item.account.ID, stickySessionTTL)
 														}
 														if s.debugModelRoutingEnabled() {
 															log.Printf("[ModelRoutingDebug] routed select: group_id=%v model=%s session=%s account=%d", derefGroupID(groupID), requestedModel, shortSessionHash(sessionHash), item.account.ID)
 														}
 														return &AccountSelectionResult{
 															Account:     item.account,
 															Acquired:    true,
 															ReleaseFunc: result.ReleaseFunc,
 														}, nil
 													}
 												}
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+												// 5. 所有路由账号槽位满，尝试返回等待计划（选择负载最低的）
 												// 遍历找到第一个满足会话限制的账号
 												for _, item := range routingAvailable {
 													if !s.checkAndRegisterSession(ctx, item.account, sessionHash) {
 														continue // 会话限制已满，尝试下一个
 													}
 													if s.debugModelRoutingEnabled() {
 														log.Printf("[ModelRoutingDebug] routed wait: group_id=%v model=%s session=%s account=%d", derefGroupID(groupID), requestedModel, shortSessionHash(sessionHash), item.account.ID)
 													}
 													return &AccountSelectionResult{
 														Account: item.account,
 														WaitPlan: &AccountWaitPlan{
 															AccountID:      item.account.ID,
 															MaxConcurrency: item.account.Concurrency,
 															Timeout:        cfg.StickySessionWaitTimeout,
 															MaxWaiting:     cfg.StickySessionMaxWaiting,
 														},
 													}, nil
-												feat(group): 添加分组级别模型路由配置功能
  支持为分组配置模型路由规则，可以指定特定模型模式优先使用的账号列表。

  - 新增 model_routing 字段存储路由配置（JSONB格式，支持通配符匹配）

  - 新增 model_routing_enabled 字段控制是否启用路由

  - 更新后端 handler/service/repository 支持路由配置的增删改查

  - 更新前端 GroupsView 添加路由配置界面

  - 添加数据库迁移脚本 040/041

											
										
										
											2026-01-16 17:26:05 +08:00
+												}
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+												// 所有路由账号会话限制都已满，继续到 Layer 2 回退
-												feat(group): 添加分组级别模型路由配置功能
  支持为分组配置模型路由规则，可以指定特定模型模式优先使用的账号列表。

  - 新增 model_routing 字段存储路由配置（JSONB格式，支持通配符匹配）

  - 新增 model_routing_enabled 字段控制是否启用路由

  - 更新后端 handler/service/repository 支持路由配置的增删改查

  - 更新前端 GroupsView 添加路由配置界面

  - 添加数据库迁移脚本 040/041

											
										
										
											2026-01-16 17:26:05 +08:00
+											}
 											// 路由列表中的账号都不可用（负载率 >= 100），继续到 Layer 2 回退
 											log.Printf("[ModelRouting] All routed accounts unavailable for model=%s, falling back to normal selection", requestedModel)
 										}
 									}
 									// ============ Layer 1.5: 粘性会话（仅在无模型路由配置时生效） ============
 									if len(routingAccountIDs) == 0 && sessionHash != "" && s.cache != nil {
-												feat(groups): add Claude Code client restriction and session isolation

- Add claude_code_only field to restrict groups to Claude Code clients only
- Add fallback_group_id for non-Claude Code requests to use alternate group
- Implement ClaudeCodeValidator for User-Agent detection
- Add group-level session binding isolation (groupID in Redis key)
- Prevent cross-group sticky session pollution
- Update frontend with Claude Code restriction controls

											
										
										
											2026-01-08 23:07:00 +08:00
+										accountID, err := s.cache.GetSessionAccountID(ctx, derefGroupID(groupID), sessionHash)
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+										if err == nil && accountID > 0 && !isExcluded(accountID) {
-												perf(网关): 粘性会话命中复用候选账号

使用候选账号映射避免粘性命中时额外的 GetByID 查询
新增单测确保粘性命中不触发 GetByID 且提前返回

											
										
										
											2026-01-10 14:39:33 +08:00
+											account, ok := accountByID[accountID]
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+											if ok {
 												// 检查账户是否需要清理粘性会话绑定
 												// Check if the account needs sticky session cleanup
 												clearSticky := shouldClearStickySession(account)
 												if clearSticky {
 													_ = s.cache.DeleteSessionAccountID(ctx, derefGroupID(groupID), sessionHash)
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+												}
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+												if !clearSticky && s.isAccountInGroup(account, groupID) &&
 													s.isAccountAllowedForPlatform(account, platform, useMixed) &&
 													account.IsSchedulableForModel(requestedModel) &&
 													(requestedModel == "" || s.isModelSupportedByAccount(account, requestedModel)) &&
 													s.isAccountSchedulableForWindowCost(ctx, account, true) { // 粘性会话窗口费用检查
 													result, err := s.tryAcquireAccountSlot(ctx, accountID, account.Concurrency)
 													if err == nil && result.Acquired {
 														// 会话数量限制检查
 														// Session count limit check
 														if !s.checkAndRegisterSession(ctx, account, sessionHash) {
 															result.ReleaseFunc() // 释放槽位，继续到 Layer 2
 														} else {
 															_ = s.cache.RefreshSessionTTL(ctx, derefGroupID(groupID), sessionHash, stickySessionTTL)
 															return &AccountSelectionResult{
 																Account:     account,
 																Acquired:    true,
 																ReleaseFunc: result.ReleaseFunc,
 															}, nil
 														}
 													}
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+													waitingCount, _ := s.concurrencyService.GetAccountWaitingCount(ctx, accountID)
 													if waitingCount < cfg.StickySessionMaxWaiting {
 														// 会话数量限制检查（等待计划也需要占用会话配额）
 														// Session count limit check (wait plan also requires session quota)
 														if !s.checkAndRegisterSession(ctx, account, sessionHash) {
 															// 会话限制已满，继续到 Layer 2
 															// Session limit full, continue to Layer 2
 														} else {
 															return &AccountSelectionResult{
 																Account: account,
 																WaitPlan: &AccountWaitPlan{
 																	AccountID:      accountID,
 																	MaxConcurrency: account.Concurrency,
 																	Timeout:        cfg.StickySessionWaitTimeout,
 																	MaxWaiting:     cfg.StickySessionMaxWaiting,
 																},
 															}, nil
 														}
 													}
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+												}
 											}
 										}
 									}
 									// ============ Layer 2: 负载感知选择 ============
 									candidates := make([]*Account, 0, len(accounts))
 									for i := range accounts {
 										acc := &accounts[i]
 										if isExcluded(acc.ID) {
 											continue
 										}
-												fix(网关): 修复账号选择中的调度器快照延迟问题

## 问题描述
调度器快照更新存在0.5-1秒的延迟（Outbox轮询间隔），导致在账号被限流或过载后的短时间窗口内，
可能仍会被选中，造成请求失败。

## 根本原因
账号选择逻辑依赖调度器快照（listSchedulableAccounts），但快照更新有延迟：
- Outbox轮询: 每1秒检查一次变更事件
- 全量重建: 每300秒重建一次
- 时间窗口: 账号状态变更后0.5-1秒内，快照可能未更新

## 解决方案
在账号选择循环中添加IsSchedulable()实时检查，作为第二道防线：
1. 第一道防线: 调度器快照过滤（可能有延迟）
2. 第二道防线: IsSchedulable()实时检查（本次修复）

IsSchedulable()会检查：
- RateLimitResetAt: 限流重置时间
- OverloadUntil: 过载持续时间
- TempUnschedulableUntil: 临时不可调度时间
- Status: 账号状态
- Schedulable: 可调度标志

## 修改范围
### OpenAI Gateway Service
- SelectAccountForModelWithExclusions: 添加IsSchedulable()检查
- SelectAccountWithLoadAwareness: 添加IsSchedulable()检查

### Gateway Service (Claude/Gemini/Antigravity)
- 负载感知选择候选账号筛选: 添加IsSchedulable()检查
- selectAccountForModelWithPlatform: 添加IsSchedulable()检查
- selectAccountWithMixedScheduling: 添加IsSchedulable()检查

### 测试用例
- OpenAI: 添加2个测试用例验证限流账号过滤
- Gateway: 添加2个测试用例验证限流和过载账号过滤

### 其他修复
- ops_repo_preagg.go: 修复platform为NULL时的聚合问题

## 测试结果
所有单元测试通过 ✅

											
										
										
											2026-01-13 22:49:26 -08:00
+										// Scheduler snapshots can be temporarily stale (bucket rebuild is throttled);
 										// re-check schedulability here so recently rate-limited/overloaded accounts
 										// are not selected again before the bucket is rebuilt.
 										if !acc.IsSchedulable() {
 											continue
 										}
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+										if !s.isAccountAllowedForPlatform(acc, platform, useMixed) {
 											continue
 										}
-												feat: antigravity 配额域限流

											
										
										
											2026-01-09 17:35:02 +08:00
+										if !acc.IsSchedulableForModel(requestedModel) {
 											continue
 										}
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+										if requestedModel != "" && !s.isModelSupportedByAccount(acc, requestedModel) {
 											continue
 										}
-												feat: 添加5h窗口费用控制和会话数量限制

- 支持Anthropic OAuth/SetupToken账号的5h窗口费用阈值控制
- 支持账号级别的并发会话数量限制
- 使用Redis缓存窗口费用(30秒TTL)减少数据库压力
- 费用计算基于标准费用(不含账号倍率)

											
										
										
											2026-01-16 23:36:52 +08:00
+										// 窗口费用检查（非粘性会话路径）
 										if !s.isAccountSchedulableForWindowCost(ctx, acc, false) {
 											continue
 										}
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+										candidates = append(candidates, acc)
 									}
 									if len(candidates) == 0 {
 										return nil, errors.New("no available accounts")
 									}
 									accountLoads := make([]AccountWithConcurrency, 0, len(candidates))
 									for _, acc := range candidates {
 										accountLoads = append(accountLoads, AccountWithConcurrency{
 											ID:             acc.ID,
 											MaxConcurrency: acc.Concurrency,
 										})
 									}
 									loadMap, err := s.concurrencyService.GetAccountsLoadBatch(ctx, accountLoads)
 									if err != nil {
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+										if result, ok := s.tryAcquireByLegacyOrder(ctx, candidates, groupID, sessionHash, preferOAuth); ok {
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+											return result, nil
 										}
 									} else {
 										type accountWithLoad struct {
 											account  *Account
 											loadInfo *AccountLoadInfo
 										}
 										var available []accountWithLoad
 										for _, acc := range candidates {
 											loadInfo := loadMap[acc.ID]
 											if loadInfo == nil {
 												loadInfo = &AccountLoadInfo{AccountID: acc.ID}
 											}
 											if loadInfo.LoadRate < 100 {
 												available = append(available, accountWithLoad{
 													account:  acc,
 													loadInfo: loadInfo,
 												})
 											}
 										}
 										if len(available) > 0 {
 											sort.SliceStable(available, func(i, j int) bool {
 												a, b := available[i], available[j]
 												if a.account.Priority != b.account.Priority {
 													return a.account.Priority < b.account.Priority
 												}
 												if a.loadInfo.LoadRate != b.loadInfo.LoadRate {
 													return a.loadInfo.LoadRate < b.loadInfo.LoadRate
 												}
 												switch {
 												case a.account.LastUsedAt == nil && b.account.LastUsedAt != nil:
 													return true
 												case a.account.LastUsedAt != nil && b.account.LastUsedAt == nil:
 													return false
 												case a.account.LastUsedAt == nil && b.account.LastUsedAt == nil:
 													if preferOAuth && a.account.Type != b.account.Type {
 														return a.account.Type == AccountTypeOAuth
 													}
 													return false
 												default:
 													return a.account.LastUsedAt.Before(*b.account.LastUsedAt)
 												}
 											})
 											for _, item := range available {
 												result, err := s.tryAcquireAccountSlot(ctx, item.account.ID, item.account.Concurrency)
 												if err == nil && result.Acquired {
-												feat: 添加5h窗口费用控制和会话数量限制

- 支持Anthropic OAuth/SetupToken账号的5h窗口费用阈值控制
- 支持账号级别的并发会话数量限制
- 使用Redis缓存窗口费用(30秒TTL)减少数据库压力
- 费用计算基于标准费用(不含账号倍率)

											
										
										
											2026-01-16 23:36:52 +08:00
+													// 会话数量限制检查
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+													if !s.checkAndRegisterSession(ctx, item.account, sessionHash) {
-												feat: 添加5h窗口费用控制和会话数量限制

- 支持Anthropic OAuth/SetupToken账号的5h窗口费用阈值控制
- 支持账号级别的并发会话数量限制
- 使用Redis缓存窗口费用(30秒TTL)减少数据库压力
- 费用计算基于标准费用(不含账号倍率)

											
										
										
											2026-01-16 23:36:52 +08:00
+														result.ReleaseFunc() // 释放槽位，继续尝试下一个账号
 														continue
 													}
-												fix(gateway): 完善 thinking block 重试和 cache nil 检查

- 使用 FilterThinkingBlocksForRetry 替代 FilterThinkingBlocks
- count_tokens 增加 thinking block 签名错误重试
- cache nil 检查防止空指针
- shouldBill 逻辑修复避免重复扣费
- 移除 debug 日志

											
										
										
											2026-01-03 17:10:25 -08:00
+													if sessionHash != "" && s.cache != nil {
-												feat(groups): add Claude Code client restriction and session isolation

- Add claude_code_only field to restrict groups to Claude Code clients only
- Add fallback_group_id for non-Claude Code requests to use alternate group
- Implement ClaudeCodeValidator for User-Agent detection
- Add group-level session binding isolation (groupID in Redis key)
- Prevent cross-group sticky session pollution
- Update frontend with Claude Code restriction controls

											
										
										
											2026-01-08 23:07:00 +08:00
+														_ = s.cache.SetSessionAccountID(ctx, derefGroupID(groupID), sessionHash, item.account.ID, stickySessionTTL)
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+													}
 													return &AccountSelectionResult{
 														Account:     item.account,
 														Acquired:    true,
 														ReleaseFunc: result.ReleaseFunc,
 													}, nil
 												}
 											}
 										}
 									}
 									// ============ Layer 3: 兜底排队 ============
-												feat(scheduling): 兜底层账户选择策略可配置

- gateway.scheduling.fallback_selection_mode: "last_used"(默认) 或 "random"
- last_used: 按最后使用时间排序（轮询效果）
- random: 同优先级内随机选择

											
										
										
											2026-01-16 20:47:07 +08:00
+									s.sortCandidatesForFallback(candidates, preferOAuth, cfg.FallbackSelectionMode)
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+									for _, acc := range candidates {
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+										// 会话数量限制检查（等待计划也需要占用会话配额）
 										if !s.checkAndRegisterSession(ctx, acc, sessionHash) {
 											continue // 会话限制已满，尝试下一个账号
 										}
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+										return &AccountSelectionResult{
 											Account: acc,
 											WaitPlan: &AccountWaitPlan{
 												AccountID:      acc.ID,
 												MaxConcurrency: acc.Concurrency,
 												Timeout:        cfg.FallbackWaitTimeout,
 												MaxWaiting:     cfg.FallbackMaxWaiting,
 											},
 										}, nil
 									}
 									return nil, errors.New("no available accounts")
 								}
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+								func (s *GatewayService) tryAcquireByLegacyOrder(ctx context.Context, candidates []*Account, groupID *int64, sessionHash string, preferOAuth bool) (*AccountSelectionResult, bool) {
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+									ordered := append([]*Account(nil), candidates...)
 									sortAccountsByPriorityAndLastUsed(ordered, preferOAuth)
 									for _, acc := range ordered {
 										result, err := s.tryAcquireAccountSlot(ctx, acc.ID, acc.Concurrency)
 										if err == nil && result.Acquired {
-												feat: 添加5h窗口费用控制和会话数量限制

- 支持Anthropic OAuth/SetupToken账号的5h窗口费用阈值控制
- 支持账号级别的并发会话数量限制
- 使用Redis缓存窗口费用(30秒TTL)减少数据库压力
- 费用计算基于标准费用(不含账号倍率)

											
										
										
											2026-01-16 23:36:52 +08:00
+											// 会话数量限制检查
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+											if !s.checkAndRegisterSession(ctx, acc, sessionHash) {
-												feat: 添加5h窗口费用控制和会话数量限制

- 支持Anthropic OAuth/SetupToken账号的5h窗口费用阈值控制
- 支持账号级别的并发会话数量限制
- 使用Redis缓存窗口费用(30秒TTL)减少数据库压力
- 费用计算基于标准费用(不含账号倍率)

											
										
										
											2026-01-16 23:36:52 +08:00
+												result.ReleaseFunc() // 释放槽位，继续尝试下一个账号
 												continue
 											}
-												fix(gateway): 完善 thinking block 重试和 cache nil 检查

- 使用 FilterThinkingBlocksForRetry 替代 FilterThinkingBlocks
- count_tokens 增加 thinking block 签名错误重试
- cache nil 检查防止空指针
- shouldBill 逻辑修复避免重复扣费
- 移除 debug 日志

											
										
										
											2026-01-03 17:10:25 -08:00
+											if sessionHash != "" && s.cache != nil {
-												feat(groups): add Claude Code client restriction and session isolation

- Add claude_code_only field to restrict groups to Claude Code clients only
- Add fallback_group_id for non-Claude Code requests to use alternate group
- Implement ClaudeCodeValidator for User-Agent detection
- Add group-level session binding isolation (groupID in Redis key)
- Prevent cross-group sticky session pollution
- Update frontend with Claude Code restriction controls

											
										
										
											2026-01-08 23:07:00 +08:00
+												_ = s.cache.SetSessionAccountID(ctx, derefGroupID(groupID), sessionHash, acc.ID, stickySessionTTL)
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+											}
 											return &AccountSelectionResult{
 												Account:     acc,
 												Acquired:    true,
 												ReleaseFunc: result.ReleaseFunc,
 											}, true
 										}
 									}
 									return nil, false
 								}
 								func (s *GatewayService) schedulingConfig() config.GatewaySchedulingConfig {
 									if s.cfg != nil {
 										return s.cfg.Gateway.Scheduling
 									}
 									return config.GatewaySchedulingConfig{
 										StickySessionMaxWaiting:  3,
 										StickySessionWaitTimeout: 45 * time.Second,
 										FallbackWaitTimeout:      30 * time.Second,
 										FallbackMaxWaiting:       100,
 										LoadBatchEnabled:         true,
 										SlotCleanupInterval:      30 * time.Second,
 									}
 								}
-												perf(网关): 复用分组上下文减少热路径查询

新增 GetByIDLite 并在网关与 Gemini 选择流程复用上下文 group，避免 COUNT 触发
更新 API key 中间件注入 group 上下文，减少重复查库
补充 gateway/gemini 中间件与仓库层回归测试

测试: make test

											
										
										
											2026-01-09 23:01:42 +08:00
+								func (s *GatewayService) withGroupContext(ctx context.Context, group *Group) context.Context {
-												fix(分组): 防止降级环并校验上下文分组

- 增加降级链路环检测并拦截配置

- 仅复用合法分组上下文并必要时回退查询

- 标注 GetByIDLite 轻量语义并补充测试

											
										
										
											2026-01-10 07:56:50 +08:00
+									if !IsGroupContextValid(group) {
-												perf(网关): 复用分组上下文减少热路径查询

新增 GetByIDLite 并在网关与 Gemini 选择流程复用上下文 group，避免 COUNT 触发
更新 API key 中间件注入 group 上下文，减少重复查库
补充 gateway/gemini 中间件与仓库层回归测试

测试: make test

											
										
										
											2026-01-09 23:01:42 +08:00
+										return ctx
-												feat(groups): add Claude Code client restriction and session isolation

- Add claude_code_only field to restrict groups to Claude Code clients only
- Add fallback_group_id for non-Claude Code requests to use alternate group
- Implement ClaudeCodeValidator for User-Agent detection
- Add group-level session binding isolation (groupID in Redis key)
- Prevent cross-group sticky session pollution
- Update frontend with Claude Code restriction controls

											
										
										
											2026-01-08 23:07:00 +08:00
+									}
-												fix(分组): 强化上下文分组可信校验

- 引入 Hydrated 标记限制复用来源

- 无效上下文分组允许被新值覆盖自愈

- 更新相关单测覆盖

											
										
										
											2026-01-10 08:40:27 +08:00
+									if existing, ok := ctx.Value(ctxkey.Group).(*Group); ok && existing != nil && existing.ID == group.ID && IsGroupContextValid(existing) {
-												perf(网关): 复用分组上下文减少热路径查询

新增 GetByIDLite 并在网关与 Gemini 选择流程复用上下文 group，避免 COUNT 触发
更新 API key 中间件注入 group 上下文，减少重复查库
补充 gateway/gemini 中间件与仓库层回归测试

测试: make test

											
										
										
											2026-01-09 23:01:42 +08:00
+										return ctx
-												feat(groups): add Claude Code client restriction and session isolation

- Add claude_code_only field to restrict groups to Claude Code clients only
- Add fallback_group_id for non-Claude Code requests to use alternate group
- Implement ClaudeCodeValidator for User-Agent detection
- Add group-level session binding isolation (groupID in Redis key)
- Prevent cross-group sticky session pollution
- Update frontend with Claude Code restriction controls

											
										
										
											2026-01-08 23:07:00 +08:00
+									}
-												perf(网关): 复用分组上下文减少热路径查询

新增 GetByIDLite 并在网关与 Gemini 选择流程复用上下文 group，避免 COUNT 触发
更新 API key 中间件注入 group 上下文，减少重复查库
补充 gateway/gemini 中间件与仓库层回归测试

测试: make test

											
										
										
											2026-01-09 23:01:42 +08:00
+									return context.WithValue(ctx, ctxkey.Group, group)
 								}
-												feat(groups): add Claude Code client restriction and session isolation

- Add claude_code_only field to restrict groups to Claude Code clients only
- Add fallback_group_id for non-Claude Code requests to use alternate group
- Implement ClaudeCodeValidator for User-Agent detection
- Add group-level session binding isolation (groupID in Redis key)
- Prevent cross-group sticky session pollution
- Update frontend with Claude Code restriction controls

											
										
										
											2026-01-08 23:07:00 +08:00
-												perf(网关): 复用分组上下文减少热路径查询

新增 GetByIDLite 并在网关与 Gemini 选择流程复用上下文 group，避免 COUNT 触发
更新 API key 中间件注入 group 上下文，减少重复查库
补充 gateway/gemini 中间件与仓库层回归测试

测试: make test

											
										
										
											2026-01-09 23:01:42 +08:00
+								func (s *GatewayService) groupFromContext(ctx context.Context, groupID int64) *Group {
-												fix(分组): 防止降级环并校验上下文分组

- 增加降级链路环检测并拦截配置

- 仅复用合法分组上下文并必要时回退查询

- 标注 GetByIDLite 轻量语义并补充测试

											
										
										
											2026-01-10 07:56:50 +08:00
+									if group, ok := ctx.Value(ctxkey.Group).(*Group); ok && IsGroupContextValid(group) && group.ID == groupID {
-												perf(网关): 复用分组上下文减少热路径查询

新增 GetByIDLite 并在网关与 Gemini 选择流程复用上下文 group，避免 COUNT 触发
更新 API key 中间件注入 group 上下文，减少重复查库
补充 gateway/gemini 中间件与仓库层回归测试

测试: make test

											
										
										
											2026-01-09 23:01:42 +08:00
+										return group
-												feat(groups): add Claude Code client restriction and session isolation

- Add claude_code_only field to restrict groups to Claude Code clients only
- Add fallback_group_id for non-Claude Code requests to use alternate group
- Implement ClaudeCodeValidator for User-Agent detection
- Add group-level session binding isolation (groupID in Redis key)
- Prevent cross-group sticky session pollution
- Update frontend with Claude Code restriction controls

											
										
										
											2026-01-08 23:07:00 +08:00
+									}
-												perf(网关): 复用分组上下文减少热路径查询

新增 GetByIDLite 并在网关与 Gemini 选择流程复用上下文 group，避免 COUNT 触发
更新 API key 中间件注入 group 上下文，减少重复查库
补充 gateway/gemini 中间件与仓库层回归测试

测试: make test

											
										
										
											2026-01-09 23:01:42 +08:00
+									return nil
 								}
-												feat(groups): add Claude Code client restriction and session isolation

- Add claude_code_only field to restrict groups to Claude Code clients only
- Add fallback_group_id for non-Claude Code requests to use alternate group
- Implement ClaudeCodeValidator for User-Agent detection
- Add group-level session binding isolation (groupID in Redis key)
- Prevent cross-group sticky session pollution
- Update frontend with Claude Code restriction controls

											
										
										
											2026-01-08 23:07:00 +08:00
-												perf(网关): 复用分组上下文减少热路径查询

新增 GetByIDLite 并在网关与 Gemini 选择流程复用上下文 group，避免 COUNT 触发
更新 API key 中间件注入 group 上下文，减少重复查库
补充 gateway/gemini 中间件与仓库层回归测试

测试: make test

											
										
										
											2026-01-09 23:01:42 +08:00
+								func (s *GatewayService) resolveGroupByID(ctx context.Context, groupID int64) (*Group, error) {
 									if group := s.groupFromContext(ctx, groupID); group != nil {
 										return group, nil
 									}
 									group, err := s.groupRepo.GetByIDLite(ctx, groupID)
-												feat(groups): add Claude Code client restriction and session isolation

- Add claude_code_only field to restrict groups to Claude Code clients only
- Add fallback_group_id for non-Claude Code requests to use alternate group
- Implement ClaudeCodeValidator for User-Agent detection
- Add group-level session binding isolation (groupID in Redis key)
- Prevent cross-group sticky session pollution
- Update frontend with Claude Code restriction controls

											
										
										
											2026-01-08 23:07:00 +08:00
+									if err != nil {
 										return nil, fmt.Errorf("get group failed: %w", err)
 									}
-												perf(网关): 复用分组上下文减少热路径查询

新增 GetByIDLite 并在网关与 Gemini 选择流程复用上下文 group，避免 COUNT 触发
更新 API key 中间件注入 group 上下文，减少重复查库
补充 gateway/gemini 中间件与仓库层回归测试

测试: make test

											
										
										
											2026-01-09 23:01:42 +08:00
+									return group, nil
 								}
-												feat(groups): add Claude Code client restriction and session isolation

- Add claude_code_only field to restrict groups to Claude Code clients only
- Add fallback_group_id for non-Claude Code requests to use alternate group
- Implement ClaudeCodeValidator for User-Agent detection
- Add group-level session binding isolation (groupID in Redis key)
- Prevent cross-group sticky session pollution
- Update frontend with Claude Code restriction controls

											
										
										
											2026-01-08 23:07:00 +08:00
-												Add invalid-request fallback routing

											
										
										
											2026-01-23 22:24:46 +08:00
+								func (s *GatewayService) ResolveGroupByID(ctx context.Context, groupID int64) (*Group, error) {
 									return s.resolveGroupByID(ctx, groupID)
 								}
-												feat(group): 添加分组级别模型路由配置功能
  支持为分组配置模型路由规则，可以指定特定模型模式优先使用的账号列表。

  - 新增 model_routing 字段存储路由配置（JSONB格式，支持通配符匹配）

  - 新增 model_routing_enabled 字段控制是否启用路由

  - 更新后端 handler/service/repository 支持路由配置的增删改查

  - 更新前端 GroupsView 添加路由配置界面

  - 添加数据库迁移脚本 040/041

											
										
										
											2026-01-16 17:26:05 +08:00
+								func (s *GatewayService) routingAccountIDsForRequest(ctx context.Context, groupID *int64, requestedModel string, platform string) []int64 {
 									if groupID == nil || requestedModel == "" || platform != PlatformAnthropic {
 										return nil
 									}
 									group, err := s.resolveGroupByID(ctx, *groupID)
 									if err != nil || group == nil {
 										if s.debugModelRoutingEnabled() {
 											log.Printf("[ModelRoutingDebug] resolve group failed: group_id=%v model=%s platform=%s err=%v", derefGroupID(groupID), requestedModel, platform, err)
 										}
 										return nil
 									}
 									// Preserve existing behavior: model routing only applies to anthropic groups.
 									if group.Platform != PlatformAnthropic {
 										if s.debugModelRoutingEnabled() {
 											log.Printf("[ModelRoutingDebug] skip: non-anthropic group platform: group_id=%d group_platform=%s model=%s", group.ID, group.Platform, requestedModel)
 										}
 										return nil
-												feat(groups): add Claude Code client restriction and session isolation

- Add claude_code_only field to restrict groups to Claude Code clients only
- Add fallback_group_id for non-Claude Code requests to use alternate group
- Implement ClaudeCodeValidator for User-Agent detection
- Add group-level session binding isolation (groupID in Redis key)
- Prevent cross-group sticky session pollution
- Update frontend with Claude Code restriction controls

											
										
										
											2026-01-08 23:07:00 +08:00
+									}
-												feat(group): 添加分组级别模型路由配置功能
  支持为分组配置模型路由规则，可以指定特定模型模式优先使用的账号列表。

  - 新增 model_routing 字段存储路由配置（JSONB格式，支持通配符匹配）

  - 新增 model_routing_enabled 字段控制是否启用路由

  - 更新后端 handler/service/repository 支持路由配置的增删改查

  - 更新前端 GroupsView 添加路由配置界面

  - 添加数据库迁移脚本 040/041

											
										
										
											2026-01-16 17:26:05 +08:00
+									ids := group.GetRoutingAccountIDs(requestedModel)
 									if s.debugModelRoutingEnabled() {
 										log.Printf("[ModelRoutingDebug] routing lookup: group_id=%d model=%s enabled=%v rules=%d matched_ids=%v",
 											group.ID, requestedModel, group.ModelRoutingEnabled, len(group.ModelRouting), ids)
 									}
 									return ids
 								}
-												feat(groups): add Claude Code client restriction and session isolation

- Add claude_code_only field to restrict groups to Claude Code clients only
- Add fallback_group_id for non-Claude Code requests to use alternate group
- Implement ClaudeCodeValidator for User-Agent detection
- Add group-level session binding isolation (groupID in Redis key)
- Prevent cross-group sticky session pollution
- Update frontend with Claude Code restriction controls

											
										
										
											2026-01-08 23:07:00 +08:00
-												perf(网关): 复用分组上下文减少热路径查询

新增 GetByIDLite 并在网关与 Gemini 选择流程复用上下文 group，避免 COUNT 触发
更新 API key 中间件注入 group 上下文，减少重复查库
补充 gateway/gemini 中间件与仓库层回归测试

测试: make test

											
										
										
											2026-01-09 23:01:42 +08:00
+								func (s *GatewayService) resolveGatewayGroup(ctx context.Context, groupID *int64) (*Group, *int64, error) {
 									if groupID == nil {
 										return nil, nil, nil
-												feat(groups): add Claude Code client restriction and session isolation

- Add claude_code_only field to restrict groups to Claude Code clients only
- Add fallback_group_id for non-Claude Code requests to use alternate group
- Implement ClaudeCodeValidator for User-Agent detection
- Add group-level session binding isolation (groupID in Redis key)
- Prevent cross-group sticky session pollution
- Update frontend with Claude Code restriction controls

											
										
										
											2026-01-08 23:07:00 +08:00
+									}
-												perf(网关): 复用分组上下文减少热路径查询

新增 GetByIDLite 并在网关与 Gemini 选择流程复用上下文 group，避免 COUNT 触发
更新 API key 中间件注入 group 上下文，减少重复查库
补充 gateway/gemini 中间件与仓库层回归测试

测试: make test

											
										
										
											2026-01-09 23:01:42 +08:00
+									currentID := *groupID
-												fix(分组): 防止降级环并校验上下文分组

- 增加降级链路环检测并拦截配置

- 仅复用合法分组上下文并必要时回退查询

- 标注 GetByIDLite 轻量语义并补充测试

											
										
										
											2026-01-10 07:56:50 +08:00
+									visited := map[int64]struct{}{}
-												perf(网关): 复用分组上下文减少热路径查询

新增 GetByIDLite 并在网关与 Gemini 选择流程复用上下文 group，避免 COUNT 触发
更新 API key 中间件注入 group 上下文，减少重复查库
补充 gateway/gemini 中间件与仓库层回归测试

测试: make test

											
										
										
											2026-01-09 23:01:42 +08:00
+									for {
-												fix(分组): 防止降级环并校验上下文分组

- 增加降级链路环检测并拦截配置

- 仅复用合法分组上下文并必要时回退查询

- 标注 GetByIDLite 轻量语义并补充测试

											
										
										
											2026-01-10 07:56:50 +08:00
+										if _, seen := visited[currentID]; seen {
 											return nil, nil, fmt.Errorf("fallback group cycle detected")
 										}
 										visited[currentID] = struct{}{}
-												perf(网关): 复用分组上下文减少热路径查询

新增 GetByIDLite 并在网关与 Gemini 选择流程复用上下文 group，避免 COUNT 触发
更新 API key 中间件注入 group 上下文，减少重复查库
补充 gateway/gemini 中间件与仓库层回归测试

测试: make test

											
										
										
											2026-01-09 23:01:42 +08:00
+										group, err := s.resolveGroupByID(ctx, currentID)
 										if err != nil {
 											return nil, nil, err
 										}
 										if !group.ClaudeCodeOnly || IsClaudeCodeClient(ctx) {
 											return group, &currentID, nil
 										}
 										if group.FallbackGroupID == nil {
 											return nil, nil, ErrClaudeCodeOnly
 										}
 										currentID = *group.FallbackGroupID
-												feat(groups): add Claude Code client restriction and session isolation

- Add claude_code_only field to restrict groups to Claude Code clients only
- Add fallback_group_id for non-Claude Code requests to use alternate group
- Implement ClaudeCodeValidator for User-Agent detection
- Add group-level session binding isolation (groupID in Redis key)
- Prevent cross-group sticky session pollution
- Update frontend with Claude Code restriction controls

											
										
										
											2026-01-08 23:07:00 +08:00
+									}
-												perf(网关): 复用分组上下文减少热路径查询

新增 GetByIDLite 并在网关与 Gemini 选择流程复用上下文 group，避免 COUNT 触发
更新 API key 中间件注入 group 上下文，减少重复查库
补充 gateway/gemini 中间件与仓库层回归测试

测试: make test

											
										
										
											2026-01-09 23:01:42 +08:00
+								}
-												feat(groups): add Claude Code client restriction and session isolation

- Add claude_code_only field to restrict groups to Claude Code clients only
- Add fallback_group_id for non-Claude Code requests to use alternate group
- Implement ClaudeCodeValidator for User-Agent detection
- Add group-level session binding isolation (groupID in Redis key)
- Prevent cross-group sticky session pollution
- Update frontend with Claude Code restriction controls

											
										
										
											2026-01-08 23:07:00 +08:00
-												perf(网关): 复用分组上下文减少热路径查询

新增 GetByIDLite 并在网关与 Gemini 选择流程复用上下文 group，避免 COUNT 触发
更新 API key 中间件注入 group 上下文，减少重复查库
补充 gateway/gemini 中间件与仓库层回归测试

测试: make test

											
										
										
											2026-01-09 23:01:42 +08:00
+								// checkClaudeCodeRestriction 检查分组的 Claude Code 客户端限制
 								// 如果分组启用了 claude_code_only 且请求不是来自 Claude Code 客户端：
 								//   - 有降级分组：返回降级分组的 ID
 								//   - 无降级分组：返回 ErrClaudeCodeOnly 错误
 								func (s *GatewayService) checkClaudeCodeRestriction(ctx context.Context, groupID *int64) (*Group, *int64, error) {
 									if groupID == nil {
 										return nil, groupID, nil
-												feat(groups): add Claude Code client restriction and session isolation

- Add claude_code_only field to restrict groups to Claude Code clients only
- Add fallback_group_id for non-Claude Code requests to use alternate group
- Implement ClaudeCodeValidator for User-Agent detection
- Add group-level session binding isolation (groupID in Redis key)
- Prevent cross-group sticky session pollution
- Update frontend with Claude Code restriction controls

											
										
										
											2026-01-08 23:07:00 +08:00
+									}
-												perf(网关): 复用分组上下文减少热路径查询

新增 GetByIDLite 并在网关与 Gemini 选择流程复用上下文 group，避免 COUNT 触发
更新 API key 中间件注入 group 上下文，减少重复查库
补充 gateway/gemini 中间件与仓库层回归测试

测试: make test

											
										
										
											2026-01-09 23:01:42 +08:00
+									// 强制平台模式不检查 Claude Code 限制
-												Add invalid-request fallback routing

											
										
										
											2026-01-23 22:24:46 +08:00
+									if forcePlatform, hasForcePlatform := ctx.Value(ctxkey.ForcePlatform).(string); hasForcePlatform && forcePlatform != "" {
-												perf(网关): 复用分组上下文减少热路径查询

新增 GetByIDLite 并在网关与 Gemini 选择流程复用上下文 group，避免 COUNT 触发
更新 API key 中间件注入 group 上下文，减少重复查库
补充 gateway/gemini 中间件与仓库层回归测试

测试: make test

											
										
										
											2026-01-09 23:01:42 +08:00
+										return nil, groupID, nil
-												feat(groups): add Claude Code client restriction and session isolation

- Add claude_code_only field to restrict groups to Claude Code clients only
- Add fallback_group_id for non-Claude Code requests to use alternate group
- Implement ClaudeCodeValidator for User-Agent detection
- Add group-level session binding isolation (groupID in Redis key)
- Prevent cross-group sticky session pollution
- Update frontend with Claude Code restriction controls

											
										
										
											2026-01-08 23:07:00 +08:00
+									}
-												perf(网关): 复用分组上下文减少热路径查询

新增 GetByIDLite 并在网关与 Gemini 选择流程复用上下文 group，避免 COUNT 触发
更新 API key 中间件注入 group 上下文，减少重复查库
补充 gateway/gemini 中间件与仓库层回归测试

测试: make test

											
										
										
											2026-01-09 23:01:42 +08:00
+									group, resolvedID, err := s.resolveGatewayGroup(ctx, groupID)
 									if err != nil {
 										return nil, nil, err
-												feat(groups): add Claude Code client restriction and session isolation

- Add claude_code_only field to restrict groups to Claude Code clients only
- Add fallback_group_id for non-Claude Code requests to use alternate group
- Implement ClaudeCodeValidator for User-Agent detection
- Add group-level session binding isolation (groupID in Redis key)
- Prevent cross-group sticky session pollution
- Update frontend with Claude Code restriction controls

											
										
										
											2026-01-08 23:07:00 +08:00
+									}
-												perf(网关): 复用分组上下文减少热路径查询

新增 GetByIDLite 并在网关与 Gemini 选择流程复用上下文 group，避免 COUNT 触发
更新 API key 中间件注入 group 上下文，减少重复查库
补充 gateway/gemini 中间件与仓库层回归测试

测试: make test

											
										
										
											2026-01-09 23:01:42 +08:00
+									return group, resolvedID, nil
-												feat(groups): add Claude Code client restriction and session isolation

- Add claude_code_only field to restrict groups to Claude Code clients only
- Add fallback_group_id for non-Claude Code requests to use alternate group
- Implement ClaudeCodeValidator for User-Agent detection
- Add group-level session binding isolation (groupID in Redis key)
- Prevent cross-group sticky session pollution
- Update frontend with Claude Code restriction controls

											
										
										
											2026-01-08 23:07:00 +08:00
+								}
-												perf(网关): 复用分组上下文减少热路径查询

新增 GetByIDLite 并在网关与 Gemini 选择流程复用上下文 group，避免 COUNT 触发
更新 API key 中间件注入 group 上下文，减少重复查库
补充 gateway/gemini 中间件与仓库层回归测试

测试: make test

											
										
										
											2026-01-09 23:01:42 +08:00
+								func (s *GatewayService) resolvePlatform(ctx context.Context, groupID *int64, group *Group) (string, bool, error) {
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+									forcePlatform, hasForcePlatform := ctx.Value(ctxkey.ForcePlatform).(string)
 									if hasForcePlatform && forcePlatform != "" {
 										return forcePlatform, true, nil
 									}
-												perf(网关): 复用分组上下文减少热路径查询

新增 GetByIDLite 并在网关与 Gemini 选择流程复用上下文 group，避免 COUNT 触发
更新 API key 中间件注入 group 上下文，减少重复查库
补充 gateway/gemini 中间件与仓库层回归测试

测试: make test

											
										
										
											2026-01-09 23:01:42 +08:00
+									if group != nil {
 										return group.Platform, false, nil
 									}
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+									if groupID != nil {
-												perf(网关): 复用分组上下文减少热路径查询

新增 GetByIDLite 并在网关与 Gemini 选择流程复用上下文 group，避免 COUNT 触发
更新 API key 中间件注入 group 上下文，减少重复查库
补充 gateway/gemini 中间件与仓库层回归测试

测试: make test

											
										
										
											2026-01-09 23:01:42 +08:00
+										group, err := s.resolveGroupByID(ctx, *groupID)
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+										if err != nil {
-												perf(网关): 复用分组上下文减少热路径查询

新增 GetByIDLite 并在网关与 Gemini 选择流程复用上下文 group，避免 COUNT 触发
更新 API key 中间件注入 group 上下文，减少重复查库
补充 gateway/gemini 中间件与仓库层回归测试

测试: make test

											
										
										
											2026-01-09 23:01:42 +08:00
+											return "", false, err
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+										}
 										return group.Platform, false, nil
 									}
 									return PlatformAnthropic, false, nil
 								}
 								func (s *GatewayService) listSchedulableAccounts(ctx context.Context, groupID *int64, platform string, hasForcePlatform bool) ([]Account, bool, error) {
-												feat(scheduler): 引入调度快照缓存与 outbox 回放

- 调度热路径优先读 Redis 快照，保留分组排序语义
- outbox 回放 + 全量重建纠偏，失败重试不推进水位
- 自动 Atlas 基线对齐并同步调度配置示例

											
										
										
											2026-01-12 14:19:06 +08:00
+									if s.schedulerSnapshot != nil {
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+										accounts, useMixed, err := s.schedulerSnapshot.ListSchedulableAccounts(ctx, groupID, platform, hasForcePlatform)
 										if err == nil {
 											slog.Debug("account_scheduling_list_snapshot",
 												"group_id", derefGroupID(groupID),
 												"platform", platform,
 												"use_mixed", useMixed,
 												"count", len(accounts))
 											for _, acc := range accounts {
 												slog.Debug("account_scheduling_account_detail",
 													"account_id", acc.ID,
 													"name", acc.Name,
 													"platform", acc.Platform,
 													"type", acc.Type,
 													"status", acc.Status,
 													"tls_fingerprint", acc.IsTLSFingerprintEnabled())
 											}
 										}
 										return accounts, useMixed, err
-												feat(scheduler): 引入调度快照缓存与 outbox 回放

- 调度热路径优先读 Redis 快照，保留分组排序语义
- outbox 回放 + 全量重建纠偏，失败重试不推进水位
- 自动 Atlas 基线对齐并同步调度配置示例

											
										
										
											2026-01-12 14:19:06 +08:00
+									}
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+									useMixed := (platform == PlatformAnthropic || platform == PlatformGemini) && !hasForcePlatform
 									if useMixed {
 										platforms := []string{platform, PlatformAntigravity}
 										var accounts []Account
 										var err error
 										if groupID != nil {
 											accounts, err = s.accountRepo.ListSchedulableByGroupIDAndPlatforms(ctx, *groupID, platforms)
 										} else {
 											accounts, err = s.accountRepo.ListSchedulableByPlatforms(ctx, platforms)
 										}
 										if err != nil {
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+											slog.Debug("account_scheduling_list_failed",
 												"group_id", derefGroupID(groupID),
 												"platform", platform,
 												"error", err)
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+											return nil, useMixed, err
 										}
 										filtered := make([]Account, 0, len(accounts))
 										for _, acc := range accounts {
 											if acc.Platform == PlatformAntigravity && !acc.IsMixedSchedulingEnabled() {
 												continue
 											}
 											filtered = append(filtered, acc)
 										}
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+										slog.Debug("account_scheduling_list_mixed",
 											"group_id", derefGroupID(groupID),
 											"platform", platform,
 											"raw_count", len(accounts),
 											"filtered_count", len(filtered))
 										for _, acc := range filtered {
 											slog.Debug("account_scheduling_account_detail",
 												"account_id", acc.ID,
 												"name", acc.Name,
 												"platform", acc.Platform,
 												"type", acc.Type,
 												"status", acc.Status,
 												"tls_fingerprint", acc.IsTLSFingerprintEnabled())
 										}
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+										return filtered, useMixed, nil
 									}
 									var accounts []Account
 									var err error
 									if s.cfg != nil && s.cfg.RunMode == config.RunModeSimple {
 										accounts, err = s.accountRepo.ListSchedulableByPlatform(ctx, platform)
 									} else if groupID != nil {
 										accounts, err = s.accountRepo.ListSchedulableByGroupIDAndPlatform(ctx, *groupID, platform)
-												fix(gateway): 修复账号跨分组调度问题

问题：账号可能被调度到未分配的分组（如 simon 账号被调度到 claude_default）

根因：
- 强制平台模式下分组查询失败时回退到全平台查询
- listSchedulableAccounts 中分组为空时回退到无分组查询
- 粘性会话只检查平台匹配，未校验账号分组归属

修复：
- 移除强制平台模式的回退逻辑，分组内无账号时返回错误
- 移除 listSchedulableAccounts 的回退逻辑
- 新增 isAccountInGroup 方法用于分组校验
- 在三处粘性会话检查中增加分组归属验证

											
										
										
											2026-01-07 10:56:52 +08:00
+										// 分组内无账号则返回空列表，由上层处理错误，不再回退到全平台查询
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+									} else {
 										accounts, err = s.accountRepo.ListSchedulableByPlatform(ctx, platform)
 									}
 									if err != nil {
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+										slog.Debug("account_scheduling_list_failed",
 											"group_id", derefGroupID(groupID),
 											"platform", platform,
 											"error", err)
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+										return nil, useMixed, err
 									}
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+									slog.Debug("account_scheduling_list_single",
 										"group_id", derefGroupID(groupID),
 										"platform", platform,
 										"count", len(accounts))
 									for _, acc := range accounts {
 										slog.Debug("account_scheduling_account_detail",
 											"account_id", acc.ID,
 											"name", acc.Name,
 											"platform", acc.Platform,
 											"type", acc.Type,
 											"status", acc.Status,
 											"tls_fingerprint", acc.IsTLSFingerprintEnabled())
 									}
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+									return accounts, useMixed, nil
 								}
 								func (s *GatewayService) isAccountAllowedForPlatform(account *Account, platform string, useMixed bool) bool {
 									if account == nil {
 										return false
 									}
 									if useMixed {
 										if account.Platform == platform {
 											return true
 										}
 										return account.Platform == PlatformAntigravity && account.IsMixedSchedulingEnabled()
 									}
 									return account.Platform == platform
 								}
-												fix(gateway): 修复账号跨分组调度问题

问题：账号可能被调度到未分配的分组（如 simon 账号被调度到 claude_default）

根因：
- 强制平台模式下分组查询失败时回退到全平台查询
- listSchedulableAccounts 中分组为空时回退到无分组查询
- 粘性会话只检查平台匹配，未校验账号分组归属

修复：
- 移除强制平台模式的回退逻辑，分组内无账号时返回错误
- 移除 listSchedulableAccounts 的回退逻辑
- 新增 isAccountInGroup 方法用于分组校验
- 在三处粘性会话检查中增加分组归属验证

											
										
										
											2026-01-07 10:56:52 +08:00
+								// isAccountInGroup checks if the account belongs to the specified group.
 								// Returns true if groupID is nil (no group restriction) or account belongs to the group.
 								func (s *GatewayService) isAccountInGroup(account *Account, groupID *int64) bool {
 									if groupID == nil {
 										return true // 无分组限制
 									}
 									if account == nil {
 										return false
 									}
 									for _, ag := range account.AccountGroups {
 										if ag.GroupID == *groupID {
 											return true
 										}
 									}
 									return false
 								}
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+								func (s *GatewayService) tryAcquireAccountSlot(ctx context.Context, accountID int64, maxConcurrency int) (*AcquireResult, error) {
 									if s.concurrencyService == nil {
 										return &AcquireResult{Acquired: true, ReleaseFunc: func() {}}, nil
 									}
 									return s.concurrencyService.AcquireAccountSlot(ctx, accountID, maxConcurrency)
 								}
-												feat: 添加5h窗口费用控制和会话数量限制

- 支持Anthropic OAuth/SetupToken账号的5h窗口费用阈值控制
- 支持账号级别的并发会话数量限制
- 使用Redis缓存窗口费用(30秒TTL)减少数据库压力
- 费用计算基于标准费用(不含账号倍率)

											
										
										
											2026-01-16 23:36:52 +08:00
+								// isAccountSchedulableForWindowCost 检查账号是否可根据窗口费用进行调度
 								// 仅适用于 Anthropic OAuth/SetupToken 账号
 								// 返回 true 表示可调度，false 表示不可调度
 								func (s *GatewayService) isAccountSchedulableForWindowCost(ctx context.Context, account *Account, isSticky bool) bool {
 									// 只检查 Anthropic OAuth/SetupToken 账号
 									if !account.IsAnthropicOAuthOrSetupToken() {
 										return true
 									}
 									limit := account.GetWindowCostLimit()
 									if limit <= 0 {
 										return true // 未启用窗口费用限制
 									}
 									// 尝试从缓存获取窗口费用
 									var currentCost float64
 									if s.sessionLimitCache != nil {
 										if cost, hit, err := s.sessionLimitCache.GetWindowCost(ctx, account.ID); err == nil && hit {
 											currentCost = cost
 											goto checkSchedulability
 										}
 									}
 									// 缓存未命中，从数据库查询
 									{
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+										// 使用统一的窗口开始时间计算逻辑（考虑窗口过期情况）
 										startTime := account.GetCurrentWindowStartTime()
-												feat: 添加5h窗口费用控制和会话数量限制

- 支持Anthropic OAuth/SetupToken账号的5h窗口费用阈值控制
- 支持账号级别的并发会话数量限制
- 使用Redis缓存窗口费用(30秒TTL)减少数据库压力
- 费用计算基于标准费用(不含账号倍率)

											
										
										
											2026-01-16 23:36:52 +08:00
 										stats, err := s.usageLogRepo.GetAccountWindowStats(ctx, account.ID, startTime)
 										if err != nil {
 											// 失败开放：查询失败时允许调度
 											return true
 										}
 										// 使用标准费用（不含账号倍率）
 										currentCost = stats.StandardCost
 										// 设置缓存（忽略错误）
 										if s.sessionLimitCache != nil {
 											_ = s.sessionLimitCache.SetWindowCost(ctx, account.ID, currentCost)
 										}
 									}
 								checkSchedulability:
 									schedulability := account.CheckWindowCostSchedulability(currentCost)
 									switch schedulability {
 									case WindowCostSchedulable:
 										return true
 									case WindowCostStickyOnly:
 										return isSticky
 									case WindowCostNotSchedulable:
 										return false
 									}
 									return true
 								}
 								// checkAndRegisterSession 检查并注册会话，用于会话数量限制
 								// 仅适用于 Anthropic OAuth/SetupToken 账号
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+								// sessionID: 会话标识符（使用粘性会话的 hash）
-												feat: 添加5h窗口费用控制和会话数量限制

- 支持Anthropic OAuth/SetupToken账号的5h窗口费用阈值控制
- 支持账号级别的并发会话数量限制
- 使用Redis缓存窗口费用(30秒TTL)减少数据库压力
- 费用计算基于标准费用(不含账号倍率)

											
										
										
											2026-01-16 23:36:52 +08:00
+								// 返回 true 表示允许（在限制内或会话已存在），false 表示拒绝（超出限制且是新会话）
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+								func (s *GatewayService) checkAndRegisterSession(ctx context.Context, account *Account, sessionID string) bool {
-												feat: 添加5h窗口费用控制和会话数量限制

- 支持Anthropic OAuth/SetupToken账号的5h窗口费用阈值控制
- 支持账号级别的并发会话数量限制
- 使用Redis缓存窗口费用(30秒TTL)减少数据库压力
- 费用计算基于标准费用(不含账号倍率)

											
										
										
											2026-01-16 23:36:52 +08:00
+									// 只检查 Anthropic OAuth/SetupToken 账号
 									if !account.IsAnthropicOAuthOrSetupToken() {
 										return true
 									}
 									maxSessions := account.GetMaxSessions()
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+									if maxSessions <= 0 || sessionID == "" {
-												feat: 添加5h窗口费用控制和会话数量限制

- 支持Anthropic OAuth/SetupToken账号的5h窗口费用阈值控制
- 支持账号级别的并发会话数量限制
- 使用Redis缓存窗口费用(30秒TTL)减少数据库压力
- 费用计算基于标准费用(不含账号倍率)

											
										
										
											2026-01-16 23:36:52 +08:00
+										return true // 未启用会话限制或无会话ID
 									}
 									if s.sessionLimitCache == nil {
 										return true // 缓存不可用时允许通过
 									}
 									idleTimeout := time.Duration(account.GetSessionIdleTimeoutMinutes()) * time.Minute
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+									allowed, err := s.sessionLimitCache.RegisterSession(ctx, account.ID, sessionID, maxSessions, idleTimeout)
-												feat: 添加5h窗口费用控制和会话数量限制

- 支持Anthropic OAuth/SetupToken账号的5h窗口费用阈值控制
- 支持账号级别的并发会话数量限制
- 使用Redis缓存窗口费用(30秒TTL)减少数据库压力
- 费用计算基于标准费用(不含账号倍率)

											
										
										
											2026-01-16 23:36:52 +08:00
+									if err != nil {
 										// 失败开放：缓存错误时允许通过
 										return true
 									}
 									return allowed
 								}
-												feat(scheduler): 引入调度快照缓存与 outbox 回放

- 调度热路径优先读 Redis 快照，保留分组排序语义
- outbox 回放 + 全量重建纠偏，失败重试不推进水位
- 自动 Atlas 基线对齐并同步调度配置示例

											
										
										
											2026-01-12 14:19:06 +08:00
+								func (s *GatewayService) getSchedulableAccount(ctx context.Context, accountID int64) (*Account, error) {
 									if s.schedulerSnapshot != nil {
 										return s.schedulerSnapshot.GetAccount(ctx, accountID)
 									}
 									return s.accountRepo.GetByID(ctx, accountID)
 								}
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+								func sortAccountsByPriorityAndLastUsed(accounts []*Account, preferOAuth bool) {
 									sort.SliceStable(accounts, func(i, j int) bool {
 										a, b := accounts[i], accounts[j]
 										if a.Priority != b.Priority {
 											return a.Priority < b.Priority
 										}
 										switch {
 										case a.LastUsedAt == nil && b.LastUsedAt != nil:
 											return true
 										case a.LastUsedAt != nil && b.LastUsedAt == nil:
 											return false
 										case a.LastUsedAt == nil && b.LastUsedAt == nil:
 											if preferOAuth && a.Type != b.Type {
 												return a.Type == AccountTypeOAuth
 											}
 											return false
 										default:
 											return a.LastUsedAt.Before(*b.LastUsedAt)
 										}
 									})
 								}
-												feat(scheduling): 兜底层账户选择策略可配置

- gateway.scheduling.fallback_selection_mode: "last_used"(默认) 或 "random"
- last_used: 按最后使用时间排序（轮询效果）
- random: 同优先级内随机选择

											
										
										
											2026-01-16 20:47:07 +08:00
+								// sortCandidatesForFallback 根据配置选择排序策略
 								// mode: "last_used"(按最后使用时间) 或 "random"(随机)
 								func (s *GatewayService) sortCandidatesForFallback(accounts []*Account, preferOAuth bool, mode string) {
 									if mode == "random" {
 										// 先按优先级排序，然后在同优先级内随机打乱
 										sortAccountsByPriorityOnly(accounts, preferOAuth)
 										shuffleWithinPriority(accounts)
 									} else {
 										// 默认按最后使用时间排序
 										sortAccountsByPriorityAndLastUsed(accounts, preferOAuth)
 									}
 								}
 								// sortAccountsByPriorityOnly 仅按优先级排序
 								func sortAccountsByPriorityOnly(accounts []*Account, preferOAuth bool) {
 									sort.SliceStable(accounts, func(i, j int) bool {
 										a, b := accounts[i], accounts[j]
 										if a.Priority != b.Priority {
 											return a.Priority < b.Priority
 										}
 										if preferOAuth && a.Type != b.Type {
 											return a.Type == AccountTypeOAuth
 										}
 										return false
 									})
 								}
 								// shuffleWithinPriority 在同优先级内随机打乱顺序
 								func shuffleWithinPriority(accounts []*Account) {
 									if len(accounts) <= 1 {
 										return
 									}
 									r := mathrand.New(mathrand.NewSource(time.Now().UnixNano()))
 									start := 0
 									for start < len(accounts) {
 										priority := accounts[start].Priority
 										end := start + 1
 										for end < len(accounts) && accounts[end].Priority == priority {
 											end++
 										}
 										// 对 [start, end) 范围内的账户随机打乱
 										if end-start > 1 {
 											r.Shuffle(end-start, func(i, j int) {
 												accounts[start+i], accounts[start+j] = accounts[start+j], accounts[start+i]
 											})
 										}
 										start = end
 									}
 								}
-												feat(antigravity): 添加混合调度可选功能

- 后端：账户模型添加 IsMixedSchedulingEnabled() 方法，读取 extra.mixed_scheduling
- 后端：gateway_service 和 gemini_messages_compat_service 支持混合调度逻辑
- 后端：分组创建支持指定 platform 参数
- 前端：账户创建/编辑弹窗添加混合调度开关（仅 antigravity 账户显示）
- 前端：混合调度开关添加问号图标和 tooltip 说明
- 前端：GroupSelector 支持根据 mixedScheduling 属性过滤分组
- 前端：分组创建支持选择 platform
- 测试：e2e 测试添加 ENDPOINT_PREFIX 环境变量支持混合/隔离模式测试
- 测试：删除过时的 Claude signature 测试用例

											
										
										
											2025-12-29 09:44:39 +08:00
+								// selectAccountForModelWithPlatform 选择单平台账户（完全隔离）
 								func (s *GatewayService) selectAccountForModelWithPlatform(ctx context.Context, groupID *int64, sessionHash string, requestedModel string, excludedIDs map[int64]struct{}, platform string) (*Account, error) {
-												chore: apply stashed changes

											
										
										
											2026-02-02 22:20:08 +08:00
+									// 对 Antigravity 平台，检查请求的模型系列是否在分组支持范围内
 									if platform == PlatformAntigravity && groupID != nil && requestedModel != "" {
 										if err := s.checkAntigravityModelScope(ctx, *groupID, requestedModel); err != nil {
 											return nil, err
 										}
 									}
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+									preferOAuth := platform == PlatformGemini
-												feat(group): 添加分组级别模型路由配置功能
  支持为分组配置模型路由规则，可以指定特定模型模式优先使用的账号列表。

  - 新增 model_routing 字段存储路由配置（JSONB格式，支持通配符匹配）

  - 新增 model_routing_enabled 字段控制是否启用路由

  - 更新后端 handler/service/repository 支持路由配置的增删改查

  - 更新前端 GroupsView 添加路由配置界面

  - 添加数据库迁移脚本 040/041

											
										
										
											2026-01-16 17:26:05 +08:00
+									routingAccountIDs := s.routingAccountIDsForRequest(ctx, groupID, requestedModel, platform)
 									var accounts []Account
 									accountsLoaded := false
 									// ============ Model Routing (legacy path): apply before sticky session ============
 									// When load-awareness is disabled (e.g. concurrency service not configured), we still honor model routing
 									// so switching model can switch upstream account within the same sticky session.
 									if len(routingAccountIDs) > 0 {
 										if s.debugModelRoutingEnabled() {
 											log.Printf("[ModelRoutingDebug] legacy routed begin: group_id=%v model=%s platform=%s session=%s routed_ids=%v",
 												derefGroupID(groupID), requestedModel, platform, shortSessionHash(sessionHash), routingAccountIDs)
 										}
 										// 1) Sticky session only applies if the bound account is within the routing set.
 										if sessionHash != "" && s.cache != nil {
 											accountID, err := s.cache.GetSessionAccountID(ctx, derefGroupID(groupID), sessionHash)
 											if err == nil && accountID > 0 && containsInt64(routingAccountIDs, accountID) {
 												if _, excluded := excludedIDs[accountID]; !excluded {
 													account, err := s.getSchedulableAccount(ctx, accountID)
 													// 检查账号分组归属和平台匹配（确保粘性会话不会跨分组或跨平台）
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+													if err == nil {
 														clearSticky := shouldClearStickySession(account)
 														if clearSticky {
 															_ = s.cache.DeleteSessionAccountID(ctx, derefGroupID(groupID), sessionHash)
-												feat(group): 添加分组级别模型路由配置功能
  支持为分组配置模型路由规则，可以指定特定模型模式优先使用的账号列表。

  - 新增 model_routing 字段存储路由配置（JSONB格式，支持通配符匹配）

  - 新增 model_routing_enabled 字段控制是否启用路由

  - 更新后端 handler/service/repository 支持路由配置的增删改查

  - 更新前端 GroupsView 添加路由配置界面

  - 添加数据库迁移脚本 040/041

											
										
										
											2026-01-16 17:26:05 +08:00
+														}
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+														if !clearSticky && s.isAccountInGroup(account, groupID) && account.Platform == platform && account.IsSchedulableForModel(requestedModel) && (requestedModel == "" || s.isModelSupportedByAccount(account, requestedModel)) {
 															if err := s.cache.RefreshSessionTTL(ctx, derefGroupID(groupID), sessionHash, stickySessionTTL); err != nil {
 																log.Printf("refresh session ttl failed: session=%s err=%v", sessionHash, err)
 															}
 															if s.debugModelRoutingEnabled() {
 																log.Printf("[ModelRoutingDebug] legacy routed sticky hit: group_id=%v model=%s session=%s account=%d", derefGroupID(groupID), requestedModel, shortSessionHash(sessionHash), accountID)
 															}
 															return account, nil
-												feat(group): 添加分组级别模型路由配置功能
  支持为分组配置模型路由规则，可以指定特定模型模式优先使用的账号列表。

  - 新增 model_routing 字段存储路由配置（JSONB格式，支持通配符匹配）

  - 新增 model_routing_enabled 字段控制是否启用路由

  - 更新后端 handler/service/repository 支持路由配置的增删改查

  - 更新前端 GroupsView 添加路由配置界面

  - 添加数据库迁移脚本 040/041

											
										
										
											2026-01-16 17:26:05 +08:00
+														}
 													}
 												}
 											}
 										}
 										// 2) Select an account from the routed candidates.
 										forcePlatform, hasForcePlatform := ctx.Value(ctxkey.ForcePlatform).(string)
 										if hasForcePlatform && forcePlatform == "" {
 											hasForcePlatform = false
 										}
 										var err error
 										accounts, _, err = s.listSchedulableAccounts(ctx, groupID, platform, hasForcePlatform)
 										if err != nil {
 											return nil, fmt.Errorf("query accounts failed: %w", err)
 										}
 										accountsLoaded = true
 										routingSet := make(map[int64]struct{}, len(routingAccountIDs))
 										for _, id := range routingAccountIDs {
 											if id > 0 {
 												routingSet[id] = struct{}{}
 											}
 										}
 										var selected *Account
 										for i := range accounts {
 											acc := &accounts[i]
 											if _, ok := routingSet[acc.ID]; !ok {
 												continue
 											}
 											if _, excluded := excludedIDs[acc.ID]; excluded {
 												continue
 											}
 											// Scheduler snapshots can be temporarily stale; re-check schedulability here to
 											// avoid selecting accounts that were recently rate-limited/overloaded.
 											if !acc.IsSchedulable() {
 												continue
 											}
 											if !acc.IsSchedulableForModel(requestedModel) {
 												continue
 											}
 											if requestedModel != "" && !s.isModelSupportedByAccount(acc, requestedModel) {
 												continue
 											}
 											if selected == nil {
 												selected = acc
 												continue
 											}
 											if acc.Priority < selected.Priority {
 												selected = acc
 											} else if acc.Priority == selected.Priority {
 												switch {
 												case acc.LastUsedAt == nil && selected.LastUsedAt != nil:
 													selected = acc
 												case acc.LastUsedAt != nil && selected.LastUsedAt == nil:
 													// keep selected (never used is preferred)
 												case acc.LastUsedAt == nil && selected.LastUsedAt == nil:
 													if preferOAuth && acc.Type != selected.Type && acc.Type == AccountTypeOAuth {
 														selected = acc
 													}
 												default:
 													if acc.LastUsedAt.Before(*selected.LastUsedAt) {
 														selected = acc
 													}
 												}
 											}
 										}
 										if selected != nil {
 											if sessionHash != "" && s.cache != nil {
 												if err := s.cache.SetSessionAccountID(ctx, derefGroupID(groupID), sessionHash, selected.ID, stickySessionTTL); err != nil {
 													log.Printf("set session account failed: session=%s account_id=%d err=%v", sessionHash, selected.ID, err)
 												}
 											}
 											if s.debugModelRoutingEnabled() {
 												log.Printf("[ModelRoutingDebug] legacy routed select: group_id=%v model=%s session=%s account=%d", derefGroupID(groupID), requestedModel, shortSessionHash(sessionHash), selected.ID)
 											}
 											return selected, nil
 										}
 										log.Printf("[ModelRouting] No routed accounts available for model=%s, falling back to normal selection", requestedModel)
 									}
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									// 1. 查询粘性会话
-												fix(gateway): 完善 thinking block 重试和 cache nil 检查

- 使用 FilterThinkingBlocksForRetry 替代 FilterThinkingBlocks
- count_tokens 增加 thinking block 签名错误重试
- cache nil 检查防止空指针
- shouldBill 逻辑修复避免重复扣费
- 移除 debug 日志

											
										
										
											2026-01-03 17:10:25 -08:00
+									if sessionHash != "" && s.cache != nil {
-												feat(groups): add Claude Code client restriction and session isolation

- Add claude_code_only field to restrict groups to Claude Code clients only
- Add fallback_group_id for non-Claude Code requests to use alternate group
- Implement ClaudeCodeValidator for User-Agent detection
- Add group-level session binding isolation (groupID in Redis key)
- Prevent cross-group sticky session pollution
- Update frontend with Claude Code restriction controls

											
										
										
											2026-01-08 23:07:00 +08:00
+										accountID, err := s.cache.GetSessionAccountID(ctx, derefGroupID(groupID), sessionHash)
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+										if err == nil && accountID > 0 {
-												feat: cc/codex support account retry

											
										
										
											2025-12-27 11:44:00 +08:00
+											if _, excluded := excludedIDs[accountID]; !excluded {
-												feat(scheduler): 引入调度快照缓存与 outbox 回放

- 调度热路径优先读 Redis 快照，保留分组排序语义
- outbox 回放 + 全量重建纠偏，失败重试不推进水位
- 自动 Atlas 基线对齐并同步调度配置示例

											
										
										
											2026-01-12 14:19:06 +08:00
+												account, err := s.getSchedulableAccount(ctx, accountID)
-												fix(gateway): 修复账号跨分组调度问题

问题：账号可能被调度到未分配的分组（如 simon 账号被调度到 claude_default）

根因：
- 强制平台模式下分组查询失败时回退到全平台查询
- listSchedulableAccounts 中分组为空时回退到无分组查询
- 粘性会话只检查平台匹配，未校验账号分组归属

修复：
- 移除强制平台模式的回退逻辑，分组内无账号时返回错误
- 移除 listSchedulableAccounts 的回退逻辑
- 新增 isAccountInGroup 方法用于分组校验
- 在三处粘性会话检查中增加分组归属验证

											
										
										
											2026-01-07 10:56:52 +08:00
+												// 检查账号分组归属和平台匹配（确保粘性会话不会跨分组或跨平台）
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+												if err == nil {
 													clearSticky := shouldClearStickySession(account)
 													if clearSticky {
 														_ = s.cache.DeleteSessionAccountID(ctx, derefGroupID(groupID), sessionHash)
 													}
 													if !clearSticky && s.isAccountInGroup(account, groupID) && account.Platform == platform && account.IsSchedulableForModel(requestedModel) && (requestedModel == "" || s.isModelSupportedByAccount(account, requestedModel)) {
 														if err := s.cache.RefreshSessionTTL(ctx, derefGroupID(groupID), sessionHash, stickySessionTTL); err != nil {
 															log.Printf("refresh session ttl failed: session=%s err=%v", sessionHash, err)
 														}
 														return account, nil
-												feat: cc/codex support account retry

											
										
										
											2025-12-27 11:44:00 +08:00
+													}
-												ci(backend): 添加 github actions (#10)

## 变更内容

### CI/CD
- 添加 GitHub Actions 工作流（test + golangci-lint）
- 添加 golangci-lint 配置，启用 errcheck/govet/staticcheck/unused/depguard
- 通过 depguard 强制 service 层不能直接导入 repository

### 错误处理修复
- 修复 CSV 写入、SSE 流式输出、随机数生成等未处理的错误
- GenerateRedeemCode() 现在返回 error

### 资源泄露修复
- 统一使用 defer func() { _ = xxx.Close() }() 模式

### 代码清理
- 移除未使用的常量
- 简化 nil map 检查
- 统一代码格式
											
										
										
											2025-12-20 15:29:52 +08:00
+												}
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+											}
 										}
 									}
-												feat(antigravity): 添加混合调度可选功能

- 后端：账户模型添加 IsMixedSchedulingEnabled() 方法，读取 extra.mixed_scheduling
- 后端：gateway_service 和 gemini_messages_compat_service 支持混合调度逻辑
- 后端：分组创建支持指定 platform 参数
- 前端：账户创建/编辑弹窗添加混合调度开关（仅 antigravity 账户显示）
- 前端：混合调度开关添加问号图标和 tooltip 说明
- 前端：GroupSelector 支持根据 mixedScheduling 属性过滤分组
- 前端：分组创建支持选择 platform
- 测试：e2e 测试添加 ENDPOINT_PREFIX 环境变量支持混合/隔离模式测试
- 测试：删除过时的 Claude signature 测试用例

											
										
										
											2025-12-29 09:44:39 +08:00
+									// 2. 获取可调度账号列表（单平台）
-												feat(group): 添加分组级别模型路由配置功能
  支持为分组配置模型路由规则，可以指定特定模型模式优先使用的账号列表。

  - 新增 model_routing 字段存储路由配置（JSONB格式，支持通配符匹配）

  - 新增 model_routing_enabled 字段控制是否启用路由

  - 更新后端 handler/service/repository 支持路由配置的增删改查

  - 更新前端 GroupsView 添加路由配置界面

  - 添加数据库迁移脚本 040/041

											
										
										
											2026-01-16 17:26:05 +08:00
+									if !accountsLoaded {
 										forcePlatform, hasForcePlatform := ctx.Value(ctxkey.ForcePlatform).(string)
 										if hasForcePlatform && forcePlatform == "" {
 											hasForcePlatform = false
 										}
 										var err error
 										accounts, _, err = s.listSchedulableAccounts(ctx, groupID, platform, hasForcePlatform)
 										if err != nil {
 											return nil, fmt.Errorf("query accounts failed: %w", err)
 										}
-												feat(antigravity): 添加混合调度可选功能

- 后端：账户模型添加 IsMixedSchedulingEnabled() 方法，读取 extra.mixed_scheduling
- 后端：gateway_service 和 gemini_messages_compat_service 支持混合调度逻辑
- 后端：分组创建支持指定 platform 参数
- 前端：账户创建/编辑弹窗添加混合调度开关（仅 antigravity 账户显示）
- 前端：混合调度开关添加问号图标和 tooltip 说明
- 前端：GroupSelector 支持根据 mixedScheduling 属性过滤分组
- 前端：分组创建支持选择 platform
- 测试：e2e 测试添加 ENDPOINT_PREFIX 环境变量支持混合/隔离模式测试
- 测试：删除过时的 Claude signature 测试用例

											
										
										
											2025-12-29 09:44:39 +08:00
+									}
 									// 3. 按优先级+最久未用选择（考虑模型支持）
 									var selected *Account
 									for i := range accounts {
 										acc := &accounts[i]
 										if _, excluded := excludedIDs[acc.ID]; excluded {
 											continue
 										}
-												fix(网关): 修复账号选择中的调度器快照延迟问题

## 问题描述
调度器快照更新存在0.5-1秒的延迟（Outbox轮询间隔），导致在账号被限流或过载后的短时间窗口内，
可能仍会被选中，造成请求失败。

## 根本原因
账号选择逻辑依赖调度器快照（listSchedulableAccounts），但快照更新有延迟：
- Outbox轮询: 每1秒检查一次变更事件
- 全量重建: 每300秒重建一次
- 时间窗口: 账号状态变更后0.5-1秒内，快照可能未更新

## 解决方案
在账号选择循环中添加IsSchedulable()实时检查，作为第二道防线：
1. 第一道防线: 调度器快照过滤（可能有延迟）
2. 第二道防线: IsSchedulable()实时检查（本次修复）

IsSchedulable()会检查：
- RateLimitResetAt: 限流重置时间
- OverloadUntil: 过载持续时间
- TempUnschedulableUntil: 临时不可调度时间
- Status: 账号状态
- Schedulable: 可调度标志

## 修改范围
### OpenAI Gateway Service
- SelectAccountForModelWithExclusions: 添加IsSchedulable()检查
- SelectAccountWithLoadAwareness: 添加IsSchedulable()检查

### Gateway Service (Claude/Gemini/Antigravity)
- 负载感知选择候选账号筛选: 添加IsSchedulable()检查
- selectAccountForModelWithPlatform: 添加IsSchedulable()检查
- selectAccountWithMixedScheduling: 添加IsSchedulable()检查

### 测试用例
- OpenAI: 添加2个测试用例验证限流账号过滤
- Gateway: 添加2个测试用例验证限流和过载账号过滤

### 其他修复
- ops_repo_preagg.go: 修复platform为NULL时的聚合问题

## 测试结果
所有单元测试通过 ✅

											
										
										
											2026-01-13 22:49:26 -08:00
+										// Scheduler snapshots can be temporarily stale; re-check schedulability here to
 										// avoid selecting accounts that were recently rate-limited/overloaded.
 										if !acc.IsSchedulable() {
 											continue
 										}
-												feat: antigravity 配额域限流

											
										
										
											2026-01-09 17:35:02 +08:00
+										if !acc.IsSchedulableForModel(requestedModel) {
 											continue
 										}
-												feat(antigravity): 添加混合调度可选功能

- 后端：账户模型添加 IsMixedSchedulingEnabled() 方法，读取 extra.mixed_scheduling
- 后端：gateway_service 和 gemini_messages_compat_service 支持混合调度逻辑
- 后端：分组创建支持指定 platform 参数
- 前端：账户创建/编辑弹窗添加混合调度开关（仅 antigravity 账户显示）
- 前端：混合调度开关添加问号图标和 tooltip 说明
- 前端：GroupSelector 支持根据 mixedScheduling 属性过滤分组
- 前端：分组创建支持选择 platform
- 测试：e2e 测试添加 ENDPOINT_PREFIX 环境变量支持混合/隔离模式测试
- 测试：删除过时的 Claude signature 测试用例

											
										
										
											2025-12-29 09:44:39 +08:00
+										if requestedModel != "" && !s.isModelSupportedByAccount(acc, requestedModel) {
 											continue
 										}
 										if selected == nil {
 											selected = acc
 											continue
 										}
 										if acc.Priority < selected.Priority {
 											selected = acc
 										} else if acc.Priority == selected.Priority {
 											switch {
 											case acc.LastUsedAt == nil && selected.LastUsedAt != nil:
 												selected = acc
 											case acc.LastUsedAt != nil && selected.LastUsedAt == nil:
 												// keep selected (never used is preferred)
 											case acc.LastUsedAt == nil && selected.LastUsedAt == nil:
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+												if preferOAuth && acc.Type != selected.Type && acc.Type == AccountTypeOAuth {
 													selected = acc
 												}
-												feat(antigravity): 添加混合调度可选功能

- 后端：账户模型添加 IsMixedSchedulingEnabled() 方法，读取 extra.mixed_scheduling
- 后端：gateway_service 和 gemini_messages_compat_service 支持混合调度逻辑
- 后端：分组创建支持指定 platform 参数
- 前端：账户创建/编辑弹窗添加混合调度开关（仅 antigravity 账户显示）
- 前端：混合调度开关添加问号图标和 tooltip 说明
- 前端：GroupSelector 支持根据 mixedScheduling 属性过滤分组
- 前端：分组创建支持选择 platform
- 测试：e2e 测试添加 ENDPOINT_PREFIX 环境变量支持混合/隔离模式测试
- 测试：删除过时的 Claude signature 测试用例

											
										
										
											2025-12-29 09:44:39 +08:00
+											default:
 												if acc.LastUsedAt.Before(*selected.LastUsedAt) {
 													selected = acc
 												}
 											}
 										}
 									}
 									if selected == nil {
 										if requestedModel != "" {
 											return nil, fmt.Errorf("no available accounts supporting model: %s", requestedModel)
 										}
 										return nil, errors.New("no available accounts")
 									}
 									// 4. 建立粘性绑定
-												fix(gateway): 完善 thinking block 重试和 cache nil 检查

- 使用 FilterThinkingBlocksForRetry 替代 FilterThinkingBlocks
- count_tokens 增加 thinking block 签名错误重试
- cache nil 检查防止空指针
- shouldBill 逻辑修复避免重复扣费
- 移除 debug 日志

											
										
										
											2026-01-03 17:10:25 -08:00
+									if sessionHash != "" && s.cache != nil {
-												feat(groups): add Claude Code client restriction and session isolation

- Add claude_code_only field to restrict groups to Claude Code clients only
- Add fallback_group_id for non-Claude Code requests to use alternate group
- Implement ClaudeCodeValidator for User-Agent detection
- Add group-level session binding isolation (groupID in Redis key)
- Prevent cross-group sticky session pollution
- Update frontend with Claude Code restriction controls

											
										
										
											2026-01-08 23:07:00 +08:00
+										if err := s.cache.SetSessionAccountID(ctx, derefGroupID(groupID), sessionHash, selected.ID, stickySessionTTL); err != nil {
-												feat(antigravity): 添加混合调度可选功能

- 后端：账户模型添加 IsMixedSchedulingEnabled() 方法，读取 extra.mixed_scheduling
- 后端：gateway_service 和 gemini_messages_compat_service 支持混合调度逻辑
- 后端：分组创建支持指定 platform 参数
- 前端：账户创建/编辑弹窗添加混合调度开关（仅 antigravity 账户显示）
- 前端：混合调度开关添加问号图标和 tooltip 说明
- 前端：GroupSelector 支持根据 mixedScheduling 属性过滤分组
- 前端：分组创建支持选择 platform
- 测试：e2e 测试添加 ENDPOINT_PREFIX 环境变量支持混合/隔离模式测试
- 测试：删除过时的 Claude signature 测试用例

											
										
										
											2025-12-29 09:44:39 +08:00
+											log.Printf("set session account failed: session=%s account_id=%d err=%v", sessionHash, selected.ID, err)
 										}
 									}
 									return selected, nil
 								}
 								// selectAccountWithMixedScheduling 选择账户（支持混合调度）
 								// 查询原生平台账户 + 启用 mixed_scheduling 的 antigravity 账户
 								func (s *GatewayService) selectAccountWithMixedScheduling(ctx context.Context, groupID *int64, sessionHash string, requestedModel string, excludedIDs map[int64]struct{}, nativePlatform string) (*Account, error) {
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+									preferOAuth := nativePlatform == PlatformGemini
-												feat(group): 添加分组级别模型路由配置功能
  支持为分组配置模型路由规则，可以指定特定模型模式优先使用的账号列表。

  - 新增 model_routing 字段存储路由配置（JSONB格式，支持通配符匹配）

  - 新增 model_routing_enabled 字段控制是否启用路由

  - 更新后端 handler/service/repository 支持路由配置的增删改查

  - 更新前端 GroupsView 添加路由配置界面

  - 添加数据库迁移脚本 040/041

											
										
										
											2026-01-16 17:26:05 +08:00
+									routingAccountIDs := s.routingAccountIDsForRequest(ctx, groupID, requestedModel, nativePlatform)
 									var accounts []Account
 									accountsLoaded := false
 									// ============ Model Routing (legacy path): apply before sticky session ============
 									if len(routingAccountIDs) > 0 {
 										if s.debugModelRoutingEnabled() {
 											log.Printf("[ModelRoutingDebug] legacy mixed routed begin: group_id=%v model=%s platform=%s session=%s routed_ids=%v",
 												derefGroupID(groupID), requestedModel, nativePlatform, shortSessionHash(sessionHash), routingAccountIDs)
 										}
 										// 1) Sticky session only applies if the bound account is within the routing set.
 										if sessionHash != "" && s.cache != nil {
 											accountID, err := s.cache.GetSessionAccountID(ctx, derefGroupID(groupID), sessionHash)
 											if err == nil && accountID > 0 && containsInt64(routingAccountIDs, accountID) {
 												if _, excluded := excludedIDs[accountID]; !excluded {
 													account, err := s.getSchedulableAccount(ctx, accountID)
 													// 检查账号分组归属和有效性：原生平台直接匹配，antigravity 需要启用混合调度
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+													if err == nil {
 														clearSticky := shouldClearStickySession(account)
 														if clearSticky {
 															_ = s.cache.DeleteSessionAccountID(ctx, derefGroupID(groupID), sessionHash)
 														}
 														if !clearSticky && s.isAccountInGroup(account, groupID) && account.IsSchedulableForModel(requestedModel) && (requestedModel == "" || s.isModelSupportedByAccount(account, requestedModel)) {
 															if account.Platform == nativePlatform || (account.Platform == PlatformAntigravity && account.IsMixedSchedulingEnabled()) {
 																if err := s.cache.RefreshSessionTTL(ctx, derefGroupID(groupID), sessionHash, stickySessionTTL); err != nil {
 																	log.Printf("refresh session ttl failed: session=%s err=%v", sessionHash, err)
 																}
 																if s.debugModelRoutingEnabled() {
 																	log.Printf("[ModelRoutingDebug] legacy mixed routed sticky hit: group_id=%v model=%s session=%s account=%d", derefGroupID(groupID), requestedModel, shortSessionHash(sessionHash), accountID)
 																}
 																return account, nil
-												feat(group): 添加分组级别模型路由配置功能
  支持为分组配置模型路由规则，可以指定特定模型模式优先使用的账号列表。

  - 新增 model_routing 字段存储路由配置（JSONB格式，支持通配符匹配）

  - 新增 model_routing_enabled 字段控制是否启用路由

  - 更新后端 handler/service/repository 支持路由配置的增删改查

  - 更新前端 GroupsView 添加路由配置界面

  - 添加数据库迁移脚本 040/041

											
										
										
											2026-01-16 17:26:05 +08:00
+															}
 														}
 													}
 												}
 											}
 										}
 										// 2) Select an account from the routed candidates.
 										var err error
 										accounts, _, err = s.listSchedulableAccounts(ctx, groupID, nativePlatform, false)
 										if err != nil {
 											return nil, fmt.Errorf("query accounts failed: %w", err)
 										}
 										accountsLoaded = true
 										routingSet := make(map[int64]struct{}, len(routingAccountIDs))
 										for _, id := range routingAccountIDs {
 											if id > 0 {
 												routingSet[id] = struct{}{}
 											}
 										}
 										var selected *Account
 										for i := range accounts {
 											acc := &accounts[i]
 											if _, ok := routingSet[acc.ID]; !ok {
 												continue
 											}
 											if _, excluded := excludedIDs[acc.ID]; excluded {
 												continue
 											}
 											// Scheduler snapshots can be temporarily stale; re-check schedulability here to
 											// avoid selecting accounts that were recently rate-limited/overloaded.
 											if !acc.IsSchedulable() {
 												continue
 											}
 											// 过滤：原生平台直接通过，antigravity 需要启用混合调度
 											if acc.Platform == PlatformAntigravity && !acc.IsMixedSchedulingEnabled() {
 												continue
 											}
 											if !acc.IsSchedulableForModel(requestedModel) {
 												continue
 											}
 											if requestedModel != "" && !s.isModelSupportedByAccount(acc, requestedModel) {
 												continue
 											}
 											if selected == nil {
 												selected = acc
 												continue
 											}
 											if acc.Priority < selected.Priority {
 												selected = acc
 											} else if acc.Priority == selected.Priority {
 												switch {
 												case acc.LastUsedAt == nil && selected.LastUsedAt != nil:
 													selected = acc
 												case acc.LastUsedAt != nil && selected.LastUsedAt == nil:
 													// keep selected (never used is preferred)
 												case acc.LastUsedAt == nil && selected.LastUsedAt == nil:
 													if preferOAuth && acc.Platform == PlatformGemini && selected.Platform == PlatformGemini && acc.Type != selected.Type && acc.Type == AccountTypeOAuth {
 														selected = acc
 													}
 												default:
 													if acc.LastUsedAt.Before(*selected.LastUsedAt) {
 														selected = acc
 													}
 												}
 											}
 										}
 										if selected != nil {
 											if sessionHash != "" && s.cache != nil {
 												if err := s.cache.SetSessionAccountID(ctx, derefGroupID(groupID), sessionHash, selected.ID, stickySessionTTL); err != nil {
 													log.Printf("set session account failed: session=%s account_id=%d err=%v", sessionHash, selected.ID, err)
 												}
 											}
 											if s.debugModelRoutingEnabled() {
 												log.Printf("[ModelRoutingDebug] legacy mixed routed select: group_id=%v model=%s session=%s account=%d", derefGroupID(groupID), requestedModel, shortSessionHash(sessionHash), selected.ID)
 											}
 											return selected, nil
 										}
 										log.Printf("[ModelRouting] No routed accounts available for model=%s, falling back to normal selection", requestedModel)
 									}
-												feat(antigravity): 添加混合调度可选功能

- 后端：账户模型添加 IsMixedSchedulingEnabled() 方法，读取 extra.mixed_scheduling
- 后端：gateway_service 和 gemini_messages_compat_service 支持混合调度逻辑
- 后端：分组创建支持指定 platform 参数
- 前端：账户创建/编辑弹窗添加混合调度开关（仅 antigravity 账户显示）
- 前端：混合调度开关添加问号图标和 tooltip 说明
- 前端：GroupSelector 支持根据 mixedScheduling 属性过滤分组
- 前端：分组创建支持选择 platform
- 测试：e2e 测试添加 ENDPOINT_PREFIX 环境变量支持混合/隔离模式测试
- 测试：删除过时的 Claude signature 测试用例

											
										
										
											2025-12-29 09:44:39 +08:00
 									// 1. 查询粘性会话
-												fix(gateway): 完善 thinking block 重试和 cache nil 检查

- 使用 FilterThinkingBlocksForRetry 替代 FilterThinkingBlocks
- count_tokens 增加 thinking block 签名错误重试
- cache nil 检查防止空指针
- shouldBill 逻辑修复避免重复扣费
- 移除 debug 日志

											
										
										
											2026-01-03 17:10:25 -08:00
+									if sessionHash != "" && s.cache != nil {
-												feat(groups): add Claude Code client restriction and session isolation

- Add claude_code_only field to restrict groups to Claude Code clients only
- Add fallback_group_id for non-Claude Code requests to use alternate group
- Implement ClaudeCodeValidator for User-Agent detection
- Add group-level session binding isolation (groupID in Redis key)
- Prevent cross-group sticky session pollution
- Update frontend with Claude Code restriction controls

											
										
										
											2026-01-08 23:07:00 +08:00
+										accountID, err := s.cache.GetSessionAccountID(ctx, derefGroupID(groupID), sessionHash)
-												feat(antigravity): 添加混合调度可选功能

- 后端：账户模型添加 IsMixedSchedulingEnabled() 方法，读取 extra.mixed_scheduling
- 后端：gateway_service 和 gemini_messages_compat_service 支持混合调度逻辑
- 后端：分组创建支持指定 platform 参数
- 前端：账户创建/编辑弹窗添加混合调度开关（仅 antigravity 账户显示）
- 前端：混合调度开关添加问号图标和 tooltip 说明
- 前端：GroupSelector 支持根据 mixedScheduling 属性过滤分组
- 前端：分组创建支持选择 platform
- 测试：e2e 测试添加 ENDPOINT_PREFIX 环境变量支持混合/隔离模式测试
- 测试：删除过时的 Claude signature 测试用例

											
										
										
											2025-12-29 09:44:39 +08:00
+										if err == nil && accountID > 0 {
 											if _, excluded := excludedIDs[accountID]; !excluded {
-												feat(scheduler): 引入调度快照缓存与 outbox 回放

- 调度热路径优先读 Redis 快照，保留分组排序语义
- outbox 回放 + 全量重建纠偏，失败重试不推进水位
- 自动 Atlas 基线对齐并同步调度配置示例

											
										
										
											2026-01-12 14:19:06 +08:00
+												account, err := s.getSchedulableAccount(ctx, accountID)
-												fix(gateway): 修复账号跨分组调度问题

问题：账号可能被调度到未分配的分组（如 simon 账号被调度到 claude_default）

根因：
- 强制平台模式下分组查询失败时回退到全平台查询
- listSchedulableAccounts 中分组为空时回退到无分组查询
- 粘性会话只检查平台匹配，未校验账号分组归属

修复：
- 移除强制平台模式的回退逻辑，分组内无账号时返回错误
- 移除 listSchedulableAccounts 的回退逻辑
- 新增 isAccountInGroup 方法用于分组校验
- 在三处粘性会话检查中增加分组归属验证

											
										
										
											2026-01-07 10:56:52 +08:00
+												// 检查账号分组归属和有效性：原生平台直接匹配，antigravity 需要启用混合调度
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+												if err == nil {
 													clearSticky := shouldClearStickySession(account)
 													if clearSticky {
 														_ = s.cache.DeleteSessionAccountID(ctx, derefGroupID(groupID), sessionHash)
 													}
 													if !clearSticky && s.isAccountInGroup(account, groupID) && account.IsSchedulableForModel(requestedModel) && (requestedModel == "" || s.isModelSupportedByAccount(account, requestedModel)) {
 														if account.Platform == nativePlatform || (account.Platform == PlatformAntigravity && account.IsMixedSchedulingEnabled()) {
 															if err := s.cache.RefreshSessionTTL(ctx, derefGroupID(groupID), sessionHash, stickySessionTTL); err != nil {
 																log.Printf("refresh session ttl failed: session=%s err=%v", sessionHash, err)
 															}
 															return account, nil
-												feat(antigravity): 添加混合调度可选功能

- 后端：账户模型添加 IsMixedSchedulingEnabled() 方法，读取 extra.mixed_scheduling
- 后端：gateway_service 和 gemini_messages_compat_service 支持混合调度逻辑
- 后端：分组创建支持指定 platform 参数
- 前端：账户创建/编辑弹窗添加混合调度开关（仅 antigravity 账户显示）
- 前端：混合调度开关添加问号图标和 tooltip 说明
- 前端：GroupSelector 支持根据 mixedScheduling 属性过滤分组
- 前端：分组创建支持选择 platform
- 测试：e2e 测试添加 ENDPOINT_PREFIX 环境变量支持混合/隔离模式测试
- 测试：删除过时的 Claude signature 测试用例

											
										
										
											2025-12-29 09:44:39 +08:00
+														}
 													}
 												}
 											}
 										}
 									}
 									// 2. 获取可调度账号列表
-												feat(group): 添加分组级别模型路由配置功能
  支持为分组配置模型路由规则，可以指定特定模型模式优先使用的账号列表。

  - 新增 model_routing 字段存储路由配置（JSONB格式，支持通配符匹配）

  - 新增 model_routing_enabled 字段控制是否启用路由

  - 更新后端 handler/service/repository 支持路由配置的增删改查

  - 更新前端 GroupsView 添加路由配置界面

  - 添加数据库迁移脚本 040/041

											
										
										
											2026-01-16 17:26:05 +08:00
+									if !accountsLoaded {
 										var err error
 										accounts, _, err = s.listSchedulableAccounts(ctx, groupID, nativePlatform, false)
 										if err != nil {
 											return nil, fmt.Errorf("query accounts failed: %w", err)
 										}
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									}
-												feat(antigravity): 添加混合调度可选功能

- 后端：账户模型添加 IsMixedSchedulingEnabled() 方法，读取 extra.mixed_scheduling
- 后端：gateway_service 和 gemini_messages_compat_service 支持混合调度逻辑
- 后端：分组创建支持指定 platform 参数
- 前端：账户创建/编辑弹窗添加混合调度开关（仅 antigravity 账户显示）
- 前端：混合调度开关添加问号图标和 tooltip 说明
- 前端：GroupSelector 支持根据 mixedScheduling 属性过滤分组
- 前端：分组创建支持选择 platform
- 测试：e2e 测试添加 ENDPOINT_PREFIX 环境变量支持混合/隔离模式测试
- 测试：删除过时的 Claude signature 测试用例

											
										
										
											2025-12-29 09:44:39 +08:00
+									// 3. 按优先级+最久未用选择（考虑模型支持和混合调度）
-												refactor: 调整项目结构为单向依赖

											
										
										
											2025-12-26 15:40:24 +08:00
+									var selected *Account
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									for i := range accounts {
 										acc := &accounts[i]
-												feat: cc/codex support account retry

											
										
										
											2025-12-27 11:44:00 +08:00
+										if _, excluded := excludedIDs[acc.ID]; excluded {
 											continue
 										}
-												fix(网关): 修复账号选择中的调度器快照延迟问题

## 问题描述
调度器快照更新存在0.5-1秒的延迟（Outbox轮询间隔），导致在账号被限流或过载后的短时间窗口内，
可能仍会被选中，造成请求失败。

## 根本原因
账号选择逻辑依赖调度器快照（listSchedulableAccounts），但快照更新有延迟：
- Outbox轮询: 每1秒检查一次变更事件
- 全量重建: 每300秒重建一次
- 时间窗口: 账号状态变更后0.5-1秒内，快照可能未更新

## 解决方案
在账号选择循环中添加IsSchedulable()实时检查，作为第二道防线：
1. 第一道防线: 调度器快照过滤（可能有延迟）
2. 第二道防线: IsSchedulable()实时检查（本次修复）

IsSchedulable()会检查：
- RateLimitResetAt: 限流重置时间
- OverloadUntil: 过载持续时间
- TempUnschedulableUntil: 临时不可调度时间
- Status: 账号状态
- Schedulable: 可调度标志

## 修改范围
### OpenAI Gateway Service
- SelectAccountForModelWithExclusions: 添加IsSchedulable()检查
- SelectAccountWithLoadAwareness: 添加IsSchedulable()检查

### Gateway Service (Claude/Gemini/Antigravity)
- 负载感知选择候选账号筛选: 添加IsSchedulable()检查
- selectAccountForModelWithPlatform: 添加IsSchedulable()检查
- selectAccountWithMixedScheduling: 添加IsSchedulable()检查

### 测试用例
- OpenAI: 添加2个测试用例验证限流账号过滤
- Gateway: 添加2个测试用例验证限流和过载账号过滤

### 其他修复
- ops_repo_preagg.go: 修复platform为NULL时的聚合问题

## 测试结果
所有单元测试通过 ✅

											
										
										
											2026-01-13 22:49:26 -08:00
+										// Scheduler snapshots can be temporarily stale; re-check schedulability here to
 										// avoid selecting accounts that were recently rate-limited/overloaded.
 										if !acc.IsSchedulable() {
 											continue
 										}
-												feat(antigravity): 添加混合调度可选功能

- 后端：账户模型添加 IsMixedSchedulingEnabled() 方法，读取 extra.mixed_scheduling
- 后端：gateway_service 和 gemini_messages_compat_service 支持混合调度逻辑
- 后端：分组创建支持指定 platform 参数
- 前端：账户创建/编辑弹窗添加混合调度开关（仅 antigravity 账户显示）
- 前端：混合调度开关添加问号图标和 tooltip 说明
- 前端：GroupSelector 支持根据 mixedScheduling 属性过滤分组
- 前端：分组创建支持选择 platform
- 测试：e2e 测试添加 ENDPOINT_PREFIX 环境变量支持混合/隔离模式测试
- 测试：删除过时的 Claude signature 测试用例

											
										
										
											2025-12-29 09:44:39 +08:00
+										// 过滤：原生平台直接通过，antigravity 需要启用混合调度
 										if acc.Platform == PlatformAntigravity && !acc.IsMixedSchedulingEnabled() {
 											continue
 										}
-												feat: antigravity 配额域限流

											
										
										
											2026-01-09 17:35:02 +08:00
+										if !acc.IsSchedulableForModel(requestedModel) {
 											continue
 										}
-												feat: 完善 Antigravity 多平台网关支持，修复 Gemini handler 分流逻辑

											
										
										
											2025-12-28 17:48:52 +08:00
+										if requestedModel != "" && !s.isModelSupportedByAccount(acc, requestedModel) {
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+											continue
 										}
 										if selected == nil {
 											selected = acc
 											continue
 										}
 										if acc.Priority < selected.Priority {
 											selected = acc
 										} else if acc.Priority == selected.Priority {
-												feat(backend): 实现 Gemini AI Studio OAuth 和消息兼容服务

- gemini_oauth_service.go: 新增 AI Studio OAuth 类型支持
- gemini_token_provider.go: Token 提供器增强
- gemini_messages_compat_service.go: 支持 AI Studio 端点
- account_test_service.go: Gemini 账户可用性检测
- gateway_service.go: 网关服务适配
- openai_gateway_service.go: OpenAI 兼容层调整

											
										
										
											2025-12-25 21:24:44 -08:00
+											switch {
 											case acc.LastUsedAt == nil && selected.LastUsedAt != nil:
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+												selected = acc
-												feat(backend): 实现 Gemini AI Studio OAuth 和消息兼容服务

- gemini_oauth_service.go: 新增 AI Studio OAuth 类型支持
- gemini_token_provider.go: Token 提供器增强
- gemini_messages_compat_service.go: 支持 AI Studio 端点
- account_test_service.go: Gemini 账户可用性检测
- gateway_service.go: 网关服务适配
- openai_gateway_service.go: OpenAI 兼容层调整

											
										
										
											2025-12-25 21:24:44 -08:00
+											case acc.LastUsedAt != nil && selected.LastUsedAt == nil:
 												// keep selected (never used is preferred)
 											case acc.LastUsedAt == nil && selected.LastUsedAt == nil:
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+												if preferOAuth && acc.Platform == PlatformGemini && selected.Platform == PlatformGemini && acc.Type != selected.Type && acc.Type == AccountTypeOAuth {
 													selected = acc
 												}
-												feat(backend): 实现 Gemini AI Studio OAuth 和消息兼容服务

- gemini_oauth_service.go: 新增 AI Studio OAuth 类型支持
- gemini_token_provider.go: Token 提供器增强
- gemini_messages_compat_service.go: 支持 AI Studio 端点
- account_test_service.go: Gemini 账户可用性检测
- gateway_service.go: 网关服务适配
- openai_gateway_service.go: OpenAI 兼容层调整

											
										
										
											2025-12-25 21:24:44 -08:00
+											default:
 												if acc.LastUsedAt.Before(*selected.LastUsedAt) {
 													selected = acc
 												}
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+											}
 										}
 									}
 									if selected == nil {
 										if requestedModel != "" {
 											return nil, fmt.Errorf("no available accounts supporting model: %s", requestedModel)
 										}
 										return nil, errors.New("no available accounts")
 									}
 									// 4. 建立粘性绑定
-												fix(gateway): 完善 thinking block 重试和 cache nil 检查

- 使用 FilterThinkingBlocksForRetry 替代 FilterThinkingBlocks
- count_tokens 增加 thinking block 签名错误重试
- cache nil 检查防止空指针
- shouldBill 逻辑修复避免重复扣费
- 移除 debug 日志

											
										
										
											2026-01-03 17:10:25 -08:00
+									if sessionHash != "" && s.cache != nil {
-												feat(groups): add Claude Code client restriction and session isolation

- Add claude_code_only field to restrict groups to Claude Code clients only
- Add fallback_group_id for non-Claude Code requests to use alternate group
- Implement ClaudeCodeValidator for User-Agent detection
- Add group-level session binding isolation (groupID in Redis key)
- Prevent cross-group sticky session pollution
- Update frontend with Claude Code restriction controls

											
										
										
											2026-01-08 23:07:00 +08:00
+										if err := s.cache.SetSessionAccountID(ctx, derefGroupID(groupID), sessionHash, selected.ID, stickySessionTTL); err != nil {
-												ci(backend): 添加 github actions (#10)

## 变更内容

### CI/CD
- 添加 GitHub Actions 工作流（test + golangci-lint）
- 添加 golangci-lint 配置，启用 errcheck/govet/staticcheck/unused/depguard
- 通过 depguard 强制 service 层不能直接导入 repository

### 错误处理修复
- 修复 CSV 写入、SSE 流式输出、随机数生成等未处理的错误
- GenerateRedeemCode() 现在返回 error

### 资源泄露修复
- 统一使用 defer func() { _ = xxx.Close() }() 模式

### 代码清理
- 移除未使用的常量
- 简化 nil map 检查
- 统一代码格式
											
										
										
											2025-12-20 15:29:52 +08:00
+											log.Printf("set session account failed: session=%s account_id=%d err=%v", sessionHash, selected.ID, err)
 										}
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									}
 									return selected, nil
 								}
-												feat: 完善 Antigravity 多平台网关支持，修复 Gemini handler 分流逻辑

											
										
										
											2025-12-28 17:48:52 +08:00
+								// isModelSupportedByAccount 根据账户平台检查模型支持
 								func (s *GatewayService) isModelSupportedByAccount(account *Account, requestedModel string) bool {
 									if account.Platform == PlatformAntigravity {
 										// Antigravity 平台使用专门的模型支持检查
 										return IsAntigravityModelSupported(requestedModel)
 									}
-												Add invalid-request fallback routing

											
										
										
											2026-01-23 22:24:46 +08:00
+									if account.Platform == PlatformAnthropic {
 										requestedModel = normalizeClaudeModelForAnthropic(requestedModel)
 									}
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+									// Gemini API Key 账户直接透传，由上游判断模型是否支持
 									if account.Platform == PlatformGemini && account.Type == AccountTypeAPIKey {
 										return true
 									}
-												feat: 完善 Antigravity 多平台网关支持，修复 Gemini handler 分流逻辑

											
										
										
											2025-12-28 17:48:52 +08:00
+									// 其他平台使用账户的模型支持检查
 									return account.IsModelSupported(requestedModel)
 								}
 								// IsAntigravityModelSupported 检查 Antigravity 平台是否支持指定模型
-												refactor(antigravity): 简化模型映射逻辑，支持前缀匹配

- 删除精确映射表 antigravityModelMapping，统一使用前缀映射
- 前缀映射支持模型版本号变化（如 -20251111, -thinking, -preview）
- 简化 IsModelSupported 函数，所有 claude-/gemini- 前缀模型都支持
- 添加跨协议测试用例：Claude 端点调用 Gemini 模型、Gemini 端点调用 Claude 模型

											
										
										
											2025-12-31 21:16:32 +08:00
+								// 所有 claude- 和 gemini- 前缀的模型都能通过映射或透传支持
-												feat: 完善 Antigravity 多平台网关支持，修复 Gemini handler 分流逻辑

											
										
										
											2025-12-28 17:48:52 +08:00
+								func IsAntigravityModelSupported(requestedModel string) bool {
-												refactor(antigravity): 简化模型映射逻辑，支持前缀匹配

- 删除精确映射表 antigravityModelMapping，统一使用前缀映射
- 前缀映射支持模型版本号变化（如 -20251111, -thinking, -preview）
- 简化 IsModelSupported 函数，所有 claude-/gemini- 前缀模型都支持
- 添加跨协议测试用例：Claude 端点调用 Gemini 模型、Gemini 端点调用 Claude 模型

											
										
										
											2025-12-31 21:16:32 +08:00
+									return strings.HasPrefix(requestedModel, "claude-") ||
 										strings.HasPrefix(requestedModel, "gemini-")
-												feat: 完善 Antigravity 多平台网关支持，修复 Gemini handler 分流逻辑

											
										
										
											2025-12-28 17:48:52 +08:00
+								}
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+								// GetAccessToken 获取账号凭证
-												refactor: 调整项目结构为单向依赖

											
										
										
											2025-12-26 15:40:24 +08:00
+								func (s *GatewayService) GetAccessToken(ctx context.Context, account *Account) (string, string, error) {
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									switch account.Type {
-												refactor: 调整项目结构为单向依赖

											
										
										
											2025-12-26 15:40:24 +08:00
+									case AccountTypeOAuth, AccountTypeSetupToken:
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+										// Both oauth and setup-token use OAuth token flow
 										return s.getOAuthToken(ctx, account)
-												fix(lint): 修复所有 Go 命名规范问题

- 全局替换 ApiKey → APIKey（类型、字段、方法、变量）
- 修复所有 initialism 命名（API, SMTP, HTML, URL 等）
- 添加所有缺失的包注释
- 修复导出符号的注释格式

主要修改：
- ApiKey → APIKey（所有出现的地方）
- ApiKeyID → APIKeyID
- ApiKeyIDs → APIKeyIDs
- TestSmtpConnection → TestSMTPConnection
- HtmlURL → HTMLURL
- 添加 20+ 个包注释
- 修复 10+ 个导出符号注释格式

验证结果：
- ✓ golangci-lint: 0 issues
- ✓ 单元测试: 通过
- ✓ 集成测试: 通过

											
										
										
											2026-01-04 19:27:53 +08:00
+									case AccountTypeAPIKey:
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+										apiKey := account.GetCredential("api_key")
 										if apiKey == "" {
 											return "", "", errors.New("api_key not found in credentials")
 										}
 										return apiKey, "apikey", nil
 									default:
 										return "", "", fmt.Errorf("unsupported account type: %s", account.Type)
 									}
 								}
-												refactor: 调整项目结构为单向依赖

											
										
										
											2025-12-26 15:40:24 +08:00
+								func (s *GatewayService) getOAuthToken(ctx context.Context, account *Account) (string, string, error) {
-												feat(网关): 引入 OpenAI/Claude OAuth token 缓存

新增 OpenAI/Claude TokenProvider 与缓存键生成
扩展 OAuth 缓存失效覆盖更多平台
统一 OAuth 缓存前缀与依赖注入

											
										
										
											2026-01-15 18:27:06 +08:00
+									// 对于 Anthropic OAuth 账号，使用 ClaudeTokenProvider 获取缓存的 token
 									if account.Platform == PlatformAnthropic && account.Type == AccountTypeOAuth && s.claudeTokenProvider != nil {
 										accessToken, err := s.claudeTokenProvider.GetAccessToken(ctx, account)
 										if err != nil {
 											return "", "", err
 										}
 										return accessToken, "oauth", nil
 									}
 									// 其他情况（Gemini 有自己的 TokenProvider，setup-token 类型等）直接从账号读取
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									accessToken := account.GetCredential("access_token")
-												fix: 修复Oauth账号自动刷新token失败的bug

											
										
										
											2025-12-20 13:01:58 +08:00
+									if accessToken == "" {
 										return "", "", errors.New("access_token not found in credentials")
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									}
-												fix: 修复Oauth账号自动刷新token失败的bug

											
										
										
											2025-12-20 13:01:58 +08:00
+									// Token刷新由后台 TokenRefreshService 处理，此处只返回当前token
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									return accessToken, "oauth", nil
 								}
-												feat(gateway): 添加上游错误重试机制

- OAuth/Setup Token 账号遇到 403 错误时，等待 2 秒后重试，最多 3 次
- Console 账号遇到未配置的错误码时，同样进行重试
- 重试耗尽后：OAuth 403 标记账号异常，Console 未配置错误码不标记账号
- 移除 handleErrorResponse 中已被重试逻辑覆盖的死代码

											
										
										
											2025-12-24 16:55:46 +08:00
+								// 重试相关常量
 								const (
-												fix(frontend): comprehensive i18n cleanup and Select component hardening

											
										
										
											2026-01-04 21:09:14 +08:00
+									// 最大尝试次数（包含首次请求）。过多重试会导致请求堆积与资源耗尽。
 									maxRetryAttempts = 5
 									// 指数退避：第 N 次失败后的等待 = retryBaseDelay * 2^(N-1)，并且上限为 retryMaxDelay。
 									retryBaseDelay = 300 * time.Millisecond
 									retryMaxDelay  = 3 * time.Second
 									// 最大重试耗时（包含请求本身耗时 + 退避等待时间）。
 									// 用于防止极端情况下 goroutine 长时间堆积导致资源耗尽。
 									maxRetryElapsed = 10 * time.Second
-												feat(gateway): 添加上游错误重试机制

- OAuth/Setup Token 账号遇到 403 错误时，等待 2 秒后重试，最多 3 次
- Console 账号遇到未配置的错误码时，同样进行重试
- 重试耗尽后：OAuth 403 标记账号异常，Console 未配置错误码不标记账号
- 移除 handleErrorResponse 中已被重试逻辑覆盖的死代码

											
										
										
											2025-12-24 16:55:46 +08:00
+								)
-												refactor: 调整项目结构为单向依赖

											
										
										
											2025-12-26 15:40:24 +08:00
+								func (s *GatewayService) shouldRetryUpstreamError(account *Account, statusCode int) bool {
-												feat(gateway): 添加上游错误重试机制

- OAuth/Setup Token 账号遇到 403 错误时，等待 2 秒后重试，最多 3 次
- Console 账号遇到未配置的错误码时，同样进行重试
- 重试耗尽后：OAuth 403 标记账号异常，Console 未配置错误码不标记账号
- 移除 handleErrorResponse 中已被重试逻辑覆盖的死代码

											
										
										
											2025-12-24 16:55:46 +08:00
+									// OAuth/Setup Token 账号：仅 403 重试
 									if account.IsOAuth() {
 										return statusCode == 403
 									}
 									// API Key 账号：未配置的错误码重试
 									return !account.ShouldHandleErrorCode(statusCode)
 								}
-												feat: cc/codex support account retry

											
										
										
											2025-12-27 11:44:00 +08:00
+								// shouldFailoverUpstreamError determines whether an upstream error should trigger account failover.
 								func (s *GatewayService) shouldFailoverUpstreamError(statusCode int) bool {
 									switch statusCode {
 									case 401, 403, 429, 529:
 										return true
 									default:
 										return statusCode >= 500
 									}
 								}
-												fix(frontend): comprehensive i18n cleanup and Select component hardening

											
										
										
											2026-01-04 21:09:14 +08:00
+								func retryBackoffDelay(attempt int) time.Duration {
 									// attempt 从 1 开始，表示第 attempt 次请求刚失败，需要等待后进行第 attempt+1 次请求。
 									if attempt <= 0 {
 										return retryBaseDelay
 									}
 									delay := retryBaseDelay * time.Duration(1<<(attempt-1))
 									if delay > retryMaxDelay {
 										return retryMaxDelay
 									}
 									return delay
 								}
 								func sleepWithContext(ctx context.Context, d time.Duration) error {
 									if d <= 0 {
 										return nil
 									}
 									timer := time.NewTimer(d)
 									defer func() {
 										if !timer.Stop() {
 											select {
 											case <-timer.C:
 											default:
 											}
 										}
 									}()
 									select {
 									case <-ctx.Done():
 										return ctx.Err()
 									case <-timer.C:
 										return nil
 									}
 								}
-												feat(gateway): 实现 Claude Code 系统提示词智能注入

											
										
										
											2026-01-04 10:38:13 +08:00
+								// isClaudeCodeClient 判断请求是否来自 Claude Code 客户端
 								// 简化判断：User-Agent 匹配 + metadata.user_id 存在
 								func isClaudeCodeClient(userAgent string, metadataUserID string) bool {
 									if metadataUserID == "" {
 										return false
 									}
 									return claudeCliUserAgentRe.MatchString(userAgent)
 								}
-												fix(网关): 区分 Claude Code OAuth 适配

											
										
										
											2026-01-15 19:17:07 +08:00
+								func isClaudeCodeRequest(ctx context.Context, c *gin.Context, parsed *ParsedRequest) bool {
 									if IsClaudeCodeClient(ctx) {
 										return true
 									}
 									if parsed == nil || c == nil {
 										return false
 									}
 									return isClaudeCodeClient(c.GetHeader("User-Agent"), parsed.MetadataUserID)
 								}
-												feat(gateway): 实现 Claude Code 系统提示词智能注入

											
										
										
											2026-01-04 10:38:13 +08:00
+								// systemIncludesClaudeCodePrompt 检查 system 中是否已包含 Claude Code 提示词
-												fix(gateway): 修复 cache_control 块超限问题并优化 Claude Code 检测

问题：
- OAuth/SetupToken 账号注入 system prompt 后可能导致 cache_control
  块超过 Anthropic API 的 4 个限制
- Claude Code 检测使用精确匹配，无法识别 Agent SDK 等变体

修复：
- 新增 enforceCacheControlLimit 函数，强制执行 4 个块限制
- 优先从 messages 移除，再从 system 尾部移除（保护注入的 prompt）
- 改用前缀匹配检测 Claude Code 系统提示词，支持多种变体：
  - 标准版、Agent SDK 版、Explore Agent 版、Compact 版

											
										
										
											2026-01-07 10:17:09 +08:00
+								// 使用前缀匹配支持多种变体（标准版、Agent SDK 版等）
-												feat(gateway): 实现 Claude Code 系统提示词智能注入

											
										
										
											2026-01-04 10:38:13 +08:00
+								func systemIncludesClaudeCodePrompt(system any) bool {
 									switch v := system.(type) {
 									case string:
-												fix(gateway): 修复 cache_control 块超限问题并优化 Claude Code 检测

问题：
- OAuth/SetupToken 账号注入 system prompt 后可能导致 cache_control
  块超过 Anthropic API 的 4 个限制
- Claude Code 检测使用精确匹配，无法识别 Agent SDK 等变体

修复：
- 新增 enforceCacheControlLimit 函数，强制执行 4 个块限制
- 优先从 messages 移除，再从 system 尾部移除（保护注入的 prompt）
- 改用前缀匹配检测 Claude Code 系统提示词，支持多种变体：
  - 标准版、Agent SDK 版、Explore Agent 版、Compact 版

											
										
										
											2026-01-07 10:17:09 +08:00
+										return hasClaudeCodePrefix(v)
-												feat(gateway): 实现 Claude Code 系统提示词智能注入

											
										
										
											2026-01-04 10:38:13 +08:00
+									case []any:
 										for _, item := range v {
 											if m, ok := item.(map[string]any); ok {
-												fix(gateway): 修复 cache_control 块超限问题并优化 Claude Code 检测

问题：
- OAuth/SetupToken 账号注入 system prompt 后可能导致 cache_control
  块超过 Anthropic API 的 4 个限制
- Claude Code 检测使用精确匹配，无法识别 Agent SDK 等变体

修复：
- 新增 enforceCacheControlLimit 函数，强制执行 4 个块限制
- 优先从 messages 移除，再从 system 尾部移除（保护注入的 prompt）
- 改用前缀匹配检测 Claude Code 系统提示词，支持多种变体：
  - 标准版、Agent SDK 版、Explore Agent 版、Compact 版

											
										
										
											2026-01-07 10:17:09 +08:00
+												if text, ok := m["text"].(string); ok && hasClaudeCodePrefix(text) {
-												feat(gateway): 实现 Claude Code 系统提示词智能注入

											
										
										
											2026-01-04 10:38:13 +08:00
+													return true
 												}
 											}
 										}
 									}
 									return false
 								}
-												fix(gateway): 修复 cache_control 块超限问题并优化 Claude Code 检测

问题：
- OAuth/SetupToken 账号注入 system prompt 后可能导致 cache_control
  块超过 Anthropic API 的 4 个限制
- Claude Code 检测使用精确匹配，无法识别 Agent SDK 等变体

修复：
- 新增 enforceCacheControlLimit 函数，强制执行 4 个块限制
- 优先从 messages 移除，再从 system 尾部移除（保护注入的 prompt）
- 改用前缀匹配检测 Claude Code 系统提示词，支持多种变体：
  - 标准版、Agent SDK 版、Explore Agent 版、Compact 版

											
										
										
											2026-01-07 10:17:09 +08:00
+								// hasClaudeCodePrefix 检查文本是否以 Claude Code 提示词的特征前缀开头
 								func hasClaudeCodePrefix(text string) bool {
 									for _, prefix := range claudeCodePromptPrefixes {
 										if strings.HasPrefix(text, prefix) {
 											return true
 										}
 									}
 									return false
 								}
-												feat(gateway): 实现 Claude Code 系统提示词智能注入

											
										
										
											2026-01-04 10:38:13 +08:00
+								// injectClaudeCodePrompt 在 system 开头注入 Claude Code 提示词
 								// 处理 null、字符串、数组三种格式
 								func injectClaudeCodePrompt(body []byte, system any) []byte {
 									claudeCodeBlock := map[string]any{
 										"type":          "text",
 										"text":          claudeCodeSystemPrompt,
 										"cache_control": map[string]string{"type": "ephemeral"},
 									}
-												fix: also prefix next system block with Claude Code banner

											
										
										
											2026-01-29 02:03:54 +08:00
+									// Opencode plugin applies an extra safeguard: it not only prepends the Claude Code
 									// banner, it also prefixes the next system instruction with the same banner plus
 									// a blank line. This helps when upstream concatenates system instructions.
 									claudeCodePrefix := strings.TrimSpace(claudeCodeSystemPrompt)
-												feat(gateway): 实现 Claude Code 系统提示词智能注入

											
										
										
											2026-01-04 10:38:13 +08:00
 									var newSystem []any
 									switch v := system.(type) {
 									case nil:
 										newSystem = []any{claudeCodeBlock}
 									case string:
-												fix: add newline separation for Claude Code system prompt

											
										
										
											2026-01-29 01:28:43 +08:00
+										// Be tolerant of older/newer clients that may differ only by trailing whitespace/newlines.
 										if strings.TrimSpace(v) == "" || strings.TrimSpace(v) == strings.TrimSpace(claudeCodeSystemPrompt) {
-												feat(gateway): 实现 Claude Code 系统提示词智能注入

											
										
										
											2026-01-04 10:38:13 +08:00
+											newSystem = []any{claudeCodeBlock}
 										} else {
-												fix: also prefix next system block with Claude Code banner

											
										
										
											2026-01-29 02:03:54 +08:00
+											// Mirror opencode behavior: keep the banner as a separate system entry,
 											// but also prefix the next system text with the banner.
 											merged := v
 											if !strings.HasPrefix(v, claudeCodePrefix) {
 												merged = claudeCodePrefix + "\n\n" + v
 											}
 											newSystem = []any{claudeCodeBlock, map[string]any{"type": "text", "text": merged}}
-												feat(gateway): 实现 Claude Code 系统提示词智能注入

											
										
										
											2026-01-04 10:38:13 +08:00
+										}
 									case []any:
 										newSystem = make([]any, 0, len(v)+1)
 										newSystem = append(newSystem, claudeCodeBlock)
-												fix: also prefix next system block with Claude Code banner

											
										
										
											2026-01-29 02:03:54 +08:00
+										prefixedNext := false
-												feat(gateway): 实现 Claude Code 系统提示词智能注入

											
										
										
											2026-01-04 10:38:13 +08:00
+										for _, item := range v {
 											if m, ok := item.(map[string]any); ok {
-												fix: add newline separation for Claude Code system prompt

											
										
										
											2026-01-29 01:28:43 +08:00
+												if text, ok := m["text"].(string); ok && strings.TrimSpace(text) == strings.TrimSpace(claudeCodeSystemPrompt) {
-												feat(gateway): 实现 Claude Code 系统提示词智能注入

											
										
										
											2026-01-04 10:38:13 +08:00
+													continue
 												}
-												fix: also prefix next system block with Claude Code banner

											
										
										
											2026-01-29 02:03:54 +08:00
+												// Prefix the first subsequent text system block once.
 												if !prefixedNext {
 													if blockType, _ := m["type"].(string); blockType == "text" {
 														if text, ok := m["text"].(string); ok && strings.TrimSpace(text) != "" && !strings.HasPrefix(text, claudeCodePrefix) {
 															m["text"] = claudeCodePrefix + "\n\n" + text
 															prefixedNext = true
 														}
 													}
 												}
-												feat(gateway): 实现 Claude Code 系统提示词智能注入

											
										
										
											2026-01-04 10:38:13 +08:00
+											}
 											newSystem = append(newSystem, item)
 										}
 									default:
 										newSystem = []any{claudeCodeBlock}
 									}
 									result, err := sjson.SetBytes(body, "system", newSystem)
 									if err != nil {
 										log.Printf("Warning: failed to inject Claude Code prompt: %v", err)
 										return body
 									}
 									return result
 								}
-												fix(gateway): 修复 cache_control 块超限问题并优化 Claude Code 检测

问题：
- OAuth/SetupToken 账号注入 system prompt 后可能导致 cache_control
  块超过 Anthropic API 的 4 个限制
- Claude Code 检测使用精确匹配，无法识别 Agent SDK 等变体

修复：
- 新增 enforceCacheControlLimit 函数，强制执行 4 个块限制
- 优先从 messages 移除，再从 system 尾部移除（保护注入的 prompt）
- 改用前缀匹配检测 Claude Code 系统提示词，支持多种变体：
  - 标准版、Agent SDK 版、Explore Agent 版、Compact 版

											
										
										
											2026-01-07 10:17:09 +08:00
+								// enforceCacheControlLimit 强制执行 cache_control 块数量限制（最多 4 个）
 								// 超限时优先从 messages 中移除 cache_control，保护 system 中的缓存控制
 								func enforceCacheControlLimit(body []byte) []byte {
 									var data map[string]any
 									if err := json.Unmarshal(body, &data); err != nil {
 										return body
 									}
-												feat(gateway): 优化 Antigravity/Gemini 思考块处理

此提交解决了思考块 (thinking blocks) 在转发过程中的兼容性问题。

主要变更：

1. **思考块优化 (Thinking Blocks)**：
   - 在 AntigravityGatewayService 中增加了 sanitizeThinkingBlocks 处理，强制移除思考块中不支持的 cache_control 字段（避免 Anthropic/Vertex AI 报错）
   - 实现历史思考块展平 (Flattening)：将非最后一条消息中的思考块转换为普通文本块，以绕过上游对历史思考块签名的严格校验
   - 增加 cleanCacheControlFromGeminiJSON 作为最后一道防线，确保转换后的 Gemini 请求中不残留非法的 cache_control

2. **GatewayService 缓存控制优化**：
   - 更新缓存控制逻辑，跳过 thinking 块（thinking 块不支持 cache_control 字段）
   - 增加 removeCacheControlFromThinkingBlocks 函数强制清理

关联 Issue: #225

											
										
										
											2026-01-10 04:56:11 +00:00
+									// 清理 thinking 块中的非法 cache_control（thinking 块不支持该字段）
 									removeCacheControlFromThinkingBlocks(data)
-												fix(gateway): 修复 cache_control 块超限问题并优化 Claude Code 检测

问题：
- OAuth/SetupToken 账号注入 system prompt 后可能导致 cache_control
  块超过 Anthropic API 的 4 个限制
- Claude Code 检测使用精确匹配，无法识别 Agent SDK 等变体

修复：
- 新增 enforceCacheControlLimit 函数，强制执行 4 个块限制
- 优先从 messages 移除，再从 system 尾部移除（保护注入的 prompt）
- 改用前缀匹配检测 Claude Code 系统提示词，支持多种变体：
  - 标准版、Agent SDK 版、Explore Agent 版、Compact 版

											
										
										
											2026-01-07 10:17:09 +08:00
+									// 计算当前 cache_control 块数量
 									count := countCacheControlBlocks(data)
 									if count <= maxCacheControlBlocks {
 										return body
 									}
 									// 超限：优先从 messages 中移除，再从 system 中移除
 									for count > maxCacheControlBlocks {
 										if removeCacheControlFromMessages(data) {
 											count--
 											continue
 										}
 										if removeCacheControlFromSystem(data) {
 											count--
 											continue
 										}
 										break
 									}
 									result, err := json.Marshal(data)
 									if err != nil {
 										return body
 									}
 									return result
 								}
 								// countCacheControlBlocks 统计 system 和 messages 中的 cache_control 块数量
-												feat(gateway): 优化 Antigravity/Gemini 思考块处理

此提交解决了思考块 (thinking blocks) 在转发过程中的兼容性问题。

主要变更：

1. **思考块优化 (Thinking Blocks)**：
   - 在 AntigravityGatewayService 中增加了 sanitizeThinkingBlocks 处理，强制移除思考块中不支持的 cache_control 字段（避免 Anthropic/Vertex AI 报错）
   - 实现历史思考块展平 (Flattening)：将非最后一条消息中的思考块转换为普通文本块，以绕过上游对历史思考块签名的严格校验
   - 增加 cleanCacheControlFromGeminiJSON 作为最后一道防线，确保转换后的 Gemini 请求中不残留非法的 cache_control

2. **GatewayService 缓存控制优化**：
   - 更新缓存控制逻辑，跳过 thinking 块（thinking 块不支持 cache_control 字段）
   - 增加 removeCacheControlFromThinkingBlocks 函数强制清理

关联 Issue: #225

											
										
										
											2026-01-10 04:56:11 +00:00
+								// 注意：thinking 块不支持 cache_control，统计时跳过
-												fix(gateway): 修复 cache_control 块超限问题并优化 Claude Code 检测

问题：
- OAuth/SetupToken 账号注入 system prompt 后可能导致 cache_control
  块超过 Anthropic API 的 4 个限制
- Claude Code 检测使用精确匹配，无法识别 Agent SDK 等变体

修复：
- 新增 enforceCacheControlLimit 函数，强制执行 4 个块限制
- 优先从 messages 移除，再从 system 尾部移除（保护注入的 prompt）
- 改用前缀匹配检测 Claude Code 系统提示词，支持多种变体：
  - 标准版、Agent SDK 版、Explore Agent 版、Compact 版

											
										
										
											2026-01-07 10:17:09 +08:00
+								func countCacheControlBlocks(data map[string]any) int {
 									count := 0
 									// 统计 system 中的块
 									if system, ok := data["system"].([]any); ok {
 										for _, item := range system {
 											if m, ok := item.(map[string]any); ok {
-												feat(gateway): 优化 Antigravity/Gemini 思考块处理

此提交解决了思考块 (thinking blocks) 在转发过程中的兼容性问题。

主要变更：

1. **思考块优化 (Thinking Blocks)**：
   - 在 AntigravityGatewayService 中增加了 sanitizeThinkingBlocks 处理，强制移除思考块中不支持的 cache_control 字段（避免 Anthropic/Vertex AI 报错）
   - 实现历史思考块展平 (Flattening)：将非最后一条消息中的思考块转换为普通文本块，以绕过上游对历史思考块签名的严格校验
   - 增加 cleanCacheControlFromGeminiJSON 作为最后一道防线，确保转换后的 Gemini 请求中不残留非法的 cache_control

2. **GatewayService 缓存控制优化**：
   - 更新缓存控制逻辑，跳过 thinking 块（thinking 块不支持 cache_control 字段）
   - 增加 removeCacheControlFromThinkingBlocks 函数强制清理

关联 Issue: #225

											
										
										
											2026-01-10 04:56:11 +00:00
+												// thinking 块不支持 cache_control，跳过
 												if blockType, _ := m["type"].(string); blockType == "thinking" {
 													continue
 												}
-												fix(gateway): 修复 cache_control 块超限问题并优化 Claude Code 检测

问题：
- OAuth/SetupToken 账号注入 system prompt 后可能导致 cache_control
  块超过 Anthropic API 的 4 个限制
- Claude Code 检测使用精确匹配，无法识别 Agent SDK 等变体

修复：
- 新增 enforceCacheControlLimit 函数，强制执行 4 个块限制
- 优先从 messages 移除，再从 system 尾部移除（保护注入的 prompt）
- 改用前缀匹配检测 Claude Code 系统提示词，支持多种变体：
  - 标准版、Agent SDK 版、Explore Agent 版、Compact 版

											
										
										
											2026-01-07 10:17:09 +08:00
+												if _, has := m["cache_control"]; has {
 													count++
 												}
 											}
 										}
 									}
 									// 统计 messages 中的块
 									if messages, ok := data["messages"].([]any); ok {
 										for _, msg := range messages {
 											if msgMap, ok := msg.(map[string]any); ok {
 												if content, ok := msgMap["content"].([]any); ok {
 													for _, item := range content {
 														if m, ok := item.(map[string]any); ok {
-												feat(gateway): 优化 Antigravity/Gemini 思考块处理

此提交解决了思考块 (thinking blocks) 在转发过程中的兼容性问题。

主要变更：

1. **思考块优化 (Thinking Blocks)**：
   - 在 AntigravityGatewayService 中增加了 sanitizeThinkingBlocks 处理，强制移除思考块中不支持的 cache_control 字段（避免 Anthropic/Vertex AI 报错）
   - 实现历史思考块展平 (Flattening)：将非最后一条消息中的思考块转换为普通文本块，以绕过上游对历史思考块签名的严格校验
   - 增加 cleanCacheControlFromGeminiJSON 作为最后一道防线，确保转换后的 Gemini 请求中不残留非法的 cache_control

2. **GatewayService 缓存控制优化**：
   - 更新缓存控制逻辑，跳过 thinking 块（thinking 块不支持 cache_control 字段）
   - 增加 removeCacheControlFromThinkingBlocks 函数强制清理

关联 Issue: #225

											
										
										
											2026-01-10 04:56:11 +00:00
+															// thinking 块不支持 cache_control，跳过
 															if blockType, _ := m["type"].(string); blockType == "thinking" {
 																continue
 															}
-												fix(gateway): 修复 cache_control 块超限问题并优化 Claude Code 检测

问题：
- OAuth/SetupToken 账号注入 system prompt 后可能导致 cache_control
  块超过 Anthropic API 的 4 个限制
- Claude Code 检测使用精确匹配，无法识别 Agent SDK 等变体

修复：
- 新增 enforceCacheControlLimit 函数，强制执行 4 个块限制
- 优先从 messages 移除，再从 system 尾部移除（保护注入的 prompt）
- 改用前缀匹配检测 Claude Code 系统提示词，支持多种变体：
  - 标准版、Agent SDK 版、Explore Agent 版、Compact 版

											
										
										
											2026-01-07 10:17:09 +08:00
+															if _, has := m["cache_control"]; has {
 																count++
 															}
 														}
 													}
 												}
 											}
 										}
 									}
 									return count
 								}
 								// removeCacheControlFromMessages 从 messages 中移除一个 cache_control（从头开始）
 								// 返回 true 表示成功移除，false 表示没有可移除的
-												feat(gateway): 优化 Antigravity/Gemini 思考块处理

此提交解决了思考块 (thinking blocks) 在转发过程中的兼容性问题。

主要变更：

1. **思考块优化 (Thinking Blocks)**：
   - 在 AntigravityGatewayService 中增加了 sanitizeThinkingBlocks 处理，强制移除思考块中不支持的 cache_control 字段（避免 Anthropic/Vertex AI 报错）
   - 实现历史思考块展平 (Flattening)：将非最后一条消息中的思考块转换为普通文本块，以绕过上游对历史思考块签名的严格校验
   - 增加 cleanCacheControlFromGeminiJSON 作为最后一道防线，确保转换后的 Gemini 请求中不残留非法的 cache_control

2. **GatewayService 缓存控制优化**：
   - 更新缓存控制逻辑，跳过 thinking 块（thinking 块不支持 cache_control 字段）
   - 增加 removeCacheControlFromThinkingBlocks 函数强制清理

关联 Issue: #225

											
										
										
											2026-01-10 04:56:11 +00:00
+								// 注意：跳过 thinking 块（它不支持 cache_control）
-												fix(gateway): 修复 cache_control 块超限问题并优化 Claude Code 检测

问题：
- OAuth/SetupToken 账号注入 system prompt 后可能导致 cache_control
  块超过 Anthropic API 的 4 个限制
- Claude Code 检测使用精确匹配，无法识别 Agent SDK 等变体

修复：
- 新增 enforceCacheControlLimit 函数，强制执行 4 个块限制
- 优先从 messages 移除，再从 system 尾部移除（保护注入的 prompt）
- 改用前缀匹配检测 Claude Code 系统提示词，支持多种变体：
  - 标准版、Agent SDK 版、Explore Agent 版、Compact 版

											
										
										
											2026-01-07 10:17:09 +08:00
+								func removeCacheControlFromMessages(data map[string]any) bool {
 									messages, ok := data["messages"].([]any)
 									if !ok {
 										return false
 									}
 									for _, msg := range messages {
 										msgMap, ok := msg.(map[string]any)
 										if !ok {
 											continue
 										}
 										content, ok := msgMap["content"].([]any)
 										if !ok {
 											continue
 										}
 										for _, item := range content {
 											if m, ok := item.(map[string]any); ok {
-												feat(gateway): 优化 Antigravity/Gemini 思考块处理

此提交解决了思考块 (thinking blocks) 在转发过程中的兼容性问题。

主要变更：

1. **思考块优化 (Thinking Blocks)**：
   - 在 AntigravityGatewayService 中增加了 sanitizeThinkingBlocks 处理，强制移除思考块中不支持的 cache_control 字段（避免 Anthropic/Vertex AI 报错）
   - 实现历史思考块展平 (Flattening)：将非最后一条消息中的思考块转换为普通文本块，以绕过上游对历史思考块签名的严格校验
   - 增加 cleanCacheControlFromGeminiJSON 作为最后一道防线，确保转换后的 Gemini 请求中不残留非法的 cache_control

2. **GatewayService 缓存控制优化**：
   - 更新缓存控制逻辑，跳过 thinking 块（thinking 块不支持 cache_control 字段）
   - 增加 removeCacheControlFromThinkingBlocks 函数强制清理

关联 Issue: #225

											
										
										
											2026-01-10 04:56:11 +00:00
+												// thinking 块不支持 cache_control，跳过
 												if blockType, _ := m["type"].(string); blockType == "thinking" {
 													continue
 												}
-												fix(gateway): 修复 cache_control 块超限问题并优化 Claude Code 检测

问题：
- OAuth/SetupToken 账号注入 system prompt 后可能导致 cache_control
  块超过 Anthropic API 的 4 个限制
- Claude Code 检测使用精确匹配，无法识别 Agent SDK 等变体

修复：
- 新增 enforceCacheControlLimit 函数，强制执行 4 个块限制
- 优先从 messages 移除，再从 system 尾部移除（保护注入的 prompt）
- 改用前缀匹配检测 Claude Code 系统提示词，支持多种变体：
  - 标准版、Agent SDK 版、Explore Agent 版、Compact 版

											
										
										
											2026-01-07 10:17:09 +08:00
+												if _, has := m["cache_control"]; has {
 													delete(m, "cache_control")
 													return true
 												}
 											}
 										}
 									}
 									return false
 								}
 								// removeCacheControlFromSystem 从 system 中移除一个 cache_control（从尾部开始，保护注入的 prompt）
 								// 返回 true 表示成功移除，false 表示没有可移除的
-												feat(gateway): 优化 Antigravity/Gemini 思考块处理

此提交解决了思考块 (thinking blocks) 在转发过程中的兼容性问题。

主要变更：

1. **思考块优化 (Thinking Blocks)**：
   - 在 AntigravityGatewayService 中增加了 sanitizeThinkingBlocks 处理，强制移除思考块中不支持的 cache_control 字段（避免 Anthropic/Vertex AI 报错）
   - 实现历史思考块展平 (Flattening)：将非最后一条消息中的思考块转换为普通文本块，以绕过上游对历史思考块签名的严格校验
   - 增加 cleanCacheControlFromGeminiJSON 作为最后一道防线，确保转换后的 Gemini 请求中不残留非法的 cache_control

2. **GatewayService 缓存控制优化**：
   - 更新缓存控制逻辑，跳过 thinking 块（thinking 块不支持 cache_control 字段）
   - 增加 removeCacheControlFromThinkingBlocks 函数强制清理

关联 Issue: #225

											
										
										
											2026-01-10 04:56:11 +00:00
+								// 注意：跳过 thinking 块（它不支持 cache_control）
-												fix(gateway): 修复 cache_control 块超限问题并优化 Claude Code 检测

问题：
- OAuth/SetupToken 账号注入 system prompt 后可能导致 cache_control
  块超过 Anthropic API 的 4 个限制
- Claude Code 检测使用精确匹配，无法识别 Agent SDK 等变体

修复：
- 新增 enforceCacheControlLimit 函数，强制执行 4 个块限制
- 优先从 messages 移除，再从 system 尾部移除（保护注入的 prompt）
- 改用前缀匹配检测 Claude Code 系统提示词，支持多种变体：
  - 标准版、Agent SDK 版、Explore Agent 版、Compact 版

											
										
										
											2026-01-07 10:17:09 +08:00
+								func removeCacheControlFromSystem(data map[string]any) bool {
 									system, ok := data["system"].([]any)
 									if !ok {
 										return false
 									}
 									// 从尾部开始移除，保护开头注入的 Claude Code prompt
 									for i := len(system) - 1; i >= 0; i-- {
 										if m, ok := system[i].(map[string]any); ok {
-												feat(gateway): 优化 Antigravity/Gemini 思考块处理

此提交解决了思考块 (thinking blocks) 在转发过程中的兼容性问题。

主要变更：

1. **思考块优化 (Thinking Blocks)**：
   - 在 AntigravityGatewayService 中增加了 sanitizeThinkingBlocks 处理，强制移除思考块中不支持的 cache_control 字段（避免 Anthropic/Vertex AI 报错）
   - 实现历史思考块展平 (Flattening)：将非最后一条消息中的思考块转换为普通文本块，以绕过上游对历史思考块签名的严格校验
   - 增加 cleanCacheControlFromGeminiJSON 作为最后一道防线，确保转换后的 Gemini 请求中不残留非法的 cache_control

2. **GatewayService 缓存控制优化**：
   - 更新缓存控制逻辑，跳过 thinking 块（thinking 块不支持 cache_control 字段）
   - 增加 removeCacheControlFromThinkingBlocks 函数强制清理

关联 Issue: #225

											
										
										
											2026-01-10 04:56:11 +00:00
+											// thinking 块不支持 cache_control，跳过
 											if blockType, _ := m["type"].(string); blockType == "thinking" {
 												continue
 											}
-												fix(gateway): 修复 cache_control 块超限问题并优化 Claude Code 检测

问题：
- OAuth/SetupToken 账号注入 system prompt 后可能导致 cache_control
  块超过 Anthropic API 的 4 个限制
- Claude Code 检测使用精确匹配，无法识别 Agent SDK 等变体

修复：
- 新增 enforceCacheControlLimit 函数，强制执行 4 个块限制
- 优先从 messages 移除，再从 system 尾部移除（保护注入的 prompt）
- 改用前缀匹配检测 Claude Code 系统提示词，支持多种变体：
  - 标准版、Agent SDK 版、Explore Agent 版、Compact 版

											
										
										
											2026-01-07 10:17:09 +08:00
+											if _, has := m["cache_control"]; has {
 												delete(m, "cache_control")
 												return true
 											}
 										}
 									}
 									return false
 								}
-												feat(gateway): 优化 Antigravity/Gemini 思考块处理

此提交解决了思考块 (thinking blocks) 在转发过程中的兼容性问题。

主要变更：

1. **思考块优化 (Thinking Blocks)**：
   - 在 AntigravityGatewayService 中增加了 sanitizeThinkingBlocks 处理，强制移除思考块中不支持的 cache_control 字段（避免 Anthropic/Vertex AI 报错）
   - 实现历史思考块展平 (Flattening)：将非最后一条消息中的思考块转换为普通文本块，以绕过上游对历史思考块签名的严格校验
   - 增加 cleanCacheControlFromGeminiJSON 作为最后一道防线，确保转换后的 Gemini 请求中不残留非法的 cache_control

2. **GatewayService 缓存控制优化**：
   - 更新缓存控制逻辑，跳过 thinking 块（thinking 块不支持 cache_control 字段）
   - 增加 removeCacheControlFromThinkingBlocks 函数强制清理

关联 Issue: #225

											
										
										
											2026-01-10 04:56:11 +00:00
+								// removeCacheControlFromThinkingBlocks 强制清理所有 thinking 块中的非法 cache_control
 								// thinking 块不支持 cache_control 字段，这个函数确保所有 thinking 块都不含该字段
 								func removeCacheControlFromThinkingBlocks(data map[string]any) {
 									// 清理 system 中的 thinking 块
 									if system, ok := data["system"].([]any); ok {
 										for _, item := range system {
 											if m, ok := item.(map[string]any); ok {
 												if blockType, _ := m["type"].(string); blockType == "thinking" {
 													if _, has := m["cache_control"]; has {
 														delete(m, "cache_control")
 														log.Printf("[Warning] Removed illegal cache_control from thinking block in system")
 													}
 												}
 											}
 										}
 									}
 									// 清理 messages 中的 thinking 块
 									if messages, ok := data["messages"].([]any); ok {
 										for msgIdx, msg := range messages {
 											if msgMap, ok := msg.(map[string]any); ok {
 												if content, ok := msgMap["content"].([]any); ok {
 													for contentIdx, item := range content {
 														if m, ok := item.(map[string]any); ok {
 															if blockType, _ := m["type"].(string); blockType == "thinking" {
 																if _, has := m["cache_control"]; has {
 																	delete(m, "cache_control")
 																	log.Printf("[Warning] Removed illegal cache_control from thinking block in messages[%d].content[%d]", msgIdx, contentIdx)
 																}
 															}
 														}
 													}
 												}
 											}
 										}
 									}
 								}
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+								// Forward 转发请求到Claude API
-												perf(后端): 完成性能优化与连接池配置

新增 DB/Redis 连接池配置与校验，并补充单测

网关请求体大小限制与 413 处理

HTTP/req 客户端池化并调整上游连接池默认值

并发槽位改为 ZSET+Lua 与指数退避

用量统计改 SQL 聚合并新增索引迁移

计费缓存写入改工作池并补测试/基准

测试: 在 backend/ 下运行 go test ./...

											
										
										
											2025-12-31 08:50:12 +08:00
+								func (s *GatewayService) Forward(ctx context.Context, c *gin.Context, account *Account, parsed *ParsedRequest) (*ForwardResult, error) {
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									startTime := time.Now()
-												perf(后端): 完成性能优化与连接池配置

新增 DB/Redis 连接池配置与校验，并补充单测

网关请求体大小限制与 413 处理

HTTP/req 客户端池化并调整上游连接池默认值

并发槽位改为 ZSET+Lua 与指数退避

用量统计改 SQL 聚合并新增索引迁移

计费缓存写入改工作池并补测试/基准

测试: 在 backend/ 下运行 go test ./...

											
										
										
											2025-12-31 08:50:12 +08:00
+									if parsed == nil {
 										return nil, fmt.Errorf("parse request: empty request")
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									}
-												perf(后端): 完成性能优化与连接池配置

新增 DB/Redis 连接池配置与校验，并补充单测

网关请求体大小限制与 413 处理

HTTP/req 客户端池化并调整上游连接池默认值

并发槽位改为 ZSET+Lua 与指数退避

用量统计改 SQL 聚合并新增索引迁移

计费缓存写入改工作池并补测试/基准

测试: 在 backend/ 下运行 go test ./...

											
										
										
											2025-12-31 08:50:12 +08:00
+									body := parsed.Body
 									reqModel := parsed.Model
 									reqStream := parsed.Stream
-												fix(网关): 对齐 Claude OAuth 请求适配

											
										
										
											2026-01-15 18:54:42 +08:00
+									originalModel := reqModel
 									var toolNameMap map[string]string
-												perf(后端): 完成性能优化与连接池配置

新增 DB/Redis 连接池配置与校验，并补充单测

网关请求体大小限制与 413 处理

HTTP/req 客户端池化并调整上游连接池默认值

并发槽位改为 ZSET+Lua 与指数退避

用量统计改 SQL 聚合并新增索引迁移

计费缓存写入改工作池并补测试/基准

测试: 在 backend/ 下运行 go test ./...

											
										
										
											2025-12-31 08:50:12 +08:00
-												fix(网关): 区分 Claude Code OAuth 适配

											
										
										
											2026-01-15 19:17:07 +08:00
+									isClaudeCode := isClaudeCodeRequest(ctx, c, parsed)
 									shouldMimicClaudeCode := account.IsOAuth() && !isClaudeCode
 									if shouldMimicClaudeCode {
-												fix(网关): 对齐 Claude OAuth 请求适配

											
										
										
											2026-01-15 18:54:42 +08:00
+										// 智能注入 Claude Code 系统提示词（仅 OAuth/SetupToken 账号需要）
 										// 条件：1) OAuth/SetupToken 账号  2) 不是 Claude Code 客户端  3) 不是 Haiku 模型  4) system 中还没有 Claude Code 提示词
-												fix(网关): 区分 Claude Code OAuth 适配

											
										
										
											2026-01-15 19:17:07 +08:00
+										if !strings.Contains(strings.ToLower(reqModel), "haiku") &&
-												fix(网关): 对齐 Claude OAuth 请求适配

											
										
										
											2026-01-15 18:54:42 +08:00
+											!systemIncludesClaudeCodePrompt(parsed.System) {
 											body = injectClaudeCodePrompt(body, parsed.System)
 										}
 										normalizeOpts := claudeOAuthNormalizeOptions{stripSystemCacheControl: true}
 										if s.identityService != nil {
 											fp, err := s.identityService.GetOrCreateFingerprint(ctx, account.ID, c.Request.Header)
 											if err == nil && fp != nil {
 												if metadataUserID := s.buildOAuthMetadataUserID(parsed, account, fp); metadataUserID != "" {
 													normalizeOpts.injectMetadata = true
 													normalizeOpts.metadataUserID = metadataUserID
 												}
 											}
 										}
-												perf(后端): 完成性能优化与连接池配置

新增 DB/Redis 连接池配置与校验，并补充单测

网关请求体大小限制与 413 处理

HTTP/req 客户端池化并调整上游连接池默认值

并发槽位改为 ZSET+Lua 与指数退避

用量统计改 SQL 聚合并新增索引迁移

计费缓存写入改工作池并补测试/基准

测试: 在 backend/ 下运行 go test ./...

											
										
										
											2025-12-31 08:50:12 +08:00
-												fix(网关): 对齐 Claude OAuth 请求适配

											
										
										
											2026-01-15 18:54:42 +08:00
+										body, reqModel, toolNameMap = normalizeClaudeOAuthRequestBody(body, reqModel, normalizeOpts)
-												CC 400 返回具体错误信息 && 非 CC 请求时增加 system prompt (#26)

* feat: http 400 返回具体错误

* 更新 workflows

* 优化打包/docker 构建流程

* 400 是返回 原始错误 - json 格式

* feat: 非 cc请求时补充 system

* go mod tidy
											
										
										
											2025-12-25 14:47:19 +08:00
+									}
-												fix(gateway): 修复 cache_control 块超限问题并优化 Claude Code 检测

问题：
- OAuth/SetupToken 账号注入 system prompt 后可能导致 cache_control
  块超过 Anthropic API 的 4 个限制
- Claude Code 检测使用精确匹配，无法识别 Agent SDK 等变体

修复：
- 新增 enforceCacheControlLimit 函数，强制执行 4 个块限制
- 优先从 messages 移除，再从 system 尾部移除（保护注入的 prompt）
- 改用前缀匹配检测 Claude Code 系统提示词，支持多种变体：
  - 标准版、Agent SDK 版、Explore Agent 版、Compact 版

											
										
										
											2026-01-07 10:17:09 +08:00
+									// 强制执行 cache_control 块数量限制（最多 4 个）
 									body = enforceCacheControlLimit(body)
-												Add invalid-request fallback routing

											
										
										
											2026-01-23 22:24:46 +08:00
+									// 应用模型映射（APIKey 明确映射优先，其次使用 Anthropic 前缀映射）
 									mappedModel := reqModel
 									mappingSource := ""
-												fix(lint): 修复所有 Go 命名规范问题

- 全局替换 ApiKey → APIKey（类型、字段、方法、变量）
- 修复所有 initialism 命名（API, SMTP, HTML, URL 等）
- 添加所有缺失的包注释
- 修复导出符号的注释格式

主要修改：
- ApiKey → APIKey（所有出现的地方）
- ApiKeyID → APIKeyID
- ApiKeyIDs → APIKeyIDs
- TestSmtpConnection → TestSMTPConnection
- HtmlURL → HTMLURL
- 添加 20+ 个包注释
- 修复 10+ 个导出符号注释格式

验证结果：
- ✓ golangci-lint: 0 issues
- ✓ 单元测试: 通过
- ✓ 集成测试: 通过

											
										
										
											2026-01-04 19:27:53 +08:00
+									if account.Type == AccountTypeAPIKey {
-												Add invalid-request fallback routing

											
										
										
											2026-01-23 22:24:46 +08:00
+										mappedModel = account.GetMappedModel(reqModel)
-												perf(后端): 完成性能优化与连接池配置

新增 DB/Redis 连接池配置与校验，并补充单测

网关请求体大小限制与 413 处理

HTTP/req 客户端池化并调整上游连接池默认值

并发槽位改为 ZSET+Lua 与指数退避

用量统计改 SQL 聚合并新增索引迁移

计费缓存写入改工作池并补测试/基准

测试: 在 backend/ 下运行 go test ./...

											
										
										
											2025-12-31 08:50:12 +08:00
+										if mappedModel != reqModel {
-												Add invalid-request fallback routing

											
										
										
											2026-01-23 22:24:46 +08:00
+											mappingSource = "account"
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+										}
 									}
-												Add invalid-request fallback routing

											
										
										
											2026-01-23 22:24:46 +08:00
+									if mappingSource == "" && account.Platform == PlatformAnthropic {
 										normalized := normalizeClaudeModelForAnthropic(reqModel)
 										if normalized != reqModel {
 											mappedModel = normalized
 											mappingSource = "prefix"
 										}
 									}
 									if mappedModel != reqModel {
 										// 替换请求体中的模型名
 										body = s.replaceModelInBody(body, mappedModel)
 										reqModel = mappedModel
 										log.Printf("Model mapping applied: %s -> %s (account: %s, source=%s)", originalModel, mappedModel, account.Name, mappingSource)
 									}
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
 									// 获取凭证
 									token, tokenType, err := s.GetAccessToken(ctx, account)
 									if err != nil {
 										return nil, err
 									}
-												refactor(backend): service http ports

											
										
										
											2025-12-20 11:56:11 +08:00
+									// 获取代理URL
 									proxyURL := ""
 									if account.ProxyID != nil && account.Proxy != nil {
 										proxyURL = account.Proxy.URL()
-												fix: 修复并发请求时共享httpClient.Transport导致的竞态条件

问题描述：
当多个请求并发执行且使用不同代理配置时，它们会同时修改共享的
s.httpClient.Transport，导致请求可能使用错误的代理（数据泄露风险）
或意外失败。

修复方案：
为需要代理的请求创建独立的http.Client，而不是修改共享的httpClient.Transport。

改动内容：
- 新增 buildUpstreamRequestResult 结构体，返回请求和可选的独立client
- 修改 buildUpstreamRequest 方法，配置代理时创建独立client
- 更新 Forward 方法，根据是否有代理选择合适的client

											
										
										
											2025-12-18 18:14:20 +08:00
+									}
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+									// 调试日志：记录即将转发的账号信息
 									log.Printf("[Forward] Using account: ID=%d Name=%s Platform=%s Type=%s TLSFingerprint=%v Proxy=%s",
 										account.ID, account.Name, account.Platform, account.Type, account.IsTLSFingerprintEnabled(), proxyURL)
-												feat(gateway): 添加上游错误重试机制

- OAuth/Setup Token 账号遇到 403 错误时，等待 2 秒后重试，最多 3 次
- Console 账号遇到未配置的错误码时，同样进行重试
- 重试耗尽后：OAuth 403 标记账号异常，Console 未配置错误码不标记账号
- 移除 handleErrorResponse 中已被重试逻辑覆盖的死代码

											
										
										
											2025-12-24 16:55:46 +08:00
+									// 重试循环
 									var resp *http.Response
-												fix(frontend): comprehensive i18n cleanup and Select component hardening

											
										
										
											2026-01-04 21:09:14 +08:00
+									retryStart := time.Now()
 									for attempt := 1; attempt <= maxRetryAttempts; attempt++ {
-												feat(gateway): 添加上游错误重试机制

- OAuth/Setup Token 账号遇到 403 错误时，等待 2 秒后重试，最多 3 次
- Console 账号遇到未配置的错误码时，同样进行重试
- 重试耗尽后：OAuth 403 标记账号异常，Console 未配置错误码不标记账号
- 移除 handleErrorResponse 中已被重试逻辑覆盖的死代码

											
										
										
											2025-12-24 16:55:46 +08:00
+										// 构建上游请求（每次重试需要重新构建，因为请求体需要重新读取）
-												feat: merge dev

											
										
										
											2026-01-15 15:14:44 +08:00
+										// Capture upstream request body for ops retry of this attempt.
 										c.Set(OpsUpstreamRequestBodyKey, string(body))
-												fix(网关): 区分 Claude Code OAuth 适配

											
										
										
											2026-01-15 19:17:07 +08:00
+										upstreamReq, err := s.buildUpstreamRequest(ctx, c, account, body, token, tokenType, reqModel, reqStream, shouldMimicClaudeCode)
-												feat(gateway): 添加上游错误重试机制

- OAuth/Setup Token 账号遇到 403 错误时，等待 2 秒后重试，最多 3 次
- Console 账号遇到未配置的错误码时，同样进行重试
- 重试耗尽后：OAuth 403 标记账号异常，Console 未配置错误码不标记账号
- 移除 handleErrorResponse 中已被重试逻辑覆盖的死代码

											
										
										
											2025-12-24 16:55:46 +08:00
+										if err != nil {
 											return nil, err
 										}
 										// 发送请求
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+										resp, err = s.httpUpstream.DoWithTLS(upstreamReq, proxyURL, account.ID, account.Concurrency, account.IsTLSFingerprintEnabled())
-												feat(gateway): 添加上游错误重试机制

- OAuth/Setup Token 账号遇到 403 错误时，等待 2 秒后重试，最多 3 次
- Console 账号遇到未配置的错误码时，同样进行重试
- 重试耗尽后：OAuth 403 标记账号异常，Console 未配置错误码不标记账号
- 移除 handleErrorResponse 中已被重试逻辑覆盖的死代码

											
										
										
											2025-12-24 16:55:46 +08:00
+										if err != nil {
-												fix(frontend): comprehensive i18n cleanup and Select component hardening

											
										
										
											2026-01-04 21:09:14 +08:00
+											if resp != nil && resp.Body != nil {
 												_ = resp.Body.Close()
 											}
-												feat(ops): 添加QPS脉搏线图并优化指标布局

- 添加实时QPS/TPS历史数据追踪（最近60个数据点）
- 在平均QPS/TPS上方添加SVG脉搏线图（sparkline）
- 将延迟和TTFT卡片的指标布局从2列改为3列
- 恢复Max指标显示（P95/P90/P50/Avg/Max）

											
										
										
											2026-01-11 11:49:34 +08:00
+											// Ensure the client receives an error response (handlers assume Forward writes on non-failover errors).
 											safeErr := sanitizeUpstreamErrorMessage(err.Error())
 											setOpsUpstreamError(c, 0, safeErr, "")
-												feat(ops): 实现上游错误事件记录与查询功能

**新增功能**:
- 新建ops_upstream_error_events表存储上游服务错误详情
- 支持记录上游429/529/5xx错误的详细上下文信息
- 提供按时间范围查询上游错误事件的API

**后端改动**:
1. 模型层（ops_models.go, ops_port.go）:
   - 新增UpstreamErrorEvent结构体
   - 扩展Repository接口支持上游错误事件CRUD

2. 仓储层（ops_repo.go）:
   - 实现InsertUpstreamErrorEvent写入上游错误
   - 实现GetUpstreamErrorEvents按时间范围查询

3. 服务层（ops_service.go, ops_upstream_context.go）:
   - ops_service: 新增GetUpstreamErrorEvents查询方法
   - ops_upstream_context: 封装上游错误上下文构建逻辑

4. Handler层（ops_error_logger.go）:
   - 新增GetUpstreamErrorsHandler处理上游错误查询请求

5. Gateway层集成:
   - antigravity_gateway_service.go: 429/529错误时记录上游事件
   - gateway_service.go: OpenAI 429/5xx错误时记录
   - gemini_messages_compat_service.go: Gemini 429/5xx错误时记录
   - openai_gateway_service.go: OpenAI 429/5xx错误时记录
   - ratelimit_service.go: 429限流错误时记录

**数据记录字段**:
- request_id: 关联ops_logs主记录
- platform/model: 上游服务标识
- status_code/error_message: 错误详情
- request_headers/response_body: 调试信息（可选）
- created_at: 错误发生时间

											
										
										
											2026-01-11 15:30:27 +08:00
+											appendOpsUpstreamError(c, OpsUpstreamErrorEvent{
 												Platform:           account.Platform,
 												AccountID:          account.ID,
-												feat: merge dev

											
										
										
											2026-01-15 15:14:44 +08:00
+												AccountName:        account.Name,
-												feat(ops): 实现上游错误事件记录与查询功能

**新增功能**:
- 新建ops_upstream_error_events表存储上游服务错误详情
- 支持记录上游429/529/5xx错误的详细上下文信息
- 提供按时间范围查询上游错误事件的API

**后端改动**:
1. 模型层（ops_models.go, ops_port.go）:
   - 新增UpstreamErrorEvent结构体
   - 扩展Repository接口支持上游错误事件CRUD

2. 仓储层（ops_repo.go）:
   - 实现InsertUpstreamErrorEvent写入上游错误
   - 实现GetUpstreamErrorEvents按时间范围查询

3. 服务层（ops_service.go, ops_upstream_context.go）:
   - ops_service: 新增GetUpstreamErrorEvents查询方法
   - ops_upstream_context: 封装上游错误上下文构建逻辑

4. Handler层（ops_error_logger.go）:
   - 新增GetUpstreamErrorsHandler处理上游错误查询请求

5. Gateway层集成:
   - antigravity_gateway_service.go: 429/529错误时记录上游事件
   - gateway_service.go: OpenAI 429/5xx错误时记录
   - gemini_messages_compat_service.go: Gemini 429/5xx错误时记录
   - openai_gateway_service.go: OpenAI 429/5xx错误时记录
   - ratelimit_service.go: 429限流错误时记录

**数据记录字段**:
- request_id: 关联ops_logs主记录
- platform/model: 上游服务标识
- status_code/error_message: 错误详情
- request_headers/response_body: 调试信息（可选）
- created_at: 错误发生时间

											
										
										
											2026-01-11 15:30:27 +08:00
+												UpstreamStatusCode: 0,
 												Kind:               "request_error",
 												Message:            safeErr,
 											})
-												feat(ops): 添加QPS脉搏线图并优化指标布局

- 添加实时QPS/TPS历史数据追踪（最近60个数据点）
- 在平均QPS/TPS上方添加SVG脉搏线图（sparkline）
- 将延迟和TTFT卡片的指标布局从2列改为3列
- 恢复Max指标显示（P95/P90/P50/Avg/Max）

											
										
										
											2026-01-11 11:49:34 +08:00
+											c.JSON(http.StatusBadGateway, gin.H{
 												"type": "error",
 												"error": gin.H{
 													"type":    "upstream_error",
 													"message": "Upstream request failed",
 												},
 											})
 											return nil, fmt.Errorf("upstream request failed: %s", safeErr)
-												feat(gateway): 添加上游错误重试机制

- OAuth/Setup Token 账号遇到 403 错误时，等待 2 秒后重试，最多 3 次
- Console 账号遇到未配置的错误码时，同样进行重试
- 重试耗尽后：OAuth 403 标记账号异常，Console 未配置错误码不标记账号
- 移除 handleErrorResponse 中已被重试逻辑覆盖的死代码

											
										
										
											2025-12-24 16:55:46 +08:00
+										}
-												perf(gateway): 优化负载感知调度

主要改进：
- 优化负载感知调度的准确性和响应速度
- 将 AccountUsageService 的包级缓存改为依赖注入
- 修复 SSE/JSON 转义和 nil 安全问题
- 恢复 Google One 功能兼容性

											
										
										
											2026-01-03 06:32:51 -08:00
+										// 优先检测thinking block签名错误（400）并重试一次
 										if resp.StatusCode == 400 {
 											respBody, readErr := io.ReadAll(io.LimitReader(resp.Body, 2<<20))
 											if readErr == nil {
 												_ = resp.Body.Close()
 												if s.isThinkingBlockSignatureError(respBody) {
-												feat(ops): 实现上游错误事件记录与查询功能

**新增功能**:
- 新建ops_upstream_error_events表存储上游服务错误详情
- 支持记录上游429/529/5xx错误的详细上下文信息
- 提供按时间范围查询上游错误事件的API

**后端改动**:
1. 模型层（ops_models.go, ops_port.go）:
   - 新增UpstreamErrorEvent结构体
   - 扩展Repository接口支持上游错误事件CRUD

2. 仓储层（ops_repo.go）:
   - 实现InsertUpstreamErrorEvent写入上游错误
   - 实现GetUpstreamErrorEvents按时间范围查询

3. 服务层（ops_service.go, ops_upstream_context.go）:
   - ops_service: 新增GetUpstreamErrorEvents查询方法
   - ops_upstream_context: 封装上游错误上下文构建逻辑

4. Handler层（ops_error_logger.go）:
   - 新增GetUpstreamErrorsHandler处理上游错误查询请求

5. Gateway层集成:
   - antigravity_gateway_service.go: 429/529错误时记录上游事件
   - gateway_service.go: OpenAI 429/5xx错误时记录
   - gemini_messages_compat_service.go: Gemini 429/5xx错误时记录
   - openai_gateway_service.go: OpenAI 429/5xx错误时记录
   - ratelimit_service.go: 429限流错误时记录

**数据记录字段**:
- request_id: 关联ops_logs主记录
- platform/model: 上游服务标识
- status_code/error_message: 错误详情
- request_headers/response_body: 调试信息（可选）
- created_at: 错误发生时间

											
										
										
											2026-01-11 15:30:27 +08:00
+													appendOpsUpstreamError(c, OpsUpstreamErrorEvent{
 														Platform:           account.Platform,
 														AccountID:          account.ID,
-												feat: merge dev

											
										
										
											2026-01-15 15:14:44 +08:00
+														AccountName:        account.Name,
-												feat(ops): 实现上游错误事件记录与查询功能

**新增功能**:
- 新建ops_upstream_error_events表存储上游服务错误详情
- 支持记录上游429/529/5xx错误的详细上下文信息
- 提供按时间范围查询上游错误事件的API

**后端改动**:
1. 模型层（ops_models.go, ops_port.go）:
   - 新增UpstreamErrorEvent结构体
   - 扩展Repository接口支持上游错误事件CRUD

2. 仓储层（ops_repo.go）:
   - 实现InsertUpstreamErrorEvent写入上游错误
   - 实现GetUpstreamErrorEvents按时间范围查询

3. 服务层（ops_service.go, ops_upstream_context.go）:
   - ops_service: 新增GetUpstreamErrorEvents查询方法
   - ops_upstream_context: 封装上游错误上下文构建逻辑

4. Handler层（ops_error_logger.go）:
   - 新增GetUpstreamErrorsHandler处理上游错误查询请求

5. Gateway层集成:
   - antigravity_gateway_service.go: 429/529错误时记录上游事件
   - gateway_service.go: OpenAI 429/5xx错误时记录
   - gemini_messages_compat_service.go: Gemini 429/5xx错误时记录
   - openai_gateway_service.go: OpenAI 429/5xx错误时记录
   - ratelimit_service.go: 429限流错误时记录

**数据记录字段**:
- request_id: 关联ops_logs主记录
- platform/model: 上游服务标识
- status_code/error_message: 错误详情
- request_headers/response_body: 调试信息（可选）
- created_at: 错误发生时间

											
										
										
											2026-01-11 15:30:27 +08:00
+														UpstreamStatusCode: resp.StatusCode,
 														UpstreamRequestID:  resp.Header.Get("x-request-id"),
 														Kind:               "signature_error",
 														Message:            extractUpstreamErrorMessage(respBody),
 														Detail: func() string {
 															if s.cfg != nil && s.cfg.Gateway.LogUpstreamErrorBody {
 																return truncateString(string(respBody), s.cfg.Gateway.LogUpstreamErrorBodyMaxBytes)
 															}
 															return ""
 														}(),
 													})
-												fix(backend): 修复 CI 失败问题

修复内容：
1. 修复 6 个 golangci-lint 错误
   - 3 个 errcheck 错误：在 gateway_request_test.go 中添加类型断言检查
   - 3 个 gofmt 格式化问题：修复代码格式
2. 修复 API 契约测试失败
   - 在测试中添加缺失的字段：enable_identity_patch 和 identity_patch_prompt

所有测试和 linter 检查现已通过。

											
										
										
											2026-01-05 00:56:48 +08:00
+													looksLikeToolSignatureError := func(msg string) bool {
 														m := strings.ToLower(msg)
 														return strings.Contains(m, "tool_use") ||
 															strings.Contains(m, "tool_result") ||
 															strings.Contains(m, "functioncall") ||
 															strings.Contains(m, "function_call") ||
 															strings.Contains(m, "functionresponse") ||
 															strings.Contains(m, "function_response")
 													}
 													// 避免在重试预算已耗尽时再发起额外请求
 													if time.Since(retryStart) >= maxRetryElapsed {
 														resp.Body = io.NopCloser(bytes.NewReader(respBody))
 														break
-												fix(frontend): comprehensive i18n cleanup and Select component hardening

											
										
										
											2026-01-04 21:09:14 +08:00
+													}
-												perf(gateway): 优化负载感知调度

主要改进：
- 优化负载感知调度的准确性和响应速度
- 将 AccountUsageService 的包级缓存改为依赖注入
- 修复 SSE/JSON 转义和 nil 安全问题
- 恢复 Google One 功能兼容性

											
										
										
											2026-01-03 06:32:51 -08:00
+													log.Printf("Account %d: detected thinking block signature error, retrying with filtered thinking blocks", account.ID)
-												fix(backend): 修复 CI 失败问题

修复内容：
1. 修复 6 个 golangci-lint 错误
   - 3 个 errcheck 错误：在 gateway_request_test.go 中添加类型断言检查
   - 3 个 gofmt 格式化问题：修复代码格式
2. 修复 API 契约测试失败
   - 在测试中添加缺失的字段：enable_identity_patch 和 identity_patch_prompt

所有测试和 linter 检查现已通过。

											
										
										
											2026-01-05 00:56:48 +08:00
+													// Conservative two-stage fallback:
 													// 1) Disable thinking + thinking->text (preserve content)
 													// 2) Only if upstream still errors AND error message points to tool/function signature issues:
 													//    also downgrade tool_use/tool_result blocks to text.
-												fix(gateway): 完善 thinking block 重试和 cache nil 检查

- 使用 FilterThinkingBlocksForRetry 替代 FilterThinkingBlocks
- count_tokens 增加 thinking block 签名错误重试
- cache nil 检查防止空指针
- shouldBill 逻辑修复避免重复扣费
- 移除 debug 日志

											
										
										
											2026-01-03 17:10:25 -08:00
+													filteredBody := FilterThinkingBlocksForRetry(body)
-												fix(网关): 区分 Claude Code OAuth 适配

											
										
										
											2026-01-15 19:17:07 +08:00
+													retryReq, buildErr := s.buildUpstreamRequest(ctx, c, account, filteredBody, token, tokenType, reqModel, reqStream, shouldMimicClaudeCode)
-												perf(gateway): 优化负载感知调度

主要改进：
- 优化负载感知调度的准确性和响应速度
- 将 AccountUsageService 的包级缓存改为依赖注入
- 修复 SSE/JSON 转义和 nil 安全问题
- 恢复 Google One 功能兼容性

											
										
										
											2026-01-03 06:32:51 -08:00
+													if buildErr == nil {
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+														retryResp, retryErr := s.httpUpstream.DoWithTLS(retryReq, proxyURL, account.ID, account.Concurrency, account.IsTLSFingerprintEnabled())
-												perf(gateway): 优化负载感知调度

主要改进：
- 优化负载感知调度的准确性和响应速度
- 将 AccountUsageService 的包级缓存改为依赖注入
- 修复 SSE/JSON 转义和 nil 安全问题
- 恢复 Google One 功能兼容性

											
										
										
											2026-01-03 06:32:51 -08:00
+														if retryErr == nil {
-												fix(gateway): 优化 thinking block 重试逻辑

- 保留用户的 thinking.type=enabled 设置（不再禁用）
- 只移除历史消息中的 thinking/redacted_thinking blocks
- 处理过滤后空消息：跳过 assistant 消息，user 消息添加占位符
- 增强错误检测：覆盖 signature、Expected thinking、empty content 错误
- 添加重试成功/失败日志便于排查

											
										
										
											2026-01-03 18:05:15 -08:00
+															if retryResp.StatusCode < 400 {
-												fix(backend): 修复 CI 失败问题

修复内容：
1. 修复 6 个 golangci-lint 错误
   - 3 个 errcheck 错误：在 gateway_request_test.go 中添加类型断言检查
   - 3 个 gofmt 格式化问题：修复代码格式
2. 修复 API 契约测试失败
   - 在测试中添加缺失的字段：enable_identity_patch 和 identity_patch_prompt

所有测试和 linter 检查现已通过。

											
										
										
											2026-01-05 00:56:48 +08:00
+																log.Printf("Account %d: signature error retry succeeded (thinking downgraded)", account.ID)
 																resp = retryResp
 																break
 															}
-												fix(backend): 改进 thinking/tool block 签名处理和重试策略

主要改动：
- request_transformer: thinking block 缺少签名时降级为文本而非丢弃，保留内容并在上层禁用 thinking mode
- antigravity_gateway_service: 新增两阶段降级策略，先处理 thinking blocks，如仍失败且涉及 tool 签名错误则进一步降级 tool blocks
- gateway_request: 新增 FilterSignatureSensitiveBlocksForRetry 函数，支持将 tool_use/tool_result 降级为文本
- gateway_request: 改进 FilterThinkingBlocksForRetry，禁用顶层 thinking 配置以避免结构约束冲突
- gateway_service: 实现保守的两阶段重试逻辑，优先保留内容，仅在必要时降级工具调用
- 新增 antigravity_gateway_service_test.go 测试签名块剥离逻辑
- 更新相关测试用例以验证降级行为

此修复解决了跨平台/账户切换时历史消息签名失效导致的请求失败问题。

											
										
										
											2026-01-04 22:32:36 +08:00
-												fix(backend): 修复 CI 失败问题

修复内容：
1. 修复 6 个 golangci-lint 错误
   - 3 个 errcheck 错误：在 gateway_request_test.go 中添加类型断言检查
   - 3 个 gofmt 格式化问题：修复代码格式
2. 修复 API 契约测试失败
   - 在测试中添加缺失的字段：enable_identity_patch 和 identity_patch_prompt

所有测试和 linter 检查现已通过。

											
										
										
											2026-01-05 00:56:48 +08:00
+															retryRespBody, retryReadErr := io.ReadAll(io.LimitReader(retryResp.Body, 2<<20))
 															_ = retryResp.Body.Close()
 															if retryReadErr == nil && retryResp.StatusCode == 400 && s.isThinkingBlockSignatureError(retryRespBody) {
-												feat(ops): 实现上游错误事件记录与查询功能

**新增功能**:
- 新建ops_upstream_error_events表存储上游服务错误详情
- 支持记录上游429/529/5xx错误的详细上下文信息
- 提供按时间范围查询上游错误事件的API

**后端改动**:
1. 模型层（ops_models.go, ops_port.go）:
   - 新增UpstreamErrorEvent结构体
   - 扩展Repository接口支持上游错误事件CRUD

2. 仓储层（ops_repo.go）:
   - 实现InsertUpstreamErrorEvent写入上游错误
   - 实现GetUpstreamErrorEvents按时间范围查询

3. 服务层（ops_service.go, ops_upstream_context.go）:
   - ops_service: 新增GetUpstreamErrorEvents查询方法
   - ops_upstream_context: 封装上游错误上下文构建逻辑

4. Handler层（ops_error_logger.go）:
   - 新增GetUpstreamErrorsHandler处理上游错误查询请求

5. Gateway层集成:
   - antigravity_gateway_service.go: 429/529错误时记录上游事件
   - gateway_service.go: OpenAI 429/5xx错误时记录
   - gemini_messages_compat_service.go: Gemini 429/5xx错误时记录
   - openai_gateway_service.go: OpenAI 429/5xx错误时记录
   - ratelimit_service.go: 429限流错误时记录

**数据记录字段**:
- request_id: 关联ops_logs主记录
- platform/model: 上游服务标识
- status_code/error_message: 错误详情
- request_headers/response_body: 调试信息（可选）
- created_at: 错误发生时间

											
										
										
											2026-01-11 15:30:27 +08:00
+																appendOpsUpstreamError(c, OpsUpstreamErrorEvent{
 																	Platform:           account.Platform,
 																	AccountID:          account.ID,
-												feat: merge dev

											
										
										
											2026-01-15 15:14:44 +08:00
+																	AccountName:        account.Name,
-												feat(ops): 实现上游错误事件记录与查询功能

**新增功能**:
- 新建ops_upstream_error_events表存储上游服务错误详情
- 支持记录上游429/529/5xx错误的详细上下文信息
- 提供按时间范围查询上游错误事件的API

**后端改动**:
1. 模型层（ops_models.go, ops_port.go）:
   - 新增UpstreamErrorEvent结构体
   - 扩展Repository接口支持上游错误事件CRUD

2. 仓储层（ops_repo.go）:
   - 实现InsertUpstreamErrorEvent写入上游错误
   - 实现GetUpstreamErrorEvents按时间范围查询

3. 服务层（ops_service.go, ops_upstream_context.go）:
   - ops_service: 新增GetUpstreamErrorEvents查询方法
   - ops_upstream_context: 封装上游错误上下文构建逻辑

4. Handler层（ops_error_logger.go）:
   - 新增GetUpstreamErrorsHandler处理上游错误查询请求

5. Gateway层集成:
   - antigravity_gateway_service.go: 429/529错误时记录上游事件
   - gateway_service.go: OpenAI 429/5xx错误时记录
   - gemini_messages_compat_service.go: Gemini 429/5xx错误时记录
   - openai_gateway_service.go: OpenAI 429/5xx错误时记录
   - ratelimit_service.go: 429限流错误时记录

**数据记录字段**:
- request_id: 关联ops_logs主记录
- platform/model: 上游服务标识
- status_code/error_message: 错误详情
- request_headers/response_body: 调试信息（可选）
- created_at: 错误发生时间

											
										
										
											2026-01-11 15:30:27 +08:00
+																	UpstreamStatusCode: retryResp.StatusCode,
 																	UpstreamRequestID:  retryResp.Header.Get("x-request-id"),
 																	Kind:               "signature_retry_thinking",
 																	Message:            extractUpstreamErrorMessage(retryRespBody),
 																	Detail: func() string {
 																		if s.cfg != nil && s.cfg.Gateway.LogUpstreamErrorBody {
 																			return truncateString(string(retryRespBody), s.cfg.Gateway.LogUpstreamErrorBodyMaxBytes)
 																		}
 																		return ""
 																	}(),
 																})
-												fix(backend): 修复 CI 失败问题

修复内容：
1. 修复 6 个 golangci-lint 错误
   - 3 个 errcheck 错误：在 gateway_request_test.go 中添加类型断言检查
   - 3 个 gofmt 格式化问题：修复代码格式
2. 修复 API 契约测试失败
   - 在测试中添加缺失的字段：enable_identity_patch 和 identity_patch_prompt

所有测试和 linter 检查现已通过。

											
										
										
											2026-01-05 00:56:48 +08:00
+																msg2 := extractUpstreamErrorMessage(retryRespBody)
 																if looksLikeToolSignatureError(msg2) && time.Since(retryStart) < maxRetryElapsed {
 																	log.Printf("Account %d: signature retry still failing and looks tool-related, retrying with tool blocks downgraded", account.ID)
 																	filteredBody2 := FilterSignatureSensitiveBlocksForRetry(body)
-												fix(网关): 区分 Claude Code OAuth 适配

											
										
										
											2026-01-15 19:17:07 +08:00
+																	retryReq2, buildErr2 := s.buildUpstreamRequest(ctx, c, account, filteredBody2, token, tokenType, reqModel, reqStream, shouldMimicClaudeCode)
-												fix(backend): 修复 CI 失败问题

修复内容：
1. 修复 6 个 golangci-lint 错误
   - 3 个 errcheck 错误：在 gateway_request_test.go 中添加类型断言检查
   - 3 个 gofmt 格式化问题：修复代码格式
2. 修复 API 契约测试失败
   - 在测试中添加缺失的字段：enable_identity_patch 和 identity_patch_prompt

所有测试和 linter 检查现已通过。

											
										
										
											2026-01-05 00:56:48 +08:00
+																	if buildErr2 == nil {
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+																		retryResp2, retryErr2 := s.httpUpstream.DoWithTLS(retryReq2, proxyURL, account.ID, account.Concurrency, account.IsTLSFingerprintEnabled())
-												fix(backend): 修复 CI 失败问题

修复内容：
1. 修复 6 个 golangci-lint 错误
   - 3 个 errcheck 错误：在 gateway_request_test.go 中添加类型断言检查
   - 3 个 gofmt 格式化问题：修复代码格式
2. 修复 API 契约测试失败
   - 在测试中添加缺失的字段：enable_identity_patch 和 identity_patch_prompt

所有测试和 linter 检查现已通过。

											
										
										
											2026-01-05 00:56:48 +08:00
+																		if retryErr2 == nil {
 																			resp = retryResp2
 																			break
 																		}
 																		if retryResp2 != nil && retryResp2.Body != nil {
 																			_ = retryResp2.Body.Close()
-												fix(backend): 改进 thinking/tool block 签名处理和重试策略

主要改动：
- request_transformer: thinking block 缺少签名时降级为文本而非丢弃，保留内容并在上层禁用 thinking mode
- antigravity_gateway_service: 新增两阶段降级策略，先处理 thinking blocks，如仍失败且涉及 tool 签名错误则进一步降级 tool blocks
- gateway_request: 新增 FilterSignatureSensitiveBlocksForRetry 函数，支持将 tool_use/tool_result 降级为文本
- gateway_request: 改进 FilterThinkingBlocksForRetry，禁用顶层 thinking 配置以避免结构约束冲突
- gateway_service: 实现保守的两阶段重试逻辑，优先保留内容，仅在必要时降级工具调用
- 新增 antigravity_gateway_service_test.go 测试签名块剥离逻辑
- 更新相关测试用例以验证降级行为

此修复解决了跨平台/账户切换时历史消息签名失效导致的请求失败问题。

											
										
										
											2026-01-04 22:32:36 +08:00
+																		}
-												feat(ops): 实现上游错误事件记录与查询功能

**新增功能**:
- 新建ops_upstream_error_events表存储上游服务错误详情
- 支持记录上游429/529/5xx错误的详细上下文信息
- 提供按时间范围查询上游错误事件的API

**后端改动**:
1. 模型层（ops_models.go, ops_port.go）:
   - 新增UpstreamErrorEvent结构体
   - 扩展Repository接口支持上游错误事件CRUD

2. 仓储层（ops_repo.go）:
   - 实现InsertUpstreamErrorEvent写入上游错误
   - 实现GetUpstreamErrorEvents按时间范围查询

3. 服务层（ops_service.go, ops_upstream_context.go）:
   - ops_service: 新增GetUpstreamErrorEvents查询方法
   - ops_upstream_context: 封装上游错误上下文构建逻辑

4. Handler层（ops_error_logger.go）:
   - 新增GetUpstreamErrorsHandler处理上游错误查询请求

5. Gateway层集成:
   - antigravity_gateway_service.go: 429/529错误时记录上游事件
   - gateway_service.go: OpenAI 429/5xx错误时记录
   - gemini_messages_compat_service.go: Gemini 429/5xx错误时记录
   - openai_gateway_service.go: OpenAI 429/5xx错误时记录
   - ratelimit_service.go: 429限流错误时记录

**数据记录字段**:
- request_id: 关联ops_logs主记录
- platform/model: 上游服务标识
- status_code/error_message: 错误详情
- request_headers/response_body: 调试信息（可选）
- created_at: 错误发生时间

											
										
										
											2026-01-11 15:30:27 +08:00
+																		appendOpsUpstreamError(c, OpsUpstreamErrorEvent{
 																			Platform:           account.Platform,
 																			AccountID:          account.ID,
-												feat: merge dev

											
										
										
											2026-01-15 15:14:44 +08:00
+																			AccountName:        account.Name,
-												feat(ops): 实现上游错误事件记录与查询功能

**新增功能**:
- 新建ops_upstream_error_events表存储上游服务错误详情
- 支持记录上游429/529/5xx错误的详细上下文信息
- 提供按时间范围查询上游错误事件的API

**后端改动**:
1. 模型层（ops_models.go, ops_port.go）:
   - 新增UpstreamErrorEvent结构体
   - 扩展Repository接口支持上游错误事件CRUD

2. 仓储层（ops_repo.go）:
   - 实现InsertUpstreamErrorEvent写入上游错误
   - 实现GetUpstreamErrorEvents按时间范围查询

3. 服务层（ops_service.go, ops_upstream_context.go）:
   - ops_service: 新增GetUpstreamErrorEvents查询方法
   - ops_upstream_context: 封装上游错误上下文构建逻辑

4. Handler层（ops_error_logger.go）:
   - 新增GetUpstreamErrorsHandler处理上游错误查询请求

5. Gateway层集成:
   - antigravity_gateway_service.go: 429/529错误时记录上游事件
   - gateway_service.go: OpenAI 429/5xx错误时记录
   - gemini_messages_compat_service.go: Gemini 429/5xx错误时记录
   - openai_gateway_service.go: OpenAI 429/5xx错误时记录
   - ratelimit_service.go: 429限流错误时记录

**数据记录字段**:
- request_id: 关联ops_logs主记录
- platform/model: 上游服务标识
- status_code/error_message: 错误详情
- request_headers/response_body: 调试信息（可选）
- created_at: 错误发生时间

											
										
										
											2026-01-11 15:30:27 +08:00
+																			UpstreamStatusCode: 0,
 																			Kind:               "signature_retry_tools_request_error",
 																			Message:            sanitizeUpstreamErrorMessage(retryErr2.Error()),
 																		})
-												fix(backend): 修复 CI 失败问题

修复内容：
1. 修复 6 个 golangci-lint 错误
   - 3 个 errcheck 错误：在 gateway_request_test.go 中添加类型断言检查
   - 3 个 gofmt 格式化问题：修复代码格式
2. 修复 API 契约测试失败
   - 在测试中添加缺失的字段：enable_identity_patch 和 identity_patch_prompt

所有测试和 linter 检查现已通过。

											
										
										
											2026-01-05 00:56:48 +08:00
+																		log.Printf("Account %d: tool-downgrade signature retry failed: %v", account.ID, retryErr2)
 																	} else {
 																		log.Printf("Account %d: tool-downgrade signature retry build failed: %v", account.ID, buildErr2)
-												fix(backend): 改进 thinking/tool block 签名处理和重试策略

主要改动：
- request_transformer: thinking block 缺少签名时降级为文本而非丢弃，保留内容并在上层禁用 thinking mode
- antigravity_gateway_service: 新增两阶段降级策略，先处理 thinking blocks，如仍失败且涉及 tool 签名错误则进一步降级 tool blocks
- gateway_request: 新增 FilterSignatureSensitiveBlocksForRetry 函数，支持将 tool_use/tool_result 降级为文本
- gateway_request: 改进 FilterThinkingBlocksForRetry，禁用顶层 thinking 配置以避免结构约束冲突
- gateway_service: 实现保守的两阶段重试逻辑，优先保留内容，仅在必要时降级工具调用
- 新增 antigravity_gateway_service_test.go 测试签名块剥离逻辑
- 更新相关测试用例以验证降级行为

此修复解决了跨平台/账户切换时历史消息签名失效导致的请求失败问题。

											
										
										
											2026-01-04 22:32:36 +08:00
+																	}
 																}
-												fix(gateway): 优化 thinking block 重试逻辑

- 保留用户的 thinking.type=enabled 设置（不再禁用）
- 只移除历史消息中的 thinking/redacted_thinking blocks
- 处理过滤后空消息：跳过 assistant 消息，user 消息添加占位符
- 增强错误检测：覆盖 signature、Expected thinking、empty content 错误
- 添加重试成功/失败日志便于排查

											
										
										
											2026-01-03 18:05:15 -08:00
+															}
-												fix(backend): 修复 CI 失败问题

修复内容：
1. 修复 6 个 golangci-lint 错误
   - 3 个 errcheck 错误：在 gateway_request_test.go 中添加类型断言检查
   - 3 个 gofmt 格式化问题：修复代码格式
2. 修复 API 契约测试失败
   - 在测试中添加缺失的字段：enable_identity_patch 和 identity_patch_prompt

所有测试和 linter 检查现已通过。

											
										
										
											2026-01-05 00:56:48 +08:00
 															// Fall back to the original retry response context.
 															resp = &http.Response{
 																StatusCode: retryResp.StatusCode,
 																Header:     retryResp.Header.Clone(),
 																Body:       io.NopCloser(bytes.NewReader(retryRespBody)),
-												fix(gateway): 优化 thinking block 重试逻辑

- 保留用户的 thinking.type=enabled 设置（不再禁用）
- 只移除历史消息中的 thinking/redacted_thinking blocks
- 处理过滤后空消息：跳过 assistant 消息，user 消息添加占位符
- 增强错误检测：覆盖 signature、Expected thinking、empty content 错误
- 添加重试成功/失败日志便于排查

											
										
										
											2026-01-03 18:05:15 -08:00
+															}
-												perf(gateway): 优化负载感知调度

主要改进：
- 优化负载感知调度的准确性和响应速度
- 将 AccountUsageService 的包级缓存改为依赖注入
- 修复 SSE/JSON 转义和 nil 安全问题
- 恢复 Google One 功能兼容性

											
										
										
											2026-01-03 06:32:51 -08:00
+															break
 														}
-												fix(backend): 修复 CI 失败问题

修复内容：
1. 修复 6 个 golangci-lint 错误
   - 3 个 errcheck 错误：在 gateway_request_test.go 中添加类型断言检查
   - 3 个 gofmt 格式化问题：修复代码格式
2. 修复 API 契约测试失败
   - 在测试中添加缺失的字段：enable_identity_patch 和 identity_patch_prompt

所有测试和 linter 检查现已通过。

											
										
										
											2026-01-05 00:56:48 +08:00
+														if retryResp != nil && retryResp.Body != nil {
 															_ = retryResp.Body.Close()
 														}
-												fix(gateway): 优化 thinking block 重试逻辑

- 保留用户的 thinking.type=enabled 设置（不再禁用）
- 只移除历史消息中的 thinking/redacted_thinking blocks
- 处理过滤后空消息：跳过 assistant 消息，user 消息添加占位符
- 增强错误检测：覆盖 signature、Expected thinking、empty content 错误
- 添加重试成功/失败日志便于排查

											
										
										
											2026-01-03 18:05:15 -08:00
+														log.Printf("Account %d: signature error retry failed: %v", account.ID, retryErr)
 													} else {
 														log.Printf("Account %d: signature error retry build request failed: %v", account.ID, buildErr)
-												perf(gateway): 优化负载感知调度

主要改进：
- 优化负载感知调度的准确性和响应速度
- 将 AccountUsageService 的包级缓存改为依赖注入
- 修复 SSE/JSON 转义和 nil 安全问题
- 恢复 Google One 功能兼容性

											
										
										
											2026-01-03 06:32:51 -08:00
+													}
-												fix(backend): 修复 CI 失败问题

修复内容：
1. 修复 6 个 golangci-lint 错误
   - 3 个 errcheck 错误：在 gateway_request_test.go 中添加类型断言检查
   - 3 个 gofmt 格式化问题：修复代码格式
2. 修复 API 契约测试失败
   - 在测试中添加缺失的字段：enable_identity_patch 和 identity_patch_prompt

所有测试和 linter 检查现已通过。

											
										
										
											2026-01-05 00:56:48 +08:00
 													// Retry failed: restore original response body and continue handling.
-												perf(gateway): 优化负载感知调度

主要改进：
- 优化负载感知调度的准确性和响应速度
- 将 AccountUsageService 的包级缓存改为依赖注入
- 修复 SSE/JSON 转义和 nil 安全问题
- 恢复 Google One 功能兼容性

											
										
										
											2026-01-03 06:32:51 -08:00
+													resp.Body = io.NopCloser(bytes.NewReader(respBody))
 													break
 												}
 												// 不是thinking签名错误，恢复响应体
 												resp.Body = io.NopCloser(bytes.NewReader(respBody))
 											}
 										}
 										// 检查是否需要通用重试（排除400，因为400已经在上面特殊处理过了）
 										if resp.StatusCode >= 400 && resp.StatusCode != 400 && s.shouldRetryUpstreamError(account, resp.StatusCode) {
-												fix(frontend): comprehensive i18n cleanup and Select component hardening

											
										
										
											2026-01-04 21:09:14 +08:00
+											if attempt < maxRetryAttempts {
 												elapsed := time.Since(retryStart)
 												if elapsed >= maxRetryElapsed {
 													break
 												}
 												delay := retryBackoffDelay(attempt)
 												remaining := maxRetryElapsed - elapsed
 												if delay > remaining {
 													delay = remaining
 												}
 												if delay <= 0 {
 													break
 												}
-												feat(ops): 实现上游错误事件记录与查询功能

**新增功能**:
- 新建ops_upstream_error_events表存储上游服务错误详情
- 支持记录上游429/529/5xx错误的详细上下文信息
- 提供按时间范围查询上游错误事件的API

**后端改动**:
1. 模型层（ops_models.go, ops_port.go）:
   - 新增UpstreamErrorEvent结构体
   - 扩展Repository接口支持上游错误事件CRUD

2. 仓储层（ops_repo.go）:
   - 实现InsertUpstreamErrorEvent写入上游错误
   - 实现GetUpstreamErrorEvents按时间范围查询

3. 服务层（ops_service.go, ops_upstream_context.go）:
   - ops_service: 新增GetUpstreamErrorEvents查询方法
   - ops_upstream_context: 封装上游错误上下文构建逻辑

4. Handler层（ops_error_logger.go）:
   - 新增GetUpstreamErrorsHandler处理上游错误查询请求

5. Gateway层集成:
   - antigravity_gateway_service.go: 429/529错误时记录上游事件
   - gateway_service.go: OpenAI 429/5xx错误时记录
   - gemini_messages_compat_service.go: Gemini 429/5xx错误时记录
   - openai_gateway_service.go: OpenAI 429/5xx错误时记录
   - ratelimit_service.go: 429限流错误时记录

**数据记录字段**:
- request_id: 关联ops_logs主记录
- platform/model: 上游服务标识
- status_code/error_message: 错误详情
- request_headers/response_body: 调试信息（可选）
- created_at: 错误发生时间

											
										
										
											2026-01-11 15:30:27 +08:00
+												respBody, _ := io.ReadAll(io.LimitReader(resp.Body, 2<<20))
 												_ = resp.Body.Close()
 												appendOpsUpstreamError(c, OpsUpstreamErrorEvent{
 													Platform:           account.Platform,
 													AccountID:          account.ID,
-												feat: merge dev

											
										
										
											2026-01-15 15:14:44 +08:00
+													AccountName:        account.Name,
-												feat(ops): 实现上游错误事件记录与查询功能

**新增功能**:
- 新建ops_upstream_error_events表存储上游服务错误详情
- 支持记录上游429/529/5xx错误的详细上下文信息
- 提供按时间范围查询上游错误事件的API

**后端改动**:
1. 模型层（ops_models.go, ops_port.go）:
   - 新增UpstreamErrorEvent结构体
   - 扩展Repository接口支持上游错误事件CRUD

2. 仓储层（ops_repo.go）:
   - 实现InsertUpstreamErrorEvent写入上游错误
   - 实现GetUpstreamErrorEvents按时间范围查询

3. 服务层（ops_service.go, ops_upstream_context.go）:
   - ops_service: 新增GetUpstreamErrorEvents查询方法
   - ops_upstream_context: 封装上游错误上下文构建逻辑

4. Handler层（ops_error_logger.go）:
   - 新增GetUpstreamErrorsHandler处理上游错误查询请求

5. Gateway层集成:
   - antigravity_gateway_service.go: 429/529错误时记录上游事件
   - gateway_service.go: OpenAI 429/5xx错误时记录
   - gemini_messages_compat_service.go: Gemini 429/5xx错误时记录
   - openai_gateway_service.go: OpenAI 429/5xx错误时记录
   - ratelimit_service.go: 429限流错误时记录

**数据记录字段**:
- request_id: 关联ops_logs主记录
- platform/model: 上游服务标识
- status_code/error_message: 错误详情
- request_headers/response_body: 调试信息（可选）
- created_at: 错误发生时间

											
										
										
											2026-01-11 15:30:27 +08:00
+													UpstreamStatusCode: resp.StatusCode,
 													UpstreamRequestID:  resp.Header.Get("x-request-id"),
 													Kind:               "retry",
 													Message:            extractUpstreamErrorMessage(respBody),
 													Detail: func() string {
 														if s.cfg != nil && s.cfg.Gateway.LogUpstreamErrorBody {
 															return truncateString(string(respBody), s.cfg.Gateway.LogUpstreamErrorBodyMaxBytes)
 														}
 														return ""
 													}(),
 												})
-												fix(frontend): comprehensive i18n cleanup and Select component hardening

											
										
										
											2026-01-04 21:09:14 +08:00
+												log.Printf("Account %d: upstream error %d, retry %d/%d after %v (elapsed=%v/%v)",
 													account.ID, resp.StatusCode, attempt, maxRetryAttempts, delay, elapsed, maxRetryElapsed)
 												if err := sleepWithContext(ctx, delay); err != nil {
 													return nil, err
 												}
-												feat(gateway): 添加上游错误重试机制

- OAuth/Setup Token 账号遇到 403 错误时，等待 2 秒后重试，最多 3 次
- Console 账号遇到未配置的错误码时，同样进行重试
- 重试耗尽后：OAuth 403 标记账号异常，Console 未配置错误码不标记账号
- 移除 handleErrorResponse 中已被重试逻辑覆盖的死代码

											
										
										
											2025-12-24 16:55:46 +08:00
+												continue
 											}
 											// 最后一次尝试也失败，跳出循环处理重试耗尽
 											break
 										}
 										// 不需要重试（成功或不可重试的错误），跳出循环
-												feat(gemini): 完善 Gemini OAuth 配额系统和用量显示

主要改动：
- 后端：重构 Gemini 配额服务，支持多层级配额策略（GCP Standard/Free, Google One, AI Studio, Code Assist）
- 后端：优化 OAuth 服务，增强 tier_id 识别和存储逻辑
- 后端：改进用量统计服务，支持不同平台的配额查询
- 后端：优化限流服务，增加临时解除调度状态管理
- 前端：统一四种授权方式的用量显示格式和徽标样式
- 前端：增强账户配额信息展示，支持多种配额类型
- 前端：改进创建和重新授权模态框的用户体验
- 国际化：完善中英文配额相关文案
- 移除 CHANGELOG.md 文件

测试：所有单元测试通过

											
										
										
											2026-01-04 15:36:00 +08:00
+										// DEBUG: 输出响应 headers（用于检测 rate limit 信息）
 										if account.Platform == PlatformGemini && resp.StatusCode < 400 {
 											log.Printf("[DEBUG] Gemini API Response Headers for account %d:", account.ID)
 											for k, v := range resp.Header {
 												log.Printf("[DEBUG]   %s: %v", k, v)
 											}
 										}
-												feat(gateway): 添加上游错误重试机制

- OAuth/Setup Token 账号遇到 403 错误时，等待 2 秒后重试，最多 3 次
- Console 账号遇到未配置的错误码时，同样进行重试
- 重试耗尽后：OAuth 403 标记账号异常，Console 未配置错误码不标记账号
- 移除 handleErrorResponse 中已被重试逻辑覆盖的死代码

											
										
										
											2025-12-24 16:55:46 +08:00
+										break
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									}
-												fix(frontend): comprehensive i18n cleanup and Select component hardening

											
										
										
											2026-01-04 21:09:14 +08:00
+									if resp == nil || resp.Body == nil {
 										return nil, errors.New("upstream request failed: empty response")
 									}
-												ci(backend): 添加 github actions (#10)

## 变更内容

### CI/CD
- 添加 GitHub Actions 工作流（test + golangci-lint）
- 添加 golangci-lint 配置，启用 errcheck/govet/staticcheck/unused/depguard
- 通过 depguard 强制 service 层不能直接导入 repository

### 错误处理修复
- 修复 CSV 写入、SSE 流式输出、随机数生成等未处理的错误
- GenerateRedeemCode() 现在返回 error

### 资源泄露修复
- 统一使用 defer func() { _ = xxx.Close() }() 模式

### 代码清理
- 移除未使用的常量
- 简化 nil map 检查
- 统一代码格式
											
										
										
											2025-12-20 15:29:52 +08:00
+									defer func() { _ = resp.Body.Close() }()
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
-												feat(gateway): 添加上游错误重试机制

- OAuth/Setup Token 账号遇到 403 错误时，等待 2 秒后重试，最多 3 次
- Console 账号遇到未配置的错误码时，同样进行重试
- 重试耗尽后：OAuth 403 标记账号异常，Console 未配置错误码不标记账号
- 移除 handleErrorResponse 中已被重试逻辑覆盖的死代码

											
										
										
											2025-12-24 16:55:46 +08:00
+									// 处理重试耗尽的情况
 									if resp.StatusCode >= 400 && s.shouldRetryUpstreamError(account, resp.StatusCode) {
-												feat: cc/codex support account retry

											
										
										
											2025-12-27 11:44:00 +08:00
+										if s.shouldFailoverUpstreamError(resp.StatusCode) {
-												feat(ops): 实现上游错误事件记录与查询功能

**新增功能**:
- 新建ops_upstream_error_events表存储上游服务错误详情
- 支持记录上游429/529/5xx错误的详细上下文信息
- 提供按时间范围查询上游错误事件的API

**后端改动**:
1. 模型层（ops_models.go, ops_port.go）:
   - 新增UpstreamErrorEvent结构体
   - 扩展Repository接口支持上游错误事件CRUD

2. 仓储层（ops_repo.go）:
   - 实现InsertUpstreamErrorEvent写入上游错误
   - 实现GetUpstreamErrorEvents按时间范围查询

3. 服务层（ops_service.go, ops_upstream_context.go）:
   - ops_service: 新增GetUpstreamErrorEvents查询方法
   - ops_upstream_context: 封装上游错误上下文构建逻辑

4. Handler层（ops_error_logger.go）:
   - 新增GetUpstreamErrorsHandler处理上游错误查询请求

5. Gateway层集成:
   - antigravity_gateway_service.go: 429/529错误时记录上游事件
   - gateway_service.go: OpenAI 429/5xx错误时记录
   - gemini_messages_compat_service.go: Gemini 429/5xx错误时记录
   - openai_gateway_service.go: OpenAI 429/5xx错误时记录
   - ratelimit_service.go: 429限流错误时记录

**数据记录字段**:
- request_id: 关联ops_logs主记录
- platform/model: 上游服务标识
- status_code/error_message: 错误详情
- request_headers/response_body: 调试信息（可选）
- created_at: 错误发生时间

											
										
										
											2026-01-11 15:30:27 +08:00
+											respBody, _ := io.ReadAll(io.LimitReader(resp.Body, 2<<20))
 											_ = resp.Body.Close()
 											resp.Body = io.NopCloser(bytes.NewReader(respBody))
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+											// 调试日志：打印重试耗尽后的错误响应
 											log.Printf("[Forward] Upstream error (retry exhausted, failover): Account=%d(%s) Status=%d RequestID=%s Body=%s",
 												account.ID, account.Name, resp.StatusCode, resp.Header.Get("x-request-id"), truncateString(string(respBody), 1000))
-												feat: cc/codex support account retry

											
										
										
											2025-12-27 11:44:00 +08:00
+											s.handleRetryExhaustedSideEffects(ctx, resp, account)
-												feat(ops): 实现上游错误事件记录与查询功能

**新增功能**:
- 新建ops_upstream_error_events表存储上游服务错误详情
- 支持记录上游429/529/5xx错误的详细上下文信息
- 提供按时间范围查询上游错误事件的API

**后端改动**:
1. 模型层（ops_models.go, ops_port.go）:
   - 新增UpstreamErrorEvent结构体
   - 扩展Repository接口支持上游错误事件CRUD

2. 仓储层（ops_repo.go）:
   - 实现InsertUpstreamErrorEvent写入上游错误
   - 实现GetUpstreamErrorEvents按时间范围查询

3. 服务层（ops_service.go, ops_upstream_context.go）:
   - ops_service: 新增GetUpstreamErrorEvents查询方法
   - ops_upstream_context: 封装上游错误上下文构建逻辑

4. Handler层（ops_error_logger.go）:
   - 新增GetUpstreamErrorsHandler处理上游错误查询请求

5. Gateway层集成:
   - antigravity_gateway_service.go: 429/529错误时记录上游事件
   - gateway_service.go: OpenAI 429/5xx错误时记录
   - gemini_messages_compat_service.go: Gemini 429/5xx错误时记录
   - openai_gateway_service.go: OpenAI 429/5xx错误时记录
   - ratelimit_service.go: 429限流错误时记录

**数据记录字段**:
- request_id: 关联ops_logs主记录
- platform/model: 上游服务标识
- status_code/error_message: 错误详情
- request_headers/response_body: 调试信息（可选）
- created_at: 错误发生时间

											
										
										
											2026-01-11 15:30:27 +08:00
+											appendOpsUpstreamError(c, OpsUpstreamErrorEvent{
 												Platform:           account.Platform,
 												AccountID:          account.ID,
-												feat: merge dev

											
										
										
											2026-01-15 15:14:44 +08:00
+												AccountName:        account.Name,
-												feat(ops): 实现上游错误事件记录与查询功能

**新增功能**:
- 新建ops_upstream_error_events表存储上游服务错误详情
- 支持记录上游429/529/5xx错误的详细上下文信息
- 提供按时间范围查询上游错误事件的API

**后端改动**:
1. 模型层（ops_models.go, ops_port.go）:
   - 新增UpstreamErrorEvent结构体
   - 扩展Repository接口支持上游错误事件CRUD

2. 仓储层（ops_repo.go）:
   - 实现InsertUpstreamErrorEvent写入上游错误
   - 实现GetUpstreamErrorEvents按时间范围查询

3. 服务层（ops_service.go, ops_upstream_context.go）:
   - ops_service: 新增GetUpstreamErrorEvents查询方法
   - ops_upstream_context: 封装上游错误上下文构建逻辑

4. Handler层（ops_error_logger.go）:
   - 新增GetUpstreamErrorsHandler处理上游错误查询请求

5. Gateway层集成:
   - antigravity_gateway_service.go: 429/529错误时记录上游事件
   - gateway_service.go: OpenAI 429/5xx错误时记录
   - gemini_messages_compat_service.go: Gemini 429/5xx错误时记录
   - openai_gateway_service.go: OpenAI 429/5xx错误时记录
   - ratelimit_service.go: 429限流错误时记录

**数据记录字段**:
- request_id: 关联ops_logs主记录
- platform/model: 上游服务标识
- status_code/error_message: 错误详情
- request_headers/response_body: 调试信息（可选）
- created_at: 错误发生时间

											
										
										
											2026-01-11 15:30:27 +08:00
+												UpstreamStatusCode: resp.StatusCode,
 												UpstreamRequestID:  resp.Header.Get("x-request-id"),
 												Kind:               "retry_exhausted_failover",
 												Message:            extractUpstreamErrorMessage(respBody),
 												Detail: func() string {
 													if s.cfg != nil && s.cfg.Gateway.LogUpstreamErrorBody {
 														return truncateString(string(respBody), s.cfg.Gateway.LogUpstreamErrorBodyMaxBytes)
 													}
 													return ""
 												}(),
 											})
-												feat: cc/codex support account retry

											
										
										
											2025-12-27 11:44:00 +08:00
+											return nil, &UpstreamFailoverError{StatusCode: resp.StatusCode}
 										}
-												feat(gateway): 添加上游错误重试机制

- OAuth/Setup Token 账号遇到 403 错误时，等待 2 秒后重试，最多 3 次
- Console 账号遇到未配置的错误码时，同样进行重试
- 重试耗尽后：OAuth 403 标记账号异常，Console 未配置错误码不标记账号
- 移除 handleErrorResponse 中已被重试逻辑覆盖的死代码

											
										
										
											2025-12-24 16:55:46 +08:00
+										return s.handleRetryExhaustedError(ctx, resp, c, account)
 									}
-												feat: cc/codex support account retry

											
										
										
											2025-12-27 11:44:00 +08:00
+									// 处理可切换账号的错误
 									if resp.StatusCode >= 400 && s.shouldFailoverUpstreamError(resp.StatusCode) {
-												feat(ops): 实现上游错误事件记录与查询功能

**新增功能**:
- 新建ops_upstream_error_events表存储上游服务错误详情
- 支持记录上游429/529/5xx错误的详细上下文信息
- 提供按时间范围查询上游错误事件的API

**后端改动**:
1. 模型层（ops_models.go, ops_port.go）:
   - 新增UpstreamErrorEvent结构体
   - 扩展Repository接口支持上游错误事件CRUD

2. 仓储层（ops_repo.go）:
   - 实现InsertUpstreamErrorEvent写入上游错误
   - 实现GetUpstreamErrorEvents按时间范围查询

3. 服务层（ops_service.go, ops_upstream_context.go）:
   - ops_service: 新增GetUpstreamErrorEvents查询方法
   - ops_upstream_context: 封装上游错误上下文构建逻辑

4. Handler层（ops_error_logger.go）:
   - 新增GetUpstreamErrorsHandler处理上游错误查询请求

5. Gateway层集成:
   - antigravity_gateway_service.go: 429/529错误时记录上游事件
   - gateway_service.go: OpenAI 429/5xx错误时记录
   - gemini_messages_compat_service.go: Gemini 429/5xx错误时记录
   - openai_gateway_service.go: OpenAI 429/5xx错误时记录
   - ratelimit_service.go: 429限流错误时记录

**数据记录字段**:
- request_id: 关联ops_logs主记录
- platform/model: 上游服务标识
- status_code/error_message: 错误详情
- request_headers/response_body: 调试信息（可选）
- created_at: 错误发生时间

											
										
										
											2026-01-11 15:30:27 +08:00
+										respBody, _ := io.ReadAll(io.LimitReader(resp.Body, 2<<20))
 										_ = resp.Body.Close()
 										resp.Body = io.NopCloser(bytes.NewReader(respBody))
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+										// 调试日志：打印上游错误响应
 										log.Printf("[Forward] Upstream error (failover): Account=%d(%s) Status=%d RequestID=%s Body=%s",
 											account.ID, account.Name, resp.StatusCode, resp.Header.Get("x-request-id"), truncateString(string(respBody), 1000))
-												feat: cc/codex support account retry

											
										
										
											2025-12-27 11:44:00 +08:00
+										s.handleFailoverSideEffects(ctx, resp, account)
-												feat(ops): 实现上游错误事件记录与查询功能

**新增功能**:
- 新建ops_upstream_error_events表存储上游服务错误详情
- 支持记录上游429/529/5xx错误的详细上下文信息
- 提供按时间范围查询上游错误事件的API

**后端改动**:
1. 模型层（ops_models.go, ops_port.go）:
   - 新增UpstreamErrorEvent结构体
   - 扩展Repository接口支持上游错误事件CRUD

2. 仓储层（ops_repo.go）:
   - 实现InsertUpstreamErrorEvent写入上游错误
   - 实现GetUpstreamErrorEvents按时间范围查询

3. 服务层（ops_service.go, ops_upstream_context.go）:
   - ops_service: 新增GetUpstreamErrorEvents查询方法
   - ops_upstream_context: 封装上游错误上下文构建逻辑

4. Handler层（ops_error_logger.go）:
   - 新增GetUpstreamErrorsHandler处理上游错误查询请求

5. Gateway层集成:
   - antigravity_gateway_service.go: 429/529错误时记录上游事件
   - gateway_service.go: OpenAI 429/5xx错误时记录
   - gemini_messages_compat_service.go: Gemini 429/5xx错误时记录
   - openai_gateway_service.go: OpenAI 429/5xx错误时记录
   - ratelimit_service.go: 429限流错误时记录

**数据记录字段**:
- request_id: 关联ops_logs主记录
- platform/model: 上游服务标识
- status_code/error_message: 错误详情
- request_headers/response_body: 调试信息（可选）
- created_at: 错误发生时间

											
										
										
											2026-01-11 15:30:27 +08:00
+										appendOpsUpstreamError(c, OpsUpstreamErrorEvent{
 											Platform:           account.Platform,
 											AccountID:          account.ID,
 											UpstreamStatusCode: resp.StatusCode,
 											UpstreamRequestID:  resp.Header.Get("x-request-id"),
 											Kind:               "failover",
 											Message:            extractUpstreamErrorMessage(respBody),
 											Detail: func() string {
 												if s.cfg != nil && s.cfg.Gateway.LogUpstreamErrorBody {
 													return truncateString(string(respBody), s.cfg.Gateway.LogUpstreamErrorBodyMaxBytes)
 												}
 												return ""
 											}(),
 										})
-												feat: cc/codex support account retry

											
										
										
											2025-12-27 11:44:00 +08:00
+										return nil, &UpstreamFailoverError{StatusCode: resp.StatusCode}
 									}
-												feat(gateway): 添加上游错误重试机制

- OAuth/Setup Token 账号遇到 403 错误时，等待 2 秒后重试，最多 3 次
- Console 账号遇到未配置的错误码时，同样进行重试
- 重试耗尽后：OAuth 403 标记账号异常，Console 未配置错误码不标记账号
- 移除 handleErrorResponse 中已被重试逻辑覆盖的死代码

											
										
										
											2025-12-24 16:55:46 +08:00
+									// 处理错误响应（不可重试的错误）
-												fix(lint): 修复 golangci-lint 检查问题

- 格式化代码 (gofmt)
- 修复 rows.Close() 返回值未检查 (errcheck)
- 删除未使用的 usage_clamp.go 文件 (unused)
- 删除临时测试目录

											
										
										
											2026-01-03 06:57:08 -08:00
+									if resp.StatusCode >= 400 {
 										// 可选：对部分 400 触发 failover（默认关闭以保持语义）
 										if resp.StatusCode == 400 && s.cfg != nil && s.cfg.Gateway.FailoverOn400 {
 											respBody, readErr := io.ReadAll(io.LimitReader(resp.Body, 2<<20))
 											if readErr != nil {
 												// ReadAll failed, fall back to normal error handling without consuming the stream
 												return s.handleErrorResponse(ctx, resp, c, account)
-												fix: 修复 /v1/messages 间歇性 400 错误 (#18)

* fix(upstream): 修复上游格式兼容性问题

- 跳过Claude模型无signature的thinking block
- 支持custom类型工具(MCP)格式转换
- 添加ClaudeCustomToolSpec结构体支持MCP工具
- 添加Custom字段验证，跳过无效custom工具
- 在convertClaudeToolsToGeminiTools中添加schema清理
- 完整的单元测试覆盖，包含边界情况

修复: Issue 0.1 signature缺失, Issue 0.2 custom工具格式
改进: Codex审查发现的2个重要问题

测试:
- TestBuildParts_ThinkingBlockWithoutSignature: 验证thinking block处理
- TestBuildTools_CustomTypeTools: 验证custom工具转换和边界情况
- TestConvertClaudeToolsToGeminiTools_CustomType: 验证service层转换

* feat(gemini): 添加Gemini限额与TierID支持

实现PR1：Gemini限额与TierID功能

后端修改：
- GeminiTokenInfo结构体添加TierID字段
- fetchProjectID函数返回(projectID, tierID, error)
- 从LoadCodeAssist响应中提取tierID（优先IsDefault，回退到第一个非空tier）
- ExchangeCode、RefreshAccountToken、GetAccessToken函数更新以处理tierID
- BuildAccountCredentials函数保存tier_id到credentials

前端修改：
- AccountStatusIndicator组件添加tier显示
- 支持LEGACY/PRO/ULTRA等tier类型的友好显示
- 使用蓝色badge展示tier信息

技术细节：
- tierID提取逻辑：优先选择IsDefault的tier，否则选择第一个非空tier
- 所有fetchProjectID调用点已更新以处理新的返回签名
- 前端gracefully处理missing/unknown tier_id

* refactor(gemini): 优化TierID实现并添加安全验证

根据并发代码审查（code-reviewer, security-auditor, gemini, codex）的反馈进行改进：

安全改进：
- 添加validateTierID函数验证tier_id格式和长度（最大64字符）
- 限制tier_id字符集为字母数字、下划线、连字符和斜杠
- 在BuildAccountCredentials中验证tier_id后再存储
- 静默跳过无效tier_id，不阻塞账户创建

代码质量改进：
- 提取extractTierIDFromAllowedTiers辅助函数消除重复代码
- 重构fetchProjectID函数，tierID提取逻辑只执行一次
- 改进代码可读性和可维护性

审查工具：
- code-reviewer agent (a09848e)
- security-auditor agent (a9a149c)
- gemini CLI (bcc7c81)
- codex (b5d8919)

修复问题：
- HIGH: 未验证的tier_id输入
- MEDIUM: 代码重复（tierID提取逻辑重复2次）

* fix(format): 修复 gofmt 格式问题

- 修复 claude_types.go 中的字段对齐问题
- 修复 gemini_messages_compat_service.go 中的缩进问题

* fix(upstream): 修复上游格式兼容性问题 (#14)

* fix(upstream): 修复上游格式兼容性问题

- 跳过Claude模型无signature的thinking block
- 支持custom类型工具(MCP)格式转换
- 添加ClaudeCustomToolSpec结构体支持MCP工具
- 添加Custom字段验证，跳过无效custom工具
- 在convertClaudeToolsToGeminiTools中添加schema清理
- 完整的单元测试覆盖，包含边界情况

修复: Issue 0.1 signature缺失, Issue 0.2 custom工具格式
改进: Codex审查发现的2个重要问题

测试:
- TestBuildParts_ThinkingBlockWithoutSignature: 验证thinking block处理
- TestBuildTools_CustomTypeTools: 验证custom工具转换和边界情况
- TestConvertClaudeToolsToGeminiTools_CustomType: 验证service层转换

* fix(format): 修复 gofmt 格式问题

- 修复 claude_types.go 中的字段对齐问题
- 修复 gemini_messages_compat_service.go 中的缩进问题

* fix(format): 修复 claude_types.go 的 gofmt 格式问题

* feat(antigravity): 优化 thinking block 和 schema 处理

- 为 dummy thinking block 添加 ThoughtSignature
- 重构 thinking block 处理逻辑，在每个条件分支内创建 part
- 优化 excludedSchemaKeys，移除 Gemini 实际支持的字段
  (minItems, maxItems, minimum, maximum, additionalProperties, format)
- 添加详细注释说明 Gemini API 支持的 schema 字段

* fix(antigravity): 增强 schema 清理的安全性

基于 Codex review 建议：
- 添加 format 字段白名单过滤，只保留 Gemini 支持的 date-time/date/time
- 补充更多不支持的 schema 关键字到黑名单：
  * 组合 schema: oneOf, anyOf, allOf, not, if/then/else
  * 对象验证: minProperties, maxProperties, patternProperties 等
  * 定义引用: $defs, definitions
- 避免不支持的 schema 字段导致 Gemini API 校验失败

* fix(lint): 修复 gemini_messages_compat_service 空分支警告

- 在 cleanToolSchema 的 if 语句中添加 continue
- 移除重复的注释

* fix(antigravity): 移除 minItems/maxItems 以兼容 Claude API

- 将 minItems 和 maxItems 添加到 schema 黑名单
- Claude API (Vertex AI) 不支持这些数组验证字段
- 添加调试日志记录工具 schema 转换过程
- 修复 tools.14.custom.input_schema 验证错误

* fix(antigravity): 修复 additionalProperties schema 对象问题

- 将 additionalProperties 的 schema 对象转换为布尔值 true
- Claude API 只支持 additionalProperties: false，不支持 schema 对象
- 修复 tools.14.custom.input_schema 验证错误
- 参考 Claude 官方文档的 JSON Schema 限制

* fix(antigravity): 修复 Claude 模型 thinking 块兼容性问题

- 完全跳过 Claude 模型的 thinking 块以避免 signature 验证失败
- 只在 Gemini 模型中使用 dummy thought signature
- 修改 additionalProperties 默认值为 false（更安全）
- 添加调试日志以便排查问题

* fix(upstream): 修复跨模型切换时的 dummy signature 问题

基于 Codex review 和用户场景分析的修复：

1. 问题场景
   - Gemini (thinking) → Claude (thinking) 切换时
   - Gemini 返回的 thinking 块使用 dummy signature
   - Claude API 会拒绝 dummy signature，导致 400 错误

2. 修复内容
   - request_transformer.go:262: 跳过 dummy signature
   - 只保留真实的 Claude signature
   - 支持频繁的跨模型切换

3. 其他修复（基于 Codex review）
   - gateway_service.go:691: 修复 io.ReadAll 错误处理
   - gateway_service.go:687: 条件日志（尊重 LogUpstreamErrorBody 配置）
   - gateway_service.go:915: 收紧 400 failover 启发式
   - request_transformer.go:188: 移除签名成功日志

4. 新增功能（默认关闭）
   - 阶段 1: 上游错误日志（GATEWAY_LOG_UPSTREAM_ERROR_BODY）
   - 阶段 2: Antigravity thinking 修复
   - 阶段 3: API-key beta 注入（GATEWAY_INJECT_BETA_FOR_APIKEY）
   - 阶段 3: 智能 400 failover（GATEWAY_FAILOVER_ON_400）

测试：所有测试通过

* fix(lint): 修复 golangci-lint 问题

- 应用 De Morgan 定律简化条件判断
- 修复 gofmt 格式问题
- 移除未使用的 min 函数
											
										
										
											2026-01-01 04:21:18 +08:00
+											}
 											_ = resp.Body.Close()
 											resp.Body = io.NopCloser(bytes.NewReader(respBody))
 											if s.shouldFailoverOn400(respBody) {
-												feat(ops): 实现上游错误事件记录与查询功能

**新增功能**:
- 新建ops_upstream_error_events表存储上游服务错误详情
- 支持记录上游429/529/5xx错误的详细上下文信息
- 提供按时间范围查询上游错误事件的API

**后端改动**:
1. 模型层（ops_models.go, ops_port.go）:
   - 新增UpstreamErrorEvent结构体
   - 扩展Repository接口支持上游错误事件CRUD

2. 仓储层（ops_repo.go）:
   - 实现InsertUpstreamErrorEvent写入上游错误
   - 实现GetUpstreamErrorEvents按时间范围查询

3. 服务层（ops_service.go, ops_upstream_context.go）:
   - ops_service: 新增GetUpstreamErrorEvents查询方法
   - ops_upstream_context: 封装上游错误上下文构建逻辑

4. Handler层（ops_error_logger.go）:
   - 新增GetUpstreamErrorsHandler处理上游错误查询请求

5. Gateway层集成:
   - antigravity_gateway_service.go: 429/529错误时记录上游事件
   - gateway_service.go: OpenAI 429/5xx错误时记录
   - gemini_messages_compat_service.go: Gemini 429/5xx错误时记录
   - openai_gateway_service.go: OpenAI 429/5xx错误时记录
   - ratelimit_service.go: 429限流错误时记录

**数据记录字段**:
- request_id: 关联ops_logs主记录
- platform/model: 上游服务标识
- status_code/error_message: 错误详情
- request_headers/response_body: 调试信息（可选）
- created_at: 错误发生时间

											
										
										
											2026-01-11 15:30:27 +08:00
+												upstreamMsg := strings.TrimSpace(extractUpstreamErrorMessage(respBody))
 												upstreamMsg = sanitizeUpstreamErrorMessage(upstreamMsg)
 												upstreamDetail := ""
 												if s.cfg != nil && s.cfg.Gateway.LogUpstreamErrorBody {
 													maxBytes := s.cfg.Gateway.LogUpstreamErrorBodyMaxBytes
 													if maxBytes <= 0 {
 														maxBytes = 2048
 													}
 													upstreamDetail = truncateString(string(respBody), maxBytes)
 												}
 												appendOpsUpstreamError(c, OpsUpstreamErrorEvent{
 													Platform:           account.Platform,
 													AccountID:          account.ID,
-												feat: merge dev

											
										
										
											2026-01-15 15:14:44 +08:00
+													AccountName:        account.Name,
-												feat(ops): 实现上游错误事件记录与查询功能

**新增功能**:
- 新建ops_upstream_error_events表存储上游服务错误详情
- 支持记录上游429/529/5xx错误的详细上下文信息
- 提供按时间范围查询上游错误事件的API

**后端改动**:
1. 模型层（ops_models.go, ops_port.go）:
   - 新增UpstreamErrorEvent结构体
   - 扩展Repository接口支持上游错误事件CRUD

2. 仓储层（ops_repo.go）:
   - 实现InsertUpstreamErrorEvent写入上游错误
   - 实现GetUpstreamErrorEvents按时间范围查询

3. 服务层（ops_service.go, ops_upstream_context.go）:
   - ops_service: 新增GetUpstreamErrorEvents查询方法
   - ops_upstream_context: 封装上游错误上下文构建逻辑

4. Handler层（ops_error_logger.go）:
   - 新增GetUpstreamErrorsHandler处理上游错误查询请求

5. Gateway层集成:
   - antigravity_gateway_service.go: 429/529错误时记录上游事件
   - gateway_service.go: OpenAI 429/5xx错误时记录
   - gemini_messages_compat_service.go: Gemini 429/5xx错误时记录
   - openai_gateway_service.go: OpenAI 429/5xx错误时记录
   - ratelimit_service.go: 429限流错误时记录

**数据记录字段**:
- request_id: 关联ops_logs主记录
- platform/model: 上游服务标识
- status_code/error_message: 错误详情
- request_headers/response_body: 调试信息（可选）
- created_at: 错误发生时间

											
										
										
											2026-01-11 15:30:27 +08:00
+													UpstreamStatusCode: resp.StatusCode,
 													UpstreamRequestID:  resp.Header.Get("x-request-id"),
 													Kind:               "failover_on_400",
 													Message:            upstreamMsg,
 													Detail:             upstreamDetail,
 												})
-												fix: 修复 /v1/messages 间歇性 400 错误 (#18)

* fix(upstream): 修复上游格式兼容性问题

- 跳过Claude模型无signature的thinking block
- 支持custom类型工具(MCP)格式转换
- 添加ClaudeCustomToolSpec结构体支持MCP工具
- 添加Custom字段验证，跳过无效custom工具
- 在convertClaudeToolsToGeminiTools中添加schema清理
- 完整的单元测试覆盖，包含边界情况

修复: Issue 0.1 signature缺失, Issue 0.2 custom工具格式
改进: Codex审查发现的2个重要问题

测试:
- TestBuildParts_ThinkingBlockWithoutSignature: 验证thinking block处理
- TestBuildTools_CustomTypeTools: 验证custom工具转换和边界情况
- TestConvertClaudeToolsToGeminiTools_CustomType: 验证service层转换

* feat(gemini): 添加Gemini限额与TierID支持

实现PR1：Gemini限额与TierID功能

后端修改：
- GeminiTokenInfo结构体添加TierID字段
- fetchProjectID函数返回(projectID, tierID, error)
- 从LoadCodeAssist响应中提取tierID（优先IsDefault，回退到第一个非空tier）
- ExchangeCode、RefreshAccountToken、GetAccessToken函数更新以处理tierID
- BuildAccountCredentials函数保存tier_id到credentials

前端修改：
- AccountStatusIndicator组件添加tier显示
- 支持LEGACY/PRO/ULTRA等tier类型的友好显示
- 使用蓝色badge展示tier信息

技术细节：
- tierID提取逻辑：优先选择IsDefault的tier，否则选择第一个非空tier
- 所有fetchProjectID调用点已更新以处理新的返回签名
- 前端gracefully处理missing/unknown tier_id

* refactor(gemini): 优化TierID实现并添加安全验证

根据并发代码审查（code-reviewer, security-auditor, gemini, codex）的反馈进行改进：

安全改进：
- 添加validateTierID函数验证tier_id格式和长度（最大64字符）
- 限制tier_id字符集为字母数字、下划线、连字符和斜杠
- 在BuildAccountCredentials中验证tier_id后再存储
- 静默跳过无效tier_id，不阻塞账户创建

代码质量改进：
- 提取extractTierIDFromAllowedTiers辅助函数消除重复代码
- 重构fetchProjectID函数，tierID提取逻辑只执行一次
- 改进代码可读性和可维护性

审查工具：
- code-reviewer agent (a09848e)
- security-auditor agent (a9a149c)
- gemini CLI (bcc7c81)
- codex (b5d8919)

修复问题：
- HIGH: 未验证的tier_id输入
- MEDIUM: 代码重复（tierID提取逻辑重复2次）

* fix(format): 修复 gofmt 格式问题

- 修复 claude_types.go 中的字段对齐问题
- 修复 gemini_messages_compat_service.go 中的缩进问题

* fix(upstream): 修复上游格式兼容性问题 (#14)

* fix(upstream): 修复上游格式兼容性问题

- 跳过Claude模型无signature的thinking block
- 支持custom类型工具(MCP)格式转换
- 添加ClaudeCustomToolSpec结构体支持MCP工具
- 添加Custom字段验证，跳过无效custom工具
- 在convertClaudeToolsToGeminiTools中添加schema清理
- 完整的单元测试覆盖，包含边界情况

修复: Issue 0.1 signature缺失, Issue 0.2 custom工具格式
改进: Codex审查发现的2个重要问题

测试:
- TestBuildParts_ThinkingBlockWithoutSignature: 验证thinking block处理
- TestBuildTools_CustomTypeTools: 验证custom工具转换和边界情况
- TestConvertClaudeToolsToGeminiTools_CustomType: 验证service层转换

* fix(format): 修复 gofmt 格式问题

- 修复 claude_types.go 中的字段对齐问题
- 修复 gemini_messages_compat_service.go 中的缩进问题

* fix(format): 修复 claude_types.go 的 gofmt 格式问题

* feat(antigravity): 优化 thinking block 和 schema 处理

- 为 dummy thinking block 添加 ThoughtSignature
- 重构 thinking block 处理逻辑，在每个条件分支内创建 part
- 优化 excludedSchemaKeys，移除 Gemini 实际支持的字段
  (minItems, maxItems, minimum, maximum, additionalProperties, format)
- 添加详细注释说明 Gemini API 支持的 schema 字段

* fix(antigravity): 增强 schema 清理的安全性

基于 Codex review 建议：
- 添加 format 字段白名单过滤，只保留 Gemini 支持的 date-time/date/time
- 补充更多不支持的 schema 关键字到黑名单：
  * 组合 schema: oneOf, anyOf, allOf, not, if/then/else
  * 对象验证: minProperties, maxProperties, patternProperties 等
  * 定义引用: $defs, definitions
- 避免不支持的 schema 字段导致 Gemini API 校验失败

* fix(lint): 修复 gemini_messages_compat_service 空分支警告

- 在 cleanToolSchema 的 if 语句中添加 continue
- 移除重复的注释

* fix(antigravity): 移除 minItems/maxItems 以兼容 Claude API

- 将 minItems 和 maxItems 添加到 schema 黑名单
- Claude API (Vertex AI) 不支持这些数组验证字段
- 添加调试日志记录工具 schema 转换过程
- 修复 tools.14.custom.input_schema 验证错误

* fix(antigravity): 修复 additionalProperties schema 对象问题

- 将 additionalProperties 的 schema 对象转换为布尔值 true
- Claude API 只支持 additionalProperties: false，不支持 schema 对象
- 修复 tools.14.custom.input_schema 验证错误
- 参考 Claude 官方文档的 JSON Schema 限制

* fix(antigravity): 修复 Claude 模型 thinking 块兼容性问题

- 完全跳过 Claude 模型的 thinking 块以避免 signature 验证失败
- 只在 Gemini 模型中使用 dummy thought signature
- 修改 additionalProperties 默认值为 false（更安全）
- 添加调试日志以便排查问题

* fix(upstream): 修复跨模型切换时的 dummy signature 问题

基于 Codex review 和用户场景分析的修复：

1. 问题场景
   - Gemini (thinking) → Claude (thinking) 切换时
   - Gemini 返回的 thinking 块使用 dummy signature
   - Claude API 会拒绝 dummy signature，导致 400 错误

2. 修复内容
   - request_transformer.go:262: 跳过 dummy signature
   - 只保留真实的 Claude signature
   - 支持频繁的跨模型切换

3. 其他修复（基于 Codex review）
   - gateway_service.go:691: 修复 io.ReadAll 错误处理
   - gateway_service.go:687: 条件日志（尊重 LogUpstreamErrorBody 配置）
   - gateway_service.go:915: 收紧 400 failover 启发式
   - request_transformer.go:188: 移除签名成功日志

4. 新增功能（默认关闭）
   - 阶段 1: 上游错误日志（GATEWAY_LOG_UPSTREAM_ERROR_BODY）
   - 阶段 2: Antigravity thinking 修复
   - 阶段 3: API-key beta 注入（GATEWAY_INJECT_BETA_FOR_APIKEY）
   - 阶段 3: 智能 400 failover（GATEWAY_FAILOVER_ON_400）

测试：所有测试通过

* fix(lint): 修复 golangci-lint 问题

- 应用 De Morgan 定律简化条件判断
- 修复 gofmt 格式问题
- 移除未使用的 min 函数
											
										
										
											2026-01-01 04:21:18 +08:00
+												if s.cfg.Gateway.LogUpstreamErrorBody {
 													log.Printf(
 														"Account %d: 400 error, attempting failover: %s",
 														account.ID,
 														truncateForLog(respBody, s.cfg.Gateway.LogUpstreamErrorBodyMaxBytes),
 													)
 												} else {
 													log.Printf("Account %d: 400 error, attempting failover", account.ID)
 												}
 												s.handleFailoverSideEffects(ctx, resp, account)
 												return nil, &UpstreamFailoverError{StatusCode: resp.StatusCode}
 											}
 										}
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+										return s.handleErrorResponse(ctx, resp, c, account)
 									}
 									// 处理正常响应
 									var usage *ClaudeUsage
 									var firstTokenMs *int
-												fix(billing): 修复客户端取消请求时计费丢失问题

检测 context.Canceled 作为客户端断开信号，返回已收集的 usage 而非错误

											
										
										
											2026-01-08 11:25:17 +08:00
+									var clientDisconnect bool
-												perf(后端): 完成性能优化与连接池配置

新增 DB/Redis 连接池配置与校验，并补充单测

网关请求体大小限制与 413 处理

HTTP/req 客户端池化并调整上游连接池默认值

并发槽位改为 ZSET+Lua 与指数退避

用量统计改 SQL 聚合并新增索引迁移

计费缓存写入改工作池并补测试/基准

测试: 在 backend/ 下运行 go test ./...

											
										
										
											2025-12-31 08:50:12 +08:00
+									if reqStream {
-												fix(网关): 区分 Claude Code OAuth 适配

											
										
										
											2026-01-15 19:17:07 +08:00
+										streamResult, err := s.handleStreamingResponse(ctx, resp, c, account, startTime, originalModel, reqModel, toolNameMap, shouldMimicClaudeCode)
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+										if err != nil {
-												CC Stream 响应流中出现 error 时, 增加返回重试 (#86)

* 响应流中出现 error, 返回重试

* 响应流中出现 error, 返回重试
											
										
										
											2025-12-30 10:48:55 +08:00
+											if err.Error() == "have error in stream" {
 												return nil, &UpstreamFailoverError{
 													StatusCode: 403,
 												}
 											}
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+											return nil, err
 										}
 										usage = streamResult.usage
 										firstTokenMs = streamResult.firstTokenMs
-												fix(billing): 修复客户端取消请求时计费丢失问题

检测 context.Canceled 作为客户端断开信号，返回已收集的 usage 而非错误

											
										
										
											2026-01-08 11:25:17 +08:00
+										clientDisconnect = streamResult.clientDisconnect
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									} else {
-												fix(网关): 区分 Claude Code OAuth 适配

											
										
										
											2026-01-15 19:17:07 +08:00
+										usage, err = s.handleNonStreamingResponse(ctx, resp, c, account, originalModel, reqModel, toolNameMap, shouldMimicClaudeCode)
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+										if err != nil {
 											return nil, err
 										}
 									}
 									return &ForwardResult{
-												fix(billing): 修复客户端取消请求时计费丢失问题

检测 context.Canceled 作为客户端断开信号，返回已收集的 usage 而非错误

											
										
										
											2026-01-08 11:25:17 +08:00
+										RequestID:        resp.Header.Get("x-request-id"),
 										Usage:            *usage,
 										Model:            originalModel, // 使用原始模型用于计费和日志
 										Stream:           reqStream,
 										Duration:         time.Since(startTime),
 										FirstTokenMs:     firstTokenMs,
 										ClientDisconnect: clientDisconnect,
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									}, nil
 								}
-												fix(网关): 区分 Claude Code OAuth 适配

											
										
										
											2026-01-15 19:17:07 +08:00
+								func (s *GatewayService) buildUpstreamRequest(ctx context.Context, c *gin.Context, account *Account, body []byte, token, tokenType, modelID string, reqStream bool, mimicClaudeCode bool) (*http.Request, error) {
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									// 确定目标URL
 									targetURL := claudeAPIURL
-												fix(lint): 修复所有 Go 命名规范问题

- 全局替换 ApiKey → APIKey（类型、字段、方法、变量）
- 修复所有 initialism 命名（API, SMTP, HTML, URL 等）
- 添加所有缺失的包注释
- 修复导出符号的注释格式

主要修改：
- ApiKey → APIKey（所有出现的地方）
- ApiKeyID → APIKeyID
- ApiKeyIDs → APIKeyIDs
- TestSmtpConnection → TestSMTPConnection
- HtmlURL → HTMLURL
- 添加 20+ 个包注释
- 修复 10+ 个导出符号注释格式

验证结果：
- ✓ golangci-lint: 0 issues
- ✓ 单元测试: 通过
- ✓ 集成测试: 通过

											
										
										
											2026-01-04 19:27:53 +08:00
+									if account.Type == AccountTypeAPIKey {
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+										baseURL := account.GetBaseURL()
-												feat(安全): 强化安全策略与配置校验

- 增加 CORS/CSP/安全响应头与代理信任配置

- 引入 URL 白名单与私网开关，校验上游与价格源

- 改善 API Key 处理与网关错误返回

- 管理端设置隐藏敏感字段并优化前端提示

- 增加计费熔断与相关配置示例

测试: go test ./...

											
										
										
											2026-01-02 17:40:57 +08:00
+										if baseURL != "" {
 											validatedURL, err := s.validateUpstreamBaseURL(baseURL)
 											if err != nil {
 												return nil, err
 											}
 											targetURL = validatedURL + "/v1/messages"
 										}
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									}
-												fix: satisfy golangci-lint (nil checks, remove unused helpers)

											
										
										
											2026-01-31 02:07:57 +08:00
+									clientHeaders := http.Header{}
 									if c != nil && c.Request != nil {
 										clientHeaders = c.Request.Header
 									}
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									// OAuth账号：应用统一指纹
-												refactor: 删除 ports 目录

											
										
										
											2025-12-25 17:15:01 +08:00
+									var fingerprint *Fingerprint
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									if account.IsOAuth() && s.identityService != nil {
 										// 1. 获取或创建指纹（包含随机生成的ClientID）
-												fix: satisfy golangci-lint (nil checks, remove unused helpers)

											
										
										
											2026-01-31 02:07:57 +08:00
+										fp, err := s.identityService.GetOrCreateFingerprint(ctx, account.ID, clientHeaders)
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+										if err != nil {
 											log.Printf("Warning: failed to get fingerprint for account %d: %v", account.ID, err)
 											// 失败时降级为透传原始headers
 										} else {
 											fingerprint = fp
 											// 2. 重写metadata.user_id（需要指纹中的ClientID和账号的account_uuid）
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+											// 如果启用了会话ID伪装，会在重写后替换 session 部分为固定值
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+											accountUUID := account.GetExtraString("account_uuid")
 											if accountUUID != "" && fp.ClientID != "" {
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+												if newBody, err := s.identityService.RewriteUserIDWithMasking(ctx, body, account, accountUUID, fp.ClientID); err == nil && len(newBody) > 0 {
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+													body = newBody
 												}
 											}
 										}
 									}
 									req, err := http.NewRequestWithContext(ctx, "POST", targetURL, bytes.NewReader(body))
 									if err != nil {
 										return nil, err
 									}
 									// 设置认证头
 									if tokenType == "oauth" {
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+										req.Header.Set("authorization", "Bearer "+token)
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									} else {
 										req.Header.Set("x-api-key", token)
 									}
 									// 白名单透传headers
-												fix: satisfy golangci-lint (nil checks, remove unused helpers)

											
										
										
											2026-01-31 02:07:57 +08:00
+									for key, values := range clientHeaders {
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+										lowerKey := strings.ToLower(key)
 										if allowedHeaders[lowerKey] {
 											for _, v := range values {
 												req.Header.Add(key, v)
 											}
 										}
 									}
 									// OAuth账号：应用缓存的指纹到请求头（覆盖白名单透传的头）
 									if fingerprint != nil {
 										s.identityService.ApplyFingerprint(req, fingerprint)
 									}
 									// 确保必要的headers存在
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									if req.Header.Get("content-type") == "" {
 										req.Header.Set("content-type", "application/json")
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									}
 									if req.Header.Get("anthropic-version") == "" {
 										req.Header.Set("anthropic-version", "2023-06-01")
 									}
-												fix(网关): OAuth 请求统一 user_id 与指纹

											
										
										
											2026-01-19 15:01:32 +08:00
+									if tokenType == "oauth" {
-												fix(网关): 对齐 Claude OAuth 请求适配

											
										
										
											2026-01-15 18:54:42 +08:00
+										applyClaudeOAuthHeaderDefaults(req, reqStream)
 									}
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
-												fix(网关): Claude Code OAuth 补齐 oauth beta

											
										
										
											2026-01-16 23:15:52 +08:00
+									// 处理 anthropic-beta header（OAuth 账号需要包含 oauth beta）
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									if tokenType == "oauth" {
-												fix(网关): Claude Code OAuth 补齐 oauth beta

											
										
										
											2026-01-16 23:15:52 +08:00
+										if mimicClaudeCode {
-												fix(oauth): merge anthropic-beta and force Claude Code headers in mimic mode

											
										
										
											2026-01-29 02:36:28 +08:00
+											// 非 Claude Code 客户端：按 opencode 的策略处理：
 											// - 强制 Claude Code 指纹相关请求头（尤其是 user-agent/x-stainless/x-app）
 											// - 保留 incoming beta 的同时，确保 OAuth 所需 beta 存在
 											applyClaudeCodeMimicHeaders(req, reqStream)
 											incomingBeta := req.Header.Get("anthropic-beta")
-												fix(oauth): match Claude CLI accept header and beta set

											
										
										
											2026-01-29 15:31:29 +08:00
+											// Match real Claude CLI traffic (per mitmproxy reports):
 											// messages requests typically use only oauth + interleaved-thinking.
 											// Also drop claude-code beta if a downstream client added it.
-												fix(oauth): merge anthropic-beta and force Claude Code headers in mimic mode

											
										
										
											2026-01-29 02:36:28 +08:00
+											requiredBetas := []string{claude.BetaOAuth, claude.BetaInterleavedThinking}
-												fix(oauth): match Claude CLI accept header and beta set

											
										
										
											2026-01-29 15:31:29 +08:00
+											drop := map[string]struct{}{claude.BetaClaudeCode: {}}
 											req.Header.Set("anthropic-beta", mergeAnthropicBetaDropping(requiredBetas, incomingBeta, drop))
-												fix(网关): 补齐非 Claude Code OAuth 兼容

											
										
										
											2026-01-16 00:41:29 +08:00
+										} else {
-												fix(网关): Claude Code OAuth 补齐 oauth beta

											
										
										
											2026-01-16 23:15:52 +08:00
+											// Claude Code 客户端：尽量透传原始 header，仅补齐 oauth beta
 											clientBetaHeader := req.Header.Get("anthropic-beta")
 											req.Header.Set("anthropic-beta", s.getBetaHeader(modelID, clientBetaHeader))
-												fix(网关): 补齐非 Claude Code OAuth 兼容

											
										
										
											2026-01-16 00:41:29 +08:00
+										}
-												fix(lint): 修复所有 Go 命名规范问题

- 全局替换 ApiKey → APIKey（类型、字段、方法、变量）
- 修复所有 initialism 命名（API, SMTP, HTML, URL 等）
- 添加所有缺失的包注释
- 修复导出符号的注释格式

主要修改：
- ApiKey → APIKey（所有出现的地方）
- ApiKeyID → APIKeyID
- ApiKeyIDs → APIKeyIDs
- TestSmtpConnection → TestSMTPConnection
- HtmlURL → HTMLURL
- 添加 20+ 个包注释
- 修复 10+ 个导出符号注释格式

验证结果：
- ✓ golangci-lint: 0 issues
- ✓ 单元测试: 通过
- ✓ 集成测试: 通过

											
										
										
											2026-01-04 19:27:53 +08:00
+									} else if s.cfg != nil && s.cfg.Gateway.InjectBetaForAPIKey && req.Header.Get("anthropic-beta") == "" {
-												fix: 修复 /v1/messages 间歇性 400 错误 (#18)

* fix(upstream): 修复上游格式兼容性问题

- 跳过Claude模型无signature的thinking block
- 支持custom类型工具(MCP)格式转换
- 添加ClaudeCustomToolSpec结构体支持MCP工具
- 添加Custom字段验证，跳过无效custom工具
- 在convertClaudeToolsToGeminiTools中添加schema清理
- 完整的单元测试覆盖，包含边界情况

修复: Issue 0.1 signature缺失, Issue 0.2 custom工具格式
改进: Codex审查发现的2个重要问题

测试:
- TestBuildParts_ThinkingBlockWithoutSignature: 验证thinking block处理
- TestBuildTools_CustomTypeTools: 验证custom工具转换和边界情况
- TestConvertClaudeToolsToGeminiTools_CustomType: 验证service层转换

* feat(gemini): 添加Gemini限额与TierID支持

实现PR1：Gemini限额与TierID功能

后端修改：
- GeminiTokenInfo结构体添加TierID字段
- fetchProjectID函数返回(projectID, tierID, error)
- 从LoadCodeAssist响应中提取tierID（优先IsDefault，回退到第一个非空tier）
- ExchangeCode、RefreshAccountToken、GetAccessToken函数更新以处理tierID
- BuildAccountCredentials函数保存tier_id到credentials

前端修改：
- AccountStatusIndicator组件添加tier显示
- 支持LEGACY/PRO/ULTRA等tier类型的友好显示
- 使用蓝色badge展示tier信息

技术细节：
- tierID提取逻辑：优先选择IsDefault的tier，否则选择第一个非空tier
- 所有fetchProjectID调用点已更新以处理新的返回签名
- 前端gracefully处理missing/unknown tier_id

* refactor(gemini): 优化TierID实现并添加安全验证

根据并发代码审查（code-reviewer, security-auditor, gemini, codex）的反馈进行改进：

安全改进：
- 添加validateTierID函数验证tier_id格式和长度（最大64字符）
- 限制tier_id字符集为字母数字、下划线、连字符和斜杠
- 在BuildAccountCredentials中验证tier_id后再存储
- 静默跳过无效tier_id，不阻塞账户创建

代码质量改进：
- 提取extractTierIDFromAllowedTiers辅助函数消除重复代码
- 重构fetchProjectID函数，tierID提取逻辑只执行一次
- 改进代码可读性和可维护性

审查工具：
- code-reviewer agent (a09848e)
- security-auditor agent (a9a149c)
- gemini CLI (bcc7c81)
- codex (b5d8919)

修复问题：
- HIGH: 未验证的tier_id输入
- MEDIUM: 代码重复（tierID提取逻辑重复2次）

* fix(format): 修复 gofmt 格式问题

- 修复 claude_types.go 中的字段对齐问题
- 修复 gemini_messages_compat_service.go 中的缩进问题

* fix(upstream): 修复上游格式兼容性问题 (#14)

* fix(upstream): 修复上游格式兼容性问题

- 跳过Claude模型无signature的thinking block
- 支持custom类型工具(MCP)格式转换
- 添加ClaudeCustomToolSpec结构体支持MCP工具
- 添加Custom字段验证，跳过无效custom工具
- 在convertClaudeToolsToGeminiTools中添加schema清理
- 完整的单元测试覆盖，包含边界情况

修复: Issue 0.1 signature缺失, Issue 0.2 custom工具格式
改进: Codex审查发现的2个重要问题

测试:
- TestBuildParts_ThinkingBlockWithoutSignature: 验证thinking block处理
- TestBuildTools_CustomTypeTools: 验证custom工具转换和边界情况
- TestConvertClaudeToolsToGeminiTools_CustomType: 验证service层转换

* fix(format): 修复 gofmt 格式问题

- 修复 claude_types.go 中的字段对齐问题
- 修复 gemini_messages_compat_service.go 中的缩进问题

* fix(format): 修复 claude_types.go 的 gofmt 格式问题

* feat(antigravity): 优化 thinking block 和 schema 处理

- 为 dummy thinking block 添加 ThoughtSignature
- 重构 thinking block 处理逻辑，在每个条件分支内创建 part
- 优化 excludedSchemaKeys，移除 Gemini 实际支持的字段
  (minItems, maxItems, minimum, maximum, additionalProperties, format)
- 添加详细注释说明 Gemini API 支持的 schema 字段

* fix(antigravity): 增强 schema 清理的安全性

基于 Codex review 建议：
- 添加 format 字段白名单过滤，只保留 Gemini 支持的 date-time/date/time
- 补充更多不支持的 schema 关键字到黑名单：
  * 组合 schema: oneOf, anyOf, allOf, not, if/then/else
  * 对象验证: minProperties, maxProperties, patternProperties 等
  * 定义引用: $defs, definitions
- 避免不支持的 schema 字段导致 Gemini API 校验失败

* fix(lint): 修复 gemini_messages_compat_service 空分支警告

- 在 cleanToolSchema 的 if 语句中添加 continue
- 移除重复的注释

* fix(antigravity): 移除 minItems/maxItems 以兼容 Claude API

- 将 minItems 和 maxItems 添加到 schema 黑名单
- Claude API (Vertex AI) 不支持这些数组验证字段
- 添加调试日志记录工具 schema 转换过程
- 修复 tools.14.custom.input_schema 验证错误

* fix(antigravity): 修复 additionalProperties schema 对象问题

- 将 additionalProperties 的 schema 对象转换为布尔值 true
- Claude API 只支持 additionalProperties: false，不支持 schema 对象
- 修复 tools.14.custom.input_schema 验证错误
- 参考 Claude 官方文档的 JSON Schema 限制

* fix(antigravity): 修复 Claude 模型 thinking 块兼容性问题

- 完全跳过 Claude 模型的 thinking 块以避免 signature 验证失败
- 只在 Gemini 模型中使用 dummy thought signature
- 修改 additionalProperties 默认值为 false（更安全）
- 添加调试日志以便排查问题

* fix(upstream): 修复跨模型切换时的 dummy signature 问题

基于 Codex review 和用户场景分析的修复：

1. 问题场景
   - Gemini (thinking) → Claude (thinking) 切换时
   - Gemini 返回的 thinking 块使用 dummy signature
   - Claude API 会拒绝 dummy signature，导致 400 错误

2. 修复内容
   - request_transformer.go:262: 跳过 dummy signature
   - 只保留真实的 Claude signature
   - 支持频繁的跨模型切换

3. 其他修复（基于 Codex review）
   - gateway_service.go:691: 修复 io.ReadAll 错误处理
   - gateway_service.go:687: 条件日志（尊重 LogUpstreamErrorBody 配置）
   - gateway_service.go:915: 收紧 400 failover 启发式
   - request_transformer.go:188: 移除签名成功日志

4. 新增功能（默认关闭）
   - 阶段 1: 上游错误日志（GATEWAY_LOG_UPSTREAM_ERROR_BODY）
   - 阶段 2: Antigravity thinking 修复
   - 阶段 3: API-key beta 注入（GATEWAY_INJECT_BETA_FOR_APIKEY）
   - 阶段 3: 智能 400 failover（GATEWAY_FAILOVER_ON_400）

测试：所有测试通过

* fix(lint): 修复 golangci-lint 问题

- 应用 De Morgan 定律简化条件判断
- 修复 gofmt 格式问题
- 移除未使用的 min 函数
											
										
										
											2026-01-01 04:21:18 +08:00
+										// API-key：仅在请求显式使用 beta 特性且客户端未提供时，按需补齐（默认关闭）
 										if requestNeedsBetaFeatures(body) {
-												fix(lint): 修复所有 Go 命名规范问题

- 全局替换 ApiKey → APIKey（类型、字段、方法、变量）
- 修复所有 initialism 命名（API, SMTP, HTML, URL 等）
- 添加所有缺失的包注释
- 修复导出符号的注释格式

主要修改：
- ApiKey → APIKey（所有出现的地方）
- ApiKeyID → APIKeyID
- ApiKeyIDs → APIKeyIDs
- TestSmtpConnection → TestSMTPConnection
- HtmlURL → HTMLURL
- 添加 20+ 个包注释
- 修复 10+ 个导出符号注释格式

验证结果：
- ✓ golangci-lint: 0 issues
- ✓ 单元测试: 通过
- ✓ 集成测试: 通过

											
										
										
											2026-01-04 19:27:53 +08:00
+											if beta := defaultAPIKeyBetaHeader(body); beta != "" {
-												fix: 修复 /v1/messages 间歇性 400 错误 (#18)

* fix(upstream): 修复上游格式兼容性问题

- 跳过Claude模型无signature的thinking block
- 支持custom类型工具(MCP)格式转换
- 添加ClaudeCustomToolSpec结构体支持MCP工具
- 添加Custom字段验证，跳过无效custom工具
- 在convertClaudeToolsToGeminiTools中添加schema清理
- 完整的单元测试覆盖，包含边界情况

修复: Issue 0.1 signature缺失, Issue 0.2 custom工具格式
改进: Codex审查发现的2个重要问题

测试:
- TestBuildParts_ThinkingBlockWithoutSignature: 验证thinking block处理
- TestBuildTools_CustomTypeTools: 验证custom工具转换和边界情况
- TestConvertClaudeToolsToGeminiTools_CustomType: 验证service层转换

* feat(gemini): 添加Gemini限额与TierID支持

实现PR1：Gemini限额与TierID功能

后端修改：
- GeminiTokenInfo结构体添加TierID字段
- fetchProjectID函数返回(projectID, tierID, error)
- 从LoadCodeAssist响应中提取tierID（优先IsDefault，回退到第一个非空tier）
- ExchangeCode、RefreshAccountToken、GetAccessToken函数更新以处理tierID
- BuildAccountCredentials函数保存tier_id到credentials

前端修改：
- AccountStatusIndicator组件添加tier显示
- 支持LEGACY/PRO/ULTRA等tier类型的友好显示
- 使用蓝色badge展示tier信息

技术细节：
- tierID提取逻辑：优先选择IsDefault的tier，否则选择第一个非空tier
- 所有fetchProjectID调用点已更新以处理新的返回签名
- 前端gracefully处理missing/unknown tier_id

* refactor(gemini): 优化TierID实现并添加安全验证

根据并发代码审查（code-reviewer, security-auditor, gemini, codex）的反馈进行改进：

安全改进：
- 添加validateTierID函数验证tier_id格式和长度（最大64字符）
- 限制tier_id字符集为字母数字、下划线、连字符和斜杠
- 在BuildAccountCredentials中验证tier_id后再存储
- 静默跳过无效tier_id，不阻塞账户创建

代码质量改进：
- 提取extractTierIDFromAllowedTiers辅助函数消除重复代码
- 重构fetchProjectID函数，tierID提取逻辑只执行一次
- 改进代码可读性和可维护性

审查工具：
- code-reviewer agent (a09848e)
- security-auditor agent (a9a149c)
- gemini CLI (bcc7c81)
- codex (b5d8919)

修复问题：
- HIGH: 未验证的tier_id输入
- MEDIUM: 代码重复（tierID提取逻辑重复2次）

* fix(format): 修复 gofmt 格式问题

- 修复 claude_types.go 中的字段对齐问题
- 修复 gemini_messages_compat_service.go 中的缩进问题

* fix(upstream): 修复上游格式兼容性问题 (#14)

* fix(upstream): 修复上游格式兼容性问题

- 跳过Claude模型无signature的thinking block
- 支持custom类型工具(MCP)格式转换
- 添加ClaudeCustomToolSpec结构体支持MCP工具
- 添加Custom字段验证，跳过无效custom工具
- 在convertClaudeToolsToGeminiTools中添加schema清理
- 完整的单元测试覆盖，包含边界情况

修复: Issue 0.1 signature缺失, Issue 0.2 custom工具格式
改进: Codex审查发现的2个重要问题

测试:
- TestBuildParts_ThinkingBlockWithoutSignature: 验证thinking block处理
- TestBuildTools_CustomTypeTools: 验证custom工具转换和边界情况
- TestConvertClaudeToolsToGeminiTools_CustomType: 验证service层转换

* fix(format): 修复 gofmt 格式问题

- 修复 claude_types.go 中的字段对齐问题
- 修复 gemini_messages_compat_service.go 中的缩进问题

* fix(format): 修复 claude_types.go 的 gofmt 格式问题

* feat(antigravity): 优化 thinking block 和 schema 处理

- 为 dummy thinking block 添加 ThoughtSignature
- 重构 thinking block 处理逻辑，在每个条件分支内创建 part
- 优化 excludedSchemaKeys，移除 Gemini 实际支持的字段
  (minItems, maxItems, minimum, maximum, additionalProperties, format)
- 添加详细注释说明 Gemini API 支持的 schema 字段

* fix(antigravity): 增强 schema 清理的安全性

基于 Codex review 建议：
- 添加 format 字段白名单过滤，只保留 Gemini 支持的 date-time/date/time
- 补充更多不支持的 schema 关键字到黑名单：
  * 组合 schema: oneOf, anyOf, allOf, not, if/then/else
  * 对象验证: minProperties, maxProperties, patternProperties 等
  * 定义引用: $defs, definitions
- 避免不支持的 schema 字段导致 Gemini API 校验失败

* fix(lint): 修复 gemini_messages_compat_service 空分支警告

- 在 cleanToolSchema 的 if 语句中添加 continue
- 移除重复的注释

* fix(antigravity): 移除 minItems/maxItems 以兼容 Claude API

- 将 minItems 和 maxItems 添加到 schema 黑名单
- Claude API (Vertex AI) 不支持这些数组验证字段
- 添加调试日志记录工具 schema 转换过程
- 修复 tools.14.custom.input_schema 验证错误

* fix(antigravity): 修复 additionalProperties schema 对象问题

- 将 additionalProperties 的 schema 对象转换为布尔值 true
- Claude API 只支持 additionalProperties: false，不支持 schema 对象
- 修复 tools.14.custom.input_schema 验证错误
- 参考 Claude 官方文档的 JSON Schema 限制

* fix(antigravity): 修复 Claude 模型 thinking 块兼容性问题

- 完全跳过 Claude 模型的 thinking 块以避免 signature 验证失败
- 只在 Gemini 模型中使用 dummy thought signature
- 修改 additionalProperties 默认值为 false（更安全）
- 添加调试日志以便排查问题

* fix(upstream): 修复跨模型切换时的 dummy signature 问题

基于 Codex review 和用户场景分析的修复：

1. 问题场景
   - Gemini (thinking) → Claude (thinking) 切换时
   - Gemini 返回的 thinking 块使用 dummy signature
   - Claude API 会拒绝 dummy signature，导致 400 错误

2. 修复内容
   - request_transformer.go:262: 跳过 dummy signature
   - 只保留真实的 Claude signature
   - 支持频繁的跨模型切换

3. 其他修复（基于 Codex review）
   - gateway_service.go:691: 修复 io.ReadAll 错误处理
   - gateway_service.go:687: 条件日志（尊重 LogUpstreamErrorBody 配置）
   - gateway_service.go:915: 收紧 400 failover 启发式
   - request_transformer.go:188: 移除签名成功日志

4. 新增功能（默认关闭）
   - 阶段 1: 上游错误日志（GATEWAY_LOG_UPSTREAM_ERROR_BODY）
   - 阶段 2: Antigravity thinking 修复
   - 阶段 3: API-key beta 注入（GATEWAY_INJECT_BETA_FOR_APIKEY）
   - 阶段 3: 智能 400 failover（GATEWAY_FAILOVER_ON_400）

测试：所有测试通过

* fix(lint): 修复 golangci-lint 问题

- 应用 De Morgan 定律简化条件判断
- 修复 gofmt 格式问题
- 移除未使用的 min 函数
											
										
										
											2026-01-01 04:21:18 +08:00
+												req.Header.Set("anthropic-beta", beta)
 											}
 										}
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									}
-												chore(debug): emit Claude mimic fingerprint on credential-scope error

											
										
										
											2026-01-29 15:17:46 +08:00
+									// Always capture a compact fingerprint line for later error diagnostics.
 									// We only print it when needed (or when the explicit debug flag is enabled).
 									if c != nil && tokenType == "oauth" {
 										c.Set(claudeMimicDebugInfoKey, buildClaudeMimicDebugLine(req, body, account, tokenType, mimicClaudeCode))
 									}
-												chore(debug): log Claude mimic fingerprint

											
										
										
											2026-01-29 03:13:14 +08:00
+									if s.debugClaudeMimicEnabled() {
 										logClaudeMimicDebug(req, body, account, tokenType, mimicClaudeCode)
 									}
-												refactor(backend): service http ports

											
										
										
											2025-12-20 11:56:11 +08:00
+									return req, nil
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+								}
 								// getBetaHeader 处理anthropic-beta header
 								// 对于OAuth账号，需要确保包含oauth-2025-04-20
-												perf(后端): 完成性能优化与连接池配置

新增 DB/Redis 连接池配置与校验，并补充单测

网关请求体大小限制与 413 处理

HTTP/req 客户端池化并调整上游连接池默认值

并发槽位改为 ZSET+Lua 与指数退避

用量统计改 SQL 聚合并新增索引迁移

计费缓存写入改工作池并补测试/基准

测试: 在 backend/ 下运行 go test ./...

											
										
										
											2025-12-31 08:50:12 +08:00
+								func (s *GatewayService) getBetaHeader(modelID string, clientBetaHeader string) string {
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									// 如果客户端传了anthropic-beta
 									if clientBetaHeader != "" {
 										// 已包含oauth beta则直接返回
-												 refactor: 提取 Claude 客户端常量到独立包

  - 新增 internal/pkg/claude 包统一管理 Claude Code 相关常量
  - 统一账号测试逻辑，所有账号类型使用相同的 Claude Code 风格请求
  - 网关服务使用常量包替换硬编码的 beta header 字符串

											
										
										
											2025-12-19 15:22:52 +08:00
+										if strings.Contains(clientBetaHeader, claude.BetaOAuth) {
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+											return clientBetaHeader
 										}
 										// 需要添加oauth beta
 										parts := strings.Split(clientBetaHeader, ",")
 										for i, p := range parts {
 											parts[i] = strings.TrimSpace(p)
 										}
 										// 在claude-code-20250219后面插入oauth beta
 										claudeCodeIdx := -1
 										for i, p := range parts {
-												 refactor: 提取 Claude 客户端常量到独立包

  - 新增 internal/pkg/claude 包统一管理 Claude Code 相关常量
  - 统一账号测试逻辑，所有账号类型使用相同的 Claude Code 风格请求
  - 网关服务使用常量包替换硬编码的 beta header 字符串

											
										
										
											2025-12-19 15:22:52 +08:00
+											if p == claude.BetaClaudeCode {
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+												claudeCodeIdx = i
 												break
 											}
 										}
 										if claudeCodeIdx >= 0 {
 											// 在claude-code后面插入
 											newParts := make([]string, 0, len(parts)+1)
 											newParts = append(newParts, parts[:claudeCodeIdx+1]...)
-												 refactor: 提取 Claude 客户端常量到独立包

  - 新增 internal/pkg/claude 包统一管理 Claude Code 相关常量
  - 统一账号测试逻辑，所有账号类型使用相同的 Claude Code 风格请求
  - 网关服务使用常量包替换硬编码的 beta header 字符串

											
										
										
											2025-12-19 15:22:52 +08:00
+											newParts = append(newParts, claude.BetaOAuth)
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+											newParts = append(newParts, parts[claudeCodeIdx+1:]...)
 											return strings.Join(newParts, ",")
 										}
 										// 没有claude-code，放在第一位
-												 refactor: 提取 Claude 客户端常量到独立包

  - 新增 internal/pkg/claude 包统一管理 Claude Code 相关常量
  - 统一账号测试逻辑，所有账号类型使用相同的 Claude Code 风格请求
  - 网关服务使用常量包替换硬编码的 beta header 字符串

											
										
										
											2025-12-19 15:22:52 +08:00
+										return claude.BetaOAuth + "," + clientBetaHeader
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									}
 									// 客户端没传，根据模型生成
-												perf(后端): 完成性能优化与连接池配置

新增 DB/Redis 连接池配置与校验，并补充单测

网关请求体大小限制与 413 处理

HTTP/req 客户端池化并调整上游连接池默认值

并发槽位改为 ZSET+Lua 与指数退避

用量统计改 SQL 聚合并新增索引迁移

计费缓存写入改工作池并补测试/基准

测试: 在 backend/ 下运行 go test ./...

											
										
										
											2025-12-31 08:50:12 +08:00
+									// haiku 模型不需要 claude-code beta
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									if strings.Contains(strings.ToLower(modelID), "haiku") {
-												 refactor: 提取 Claude 客户端常量到独立包

  - 新增 internal/pkg/claude 包统一管理 Claude Code 相关常量
  - 统一账号测试逻辑，所有账号类型使用相同的 Claude Code 风格请求
  - 网关服务使用常量包替换硬编码的 beta header 字符串

											
										
										
											2025-12-19 15:22:52 +08:00
+										return claude.HaikuBetaHeader
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									}
-												 refactor: 提取 Claude 客户端常量到独立包

  - 新增 internal/pkg/claude 包统一管理 Claude Code 相关常量
  - 统一账号测试逻辑，所有账号类型使用相同的 Claude Code 风格请求
  - 网关服务使用常量包替换硬编码的 beta header 字符串

											
										
										
											2025-12-19 15:22:52 +08:00
+									return claude.DefaultBetaHeader
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+								}
-												fix: 修复 /v1/messages 间歇性 400 错误 (#18)

* fix(upstream): 修复上游格式兼容性问题

- 跳过Claude模型无signature的thinking block
- 支持custom类型工具(MCP)格式转换
- 添加ClaudeCustomToolSpec结构体支持MCP工具
- 添加Custom字段验证，跳过无效custom工具
- 在convertClaudeToolsToGeminiTools中添加schema清理
- 完整的单元测试覆盖，包含边界情况

修复: Issue 0.1 signature缺失, Issue 0.2 custom工具格式
改进: Codex审查发现的2个重要问题

测试:
- TestBuildParts_ThinkingBlockWithoutSignature: 验证thinking block处理
- TestBuildTools_CustomTypeTools: 验证custom工具转换和边界情况
- TestConvertClaudeToolsToGeminiTools_CustomType: 验证service层转换

* feat(gemini): 添加Gemini限额与TierID支持

实现PR1：Gemini限额与TierID功能

后端修改：
- GeminiTokenInfo结构体添加TierID字段
- fetchProjectID函数返回(projectID, tierID, error)
- 从LoadCodeAssist响应中提取tierID（优先IsDefault，回退到第一个非空tier）
- ExchangeCode、RefreshAccountToken、GetAccessToken函数更新以处理tierID
- BuildAccountCredentials函数保存tier_id到credentials

前端修改：
- AccountStatusIndicator组件添加tier显示
- 支持LEGACY/PRO/ULTRA等tier类型的友好显示
- 使用蓝色badge展示tier信息

技术细节：
- tierID提取逻辑：优先选择IsDefault的tier，否则选择第一个非空tier
- 所有fetchProjectID调用点已更新以处理新的返回签名
- 前端gracefully处理missing/unknown tier_id

* refactor(gemini): 优化TierID实现并添加安全验证

根据并发代码审查（code-reviewer, security-auditor, gemini, codex）的反馈进行改进：

安全改进：
- 添加validateTierID函数验证tier_id格式和长度（最大64字符）
- 限制tier_id字符集为字母数字、下划线、连字符和斜杠
- 在BuildAccountCredentials中验证tier_id后再存储
- 静默跳过无效tier_id，不阻塞账户创建

代码质量改进：
- 提取extractTierIDFromAllowedTiers辅助函数消除重复代码
- 重构fetchProjectID函数，tierID提取逻辑只执行一次
- 改进代码可读性和可维护性

审查工具：
- code-reviewer agent (a09848e)
- security-auditor agent (a9a149c)
- gemini CLI (bcc7c81)
- codex (b5d8919)

修复问题：
- HIGH: 未验证的tier_id输入
- MEDIUM: 代码重复（tierID提取逻辑重复2次）

* fix(format): 修复 gofmt 格式问题

- 修复 claude_types.go 中的字段对齐问题
- 修复 gemini_messages_compat_service.go 中的缩进问题

* fix(upstream): 修复上游格式兼容性问题 (#14)

* fix(upstream): 修复上游格式兼容性问题

- 跳过Claude模型无signature的thinking block
- 支持custom类型工具(MCP)格式转换
- 添加ClaudeCustomToolSpec结构体支持MCP工具
- 添加Custom字段验证，跳过无效custom工具
- 在convertClaudeToolsToGeminiTools中添加schema清理
- 完整的单元测试覆盖，包含边界情况

修复: Issue 0.1 signature缺失, Issue 0.2 custom工具格式
改进: Codex审查发现的2个重要问题

测试:
- TestBuildParts_ThinkingBlockWithoutSignature: 验证thinking block处理
- TestBuildTools_CustomTypeTools: 验证custom工具转换和边界情况
- TestConvertClaudeToolsToGeminiTools_CustomType: 验证service层转换

* fix(format): 修复 gofmt 格式问题

- 修复 claude_types.go 中的字段对齐问题
- 修复 gemini_messages_compat_service.go 中的缩进问题

* fix(format): 修复 claude_types.go 的 gofmt 格式问题

* feat(antigravity): 优化 thinking block 和 schema 处理

- 为 dummy thinking block 添加 ThoughtSignature
- 重构 thinking block 处理逻辑，在每个条件分支内创建 part
- 优化 excludedSchemaKeys，移除 Gemini 实际支持的字段
  (minItems, maxItems, minimum, maximum, additionalProperties, format)
- 添加详细注释说明 Gemini API 支持的 schema 字段

* fix(antigravity): 增强 schema 清理的安全性

基于 Codex review 建议：
- 添加 format 字段白名单过滤，只保留 Gemini 支持的 date-time/date/time
- 补充更多不支持的 schema 关键字到黑名单：
  * 组合 schema: oneOf, anyOf, allOf, not, if/then/else
  * 对象验证: minProperties, maxProperties, patternProperties 等
  * 定义引用: $defs, definitions
- 避免不支持的 schema 字段导致 Gemini API 校验失败

* fix(lint): 修复 gemini_messages_compat_service 空分支警告

- 在 cleanToolSchema 的 if 语句中添加 continue
- 移除重复的注释

* fix(antigravity): 移除 minItems/maxItems 以兼容 Claude API

- 将 minItems 和 maxItems 添加到 schema 黑名单
- Claude API (Vertex AI) 不支持这些数组验证字段
- 添加调试日志记录工具 schema 转换过程
- 修复 tools.14.custom.input_schema 验证错误

* fix(antigravity): 修复 additionalProperties schema 对象问题

- 将 additionalProperties 的 schema 对象转换为布尔值 true
- Claude API 只支持 additionalProperties: false，不支持 schema 对象
- 修复 tools.14.custom.input_schema 验证错误
- 参考 Claude 官方文档的 JSON Schema 限制

* fix(antigravity): 修复 Claude 模型 thinking 块兼容性问题

- 完全跳过 Claude 模型的 thinking 块以避免 signature 验证失败
- 只在 Gemini 模型中使用 dummy thought signature
- 修改 additionalProperties 默认值为 false（更安全）
- 添加调试日志以便排查问题

* fix(upstream): 修复跨模型切换时的 dummy signature 问题

基于 Codex review 和用户场景分析的修复：

1. 问题场景
   - Gemini (thinking) → Claude (thinking) 切换时
   - Gemini 返回的 thinking 块使用 dummy signature
   - Claude API 会拒绝 dummy signature，导致 400 错误

2. 修复内容
   - request_transformer.go:262: 跳过 dummy signature
   - 只保留真实的 Claude signature
   - 支持频繁的跨模型切换

3. 其他修复（基于 Codex review）
   - gateway_service.go:691: 修复 io.ReadAll 错误处理
   - gateway_service.go:687: 条件日志（尊重 LogUpstreamErrorBody 配置）
   - gateway_service.go:915: 收紧 400 failover 启发式
   - request_transformer.go:188: 移除签名成功日志

4. 新增功能（默认关闭）
   - 阶段 1: 上游错误日志（GATEWAY_LOG_UPSTREAM_ERROR_BODY）
   - 阶段 2: Antigravity thinking 修复
   - 阶段 3: API-key beta 注入（GATEWAY_INJECT_BETA_FOR_APIKEY）
   - 阶段 3: 智能 400 failover（GATEWAY_FAILOVER_ON_400）

测试：所有测试通过

* fix(lint): 修复 golangci-lint 问题

- 应用 De Morgan 定律简化条件判断
- 修复 gofmt 格式问题
- 移除未使用的 min 函数
											
										
										
											2026-01-01 04:21:18 +08:00
+								func requestNeedsBetaFeatures(body []byte) bool {
 									tools := gjson.GetBytes(body, "tools")
 									if tools.Exists() && tools.IsArray() && len(tools.Array()) > 0 {
 										return true
 									}
 									if strings.EqualFold(gjson.GetBytes(body, "thinking.type").String(), "enabled") {
 										return true
 									}
 									return false
 								}
-												fix(lint): 修复所有 Go 命名规范问题

- 全局替换 ApiKey → APIKey（类型、字段、方法、变量）
- 修复所有 initialism 命名（API, SMTP, HTML, URL 等）
- 添加所有缺失的包注释
- 修复导出符号的注释格式

主要修改：
- ApiKey → APIKey（所有出现的地方）
- ApiKeyID → APIKeyID
- ApiKeyIDs → APIKeyIDs
- TestSmtpConnection → TestSMTPConnection
- HtmlURL → HTMLURL
- 添加 20+ 个包注释
- 修复 10+ 个导出符号注释格式

验证结果：
- ✓ golangci-lint: 0 issues
- ✓ 单元测试: 通过
- ✓ 集成测试: 通过

											
										
										
											2026-01-04 19:27:53 +08:00
+								func defaultAPIKeyBetaHeader(body []byte) string {
-												fix: 修复 /v1/messages 间歇性 400 错误 (#18)

* fix(upstream): 修复上游格式兼容性问题

- 跳过Claude模型无signature的thinking block
- 支持custom类型工具(MCP)格式转换
- 添加ClaudeCustomToolSpec结构体支持MCP工具
- 添加Custom字段验证，跳过无效custom工具
- 在convertClaudeToolsToGeminiTools中添加schema清理
- 完整的单元测试覆盖，包含边界情况

修复: Issue 0.1 signature缺失, Issue 0.2 custom工具格式
改进: Codex审查发现的2个重要问题

测试:
- TestBuildParts_ThinkingBlockWithoutSignature: 验证thinking block处理
- TestBuildTools_CustomTypeTools: 验证custom工具转换和边界情况
- TestConvertClaudeToolsToGeminiTools_CustomType: 验证service层转换

* feat(gemini): 添加Gemini限额与TierID支持

实现PR1：Gemini限额与TierID功能

后端修改：
- GeminiTokenInfo结构体添加TierID字段
- fetchProjectID函数返回(projectID, tierID, error)
- 从LoadCodeAssist响应中提取tierID（优先IsDefault，回退到第一个非空tier）
- ExchangeCode、RefreshAccountToken、GetAccessToken函数更新以处理tierID
- BuildAccountCredentials函数保存tier_id到credentials

前端修改：
- AccountStatusIndicator组件添加tier显示
- 支持LEGACY/PRO/ULTRA等tier类型的友好显示
- 使用蓝色badge展示tier信息

技术细节：
- tierID提取逻辑：优先选择IsDefault的tier，否则选择第一个非空tier
- 所有fetchProjectID调用点已更新以处理新的返回签名
- 前端gracefully处理missing/unknown tier_id

* refactor(gemini): 优化TierID实现并添加安全验证

根据并发代码审查（code-reviewer, security-auditor, gemini, codex）的反馈进行改进：

安全改进：
- 添加validateTierID函数验证tier_id格式和长度（最大64字符）
- 限制tier_id字符集为字母数字、下划线、连字符和斜杠
- 在BuildAccountCredentials中验证tier_id后再存储
- 静默跳过无效tier_id，不阻塞账户创建

代码质量改进：
- 提取extractTierIDFromAllowedTiers辅助函数消除重复代码
- 重构fetchProjectID函数，tierID提取逻辑只执行一次
- 改进代码可读性和可维护性

审查工具：
- code-reviewer agent (a09848e)
- security-auditor agent (a9a149c)
- gemini CLI (bcc7c81)
- codex (b5d8919)

修复问题：
- HIGH: 未验证的tier_id输入
- MEDIUM: 代码重复（tierID提取逻辑重复2次）

* fix(format): 修复 gofmt 格式问题

- 修复 claude_types.go 中的字段对齐问题
- 修复 gemini_messages_compat_service.go 中的缩进问题

* fix(upstream): 修复上游格式兼容性问题 (#14)

* fix(upstream): 修复上游格式兼容性问题

- 跳过Claude模型无signature的thinking block
- 支持custom类型工具(MCP)格式转换
- 添加ClaudeCustomToolSpec结构体支持MCP工具
- 添加Custom字段验证，跳过无效custom工具
- 在convertClaudeToolsToGeminiTools中添加schema清理
- 完整的单元测试覆盖，包含边界情况

修复: Issue 0.1 signature缺失, Issue 0.2 custom工具格式
改进: Codex审查发现的2个重要问题

测试:
- TestBuildParts_ThinkingBlockWithoutSignature: 验证thinking block处理
- TestBuildTools_CustomTypeTools: 验证custom工具转换和边界情况
- TestConvertClaudeToolsToGeminiTools_CustomType: 验证service层转换

* fix(format): 修复 gofmt 格式问题

- 修复 claude_types.go 中的字段对齐问题
- 修复 gemini_messages_compat_service.go 中的缩进问题

* fix(format): 修复 claude_types.go 的 gofmt 格式问题

* feat(antigravity): 优化 thinking block 和 schema 处理

- 为 dummy thinking block 添加 ThoughtSignature
- 重构 thinking block 处理逻辑，在每个条件分支内创建 part
- 优化 excludedSchemaKeys，移除 Gemini 实际支持的字段
  (minItems, maxItems, minimum, maximum, additionalProperties, format)
- 添加详细注释说明 Gemini API 支持的 schema 字段

* fix(antigravity): 增强 schema 清理的安全性

基于 Codex review 建议：
- 添加 format 字段白名单过滤，只保留 Gemini 支持的 date-time/date/time
- 补充更多不支持的 schema 关键字到黑名单：
  * 组合 schema: oneOf, anyOf, allOf, not, if/then/else
  * 对象验证: minProperties, maxProperties, patternProperties 等
  * 定义引用: $defs, definitions
- 避免不支持的 schema 字段导致 Gemini API 校验失败

* fix(lint): 修复 gemini_messages_compat_service 空分支警告

- 在 cleanToolSchema 的 if 语句中添加 continue
- 移除重复的注释

* fix(antigravity): 移除 minItems/maxItems 以兼容 Claude API

- 将 minItems 和 maxItems 添加到 schema 黑名单
- Claude API (Vertex AI) 不支持这些数组验证字段
- 添加调试日志记录工具 schema 转换过程
- 修复 tools.14.custom.input_schema 验证错误

* fix(antigravity): 修复 additionalProperties schema 对象问题

- 将 additionalProperties 的 schema 对象转换为布尔值 true
- Claude API 只支持 additionalProperties: false，不支持 schema 对象
- 修复 tools.14.custom.input_schema 验证错误
- 参考 Claude 官方文档的 JSON Schema 限制

* fix(antigravity): 修复 Claude 模型 thinking 块兼容性问题

- 完全跳过 Claude 模型的 thinking 块以避免 signature 验证失败
- 只在 Gemini 模型中使用 dummy thought signature
- 修改 additionalProperties 默认值为 false（更安全）
- 添加调试日志以便排查问题

* fix(upstream): 修复跨模型切换时的 dummy signature 问题

基于 Codex review 和用户场景分析的修复：

1. 问题场景
   - Gemini (thinking) → Claude (thinking) 切换时
   - Gemini 返回的 thinking 块使用 dummy signature
   - Claude API 会拒绝 dummy signature，导致 400 错误

2. 修复内容
   - request_transformer.go:262: 跳过 dummy signature
   - 只保留真实的 Claude signature
   - 支持频繁的跨模型切换

3. 其他修复（基于 Codex review）
   - gateway_service.go:691: 修复 io.ReadAll 错误处理
   - gateway_service.go:687: 条件日志（尊重 LogUpstreamErrorBody 配置）
   - gateway_service.go:915: 收紧 400 failover 启发式
   - request_transformer.go:188: 移除签名成功日志

4. 新增功能（默认关闭）
   - 阶段 1: 上游错误日志（GATEWAY_LOG_UPSTREAM_ERROR_BODY）
   - 阶段 2: Antigravity thinking 修复
   - 阶段 3: API-key beta 注入（GATEWAY_INJECT_BETA_FOR_APIKEY）
   - 阶段 3: 智能 400 failover（GATEWAY_FAILOVER_ON_400）

测试：所有测试通过

* fix(lint): 修复 golangci-lint 问题

- 应用 De Morgan 定律简化条件判断
- 修复 gofmt 格式问题
- 移除未使用的 min 函数
											
										
										
											2026-01-01 04:21:18 +08:00
+									modelID := gjson.GetBytes(body, "model").String()
 									if strings.Contains(strings.ToLower(modelID), "haiku") {
-												fix(lint): 修复所有 Go 命名规范问题

- 全局替换 ApiKey → APIKey（类型、字段、方法、变量）
- 修复所有 initialism 命名（API, SMTP, HTML, URL 等）
- 添加所有缺失的包注释
- 修复导出符号的注释格式

主要修改：
- ApiKey → APIKey（所有出现的地方）
- ApiKeyID → APIKeyID
- ApiKeyIDs → APIKeyIDs
- TestSmtpConnection → TestSMTPConnection
- HtmlURL → HTMLURL
- 添加 20+ 个包注释
- 修复 10+ 个导出符号注释格式

验证结果：
- ✓ golangci-lint: 0 issues
- ✓ 单元测试: 通过
- ✓ 集成测试: 通过

											
										
										
											2026-01-04 19:27:53 +08:00
+										return claude.APIKeyHaikuBetaHeader
-												fix: 修复 /v1/messages 间歇性 400 错误 (#18)

* fix(upstream): 修复上游格式兼容性问题

- 跳过Claude模型无signature的thinking block
- 支持custom类型工具(MCP)格式转换
- 添加ClaudeCustomToolSpec结构体支持MCP工具
- 添加Custom字段验证，跳过无效custom工具
- 在convertClaudeToolsToGeminiTools中添加schema清理
- 完整的单元测试覆盖，包含边界情况

修复: Issue 0.1 signature缺失, Issue 0.2 custom工具格式
改进: Codex审查发现的2个重要问题

测试:
- TestBuildParts_ThinkingBlockWithoutSignature: 验证thinking block处理
- TestBuildTools_CustomTypeTools: 验证custom工具转换和边界情况
- TestConvertClaudeToolsToGeminiTools_CustomType: 验证service层转换

* feat(gemini): 添加Gemini限额与TierID支持

实现PR1：Gemini限额与TierID功能

后端修改：
- GeminiTokenInfo结构体添加TierID字段
- fetchProjectID函数返回(projectID, tierID, error)
- 从LoadCodeAssist响应中提取tierID（优先IsDefault，回退到第一个非空tier）
- ExchangeCode、RefreshAccountToken、GetAccessToken函数更新以处理tierID
- BuildAccountCredentials函数保存tier_id到credentials

前端修改：
- AccountStatusIndicator组件添加tier显示
- 支持LEGACY/PRO/ULTRA等tier类型的友好显示
- 使用蓝色badge展示tier信息

技术细节：
- tierID提取逻辑：优先选择IsDefault的tier，否则选择第一个非空tier
- 所有fetchProjectID调用点已更新以处理新的返回签名
- 前端gracefully处理missing/unknown tier_id

* refactor(gemini): 优化TierID实现并添加安全验证

根据并发代码审查（code-reviewer, security-auditor, gemini, codex）的反馈进行改进：

安全改进：
- 添加validateTierID函数验证tier_id格式和长度（最大64字符）
- 限制tier_id字符集为字母数字、下划线、连字符和斜杠
- 在BuildAccountCredentials中验证tier_id后再存储
- 静默跳过无效tier_id，不阻塞账户创建

代码质量改进：
- 提取extractTierIDFromAllowedTiers辅助函数消除重复代码
- 重构fetchProjectID函数，tierID提取逻辑只执行一次
- 改进代码可读性和可维护性

审查工具：
- code-reviewer agent (a09848e)
- security-auditor agent (a9a149c)
- gemini CLI (bcc7c81)
- codex (b5d8919)

修复问题：
- HIGH: 未验证的tier_id输入
- MEDIUM: 代码重复（tierID提取逻辑重复2次）

* fix(format): 修复 gofmt 格式问题

- 修复 claude_types.go 中的字段对齐问题
- 修复 gemini_messages_compat_service.go 中的缩进问题

* fix(upstream): 修复上游格式兼容性问题 (#14)

* fix(upstream): 修复上游格式兼容性问题

- 跳过Claude模型无signature的thinking block
- 支持custom类型工具(MCP)格式转换
- 添加ClaudeCustomToolSpec结构体支持MCP工具
- 添加Custom字段验证，跳过无效custom工具
- 在convertClaudeToolsToGeminiTools中添加schema清理
- 完整的单元测试覆盖，包含边界情况

修复: Issue 0.1 signature缺失, Issue 0.2 custom工具格式
改进: Codex审查发现的2个重要问题

测试:
- TestBuildParts_ThinkingBlockWithoutSignature: 验证thinking block处理
- TestBuildTools_CustomTypeTools: 验证custom工具转换和边界情况
- TestConvertClaudeToolsToGeminiTools_CustomType: 验证service层转换

* fix(format): 修复 gofmt 格式问题

- 修复 claude_types.go 中的字段对齐问题
- 修复 gemini_messages_compat_service.go 中的缩进问题

* fix(format): 修复 claude_types.go 的 gofmt 格式问题

* feat(antigravity): 优化 thinking block 和 schema 处理

- 为 dummy thinking block 添加 ThoughtSignature
- 重构 thinking block 处理逻辑，在每个条件分支内创建 part
- 优化 excludedSchemaKeys，移除 Gemini 实际支持的字段
  (minItems, maxItems, minimum, maximum, additionalProperties, format)
- 添加详细注释说明 Gemini API 支持的 schema 字段

* fix(antigravity): 增强 schema 清理的安全性

基于 Codex review 建议：
- 添加 format 字段白名单过滤，只保留 Gemini 支持的 date-time/date/time
- 补充更多不支持的 schema 关键字到黑名单：
  * 组合 schema: oneOf, anyOf, allOf, not, if/then/else
  * 对象验证: minProperties, maxProperties, patternProperties 等
  * 定义引用: $defs, definitions
- 避免不支持的 schema 字段导致 Gemini API 校验失败

* fix(lint): 修复 gemini_messages_compat_service 空分支警告

- 在 cleanToolSchema 的 if 语句中添加 continue
- 移除重复的注释

* fix(antigravity): 移除 minItems/maxItems 以兼容 Claude API

- 将 minItems 和 maxItems 添加到 schema 黑名单
- Claude API (Vertex AI) 不支持这些数组验证字段
- 添加调试日志记录工具 schema 转换过程
- 修复 tools.14.custom.input_schema 验证错误

* fix(antigravity): 修复 additionalProperties schema 对象问题

- 将 additionalProperties 的 schema 对象转换为布尔值 true
- Claude API 只支持 additionalProperties: false，不支持 schema 对象
- 修复 tools.14.custom.input_schema 验证错误
- 参考 Claude 官方文档的 JSON Schema 限制

* fix(antigravity): 修复 Claude 模型 thinking 块兼容性问题

- 完全跳过 Claude 模型的 thinking 块以避免 signature 验证失败
- 只在 Gemini 模型中使用 dummy thought signature
- 修改 additionalProperties 默认值为 false（更安全）
- 添加调试日志以便排查问题

* fix(upstream): 修复跨模型切换时的 dummy signature 问题

基于 Codex review 和用户场景分析的修复：

1. 问题场景
   - Gemini (thinking) → Claude (thinking) 切换时
   - Gemini 返回的 thinking 块使用 dummy signature
   - Claude API 会拒绝 dummy signature，导致 400 错误

2. 修复内容
   - request_transformer.go:262: 跳过 dummy signature
   - 只保留真实的 Claude signature
   - 支持频繁的跨模型切换

3. 其他修复（基于 Codex review）
   - gateway_service.go:691: 修复 io.ReadAll 错误处理
   - gateway_service.go:687: 条件日志（尊重 LogUpstreamErrorBody 配置）
   - gateway_service.go:915: 收紧 400 failover 启发式
   - request_transformer.go:188: 移除签名成功日志

4. 新增功能（默认关闭）
   - 阶段 1: 上游错误日志（GATEWAY_LOG_UPSTREAM_ERROR_BODY）
   - 阶段 2: Antigravity thinking 修复
   - 阶段 3: API-key beta 注入（GATEWAY_INJECT_BETA_FOR_APIKEY）
   - 阶段 3: 智能 400 failover（GATEWAY_FAILOVER_ON_400）

测试：所有测试通过

* fix(lint): 修复 golangci-lint 问题

- 应用 De Morgan 定律简化条件判断
- 修复 gofmt 格式问题
- 移除未使用的 min 函数
											
										
										
											2026-01-01 04:21:18 +08:00
+									}
-												fix(lint): 修复所有 Go 命名规范问题

- 全局替换 ApiKey → APIKey（类型、字段、方法、变量）
- 修复所有 initialism 命名（API, SMTP, HTML, URL 等）
- 添加所有缺失的包注释
- 修复导出符号的注释格式

主要修改：
- ApiKey → APIKey（所有出现的地方）
- ApiKeyID → APIKeyID
- ApiKeyIDs → APIKeyIDs
- TestSmtpConnection → TestSMTPConnection
- HtmlURL → HTMLURL
- 添加 20+ 个包注释
- 修复 10+ 个导出符号注释格式

验证结果：
- ✓ golangci-lint: 0 issues
- ✓ 单元测试: 通过
- ✓ 集成测试: 通过

											
										
										
											2026-01-04 19:27:53 +08:00
+									return claude.APIKeyBetaHeader
-												fix: 修复 /v1/messages 间歇性 400 错误 (#18)

* fix(upstream): 修复上游格式兼容性问题

- 跳过Claude模型无signature的thinking block
- 支持custom类型工具(MCP)格式转换
- 添加ClaudeCustomToolSpec结构体支持MCP工具
- 添加Custom字段验证，跳过无效custom工具
- 在convertClaudeToolsToGeminiTools中添加schema清理
- 完整的单元测试覆盖，包含边界情况

修复: Issue 0.1 signature缺失, Issue 0.2 custom工具格式
改进: Codex审查发现的2个重要问题

测试:
- TestBuildParts_ThinkingBlockWithoutSignature: 验证thinking block处理
- TestBuildTools_CustomTypeTools: 验证custom工具转换和边界情况
- TestConvertClaudeToolsToGeminiTools_CustomType: 验证service层转换

* feat(gemini): 添加Gemini限额与TierID支持

实现PR1：Gemini限额与TierID功能

后端修改：
- GeminiTokenInfo结构体添加TierID字段
- fetchProjectID函数返回(projectID, tierID, error)
- 从LoadCodeAssist响应中提取tierID（优先IsDefault，回退到第一个非空tier）
- ExchangeCode、RefreshAccountToken、GetAccessToken函数更新以处理tierID
- BuildAccountCredentials函数保存tier_id到credentials

前端修改：
- AccountStatusIndicator组件添加tier显示
- 支持LEGACY/PRO/ULTRA等tier类型的友好显示
- 使用蓝色badge展示tier信息

技术细节：
- tierID提取逻辑：优先选择IsDefault的tier，否则选择第一个非空tier
- 所有fetchProjectID调用点已更新以处理新的返回签名
- 前端gracefully处理missing/unknown tier_id

* refactor(gemini): 优化TierID实现并添加安全验证

根据并发代码审查（code-reviewer, security-auditor, gemini, codex）的反馈进行改进：

安全改进：
- 添加validateTierID函数验证tier_id格式和长度（最大64字符）
- 限制tier_id字符集为字母数字、下划线、连字符和斜杠
- 在BuildAccountCredentials中验证tier_id后再存储
- 静默跳过无效tier_id，不阻塞账户创建

代码质量改进：
- 提取extractTierIDFromAllowedTiers辅助函数消除重复代码
- 重构fetchProjectID函数，tierID提取逻辑只执行一次
- 改进代码可读性和可维护性

审查工具：
- code-reviewer agent (a09848e)
- security-auditor agent (a9a149c)
- gemini CLI (bcc7c81)
- codex (b5d8919)

修复问题：
- HIGH: 未验证的tier_id输入
- MEDIUM: 代码重复（tierID提取逻辑重复2次）

* fix(format): 修复 gofmt 格式问题

- 修复 claude_types.go 中的字段对齐问题
- 修复 gemini_messages_compat_service.go 中的缩进问题

* fix(upstream): 修复上游格式兼容性问题 (#14)

* fix(upstream): 修复上游格式兼容性问题

- 跳过Claude模型无signature的thinking block
- 支持custom类型工具(MCP)格式转换
- 添加ClaudeCustomToolSpec结构体支持MCP工具
- 添加Custom字段验证，跳过无效custom工具
- 在convertClaudeToolsToGeminiTools中添加schema清理
- 完整的单元测试覆盖，包含边界情况

修复: Issue 0.1 signature缺失, Issue 0.2 custom工具格式
改进: Codex审查发现的2个重要问题

测试:
- TestBuildParts_ThinkingBlockWithoutSignature: 验证thinking block处理
- TestBuildTools_CustomTypeTools: 验证custom工具转换和边界情况
- TestConvertClaudeToolsToGeminiTools_CustomType: 验证service层转换

* fix(format): 修复 gofmt 格式问题

- 修复 claude_types.go 中的字段对齐问题
- 修复 gemini_messages_compat_service.go 中的缩进问题

* fix(format): 修复 claude_types.go 的 gofmt 格式问题

* feat(antigravity): 优化 thinking block 和 schema 处理

- 为 dummy thinking block 添加 ThoughtSignature
- 重构 thinking block 处理逻辑，在每个条件分支内创建 part
- 优化 excludedSchemaKeys，移除 Gemini 实际支持的字段
  (minItems, maxItems, minimum, maximum, additionalProperties, format)
- 添加详细注释说明 Gemini API 支持的 schema 字段

* fix(antigravity): 增强 schema 清理的安全性

基于 Codex review 建议：
- 添加 format 字段白名单过滤，只保留 Gemini 支持的 date-time/date/time
- 补充更多不支持的 schema 关键字到黑名单：
  * 组合 schema: oneOf, anyOf, allOf, not, if/then/else
  * 对象验证: minProperties, maxProperties, patternProperties 等
  * 定义引用: $defs, definitions
- 避免不支持的 schema 字段导致 Gemini API 校验失败

* fix(lint): 修复 gemini_messages_compat_service 空分支警告

- 在 cleanToolSchema 的 if 语句中添加 continue
- 移除重复的注释

* fix(antigravity): 移除 minItems/maxItems 以兼容 Claude API

- 将 minItems 和 maxItems 添加到 schema 黑名单
- Claude API (Vertex AI) 不支持这些数组验证字段
- 添加调试日志记录工具 schema 转换过程
- 修复 tools.14.custom.input_schema 验证错误

* fix(antigravity): 修复 additionalProperties schema 对象问题

- 将 additionalProperties 的 schema 对象转换为布尔值 true
- Claude API 只支持 additionalProperties: false，不支持 schema 对象
- 修复 tools.14.custom.input_schema 验证错误
- 参考 Claude 官方文档的 JSON Schema 限制

* fix(antigravity): 修复 Claude 模型 thinking 块兼容性问题

- 完全跳过 Claude 模型的 thinking 块以避免 signature 验证失败
- 只在 Gemini 模型中使用 dummy thought signature
- 修改 additionalProperties 默认值为 false（更安全）
- 添加调试日志以便排查问题

* fix(upstream): 修复跨模型切换时的 dummy signature 问题

基于 Codex review 和用户场景分析的修复：

1. 问题场景
   - Gemini (thinking) → Claude (thinking) 切换时
   - Gemini 返回的 thinking 块使用 dummy signature
   - Claude API 会拒绝 dummy signature，导致 400 错误

2. 修复内容
   - request_transformer.go:262: 跳过 dummy signature
   - 只保留真实的 Claude signature
   - 支持频繁的跨模型切换

3. 其他修复（基于 Codex review）
   - gateway_service.go:691: 修复 io.ReadAll 错误处理
   - gateway_service.go:687: 条件日志（尊重 LogUpstreamErrorBody 配置）
   - gateway_service.go:915: 收紧 400 failover 启发式
   - request_transformer.go:188: 移除签名成功日志

4. 新增功能（默认关闭）
   - 阶段 1: 上游错误日志（GATEWAY_LOG_UPSTREAM_ERROR_BODY）
   - 阶段 2: Antigravity thinking 修复
   - 阶段 3: API-key beta 注入（GATEWAY_INJECT_BETA_FOR_APIKEY）
   - 阶段 3: 智能 400 failover（GATEWAY_FAILOVER_ON_400）

测试：所有测试通过

* fix(lint): 修复 golangci-lint 问题

- 应用 De Morgan 定律简化条件判断
- 修复 gofmt 格式问题
- 移除未使用的 min 函数
											
										
										
											2026-01-01 04:21:18 +08:00
+								}
-												fix(网关): 对齐 Claude OAuth 请求适配

											
										
										
											2026-01-15 18:54:42 +08:00
+								func applyClaudeOAuthHeaderDefaults(req *http.Request, isStream bool) {
 									if req == nil {
 										return
-												fix: 修复 /v1/messages 间歇性 400 错误 (#18)

* fix(upstream): 修复上游格式兼容性问题

- 跳过Claude模型无signature的thinking block
- 支持custom类型工具(MCP)格式转换
- 添加ClaudeCustomToolSpec结构体支持MCP工具
- 添加Custom字段验证，跳过无效custom工具
- 在convertClaudeToolsToGeminiTools中添加schema清理
- 完整的单元测试覆盖，包含边界情况

修复: Issue 0.1 signature缺失, Issue 0.2 custom工具格式
改进: Codex审查发现的2个重要问题

测试:
- TestBuildParts_ThinkingBlockWithoutSignature: 验证thinking block处理
- TestBuildTools_CustomTypeTools: 验证custom工具转换和边界情况
- TestConvertClaudeToolsToGeminiTools_CustomType: 验证service层转换

* feat(gemini): 添加Gemini限额与TierID支持

实现PR1：Gemini限额与TierID功能

后端修改：
- GeminiTokenInfo结构体添加TierID字段
- fetchProjectID函数返回(projectID, tierID, error)
- 从LoadCodeAssist响应中提取tierID（优先IsDefault，回退到第一个非空tier）
- ExchangeCode、RefreshAccountToken、GetAccessToken函数更新以处理tierID
- BuildAccountCredentials函数保存tier_id到credentials

前端修改：
- AccountStatusIndicator组件添加tier显示
- 支持LEGACY/PRO/ULTRA等tier类型的友好显示
- 使用蓝色badge展示tier信息

技术细节：
- tierID提取逻辑：优先选择IsDefault的tier，否则选择第一个非空tier
- 所有fetchProjectID调用点已更新以处理新的返回签名
- 前端gracefully处理missing/unknown tier_id

* refactor(gemini): 优化TierID实现并添加安全验证

根据并发代码审查（code-reviewer, security-auditor, gemini, codex）的反馈进行改进：

安全改进：
- 添加validateTierID函数验证tier_id格式和长度（最大64字符）
- 限制tier_id字符集为字母数字、下划线、连字符和斜杠
- 在BuildAccountCredentials中验证tier_id后再存储
- 静默跳过无效tier_id，不阻塞账户创建

代码质量改进：
- 提取extractTierIDFromAllowedTiers辅助函数消除重复代码
- 重构fetchProjectID函数，tierID提取逻辑只执行一次
- 改进代码可读性和可维护性

审查工具：
- code-reviewer agent (a09848e)
- security-auditor agent (a9a149c)
- gemini CLI (bcc7c81)
- codex (b5d8919)

修复问题：
- HIGH: 未验证的tier_id输入
- MEDIUM: 代码重复（tierID提取逻辑重复2次）

* fix(format): 修复 gofmt 格式问题

- 修复 claude_types.go 中的字段对齐问题
- 修复 gemini_messages_compat_service.go 中的缩进问题

* fix(upstream): 修复上游格式兼容性问题 (#14)

* fix(upstream): 修复上游格式兼容性问题

- 跳过Claude模型无signature的thinking block
- 支持custom类型工具(MCP)格式转换
- 添加ClaudeCustomToolSpec结构体支持MCP工具
- 添加Custom字段验证，跳过无效custom工具
- 在convertClaudeToolsToGeminiTools中添加schema清理
- 完整的单元测试覆盖，包含边界情况

修复: Issue 0.1 signature缺失, Issue 0.2 custom工具格式
改进: Codex审查发现的2个重要问题

测试:
- TestBuildParts_ThinkingBlockWithoutSignature: 验证thinking block处理
- TestBuildTools_CustomTypeTools: 验证custom工具转换和边界情况
- TestConvertClaudeToolsToGeminiTools_CustomType: 验证service层转换

* fix(format): 修复 gofmt 格式问题

- 修复 claude_types.go 中的字段对齐问题
- 修复 gemini_messages_compat_service.go 中的缩进问题

* fix(format): 修复 claude_types.go 的 gofmt 格式问题

* feat(antigravity): 优化 thinking block 和 schema 处理

- 为 dummy thinking block 添加 ThoughtSignature
- 重构 thinking block 处理逻辑，在每个条件分支内创建 part
- 优化 excludedSchemaKeys，移除 Gemini 实际支持的字段
  (minItems, maxItems, minimum, maximum, additionalProperties, format)
- 添加详细注释说明 Gemini API 支持的 schema 字段

* fix(antigravity): 增强 schema 清理的安全性

基于 Codex review 建议：
- 添加 format 字段白名单过滤，只保留 Gemini 支持的 date-time/date/time
- 补充更多不支持的 schema 关键字到黑名单：
  * 组合 schema: oneOf, anyOf, allOf, not, if/then/else
  * 对象验证: minProperties, maxProperties, patternProperties 等
  * 定义引用: $defs, definitions
- 避免不支持的 schema 字段导致 Gemini API 校验失败

* fix(lint): 修复 gemini_messages_compat_service 空分支警告

- 在 cleanToolSchema 的 if 语句中添加 continue
- 移除重复的注释

* fix(antigravity): 移除 minItems/maxItems 以兼容 Claude API

- 将 minItems 和 maxItems 添加到 schema 黑名单
- Claude API (Vertex AI) 不支持这些数组验证字段
- 添加调试日志记录工具 schema 转换过程
- 修复 tools.14.custom.input_schema 验证错误

* fix(antigravity): 修复 additionalProperties schema 对象问题

- 将 additionalProperties 的 schema 对象转换为布尔值 true
- Claude API 只支持 additionalProperties: false，不支持 schema 对象
- 修复 tools.14.custom.input_schema 验证错误
- 参考 Claude 官方文档的 JSON Schema 限制

* fix(antigravity): 修复 Claude 模型 thinking 块兼容性问题

- 完全跳过 Claude 模型的 thinking 块以避免 signature 验证失败
- 只在 Gemini 模型中使用 dummy thought signature
- 修改 additionalProperties 默认值为 false（更安全）
- 添加调试日志以便排查问题

* fix(upstream): 修复跨模型切换时的 dummy signature 问题

基于 Codex review 和用户场景分析的修复：

1. 问题场景
   - Gemini (thinking) → Claude (thinking) 切换时
   - Gemini 返回的 thinking 块使用 dummy signature
   - Claude API 会拒绝 dummy signature，导致 400 错误

2. 修复内容
   - request_transformer.go:262: 跳过 dummy signature
   - 只保留真实的 Claude signature
   - 支持频繁的跨模型切换

3. 其他修复（基于 Codex review）
   - gateway_service.go:691: 修复 io.ReadAll 错误处理
   - gateway_service.go:687: 条件日志（尊重 LogUpstreamErrorBody 配置）
   - gateway_service.go:915: 收紧 400 failover 启发式
   - request_transformer.go:188: 移除签名成功日志

4. 新增功能（默认关闭）
   - 阶段 1: 上游错误日志（GATEWAY_LOG_UPSTREAM_ERROR_BODY）
   - 阶段 2: Antigravity thinking 修复
   - 阶段 3: API-key beta 注入（GATEWAY_INJECT_BETA_FOR_APIKEY）
   - 阶段 3: 智能 400 failover（GATEWAY_FAILOVER_ON_400）

测试：所有测试通过

* fix(lint): 修复 golangci-lint 问题

- 应用 De Morgan 定律简化条件判断
- 修复 gofmt 格式问题
- 移除未使用的 min 函数
											
										
										
											2026-01-01 04:21:18 +08:00
+									}
-												fix(网关): 对齐 Claude OAuth 请求适配

											
										
										
											2026-01-15 18:54:42 +08:00
+									if req.Header.Get("accept") == "" {
 										req.Header.Set("accept", "application/json")
 									}
 									for key, value := range claude.DefaultHeaders {
 										if value == "" {
 											continue
 										}
 										if req.Header.Get(key) == "" {
 											req.Header.Set(key, value)
 										}
 									}
 									if isStream && req.Header.Get("x-stainless-helper-method") == "" {
 										req.Header.Set("x-stainless-helper-method", "stream")
-												fix: 修复 /v1/messages 间歇性 400 错误 (#18)

* fix(upstream): 修复上游格式兼容性问题

- 跳过Claude模型无signature的thinking block
- 支持custom类型工具(MCP)格式转换
- 添加ClaudeCustomToolSpec结构体支持MCP工具
- 添加Custom字段验证，跳过无效custom工具
- 在convertClaudeToolsToGeminiTools中添加schema清理
- 完整的单元测试覆盖，包含边界情况

修复: Issue 0.1 signature缺失, Issue 0.2 custom工具格式
改进: Codex审查发现的2个重要问题

测试:
- TestBuildParts_ThinkingBlockWithoutSignature: 验证thinking block处理
- TestBuildTools_CustomTypeTools: 验证custom工具转换和边界情况
- TestConvertClaudeToolsToGeminiTools_CustomType: 验证service层转换

* feat(gemini): 添加Gemini限额与TierID支持

实现PR1：Gemini限额与TierID功能

后端修改：
- GeminiTokenInfo结构体添加TierID字段
- fetchProjectID函数返回(projectID, tierID, error)
- 从LoadCodeAssist响应中提取tierID（优先IsDefault，回退到第一个非空tier）
- ExchangeCode、RefreshAccountToken、GetAccessToken函数更新以处理tierID
- BuildAccountCredentials函数保存tier_id到credentials

前端修改：
- AccountStatusIndicator组件添加tier显示
- 支持LEGACY/PRO/ULTRA等tier类型的友好显示
- 使用蓝色badge展示tier信息

技术细节：
- tierID提取逻辑：优先选择IsDefault的tier，否则选择第一个非空tier
- 所有fetchProjectID调用点已更新以处理新的返回签名
- 前端gracefully处理missing/unknown tier_id

* refactor(gemini): 优化TierID实现并添加安全验证

根据并发代码审查（code-reviewer, security-auditor, gemini, codex）的反馈进行改进：

安全改进：
- 添加validateTierID函数验证tier_id格式和长度（最大64字符）
- 限制tier_id字符集为字母数字、下划线、连字符和斜杠
- 在BuildAccountCredentials中验证tier_id后再存储
- 静默跳过无效tier_id，不阻塞账户创建

代码质量改进：
- 提取extractTierIDFromAllowedTiers辅助函数消除重复代码
- 重构fetchProjectID函数，tierID提取逻辑只执行一次
- 改进代码可读性和可维护性

审查工具：
- code-reviewer agent (a09848e)
- security-auditor agent (a9a149c)
- gemini CLI (bcc7c81)
- codex (b5d8919)

修复问题：
- HIGH: 未验证的tier_id输入
- MEDIUM: 代码重复（tierID提取逻辑重复2次）

* fix(format): 修复 gofmt 格式问题

- 修复 claude_types.go 中的字段对齐问题
- 修复 gemini_messages_compat_service.go 中的缩进问题

* fix(upstream): 修复上游格式兼容性问题 (#14)

* fix(upstream): 修复上游格式兼容性问题

- 跳过Claude模型无signature的thinking block
- 支持custom类型工具(MCP)格式转换
- 添加ClaudeCustomToolSpec结构体支持MCP工具
- 添加Custom字段验证，跳过无效custom工具
- 在convertClaudeToolsToGeminiTools中添加schema清理
- 完整的单元测试覆盖，包含边界情况

修复: Issue 0.1 signature缺失, Issue 0.2 custom工具格式
改进: Codex审查发现的2个重要问题

测试:
- TestBuildParts_ThinkingBlockWithoutSignature: 验证thinking block处理
- TestBuildTools_CustomTypeTools: 验证custom工具转换和边界情况
- TestConvertClaudeToolsToGeminiTools_CustomType: 验证service层转换

* fix(format): 修复 gofmt 格式问题

- 修复 claude_types.go 中的字段对齐问题
- 修复 gemini_messages_compat_service.go 中的缩进问题

* fix(format): 修复 claude_types.go 的 gofmt 格式问题

* feat(antigravity): 优化 thinking block 和 schema 处理

- 为 dummy thinking block 添加 ThoughtSignature
- 重构 thinking block 处理逻辑，在每个条件分支内创建 part
- 优化 excludedSchemaKeys，移除 Gemini 实际支持的字段
  (minItems, maxItems, minimum, maximum, additionalProperties, format)
- 添加详细注释说明 Gemini API 支持的 schema 字段

* fix(antigravity): 增强 schema 清理的安全性

基于 Codex review 建议：
- 添加 format 字段白名单过滤，只保留 Gemini 支持的 date-time/date/time
- 补充更多不支持的 schema 关键字到黑名单：
  * 组合 schema: oneOf, anyOf, allOf, not, if/then/else
  * 对象验证: minProperties, maxProperties, patternProperties 等
  * 定义引用: $defs, definitions
- 避免不支持的 schema 字段导致 Gemini API 校验失败

* fix(lint): 修复 gemini_messages_compat_service 空分支警告

- 在 cleanToolSchema 的 if 语句中添加 continue
- 移除重复的注释

* fix(antigravity): 移除 minItems/maxItems 以兼容 Claude API

- 将 minItems 和 maxItems 添加到 schema 黑名单
- Claude API (Vertex AI) 不支持这些数组验证字段
- 添加调试日志记录工具 schema 转换过程
- 修复 tools.14.custom.input_schema 验证错误

* fix(antigravity): 修复 additionalProperties schema 对象问题

- 将 additionalProperties 的 schema 对象转换为布尔值 true
- Claude API 只支持 additionalProperties: false，不支持 schema 对象
- 修复 tools.14.custom.input_schema 验证错误
- 参考 Claude 官方文档的 JSON Schema 限制

* fix(antigravity): 修复 Claude 模型 thinking 块兼容性问题

- 完全跳过 Claude 模型的 thinking 块以避免 signature 验证失败
- 只在 Gemini 模型中使用 dummy thought signature
- 修改 additionalProperties 默认值为 false（更安全）
- 添加调试日志以便排查问题

* fix(upstream): 修复跨模型切换时的 dummy signature 问题

基于 Codex review 和用户场景分析的修复：

1. 问题场景
   - Gemini (thinking) → Claude (thinking) 切换时
   - Gemini 返回的 thinking 块使用 dummy signature
   - Claude API 会拒绝 dummy signature，导致 400 错误

2. 修复内容
   - request_transformer.go:262: 跳过 dummy signature
   - 只保留真实的 Claude signature
   - 支持频繁的跨模型切换

3. 其他修复（基于 Codex review）
   - gateway_service.go:691: 修复 io.ReadAll 错误处理
   - gateway_service.go:687: 条件日志（尊重 LogUpstreamErrorBody 配置）
   - gateway_service.go:915: 收紧 400 failover 启发式
   - request_transformer.go:188: 移除签名成功日志

4. 新增功能（默认关闭）
   - 阶段 1: 上游错误日志（GATEWAY_LOG_UPSTREAM_ERROR_BODY）
   - 阶段 2: Antigravity thinking 修复
   - 阶段 3: API-key beta 注入（GATEWAY_INJECT_BETA_FOR_APIKEY）
   - 阶段 3: 智能 400 failover（GATEWAY_FAILOVER_ON_400）

测试：所有测试通过

* fix(lint): 修复 golangci-lint 问题

- 应用 De Morgan 定律简化条件判断
- 修复 gofmt 格式问题
- 移除未使用的 min 函数
											
										
										
											2026-01-01 04:21:18 +08:00
+									}
 								}
-												fix(oauth): merge anthropic-beta and force Claude Code headers in mimic mode

											
										
										
											2026-01-29 02:36:28 +08:00
+								func mergeAnthropicBeta(required []string, incoming string) string {
 									seen := make(map[string]struct{}, len(required)+8)
 									out := make([]string, 0, len(required)+8)
-												perf(gateway): 优化负载感知调度

主要改进：
- 优化负载感知调度的准确性和响应速度
- 将 AccountUsageService 的包级缓存改为依赖注入
- 修复 SSE/JSON 转义和 nil 安全问题
- 恢复 Google One 功能兼容性

											
										
										
											2026-01-03 06:32:51 -08:00
-												fix(oauth): merge anthropic-beta and force Claude Code headers in mimic mode

											
										
										
											2026-01-29 02:36:28 +08:00
+									add := func(v string) {
 										v = strings.TrimSpace(v)
 										if v == "" {
 											return
 										}
 										if _, ok := seen[v]; ok {
 											return
 										}
 										seen[v] = struct{}{}
 										out = append(out, v)
 									}
 									for _, r := range required {
 										add(r)
 									}
 									for _, p := range strings.Split(incoming, ",") {
 										add(p)
 									}
 									return strings.Join(out, ",")
 								}
-												fix(oauth): match Claude CLI accept header and beta set

											
										
										
											2026-01-29 15:31:29 +08:00
+								func mergeAnthropicBetaDropping(required []string, incoming string, drop map[string]struct{}) string {
 									merged := mergeAnthropicBeta(required, incoming)
 									if merged == "" || len(drop) == 0 {
 										return merged
 									}
 									out := make([]string, 0, 8)
 									for _, p := range strings.Split(merged, ",") {
 										p = strings.TrimSpace(p)
 										if p == "" {
 											continue
 										}
 										if _, ok := drop[p]; ok {
 											continue
 										}
 										out = append(out, p)
 									}
 									return strings.Join(out, ",")
 								}
-												fix(oauth): merge anthropic-beta and force Claude Code headers in mimic mode

											
										
										
											2026-01-29 02:36:28 +08:00
+								// applyClaudeCodeMimicHeaders forces "Claude Code-like" request headers.
 								// This mirrors opencode-anthropic-auth behavior: do not trust downstream
 								// headers when using Claude Code-scoped OAuth credentials.
 								func applyClaudeCodeMimicHeaders(req *http.Request, isStream bool) {
 									if req == nil {
 										return
 									}
 									// Start with the standard defaults (fill missing).
 									applyClaudeOAuthHeaderDefaults(req, isStream)
 									// Then force key headers to match Claude Code fingerprint regardless of what the client sent.
 									for key, value := range claude.DefaultHeaders {
 										if value == "" {
 											continue
 										}
 										req.Header.Set(key, value)
 									}
-												fix(oauth): match Claude CLI accept header and beta set

											
										
										
											2026-01-29 15:31:29 +08:00
+									// Real Claude CLI uses Accept: application/json (even for streaming).
 									req.Header.Set("accept", "application/json")
-												fix(oauth): merge anthropic-beta and force Claude Code headers in mimic mode

											
										
										
											2026-01-29 02:36:28 +08:00
+									if isStream {
 										req.Header.Set("x-stainless-helper-method", "stream")
 									}
 								}
-												fix: 修复 /v1/messages 间歇性 400 错误 (#18)

* fix(upstream): 修复上游格式兼容性问题

- 跳过Claude模型无signature的thinking block
- 支持custom类型工具(MCP)格式转换
- 添加ClaudeCustomToolSpec结构体支持MCP工具
- 添加Custom字段验证，跳过无效custom工具
- 在convertClaudeToolsToGeminiTools中添加schema清理
- 完整的单元测试覆盖，包含边界情况

修复: Issue 0.1 signature缺失, Issue 0.2 custom工具格式
改进: Codex审查发现的2个重要问题

测试:
- TestBuildParts_ThinkingBlockWithoutSignature: 验证thinking block处理
- TestBuildTools_CustomTypeTools: 验证custom工具转换和边界情况
- TestConvertClaudeToolsToGeminiTools_CustomType: 验证service层转换

* feat(gemini): 添加Gemini限额与TierID支持

实现PR1：Gemini限额与TierID功能

后端修改：
- GeminiTokenInfo结构体添加TierID字段
- fetchProjectID函数返回(projectID, tierID, error)
- 从LoadCodeAssist响应中提取tierID（优先IsDefault，回退到第一个非空tier）
- ExchangeCode、RefreshAccountToken、GetAccessToken函数更新以处理tierID
- BuildAccountCredentials函数保存tier_id到credentials

前端修改：
- AccountStatusIndicator组件添加tier显示
- 支持LEGACY/PRO/ULTRA等tier类型的友好显示
- 使用蓝色badge展示tier信息

技术细节：
- tierID提取逻辑：优先选择IsDefault的tier，否则选择第一个非空tier
- 所有fetchProjectID调用点已更新以处理新的返回签名
- 前端gracefully处理missing/unknown tier_id

* refactor(gemini): 优化TierID实现并添加安全验证

根据并发代码审查（code-reviewer, security-auditor, gemini, codex）的反馈进行改进：

安全改进：
- 添加validateTierID函数验证tier_id格式和长度（最大64字符）
- 限制tier_id字符集为字母数字、下划线、连字符和斜杠
- 在BuildAccountCredentials中验证tier_id后再存储
- 静默跳过无效tier_id，不阻塞账户创建

代码质量改进：
- 提取extractTierIDFromAllowedTiers辅助函数消除重复代码
- 重构fetchProjectID函数，tierID提取逻辑只执行一次
- 改进代码可读性和可维护性

审查工具：
- code-reviewer agent (a09848e)
- security-auditor agent (a9a149c)
- gemini CLI (bcc7c81)
- codex (b5d8919)

修复问题：
- HIGH: 未验证的tier_id输入
- MEDIUM: 代码重复（tierID提取逻辑重复2次）

* fix(format): 修复 gofmt 格式问题

- 修复 claude_types.go 中的字段对齐问题
- 修复 gemini_messages_compat_service.go 中的缩进问题

* fix(upstream): 修复上游格式兼容性问题 (#14)

* fix(upstream): 修复上游格式兼容性问题

- 跳过Claude模型无signature的thinking block
- 支持custom类型工具(MCP)格式转换
- 添加ClaudeCustomToolSpec结构体支持MCP工具
- 添加Custom字段验证，跳过无效custom工具
- 在convertClaudeToolsToGeminiTools中添加schema清理
- 完整的单元测试覆盖，包含边界情况

修复: Issue 0.1 signature缺失, Issue 0.2 custom工具格式
改进: Codex审查发现的2个重要问题

测试:
- TestBuildParts_ThinkingBlockWithoutSignature: 验证thinking block处理
- TestBuildTools_CustomTypeTools: 验证custom工具转换和边界情况
- TestConvertClaudeToolsToGeminiTools_CustomType: 验证service层转换

* fix(format): 修复 gofmt 格式问题

- 修复 claude_types.go 中的字段对齐问题
- 修复 gemini_messages_compat_service.go 中的缩进问题

* fix(format): 修复 claude_types.go 的 gofmt 格式问题

* feat(antigravity): 优化 thinking block 和 schema 处理

- 为 dummy thinking block 添加 ThoughtSignature
- 重构 thinking block 处理逻辑，在每个条件分支内创建 part
- 优化 excludedSchemaKeys，移除 Gemini 实际支持的字段
  (minItems, maxItems, minimum, maximum, additionalProperties, format)
- 添加详细注释说明 Gemini API 支持的 schema 字段

* fix(antigravity): 增强 schema 清理的安全性

基于 Codex review 建议：
- 添加 format 字段白名单过滤，只保留 Gemini 支持的 date-time/date/time
- 补充更多不支持的 schema 关键字到黑名单：
  * 组合 schema: oneOf, anyOf, allOf, not, if/then/else
  * 对象验证: minProperties, maxProperties, patternProperties 等
  * 定义引用: $defs, definitions
- 避免不支持的 schema 字段导致 Gemini API 校验失败

* fix(lint): 修复 gemini_messages_compat_service 空分支警告

- 在 cleanToolSchema 的 if 语句中添加 continue
- 移除重复的注释

* fix(antigravity): 移除 minItems/maxItems 以兼容 Claude API

- 将 minItems 和 maxItems 添加到 schema 黑名单
- Claude API (Vertex AI) 不支持这些数组验证字段
- 添加调试日志记录工具 schema 转换过程
- 修复 tools.14.custom.input_schema 验证错误

* fix(antigravity): 修复 additionalProperties schema 对象问题

- 将 additionalProperties 的 schema 对象转换为布尔值 true
- Claude API 只支持 additionalProperties: false，不支持 schema 对象
- 修复 tools.14.custom.input_schema 验证错误
- 参考 Claude 官方文档的 JSON Schema 限制

* fix(antigravity): 修复 Claude 模型 thinking 块兼容性问题

- 完全跳过 Claude 模型的 thinking 块以避免 signature 验证失败
- 只在 Gemini 模型中使用 dummy thought signature
- 修改 additionalProperties 默认值为 false（更安全）
- 添加调试日志以便排查问题

* fix(upstream): 修复跨模型切换时的 dummy signature 问题

基于 Codex review 和用户场景分析的修复：

1. 问题场景
   - Gemini (thinking) → Claude (thinking) 切换时
   - Gemini 返回的 thinking 块使用 dummy signature
   - Claude API 会拒绝 dummy signature，导致 400 错误

2. 修复内容
   - request_transformer.go:262: 跳过 dummy signature
   - 只保留真实的 Claude signature
   - 支持频繁的跨模型切换

3. 其他修复（基于 Codex review）
   - gateway_service.go:691: 修复 io.ReadAll 错误处理
   - gateway_service.go:687: 条件日志（尊重 LogUpstreamErrorBody 配置）
   - gateway_service.go:915: 收紧 400 failover 启发式
   - request_transformer.go:188: 移除签名成功日志

4. 新增功能（默认关闭）
   - 阶段 1: 上游错误日志（GATEWAY_LOG_UPSTREAM_ERROR_BODY）
   - 阶段 2: Antigravity thinking 修复
   - 阶段 3: API-key beta 注入（GATEWAY_INJECT_BETA_FOR_APIKEY）
   - 阶段 3: 智能 400 failover（GATEWAY_FAILOVER_ON_400）

测试：所有测试通过

* fix(lint): 修复 golangci-lint 问题

- 应用 De Morgan 定律简化条件判断
- 修复 gofmt 格式问题
- 移除未使用的 min 函数
											
										
										
											2026-01-01 04:21:18 +08:00
+								func truncateForLog(b []byte, maxBytes int) string {
 									if maxBytes <= 0 {
 										maxBytes = 2048
 									}
 									if len(b) > maxBytes {
 										b = b[:maxBytes]
 									}
 									s := string(b)
 									// 保持一行，避免污染日志格式
 									s = strings.ReplaceAll(s, "\n", "\\n")
 									s = strings.ReplaceAll(s, "\r", "\\r")
 									return s
 								}
-												fix(gateway): 优化 thinking block 重试逻辑

- 保留用户的 thinking.type=enabled 设置（不再禁用）
- 只移除历史消息中的 thinking/redacted_thinking blocks
- 处理过滤后空消息：跳过 assistant 消息，user 消息添加占位符
- 增强错误检测：覆盖 signature、Expected thinking、empty content 错误
- 添加重试成功/失败日志便于排查

											
										
										
											2026-01-03 18:05:15 -08:00
+								// isThinkingBlockSignatureError 检测是否是thinking block相关错误
-												perf(gateway): 优化负载感知调度

主要改进：
- 优化负载感知调度的准确性和响应速度
- 将 AccountUsageService 的包级缓存改为依赖注入
- 修复 SSE/JSON 转义和 nil 安全问题
- 恢复 Google One 功能兼容性

											
										
										
											2026-01-03 06:32:51 -08:00
+								// 这类错误可以通过过滤thinking blocks并重试来解决
 								func (s *GatewayService) isThinkingBlockSignatureError(respBody []byte) bool {
 									msg := strings.ToLower(strings.TrimSpace(extractUpstreamErrorMessage(respBody)))
 									if msg == "" {
 										return false
 									}
-												fix(gateway): 优化 thinking block 重试逻辑

- 保留用户的 thinking.type=enabled 设置（不再禁用）
- 只移除历史消息中的 thinking/redacted_thinking blocks
- 处理过滤后空消息：跳过 assistant 消息，user 消息添加占位符
- 增强错误检测：覆盖 signature、Expected thinking、empty content 错误
- 添加重试成功/失败日志便于排查

											
										
										
											2026-01-03 18:05:15 -08:00
+									// Log for debugging
 									log.Printf("[SignatureCheck] Checking error message: %s", msg)
-												fix(gateway): 完善 thinking block 重试和 cache nil 检查

- 使用 FilterThinkingBlocksForRetry 替代 FilterThinkingBlocks
- count_tokens 增加 thinking block 签名错误重试
- cache nil 检查防止空指针
- shouldBill 逻辑修复避免重复扣费
- 移除 debug 日志

											
										
										
											2026-01-03 17:10:25 -08:00
+									// 检测signature相关的错误（更宽松的匹配）
 									// 例如: "Invalid `signature` in `thinking` block", "***.signature" 等
 									if strings.Contains(msg, "signature") {
-												fix(gateway): 优化 thinking block 重试逻辑

- 保留用户的 thinking.type=enabled 设置（不再禁用）
- 只移除历史消息中的 thinking/redacted_thinking blocks
- 处理过滤后空消息：跳过 assistant 消息，user 消息添加占位符
- 增强错误检测：覆盖 signature、Expected thinking、empty content 错误
- 添加重试成功/失败日志便于排查

											
										
										
											2026-01-03 18:05:15 -08:00
+										log.Printf("[SignatureCheck] Detected signature error")
 										return true
 									}
 									// 检测 thinking block 顺序/类型错误
 									// 例如: "Expected `thinking` or `redacted_thinking`, but found `text`"
 									if strings.Contains(msg, "expected") && (strings.Contains(msg, "thinking") || strings.Contains(msg, "redacted_thinking")) {
 										log.Printf("[SignatureCheck] Detected thinking block type error")
 										return true
 									}
 									// 检测空消息内容错误（可能是过滤 thinking blocks 后导致的）
 									// 例如: "all messages must have non-empty content"
 									if strings.Contains(msg, "non-empty content") || strings.Contains(msg, "empty content") {
 										log.Printf("[SignatureCheck] Detected empty content error")
-												fix(gateway): 完善 thinking block 重试和 cache nil 检查

- 使用 FilterThinkingBlocksForRetry 替代 FilterThinkingBlocks
- count_tokens 增加 thinking block 签名错误重试
- cache nil 检查防止空指针
- shouldBill 逻辑修复避免重复扣费
- 移除 debug 日志

											
										
										
											2026-01-03 17:10:25 -08:00
+										return true
 									}
 									return false
-												perf(gateway): 优化负载感知调度

主要改进：
- 优化负载感知调度的准确性和响应速度
- 将 AccountUsageService 的包级缓存改为依赖注入
- 修复 SSE/JSON 转义和 nil 安全问题
- 恢复 Google One 功能兼容性

											
										
										
											2026-01-03 06:32:51 -08:00
+								}
-												fix: 修复 /v1/messages 间歇性 400 错误 (#18)

* fix(upstream): 修复上游格式兼容性问题

- 跳过Claude模型无signature的thinking block
- 支持custom类型工具(MCP)格式转换
- 添加ClaudeCustomToolSpec结构体支持MCP工具
- 添加Custom字段验证，跳过无效custom工具
- 在convertClaudeToolsToGeminiTools中添加schema清理
- 完整的单元测试覆盖，包含边界情况

修复: Issue 0.1 signature缺失, Issue 0.2 custom工具格式
改进: Codex审查发现的2个重要问题

测试:
- TestBuildParts_ThinkingBlockWithoutSignature: 验证thinking block处理
- TestBuildTools_CustomTypeTools: 验证custom工具转换和边界情况
- TestConvertClaudeToolsToGeminiTools_CustomType: 验证service层转换

* feat(gemini): 添加Gemini限额与TierID支持

实现PR1：Gemini限额与TierID功能

后端修改：
- GeminiTokenInfo结构体添加TierID字段
- fetchProjectID函数返回(projectID, tierID, error)
- 从LoadCodeAssist响应中提取tierID（优先IsDefault，回退到第一个非空tier）
- ExchangeCode、RefreshAccountToken、GetAccessToken函数更新以处理tierID
- BuildAccountCredentials函数保存tier_id到credentials

前端修改：
- AccountStatusIndicator组件添加tier显示
- 支持LEGACY/PRO/ULTRA等tier类型的友好显示
- 使用蓝色badge展示tier信息

技术细节：
- tierID提取逻辑：优先选择IsDefault的tier，否则选择第一个非空tier
- 所有fetchProjectID调用点已更新以处理新的返回签名
- 前端gracefully处理missing/unknown tier_id

* refactor(gemini): 优化TierID实现并添加安全验证

根据并发代码审查（code-reviewer, security-auditor, gemini, codex）的反馈进行改进：

安全改进：
- 添加validateTierID函数验证tier_id格式和长度（最大64字符）
- 限制tier_id字符集为字母数字、下划线、连字符和斜杠
- 在BuildAccountCredentials中验证tier_id后再存储
- 静默跳过无效tier_id，不阻塞账户创建

代码质量改进：
- 提取extractTierIDFromAllowedTiers辅助函数消除重复代码
- 重构fetchProjectID函数，tierID提取逻辑只执行一次
- 改进代码可读性和可维护性

审查工具：
- code-reviewer agent (a09848e)
- security-auditor agent (a9a149c)
- gemini CLI (bcc7c81)
- codex (b5d8919)

修复问题：
- HIGH: 未验证的tier_id输入
- MEDIUM: 代码重复（tierID提取逻辑重复2次）

* fix(format): 修复 gofmt 格式问题

- 修复 claude_types.go 中的字段对齐问题
- 修复 gemini_messages_compat_service.go 中的缩进问题

* fix(upstream): 修复上游格式兼容性问题 (#14)

* fix(upstream): 修复上游格式兼容性问题

- 跳过Claude模型无signature的thinking block
- 支持custom类型工具(MCP)格式转换
- 添加ClaudeCustomToolSpec结构体支持MCP工具
- 添加Custom字段验证，跳过无效custom工具
- 在convertClaudeToolsToGeminiTools中添加schema清理
- 完整的单元测试覆盖，包含边界情况

修复: Issue 0.1 signature缺失, Issue 0.2 custom工具格式
改进: Codex审查发现的2个重要问题

测试:
- TestBuildParts_ThinkingBlockWithoutSignature: 验证thinking block处理
- TestBuildTools_CustomTypeTools: 验证custom工具转换和边界情况
- TestConvertClaudeToolsToGeminiTools_CustomType: 验证service层转换

* fix(format): 修复 gofmt 格式问题

- 修复 claude_types.go 中的字段对齐问题
- 修复 gemini_messages_compat_service.go 中的缩进问题

* fix(format): 修复 claude_types.go 的 gofmt 格式问题

* feat(antigravity): 优化 thinking block 和 schema 处理

- 为 dummy thinking block 添加 ThoughtSignature
- 重构 thinking block 处理逻辑，在每个条件分支内创建 part
- 优化 excludedSchemaKeys，移除 Gemini 实际支持的字段
  (minItems, maxItems, minimum, maximum, additionalProperties, format)
- 添加详细注释说明 Gemini API 支持的 schema 字段

* fix(antigravity): 增强 schema 清理的安全性

基于 Codex review 建议：
- 添加 format 字段白名单过滤，只保留 Gemini 支持的 date-time/date/time
- 补充更多不支持的 schema 关键字到黑名单：
  * 组合 schema: oneOf, anyOf, allOf, not, if/then/else
  * 对象验证: minProperties, maxProperties, patternProperties 等
  * 定义引用: $defs, definitions
- 避免不支持的 schema 字段导致 Gemini API 校验失败

* fix(lint): 修复 gemini_messages_compat_service 空分支警告

- 在 cleanToolSchema 的 if 语句中添加 continue
- 移除重复的注释

* fix(antigravity): 移除 minItems/maxItems 以兼容 Claude API

- 将 minItems 和 maxItems 添加到 schema 黑名单
- Claude API (Vertex AI) 不支持这些数组验证字段
- 添加调试日志记录工具 schema 转换过程
- 修复 tools.14.custom.input_schema 验证错误

* fix(antigravity): 修复 additionalProperties schema 对象问题

- 将 additionalProperties 的 schema 对象转换为布尔值 true
- Claude API 只支持 additionalProperties: false，不支持 schema 对象
- 修复 tools.14.custom.input_schema 验证错误
- 参考 Claude 官方文档的 JSON Schema 限制

* fix(antigravity): 修复 Claude 模型 thinking 块兼容性问题

- 完全跳过 Claude 模型的 thinking 块以避免 signature 验证失败
- 只在 Gemini 模型中使用 dummy thought signature
- 修改 additionalProperties 默认值为 false（更安全）
- 添加调试日志以便排查问题

* fix(upstream): 修复跨模型切换时的 dummy signature 问题

基于 Codex review 和用户场景分析的修复：

1. 问题场景
   - Gemini (thinking) → Claude (thinking) 切换时
   - Gemini 返回的 thinking 块使用 dummy signature
   - Claude API 会拒绝 dummy signature，导致 400 错误

2. 修复内容
   - request_transformer.go:262: 跳过 dummy signature
   - 只保留真实的 Claude signature
   - 支持频繁的跨模型切换

3. 其他修复（基于 Codex review）
   - gateway_service.go:691: 修复 io.ReadAll 错误处理
   - gateway_service.go:687: 条件日志（尊重 LogUpstreamErrorBody 配置）
   - gateway_service.go:915: 收紧 400 failover 启发式
   - request_transformer.go:188: 移除签名成功日志

4. 新增功能（默认关闭）
   - 阶段 1: 上游错误日志（GATEWAY_LOG_UPSTREAM_ERROR_BODY）
   - 阶段 2: Antigravity thinking 修复
   - 阶段 3: API-key beta 注入（GATEWAY_INJECT_BETA_FOR_APIKEY）
   - 阶段 3: 智能 400 failover（GATEWAY_FAILOVER_ON_400）

测试：所有测试通过

* fix(lint): 修复 golangci-lint 问题

- 应用 De Morgan 定律简化条件判断
- 修复 gofmt 格式问题
- 移除未使用的 min 函数
											
										
										
											2026-01-01 04:21:18 +08:00
+								func (s *GatewayService) shouldFailoverOn400(respBody []byte) bool {
 									// 只对“可能是兼容性差异导致”的 400 允许切换，避免无意义重试。
 									// 默认保守：无法识别则不切换。
 									msg := strings.ToLower(strings.TrimSpace(extractUpstreamErrorMessage(respBody)))
 									if msg == "" {
 										return false
 									}
 									// 缺少/错误的 beta header：换账号/链路可能成功（尤其是混合调度时）。
 									// 更精确匹配 beta 相关的兼容性问题，避免误触发切换。
 									if strings.Contains(msg, "anthropic-beta") ||
 										strings.Contains(msg, "beta feature") ||
 										strings.Contains(msg, "requires beta") {
 										return true
 									}
 									// thinking/tool streaming 等兼容性约束（常见于中间转换链路）
 									if strings.Contains(msg, "thinking") || strings.Contains(msg, "thought_signature") || strings.Contains(msg, "signature") {
 										return true
 									}
 									if strings.Contains(msg, "tool_use") || strings.Contains(msg, "tool_result") || strings.Contains(msg, "tools") {
 										return true
 									}
 									return false
 								}
 								func extractUpstreamErrorMessage(body []byte) string {
 									// Claude 风格：{"type":"error","error":{"type":"...","message":"..."}}
 									if m := gjson.GetBytes(body, "error.message").String(); strings.TrimSpace(m) != "" {
 										inner := strings.TrimSpace(m)
 										// 有些上游会把完整 JSON 作为字符串塞进 message
 										if strings.HasPrefix(inner, "{") {
 											if innerMsg := gjson.Get(inner, "error.message").String(); strings.TrimSpace(innerMsg) != "" {
 												return innerMsg
 											}
 										}
 										return m
 									}
 									// 兜底：尝试顶层 message
 									return gjson.GetBytes(body, "message").String()
 								}
-												refactor: 调整项目结构为单向依赖

											
										
										
											2025-12-26 15:40:24 +08:00
+								func (s *GatewayService) handleErrorResponse(ctx context.Context, resp *http.Response, c *gin.Context, account *Account) (*ForwardResult, error) {
-												feat(ops): 添加QPS脉搏线图并优化指标布局

- 添加实时QPS/TPS历史数据追踪（最近60个数据点）
- 在平均QPS/TPS上方添加SVG脉搏线图（sparkline）
- 将延迟和TTFT卡片的指标布局从2列改为3列
- 恢复Max指标显示（P95/P90/P50/Avg/Max）

											
										
										
											2026-01-11 11:49:34 +08:00
+									body, _ := io.ReadAll(io.LimitReader(resp.Body, 2<<20))
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+									// 调试日志：打印上游错误响应
 									log.Printf("[Forward] Upstream error (non-retryable): Account=%d(%s) Status=%d RequestID=%s Body=%s",
 										account.ID, account.Name, resp.StatusCode, resp.Header.Get("x-request-id"), truncateString(string(body), 1000))
-												feat(ops): 添加QPS脉搏线图并优化指标布局

- 添加实时QPS/TPS历史数据追踪（最近60个数据点）
- 在平均QPS/TPS上方添加SVG脉搏线图（sparkline）
- 将延迟和TTFT卡片的指标布局从2列改为3列
- 恢复Max指标显示（P95/P90/P50/Avg/Max）

											
										
										
											2026-01-11 11:49:34 +08:00
+									upstreamMsg := strings.TrimSpace(extractUpstreamErrorMessage(body))
 									upstreamMsg = sanitizeUpstreamErrorMessage(upstreamMsg)
-												chore(debug): emit Claude mimic fingerprint on credential-scope error

											
										
										
											2026-01-29 15:17:46 +08:00
+									// Print a compact upstream request fingerprint when we hit the Claude Code OAuth
 									// credential scope error. This avoids requiring env-var tweaks in a fixed deploy.
 									if isClaudeCodeCredentialScopeError(upstreamMsg) && c != nil {
 										if v, ok := c.Get(claudeMimicDebugInfoKey); ok {
 											if line, ok := v.(string); ok && strings.TrimSpace(line) != "" {
 												log.Printf("[ClaudeMimicDebugOnError] status=%d request_id=%s %s",
 													resp.StatusCode,
 													resp.Header.Get("x-request-id"),
 													line,
 												)
 											}
 										}
 									}
-												feat(ops): 添加QPS脉搏线图并优化指标布局

- 添加实时QPS/TPS历史数据追踪（最近60个数据点）
- 在平均QPS/TPS上方添加SVG脉搏线图（sparkline）
- 将延迟和TTFT卡片的指标布局从2列改为3列
- 恢复Max指标显示（P95/P90/P50/Avg/Max）

											
										
										
											2026-01-11 11:49:34 +08:00
+									// Enrich Ops error logs with upstream status + message, and optionally a truncated body snippet.
 									upstreamDetail := ""
 									if s.cfg != nil && s.cfg.Gateway.LogUpstreamErrorBody {
 										maxBytes := s.cfg.Gateway.LogUpstreamErrorBodyMaxBytes
 										if maxBytes <= 0 {
 											maxBytes = 2048
 										}
 										upstreamDetail = truncateString(string(body), maxBytes)
 									}
 									setOpsUpstreamError(c, resp.StatusCode, upstreamMsg, upstreamDetail)
-												feat(ops): 实现上游错误事件记录与查询功能

**新增功能**:
- 新建ops_upstream_error_events表存储上游服务错误详情
- 支持记录上游429/529/5xx错误的详细上下文信息
- 提供按时间范围查询上游错误事件的API

**后端改动**:
1. 模型层（ops_models.go, ops_port.go）:
   - 新增UpstreamErrorEvent结构体
   - 扩展Repository接口支持上游错误事件CRUD

2. 仓储层（ops_repo.go）:
   - 实现InsertUpstreamErrorEvent写入上游错误
   - 实现GetUpstreamErrorEvents按时间范围查询

3. 服务层（ops_service.go, ops_upstream_context.go）:
   - ops_service: 新增GetUpstreamErrorEvents查询方法
   - ops_upstream_context: 封装上游错误上下文构建逻辑

4. Handler层（ops_error_logger.go）:
   - 新增GetUpstreamErrorsHandler处理上游错误查询请求

5. Gateway层集成:
   - antigravity_gateway_service.go: 429/529错误时记录上游事件
   - gateway_service.go: OpenAI 429/5xx错误时记录
   - gemini_messages_compat_service.go: Gemini 429/5xx错误时记录
   - openai_gateway_service.go: OpenAI 429/5xx错误时记录
   - ratelimit_service.go: 429限流错误时记录

**数据记录字段**:
- request_id: 关联ops_logs主记录
- platform/model: 上游服务标识
- status_code/error_message: 错误详情
- request_headers/response_body: 调试信息（可选）
- created_at: 错误发生时间

											
										
										
											2026-01-11 15:30:27 +08:00
+									appendOpsUpstreamError(c, OpsUpstreamErrorEvent{
 										Platform:           account.Platform,
 										AccountID:          account.ID,
 										UpstreamStatusCode: resp.StatusCode,
 										UpstreamRequestID:  resp.Header.Get("x-request-id"),
 										Kind:               "http_error",
 										Message:            upstreamMsg,
 										Detail:             upstreamDetail,
 									})
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
 									// 处理上游错误，标记账号状态
-												perf(gateway): 优化负载感知调度

主要改进：
- 优化负载感知调度的准确性和响应速度
- 将 AccountUsageService 的包级缓存改为依赖注入
- 修复 SSE/JSON 转义和 nil 安全问题
- 恢复 Google One 功能兼容性

											
										
										
											2026-01-03 06:32:51 -08:00
+									shouldDisable := false
 									if s.rateLimitService != nil {
 										shouldDisable = s.rateLimitService.HandleUpstreamError(ctx, account, resp.StatusCode, resp.Header, body)
 									}
 									if shouldDisable {
 										return nil, &UpstreamFailoverError{StatusCode: resp.StatusCode}
 									}
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
-												feat(ops): 添加QPS脉搏线图并优化指标布局

- 添加实时QPS/TPS历史数据追踪（最近60个数据点）
- 在平均QPS/TPS上方添加SVG脉搏线图（sparkline）
- 将延迟和TTFT卡片的指标布局从2列改为3列
- 恢复Max指标显示（P95/P90/P50/Avg/Max）

											
										
										
											2026-01-11 11:49:34 +08:00
+									// 记录上游错误响应体摘要便于排障（可选：由配置控制；不回显到客户端）
 									if s.cfg != nil && s.cfg.Gateway.LogUpstreamErrorBody {
 										log.Printf(
 											"Upstream error %d (account=%d platform=%s type=%s): %s",
 											resp.StatusCode,
 											account.ID,
 											account.Platform,
 											account.Type,
 											truncateForLog(body, s.cfg.Gateway.LogUpstreamErrorBodyMaxBytes),
 										)
 									}
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									// 根据状态码返回适当的自定义错误响应（不透传上游详细信息）
 									var errType, errMsg string
 									var statusCode int
 									switch resp.StatusCode {
-												CC 400 返回具体错误信息 && 非 CC 请求时增加 system prompt (#26)

* feat: http 400 返回具体错误

* 更新 workflows

* 优化打包/docker 构建流程

* 400 是返回 原始错误 - json 格式

* feat: 非 cc请求时补充 system

* go mod tidy
											
										
										
											2025-12-25 14:47:19 +08:00
+									case 400:
 										c.Data(http.StatusBadRequest, "application/json", body)
-												feat(ops): 添加QPS脉搏线图并优化指标布局

- 添加实时QPS/TPS历史数据追踪（最近60个数据点）
- 在平均QPS/TPS上方添加SVG脉搏线图（sparkline）
- 将延迟和TTFT卡片的指标布局从2列改为3列
- 恢复Max指标显示（P95/P90/P50/Avg/Max）

											
										
										
											2026-01-11 11:49:34 +08:00
+										summary := upstreamMsg
 										if summary == "" {
 											summary = truncateForLog(body, 512)
 										}
 										if summary == "" {
 											return nil, fmt.Errorf("upstream error: %d", resp.StatusCode)
 										}
 										return nil, fmt.Errorf("upstream error: %d message=%s", resp.StatusCode, summary)
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									case 401:
 										statusCode = http.StatusBadGateway
 										errType = "upstream_error"
 										errMsg = "Upstream authentication failed, please contact administrator"
 									case 403:
 										statusCode = http.StatusBadGateway
 										errType = "upstream_error"
 										errMsg = "Upstream access forbidden, please contact administrator"
 									case 429:
 										statusCode = http.StatusTooManyRequests
 										errType = "rate_limit_error"
 										errMsg = "Upstream rate limit exceeded, please retry later"
 									case 529:
 										statusCode = http.StatusServiceUnavailable
 										errType = "overloaded_error"
 										errMsg = "Upstream service overloaded, please retry later"
 									case 500, 502, 503, 504:
 										statusCode = http.StatusBadGateway
 										errType = "upstream_error"
 										errMsg = "Upstream service temporarily unavailable"
 									default:
 										statusCode = http.StatusBadGateway
 										errType = "upstream_error"
 										errMsg = "Upstream request failed"
 									}
 									// 返回自定义错误响应
 									c.JSON(statusCode, gin.H{
 										"type": "error",
 										"error": gin.H{
 											"type":    errType,
 											"message": errMsg,
 										},
 									})
-												feat(ops): 添加QPS脉搏线图并优化指标布局

- 添加实时QPS/TPS历史数据追踪（最近60个数据点）
- 在平均QPS/TPS上方添加SVG脉搏线图（sparkline）
- 将延迟和TTFT卡片的指标布局从2列改为3列
- 恢复Max指标显示（P95/P90/P50/Avg/Max）

											
										
										
											2026-01-11 11:49:34 +08:00
+									if upstreamMsg == "" {
 										return nil, fmt.Errorf("upstream error: %d", resp.StatusCode)
 									}
 									return nil, fmt.Errorf("upstream error: %d message=%s", resp.StatusCode, upstreamMsg)
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+								}
-												feat: cc/codex support account retry

											
										
										
											2025-12-27 11:44:00 +08:00
+								func (s *GatewayService) handleRetryExhaustedSideEffects(ctx context.Context, resp *http.Response, account *Account) {
-												feat(ops): 实现上游错误事件记录与查询功能

**新增功能**:
- 新建ops_upstream_error_events表存储上游服务错误详情
- 支持记录上游429/529/5xx错误的详细上下文信息
- 提供按时间范围查询上游错误事件的API

**后端改动**:
1. 模型层（ops_models.go, ops_port.go）:
   - 新增UpstreamErrorEvent结构体
   - 扩展Repository接口支持上游错误事件CRUD

2. 仓储层（ops_repo.go）:
   - 实现InsertUpstreamErrorEvent写入上游错误
   - 实现GetUpstreamErrorEvents按时间范围查询

3. 服务层（ops_service.go, ops_upstream_context.go）:
   - ops_service: 新增GetUpstreamErrorEvents查询方法
   - ops_upstream_context: 封装上游错误上下文构建逻辑

4. Handler层（ops_error_logger.go）:
   - 新增GetUpstreamErrorsHandler处理上游错误查询请求

5. Gateway层集成:
   - antigravity_gateway_service.go: 429/529错误时记录上游事件
   - gateway_service.go: OpenAI 429/5xx错误时记录
   - gemini_messages_compat_service.go: Gemini 429/5xx错误时记录
   - openai_gateway_service.go: OpenAI 429/5xx错误时记录
   - ratelimit_service.go: 429限流错误时记录

**数据记录字段**:
- request_id: 关联ops_logs主记录
- platform/model: 上游服务标识
- status_code/error_message: 错误详情
- request_headers/response_body: 调试信息（可选）
- created_at: 错误发生时间

											
										
										
											2026-01-11 15:30:27 +08:00
+									body, _ := io.ReadAll(io.LimitReader(resp.Body, 2<<20))
-												feat(gateway): 添加上游错误重试机制

- OAuth/Setup Token 账号遇到 403 错误时，等待 2 秒后重试，最多 3 次
- Console 账号遇到未配置的错误码时，同样进行重试
- 重试耗尽后：OAuth 403 标记账号异常，Console 未配置错误码不标记账号
- 移除 handleErrorResponse 中已被重试逻辑覆盖的死代码

											
										
										
											2025-12-24 16:55:46 +08:00
+									statusCode := resp.StatusCode
 									// OAuth/Setup Token 账号的 403：标记账号异常
 									if account.IsOAuth() && statusCode == 403 {
 										s.rateLimitService.HandleUpstreamError(ctx, account, statusCode, resp.Header, body)
-												fix(backend): 修复 P0/P1 严重安全和稳定性问题

P0 严重问题修复：
- 优化重试机制：降至 5 次 + 指数退避 + 10s 上限，防止请求堆积
- 修复 SSE 错误格式：符合 Anthropic API 规范，添加错误类型标准化

P1 重要问题修复：
- 防止 DOS 攻击：使用 io.LimitReader 限制请求体 10MB，流式解析
- 修复计费数据丢失：改为同步计费，使用独立 context 防止中断

技术细节：
- 新增 retryBackoffDelay() 和 sleepWithContext() 支持 context 取消
- 新增 normalizeAnthropicErrorType() 和 sanitizePublicErrorMessage()
- 新增 parseGatewayRequestStream() 实现流式解析
- 新增 recordUsageSync() 确保计费数据持久化

影响：
- 极端场景重试时间从 30s 降至 ≤10s
- 防止高并发 OOM 攻击
- 消除计费数据丢失风险
- 提升客户端兼容性

											
										
										
											2026-01-04 21:29:09 +08:00
+										log.Printf("Account %d: marked as error after %d retries for status %d", account.ID, maxRetryAttempts, statusCode)
-												feat(gateway): 添加上游错误重试机制

- OAuth/Setup Token 账号遇到 403 错误时，等待 2 秒后重试，最多 3 次
- Console 账号遇到未配置的错误码时，同样进行重试
- 重试耗尽后：OAuth 403 标记账号异常，Console 未配置错误码不标记账号
- 移除 handleErrorResponse 中已被重试逻辑覆盖的死代码

											
										
										
											2025-12-24 16:55:46 +08:00
+									} else {
 										// API Key 未配置错误码：不标记账号状态
-												fix(backend): 修复 P0/P1 严重安全和稳定性问题

P0 严重问题修复：
- 优化重试机制：降至 5 次 + 指数退避 + 10s 上限，防止请求堆积
- 修复 SSE 错误格式：符合 Anthropic API 规范，添加错误类型标准化

P1 重要问题修复：
- 防止 DOS 攻击：使用 io.LimitReader 限制请求体 10MB，流式解析
- 修复计费数据丢失：改为同步计费，使用独立 context 防止中断

技术细节：
- 新增 retryBackoffDelay() 和 sleepWithContext() 支持 context 取消
- 新增 normalizeAnthropicErrorType() 和 sanitizePublicErrorMessage()
- 新增 parseGatewayRequestStream() 实现流式解析
- 新增 recordUsageSync() 确保计费数据持久化

影响：
- 极端场景重试时间从 30s 降至 ≤10s
- 防止高并发 OOM 攻击
- 消除计费数据丢失风险
- 提升客户端兼容性

											
										
										
											2026-01-04 21:29:09 +08:00
+										log.Printf("Account %d: upstream error %d after %d retries (not marking account)", account.ID, statusCode, maxRetryAttempts)
-												feat(gateway): 添加上游错误重试机制

- OAuth/Setup Token 账号遇到 403 错误时，等待 2 秒后重试，最多 3 次
- Console 账号遇到未配置的错误码时，同样进行重试
- 重试耗尽后：OAuth 403 标记账号异常，Console 未配置错误码不标记账号
- 移除 handleErrorResponse 中已被重试逻辑覆盖的死代码

											
										
										
											2025-12-24 16:55:46 +08:00
+									}
-												feat: cc/codex support account retry

											
										
										
											2025-12-27 11:44:00 +08:00
+								}
 								func (s *GatewayService) handleFailoverSideEffects(ctx context.Context, resp *http.Response, account *Account) {
-												feat(ops): 实现上游错误事件记录与查询功能

**新增功能**:
- 新建ops_upstream_error_events表存储上游服务错误详情
- 支持记录上游429/529/5xx错误的详细上下文信息
- 提供按时间范围查询上游错误事件的API

**后端改动**:
1. 模型层（ops_models.go, ops_port.go）:
   - 新增UpstreamErrorEvent结构体
   - 扩展Repository接口支持上游错误事件CRUD

2. 仓储层（ops_repo.go）:
   - 实现InsertUpstreamErrorEvent写入上游错误
   - 实现GetUpstreamErrorEvents按时间范围查询

3. 服务层（ops_service.go, ops_upstream_context.go）:
   - ops_service: 新增GetUpstreamErrorEvents查询方法
   - ops_upstream_context: 封装上游错误上下文构建逻辑

4. Handler层（ops_error_logger.go）:
   - 新增GetUpstreamErrorsHandler处理上游错误查询请求

5. Gateway层集成:
   - antigravity_gateway_service.go: 429/529错误时记录上游事件
   - gateway_service.go: OpenAI 429/5xx错误时记录
   - gemini_messages_compat_service.go: Gemini 429/5xx错误时记录
   - openai_gateway_service.go: OpenAI 429/5xx错误时记录
   - ratelimit_service.go: 429限流错误时记录

**数据记录字段**:
- request_id: 关联ops_logs主记录
- platform/model: 上游服务标识
- status_code/error_message: 错误详情
- request_headers/response_body: 调试信息（可选）
- created_at: 错误发生时间

											
										
										
											2026-01-11 15:30:27 +08:00
+									body, _ := io.ReadAll(io.LimitReader(resp.Body, 2<<20))
-												feat: cc/codex support account retry

											
										
										
											2025-12-27 11:44:00 +08:00
+									s.rateLimitService.HandleUpstreamError(ctx, account, resp.StatusCode, resp.Header, body)
 								}
 								// handleRetryExhaustedError 处理重试耗尽后的错误
 								// OAuth 403：标记账号异常
 								// API Key 未配置错误码：仅返回错误，不标记账号
 								func (s *GatewayService) handleRetryExhaustedError(ctx context.Context, resp *http.Response, c *gin.Context, account *Account) (*ForwardResult, error) {
-												feat(ops): 添加QPS脉搏线图并优化指标布局

- 添加实时QPS/TPS历史数据追踪（最近60个数据点）
- 在平均QPS/TPS上方添加SVG脉搏线图（sparkline）
- 将延迟和TTFT卡片的指标布局从2列改为3列
- 恢复Max指标显示（P95/P90/P50/Avg/Max）

											
										
										
											2026-01-11 11:49:34 +08:00
+									// Capture upstream error body before side-effects consume the stream.
 									respBody, _ := io.ReadAll(io.LimitReader(resp.Body, 2<<20))
 									_ = resp.Body.Close()
 									resp.Body = io.NopCloser(bytes.NewReader(respBody))
-												feat: cc/codex support account retry

											
										
										
											2025-12-27 11:44:00 +08:00
+									s.handleRetryExhaustedSideEffects(ctx, resp, account)
-												feat(gateway): 添加上游错误重试机制

- OAuth/Setup Token 账号遇到 403 错误时，等待 2 秒后重试，最多 3 次
- Console 账号遇到未配置的错误码时，同样进行重试
- 重试耗尽后：OAuth 403 标记账号异常，Console 未配置错误码不标记账号
- 移除 handleErrorResponse 中已被重试逻辑覆盖的死代码

											
										
										
											2025-12-24 16:55:46 +08:00
-												feat(ops): 添加QPS脉搏线图并优化指标布局

- 添加实时QPS/TPS历史数据追踪（最近60个数据点）
- 在平均QPS/TPS上方添加SVG脉搏线图（sparkline）
- 将延迟和TTFT卡片的指标布局从2列改为3列
- 恢复Max指标显示（P95/P90/P50/Avg/Max）

											
										
										
											2026-01-11 11:49:34 +08:00
+									upstreamMsg := strings.TrimSpace(extractUpstreamErrorMessage(respBody))
 									upstreamMsg = sanitizeUpstreamErrorMessage(upstreamMsg)
-												chore(debug): emit Claude mimic fingerprint on credential-scope error

											
										
										
											2026-01-29 15:17:46 +08:00
 									if isClaudeCodeCredentialScopeError(upstreamMsg) && c != nil {
 										if v, ok := c.Get(claudeMimicDebugInfoKey); ok {
 											if line, ok := v.(string); ok && strings.TrimSpace(line) != "" {
 												log.Printf("[ClaudeMimicDebugOnError] status=%d request_id=%s %s",
 													resp.StatusCode,
 													resp.Header.Get("x-request-id"),
 													line,
 												)
 											}
 										}
 									}
-												feat(ops): 添加QPS脉搏线图并优化指标布局

- 添加实时QPS/TPS历史数据追踪（最近60个数据点）
- 在平均QPS/TPS上方添加SVG脉搏线图（sparkline）
- 将延迟和TTFT卡片的指标布局从2列改为3列
- 恢复Max指标显示（P95/P90/P50/Avg/Max）

											
										
										
											2026-01-11 11:49:34 +08:00
+									upstreamDetail := ""
 									if s.cfg != nil && s.cfg.Gateway.LogUpstreamErrorBody {
 										maxBytes := s.cfg.Gateway.LogUpstreamErrorBodyMaxBytes
 										if maxBytes <= 0 {
 											maxBytes = 2048
 										}
 										upstreamDetail = truncateString(string(respBody), maxBytes)
 									}
 									setOpsUpstreamError(c, resp.StatusCode, upstreamMsg, upstreamDetail)
-												feat(ops): 实现上游错误事件记录与查询功能

**新增功能**:
- 新建ops_upstream_error_events表存储上游服务错误详情
- 支持记录上游429/529/5xx错误的详细上下文信息
- 提供按时间范围查询上游错误事件的API

**后端改动**:
1. 模型层（ops_models.go, ops_port.go）:
   - 新增UpstreamErrorEvent结构体
   - 扩展Repository接口支持上游错误事件CRUD

2. 仓储层（ops_repo.go）:
   - 实现InsertUpstreamErrorEvent写入上游错误
   - 实现GetUpstreamErrorEvents按时间范围查询

3. 服务层（ops_service.go, ops_upstream_context.go）:
   - ops_service: 新增GetUpstreamErrorEvents查询方法
   - ops_upstream_context: 封装上游错误上下文构建逻辑

4. Handler层（ops_error_logger.go）:
   - 新增GetUpstreamErrorsHandler处理上游错误查询请求

5. Gateway层集成:
   - antigravity_gateway_service.go: 429/529错误时记录上游事件
   - gateway_service.go: OpenAI 429/5xx错误时记录
   - gemini_messages_compat_service.go: Gemini 429/5xx错误时记录
   - openai_gateway_service.go: OpenAI 429/5xx错误时记录
   - ratelimit_service.go: 429限流错误时记录

**数据记录字段**:
- request_id: 关联ops_logs主记录
- platform/model: 上游服务标识
- status_code/error_message: 错误详情
- request_headers/response_body: 调试信息（可选）
- created_at: 错误发生时间

											
										
										
											2026-01-11 15:30:27 +08:00
+									appendOpsUpstreamError(c, OpsUpstreamErrorEvent{
 										Platform:           account.Platform,
 										AccountID:          account.ID,
 										UpstreamStatusCode: resp.StatusCode,
 										UpstreamRequestID:  resp.Header.Get("x-request-id"),
 										Kind:               "retry_exhausted",
 										Message:            upstreamMsg,
 										Detail:             upstreamDetail,
 									})
-												feat(ops): 添加QPS脉搏线图并优化指标布局

- 添加实时QPS/TPS历史数据追踪（最近60个数据点）
- 在平均QPS/TPS上方添加SVG脉搏线图（sparkline）
- 将延迟和TTFT卡片的指标布局从2列改为3列
- 恢复Max指标显示（P95/P90/P50/Avg/Max）

											
										
										
											2026-01-11 11:49:34 +08:00
 									if s.cfg != nil && s.cfg.Gateway.LogUpstreamErrorBody {
 										log.Printf(
 											"Upstream error %d retries_exhausted (account=%d platform=%s type=%s): %s",
 											resp.StatusCode,
 											account.ID,
 											account.Platform,
 											account.Type,
 											truncateForLog(respBody, s.cfg.Gateway.LogUpstreamErrorBodyMaxBytes),
 										)
 									}
-												feat(gateway): 添加上游错误重试机制

- OAuth/Setup Token 账号遇到 403 错误时，等待 2 秒后重试，最多 3 次
- Console 账号遇到未配置的错误码时，同样进行重试
- 重试耗尽后：OAuth 403 标记账号异常，Console 未配置错误码不标记账号
- 移除 handleErrorResponse 中已被重试逻辑覆盖的死代码

											
										
										
											2025-12-24 16:55:46 +08:00
+									// 返回统一的重试耗尽错误响应
 									c.JSON(http.StatusBadGateway, gin.H{
 										"type": "error",
 										"error": gin.H{
 											"type":    "upstream_error",
 											"message": "Upstream request failed after retries",
 										},
 									})
-												feat(ops): 添加QPS脉搏线图并优化指标布局

- 添加实时QPS/TPS历史数据追踪（最近60个数据点）
- 在平均QPS/TPS上方添加SVG脉搏线图（sparkline）
- 将延迟和TTFT卡片的指标布局从2列改为3列
- 恢复Max指标显示（P95/P90/P50/Avg/Max）

											
										
										
											2026-01-11 11:49:34 +08:00
+									if upstreamMsg == "" {
 										return nil, fmt.Errorf("upstream error: %d (retries exhausted)", resp.StatusCode)
 									}
 									return nil, fmt.Errorf("upstream error: %d (retries exhausted) message=%s", resp.StatusCode, upstreamMsg)
-												feat(gateway): 添加上游错误重试机制

- OAuth/Setup Token 账号遇到 403 错误时，等待 2 秒后重试，最多 3 次
- Console 账号遇到未配置的错误码时，同样进行重试
- 重试耗尽后：OAuth 403 标记账号异常，Console 未配置错误码不标记账号
- 移除 handleErrorResponse 中已被重试逻辑覆盖的死代码

											
										
										
											2025-12-24 16:55:46 +08:00
+								}
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+								// streamingResult 流式响应结果
 								type streamingResult struct {
-												fix(billing): 修复客户端取消请求时计费丢失问题

检测 context.Canceled 作为客户端断开信号，返回已收集的 usage 而非错误

											
										
										
											2026-01-08 11:25:17 +08:00
+									usage            *ClaudeUsage
 									firstTokenMs     *int
 									clientDisconnect bool // 客户端是否在流式传输过程中断开
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+								}
-												fix(网关): 区分 Claude Code OAuth 适配

											
										
										
											2026-01-15 19:17:07 +08:00
+								func (s *GatewayService) handleStreamingResponse(ctx context.Context, resp *http.Response, c *gin.Context, account *Account, startTime time.Time, originalModel, mappedModel string, toolNameMap map[string]string, mimicClaudeCode bool) (*streamingResult, error) {
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									// 更新5h窗口状态
 									s.rateLimitService.UpdateSessionWindow(ctx, account, resp.Header)
-												feat(安全): 添加安全开关并完善测试流程

实现安全开关默认关闭与响应头透传逻辑
- URL 校验与响应头过滤支持开关并覆盖流式路径
- 非流式 Content-Type 透传/默认值按配置生效
- 接入 go test、golangci-lint 与前端 lint/typecheck
- 补充相关测试与配置/文档说明

											
										
										
											2026-01-05 13:54:43 +08:00
+									if s.cfg != nil {
 										responseheaders.WriteFilteredHeaders(c.Writer.Header(), resp.Header, s.cfg.Security.ResponseHeaders)
 									}
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									// 设置SSE响应头
 									c.Header("Content-Type", "text/event-stream")
 									c.Header("Cache-Control", "no-cache")
 									c.Header("Connection", "keep-alive")
 									c.Header("X-Accel-Buffering", "no")
 									// 透传其他响应头
 									if v := resp.Header.Get("x-request-id"); v != "" {
 										c.Header("x-request-id", v)
 									}
 									w := c.Writer
 									flusher, ok := w.(http.Flusher)
 									if !ok {
 										return nil, errors.New("streaming not supported")
 									}
 									usage := &ClaudeUsage{}
 									var firstTokenMs *int
 									scanner := bufio.NewScanner(resp.Body)
 									// 设置更大的buffer以处理长行
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
+									maxLineSize := defaultMaxLineSize
 									if s.cfg != nil && s.cfg.Gateway.MaxLineSize > 0 {
 										maxLineSize = s.cfg.Gateway.MaxLineSize
 									}
 									scanner.Buffer(make([]byte, 64*1024), maxLineSize)
 									type scanEvent struct {
 										line string
 										err  error
 									}
 									// 独立 goroutine 读取上游，避免读取阻塞导致超时/keepalive无法处理
-												fix(流式): 以上游读取判定超时并调大事件缓冲

- 以读取时间戳判定流式间隔超时，避免下游阻塞误判
- antigravity 流式读取使用 MaxLineSize 配置
- 事件通道缓冲提升到 16

测试: go test ./...

											
										
										
											2026-01-04 20:19:07 +08:00
+									events := make(chan scanEvent, 16)
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
+									done := make(chan struct{})
 									sendEvent := func(ev scanEvent) bool {
 										select {
 										case events <- ev:
 											return true
 										case <-done:
 											return false
 										}
 									}
-												fix(流式): 以上游读取判定超时并调大事件缓冲

- 以读取时间戳判定流式间隔超时，避免下游阻塞误判
- antigravity 流式读取使用 MaxLineSize 配置
- 事件通道缓冲提升到 16

测试: go test ./...

											
										
										
											2026-01-04 20:19:07 +08:00
+									var lastReadAt int64
 									atomic.StoreInt64(&lastReadAt, time.Now().UnixNano())
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
+									go func() {
 										defer close(events)
 										for scanner.Scan() {
-												fix(流式): 以上游读取判定超时并调大事件缓冲

- 以读取时间戳判定流式间隔超时，避免下游阻塞误判
- antigravity 流式读取使用 MaxLineSize 配置
- 事件通道缓冲提升到 16

测试: go test ./...

											
										
										
											2026-01-04 20:19:07 +08:00
+											atomic.StoreInt64(&lastReadAt, time.Now().UnixNano())
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
+											if !sendEvent(scanEvent{line: scanner.Text()}) {
 												return
 											}
 										}
 										if err := scanner.Err(); err != nil {
 											_ = sendEvent(scanEvent{err: err})
 										}
 									}()
 									defer close(done)
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
+									streamInterval := time.Duration(0)
 									if s.cfg != nil && s.cfg.Gateway.StreamDataIntervalTimeout > 0 {
 										streamInterval = time.Duration(s.cfg.Gateway.StreamDataIntervalTimeout) * time.Second
 									}
-												fix(流式): 以上游读取判定超时并调大事件缓冲

- 以读取时间戳判定流式间隔超时，避免下游阻塞误判
- antigravity 流式读取使用 MaxLineSize 配置
- 事件通道缓冲提升到 16

测试: go test ./...

											
										
										
											2026-01-04 20:19:07 +08:00
+									// 仅监控上游数据间隔超时，避免下游写入阻塞导致误判
 									var intervalTicker *time.Ticker
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
+									if streamInterval > 0 {
-												fix(流式): 以上游读取判定超时并调大事件缓冲

- 以读取时间戳判定流式间隔超时，避免下游阻塞误判
- antigravity 流式读取使用 MaxLineSize 配置
- 事件通道缓冲提升到 16

测试: go test ./...

											
										
										
											2026-01-04 20:19:07 +08:00
+										intervalTicker = time.NewTicker(streamInterval)
 										defer intervalTicker.Stop()
 									}
 									var intervalCh <-chan time.Time
 									if intervalTicker != nil {
 										intervalCh = intervalTicker.C
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
+									}
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
+									// 仅发送一次错误事件，避免多次写入导致协议混乱（写失败时尽力通知客户端）
 									errorEventSent := false
 									sendErrorEvent := func(reason string) {
 										if errorEventSent {
 											return
-												CC Stream 响应流中出现 error 时, 增加返回重试 (#86)

* 响应流中出现 error, 返回重试

* 响应流中出现 error, 返回重试
											
										
										
											2025-12-30 10:48:55 +08:00
+										}
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
+										errorEventSent = true
 										_, _ = fmt.Fprintf(w, "event: error\ndata: {\"error\":\"%s\"}\n\n", reason)
 										flusher.Flush()
 									}
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
+									needModelReplace := originalModel != mappedModel
-												fix(billing): 修复客户端取消请求时计费丢失问题

检测 context.Canceled 作为客户端断开信号，返回已收集的 usage 而非错误

											
										
										
											2026-01-08 11:25:17 +08:00
+									clientDisconnected := false // 客户端断开标志，断开后继续读取上游以获取完整usage
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
-												fix(网关): SSE 缓冲 input_json_delta 反向转换

											
										
										
											2026-01-19 03:46:09 +08:00
+									pendingEventLines := make([]string, 0, 4)
-												fix(gateway): gate streaming tool rewrites behind mimic

											
										
										
											2026-01-19 16:20:24 +08:00
+									var toolInputBuffers map[int]string
 									if mimicClaudeCode {
 										toolInputBuffers = make(map[int]string)
 									}
-												fix(网关): SSE 缓冲 input_json_delta 反向转换

											
										
										
											2026-01-19 03:46:09 +08:00
 									transformToolInputJSON := func(raw string) string {
-												fix(gateway): gate streaming tool rewrites behind mimic

											
										
										
											2026-01-19 16:20:24 +08:00
+										if !mimicClaudeCode {
 											return raw
 										}
-												fix(网关): SSE 缓冲 input_json_delta 反向转换

											
										
										
											2026-01-19 03:46:09 +08:00
+										raw = strings.TrimSpace(raw)
 										if raw == "" {
 											return raw
 										}
 										var parsed any
 										if err := json.Unmarshal([]byte(raw), &parsed); err != nil {
 											return replaceToolNamesInText(raw, toolNameMap)
 										}
 										rewritten, changed := rewriteParamKeysInValue(parsed, toolNameMap)
 										if changed {
 											if bytes, err := json.Marshal(rewritten); err == nil {
 												return string(bytes)
 											}
 										}
 										return raw
 									}
 									processSSEEvent := func(lines []string) ([]string, string, error) {
 										if len(lines) == 0 {
 											return nil, "", nil
 										}
 										eventName := ""
 										dataLine := ""
 										for _, line := range lines {
 											trimmed := strings.TrimSpace(line)
 											if strings.HasPrefix(trimmed, "event:") {
 												eventName = strings.TrimSpace(strings.TrimPrefix(trimmed, "event:"))
 												continue
 											}
 											if dataLine == "" && sseDataRe.MatchString(trimmed) {
 												dataLine = sseDataRe.ReplaceAllString(trimmed, "")
 											}
 										}
 										if eventName == "error" {
 											return nil, dataLine, errors.New("have error in stream")
 										}
 										if dataLine == "" {
 											return []string{strings.Join(lines, "\n") + "\n\n"}, "", nil
 										}
 										if dataLine == "[DONE]" {
 											block := ""
 											if eventName != "" {
 												block = "event: " + eventName + "\n"
 											}
 											block += "data: " + dataLine + "\n\n"
 											return []string{block}, dataLine, nil
 										}
 										var event map[string]any
 										if err := json.Unmarshal([]byte(dataLine), &event); err != nil {
-												fix(gateway): gate streaming tool rewrites behind mimic

											
										
										
											2026-01-19 16:20:24 +08:00
+											replaced := dataLine
 											if mimicClaudeCode {
 												replaced = replaceToolNamesInText(dataLine, toolNameMap)
 											}
-												fix(网关): SSE 缓冲 input_json_delta 反向转换

											
										
										
											2026-01-19 03:46:09 +08:00
+											block := ""
 											if eventName != "" {
 												block = "event: " + eventName + "\n"
 											}
 											block += "data: " + replaced + "\n\n"
 											return []string{block}, replaced, nil
 										}
 										eventType, _ := event["type"].(string)
 										if eventName == "" {
 											eventName = eventType
 										}
-												fix(网关): 修复流式 tool 输入参数转换

											
										
										
											2026-01-19 03:53:08 +08:00
+										if needModelReplace {
-												fix(网关): SSE 缓冲 input_json_delta 反向转换

											
										
										
											2026-01-19 03:46:09 +08:00
+											if msg, ok := event["message"].(map[string]any); ok {
 												if model, ok := msg["model"].(string); ok && model == mappedModel {
 													msg["model"] = originalModel
 												}
 											}
 										}
-												fix(gateway): gate streaming tool rewrites behind mimic

											
										
										
											2026-01-19 16:20:24 +08:00
+										if mimicClaudeCode && eventType == "content_block_delta" {
-												fix(网关): SSE 缓冲 input_json_delta 反向转换

											
										
										
											2026-01-19 03:46:09 +08:00
+											if delta, ok := event["delta"].(map[string]any); ok {
 												if deltaType, _ := delta["type"].(string); deltaType == "input_json_delta" {
 													if indexVal, ok := event["index"].(float64); ok {
 														index := int(indexVal)
 														if partial, ok := delta["partial_json"].(string); ok {
 															toolInputBuffers[index] += partial
 														}
 													}
 													return nil, dataLine, nil
 												}
 											}
 										}
-												fix(gateway): gate streaming tool rewrites behind mimic

											
										
										
											2026-01-19 16:20:24 +08:00
+										if mimicClaudeCode && eventType == "content_block_stop" {
-												fix(网关): SSE 缓冲 input_json_delta 反向转换

											
										
										
											2026-01-19 03:46:09 +08:00
+											if indexVal, ok := event["index"].(float64); ok {
 												index := int(indexVal)
 												if buffered := toolInputBuffers[index]; buffered != "" {
 													delete(toolInputBuffers, index)
 													transformed := transformToolInputJSON(buffered)
 													synthetic := map[string]any{
 														"type":  "content_block_delta",
 														"index": index,
 														"delta": map[string]any{
 															"type":         "input_json_delta",
 															"partial_json": transformed,
 														},
 													}
 													synthBytes, synthErr := json.Marshal(synthetic)
 													if synthErr == nil {
 														synthBlock := "event: content_block_delta\n" + "data: " + string(synthBytes) + "\n\n"
 														rewriteToolNamesInValue(event, toolNameMap)
 														stopBytes, stopErr := json.Marshal(event)
 														if stopErr == nil {
 															stopBlock := ""
 															if eventName != "" {
 																stopBlock = "event: " + eventName + "\n"
 															}
 															stopBlock += "data: " + string(stopBytes) + "\n\n"
 															return []string{synthBlock, stopBlock}, string(stopBytes), nil
 														}
 													}
 												}
 											}
 										}
-												fix(gateway): gate streaming tool rewrites behind mimic

											
										
										
											2026-01-19 16:20:24 +08:00
+										if mimicClaudeCode {
 											rewriteToolNamesInValue(event, toolNameMap)
 										}
-												fix(网关): SSE 缓冲 input_json_delta 反向转换

											
										
										
											2026-01-19 03:46:09 +08:00
+										newData, err := json.Marshal(event)
 										if err != nil {
-												fix(gateway): gate streaming tool rewrites behind mimic

											
										
										
											2026-01-19 16:20:24 +08:00
+											replaced := dataLine
 											if mimicClaudeCode {
 												replaced = replaceToolNamesInText(dataLine, toolNameMap)
 											}
-												fix(网关): SSE 缓冲 input_json_delta 反向转换

											
										
										
											2026-01-19 03:46:09 +08:00
+											block := ""
 											if eventName != "" {
 												block = "event: " + eventName + "\n"
 											}
 											block += "data: " + replaced + "\n\n"
 											return []string{block}, replaced, nil
 										}
 										block := ""
 										if eventName != "" {
 											block = "event: " + eventName + "\n"
 										}
 										block += "data: " + string(newData) + "\n\n"
 										return []string{block}, string(newData), nil
 									}
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
+									for {
 										select {
 										case ev, ok := <-events:
 											if !ok {
-												fix(billing): 修复客户端取消请求时计费丢失问题

检测 context.Canceled 作为客户端断开信号，返回已收集的 usage 而非错误

											
										
										
											2026-01-08 11:25:17 +08:00
+												// 上游完成，返回结果
 												return &streamingResult{usage: usage, firstTokenMs: firstTokenMs, clientDisconnect: clientDisconnected}, nil
-												fix(sse): 修复非标准 SSE 格式解析问题

部分上游 API 返回的 SSE 格式不符合标准规范：
- 标准格式: `data: {...}`（冒号后有空格）
- 非标准格式: `data:{...}`（冒号后无空格）

使用预编译正则 `^data:\s*` 统一处理两种格式。

											
										
										
											2025-12-26 03:49:55 -08:00
+											}
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
+											if ev.err != nil {
-												fix(billing): 修复客户端取消请求时计费丢失问题

检测 context.Canceled 作为客户端断开信号，返回已收集的 usage 而非错误

											
										
										
											2026-01-08 11:25:17 +08:00
+												// 检测 context 取消（客户端断开会导致 context 取消，进而影响上游读取）
 												if errors.Is(ev.err, context.Canceled) || errors.Is(ev.err, context.DeadlineExceeded) {
 													log.Printf("Context canceled during streaming, returning collected usage")
 													return &streamingResult{usage: usage, firstTokenMs: firstTokenMs, clientDisconnect: true}, nil
 												}
 												// 客户端已通过写入失败检测到断开，上游也出错了，返回已收集的 usage
 												if clientDisconnected {
 													log.Printf("Upstream read error after client disconnect: %v, returning collected usage", ev.err)
 													return &streamingResult{usage: usage, firstTokenMs: firstTokenMs, clientDisconnect: true}, nil
 												}
 												// 客户端未断开，正常的错误处理
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
+												if errors.Is(ev.err, bufio.ErrTooLong) {
 													log.Printf("SSE line too long: account=%d max_size=%d error=%v", account.ID, maxLineSize, ev.err)
 													sendErrorEvent("response_too_large")
 													return &streamingResult{usage: usage, firstTokenMs: firstTokenMs}, ev.err
 												}
 												sendErrorEvent("stream_read_error")
 												return &streamingResult{usage: usage, firstTokenMs: firstTokenMs}, fmt.Errorf("stream read error: %w", ev.err)
 											}
 											line := ev.line
-												fix(网关): SSE 缓冲 input_json_delta 反向转换

											
										
										
											2026-01-19 03:46:09 +08:00
+											trimmed := strings.TrimSpace(line)
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
-												fix(网关): SSE 缓冲 input_json_delta 反向转换

											
										
										
											2026-01-19 03:46:09 +08:00
+											if trimmed == "" {
 												if len(pendingEventLines) == 0 {
 													continue
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
+												}
-												fix(网关): SSE 缓冲 input_json_delta 反向转换

											
										
										
											2026-01-19 03:46:09 +08:00
+												outputBlocks, data, err := processSSEEvent(pendingEventLines)
 												pendingEventLines = pendingEventLines[:0]
 												if err != nil {
 													if clientDisconnected {
 														return &streamingResult{usage: usage, firstTokenMs: firstTokenMs, clientDisconnect: true}, nil
 													}
 													return nil, err
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
+												}
-												fix(网关): SSE 缓冲 input_json_delta 反向转换

											
										
										
											2026-01-19 03:46:09 +08:00
+												for _, block := range outputBlocks {
 													if !clientDisconnected {
 														if _, werr := fmt.Fprint(w, block); werr != nil {
 															clientDisconnected = true
 															log.Printf("Client disconnected during streaming, continuing to drain upstream for billing")
 															break
 														}
 														flusher.Flush()
 													}
 													if data != "" {
 														if firstTokenMs == nil && data != "[DONE]" {
 															ms := int(time.Since(startTime).Milliseconds())
 															firstTokenMs = &ms
 														}
 														s.parseSSEUsage(data, usage)
 													}
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
+												}
-												fix(网关): SSE 缓冲 input_json_delta 反向转换

											
										
										
											2026-01-19 03:46:09 +08:00
+												continue
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+											}
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
-												fix(网关): SSE 缓冲 input_json_delta 反向转换

											
										
										
											2026-01-19 03:46:09 +08:00
+											pendingEventLines = append(pendingEventLines, line)
-												fix(流式): 以上游读取判定超时并调大事件缓冲

- 以读取时间戳判定流式间隔超时，避免下游阻塞误判
- antigravity 流式读取使用 MaxLineSize 配置
- 事件通道缓冲提升到 16

测试: go test ./...

											
										
										
											2026-01-04 20:19:07 +08:00
+										case <-intervalCh:
 											lastRead := time.Unix(0, atomic.LoadInt64(&lastReadAt))
 											if time.Since(lastRead) < streamInterval {
 												continue
-												fix(sse): 修复非标准 SSE 格式解析问题

部分上游 API 返回的 SSE 格式不符合标准规范：
- 标准格式: `data: {...}`（冒号后有空格）
- 非标准格式: `data:{...}`（冒号后无空格）

使用预编译正则 `^data:\s*` 统一处理两种格式。

											
										
										
											2025-12-26 03:49:55 -08:00
+											}
-												fix(billing): 修复客户端取消请求时计费丢失问题

检测 context.Canceled 作为客户端断开信号，返回已收集的 usage 而非错误

											
										
										
											2026-01-08 11:25:17 +08:00
+											if clientDisconnected {
 												// 客户端已断开，上游也超时了，返回已收集的 usage
 												log.Printf("Upstream timeout after client disconnect, returning collected usage")
 												return &streamingResult{usage: usage, firstTokenMs: firstTokenMs, clientDisconnect: true}, nil
 											}
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
+											log.Printf("Stream data interval timeout: account=%d model=%s interval=%s", account.ID, originalModel, streamInterval)
-												feat(gateway): 添加流超时处理机制

- 添加 StreamTimeoutSettings 配置结构体和系统设置
- 实现 TimeoutCounterCache Redis 计数器用于累计超时次数
- 在 RateLimitService 添加 HandleStreamTimeout 方法
- 在 gateway_service、openai_gateway_service、antigravity_gateway_service 中调用超时处理
- 添加后端 API 端点 GET/PUT /admin/settings/stream-timeout
- 添加前端配置界面到系统设置页面
- 支持配置：启用开关、超时阈值、处理方式、暂停时长、触发阈值、阈值窗口

默认配置：
- 启用：true
- 超时阈值：60秒
- 处理方式：临时不可调度
- 暂停时长：5分钟
- 触发阈值：3次
- 阈值窗口：10分钟

											
										
										
											2026-01-11 21:54:52 -08:00
+											// 处理流超时，可能标记账户为临时不可调度或错误状态
 											if s.rateLimitService != nil {
 												s.rateLimitService.HandleStreamTimeout(ctx, account, originalModel)
 											}
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
+											sendErrorEvent("stream_timeout")
 											return &streamingResult{usage: usage, firstTokenMs: firstTokenMs}, fmt.Errorf("stream data interval timeout")
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+										}
 									}
 								}
-												fix(网关): 补齐非 Claude Code OAuth 兼容

											
										
										
											2026-01-16 00:41:29 +08:00
+								func rewriteParamKeysInValue(value any, cache map[string]string) (any, bool) {
 									switch v := value.(type) {
 									case map[string]any:
 										changed := false
 										rewritten := make(map[string]any, len(v))
 										for key, item := range v {
 											newKey := normalizeParamNameForOpenCode(key, cache)
 											newItem, childChanged := rewriteParamKeysInValue(item, cache)
 											if childChanged {
 												changed = true
 											}
 											if newKey != key {
 												changed = true
 											}
 											rewritten[newKey] = newItem
 										}
 										if !changed {
 											return value, false
 										}
 										return rewritten, true
 									case []any:
 										changed := false
 										rewritten := make([]any, len(v))
 										for idx, item := range v {
 											newItem, childChanged := rewriteParamKeysInValue(item, cache)
 											if childChanged {
 												changed = true
 											}
 											rewritten[idx] = newItem
 										}
 										if !changed {
 											return value, false
 										}
 										return rewritten, true
 									default:
 										return value, false
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									}
-												fix(网关): 补齐非 Claude Code OAuth 兼容

											
										
										
											2026-01-16 00:41:29 +08:00
+								}
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
-												fix(网关): 对齐 Claude OAuth 请求适配

											
										
										
											2026-01-15 18:54:42 +08:00
+								func rewriteToolNamesInValue(value any, toolNameMap map[string]string) bool {
 									switch v := value.(type) {
 									case map[string]any:
 										changed := false
 										if blockType, _ := v["type"].(string); blockType == "tool_use" {
 											if name, ok := v["name"].(string); ok {
 												mapped := normalizeToolNameForOpenCode(name, toolNameMap)
 												if mapped != name {
 													v["name"] = mapped
 													changed = true
 												}
 											}
-												fix(网关): 补齐非 Claude Code OAuth 兼容

											
										
										
											2026-01-16 00:41:29 +08:00
+											if input, ok := v["input"].(map[string]any); ok {
 												rewrittenInput, inputChanged := rewriteParamKeysInValue(input, toolNameMap)
 												if inputChanged {
 													if m, ok := rewrittenInput.(map[string]any); ok {
 														v["input"] = m
 														changed = true
 													}
 												}
 											}
-												fix(网关): 对齐 Claude OAuth 请求适配

											
										
										
											2026-01-15 18:54:42 +08:00
+										}
 										for _, item := range v {
 											if rewriteToolNamesInValue(item, toolNameMap) {
 												changed = true
 											}
 										}
 										return changed
 									case []any:
 										changed := false
 										for _, item := range v {
 											if rewriteToolNamesInValue(item, toolNameMap) {
 												changed = true
 											}
 										}
 										return changed
 									default:
 										return false
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									}
-												fix(网关): 对齐 Claude OAuth 请求适配

											
										
										
											2026-01-15 18:54:42 +08:00
+								}
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
-												fix(网关): 区分 Claude Code OAuth 适配

											
										
										
											2026-01-15 19:17:07 +08:00
+								func replaceToolNamesInText(text string, toolNameMap map[string]string) string {
 									if text == "" {
 										return text
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									}
-												fix(网关): 区分 Claude Code OAuth 适配

											
										
										
											2026-01-15 19:17:07 +08:00
+									output := toolNameFieldRe.ReplaceAllStringFunc(text, func(match string) string {
 										submatches := toolNameFieldRe.FindStringSubmatch(match)
 										if len(submatches) < 2 {
 											return match
 										}
 										name := submatches[1]
 										mapped := normalizeToolNameForOpenCode(name, toolNameMap)
 										if mapped == name {
 											return match
 										}
 										return strings.Replace(match, name, mapped, 1)
 									})
 									output = modelFieldRe.ReplaceAllStringFunc(output, func(match string) string {
 										submatches := modelFieldRe.FindStringSubmatch(match)
 										if len(submatches) < 2 {
 											return match
 										}
 										model := submatches[1]
 										mapped := claude.DenormalizeModelID(model)
 										if mapped == model {
 											return match
 										}
 										return strings.Replace(match, model, mapped, 1)
 									})
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
-												fix(网关): 补齐非 Claude Code OAuth 兼容

											
										
										
											2026-01-16 00:41:29 +08:00
+									for mapped, original := range toolNameMap {
 										if mapped == "" || original == "" || mapped == original {
 											continue
 										}
 										output = strings.ReplaceAll(output, "\""+mapped+"\":", "\""+original+"\":")
 										output = strings.ReplaceAll(output, "\\\""+mapped+"\\\":", "\\\""+original+"\\\":")
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									}
-												fix(网关): 区分 Claude Code OAuth 适配

											
										
										
											2026-01-15 19:17:07 +08:00
+									return output
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+								}
 								func (s *GatewayService) parseSSEUsage(data string, usage *ClaudeUsage) {
-												fix: 兼容GLM等API的usage数据解析

部分第三方API（如GLM）的SSE响应格式与标准Claude API不同：
- 标准Claude: input_tokens在message_start中
- GLM等API: 所有tokens都在message_delta中

现在从message_delta中也解析input_tokens和cache相关字段，
如果message_start中没有值则使用message_delta中的数据。

											
										
										
											2025-12-23 16:53:53 +08:00
+									// 解析message_start获取input tokens（标准Claude API格式）
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									var msgStart struct {
 										Type    string `json:"type"`
 										Message struct {
 											Usage ClaudeUsage `json:"usage"`
 										} `json:"message"`
 									}
 									if json.Unmarshal([]byte(data), &msgStart) == nil && msgStart.Type == "message_start" {
 										usage.InputTokens = msgStart.Message.Usage.InputTokens
 										usage.CacheCreationInputTokens = msgStart.Message.Usage.CacheCreationInputTokens
 										usage.CacheReadInputTokens = msgStart.Message.Usage.CacheReadInputTokens
 									}
-												fix: 兼容GLM等API的usage数据解析

部分第三方API（如GLM）的SSE响应格式与标准Claude API不同：
- 标准Claude: input_tokens在message_start中
- GLM等API: 所有tokens都在message_delta中

现在从message_delta中也解析input_tokens和cache相关字段，
如果message_start中没有值则使用message_delta中的数据。

											
										
										
											2025-12-23 16:53:53 +08:00
+									// 解析message_delta获取tokens（兼容GLM等把所有usage放在delta中的API）
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									var msgDelta struct {
 										Type  string `json:"type"`
 										Usage struct {
-												fix: 兼容GLM等API的usage数据解析

部分第三方API（如GLM）的SSE响应格式与标准Claude API不同：
- 标准Claude: input_tokens在message_start中
- GLM等API: 所有tokens都在message_delta中

现在从message_delta中也解析input_tokens和cache相关字段，
如果message_start中没有值则使用message_delta中的数据。

											
										
										
											2025-12-23 16:53:53 +08:00
+											InputTokens              int `json:"input_tokens"`
 											OutputTokens             int `json:"output_tokens"`
 											CacheCreationInputTokens int `json:"cache_creation_input_tokens"`
 											CacheReadInputTokens     int `json:"cache_read_input_tokens"`
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+										} `json:"usage"`
 									}
 									if json.Unmarshal([]byte(data), &msgDelta) == nil && msgDelta.Type == "message_delta" {
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+										// message_delta 仅覆盖存在且非0的字段
 										// 避免覆盖 message_start 中已有的值（如 input_tokens）
 										// Claude API 的 message_delta 通常只包含 output_tokens
 										if msgDelta.Usage.InputTokens > 0 {
-												fix: 兼容GLM等API的usage数据解析

部分第三方API（如GLM）的SSE响应格式与标准Claude API不同：
- 标准Claude: input_tokens在message_start中
- GLM等API: 所有tokens都在message_delta中

现在从message_delta中也解析input_tokens和cache相关字段，
如果message_start中没有值则使用message_delta中的数据。

											
										
										
											2025-12-23 16:53:53 +08:00
+											usage.InputTokens = msgDelta.Usage.InputTokens
 										}
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+										if msgDelta.Usage.OutputTokens > 0 {
 											usage.OutputTokens = msgDelta.Usage.OutputTokens
 										}
 										if msgDelta.Usage.CacheCreationInputTokens > 0 {
-												fix: 兼容GLM等API的usage数据解析

部分第三方API（如GLM）的SSE响应格式与标准Claude API不同：
- 标准Claude: input_tokens在message_start中
- GLM等API: 所有tokens都在message_delta中

现在从message_delta中也解析input_tokens和cache相关字段，
如果message_start中没有值则使用message_delta中的数据。

											
										
										
											2025-12-23 16:53:53 +08:00
+											usage.CacheCreationInputTokens = msgDelta.Usage.CacheCreationInputTokens
 										}
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+										if msgDelta.Usage.CacheReadInputTokens > 0 {
-												fix: 兼容GLM等API的usage数据解析

部分第三方API（如GLM）的SSE响应格式与标准Claude API不同：
- 标准Claude: input_tokens在message_start中
- GLM等API: 所有tokens都在message_delta中

现在从message_delta中也解析input_tokens和cache相关字段，
如果message_start中没有值则使用message_delta中的数据。

											
										
										
											2025-12-23 16:53:53 +08:00
+											usage.CacheReadInputTokens = msgDelta.Usage.CacheReadInputTokens
 										}
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									}
 								}
-												fix(网关): 区分 Claude Code OAuth 适配

											
										
										
											2026-01-15 19:17:07 +08:00
+								func (s *GatewayService) handleNonStreamingResponse(ctx context.Context, resp *http.Response, c *gin.Context, account *Account, originalModel, mappedModel string, toolNameMap map[string]string, mimicClaudeCode bool) (*ClaudeUsage, error) {
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									// 更新5h窗口状态
 									s.rateLimitService.UpdateSessionWindow(ctx, account, resp.Header)
 									body, err := io.ReadAll(resp.Body)
 									if err != nil {
 										return nil, err
 									}
 									// 解析usage
 									var response struct {
 										Usage ClaudeUsage `json:"usage"`
 									}
 									if err := json.Unmarshal(body, &response); err != nil {
 										return nil, fmt.Errorf("parse response: %w", err)
 									}
 									// 如果有模型映射，替换响应中的model字段
 									if originalModel != mappedModel {
 										body = s.replaceModelInResponseBody(body, mappedModel, originalModel)
 									}
-												fix(网关): 区分 Claude Code OAuth 适配

											
										
										
											2026-01-15 19:17:07 +08:00
+									if mimicClaudeCode {
-												fix(网关): 对齐 Claude OAuth 请求适配

											
										
										
											2026-01-15 18:54:42 +08:00
+										body = s.replaceToolNamesInResponseBody(body, toolNameMap)
 									}
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
-												feat(安全): 强化安全策略与配置校验

- 增加 CORS/CSP/安全响应头与代理信任配置

- 引入 URL 白名单与私网开关，校验上游与价格源

- 改善 API Key 处理与网关错误返回

- 管理端设置隐藏敏感字段并优化前端提示

- 增加计费熔断与相关配置示例

测试: go test ./...

											
										
										
											2026-01-02 17:40:57 +08:00
+									responseheaders.WriteFilteredHeaders(c.Writer.Header(), resp.Header, s.cfg.Security.ResponseHeaders)
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
-												feat(安全): 添加安全开关并完善测试流程

实现安全开关默认关闭与响应头透传逻辑
- URL 校验与响应头过滤支持开关并覆盖流式路径
- 非流式 Content-Type 透传/默认值按配置生效
- 接入 go test、golangci-lint 与前端 lint/typecheck
- 补充相关测试与配置/文档说明

											
										
										
											2026-01-05 13:54:43 +08:00
+									contentType := "application/json"
 									if s.cfg != nil && !s.cfg.Security.ResponseHeaders.Enabled {
 										if upstreamType := resp.Header.Get("Content-Type"); upstreamType != "" {
 											contentType = upstreamType
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+										}
 									}
 									// 写入响应
-												feat(安全): 添加安全开关并完善测试流程

实现安全开关默认关闭与响应头透传逻辑
- URL 校验与响应头过滤支持开关并覆盖流式路径
- 非流式 Content-Type 透传/默认值按配置生效
- 接入 go test、golangci-lint 与前端 lint/typecheck
- 补充相关测试与配置/文档说明

											
										
										
											2026-01-05 13:54:43 +08:00
+									c.Data(resp.StatusCode, contentType, body)
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
 									return &response.Usage, nil
 								}
 								// replaceModelInResponseBody 替换响应体中的model字段
 								func (s *GatewayService) replaceModelInResponseBody(body []byte, fromModel, toModel string) []byte {
-												ci(backend): 添加 gofmt 配置

											
										
										
											2025-12-20 16:19:40 +08:00
+									var resp map[string]any
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									if err := json.Unmarshal(body, &resp); err != nil {
 										return body
 									}
 									model, ok := resp["model"].(string)
 									if !ok || model != fromModel {
 										return body
 									}
 									resp["model"] = toModel
 									newBody, err := json.Marshal(resp)
 									if err != nil {
 										return body
 									}
 									return newBody
 								}
-												fix(网关): 对齐 Claude OAuth 请求适配

											
										
										
											2026-01-15 18:54:42 +08:00
+								func (s *GatewayService) replaceToolNamesInResponseBody(body []byte, toolNameMap map[string]string) []byte {
 									if len(body) == 0 {
 										return body
 									}
 									var resp map[string]any
 									if err := json.Unmarshal(body, &resp); err != nil {
-												fix(网关): 区分 Claude Code OAuth 适配

											
										
										
											2026-01-15 19:17:07 +08:00
+										replaced := replaceToolNamesInText(string(body), toolNameMap)
 										if replaced == string(body) {
 											return body
 										}
 										return []byte(replaced)
-												fix(网关): 对齐 Claude OAuth 请求适配

											
										
										
											2026-01-15 18:54:42 +08:00
+									}
 									if !rewriteToolNamesInValue(resp, toolNameMap) {
 										return body
 									}
 									newBody, err := json.Marshal(resp)
 									if err != nil {
 										return body
 									}
 									return newBody
 								}
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+								// RecordUsageInput 记录使用量的输入参数
 								type RecordUsageInput struct {
 									Result       *ForwardResult
-												fix(lint): 修复所有 Go 命名规范问题

- 全局替换 ApiKey → APIKey（类型、字段、方法、变量）
- 修复所有 initialism 命名（API, SMTP, HTML, URL 等）
- 添加所有缺失的包注释
- 修复导出符号的注释格式

主要修改：
- ApiKey → APIKey（所有出现的地方）
- ApiKeyID → APIKeyID
- ApiKeyIDs → APIKeyIDs
- TestSmtpConnection → TestSMTPConnection
- HtmlURL → HTMLURL
- 添加 20+ 个包注释
- 修复 10+ 个导出符号注释格式

验证结果：
- ✓ golangci-lint: 0 issues
- ✓ 单元测试: 通过
- ✓ 集成测试: 通过

											
										
										
											2026-01-04 19:27:53 +08:00
+									APIKey       *APIKey
-												refactor: 调整项目结构为单向依赖

											
										
										
											2025-12-26 15:40:24 +08:00
+									User         *User
 									Account      *Account
 									Subscription *UserSubscription // 可选：订阅信息
-												feat(usage-log): 增加请求 User-Agent 记录

在使用记录中添加 user_agent 字段，用于记录 API 请求的 User-Agent 头信息，
便于分析客户端类型和调试。

变更内容：
- 新增数据库迁移 028_add_usage_logs_user_agent.sql
- 更新 UsageLog 模型和 Ent Schema 添加 user_agent 字段
- 更新 Repository 层的 Create 和 scanUsageLog 方法
- 更新 RecordUsageInput 结构体支持传入 UserAgent
- 更新 Claude/OpenAI/Gemini 三个网关 Handler 传递 UserAgent

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>

											
										
										
											2026-01-06 16:23:56 +08:00
+									UserAgent    string            // 请求的 User-Agent
-												feat(api-key): 添加 IP 白名单/黑名单限制功能 (#221)

* feat(api-key): add IP whitelist/blacklist restriction and usage log IP tracking

- Add IP restriction feature for API keys (whitelist/blacklist with CIDR support)
- Add IP address logging to usage logs (admin-only visibility)
- Remove billing_type column from usage logs UI (redundant)
- Use generic "Access denied" error message for security

Backend:
- New ip package with IP/CIDR validation and matching utilities
- Database migrations for ip_whitelist, ip_blacklist (api_keys) and ip_address (usage_logs)
- Middleware IP restriction check after API key validation
- Input validation for IP/CIDR patterns on create/update

Frontend:
- API key form with enable toggle for IP restriction
- Shield icon indicator in table for keys with IP restriction
- Removed billing_type filter and column from usage views

* fix: update API contract tests for ip_whitelist/ip_blacklist fields

Add ip_whitelist and ip_blacklist fields to expected JSON responses
in API contract tests to match the new API key schema.
											
										
										
											2026-01-09 21:59:32 +08:00
+									IPAddress    string            // 请求的客户端 IP 地址
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+								}
 								// RecordUsage 记录使用量并扣费（或更新订阅用量）
 								func (s *GatewayService) RecordUsage(ctx context.Context, input *RecordUsageInput) error {
 									result := input.Result
-												fix(lint): 修复所有 Go 命名规范问题

- 全局替换 ApiKey → APIKey（类型、字段、方法、变量）
- 修复所有 initialism 命名（API, SMTP, HTML, URL 等）
- 添加所有缺失的包注释
- 修复导出符号的注释格式

主要修改：
- ApiKey → APIKey（所有出现的地方）
- ApiKeyID → APIKeyID
- ApiKeyIDs → APIKeyIDs
- TestSmtpConnection → TestSMTPConnection
- HtmlURL → HTMLURL
- 添加 20+ 个包注释
- 修复 10+ 个导出符号注释格式

验证结果：
- ✓ golangci-lint: 0 issues
- ✓ 单元测试: 通过
- ✓ 集成测试: 通过

											
										
										
											2026-01-04 19:27:53 +08:00
+									apiKey := input.APIKey
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									user := input.User
 									account := input.Account
 									subscription := input.Subscription
 									// 获取费率倍数
 									multiplier := s.cfg.Default.RateMultiplier
 									if apiKey.GroupID != nil && apiKey.Group != nil {
 										multiplier = apiKey.Group.RateMultiplier
 									}
-												feat: 图片生成计费功能

- 新增 Group 图片价格配置（image_price_1k/2k/4k）
- BillingService 新增 CalculateImageCost 方法
- AntigravityGatewayService 支持识别图片生成模型并按次计费
- UsageLog 新增 image_count 和 image_size 字段
- 前端分组管理支持配置图片价格（antigravity 和 gemini 平台）
- 图片计费复用通用计费能力（余额检查、扣费、倍率、订阅限额）

											
										
										
											2026-01-05 17:07:29 +08:00
+									var cost *CostBreakdown
 									// 根据请求类型选择计费方式
 									if result.ImageCount > 0 {
 										// 图片生成计费
 										var groupConfig *ImagePriceConfig
 										if apiKey.Group != nil {
 											groupConfig = &ImagePriceConfig{
 												Price1K: apiKey.Group.ImagePrice1K,
 												Price2K: apiKey.Group.ImagePrice2K,
 												Price4K: apiKey.Group.ImagePrice4K,
 											}
 										}
 										cost = s.billingService.CalculateImageCost(result.Model, result.ImageSize, result.ImageCount, groupConfig, multiplier)
 									} else {
 										// Token 计费
 										tokens := UsageTokens{
 											InputTokens:         result.Usage.InputTokens,
 											OutputTokens:        result.Usage.OutputTokens,
 											CacheCreationTokens: result.Usage.CacheCreationInputTokens,
 											CacheReadTokens:     result.Usage.CacheReadInputTokens,
 										}
 										var err error
 										cost, err = s.billingService.CalculateCost(result.Model, tokens, multiplier)
 										if err != nil {
 											log.Printf("Calculate cost failed: %v", err)
 											cost = &CostBreakdown{ActualCost: 0}
 										}
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									}
 									// 判断计费方式：订阅模式 vs 余额模式
 									isSubscriptionBilling := subscription != nil && apiKey.Group != nil && apiKey.Group.IsSubscriptionType()
-												refactor: 调整项目结构为单向依赖

											
										
										
											2025-12-26 15:40:24 +08:00
+									billingType := BillingTypeBalance
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									if isSubscriptionBilling {
-												refactor: 调整项目结构为单向依赖

											
										
										
											2025-12-26 15:40:24 +08:00
+										billingType = BillingTypeSubscription
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									}
 									// 创建使用日志
 									durationMs := int(result.Duration.Milliseconds())
-												feat: 图片生成计费功能

- 新增 Group 图片价格配置（image_price_1k/2k/4k）
- BillingService 新增 CalculateImageCost 方法
- AntigravityGatewayService 支持识别图片生成模型并按次计费
- UsageLog 新增 image_count 和 image_size 字段
- 前端分组管理支持配置图片价格（antigravity 和 gemini 平台）
- 图片计费复用通用计费能力（余额检查、扣费、倍率、订阅限额）

											
										
										
											2026-01-05 17:07:29 +08:00
+									var imageSize *string
 									if result.ImageSize != "" {
 										imageSize = &result.ImageSize
 									}
-												feat: merge dev

											
										
										
											2026-01-15 15:14:44 +08:00
+									accountRateMultiplier := account.BillingRateMultiplier()
-												refactor: 调整项目结构为单向依赖

											
										
										
											2025-12-26 15:40:24 +08:00
+									usageLog := &UsageLog{
-												feat: merge dev

											
										
										
											2026-01-15 15:14:44 +08:00
+										UserID:                user.ID,
 										APIKeyID:              apiKey.ID,
 										AccountID:             account.ID,
 										RequestID:             result.RequestID,
 										Model:                 result.Model,
 										InputTokens:           result.Usage.InputTokens,
 										OutputTokens:          result.Usage.OutputTokens,
 										CacheCreationTokens:   result.Usage.CacheCreationInputTokens,
 										CacheReadTokens:       result.Usage.CacheReadInputTokens,
 										InputCost:             cost.InputCost,
 										OutputCost:            cost.OutputCost,
 										CacheCreationCost:     cost.CacheCreationCost,
 										CacheReadCost:         cost.CacheReadCost,
 										TotalCost:             cost.TotalCost,
 										ActualCost:            cost.ActualCost,
 										RateMultiplier:        multiplier,
 										AccountRateMultiplier: &accountRateMultiplier,
 										BillingType:           billingType,
 										Stream:                result.Stream,
 										DurationMs:            &durationMs,
 										FirstTokenMs:          result.FirstTokenMs,
 										ImageCount:            result.ImageCount,
 										ImageSize:             imageSize,
 										CreatedAt:             time.Now(),
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									}
-												feat(usage-log): 增加请求 User-Agent 记录

在使用记录中添加 user_agent 字段，用于记录 API 请求的 User-Agent 头信息，
便于分析客户端类型和调试。

变更内容：
- 新增数据库迁移 028_add_usage_logs_user_agent.sql
- 更新 UsageLog 模型和 Ent Schema 添加 user_agent 字段
- 更新 Repository 层的 Create 和 scanUsageLog 方法
- 更新 RecordUsageInput 结构体支持传入 UserAgent
- 更新 Claude/OpenAI/Gemini 三个网关 Handler 传递 UserAgent

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>

											
										
										
											2026-01-06 16:23:56 +08:00
+									// 添加 UserAgent
 									if input.UserAgent != "" {
 										usageLog.UserAgent = &input.UserAgent
 									}
-												feat(api-key): 添加 IP 白名单/黑名单限制功能 (#221)

* feat(api-key): add IP whitelist/blacklist restriction and usage log IP tracking

- Add IP restriction feature for API keys (whitelist/blacklist with CIDR support)
- Add IP address logging to usage logs (admin-only visibility)
- Remove billing_type column from usage logs UI (redundant)
- Use generic "Access denied" error message for security

Backend:
- New ip package with IP/CIDR validation and matching utilities
- Database migrations for ip_whitelist, ip_blacklist (api_keys) and ip_address (usage_logs)
- Middleware IP restriction check after API key validation
- Input validation for IP/CIDR patterns on create/update

Frontend:
- API key form with enable toggle for IP restriction
- Shield icon indicator in table for keys with IP restriction
- Removed billing_type filter and column from usage views

* fix: update API contract tests for ip_whitelist/ip_blacklist fields

Add ip_whitelist and ip_blacklist fields to expected JSON responses
in API contract tests to match the new API key schema.
											
										
										
											2026-01-09 21:59:32 +08:00
+									// 添加 IPAddress
 									if input.IPAddress != "" {
 										usageLog.IPAddress = &input.IPAddress
 									}
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									// 添加分组和订阅关联
 									if apiKey.GroupID != nil {
 										usageLog.GroupID = apiKey.GroupID
 									}
 									if subscription != nil {
 										usageLog.SubscriptionID = &subscription.ID
 									}
-												fix(gateway): 完善 thinking block 重试和 cache nil 检查

- 使用 FilterThinkingBlocksForRetry 替代 FilterThinkingBlocks
- count_tokens 增加 thinking block 签名错误重试
- cache nil 检查防止空指针
- shouldBill 逻辑修复避免重复扣费
- 移除 debug 日志

											
										
										
											2026-01-03 17:10:25 -08:00
+									inserted, err := s.usageLogRepo.Create(ctx, usageLog)
 									if err != nil {
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+										log.Printf("Create usage log failed: %v", err)
 									}
-												feat(全栈): 实现简易模式核心功能

**功能概述**：
实现简易模式(Simple Mode)，为个人用户和小团队提供简化的使用体验，隐藏复杂的分组、订阅、配额等概念。

**后端改动**：
1. 配置系统
   - 新增 run_mode 配置项（standard/simple）
   - 支持环境变量 RUN_MODE
   - 默认值为 standard

2. 数据库初始化
   - 自动创建3个默认分组：anthropic-default、openai-default、gemini-default
   - 默认分组配置：无并发限制、active状态、非独占
   - 幂等性保证：重复启动不会重复创建

3. 账号管理
   - 创建账号时自动绑定对应平台的默认分组
   - 如果未指定分组，自动查找并绑定默认分组

**前端改动**：
1. 状态管理
   - authStore 新增 isSimpleMode 计算属性
   - 从后端API获取并同步运行模式

2. UI隐藏
   - 侧边栏：隐藏分组管理、订阅管理、兑换码菜单
   - 账号管理页面：隐藏分组列
   - 创建/编辑账号对话框：隐藏分组选择器

3. 路由守卫
   - 限制访问分组、订阅、兑换码相关页面
   - 访问受限页面时自动重定向到仪表板

**配置示例**：
```yaml
run_mode: simple

run_mode: standard
```

**影响范围**：
- 后端：配置、数据库迁移、账号服务
- 前端：认证状态、路由、UI组件
- 部署：配置文件示例

**兼容性**：
- 简易模式和标准模式可无缝切换
- 不需要数据迁移
- 现有数据不受影响

											
										
										
											2025-12-29 03:17:25 +08:00
+									if s.cfg != nil && s.cfg.RunMode == config.RunModeSimple {
 										log.Printf("[SIMPLE MODE] Usage recorded (not billed): user=%d, tokens=%d", usageLog.UserID, usageLog.TotalTokens())
 										s.deferredService.ScheduleLastUsedUpdate(account.ID)
 										return nil
 									}
-												fix(gateway): 完善 thinking block 重试和 cache nil 检查

- 使用 FilterThinkingBlocksForRetry 替代 FilterThinkingBlocks
- count_tokens 增加 thinking block 签名错误重试
- cache nil 检查防止空指针
- shouldBill 逻辑修复避免重复扣费
- 移除 debug 日志

											
										
										
											2026-01-03 17:10:25 -08:00
+									shouldBill := inserted || err != nil
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									// 根据计费类型执行扣费
 									if isSubscriptionBilling {
 										// 订阅模式：更新订阅用量（使用 TotalCost 原始费用，不考虑倍率）
-												fix(gateway): 完善 thinking block 重试和 cache nil 检查

- 使用 FilterThinkingBlocksForRetry 替代 FilterThinkingBlocks
- count_tokens 增加 thinking block 签名错误重试
- cache nil 检查防止空指针
- shouldBill 逻辑修复避免重复扣费
- 移除 debug 日志

											
										
										
											2026-01-03 17:10:25 -08:00
+										if shouldBill && cost.TotalCost > 0 {
-												refactor(backend): 引入端口接口模式

											
										
										
											2025-12-19 21:26:19 +08:00
+											if err := s.userSubRepo.IncrementUsage(ctx, subscription.ID, cost.TotalCost); err != nil {
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+												log.Printf("Increment subscription usage failed: %v", err)
 											}
 											// 异步更新订阅缓存
-												perf(后端): 完成性能优化与连接池配置

新增 DB/Redis 连接池配置与校验，并补充单测

网关请求体大小限制与 413 处理

HTTP/req 客户端池化并调整上游连接池默认值

并发槽位改为 ZSET+Lua 与指数退避

用量统计改 SQL 聚合并新增索引迁移

计费缓存写入改工作池并补测试/基准

测试: 在 backend/ 下运行 go test ./...

											
										
										
											2025-12-31 08:50:12 +08:00
+											s.billingCacheService.QueueUpdateSubscriptionUsage(user.ID, *apiKey.GroupID, cost.TotalCost)
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+										}
 									} else {
 										// 余额模式：扣除用户余额（使用 ActualCost 考虑倍率后的费用）
-												fix(gateway): 完善 thinking block 重试和 cache nil 检查

- 使用 FilterThinkingBlocksForRetry 替代 FilterThinkingBlocks
- count_tokens 增加 thinking block 签名错误重试
- cache nil 检查防止空指针
- shouldBill 逻辑修复避免重复扣费
- 移除 debug 日志

											
										
										
											2026-01-03 17:10:25 -08:00
+										if shouldBill && cost.ActualCost > 0 {
-												refactor(backend): 引入端口接口模式

											
										
										
											2025-12-19 21:26:19 +08:00
+											if err := s.userRepo.DeductBalance(ctx, user.ID, cost.ActualCost); err != nil {
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+												log.Printf("Deduct balance failed: %v", err)
 											}
 											// 异步更新余额缓存
-												perf(后端): 完成性能优化与连接池配置

新增 DB/Redis 连接池配置与校验，并补充单测

网关请求体大小限制与 413 处理

HTTP/req 客户端池化并调整上游连接池默认值

并发槽位改为 ZSET+Lua 与指数退避

用量统计改 SQL 聚合并新增索引迁移

计费缓存写入改工作池并补测试/基准

测试: 在 backend/ 下运行 go test ./...

											
										
										
											2025-12-31 08:50:12 +08:00
+											s.billingCacheService.QueueDeductBalance(user.ID, cost.ActualCost)
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+										}
 									}
-												feat: Schedule batch update for account last_used_at

Implement deferred batch update mechanism to reduce database load:

- Add DeferredService for batching account last_used_at updates
- Add TimingWheelService for efficient recurring task scheduling
- Integrate with GatewayService and OpenAIGatewayService
- Implement BatchUpdateLastUsed repository method using CASE...WHEN SQL
- Fix golangci-lint error: Replace interface{} with any

Benefits:
- Reduces database writes by batching updates (10-second intervals)
- Improves request throughput by deferring non-critical updates
- Maintains accurate account usage tracking for scheduling

											
										
										
											2025-12-28 08:07:15 +08:00
+									// Schedule batch update for account last_used_at
 									s.deferredService.ScheduleLastUsedUpdate(account.ID)
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
 									return nil
 								}
-												feat(gateway): 添加 /v1/messages/count_tokens 端点

实现 Claude API 的 token 计数功能，支持 OAuth、SetupToken 和 ApiKey 三种账号类型。

特点：
- 校验订阅/余额（不扣费）
- 不计算用户和账号并发
- 不记录使用量
- 支持模型映射（ApiKey 账号）
- 支持 OAuth 账号的指纹管理和 401 重试

											
										
										
											2025-12-19 11:12:41 +08:00
-												feat(billing): 添加 Gemini 200K 长上下文双倍计费功能

- 新增 CalculateCostWithLongContext 方法支持阈值双倍计费
- 新增 RecordUsageWithLongContext 方法专用于 Gemini 计费
- Gemini 超过 200K token 的部分按 2 倍费率计算
- 其他平台（Claude/OpenAI）完全不受影响

											
										
										
											2026-02-02 16:37:22 +08:00
+								// RecordUsageLongContextInput 记录使用量的输入参数（支持长上下文双倍计费）
 								type RecordUsageLongContextInput struct {
 									Result                *ForwardResult
 									APIKey                *APIKey
 									User                  *User
 									Account               *Account
 									Subscription          *UserSubscription // 可选：订阅信息
 									UserAgent             string            // 请求的 User-Agent
 									IPAddress             string            // 请求的客户端 IP 地址
 									LongContextThreshold  int               // 长上下文阈值（如 200000）
 									LongContextMultiplier float64           // 超出阈值部分的倍率（如 2.0）
 								}
 								// RecordUsageWithLongContext 记录使用量并扣费，支持长上下文双倍计费（用于 Gemini）
 								func (s *GatewayService) RecordUsageWithLongContext(ctx context.Context, input *RecordUsageLongContextInput) error {
 									result := input.Result
 									apiKey := input.APIKey
 									user := input.User
 									account := input.Account
 									subscription := input.Subscription
 									// 获取费率倍数
 									multiplier := s.cfg.Default.RateMultiplier
 									if apiKey.GroupID != nil && apiKey.Group != nil {
 										multiplier = apiKey.Group.RateMultiplier
 									}
 									var cost *CostBreakdown
 									// 根据请求类型选择计费方式
 									if result.ImageCount > 0 {
 										// 图片生成计费
 										var groupConfig *ImagePriceConfig
 										if apiKey.Group != nil {
 											groupConfig = &ImagePriceConfig{
 												Price1K: apiKey.Group.ImagePrice1K,
 												Price2K: apiKey.Group.ImagePrice2K,
 												Price4K: apiKey.Group.ImagePrice4K,
 											}
 										}
 										cost = s.billingService.CalculateImageCost(result.Model, result.ImageSize, result.ImageCount, groupConfig, multiplier)
 									} else {
 										// Token 计费（使用长上下文计费方法）
 										tokens := UsageTokens{
 											InputTokens:         result.Usage.InputTokens,
 											OutputTokens:        result.Usage.OutputTokens,
 											CacheCreationTokens: result.Usage.CacheCreationInputTokens,
 											CacheReadTokens:     result.Usage.CacheReadInputTokens,
 										}
 										var err error
 										cost, err = s.billingService.CalculateCostWithLongContext(result.Model, tokens, multiplier, input.LongContextThreshold, input.LongContextMultiplier)
 										if err != nil {
 											log.Printf("Calculate cost failed: %v", err)
 											cost = &CostBreakdown{ActualCost: 0}
 										}
 									}
 									// 判断计费方式：订阅模式 vs 余额模式
 									isSubscriptionBilling := subscription != nil && apiKey.Group != nil && apiKey.Group.IsSubscriptionType()
 									billingType := BillingTypeBalance
 									if isSubscriptionBilling {
 										billingType = BillingTypeSubscription
 									}
 									// 创建使用日志
 									durationMs := int(result.Duration.Milliseconds())
 									var imageSize *string
 									if result.ImageSize != "" {
 										imageSize = &result.ImageSize
 									}
 									accountRateMultiplier := account.BillingRateMultiplier()
 									usageLog := &UsageLog{
 										UserID:                user.ID,
 										APIKeyID:              apiKey.ID,
 										AccountID:             account.ID,
-												feat: merge dev

											
										
										
											2026-01-15 15:14:44 +08:00
+										RequestID:             result.RequestID,
 										Model:                 result.Model,
 										InputTokens:           result.Usage.InputTokens,
 										OutputTokens:          result.Usage.OutputTokens,
 										CacheCreationTokens:   result.Usage.CacheCreationInputTokens,
 										CacheReadTokens:       result.Usage.CacheReadInputTokens,
 										InputCost:             cost.InputCost,
 										OutputCost:            cost.OutputCost,
 										CacheCreationCost:     cost.CacheCreationCost,
 										CacheReadCost:         cost.CacheReadCost,
 										TotalCost:             cost.TotalCost,
 										ActualCost:            cost.ActualCost,
 										RateMultiplier:        multiplier,
 										AccountRateMultiplier: &accountRateMultiplier,
 										BillingType:           billingType,
 										Stream:                result.Stream,
 										DurationMs:            &durationMs,
 										FirstTokenMs:          result.FirstTokenMs,
 										ImageCount:            result.ImageCount,
 										ImageSize:             imageSize,
 										CreatedAt:             time.Now(),
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									}
-												feat(usage-log): 增加请求 User-Agent 记录

在使用记录中添加 user_agent 字段，用于记录 API 请求的 User-Agent 头信息，
便于分析客户端类型和调试。

变更内容：
- 新增数据库迁移 028_add_usage_logs_user_agent.sql
- 更新 UsageLog 模型和 Ent Schema 添加 user_agent 字段
- 更新 Repository 层的 Create 和 scanUsageLog 方法
- 更新 RecordUsageInput 结构体支持传入 UserAgent
- 更新 Claude/OpenAI/Gemini 三个网关 Handler 传递 UserAgent

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>

											
										
										
											2026-01-06 16:23:56 +08:00
+									// 添加 UserAgent
 									if input.UserAgent != "" {
 										usageLog.UserAgent = &input.UserAgent
 									}
-												feat(api-key): 添加 IP 白名单/黑名单限制功能 (#221)

* feat(api-key): add IP whitelist/blacklist restriction and usage log IP tracking

- Add IP restriction feature for API keys (whitelist/blacklist with CIDR support)
- Add IP address logging to usage logs (admin-only visibility)
- Remove billing_type column from usage logs UI (redundant)
- Use generic "Access denied" error message for security

Backend:
- New ip package with IP/CIDR validation and matching utilities
- Database migrations for ip_whitelist, ip_blacklist (api_keys) and ip_address (usage_logs)
- Middleware IP restriction check after API key validation
- Input validation for IP/CIDR patterns on create/update

Frontend:
- API key form with enable toggle for IP restriction
- Shield icon indicator in table for keys with IP restriction
- Removed billing_type filter and column from usage views

* fix: update API contract tests for ip_whitelist/ip_blacklist fields

Add ip_whitelist and ip_blacklist fields to expected JSON responses
in API contract tests to match the new API key schema.
											
										
										
											2026-01-09 21:59:32 +08:00
+									// 添加 IPAddress
 									if input.IPAddress != "" {
 										usageLog.IPAddress = &input.IPAddress
 									}
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									// 添加分组和订阅关联
 									if apiKey.GroupID != nil {
 										usageLog.GroupID = apiKey.GroupID
 									}
 									if subscription != nil {
 										usageLog.SubscriptionID = &subscription.ID
 									}
-												fix(gateway): 完善 thinking block 重试和 cache nil 检查

- 使用 FilterThinkingBlocksForRetry 替代 FilterThinkingBlocks
- count_tokens 增加 thinking block 签名错误重试
- cache nil 检查防止空指针
- shouldBill 逻辑修复避免重复扣费
- 移除 debug 日志

											
										
										
											2026-01-03 17:10:25 -08:00
+									inserted, err := s.usageLogRepo.Create(ctx, usageLog)
 									if err != nil {
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+										log.Printf("Create usage log failed: %v", err)
 									}
-												feat(全栈): 实现简易模式核心功能

**功能概述**：
实现简易模式(Simple Mode)，为个人用户和小团队提供简化的使用体验，隐藏复杂的分组、订阅、配额等概念。

**后端改动**：
1. 配置系统
   - 新增 run_mode 配置项（standard/simple）
   - 支持环境变量 RUN_MODE
   - 默认值为 standard

2. 数据库初始化
   - 自动创建3个默认分组：anthropic-default、openai-default、gemini-default
   - 默认分组配置：无并发限制、active状态、非独占
   - 幂等性保证：重复启动不会重复创建

3. 账号管理
   - 创建账号时自动绑定对应平台的默认分组
   - 如果未指定分组，自动查找并绑定默认分组

**前端改动**：
1. 状态管理
   - authStore 新增 isSimpleMode 计算属性
   - 从后端API获取并同步运行模式

2. UI隐藏
   - 侧边栏：隐藏分组管理、订阅管理、兑换码菜单
   - 账号管理页面：隐藏分组列
   - 创建/编辑账号对话框：隐藏分组选择器

3. 路由守卫
   - 限制访问分组、订阅、兑换码相关页面
   - 访问受限页面时自动重定向到仪表板

**配置示例**：
```yaml
run_mode: simple

run_mode: standard
```

**影响范围**：
- 后端：配置、数据库迁移、账号服务
- 前端：认证状态、路由、UI组件
- 部署：配置文件示例

**兼容性**：
- 简易模式和标准模式可无缝切换
- 不需要数据迁移
- 现有数据不受影响

											
										
										
											2025-12-29 03:17:25 +08:00
+									if s.cfg != nil && s.cfg.RunMode == config.RunModeSimple {
 										log.Printf("[SIMPLE MODE] Usage recorded (not billed): user=%d, tokens=%d", usageLog.UserID, usageLog.TotalTokens())
 										s.deferredService.ScheduleLastUsedUpdate(account.ID)
 										return nil
 									}
-												fix(gateway): 完善 thinking block 重试和 cache nil 检查

- 使用 FilterThinkingBlocksForRetry 替代 FilterThinkingBlocks
- count_tokens 增加 thinking block 签名错误重试
- cache nil 检查防止空指针
- shouldBill 逻辑修复避免重复扣费
- 移除 debug 日志

											
										
										
											2026-01-03 17:10:25 -08:00
+									shouldBill := inserted || err != nil
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+									// 根据计费类型执行扣费
 									if isSubscriptionBilling {
 										// 订阅模式：更新订阅用量（使用 TotalCost 原始费用，不考虑倍率）
-												fix(gateway): 完善 thinking block 重试和 cache nil 检查

- 使用 FilterThinkingBlocksForRetry 替代 FilterThinkingBlocks
- count_tokens 增加 thinking block 签名错误重试
- cache nil 检查防止空指针
- shouldBill 逻辑修复避免重复扣费
- 移除 debug 日志

											
										
										
											2026-01-03 17:10:25 -08:00
+										if shouldBill && cost.TotalCost > 0 {
-												refactor(backend): 引入端口接口模式

											
										
										
											2025-12-19 21:26:19 +08:00
+											if err := s.userSubRepo.IncrementUsage(ctx, subscription.ID, cost.TotalCost); err != nil {
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+												log.Printf("Increment subscription usage failed: %v", err)
 											}
 											// 异步更新订阅缓存
-												perf(后端): 完成性能优化与连接池配置

新增 DB/Redis 连接池配置与校验，并补充单测

网关请求体大小限制与 413 处理

HTTP/req 客户端池化并调整上游连接池默认值

并发槽位改为 ZSET+Lua 与指数退避

用量统计改 SQL 聚合并新增索引迁移

计费缓存写入改工作池并补测试/基准

测试: 在 backend/ 下运行 go test ./...

											
										
										
											2025-12-31 08:50:12 +08:00
+											s.billingCacheService.QueueUpdateSubscriptionUsage(user.ID, *apiKey.GroupID, cost.TotalCost)
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+										}
 									} else {
 										// 余额模式：扣除用户余额（使用 ActualCost 考虑倍率后的费用）
-												fix(gateway): 完善 thinking block 重试和 cache nil 检查

- 使用 FilterThinkingBlocksForRetry 替代 FilterThinkingBlocks
- count_tokens 增加 thinking block 签名错误重试
- cache nil 检查防止空指针
- shouldBill 逻辑修复避免重复扣费
- 移除 debug 日志

											
										
										
											2026-01-03 17:10:25 -08:00
+										if shouldBill && cost.ActualCost > 0 {
-												refactor(backend): 引入端口接口模式

											
										
										
											2025-12-19 21:26:19 +08:00
+											if err := s.userRepo.DeductBalance(ctx, user.ID, cost.ActualCost); err != nil {
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+												log.Printf("Deduct balance failed: %v", err)
 											}
 											// 异步更新余额缓存
-												perf(后端): 完成性能优化与连接池配置

新增 DB/Redis 连接池配置与校验，并补充单测

网关请求体大小限制与 413 处理

HTTP/req 客户端池化并调整上游连接池默认值

并发槽位改为 ZSET+Lua 与指数退避

用量统计改 SQL 聚合并新增索引迁移

计费缓存写入改工作池并补测试/基准

测试: 在 backend/ 下运行 go test ./...

											
										
										
											2025-12-31 08:50:12 +08:00
+											s.billingCacheService.QueueDeductBalance(user.ID, cost.ActualCost)
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
+										}
 									}
-												feat: Schedule batch update for account last_used_at

Implement deferred batch update mechanism to reduce database load:

- Add DeferredService for batching account last_used_at updates
- Add TimingWheelService for efficient recurring task scheduling
- Integrate with GatewayService and OpenAIGatewayService
- Implement BatchUpdateLastUsed repository method using CASE...WHEN SQL
- Fix golangci-lint error: Replace interface{} with any

Benefits:
- Reduces database writes by batching updates (10-second intervals)
- Improves request throughput by deferring non-critical updates
- Maintains accurate account usage tracking for scheduling

											
										
										
											2025-12-28 08:07:15 +08:00
+									// Schedule batch update for account last_used_at
 									s.deferredService.ScheduleLastUsedUpdate(account.ID)
-												First commit

											
										
										
											2025-12-18 13:50:39 +08:00
 									return nil
 								}
-												feat(gateway): 添加 /v1/messages/count_tokens 端点

实现 Claude API 的 token 计数功能，支持 OAuth、SetupToken 和 ApiKey 三种账号类型。

特点：
- 校验订阅/余额（不扣费）
- 不计算用户和账号并发
- 不记录使用量
- 支持模型映射（ApiKey 账号）
- 支持 OAuth 账号的指纹管理和 401 重试

											
										
										
											2025-12-19 11:12:41 +08:00
 								// ForwardCountTokens 转发 count_tokens 请求到上游 API
 								// 特点：不记录使用量、仅支持非流式响应
-												perf(后端): 完成性能优化与连接池配置

新增 DB/Redis 连接池配置与校验，并补充单测

网关请求体大小限制与 413 处理

HTTP/req 客户端池化并调整上游连接池默认值

并发槽位改为 ZSET+Lua 与指数退避

用量统计改 SQL 聚合并新增索引迁移

计费缓存写入改工作池并补测试/基准

测试: 在 backend/ 下运行 go test ./...

											
										
										
											2025-12-31 08:50:12 +08:00
+								func (s *GatewayService) ForwardCountTokens(ctx context.Context, c *gin.Context, account *Account, parsed *ParsedRequest) error {
 									if parsed == nil {
 										s.countTokensError(c, http.StatusBadRequest, "invalid_request_error", "Request body is empty")
 										return fmt.Errorf("parse request: empty request")
 									}
 									body := parsed.Body
 									reqModel := parsed.Model
-												fix(网关): 区分 Claude Code OAuth 适配

											
										
										
											2026-01-15 19:17:07 +08:00
+									isClaudeCode := isClaudeCodeRequest(ctx, c, parsed)
 									shouldMimicClaudeCode := account.IsOAuth() && !isClaudeCode
 									if shouldMimicClaudeCode {
-												fix(网关): 对齐 Claude OAuth 请求适配

											
										
										
											2026-01-15 18:54:42 +08:00
+										normalizeOpts := claudeOAuthNormalizeOptions{stripSystemCacheControl: true}
 										body, reqModel, _ = normalizeClaudeOAuthRequestBody(body, reqModel, normalizeOpts)
 									}
-												perf(gateway): 优化负载感知调度

主要改进：
- 优化负载感知调度的准确性和响应速度
- 将 AccountUsageService 的包级缓存改为依赖注入
- 修复 SSE/JSON 转义和 nil 安全问题
- 恢复 Google One 功能兼容性

											
										
										
											2026-01-03 06:32:51 -08:00
+									// Antigravity 账户不支持 count_tokens 转发，直接返回空值
-												fix(gateway): Antigravity 账户 count_tokens 返回估算值

Antigravity 不支持 count_tokens 转发，直接返回估算值，
与 Antigravity-Manager 和 proxycast 实现保持一致。

修复 count_tokens 请求选择到 Antigravity 账户时导致 401 的问题。

											
										
										
											2025-12-28 21:56:52 +08:00
+									if account.Platform == PlatformAntigravity {
-												perf(gateway): 优化负载感知调度

主要改进：
- 优化负载感知调度的准确性和响应速度
- 将 AccountUsageService 的包级缓存改为依赖注入
- 修复 SSE/JSON 转义和 nil 安全问题
- 恢复 Google One 功能兼容性

											
										
										
											2026-01-03 06:32:51 -08:00
+										c.JSON(http.StatusOK, gin.H{"input_tokens": 0})
-												fix(gateway): Antigravity 账户 count_tokens 返回估算值

Antigravity 不支持 count_tokens 转发，直接返回估算值，
与 Antigravity-Manager 和 proxycast 实现保持一致。

修复 count_tokens 请求选择到 Antigravity 账户时导致 401 的问题。

											
										
										
											2025-12-28 21:56:52 +08:00
+										return nil
 									}
-												Add invalid-request fallback routing

											
										
										
											2026-01-23 22:24:46 +08:00
+									// 应用模型映射（APIKey 明确映射优先，其次使用 Anthropic 前缀映射）
 									if reqModel != "" {
 										mappedModel := reqModel
 										mappingSource := ""
 										if account.Type == AccountTypeAPIKey {
 											mappedModel = account.GetMappedModel(reqModel)
-												perf(后端): 完成性能优化与连接池配置

新增 DB/Redis 连接池配置与校验，并补充单测

网关请求体大小限制与 413 处理

HTTP/req 客户端池化并调整上游连接池默认值

并发槽位改为 ZSET+Lua 与指数退避

用量统计改 SQL 聚合并新增索引迁移

计费缓存写入改工作池并补测试/基准

测试: 在 backend/ 下运行 go test ./...

											
										
										
											2025-12-31 08:50:12 +08:00
+											if mappedModel != reqModel {
-												Add invalid-request fallback routing

											
										
										
											2026-01-23 22:24:46 +08:00
+												mappingSource = "account"
 											}
 										}
 										if mappingSource == "" && account.Platform == PlatformAnthropic {
 											normalized := normalizeClaudeModelForAnthropic(reqModel)
 											if normalized != reqModel {
 												mappedModel = normalized
 												mappingSource = "prefix"
-												feat(gateway): 添加 /v1/messages/count_tokens 端点

实现 Claude API 的 token 计数功能，支持 OAuth、SetupToken 和 ApiKey 三种账号类型。

特点：
- 校验订阅/余额（不扣费）
- 不计算用户和账号并发
- 不记录使用量
- 支持模型映射（ApiKey 账号）
- 支持 OAuth 账号的指纹管理和 401 重试

											
										
										
											2025-12-19 11:12:41 +08:00
+											}
 										}
-												Add invalid-request fallback routing

											
										
										
											2026-01-23 22:24:46 +08:00
+										if mappedModel != reqModel {
 											body = s.replaceModelInBody(body, mappedModel)
 											reqModel = mappedModel
 											log.Printf("CountTokens model mapping applied: %s -> %s (account: %s, source=%s)", parsed.Model, mappedModel, account.Name, mappingSource)
 										}
-												feat(gateway): 添加 /v1/messages/count_tokens 端点

实现 Claude API 的 token 计数功能，支持 OAuth、SetupToken 和 ApiKey 三种账号类型。

特点：
- 校验订阅/余额（不扣费）
- 不计算用户和账号并发
- 不记录使用量
- 支持模型映射（ApiKey 账号）
- 支持 OAuth 账号的指纹管理和 401 重试

											
										
										
											2025-12-19 11:12:41 +08:00
+									}
 									// 获取凭证
 									token, tokenType, err := s.GetAccessToken(ctx, account)
 									if err != nil {
 										s.countTokensError(c, http.StatusBadGateway, "upstream_error", "Failed to get access token")
 										return err
 									}
 									// 构建上游请求
-												fix(网关): 区分 Claude Code OAuth 适配

											
										
										
											2026-01-15 19:17:07 +08:00
+									upstreamReq, err := s.buildCountTokensRequest(ctx, c, account, body, token, tokenType, reqModel, shouldMimicClaudeCode)
-												feat(gateway): 添加 /v1/messages/count_tokens 端点

实现 Claude API 的 token 计数功能，支持 OAuth、SetupToken 和 ApiKey 三种账号类型。

特点：
- 校验订阅/余额（不扣费）
- 不计算用户和账号并发
- 不记录使用量
- 支持模型映射（ApiKey 账号）
- 支持 OAuth 账号的指纹管理和 401 重试

											
										
										
											2025-12-19 11:12:41 +08:00
+									if err != nil {
 										s.countTokensError(c, http.StatusInternalServerError, "api_error", "Failed to build request")
 										return err
 									}
-												refactor(backend): service http ports

											
										
										
											2025-12-20 11:56:11 +08:00
+									// 获取代理URL
 									proxyURL := ""
 									if account.ProxyID != nil && account.Proxy != nil {
 										proxyURL = account.Proxy.URL()
-												feat(gateway): 添加 /v1/messages/count_tokens 端点

实现 Claude API 的 token 计数功能，支持 OAuth、SetupToken 和 ApiKey 三种账号类型。

特点：
- 校验订阅/余额（不扣费）
- 不计算用户和账号并发
- 不记录使用量
- 支持模型映射（ApiKey 账号）
- 支持 OAuth 账号的指纹管理和 401 重试

											
										
										
											2025-12-19 11:12:41 +08:00
+									}
 									// 发送请求
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+									resp, err := s.httpUpstream.DoWithTLS(upstreamReq, proxyURL, account.ID, account.Concurrency, account.IsTLSFingerprintEnabled())
-												feat(gateway): 添加 /v1/messages/count_tokens 端点

实现 Claude API 的 token 计数功能，支持 OAuth、SetupToken 和 ApiKey 三种账号类型。

特点：
- 校验订阅/余额（不扣费）
- 不计算用户和账号并发
- 不记录使用量
- 支持模型映射（ApiKey 账号）
- 支持 OAuth 账号的指纹管理和 401 重试

											
										
										
											2025-12-19 11:12:41 +08:00
+									if err != nil {
-												feat(ops): 实现上游错误事件记录与查询功能

**新增功能**:
- 新建ops_upstream_error_events表存储上游服务错误详情
- 支持记录上游429/529/5xx错误的详细上下文信息
- 提供按时间范围查询上游错误事件的API

**后端改动**:
1. 模型层（ops_models.go, ops_port.go）:
   - 新增UpstreamErrorEvent结构体
   - 扩展Repository接口支持上游错误事件CRUD

2. 仓储层（ops_repo.go）:
   - 实现InsertUpstreamErrorEvent写入上游错误
   - 实现GetUpstreamErrorEvents按时间范围查询

3. 服务层（ops_service.go, ops_upstream_context.go）:
   - ops_service: 新增GetUpstreamErrorEvents查询方法
   - ops_upstream_context: 封装上游错误上下文构建逻辑

4. Handler层（ops_error_logger.go）:
   - 新增GetUpstreamErrorsHandler处理上游错误查询请求

5. Gateway层集成:
   - antigravity_gateway_service.go: 429/529错误时记录上游事件
   - gateway_service.go: OpenAI 429/5xx错误时记录
   - gemini_messages_compat_service.go: Gemini 429/5xx错误时记录
   - openai_gateway_service.go: OpenAI 429/5xx错误时记录
   - ratelimit_service.go: 429限流错误时记录

**数据记录字段**:
- request_id: 关联ops_logs主记录
- platform/model: 上游服务标识
- status_code/error_message: 错误详情
- request_headers/response_body: 调试信息（可选）
- created_at: 错误发生时间

											
										
										
											2026-01-11 15:30:27 +08:00
+										setOpsUpstreamError(c, 0, sanitizeUpstreamErrorMessage(err.Error()), "")
-												feat(gateway): 添加 /v1/messages/count_tokens 端点

实现 Claude API 的 token 计数功能，支持 OAuth、SetupToken 和 ApiKey 三种账号类型。

特点：
- 校验订阅/余额（不扣费）
- 不计算用户和账号并发
- 不记录使用量
- 支持模型映射（ApiKey 账号）
- 支持 OAuth 账号的指纹管理和 401 重试

											
										
										
											2025-12-19 11:12:41 +08:00
+										s.countTokensError(c, http.StatusBadGateway, "upstream_error", "Request failed")
 										return fmt.Errorf("upstream request failed: %w", err)
 									}
 									// 读取响应体
 									respBody, err := io.ReadAll(resp.Body)
-												fix(gateway): 完善 thinking block 重试和 cache nil 检查

- 使用 FilterThinkingBlocksForRetry 替代 FilterThinkingBlocks
- count_tokens 增加 thinking block 签名错误重试
- cache nil 检查防止空指针
- shouldBill 逻辑修复避免重复扣费
- 移除 debug 日志

											
										
										
											2026-01-03 17:10:25 -08:00
+									_ = resp.Body.Close()
-												feat(gateway): 添加 /v1/messages/count_tokens 端点

实现 Claude API 的 token 计数功能，支持 OAuth、SetupToken 和 ApiKey 三种账号类型。

特点：
- 校验订阅/余额（不扣费）
- 不计算用户和账号并发
- 不记录使用量
- 支持模型映射（ApiKey 账号）
- 支持 OAuth 账号的指纹管理和 401 重试

											
										
										
											2025-12-19 11:12:41 +08:00
+									if err != nil {
 										s.countTokensError(c, http.StatusBadGateway, "upstream_error", "Failed to read response")
 										return err
 									}
-												fix(gateway): 完善 thinking block 重试和 cache nil 检查

- 使用 FilterThinkingBlocksForRetry 替代 FilterThinkingBlocks
- count_tokens 增加 thinking block 签名错误重试
- cache nil 检查防止空指针
- shouldBill 逻辑修复避免重复扣费
- 移除 debug 日志

											
										
										
											2026-01-03 17:10:25 -08:00
+									// 检测 thinking block 签名错误（400）并重试一次（过滤 thinking blocks）
 									if resp.StatusCode == 400 && s.isThinkingBlockSignatureError(respBody) {
 										log.Printf("Account %d: detected thinking block signature error on count_tokens, retrying with filtered thinking blocks", account.ID)
-												fix(backend): 改进 thinking/tool block 签名处理和重试策略

主要改动：
- request_transformer: thinking block 缺少签名时降级为文本而非丢弃，保留内容并在上层禁用 thinking mode
- antigravity_gateway_service: 新增两阶段降级策略，先处理 thinking blocks，如仍失败且涉及 tool 签名错误则进一步降级 tool blocks
- gateway_request: 新增 FilterSignatureSensitiveBlocksForRetry 函数，支持将 tool_use/tool_result 降级为文本
- gateway_request: 改进 FilterThinkingBlocksForRetry，禁用顶层 thinking 配置以避免结构约束冲突
- gateway_service: 实现保守的两阶段重试逻辑，优先保留内容，仅在必要时降级工具调用
- 新增 antigravity_gateway_service_test.go 测试签名块剥离逻辑
- 更新相关测试用例以验证降级行为

此修复解决了跨平台/账户切换时历史消息签名失效导致的请求失败问题。

											
										
										
											2026-01-04 22:32:36 +08:00
+										filteredBody := FilterThinkingBlocksForRetry(body)
-												fix(网关): 区分 Claude Code OAuth 适配

											
										
										
											2026-01-15 19:17:07 +08:00
+										retryReq, buildErr := s.buildCountTokensRequest(ctx, c, account, filteredBody, token, tokenType, reqModel, shouldMimicClaudeCode)
-												fix(gateway): 完善 thinking block 重试和 cache nil 检查

- 使用 FilterThinkingBlocksForRetry 替代 FilterThinkingBlocks
- count_tokens 增加 thinking block 签名错误重试
- cache nil 检查防止空指针
- shouldBill 逻辑修复避免重复扣费
- 移除 debug 日志

											
										
										
											2026-01-03 17:10:25 -08:00
+										if buildErr == nil {
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+											retryResp, retryErr := s.httpUpstream.DoWithTLS(retryReq, proxyURL, account.ID, account.Concurrency, account.IsTLSFingerprintEnabled())
-												fix(gateway): 完善 thinking block 重试和 cache nil 检查

- 使用 FilterThinkingBlocksForRetry 替代 FilterThinkingBlocks
- count_tokens 增加 thinking block 签名错误重试
- cache nil 检查防止空指针
- shouldBill 逻辑修复避免重复扣费
- 移除 debug 日志

											
										
										
											2026-01-03 17:10:25 -08:00
+											if retryErr == nil {
 												resp = retryResp
 												respBody, err = io.ReadAll(resp.Body)
 												_ = resp.Body.Close()
 												if err != nil {
 													s.countTokensError(c, http.StatusBadGateway, "upstream_error", "Failed to read response")
 													return err
 												}
 											}
 										}
 									}
-												feat(gateway): 添加 /v1/messages/count_tokens 端点

实现 Claude API 的 token 计数功能，支持 OAuth、SetupToken 和 ApiKey 三种账号类型。

特点：
- 校验订阅/余额（不扣费）
- 不计算用户和账号并发
- 不记录使用量
- 支持模型映射（ApiKey 账号）
- 支持 OAuth 账号的指纹管理和 401 重试

											
										
										
											2025-12-19 11:12:41 +08:00
+									// 处理错误响应
 									if resp.StatusCode >= 400 {
 										// 标记账号状态（429/529等）
 										s.rateLimitService.HandleUpstreamError(ctx, account, resp.StatusCode, resp.Header, respBody)
-												feat(ops): 实现上游错误事件记录与查询功能

**新增功能**:
- 新建ops_upstream_error_events表存储上游服务错误详情
- 支持记录上游429/529/5xx错误的详细上下文信息
- 提供按时间范围查询上游错误事件的API

**后端改动**:
1. 模型层（ops_models.go, ops_port.go）:
   - 新增UpstreamErrorEvent结构体
   - 扩展Repository接口支持上游错误事件CRUD

2. 仓储层（ops_repo.go）:
   - 实现InsertUpstreamErrorEvent写入上游错误
   - 实现GetUpstreamErrorEvents按时间范围查询

3. 服务层（ops_service.go, ops_upstream_context.go）:
   - ops_service: 新增GetUpstreamErrorEvents查询方法
   - ops_upstream_context: 封装上游错误上下文构建逻辑

4. Handler层（ops_error_logger.go）:
   - 新增GetUpstreamErrorsHandler处理上游错误查询请求

5. Gateway层集成:
   - antigravity_gateway_service.go: 429/529错误时记录上游事件
   - gateway_service.go: OpenAI 429/5xx错误时记录
   - gemini_messages_compat_service.go: Gemini 429/5xx错误时记录
   - openai_gateway_service.go: OpenAI 429/5xx错误时记录
   - ratelimit_service.go: 429限流错误时记录

**数据记录字段**:
- request_id: 关联ops_logs主记录
- platform/model: 上游服务标识
- status_code/error_message: 错误详情
- request_headers/response_body: 调试信息（可选）
- created_at: 错误发生时间

											
										
										
											2026-01-11 15:30:27 +08:00
+										upstreamMsg := strings.TrimSpace(extractUpstreamErrorMessage(respBody))
 										upstreamMsg = sanitizeUpstreamErrorMessage(upstreamMsg)
 										upstreamDetail := ""
 										if s.cfg != nil && s.cfg.Gateway.LogUpstreamErrorBody {
 											maxBytes := s.cfg.Gateway.LogUpstreamErrorBodyMaxBytes
 											if maxBytes <= 0 {
 												maxBytes = 2048
 											}
 											upstreamDetail = truncateString(string(respBody), maxBytes)
 										}
 										setOpsUpstreamError(c, resp.StatusCode, upstreamMsg, upstreamDetail)
-												fix: 修复 /v1/messages 间歇性 400 错误 (#18)

* fix(upstream): 修复上游格式兼容性问题

- 跳过Claude模型无signature的thinking block
- 支持custom类型工具(MCP)格式转换
- 添加ClaudeCustomToolSpec结构体支持MCP工具
- 添加Custom字段验证，跳过无效custom工具
- 在convertClaudeToolsToGeminiTools中添加schema清理
- 完整的单元测试覆盖，包含边界情况

修复: Issue 0.1 signature缺失, Issue 0.2 custom工具格式
改进: Codex审查发现的2个重要问题

测试:
- TestBuildParts_ThinkingBlockWithoutSignature: 验证thinking block处理
- TestBuildTools_CustomTypeTools: 验证custom工具转换和边界情况
- TestConvertClaudeToolsToGeminiTools_CustomType: 验证service层转换

* feat(gemini): 添加Gemini限额与TierID支持

实现PR1：Gemini限额与TierID功能

后端修改：
- GeminiTokenInfo结构体添加TierID字段
- fetchProjectID函数返回(projectID, tierID, error)
- 从LoadCodeAssist响应中提取tierID（优先IsDefault，回退到第一个非空tier）
- ExchangeCode、RefreshAccountToken、GetAccessToken函数更新以处理tierID
- BuildAccountCredentials函数保存tier_id到credentials

前端修改：
- AccountStatusIndicator组件添加tier显示
- 支持LEGACY/PRO/ULTRA等tier类型的友好显示
- 使用蓝色badge展示tier信息

技术细节：
- tierID提取逻辑：优先选择IsDefault的tier，否则选择第一个非空tier
- 所有fetchProjectID调用点已更新以处理新的返回签名
- 前端gracefully处理missing/unknown tier_id

* refactor(gemini): 优化TierID实现并添加安全验证

根据并发代码审查（code-reviewer, security-auditor, gemini, codex）的反馈进行改进：

安全改进：
- 添加validateTierID函数验证tier_id格式和长度（最大64字符）
- 限制tier_id字符集为字母数字、下划线、连字符和斜杠
- 在BuildAccountCredentials中验证tier_id后再存储
- 静默跳过无效tier_id，不阻塞账户创建

代码质量改进：
- 提取extractTierIDFromAllowedTiers辅助函数消除重复代码
- 重构fetchProjectID函数，tierID提取逻辑只执行一次
- 改进代码可读性和可维护性

审查工具：
- code-reviewer agent (a09848e)
- security-auditor agent (a9a149c)
- gemini CLI (bcc7c81)
- codex (b5d8919)

修复问题：
- HIGH: 未验证的tier_id输入
- MEDIUM: 代码重复（tierID提取逻辑重复2次）

* fix(format): 修复 gofmt 格式问题

- 修复 claude_types.go 中的字段对齐问题
- 修复 gemini_messages_compat_service.go 中的缩进问题

* fix(upstream): 修复上游格式兼容性问题 (#14)

* fix(upstream): 修复上游格式兼容性问题

- 跳过Claude模型无signature的thinking block
- 支持custom类型工具(MCP)格式转换
- 添加ClaudeCustomToolSpec结构体支持MCP工具
- 添加Custom字段验证，跳过无效custom工具
- 在convertClaudeToolsToGeminiTools中添加schema清理
- 完整的单元测试覆盖，包含边界情况

修复: Issue 0.1 signature缺失, Issue 0.2 custom工具格式
改进: Codex审查发现的2个重要问题

测试:
- TestBuildParts_ThinkingBlockWithoutSignature: 验证thinking block处理
- TestBuildTools_CustomTypeTools: 验证custom工具转换和边界情况
- TestConvertClaudeToolsToGeminiTools_CustomType: 验证service层转换

* fix(format): 修复 gofmt 格式问题

- 修复 claude_types.go 中的字段对齐问题
- 修复 gemini_messages_compat_service.go 中的缩进问题

* fix(format): 修复 claude_types.go 的 gofmt 格式问题

* feat(antigravity): 优化 thinking block 和 schema 处理

- 为 dummy thinking block 添加 ThoughtSignature
- 重构 thinking block 处理逻辑，在每个条件分支内创建 part
- 优化 excludedSchemaKeys，移除 Gemini 实际支持的字段
  (minItems, maxItems, minimum, maximum, additionalProperties, format)
- 添加详细注释说明 Gemini API 支持的 schema 字段

* fix(antigravity): 增强 schema 清理的安全性

基于 Codex review 建议：
- 添加 format 字段白名单过滤，只保留 Gemini 支持的 date-time/date/time
- 补充更多不支持的 schema 关键字到黑名单：
  * 组合 schema: oneOf, anyOf, allOf, not, if/then/else
  * 对象验证: minProperties, maxProperties, patternProperties 等
  * 定义引用: $defs, definitions
- 避免不支持的 schema 字段导致 Gemini API 校验失败

* fix(lint): 修复 gemini_messages_compat_service 空分支警告

- 在 cleanToolSchema 的 if 语句中添加 continue
- 移除重复的注释

* fix(antigravity): 移除 minItems/maxItems 以兼容 Claude API

- 将 minItems 和 maxItems 添加到 schema 黑名单
- Claude API (Vertex AI) 不支持这些数组验证字段
- 添加调试日志记录工具 schema 转换过程
- 修复 tools.14.custom.input_schema 验证错误

* fix(antigravity): 修复 additionalProperties schema 对象问题

- 将 additionalProperties 的 schema 对象转换为布尔值 true
- Claude API 只支持 additionalProperties: false，不支持 schema 对象
- 修复 tools.14.custom.input_schema 验证错误
- 参考 Claude 官方文档的 JSON Schema 限制

* fix(antigravity): 修复 Claude 模型 thinking 块兼容性问题

- 完全跳过 Claude 模型的 thinking 块以避免 signature 验证失败
- 只在 Gemini 模型中使用 dummy thought signature
- 修改 additionalProperties 默认值为 false（更安全）
- 添加调试日志以便排查问题

* fix(upstream): 修复跨模型切换时的 dummy signature 问题

基于 Codex review 和用户场景分析的修复：

1. 问题场景
   - Gemini (thinking) → Claude (thinking) 切换时
   - Gemini 返回的 thinking 块使用 dummy signature
   - Claude API 会拒绝 dummy signature，导致 400 错误

2. 修复内容
   - request_transformer.go:262: 跳过 dummy signature
   - 只保留真实的 Claude signature
   - 支持频繁的跨模型切换

3. 其他修复（基于 Codex review）
   - gateway_service.go:691: 修复 io.ReadAll 错误处理
   - gateway_service.go:687: 条件日志（尊重 LogUpstreamErrorBody 配置）
   - gateway_service.go:915: 收紧 400 failover 启发式
   - request_transformer.go:188: 移除签名成功日志

4. 新增功能（默认关闭）
   - 阶段 1: 上游错误日志（GATEWAY_LOG_UPSTREAM_ERROR_BODY）
   - 阶段 2: Antigravity thinking 修复
   - 阶段 3: API-key beta 注入（GATEWAY_INJECT_BETA_FOR_APIKEY）
   - 阶段 3: 智能 400 failover（GATEWAY_FAILOVER_ON_400）

测试：所有测试通过

* fix(lint): 修复 golangci-lint 问题

- 应用 De Morgan 定律简化条件判断
- 修复 gofmt 格式问题
- 移除未使用的 min 函数
											
										
										
											2026-01-01 04:21:18 +08:00
+										// 记录上游错误摘要便于排障（不回显请求内容）
 										if s.cfg != nil && s.cfg.Gateway.LogUpstreamErrorBody {
 											log.Printf(
 												"count_tokens upstream error %d (account=%d platform=%s type=%s): %s",
 												resp.StatusCode,
 												account.ID,
 												account.Platform,
 												account.Type,
 												truncateForLog(respBody, s.cfg.Gateway.LogUpstreamErrorBodyMaxBytes),
 											)
 										}
-												feat(gateway): 添加 /v1/messages/count_tokens 端点

实现 Claude API 的 token 计数功能，支持 OAuth、SetupToken 和 ApiKey 三种账号类型。

特点：
- 校验订阅/余额（不扣费）
- 不计算用户和账号并发
- 不记录使用量
- 支持模型映射（ApiKey 账号）
- 支持 OAuth 账号的指纹管理和 401 重试

											
										
										
											2025-12-19 11:12:41 +08:00
+										// 返回简化的错误响应
 										errMsg := "Upstream request failed"
 										switch resp.StatusCode {
 										case 429:
 											errMsg = "Rate limit exceeded"
 										case 529:
 											errMsg = "Service overloaded"
 										}
 										s.countTokensError(c, resp.StatusCode, "upstream_error", errMsg)
-												feat(ops): 实现上游错误事件记录与查询功能

**新增功能**:
- 新建ops_upstream_error_events表存储上游服务错误详情
- 支持记录上游429/529/5xx错误的详细上下文信息
- 提供按时间范围查询上游错误事件的API

**后端改动**:
1. 模型层（ops_models.go, ops_port.go）:
   - 新增UpstreamErrorEvent结构体
   - 扩展Repository接口支持上游错误事件CRUD

2. 仓储层（ops_repo.go）:
   - 实现InsertUpstreamErrorEvent写入上游错误
   - 实现GetUpstreamErrorEvents按时间范围查询

3. 服务层（ops_service.go, ops_upstream_context.go）:
   - ops_service: 新增GetUpstreamErrorEvents查询方法
   - ops_upstream_context: 封装上游错误上下文构建逻辑

4. Handler层（ops_error_logger.go）:
   - 新增GetUpstreamErrorsHandler处理上游错误查询请求

5. Gateway层集成:
   - antigravity_gateway_service.go: 429/529错误时记录上游事件
   - gateway_service.go: OpenAI 429/5xx错误时记录
   - gemini_messages_compat_service.go: Gemini 429/5xx错误时记录
   - openai_gateway_service.go: OpenAI 429/5xx错误时记录
   - ratelimit_service.go: 429限流错误时记录

**数据记录字段**:
- request_id: 关联ops_logs主记录
- platform/model: 上游服务标识
- status_code/error_message: 错误详情
- request_headers/response_body: 调试信息（可选）
- created_at: 错误发生时间

											
										
										
											2026-01-11 15:30:27 +08:00
+										if upstreamMsg == "" {
 											return fmt.Errorf("upstream error: %d", resp.StatusCode)
 										}
 										return fmt.Errorf("upstream error: %d message=%s", resp.StatusCode, upstreamMsg)
-												feat(gateway): 添加 /v1/messages/count_tokens 端点

实现 Claude API 的 token 计数功能，支持 OAuth、SetupToken 和 ApiKey 三种账号类型。

特点：
- 校验订阅/余额（不扣费）
- 不计算用户和账号并发
- 不记录使用量
- 支持模型映射（ApiKey 账号）
- 支持 OAuth 账号的指纹管理和 401 重试

											
										
										
											2025-12-19 11:12:41 +08:00
+									}
 									// 透传成功响应
 									c.Data(resp.StatusCode, "application/json", respBody)
 									return nil
 								}
 								// buildCountTokensRequest 构建 count_tokens 上游请求
-												fix(网关): 区分 Claude Code OAuth 适配

											
										
										
											2026-01-15 19:17:07 +08:00
+								func (s *GatewayService) buildCountTokensRequest(ctx context.Context, c *gin.Context, account *Account, body []byte, token, tokenType, modelID string, mimicClaudeCode bool) (*http.Request, error) {
-												feat(gateway): 添加 /v1/messages/count_tokens 端点

实现 Claude API 的 token 计数功能，支持 OAuth、SetupToken 和 ApiKey 三种账号类型。

特点：
- 校验订阅/余额（不扣费）
- 不计算用户和账号并发
- 不记录使用量
- 支持模型映射（ApiKey 账号）
- 支持 OAuth 账号的指纹管理和 401 重试

											
										
										
											2025-12-19 11:12:41 +08:00
+									// 确定目标 URL
 									targetURL := claudeAPICountTokensURL
-												fix(lint): 修复所有 Go 命名规范问题

- 全局替换 ApiKey → APIKey（类型、字段、方法、变量）
- 修复所有 initialism 命名（API, SMTP, HTML, URL 等）
- 添加所有缺失的包注释
- 修复导出符号的注释格式

主要修改：
- ApiKey → APIKey（所有出现的地方）
- ApiKeyID → APIKeyID
- ApiKeyIDs → APIKeyIDs
- TestSmtpConnection → TestSMTPConnection
- HtmlURL → HTMLURL
- 添加 20+ 个包注释
- 修复 10+ 个导出符号注释格式

验证结果：
- ✓ golangci-lint: 0 issues
- ✓ 单元测试: 通过
- ✓ 集成测试: 通过

											
										
										
											2026-01-04 19:27:53 +08:00
+									if account.Type == AccountTypeAPIKey {
-												feat(gateway): 添加 /v1/messages/count_tokens 端点

实现 Claude API 的 token 计数功能，支持 OAuth、SetupToken 和 ApiKey 三种账号类型。

特点：
- 校验订阅/余额（不扣费）
- 不计算用户和账号并发
- 不记录使用量
- 支持模型映射（ApiKey 账号）
- 支持 OAuth 账号的指纹管理和 401 重试

											
										
										
											2025-12-19 11:12:41 +08:00
+										baseURL := account.GetBaseURL()
-												feat(安全): 强化安全策略与配置校验

- 增加 CORS/CSP/安全响应头与代理信任配置

- 引入 URL 白名单与私网开关，校验上游与价格源

- 改善 API Key 处理与网关错误返回

- 管理端设置隐藏敏感字段并优化前端提示

- 增加计费熔断与相关配置示例

测试: go test ./...

											
										
										
											2026-01-02 17:40:57 +08:00
+										if baseURL != "" {
 											validatedURL, err := s.validateUpstreamBaseURL(baseURL)
 											if err != nil {
 												return nil, err
 											}
 											targetURL = validatedURL + "/v1/messages/count_tokens"
 										}
-												feat(gateway): 添加 /v1/messages/count_tokens 端点

实现 Claude API 的 token 计数功能，支持 OAuth、SetupToken 和 ApiKey 三种账号类型。

特点：
- 校验订阅/余额（不扣费）
- 不计算用户和账号并发
- 不记录使用量
- 支持模型映射（ApiKey 账号）
- 支持 OAuth 账号的指纹管理和 401 重试

											
										
										
											2025-12-19 11:12:41 +08:00
+									}
-												fix: satisfy golangci-lint (nil checks, remove unused helpers)

											
										
										
											2026-01-31 02:07:57 +08:00
+									clientHeaders := http.Header{}
 									if c != nil && c.Request != nil {
 										clientHeaders = c.Request.Header
 									}
-												feat(gateway): 添加 /v1/messages/count_tokens 端点

实现 Claude API 的 token 计数功能，支持 OAuth、SetupToken 和 ApiKey 三种账号类型。

特点：
- 校验订阅/余额（不扣费）
- 不计算用户和账号并发
- 不记录使用量
- 支持模型映射（ApiKey 账号）
- 支持 OAuth 账号的指纹管理和 401 重试

											
										
										
											2025-12-19 11:12:41 +08:00
+									// OAuth 账号：应用统一指纹和重写 userID
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+									// 如果启用了会话ID伪装，会在重写后替换 session 部分为固定值
-												feat(gateway): 添加 /v1/messages/count_tokens 端点

实现 Claude API 的 token 计数功能，支持 OAuth、SetupToken 和 ApiKey 三种账号类型。

特点：
- 校验订阅/余额（不扣费）
- 不计算用户和账号并发
- 不记录使用量
- 支持模型映射（ApiKey 账号）
- 支持 OAuth 账号的指纹管理和 401 重试

											
										
										
											2025-12-19 11:12:41 +08:00
+									if account.IsOAuth() && s.identityService != nil {
-												fix: satisfy golangci-lint (nil checks, remove unused helpers)

											
										
										
											2026-01-31 02:07:57 +08:00
+										fp, err := s.identityService.GetOrCreateFingerprint(ctx, account.ID, clientHeaders)
-												feat(gateway): 添加 /v1/messages/count_tokens 端点

实现 Claude API 的 token 计数功能，支持 OAuth、SetupToken 和 ApiKey 三种账号类型。

特点：
- 校验订阅/余额（不扣费）
- 不计算用户和账号并发
- 不记录使用量
- 支持模型映射（ApiKey 账号）
- 支持 OAuth 账号的指纹管理和 401 重试

											
										
										
											2025-12-19 11:12:41 +08:00
+										if err == nil {
 											accountUUID := account.GetExtraString("account_uuid")
 											if accountUUID != "" && fp.ClientID != "" {
-												merge upstream main

											
										
										
											2026-02-02 22:13:50 +08:00
+												if newBody, err := s.identityService.RewriteUserIDWithMasking(ctx, body, account, accountUUID, fp.ClientID); err == nil && len(newBody) > 0 {
-												feat(gateway): 添加 /v1/messages/count_tokens 端点

实现 Claude API 的 token 计数功能，支持 OAuth、SetupToken 和 ApiKey 三种账号类型。

特点：
- 校验订阅/余额（不扣费）
- 不计算用户和账号并发
- 不记录使用量
- 支持模型映射（ApiKey 账号）
- 支持 OAuth 账号的指纹管理和 401 重试

											
										
										
											2025-12-19 11:12:41 +08:00
+													body = newBody
 												}
 											}
 										}
 									}
 									req, err := http.NewRequestWithContext(ctx, "POST", targetURL, bytes.NewReader(body))
 									if err != nil {
 										return nil, err
 									}
 									// 设置认证头
 									if tokenType == "oauth" {
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+										req.Header.Set("authorization", "Bearer "+token)
-												feat(gateway): 添加 /v1/messages/count_tokens 端点

实现 Claude API 的 token 计数功能，支持 OAuth、SetupToken 和 ApiKey 三种账号类型。

特点：
- 校验订阅/余额（不扣费）
- 不计算用户和账号并发
- 不记录使用量
- 支持模型映射（ApiKey 账号）
- 支持 OAuth 账号的指纹管理和 401 重试

											
										
										
											2025-12-19 11:12:41 +08:00
+									} else {
 										req.Header.Set("x-api-key", token)
 									}
 									// 白名单透传 headers
-												fix: satisfy golangci-lint (nil checks, remove unused helpers)

											
										
										
											2026-01-31 02:07:57 +08:00
+									for key, values := range clientHeaders {
-												feat(gateway): 添加 /v1/messages/count_tokens 端点

实现 Claude API 的 token 计数功能，支持 OAuth、SetupToken 和 ApiKey 三种账号类型。

特点：
- 校验订阅/余额（不扣费）
- 不计算用户和账号并发
- 不记录使用量
- 支持模型映射（ApiKey 账号）
- 支持 OAuth 账号的指纹管理和 401 重试

											
										
										
											2025-12-19 11:12:41 +08:00
+										lowerKey := strings.ToLower(key)
 										if allowedHeaders[lowerKey] {
 											for _, v := range values {
 												req.Header.Add(key, v)
 											}
 										}
 									}
 									// OAuth 账号：应用指纹到请求头
 									if account.IsOAuth() && s.identityService != nil {
-												fix: satisfy golangci-lint (nil checks, remove unused helpers)

											
										
										
											2026-01-31 02:07:57 +08:00
+										fp, _ := s.identityService.GetOrCreateFingerprint(ctx, account.ID, clientHeaders)
-												feat(gateway): 添加 /v1/messages/count_tokens 端点

实现 Claude API 的 token 计数功能，支持 OAuth、SetupToken 和 ApiKey 三种账号类型。

特点：
- 校验订阅/余额（不扣费）
- 不计算用户和账号并发
- 不记录使用量
- 支持模型映射（ApiKey 账号）
- 支持 OAuth 账号的指纹管理和 401 重试

											
										
										
											2025-12-19 11:12:41 +08:00
+										if fp != nil {
 											s.identityService.ApplyFingerprint(req, fp)
 										}
 									}
 									// 确保必要的 headers 存在
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									if req.Header.Get("content-type") == "" {
 										req.Header.Set("content-type", "application/json")
-												feat(gateway): 添加 /v1/messages/count_tokens 端点

实现 Claude API 的 token 计数功能，支持 OAuth、SetupToken 和 ApiKey 三种账号类型。

特点：
- 校验订阅/余额（不扣费）
- 不计算用户和账号并发
- 不记录使用量
- 支持模型映射（ApiKey 账号）
- 支持 OAuth 账号的指纹管理和 401 重试

											
										
										
											2025-12-19 11:12:41 +08:00
+									}
 									if req.Header.Get("anthropic-version") == "" {
 										req.Header.Set("anthropic-version", "2023-06-01")
 									}
-												fix(网关): OAuth 请求统一 user_id 与指纹

											
										
										
											2026-01-19 15:01:32 +08:00
+									if tokenType == "oauth" {
-												fix(网关): 对齐 Claude OAuth 请求适配

											
										
										
											2026-01-15 18:54:42 +08:00
+										applyClaudeOAuthHeaderDefaults(req, false)
 									}
-												feat(gateway): 添加 /v1/messages/count_tokens 端点

实现 Claude API 的 token 计数功能，支持 OAuth、SetupToken 和 ApiKey 三种账号类型。

特点：
- 校验订阅/余额（不扣费）
- 不计算用户和账号并发
- 不记录使用量
- 支持模型映射（ApiKey 账号）
- 支持 OAuth 账号的指纹管理和 401 重试

											
										
										
											2025-12-19 11:12:41 +08:00
 									// OAuth 账号：处理 anthropic-beta header
 									if tokenType == "oauth" {
-												fix(网关): Claude Code OAuth 补齐 oauth beta

											
										
										
											2026-01-16 23:15:52 +08:00
+										if mimicClaudeCode {
-												fix(oauth): merge anthropic-beta and force Claude Code headers in mimic mode

											
										
										
											2026-01-29 02:36:28 +08:00
+											applyClaudeCodeMimicHeaders(req, false)
 											incomingBeta := req.Header.Get("anthropic-beta")
 											requiredBetas := []string{claude.BetaClaudeCode, claude.BetaOAuth, claude.BetaInterleavedThinking, claude.BetaTokenCounting}
 											req.Header.Set("anthropic-beta", mergeAnthropicBeta(requiredBetas, incomingBeta))
-												fix(网关): Claude Code OAuth 补齐 oauth beta

											
										
										
											2026-01-16 23:15:52 +08:00
+										} else {
 											clientBetaHeader := req.Header.Get("anthropic-beta")
 											if clientBetaHeader == "" {
 												req.Header.Set("anthropic-beta", claude.CountTokensBetaHeader)
 											} else {
 												beta := s.getBetaHeader(modelID, clientBetaHeader)
 												if !strings.Contains(beta, claude.BetaTokenCounting) {
 													beta = beta + "," + claude.BetaTokenCounting
 												}
 												req.Header.Set("anthropic-beta", beta)
 											}
 										}
-												fix(lint): 修复所有 Go 命名规范问题

- 全局替换 ApiKey → APIKey（类型、字段、方法、变量）
- 修复所有 initialism 命名（API, SMTP, HTML, URL 等）
- 添加所有缺失的包注释
- 修复导出符号的注释格式

主要修改：
- ApiKey → APIKey（所有出现的地方）
- ApiKeyID → APIKeyID
- ApiKeyIDs → APIKeyIDs
- TestSmtpConnection → TestSMTPConnection
- HtmlURL → HTMLURL
- 添加 20+ 个包注释
- 修复 10+ 个导出符号注释格式

验证结果：
- ✓ golangci-lint: 0 issues
- ✓ 单元测试: 通过
- ✓ 集成测试: 通过

											
										
										
											2026-01-04 19:27:53 +08:00
+									} else if s.cfg != nil && s.cfg.Gateway.InjectBetaForAPIKey && req.Header.Get("anthropic-beta") == "" {
-												fix: 修复 /v1/messages 间歇性 400 错误 (#18)

* fix(upstream): 修复上游格式兼容性问题

- 跳过Claude模型无signature的thinking block
- 支持custom类型工具(MCP)格式转换
- 添加ClaudeCustomToolSpec结构体支持MCP工具
- 添加Custom字段验证，跳过无效custom工具
- 在convertClaudeToolsToGeminiTools中添加schema清理
- 完整的单元测试覆盖，包含边界情况

修复: Issue 0.1 signature缺失, Issue 0.2 custom工具格式
改进: Codex审查发现的2个重要问题

测试:
- TestBuildParts_ThinkingBlockWithoutSignature: 验证thinking block处理
- TestBuildTools_CustomTypeTools: 验证custom工具转换和边界情况
- TestConvertClaudeToolsToGeminiTools_CustomType: 验证service层转换

* feat(gemini): 添加Gemini限额与TierID支持

实现PR1：Gemini限额与TierID功能

后端修改：
- GeminiTokenInfo结构体添加TierID字段
- fetchProjectID函数返回(projectID, tierID, error)
- 从LoadCodeAssist响应中提取tierID（优先IsDefault，回退到第一个非空tier）
- ExchangeCode、RefreshAccountToken、GetAccessToken函数更新以处理tierID
- BuildAccountCredentials函数保存tier_id到credentials

前端修改：
- AccountStatusIndicator组件添加tier显示
- 支持LEGACY/PRO/ULTRA等tier类型的友好显示
- 使用蓝色badge展示tier信息

技术细节：
- tierID提取逻辑：优先选择IsDefault的tier，否则选择第一个非空tier
- 所有fetchProjectID调用点已更新以处理新的返回签名
- 前端gracefully处理missing/unknown tier_id

* refactor(gemini): 优化TierID实现并添加安全验证

根据并发代码审查（code-reviewer, security-auditor, gemini, codex）的反馈进行改进：

安全改进：
- 添加validateTierID函数验证tier_id格式和长度（最大64字符）
- 限制tier_id字符集为字母数字、下划线、连字符和斜杠
- 在BuildAccountCredentials中验证tier_id后再存储
- 静默跳过无效tier_id，不阻塞账户创建

代码质量改进：
- 提取extractTierIDFromAllowedTiers辅助函数消除重复代码
- 重构fetchProjectID函数，tierID提取逻辑只执行一次
- 改进代码可读性和可维护性

审查工具：
- code-reviewer agent (a09848e)
- security-auditor agent (a9a149c)
- gemini CLI (bcc7c81)
- codex (b5d8919)

修复问题：
- HIGH: 未验证的tier_id输入
- MEDIUM: 代码重复（tierID提取逻辑重复2次）

* fix(format): 修复 gofmt 格式问题

- 修复 claude_types.go 中的字段对齐问题
- 修复 gemini_messages_compat_service.go 中的缩进问题

* fix(upstream): 修复上游格式兼容性问题 (#14)

* fix(upstream): 修复上游格式兼容性问题

- 跳过Claude模型无signature的thinking block
- 支持custom类型工具(MCP)格式转换
- 添加ClaudeCustomToolSpec结构体支持MCP工具
- 添加Custom字段验证，跳过无效custom工具
- 在convertClaudeToolsToGeminiTools中添加schema清理
- 完整的单元测试覆盖，包含边界情况

修复: Issue 0.1 signature缺失, Issue 0.2 custom工具格式
改进: Codex审查发现的2个重要问题

测试:
- TestBuildParts_ThinkingBlockWithoutSignature: 验证thinking block处理
- TestBuildTools_CustomTypeTools: 验证custom工具转换和边界情况
- TestConvertClaudeToolsToGeminiTools_CustomType: 验证service层转换

* fix(format): 修复 gofmt 格式问题

- 修复 claude_types.go 中的字段对齐问题
- 修复 gemini_messages_compat_service.go 中的缩进问题

* fix(format): 修复 claude_types.go 的 gofmt 格式问题

* feat(antigravity): 优化 thinking block 和 schema 处理

- 为 dummy thinking block 添加 ThoughtSignature
- 重构 thinking block 处理逻辑，在每个条件分支内创建 part
- 优化 excludedSchemaKeys，移除 Gemini 实际支持的字段
  (minItems, maxItems, minimum, maximum, additionalProperties, format)
- 添加详细注释说明 Gemini API 支持的 schema 字段

* fix(antigravity): 增强 schema 清理的安全性

基于 Codex review 建议：
- 添加 format 字段白名单过滤，只保留 Gemini 支持的 date-time/date/time
- 补充更多不支持的 schema 关键字到黑名单：
  * 组合 schema: oneOf, anyOf, allOf, not, if/then/else
  * 对象验证: minProperties, maxProperties, patternProperties 等
  * 定义引用: $defs, definitions
- 避免不支持的 schema 字段导致 Gemini API 校验失败

* fix(lint): 修复 gemini_messages_compat_service 空分支警告

- 在 cleanToolSchema 的 if 语句中添加 continue
- 移除重复的注释

* fix(antigravity): 移除 minItems/maxItems 以兼容 Claude API

- 将 minItems 和 maxItems 添加到 schema 黑名单
- Claude API (Vertex AI) 不支持这些数组验证字段
- 添加调试日志记录工具 schema 转换过程
- 修复 tools.14.custom.input_schema 验证错误

* fix(antigravity): 修复 additionalProperties schema 对象问题

- 将 additionalProperties 的 schema 对象转换为布尔值 true
- Claude API 只支持 additionalProperties: false，不支持 schema 对象
- 修复 tools.14.custom.input_schema 验证错误
- 参考 Claude 官方文档的 JSON Schema 限制

* fix(antigravity): 修复 Claude 模型 thinking 块兼容性问题

- 完全跳过 Claude 模型的 thinking 块以避免 signature 验证失败
- 只在 Gemini 模型中使用 dummy thought signature
- 修改 additionalProperties 默认值为 false（更安全）
- 添加调试日志以便排查问题

* fix(upstream): 修复跨模型切换时的 dummy signature 问题

基于 Codex review 和用户场景分析的修复：

1. 问题场景
   - Gemini (thinking) → Claude (thinking) 切换时
   - Gemini 返回的 thinking 块使用 dummy signature
   - Claude API 会拒绝 dummy signature，导致 400 错误

2. 修复内容
   - request_transformer.go:262: 跳过 dummy signature
   - 只保留真实的 Claude signature
   - 支持频繁的跨模型切换

3. 其他修复（基于 Codex review）
   - gateway_service.go:691: 修复 io.ReadAll 错误处理
   - gateway_service.go:687: 条件日志（尊重 LogUpstreamErrorBody 配置）
   - gateway_service.go:915: 收紧 400 failover 启发式
   - request_transformer.go:188: 移除签名成功日志

4. 新增功能（默认关闭）
   - 阶段 1: 上游错误日志（GATEWAY_LOG_UPSTREAM_ERROR_BODY）
   - 阶段 2: Antigravity thinking 修复
   - 阶段 3: API-key beta 注入（GATEWAY_INJECT_BETA_FOR_APIKEY）
   - 阶段 3: 智能 400 failover（GATEWAY_FAILOVER_ON_400）

测试：所有测试通过

* fix(lint): 修复 golangci-lint 问题

- 应用 De Morgan 定律简化条件判断
- 修复 gofmt 格式问题
- 移除未使用的 min 函数
											
										
										
											2026-01-01 04:21:18 +08:00
+										// API-key：与 messages 同步的按需 beta 注入（默认关闭）
 										if requestNeedsBetaFeatures(body) {
-												fix(lint): 修复所有 Go 命名规范问题

- 全局替换 ApiKey → APIKey（类型、字段、方法、变量）
- 修复所有 initialism 命名（API, SMTP, HTML, URL 等）
- 添加所有缺失的包注释
- 修复导出符号的注释格式

主要修改：
- ApiKey → APIKey（所有出现的地方）
- ApiKeyID → APIKeyID
- ApiKeyIDs → APIKeyIDs
- TestSmtpConnection → TestSMTPConnection
- HtmlURL → HTMLURL
- 添加 20+ 个包注释
- 修复 10+ 个导出符号注释格式

验证结果：
- ✓ golangci-lint: 0 issues
- ✓ 单元测试: 通过
- ✓ 集成测试: 通过

											
										
										
											2026-01-04 19:27:53 +08:00
+											if beta := defaultAPIKeyBetaHeader(body); beta != "" {
-												fix: 修复 /v1/messages 间歇性 400 错误 (#18)

* fix(upstream): 修复上游格式兼容性问题

- 跳过Claude模型无signature的thinking block
- 支持custom类型工具(MCP)格式转换
- 添加ClaudeCustomToolSpec结构体支持MCP工具
- 添加Custom字段验证，跳过无效custom工具
- 在convertClaudeToolsToGeminiTools中添加schema清理
- 完整的单元测试覆盖，包含边界情况

修复: Issue 0.1 signature缺失, Issue 0.2 custom工具格式
改进: Codex审查发现的2个重要问题

测试:
- TestBuildParts_ThinkingBlockWithoutSignature: 验证thinking block处理
- TestBuildTools_CustomTypeTools: 验证custom工具转换和边界情况
- TestConvertClaudeToolsToGeminiTools_CustomType: 验证service层转换

* feat(gemini): 添加Gemini限额与TierID支持

实现PR1：Gemini限额与TierID功能

后端修改：
- GeminiTokenInfo结构体添加TierID字段
- fetchProjectID函数返回(projectID, tierID, error)
- 从LoadCodeAssist响应中提取tierID（优先IsDefault，回退到第一个非空tier）
- ExchangeCode、RefreshAccountToken、GetAccessToken函数更新以处理tierID
- BuildAccountCredentials函数保存tier_id到credentials

前端修改：
- AccountStatusIndicator组件添加tier显示
- 支持LEGACY/PRO/ULTRA等tier类型的友好显示
- 使用蓝色badge展示tier信息

技术细节：
- tierID提取逻辑：优先选择IsDefault的tier，否则选择第一个非空tier
- 所有fetchProjectID调用点已更新以处理新的返回签名
- 前端gracefully处理missing/unknown tier_id

* refactor(gemini): 优化TierID实现并添加安全验证

根据并发代码审查（code-reviewer, security-auditor, gemini, codex）的反馈进行改进：

安全改进：
- 添加validateTierID函数验证tier_id格式和长度（最大64字符）
- 限制tier_id字符集为字母数字、下划线、连字符和斜杠
- 在BuildAccountCredentials中验证tier_id后再存储
- 静默跳过无效tier_id，不阻塞账户创建

代码质量改进：
- 提取extractTierIDFromAllowedTiers辅助函数消除重复代码
- 重构fetchProjectID函数，tierID提取逻辑只执行一次
- 改进代码可读性和可维护性

审查工具：
- code-reviewer agent (a09848e)
- security-auditor agent (a9a149c)
- gemini CLI (bcc7c81)
- codex (b5d8919)

修复问题：
- HIGH: 未验证的tier_id输入
- MEDIUM: 代码重复（tierID提取逻辑重复2次）

* fix(format): 修复 gofmt 格式问题

- 修复 claude_types.go 中的字段对齐问题
- 修复 gemini_messages_compat_service.go 中的缩进问题

* fix(upstream): 修复上游格式兼容性问题 (#14)

* fix(upstream): 修复上游格式兼容性问题

- 跳过Claude模型无signature的thinking block
- 支持custom类型工具(MCP)格式转换
- 添加ClaudeCustomToolSpec结构体支持MCP工具
- 添加Custom字段验证，跳过无效custom工具
- 在convertClaudeToolsToGeminiTools中添加schema清理
- 完整的单元测试覆盖，包含边界情况

修复: Issue 0.1 signature缺失, Issue 0.2 custom工具格式
改进: Codex审查发现的2个重要问题

测试:
- TestBuildParts_ThinkingBlockWithoutSignature: 验证thinking block处理
- TestBuildTools_CustomTypeTools: 验证custom工具转换和边界情况
- TestConvertClaudeToolsToGeminiTools_CustomType: 验证service层转换

* fix(format): 修复 gofmt 格式问题

- 修复 claude_types.go 中的字段对齐问题
- 修复 gemini_messages_compat_service.go 中的缩进问题

* fix(format): 修复 claude_types.go 的 gofmt 格式问题

* feat(antigravity): 优化 thinking block 和 schema 处理

- 为 dummy thinking block 添加 ThoughtSignature
- 重构 thinking block 处理逻辑，在每个条件分支内创建 part
- 优化 excludedSchemaKeys，移除 Gemini 实际支持的字段
  (minItems, maxItems, minimum, maximum, additionalProperties, format)
- 添加详细注释说明 Gemini API 支持的 schema 字段

* fix(antigravity): 增强 schema 清理的安全性

基于 Codex review 建议：
- 添加 format 字段白名单过滤，只保留 Gemini 支持的 date-time/date/time
- 补充更多不支持的 schema 关键字到黑名单：
  * 组合 schema: oneOf, anyOf, allOf, not, if/then/else
  * 对象验证: minProperties, maxProperties, patternProperties 等
  * 定义引用: $defs, definitions
- 避免不支持的 schema 字段导致 Gemini API 校验失败

* fix(lint): 修复 gemini_messages_compat_service 空分支警告

- 在 cleanToolSchema 的 if 语句中添加 continue
- 移除重复的注释

* fix(antigravity): 移除 minItems/maxItems 以兼容 Claude API

- 将 minItems 和 maxItems 添加到 schema 黑名单
- Claude API (Vertex AI) 不支持这些数组验证字段
- 添加调试日志记录工具 schema 转换过程
- 修复 tools.14.custom.input_schema 验证错误

* fix(antigravity): 修复 additionalProperties schema 对象问题

- 将 additionalProperties 的 schema 对象转换为布尔值 true
- Claude API 只支持 additionalProperties: false，不支持 schema 对象
- 修复 tools.14.custom.input_schema 验证错误
- 参考 Claude 官方文档的 JSON Schema 限制

* fix(antigravity): 修复 Claude 模型 thinking 块兼容性问题

- 完全跳过 Claude 模型的 thinking 块以避免 signature 验证失败
- 只在 Gemini 模型中使用 dummy thought signature
- 修改 additionalProperties 默认值为 false（更安全）
- 添加调试日志以便排查问题

* fix(upstream): 修复跨模型切换时的 dummy signature 问题

基于 Codex review 和用户场景分析的修复：

1. 问题场景
   - Gemini (thinking) → Claude (thinking) 切换时
   - Gemini 返回的 thinking 块使用 dummy signature
   - Claude API 会拒绝 dummy signature，导致 400 错误

2. 修复内容
   - request_transformer.go:262: 跳过 dummy signature
   - 只保留真实的 Claude signature
   - 支持频繁的跨模型切换

3. 其他修复（基于 Codex review）
   - gateway_service.go:691: 修复 io.ReadAll 错误处理
   - gateway_service.go:687: 条件日志（尊重 LogUpstreamErrorBody 配置）
   - gateway_service.go:915: 收紧 400 failover 启发式
   - request_transformer.go:188: 移除签名成功日志

4. 新增功能（默认关闭）
   - 阶段 1: 上游错误日志（GATEWAY_LOG_UPSTREAM_ERROR_BODY）
   - 阶段 2: Antigravity thinking 修复
   - 阶段 3: API-key beta 注入（GATEWAY_INJECT_BETA_FOR_APIKEY）
   - 阶段 3: 智能 400 failover（GATEWAY_FAILOVER_ON_400）

测试：所有测试通过

* fix(lint): 修复 golangci-lint 问题

- 应用 De Morgan 定律简化条件判断
- 修复 gofmt 格式问题
- 移除未使用的 min 函数
											
										
										
											2026-01-01 04:21:18 +08:00
+												req.Header.Set("anthropic-beta", beta)
 											}
 										}
-												feat(gateway): 添加 /v1/messages/count_tokens 端点

实现 Claude API 的 token 计数功能，支持 OAuth、SetupToken 和 ApiKey 三种账号类型。

特点：
- 校验订阅/余额（不扣费）
- 不计算用户和账号并发
- 不记录使用量
- 支持模型映射（ApiKey 账号）
- 支持 OAuth 账号的指纹管理和 401 重试

											
										
										
											2025-12-19 11:12:41 +08:00
+									}
-												chore(debug): emit Claude mimic fingerprint on credential-scope error

											
										
										
											2026-01-29 15:17:46 +08:00
+									if c != nil && tokenType == "oauth" {
 										c.Set(claudeMimicDebugInfoKey, buildClaudeMimicDebugLine(req, body, account, tokenType, mimicClaudeCode))
 									}
-												chore(debug): log Claude mimic fingerprint

											
										
										
											2026-01-29 03:13:14 +08:00
+									if s.debugClaudeMimicEnabled() {
 										logClaudeMimicDebug(req, body, account, tokenType, mimicClaudeCode)
 									}
-												refactor(backend): service http ports

											
										
										
											2025-12-20 11:56:11 +08:00
+									return req, nil
-												feat(gateway): 添加 /v1/messages/count_tokens 端点

实现 Claude API 的 token 计数功能，支持 OAuth、SetupToken 和 ApiKey 三种账号类型。

特点：
- 校验订阅/余额（不扣费）
- 不计算用户和账号并发
- 不记录使用量
- 支持模型映射（ApiKey 账号）
- 支持 OAuth 账号的指纹管理和 401 重试

											
										
										
											2025-12-19 11:12:41 +08:00
+								}
 								// countTokensError 返回 count_tokens 错误响应
 								func (s *GatewayService) countTokensError(c *gin.Context, status int, errType, message string) {
 									c.JSON(status, gin.H{
 										"type": "error",
 										"error": gin.H{
 											"type":    errType,
 											"message": message,
 										},
 									})
 								}
-												feat: 添加模型白名单选择器组件，同步 new-api 模型列表

- 新增 ModelWhitelistSelector.vue 支持模型白名单多选
- 新增 ModelIcon.vue 显示品牌图标（基于 @lobehub/icons）
- 新增 useModelWhitelist.ts 硬编码各平台模型列表
- 更新账号编辑表单支持模型白名单配置
- 支持 Claude/OpenAI/Gemini/智谱/百度/讯飞等主流平台

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>

											
										
										
											2026-01-01 16:03:48 +08:00
-												feat(安全): 强化安全策略与配置校验

- 增加 CORS/CSP/安全响应头与代理信任配置

- 引入 URL 白名单与私网开关，校验上游与价格源

- 改善 API Key 处理与网关错误返回

- 管理端设置隐藏敏感字段并优化前端提示

- 增加计费熔断与相关配置示例

测试: go test ./...

											
										
										
											2026-01-02 17:40:57 +08:00
+								func (s *GatewayService) validateUpstreamBaseURL(raw string) (string, error) {
-												feat(安全): 添加安全开关并完善测试流程

实现安全开关默认关闭与响应头透传逻辑
- URL 校验与响应头过滤支持开关并覆盖流式路径
- 非流式 Content-Type 透传/默认值按配置生效
- 接入 go test、golangci-lint 与前端 lint/typecheck
- 补充相关测试与配置/文档说明

											
										
										
											2026-01-05 13:54:43 +08:00
+									if s.cfg != nil && !s.cfg.Security.URLAllowlist.Enabled {
-												fix(安全): 关闭白名单时保留最小校验与默认白名单

实现 allow_insecure_http 并在关闭校验时执行最小格式验证
- 关闭 allowlist 时要求 URL 可解析且 scheme 合规
- 响应头过滤关闭时使用默认白名单策略
- 更新相关文档、示例与测试覆盖

											
										
										
											2026-01-05 14:41:08 +08:00
+										normalized, err := urlvalidator.ValidateURLFormat(raw, s.cfg.Security.URLAllowlist.AllowInsecureHTTP)
 										if err != nil {
 											return "", fmt.Errorf("invalid base_url: %w", err)
 										}
 										return normalized, nil
-												feat(安全): 添加安全开关并完善测试流程

实现安全开关默认关闭与响应头透传逻辑
- URL 校验与响应头过滤支持开关并覆盖流式路径
- 非流式 Content-Type 透传/默认值按配置生效
- 接入 go test、golangci-lint 与前端 lint/typecheck
- 补充相关测试与配置/文档说明

											
										
										
											2026-01-05 13:54:43 +08:00
+									}
-												feat(安全): 强化安全策略与配置校验

- 增加 CORS/CSP/安全响应头与代理信任配置

- 引入 URL 白名单与私网开关，校验上游与价格源

- 改善 API Key 处理与网关错误返回

- 管理端设置隐藏敏感字段并优化前端提示

- 增加计费熔断与相关配置示例

测试: go test ./...

											
										
										
											2026-01-02 17:40:57 +08:00
+									normalized, err := urlvalidator.ValidateHTTPSURL(raw, urlvalidator.ValidationOptions{
 										AllowedHosts:     s.cfg.Security.URLAllowlist.UpstreamHosts,
 										RequireAllowlist: true,
 										AllowPrivate:     s.cfg.Security.URLAllowlist.AllowPrivateHosts,
 									})
 									if err != nil {
 										return "", fmt.Errorf("invalid base_url: %w", err)
 									}
 									return normalized, nil
 								}
-												merge: 合并 test 分支到 test-dev，解决冲突

解决的冲突文件：
- wire_gen.go: 合并 ConcurrencyService/CRSSyncService 参数和 userAttributeHandler
- gateway_handler.go: 合并 pkg/errors 和 antigravity 导入
- gateway_service.go: 合并 validateUpstreamBaseURL 和 GetAvailableModels
- config.example.yaml: 合并 billing/turnstile 配置和额外 gateway 选项

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>

											
										
										
											2026-01-03 11:36:31 +08:00
-												chore: apply stashed changes

											
										
										
											2026-02-02 22:20:08 +08:00
+								// checkAntigravityModelScope 检查 Antigravity 平台的模型系列是否在分组支持范围内
 								func (s *GatewayService) checkAntigravityModelScope(ctx context.Context, groupID int64, requestedModel string) error {
 									scope, ok := ResolveAntigravityQuotaScope(requestedModel)
 									if !ok {
 										return nil // 无法解析 scope，跳过检查
 									}
 									group, err := s.resolveGroupByID(ctx, groupID)
 									if err != nil {
 										return nil // 查询失败时放行
 									}
 									if group == nil {
 										return nil // 分组不存在时放行
 									}
 									if !IsScopeSupported(group.SupportedModelScopes, scope) {
 										return ErrModelScopeNotSupported
 									}
 									return nil
 								}
-												feat: 添加模型白名单选择器组件，同步 new-api 模型列表

- 新增 ModelWhitelistSelector.vue 支持模型白名单多选
- 新增 ModelIcon.vue 显示品牌图标（基于 @lobehub/icons）
- 新增 useModelWhitelist.ts 硬编码各平台模型列表
- 更新账号编辑表单支持模型白名单配置
- 支持 Claude/OpenAI/Gemini/智谱/百度/讯飞等主流平台

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>

											
										
										
											2026-01-01 16:03:48 +08:00
+								// GetAvailableModels returns the list of models available for a group
 								// It aggregates model_mapping keys from all schedulable accounts in the group
 								func (s *GatewayService) GetAvailableModels(ctx context.Context, groupID *int64, platform string) []string {
 									var accounts []Account
 									var err error
 									if groupID != nil {
 										accounts, err = s.accountRepo.ListSchedulableByGroupID(ctx, *groupID)
 									} else {
 										accounts, err = s.accountRepo.ListSchedulable(ctx)
 									}
 									if err != nil || len(accounts) == 0 {
 										return nil
 									}
 									// Filter by platform if specified
 									if platform != "" {
 										filtered := make([]Account, 0)
 										for _, acc := range accounts {
 											if acc.Platform == platform {
 												filtered = append(filtered, acc)
 											}
 										}
 										accounts = filtered
 									}
 									// Collect unique models from all accounts
 									modelSet := make(map[string]struct{})
 									hasAnyMapping := false
 									for _, acc := range accounts {
 										mapping := acc.GetModelMapping()
 										if len(mapping) > 0 {
 											hasAnyMapping = true
 											for model := range mapping {
 												modelSet[model] = struct{}{}
 											}
 										}
 									}
 									// If no account has model_mapping, return nil (use default)
 									if !hasAnyMapping {
 										return nil
 									}
 									// Convert to slice
 									models := make([]string, 0, len(modelSet))
 									for model := range modelSet {
 										models = append(models, model)
 									}
 									return models
 								}