backend/internal/service/openai_gateway_service.go

package service

import (
	"bufio"
	"bytes"
	"context"
	"crypto/sha256"
	"encoding/hex"
	"encoding/json"
	"errors"
	"fmt"
	"io"
	"log/slog"
	"math/rand"
	"net/http"
	"sort"
	"strconv"
	"strings"
	"sync"
	"sync/atomic"
	"time"

	"github.com/Wei-Shaw/sub2api/internal/config"
	"github.com/Wei-Shaw/sub2api/internal/pkg/apicompat"
	"github.com/Wei-Shaw/sub2api/internal/pkg/logger"
	"github.com/Wei-Shaw/sub2api/internal/pkg/openai"
	"github.com/Wei-Shaw/sub2api/internal/util/responseheaders"
	"github.com/Wei-Shaw/sub2api/internal/util/urlvalidator"
	"github.com/cespare/xxhash/v2"
	"github.com/gin-gonic/gin"
	"github.com/google/uuid"
	"github.com/tidwall/gjson"
	"github.com/tidwall/sjson"
	"go.uber.org/zap"
)

const (
	// chatgptCodexURL is the ChatGPT internal API endpoint for OAuth accounts.
	chatgptCodexURL = "https://chatgpt.com/backend-api/codex/responses"
	// openaiPlatformAPIURL is the OpenAI Platform API endpoint for API Key accounts (fallback).
	openaiPlatformAPIURL = "https://api.openai.com/v1/responses"
	// openaiStickySessionTTL is the sticky-session TTL.
	openaiStickySessionTTL = time.Hour
	// codexCLIVersion is the Codex CLI version string. codexCLIUserAgent is
	// derived from it so the two values cannot drift apart.
	codexCLIVersion = "0.125.0"
	// codexCLIUserAgent is the Codex CLI User-Agent value ("codex_cli_rs/<version>").
	codexCLIUserAgent = "codex_cli_rs/" + codexCLIVersion
	// codexCLIOnlyHeaderValueMaxBytes is the upper bound on the logged length
	// (in characters) of a single request header when codex_cli_only rejects a request.
	codexCLIOnlyHeaderValueMaxBytes = 256

	// OpenAIParsedRequestBodyKey caches the request body already parsed on the
	// handler side, to avoid parsing it again.
	OpenAIParsedRequestBodyKey = "openai_parsed_request_body"
	// openAIWSReconnectRetryLimit is the maximum number of reconnects after an
	// OpenAI WS Mode failure (not counting the first attempt).
	// Kept consistent with the Codex client: at most 5 reconnects after a failure.
	openAIWSReconnectRetryLimit = 5
	// openAIWSRetryBackoffInitialDefault is the default initial backoff for
	// OpenAI WS Mode reconnects (can be overridden by configuration).
	openAIWSRetryBackoffInitialDefault = 120 * time.Millisecond
	// openAIWSRetryBackoffMaxDefault is the default backoff cap for OpenAI WS
	// Mode reconnects (can be overridden by configuration).
	openAIWSRetryBackoffMaxDefault = 2 * time.Second
	// openAIWSRetryJitterRatioDefault is the default jitter ratio applied to the
	// reconnect backoff (can be overridden by configuration).
	openAIWSRetryJitterRatioDefault = 0.2
	// openAICompactSessionSeedKey is the key string "openai_compact_session_seed".
	// NOTE(review): its consumers are outside this view.
	openAICompactSessionSeedKey = "openai_compact_session_seed"
	// openAICodexSnapshotPersistMinInterval is the minimum interval between
	// persisted Codex limit snapshots. The snapshot is only used for admin
	// display / diagnostics, so it does not need to be written to the database
	// immediately after every successful request.
	openAICodexSnapshotPersistMinInterval = 30 * time.Second
)

// openaiAllowedHeaders is the request-header whitelist for the
// non-passthrough path. Keys are lowercase header names; a true value marks
// the header as allowed.
var openaiAllowedHeaders = map[string]bool{
	"accept-language":       true,
	"content-type":          true,
	"conversation_id":       true,
	"user-agent":            true,
	"originator":            true,
	"session_id":            true,
	"x-codex-turn-state":    true,
	"x-codex-turn-metadata": true,
}

// openaiPassthroughAllowedHeaders is the request-header whitelist for
// passthrough mode. Only these low-risk request headers are let through in
// passthrough mode, so that non-standard / environment-noise headers are not
// forwarded upstream where they could trigger risk controls.
// Keys are lowercase header names.
var openaiPassthroughAllowedHeaders = map[string]bool{
	"accept":                true,
	"accept-language":       true,
	"content-type":          true,
	"conversation_id":       true,
	"openai-beta":           true,
	"user-agent":            true,
	"originator":            true,
	"session_id":            true,
	"x-codex-turn-state":    true,
	"x-codex-turn-metadata": true,
}

// codexCLIOnlyDebugHeaderWhitelist lists the request headers recorded when
// codex_cli_only rejects a request. It is used for diagnostic logging only and
// plays no part in upstream passthrough.
var codexCLIOnlyDebugHeaderWhitelist = []string{
	"User-Agent",
	"Content-Type",
	"Accept",
	"Accept-Language",
	"OpenAI-Beta",
	"Originator",
	"Session_ID",
	"Conversation_ID",
	"X-Request-ID",
	"X-Client-Request-ID",
	"X-Forwarded-For",
	"X-Real-IP",
}

// OpenAICodexUsageSnapshot carries the Codex usage-limit figures for the
// "primary" and "secondary" rate-limit windows. Every numeric field is
// optional (nil when absent) and is dropped from JSON when unset.
type OpenAICodexUsageSnapshot struct {
	PrimaryUsedPercent          *float64 `json:"primary_used_percent,omitempty"`
	PrimaryResetAfterSeconds    *int     `json:"primary_reset_after_seconds,omitempty"`
	PrimaryWindowMinutes        *int     `json:"primary_window_minutes,omitempty"`
	SecondaryUsedPercent        *float64 `json:"secondary_used_percent,omitempty"`
	SecondaryResetAfterSeconds  *int     `json:"secondary_reset_after_seconds,omitempty"`
	SecondaryWindowMinutes      *int     `json:"secondary_window_minutes,omitempty"`
	PrimaryOverSecondaryPercent *float64 `json:"primary_over_secondary_percent,omitempty"`
	UpdatedAt                   string   `json:"updated_at,omitempty"`
}

// NormalizedCodexLimits is the canonical 5h/7d view of a usage snapshot.
// Fields are nil when the source snapshot did not provide the value.
type NormalizedCodexLimits struct {
	Used5hPercent   *float64
	Reset5hSeconds  *int
	Window5hMinutes *int
	Used7dPercent   *float64
	Reset7dSeconds  *int
	Window7dMinutes *int
}

// Normalize maps the primary/secondary fields onto the canonical 5h/7d fields.
//
// The window that counts as "5h" is chosen from the window_minutes values:
//   - both present: the strictly smaller window is 5h (on a tie primary is 7d);
//   - only one present: a window of at most 360 minutes is 5h, otherwise 7d,
//     and the other side takes the remaining slot;
//   - neither present: legacy assumption, primary is 7d and secondary is 5h.
//
// It returns nil only for a nil receiver; otherwise the result is non-nil even
// when every field in it is nil.
func (s *OpenAICodexUsageSnapshot) Normalize() *NormalizedCodexLimits {
	if s == nil {
		return nil
	}

	// Windows up to this many minutes (6h) are classified as the 5h window
	// when only one window length is known.
	const shortWindowMaxMinutes = 360

	// primaryIs5h reports whether the primary fields feed the 5h slot.
	var primaryIs5h bool
	switch primary, secondary := s.PrimaryWindowMinutes, s.SecondaryWindowMinutes; {
	case primary != nil && secondary != nil:
		primaryIs5h = *primary < *secondary
	case primary != nil:
		primaryIs5h = *primary <= shortWindowMaxMinutes
	case secondary != nil:
		// A long secondary window is 7d, which leaves 5h for primary.
		primaryIs5h = *secondary > shortWindowMaxMinutes
	default:
		primaryIs5h = false
	}

	if primaryIs5h {
		return &NormalizedCodexLimits{
			Used5hPercent:   s.PrimaryUsedPercent,
			Reset5hSeconds:  s.PrimaryResetAfterSeconds,
			Window5hMinutes: s.PrimaryWindowMinutes,
			Used7dPercent:   s.SecondaryUsedPercent,
			Reset7dSeconds:  s.SecondaryResetAfterSeconds,
			Window7dMinutes: s.SecondaryWindowMinutes,
		}
	}
	return &NormalizedCodexLimits{
		Used5hPercent:   s.SecondaryUsedPercent,
		Reset5hSeconds:  s.SecondaryResetAfterSeconds,
		Window5hMinutes: s.SecondaryWindowMinutes,
		Used7dPercent:   s.PrimaryUsedPercent,
		Reset7dSeconds:  s.PrimaryResetAfterSeconds,
		Window7dMinutes: s.PrimaryWindowMinutes,
	}
}

// OpenAIUsage represents OpenAI API response usage as token counts.
// The cache and image-output counters are omitted from JSON when zero;
// input_tokens and output_tokens are always serialized.
type OpenAIUsage struct {
	InputTokens              int `json:"input_tokens"`
	OutputTokens             int `json:"output_tokens"`
	CacheCreationInputTokens int `json:"cache_creation_input_tokens,omitempty"`
	CacheReadInputTokens     int `json:"cache_read_input_tokens,omitempty"`
	ImageOutputTokens        int `json:"image_output_tokens,omitempty"`
}

// OpenAIForwardResult represents the result of forwarding a request upstream:
// the request ID, token usage, the model names involved, and request/response
// metadata such as streaming mode, response headers and duration.
type OpenAIForwardResult struct {
	RequestID string
	Usage     OpenAIUsage
	Model     string // original model (used for responses and log display)
	// BillingModel is the model used for cost calculation.
	// When non-empty, CalculateCost uses this instead of Model.
	// This is set by the Anthropic Messages conversion path where
	// the mapped upstream model differs from the client-facing model.
	BillingModel string
	// UpstreamModel is the actual model sent to the upstream provider after mapping.
	// Empty when no mapping was applied (requested model was used as-is).
	UpstreamModel string
	// ServiceTier records the OpenAI Responses API service tier, e.g. "priority" / "flex".
	// Nil means the request did not specify a recognized tier.
	ServiceTier *string
	// ReasoningEffort is extracted from request body (reasoning.effort) or derived from model suffix.
	// Stored for usage records display; nil means not provided / not applicable.
	ReasoningEffort *string
	Stream          bool
	OpenAIWSMode    bool
	ResponseHeaders http.Header
	Duration        time.Duration
	FirstTokenMs    *int
	ImageCount      int
	ImageSize       string
}

// OpenAIWSRetryMetricsSnapshot is a JSON-serializable copy of the OpenAI WS
// retry counters: total retry attempts, accumulated backoff in milliseconds,
// retry-exhausted events, and non-retryable fast fallbacks.
type OpenAIWSRetryMetricsSnapshot struct {
	RetryAttemptsTotal            int64 `json:"retry_attempts_total"`
	RetryBackoffMsTotal           int64 `json:"retry_backoff_ms_total"`
	RetryExhaustedTotal           int64 `json:"retry_exhausted_total"`
	NonRetryableFastFallbackTotal int64 `json:"non_retryable_fast_fallback_total"`
}

// OpenAICompatibilityFallbackMetricsSnapshot is a JSON-serializable view of the
// legacy-compatibility fallback counters. The first group covers session-hash
// legacy reads / dual writes (plus the derived read hit rate); the second
// group holds one counter per request-metadata legacy fallback and their sum.
type OpenAICompatibilityFallbackMetricsSnapshot struct {
	SessionHashLegacyReadFallbackTotal int64   `json:"session_hash_legacy_read_fallback_total"`
	SessionHashLegacyReadFallbackHit   int64   `json:"session_hash_legacy_read_fallback_hit"`
	SessionHashLegacyDualWriteTotal    int64   `json:"session_hash_legacy_dual_write_total"`
	SessionHashLegacyReadHitRate       float64 `json:"session_hash_legacy_read_hit_rate"`

	MetadataLegacyFallbackIsMaxTokensOneHaikuTotal int64 `json:"metadata_legacy_fallback_is_max_tokens_one_haiku_total"`
	MetadataLegacyFallbackThinkingEnabledTotal     int64 `json:"metadata_legacy_fallback_thinking_enabled_total"`
	MetadataLegacyFallbackPrefetchedStickyAccount  int64 `json:"metadata_legacy_fallback_prefetched_sticky_account_total"`
	MetadataLegacyFallbackPrefetchedStickyGroup    int64 `json:"metadata_legacy_fallback_prefetched_sticky_group_total"`
	MetadataLegacyFallbackSingleAccountRetryTotal  int64 `json:"metadata_legacy_fallback_single_account_retry_total"`
	MetadataLegacyFallbackAccountSwitchCountTotal  int64 `json:"metadata_legacy_fallback_account_switch_count_total"`
	MetadataLegacyFallbackTotal                    int64 `json:"metadata_legacy_fallback_total"`
}

// openAIWSRetryMetrics holds the live OpenAI WS retry counters as atomic
// values so they can be incremented and read without additional locking.
type openAIWSRetryMetrics struct {
	retryAttempts            atomic.Int64
	retryBackoffMs           atomic.Int64
	retryExhausted           atomic.Int64
	nonRetryableFastFallback atomic.Int64
}

// accountWriteThrottle rate-limits writes per account ID: at most one write is
// allowed per minInterval for each ID. lastByID is guarded by mu.
type accountWriteThrottle struct {
	minInterval time.Duration
	mu          sync.Mutex
	lastByID    map[int64]time.Time
}

// newAccountWriteThrottle returns a throttle that permits one write per
// account every minInterval.
func newAccountWriteThrottle(minInterval time.Duration) *accountWriteThrottle {
	throttle := new(accountWriteThrottle)
	throttle.minInterval = minInterval
	throttle.lastByID = map[int64]time.Time{}
	return throttle
}

// Allow reports whether a write for account id may proceed at time now and,
// if so, records now as the account's latest write.
//
// A nil throttle, a non-positive id, or a non-positive interval always allows
// the write and records nothing.
func (t *accountWriteThrottle) Allow(id int64, now time.Time) bool {
	throttlingDisabled := t == nil || id <= 0 || t.minInterval <= 0
	if throttlingDisabled {
		return true
	}

	t.mu.Lock()
	defer t.mu.Unlock()

	previous, seen := t.lastByID[id]
	if seen && now.Sub(previous) < t.minInterval {
		return false
	}
	t.lastByID[id] = now

	// Once the table grows past this size, drop entries that are several
	// intervals old so the map does not keep growing with idle accounts.
	const pruneThreshold = 4096
	if len(t.lastByID) <= pruneThreshold {
		return true
	}
	staleBefore := now.Add(-4 * t.minInterval)
	for key, stamp := range t.lastByID {
		if stamp.Before(staleBefore) {
			delete(t.lastByID, key)
		}
	}
	return true
}

// defaultOpenAICodexSnapshotPersistThrottle is the package-level throttle for
// persisting Codex snapshots, built with openAICodexSnapshotPersistMinInterval.
// getCodexSnapshotThrottle falls back to it when a service has no throttle of
// its own.
var defaultOpenAICodexSnapshotPersistThrottle = newAccountWriteThrottle(openAICodexSnapshotPersistMinInterval)

// ErrNoAvailableCompactAccounts indicates the request needs /responses/compact
// support but no compatible account is available.
var ErrNoAvailableCompactAccounts = errors.New("no available OpenAI accounts support /responses/compact")

// OpenAIGatewayService handles OpenAI API gateway operations.
//
// The first field group holds the dependencies supplied to (or built by)
// NewOpenAIGatewayService. The remaining groups hold WebSocket-mode state:
// components paired with a sync.Once, the per-account WS fallback map, retry
// metrics, the response header filter, and the Codex snapshot write throttle.
type OpenAIGatewayService struct {
	accountRepo           AccountRepository
	usageLogRepo          UsageLogRepository
	usageBillingRepo      UsageBillingRepository
	userRepo              UserRepository
	userSubRepo           UserSubscriptionRepository
	cache                 GatewayCache
	cfg                   *config.Config
	codexDetector         CodexClientRestrictionDetector
	schedulerSnapshot     *SchedulerSnapshotService
	concurrencyService    *ConcurrencyService
	billingService        *BillingService
	rateLimitService      *RateLimitService
	billingCacheService   *BillingCacheService
	userGroupRateResolver *userGroupRateResolver
	httpUpstream          HTTPUpstream
	deferredService       *DeferredService
	openAITokenProvider   *OpenAITokenProvider
	toolCorrector         *CodexToolCorrector
	openaiWSResolver      OpenAIWSProtocolResolver
	resolver              *ModelPricingResolver
	channelService        *ChannelService
	balanceNotifyService  *BalanceNotifyService
	settingService        *SettingService

	// Components below are not set by the constructor; each has a matching
	// sync.Once. NOTE(review): presumably initialized lazily elsewhere in the
	// file — the initialization sites are outside this view.
	openaiWSPoolOnce              sync.Once
	openaiWSStateStoreOnce        sync.Once
	openaiSchedulerOnce           sync.Once
	openaiWSPassthroughDialerOnce sync.Once
	openaiWSPool                  *openAIWSConnPool
	openaiWSStateStore            OpenAIWSStateStore
	openaiScheduler               OpenAIAccountScheduler
	openaiWSPassthroughDialer     openAIWSClientDialer
	openaiAccountStats            *openAIAccountRuntimeStats

	// Runtime state: per-account WS fallback deadlines, retry counters, the
	// compiled response header filter, and the Codex snapshot write throttle.
	openaiWSFallbackUntil sync.Map // key: int64(accountID), value: time.Time
	openaiWSRetryMetrics  openAIWSRetryMetrics
	responseHeaderFilter  *responseheaders.CompiledHeaderFilter
	codexSnapshotThrottle *accountWriteThrottle
}

// NewOpenAIGatewayService wires up an OpenAIGatewayService from its
// dependencies. Besides storing the supplied collaborators it builds the
// config-derived helpers (Codex client detector, user-group rate resolver,
// tool corrector, WS protocol resolver, response header filter, snapshot
// throttle) and logs the OpenAI WS mode bootstrap settings before returning.
func NewOpenAIGatewayService(
	accountRepo AccountRepository,
	usageLogRepo UsageLogRepository,
	usageBillingRepo UsageBillingRepository,
	userRepo UserRepository,
	userSubRepo UserSubscriptionRepository,
	userGroupRateRepo UserGroupRateRepository,
	cache GatewayCache,
	cfg *config.Config,
	schedulerSnapshot *SchedulerSnapshotService,
	concurrencyService *ConcurrencyService,
	billingService *BillingService,
	rateLimitService *RateLimitService,
	billingCacheService *BillingCacheService,
	httpUpstream HTTPUpstream,
	deferredService *DeferredService,
	openAITokenProvider *OpenAITokenProvider,
	resolver *ModelPricingResolver,
	channelService *ChannelService,
	balanceNotifyService *BalanceNotifyService,
	settingService *SettingService,
) *OpenAIGatewayService {
	// Derived helpers are built up front, in the same order the struct fields
	// are declared below.
	detector := NewOpenAICodexClientRestrictionDetector(cfg)
	groupRateResolver := newUserGroupRateResolver(
		userGroupRateRepo,
		nil,
		resolveUserGroupRateCacheTTL(cfg),
		nil,
		"service.openai_gateway",
	)
	corrector := NewCodexToolCorrector()
	wsResolver := NewOpenAIWSProtocolResolver(cfg)
	headerFilter := compileResponseHeaderFilter(cfg)
	snapshotThrottle := newAccountWriteThrottle(openAICodexSnapshotPersistMinInterval)

	gateway := &OpenAIGatewayService{
		accountRepo:           accountRepo,
		usageLogRepo:          usageLogRepo,
		usageBillingRepo:      usageBillingRepo,
		userRepo:              userRepo,
		userSubRepo:           userSubRepo,
		cache:                 cache,
		cfg:                   cfg,
		codexDetector:         detector,
		schedulerSnapshot:     schedulerSnapshot,
		concurrencyService:    concurrencyService,
		billingService:        billingService,
		rateLimitService:      rateLimitService,
		billingCacheService:   billingCacheService,
		userGroupRateResolver: groupRateResolver,
		httpUpstream:          httpUpstream,
		deferredService:       deferredService,
		openAITokenProvider:   openAITokenProvider,
		toolCorrector:         corrector,
		openaiWSResolver:      wsResolver,
		resolver:              resolver,
		channelService:        channelService,
		balanceNotifyService:  balanceNotifyService,
		settingService:        settingService,
		responseHeaderFilter:  headerFilter,
		codexSnapshotThrottle: snapshotThrottle,
	}
	gateway.logOpenAIWSModeBootstrap()
	return gateway
}

// ResolveChannelMapping resolves the channel-level model mapping by delegating
// to ChannelService. Without a ChannelService the model is returned unchanged
// as the mapped model.
func (s *OpenAIGatewayService) ResolveChannelMapping(ctx context.Context, groupID int64, model string) ChannelMappingResult {
	if channels := s.channelService; channels != nil {
		return channels.ResolveChannelMapping(ctx, groupID, model)
	}
	return ChannelMappingResult{MappedModel: model}
}

// IsModelRestricted reports whether the model is restricted by the channel,
// delegating to ChannelService. Without a ChannelService nothing is restricted.
func (s *OpenAIGatewayService) IsModelRestricted(ctx context.Context, groupID int64, model string) bool {
	if channels := s.channelService; channels != nil {
		return channels.IsModelRestricted(ctx, groupID, model)
	}
	return false
}

// ResolveChannelMappingAndRestrict resolves the channel mapping by forwarding
// to ChannelService and returns whatever it reports. Without a ChannelService
// the model maps to itself and restricted is false.
// Per the original note, the model restriction check has moved to the
// scheduling stage, so restricted is expected to always be false.
func (s *OpenAIGatewayService) ResolveChannelMappingAndRestrict(ctx context.Context, groupID *int64, model string) (ChannelMappingResult, bool) {
	if channels := s.channelService; channels != nil {
		return channels.ResolveChannelMappingAndRestrict(ctx, groupID, model)
	}
	return ChannelMappingResult{MappedModel: model}, false
}

// checkChannelPricingRestriction reports whether the billing model derived
// from requestedModel is restricted for the group's channel. It returns false
// when there is no group, no ChannelService, no requested model, or no billing
// model could be determined.
func (s *OpenAIGatewayService) checkChannelPricingRestriction(ctx context.Context, groupID *int64, requestedModel string) bool {
	switch {
	case groupID == nil, s.channelService == nil, requestedModel == "":
		return false
	}

	channels, gid := s.channelService, *groupID
	mapping := channels.ResolveChannelMapping(ctx, gid, requestedModel)
	if billingModel := billingModelForRestriction(mapping.BillingModelSource, requestedModel, mapping.MappedModel); billingModel != "" {
		return channels.IsModelRestricted(ctx, gid, billingModel)
	}
	return false
}

// isUpstreamModelRestrictedByChannel resolves the upstream model the account
// would use for this request and reports whether the channel restricts it.
// It returns false without a ChannelService or when no upstream model resolves.
func (s *OpenAIGatewayService) isUpstreamModelRestrictedByChannel(ctx context.Context, groupID int64, account *Account, requestedModel string, requireCompact bool) bool {
	channels := s.channelService
	if channels == nil {
		return false
	}
	if resolved := resolveOpenAIAccountUpstreamModelForRequest(account, requestedModel, requireCompact); resolved != "" {
		return channels.IsModelRestricted(ctx, groupID, resolved)
	}
	return false
}

// needsUpstreamChannelRestrictionCheck reports whether the group's channel
// restricts models AND bills by the upstream model, i.e. whether restriction
// must be evaluated against the upstream model. Lookup failures are logged as
// warnings and treated as "no check needed".
func (s *OpenAIGatewayService) needsUpstreamChannelRestrictionCheck(ctx context.Context, groupID *int64) bool {
	if groupID == nil || s.channelService == nil {
		return false
	}

	channel, err := s.channelService.GetChannelForGroup(ctx, *groupID)
	switch {
	case err != nil:
		slog.Warn("failed to check openai channel upstream restriction", "group_id", *groupID, "error", err)
		return false
	case channel == nil:
		return false
	default:
		return channel.RestrictModels && channel.BillingModelSource == BillingModelSourceUpstream
	}
}

// ReplaceModelInBody replaces the JSON model field in the request body
// (generic gjson/sjson implementation). It is a thin method wrapper around the
// package-level ReplaceModelInBody function.
func (s *OpenAIGatewayService) ReplaceModelInBody(body []byte, newModel string) []byte {
	return ReplaceModelInBody(body, newModel)
}

// getCodexSnapshotThrottle returns the service's own Codex snapshot throttle,
// or the package-level default when the service (or its throttle) is nil.
func (s *OpenAIGatewayService) getCodexSnapshotThrottle() *accountWriteThrottle {
	if s == nil || s.codexSnapshotThrottle == nil {
		return defaultOpenAICodexSnapshotPersistThrottle
	}
	return s.codexSnapshotThrottle
}

// billingDeps bundles the service's account/user/subscription repositories and
// its billing cache, deferred and balance-notify services into a new
// billingDeps value.
func (s *OpenAIGatewayService) billingDeps() *billingDeps {
	return &billingDeps{
		accountRepo:          s.accountRepo,
		userRepo:             s.userRepo,
		userSubRepo:          s.userSubRepo,
		billingCacheService:  s.billingCacheService,
		deferredService:      s.deferredService,
		balanceNotifyService: s.balanceNotifyService,
	}
}

// CloseOpenAIWSPool shuts down the OpenAI WebSocket connection pool's
// background workers and idle connections. It should be called during
// graceful application shutdown. It is a no-op when the service or the pool
// is nil.
func (s *OpenAIGatewayService) CloseOpenAIWSPool() {
	if s == nil {
		return
	}
	if pool := s.openaiWSPool; pool != nil {
		pool.Close()
	}
}

// logOpenAIWSModeBootstrap logs the effective OpenAI WS mode configuration
// (feature switches, payload sampling, event flushing, prewarm cooldown, retry
// backoff/jitter/budget and the WS read limit) via logOpenAIWSModeInfo.
// It does nothing when the service or its config is nil.
func (s *OpenAIGatewayService) logOpenAIWSModeBootstrap() {
	if s == nil || s.cfg == nil {
		return
	}
	wsCfg := s.cfg.Gateway.OpenAIWS
	// The argument order below must match the verb order in the format string.
	logOpenAIWSModeInfo(
		"bootstrap enabled=%v oauth_enabled=%v apikey_enabled=%v force_http=%v responses_websockets_v2=%v responses_websockets=%v payload_log_sample_rate=%.3f event_flush_batch_size=%d event_flush_interval_ms=%d prewarm_cooldown_ms=%d retry_backoff_initial_ms=%d retry_backoff_max_ms=%d retry_jitter_ratio=%.3f retry_total_budget_ms=%d ws_read_limit_bytes=%d",
		wsCfg.Enabled,
		wsCfg.OAuthEnabled,
		wsCfg.APIKeyEnabled,
		wsCfg.ForceHTTP,
		wsCfg.ResponsesWebsocketsV2,
		wsCfg.ResponsesWebsockets,
		wsCfg.PayloadLogSampleRate,
		wsCfg.EventFlushBatchSize,
		wsCfg.EventFlushIntervalMS,
		wsCfg.PrewarmCooldownMS,
		wsCfg.RetryBackoffInitialMS,
		wsCfg.RetryBackoffMaxMS,
		wsCfg.RetryJitterRatio,
		wsCfg.RetryTotalBudgetMS,
		openAIWSMessageReadLimitBytes,
	)
}

// getCodexClientRestrictionDetector returns the configured Codex client
// restriction detector. When none is set (or the service is nil) a fresh
// detector is built from the service config, which is nil for a nil service.
func (s *OpenAIGatewayService) getCodexClientRestrictionDetector() CodexClientRestrictionDetector {
	if s == nil {
		return NewOpenAICodexClientRestrictionDetector(nil)
	}
	if detector := s.codexDetector; detector != nil {
		return detector
	}
	return NewOpenAICodexClientRestrictionDetector(s.cfg)
}

// getOpenAIWSProtocolResolver returns the configured WS protocol resolver.
// When none is set (or the service is nil) a fresh resolver is built from the
// service config, which is nil for a nil service.
func (s *OpenAIGatewayService) getOpenAIWSProtocolResolver() OpenAIWSProtocolResolver {
	if s == nil {
		return NewOpenAIWSProtocolResolver(nil)
	}
	if protocolResolver := s.openaiWSResolver; protocolResolver != nil {
		return protocolResolver
	}
	return NewOpenAIWSProtocolResolver(s.cfg)
}

// classifyOpenAIWSReconnectReason extracts the fallback reason from err and
// reports whether that reason is worth a reconnect attempt.
//
// It returns ("", false) when err is nil, is not an *openAIWSFallbackError, or
// carries a blank reason. Otherwise the trimmed reason is returned as-is
// (including any "prewarm_" prefix); the prefix is only stripped for the
// retryability lookup. Reasons not listed as retryable are non-retryable.
func classifyOpenAIWSReconnectReason(err error) (string, bool) {
	if err == nil {
		return "", false
	}
	var wsFallback *openAIWSFallbackError
	if matched := errors.As(err, &wsFallback); !matched || wsFallback == nil {
		return "", false
	}
	reason := strings.TrimSpace(wsFallback.Reason)
	if reason == "" {
		return "", false
	}

	switch strings.TrimPrefix(reason, "prewarm_") {
	case "read_event",
		"write_request",
		"write",
		"acquire_timeout",
		"acquire_conn",
		"conn_queue_full",
		"dial_failed",
		"upstream_5xx",
		"event_error",
		"error_event",
		"upstream_error_event",
		"ws_connection_limit_reached",
		"missing_final_response":
		// Transient transport / upstream conditions: retry.
		return reason, true
	case "policy_violation",
		"message_too_big",
		"upgrade_required",
		"ws_unsupported",
		"auth_failed",
		"invalid_encrypted_content",
		"previous_response_not_found":
		// Explicitly non-retryable reasons.
		return reason, false
	default:
		// Unknown reasons are not retried.
		return reason, false
	}
}

// resolveOpenAIWSFallbackErrorResponse turns a WS fallback error into the
// pieces of an HTTP error response.
//
// ok is false (and all other results are zero) when err is nil, is not an
// *openAIWSFallbackError, has a blank reason after trimming whitespace and the
// "prewarm_" prefix, or has an unrecognized reason with no upstream status.
//
// The status code comes from the wrapped dial error when that carries a
// positive status, otherwise from the per-reason default. The message is
// picked in this order: sanitized dial error text, the reason-specific message
// for invalid-request reasons, the sanitized text of the wrapped error, and
// finally a per-reason generic message. clientMessage always equals
// upstreamMessage.
func resolveOpenAIWSFallbackErrorResponse(err error) (statusCode int, errType string, clientMessage string, upstreamMessage string, ok bool) {
	var fallbackErr *openAIWSFallbackError
	if err == nil || !errors.As(err, &fallbackErr) || fallbackErr == nil {
		return 0, "", "", "", false
	}

	reason := strings.TrimPrefix(strings.TrimSpace(fallbackErr.Reason), "prewarm_")
	if reason == "" {
		return 0, "", "", "", false
	}

	// Prefer status and message reported by the upstream dial, when present.
	cause := fallbackErr.Err
	var dialErr *openAIWSDialError
	if cause != nil && errors.As(cause, &dialErr) && dialErr != nil {
		if dialErr.StatusCode > 0 {
			statusCode = dialErr.StatusCode
		}
		if dialErr.Err != nil {
			upstreamMessage = sanitizeUpstreamErrorMessage(strings.TrimSpace(dialErr.Err.Error()))
		}
	}

	// Per-reason presets.
	var (
		defaultStatus     int
		preferredMessage  string                      // wins over the wrapped error text
		lastResortMessage = "Upstream request failed" // used only if nothing else is available
		knownReason       = true
	)
	switch reason {
	case "invalid_encrypted_content":
		defaultStatus = http.StatusBadRequest
		errType = "invalid_request_error"
		preferredMessage = "encrypted content could not be verified"
	case "previous_response_not_found":
		defaultStatus = http.StatusBadRequest
		errType = "invalid_request_error"
		preferredMessage = "previous response not found"
	case "upgrade_required":
		defaultStatus = http.StatusUpgradeRequired
		lastResortMessage = "upstream websocket upgrade required"
	case "ws_unsupported":
		defaultStatus = http.StatusBadRequest
		lastResortMessage = "upstream websocket not supported"
	case "auth_failed":
		defaultStatus = http.StatusUnauthorized
		lastResortMessage = "upstream authentication failed"
	case "upstream_rate_limited":
		defaultStatus = http.StatusTooManyRequests
		lastResortMessage = "upstream rate limit exceeded, please retry later"
	default:
		knownReason = false
	}

	if statusCode == 0 {
		if !knownReason {
			// Nothing to build a response from.
			return 0, "", "", "", false
		}
		statusCode = defaultStatus
	}

	if upstreamMessage == "" {
		upstreamMessage = preferredMessage
	}
	if upstreamMessage == "" && cause != nil {
		upstreamMessage = sanitizeUpstreamErrorMessage(strings.TrimSpace(cause.Error()))
	}
	if upstreamMessage == "" {
		upstreamMessage = lastResortMessage
	}

	if errType == "" {
		errType = "upstream_error"
		if statusCode == http.StatusTooManyRequests {
			errType = "rate_limit_error"
		}
	}
	return statusCode, errType, upstreamMessage, upstreamMessage, true
}

// writeOpenAIWSFallbackErrorResponse writes a JSON error response derived from
// a WS fallback error and records it as an ops upstream error.
//
// It returns false without writing anything when the context or writer is nil,
// a response has already been written, or the error cannot be resolved into a
// response; otherwise it writes the response and returns true.
func (s *OpenAIGatewayService) writeOpenAIWSFallbackErrorResponse(c *gin.Context, account *Account, wsErr error) bool {
	if c == nil || c.Writer == nil || c.Writer.Written() {
		return false
	}

	status, kind, clientMsg, upstreamMsg, resolved := resolveOpenAIWSFallbackErrorResponse(wsErr)
	if !resolved {
		return false
	}
	// Guarantee non-blank messages for both the client and the ops record.
	if strings.TrimSpace(clientMsg) == "" {
		clientMsg = "Upstream request failed"
	}
	if strings.TrimSpace(upstreamMsg) == "" {
		upstreamMsg = clientMsg
	}

	setOpsUpstreamError(c, status, upstreamMsg, "")
	if account != nil {
		event := OpsUpstreamErrorEvent{
			Platform:           account.Platform,
			AccountID:          account.ID,
			AccountName:        account.Name,
			UpstreamStatusCode: status,
			Kind:               "ws_error",
			Message:            upstreamMsg,
		}
		appendOpsUpstreamError(c, event)
	}

	errorBody := gin.H{
		"type":    kind,
		"message": clientMsg,
	}
	c.JSON(status, gin.H{"error": errorBody})
	return true
}

// openAIWSRetryBackoff returns the delay to wait before reconnect number
// attempt (1-based): exponential backoff starting at the initial delay,
// doubling per attempt, capped at the maximum, with symmetric random jitter.
//
// The initial delay, cap and jitter ratio come from the package defaults and
// are overridden by positive (non-negative for jitter) values in the service
// config. A non-positive attempt or a non-positive initial delay yields 0.
// With jitter ratio r the result lies in [backoff*(1-r), backoff*(1+r)];
// r is clamped to at most 1 and r <= 0 disables jitter.
//
// The doubling saturates at the cap instead of computing initial<<(attempt-1)
// directly, so very large attempt values cannot overflow and wrap to a zero
// or negative delay.
func (s *OpenAIGatewayService) openAIWSRetryBackoff(attempt int) time.Duration {
	if attempt <= 0 {
		return 0
	}

	initial := openAIWSRetryBackoffInitialDefault
	maxBackoff := openAIWSRetryBackoffMaxDefault
	jitterRatio := openAIWSRetryJitterRatioDefault
	if s != nil && s.cfg != nil {
		wsCfg := s.cfg.Gateway.OpenAIWS
		if wsCfg.RetryBackoffInitialMS > 0 {
			initial = time.Duration(wsCfg.RetryBackoffInitialMS) * time.Millisecond
		}
		if wsCfg.RetryBackoffMaxMS > 0 {
			maxBackoff = time.Duration(wsCfg.RetryBackoffMaxMS) * time.Millisecond
		}
		if wsCfg.RetryJitterRatio >= 0 {
			jitterRatio = wsCfg.RetryJitterRatio
		}
	}
	if initial <= 0 {
		return 0
	}
	// The cap can never be below the initial delay (this also covers a
	// non-positive cap, since initial is positive here).
	if maxBackoff < initial {
		maxBackoff = initial
	}
	if jitterRatio > 1 {
		jitterRatio = 1
	}

	// Double once per attempt after the first, saturating at maxBackoff.
	// Checking against maxBackoff/2 before doubling keeps the multiplication
	// from ever exceeding the cap, and therefore from overflowing.
	backoff := initial
	for i := 1; i < attempt && backoff < maxBackoff; i++ {
		if backoff > maxBackoff/2 {
			backoff = maxBackoff
			break
		}
		backoff *= 2
	}

	if jitterRatio <= 0 {
		return backoff
	}
	jitter := time.Duration(float64(backoff) * jitterRatio)
	if jitter <= 0 {
		return backoff
	}
	// delta is uniformly distributed in [-jitter, +jitter].
	delta := time.Duration(rand.Int63n(int64(jitter)*2+1)) - jitter
	withJitter := backoff + delta
	if withJitter < 0 {
		return 0
	}
	return withJitter
}

// openAIWSRetryTotalBudget returns the configured total retry budget as a
// duration. It returns 0 when the service or config is nil, or when the
// configured RetryTotalBudgetMS is not positive.
func (s *OpenAIGatewayService) openAIWSRetryTotalBudget() time.Duration {
	if s == nil || s.cfg == nil {
		return 0
	}
	if budgetMS := s.cfg.Gateway.OpenAIWS.RetryTotalBudgetMS; budgetMS > 0 {
		return time.Duration(budgetMS) * time.Millisecond
	}
	return 0
}

// recordOpenAIWSRetryAttempt counts one retry attempt and, for a positive
// backoff, adds its length in milliseconds to the accumulated backoff total.
// It is a no-op on a nil service.
func (s *OpenAIGatewayService) recordOpenAIWSRetryAttempt(backoff time.Duration) {
	if s == nil {
		return
	}
	counters := &s.openaiWSRetryMetrics
	counters.retryAttempts.Add(1)
	if backoff <= 0 {
		return
	}
	counters.retryBackoffMs.Add(backoff.Milliseconds())
}

// recordOpenAIWSRetryExhausted increments the retry-exhausted counter.
// It is a no-op on a nil service.
func (s *OpenAIGatewayService) recordOpenAIWSRetryExhausted() {
	if s != nil {
		s.openaiWSRetryMetrics.retryExhausted.Add(1)
	}
}

// recordOpenAIWSNonRetryableFastFallback increments the counter of
// non-retryable fast fallbacks. It is a no-op on a nil service.
func (s *OpenAIGatewayService) recordOpenAIWSNonRetryableFastFallback() {
	if s != nil {
		s.openaiWSRetryMetrics.nonRetryableFastFallback.Add(1)
	}
}

// SnapshotOpenAIWSRetryMetrics returns the current values of the OpenAI WS
// retry counters. Each counter is loaded atomically on its own; a nil service
// yields a zero snapshot.
func (s *OpenAIGatewayService) SnapshotOpenAIWSRetryMetrics() OpenAIWSRetryMetricsSnapshot {
	var snapshot OpenAIWSRetryMetricsSnapshot
	if s == nil {
		return snapshot
	}
	counters := &s.openaiWSRetryMetrics
	snapshot.RetryAttemptsTotal = counters.retryAttempts.Load()
	snapshot.RetryBackoffMsTotal = counters.retryBackoffMs.Load()
	snapshot.RetryExhaustedTotal = counters.retryExhausted.Load()
	snapshot.NonRetryableFastFallbackTotal = counters.nonRetryableFastFallback.Load()
	return snapshot
}

// SnapshotOpenAICompatibilityFallbackMetrics collects the sticky-session
// compatibility counters and the request-metadata fallback counters into one
// snapshot. The read hit rate is hit/total (0 when there were no legacy reads)
// and the metadata total is the sum of the six metadata counters.
func SnapshotOpenAICompatibilityFallbackMetrics() OpenAICompatibilityFallbackMetricsSnapshot {
	readTotal, readHit, dualWrite := openAIStickyCompatStats()
	haiku, thinking, stickyAccount, stickyGroup, singleRetry, switchCount := RequestMetadataFallbackStats()

	var snapshot OpenAICompatibilityFallbackMetricsSnapshot

	snapshot.SessionHashLegacyReadFallbackTotal = readTotal
	snapshot.SessionHashLegacyReadFallbackHit = readHit
	snapshot.SessionHashLegacyDualWriteTotal = dualWrite
	if readTotal > 0 {
		snapshot.SessionHashLegacyReadHitRate = float64(readHit) / float64(readTotal)
	}

	snapshot.MetadataLegacyFallbackIsMaxTokensOneHaikuTotal = haiku
	snapshot.MetadataLegacyFallbackThinkingEnabledTotal = thinking
	snapshot.MetadataLegacyFallbackPrefetchedStickyAccount = stickyAccount
	snapshot.MetadataLegacyFallbackPrefetchedStickyGroup = stickyGroup
	snapshot.MetadataLegacyFallbackSingleAccountRetryTotal = singleRetry
	snapshot.MetadataLegacyFallbackAccountSwitchCountTotal = switchCount
	snapshot.MetadataLegacyFallbackTotal = haiku + thinking + stickyAccount + stickyGroup + singleRetry + switchCount

	return snapshot
}

// detectCodexClientRestriction runs the Codex client restriction detector
// (obtained via getCodexClientRestrictionDetector, which tolerates a nil
// service) against the request context and account and returns its result.
func (s *OpenAIGatewayService) detectCodexClientRestriction(c *gin.Context, account *Account) CodexClientRestrictionDetectionResult {
	return s.getCodexClientRestrictionDetector().Detect(c, account)
}

// getAPIKeyIDFromContext returns the ID of the *APIKey stored under the
// "api_key" key of the gin context. It returns 0 when the context is nil, the
// key is missing, or the stored value is not a non-nil *APIKey.
func getAPIKeyIDFromContext(c *gin.Context) int64 {
	if c == nil {
		return 0
	}
	stored, found := c.Get("api_key")
	if !found {
		return 0
	}
	if key, isAPIKey := stored.(*APIKey); isAPIKey && key != nil {
		return key.ID
	}
	return 0
}

// isolateOpenAISessionID mixes apiKeyID into a session identifier so that
// users of different API keys reach upstream with different identifiers even
// when they send the same raw session_id/conversation_id, preventing
// cross-user session collisions.
//
// The result is the 64-bit xxhash of "k<apiKeyID>:<raw>" rendered as 16
// zero-padded lowercase hex digits. raw is trimmed first; a blank raw value
// yields "".
func isolateOpenAISessionID(apiKeyID int64, raw string) string {
	sessionID := strings.TrimSpace(raw)
	if sessionID == "" {
		return ""
	}
	digest := xxhash.New()
	// Writes to the hash never fail; the returned error is deliberately ignored.
	_, _ = digest.WriteString(fmt.Sprintf("k%d:", apiKeyID) + sessionID)
	return fmt.Sprintf("%016x", digest.Sum64())
}

// logCodexCLIOnlyDetection emits a warning log when codex_cli_only is enabled
// and the request did NOT match an official Codex client. Nothing is logged
// when the restriction is disabled or the client matched.
//
// The log carries the account ID, the detection result, the API key ID (when
// positive) and the request details added by
// appendCodexCLIOnlyRejectedRequestFields. A nil ctx is replaced with
// context.Background().
func logCodexCLIOnlyDetection(ctx context.Context, c *gin.Context, account *Account, apiKeyID int64, result CodexClientRestrictionDetectionResult, body []byte) {
	// Bail out before building any log fields: only rejected requests are
	// logged, so matched requests should not pay for field/logger construction.
	if !result.Enabled || result.Matched {
		return
	}
	if ctx == nil {
		ctx = context.Background()
	}

	var accountID int64
	if account != nil {
		accountID = account.ID
	}
	fields := []zap.Field{
		zap.String("component", "service.openai_gateway"),
		zap.Int64("account_id", accountID),
		zap.Bool("codex_cli_only_enabled", result.Enabled),
		zap.Bool("codex_official_client_match", result.Matched),
		zap.String("reject_reason", result.Reason),
	}
	if apiKeyID > 0 {
		fields = append(fields, zap.Int64("api_key_id", apiKeyID))
	}
	fields = appendCodexCLIOnlyRejectedRequestFields(fields, c, body)

	logger.FromContext(ctx).With(fields...).Warn("OpenAI codex_cli_only 拒绝非官方客户端请求")
}

// appendCodexCLIOnlyRejectedRequestFields appends diagnostic request details
// to fields and returns the extended slice: method, path, query, host, client
// IP, remote address, User-Agent, Content-Type, content length, the stream
// flag, the model (when present), a hash of the prompt cache key (when
// present), the whitelisted header snapshot (when non-empty) and the body
// size. fields is returned unchanged when c or c.Request is nil.
func appendCodexCLIOnlyRejectedRequestFields(fields []zap.Field, c *gin.Context, body []byte) []zap.Field {
	if c == nil || c.Request == nil {
		return fields
	}

	request := c.Request
	model, stream, cacheKey := extractOpenAIRequestMetaFromBody(body)
	trimmedHeader := func(name string) string {
		return strings.TrimSpace(request.Header.Get(name))
	}

	fields = append(fields,
		zap.String("request_method", strings.TrimSpace(request.Method)),
		zap.String("request_path", strings.TrimSpace(request.URL.Path)),
		zap.String("request_query", strings.TrimSpace(request.URL.RawQuery)),
		zap.String("request_host", strings.TrimSpace(request.Host)),
		zap.String("request_client_ip", strings.TrimSpace(c.ClientIP())),
		zap.String("request_remote_addr", strings.TrimSpace(request.RemoteAddr)),
		zap.String("request_user_agent", trimmedHeader("User-Agent")),
		zap.String("request_content_type", trimmedHeader("Content-Type")),
		zap.Int64("request_content_length", request.ContentLength),
		zap.Bool("request_stream", stream),
	)
	if model != "" {
		fields = append(fields, zap.String("request_model", model))
	}
	if cacheKey != "" {
		// The prompt cache key is logged only as a hash, never in clear text.
		fields = append(fields, zap.String("request_prompt_cache_key_sha256", hashSensitiveValueForLog(cacheKey)))
	}

	headerSnapshot := snapshotCodexCLIOnlyHeaders(request.Header)
	if len(headerSnapshot) > 0 {
		fields = append(fields, zap.Any("request_headers", headerSnapshot))
	}
	return append(fields, zap.Int("request_body_size", len(body)))
}

// snapshotCodexCLIOnlyHeaders copies the whitelisted debug headers out of
// header into a map keyed by lowercase header name. Values are trimmed, blank
// values are skipped, and each value is passed through truncateString with
// codexCLIOnlyHeaderValueMaxBytes. It returns nil for an empty header set and
// an empty (non-nil) map when no whitelisted header has a value.
func snapshotCodexCLIOnlyHeaders(header http.Header) map[string]string {
	if len(header) == 0 {
		return nil
	}
	snapshot := make(map[string]string, len(codexCLIOnlyDebugHeaderWhitelist))
	for i := range codexCLIOnlyDebugHeaderWhitelist {
		name := codexCLIOnlyDebugHeaderWhitelist[i]
		if value := strings.TrimSpace(header.Get(name)); value != "" {
			snapshot[strings.ToLower(name)] = truncateString(value, codexCLIOnlyHeaderValueMaxBytes)
		}
	}
	return snapshot
}

// hashSensitiveValueForLog returns a short, log-safe fingerprint of raw: the
// first 8 bytes of the SHA-256 of the trimmed value, hex-encoded (16 hex
// digits). A blank value yields "".
func hashSensitiveValueForLog(raw string) string {
	trimmed := strings.TrimSpace(raw)
	if trimmed == "" {
		return ""
	}
	// Only a prefix of the digest is kept; this is enough to correlate log
	// lines without logging the value itself.
	const fingerprintBytes = 8
	digest := sha256.Sum256([]byte(trimmed))
	return hex.EncodeToString(digest[:fingerprintBytes])
}

// logOpenAIInstructionsRequiredDebug emits a warning with request diagnostics
// when the upstream response is recognised by isOpenAIInstructionsRequiredError.
//
// It is a no-op for any other upstream response. A nil ctx is replaced with
// context.Background(); a nil account or nil gin context simply results in
// zero-valued account / header attributes.
func logOpenAIInstructionsRequiredDebug(
	ctx context.Context,
	c *gin.Context,
	account *Account,
	upstreamStatusCode int,
	upstreamMsg string,
	requestBody []byte,
	upstreamBody []byte,
) {
	trimmedMsg := strings.TrimSpace(upstreamMsg)
	if !isOpenAIInstructionsRequiredError(upstreamStatusCode, trimmedMsg, upstreamBody) {
		return
	}
	if ctx == nil {
		ctx = context.Background()
	}

	var (
		accountID   int64
		accountName string
		userAgent   string
		originator  string
	)
	if account != nil {
		accountID, accountName = account.ID, strings.TrimSpace(account.Name)
	}
	if c != nil {
		userAgent = strings.TrimSpace(c.GetHeader("User-Agent"))
		originator = strings.TrimSpace(c.GetHeader("originator"))
	}

	officialClient := openai.IsCodexOfficialClientByHeaders(userAgent, originator)
	fields := appendCodexCLIOnlyRejectedRequestFields([]zap.Field{
		zap.String("component", "service.openai_gateway"),
		zap.Int64("account_id", accountID),
		zap.String("account_name", accountName),
		zap.Int("upstream_status_code", upstreamStatusCode),
		zap.String("upstream_error_message", trimmedMsg),
		zap.String("request_user_agent", userAgent),
		zap.Bool("codex_official_client_match", officialClient),
	}, c, requestBody)

	logger.FromContext(ctx).With(fields...).Warn("OpenAI 上游返回 Instructions are required，已记录请求详情用于排查")
}

// isOpenAIInstructionsRequiredError reports whether an upstream 400 response
// indicates that the request is missing the "instructions" parameter.
//
// Only http.StatusBadRequest responses are considered. A response matches when
// any of the following holds:
//   - upstreamMsg mentions both "instruction" and "required" (case-insensitive);
//   - the JSON body's error.message mentions both words;
//   - the JSON body's error.param equals "instructions";
//   - the JSON body's error.code contains "missing_required_parameter" and
//     error.message mentions "instructions".
//
// The two-word test covers every known upstream phrasing, e.g.
// "Instructions are required", "required parameter: 'instructions'",
// "required parameter: instructions" and
// "missing required parameter ... instructions". Separate checks for those
// phrases (and for error.type "invalid_request") were implied by this test and
// have been folded into it; the result is unchanged for every input.
func isOpenAIInstructionsRequiredError(upstreamStatusCode int, upstreamMsg string, upstreamBody []byte) bool {
	if upstreamStatusCode != http.StatusBadRequest {
		return false
	}

	mentionsRequiredInstructions := func(text string) bool {
		lower := strings.ToLower(text)
		return strings.Contains(lower, "instruction") && strings.Contains(lower, "required")
	}

	if mentionsRequiredInstructions(upstreamMsg) {
		return true
	}
	if len(upstreamBody) == 0 {
		return false
	}

	errMsg := gjson.GetBytes(upstreamBody, "error.message").String()
	if mentionsRequiredInstructions(errMsg) {
		return true
	}

	errParam := strings.ToLower(strings.TrimSpace(gjson.GetBytes(upstreamBody, "error.param").String()))
	if errParam == "instructions" {
		return true
	}

	// The message may name the parameter without the word "required" when the
	// error code already carries that meaning.
	errCode := strings.ToLower(strings.TrimSpace(gjson.GetBytes(upstreamBody, "error.code").String()))
	return strings.Contains(errCode, "missing_required_parameter") &&
		strings.Contains(strings.ToLower(errMsg), "instructions")
}

// isOpenAITransientProcessingError reports whether an upstream 400 response
// carries the generic "error while processing your request" text.
//
// Only http.StatusBadRequest responses are considered. The text is looked for,
// case-insensitively, in upstreamMsg, then in the body's error.message, and
// finally in the raw body. A text matches when it contains
// "an error occurred while processing your request", or when it contains all
// of "you can retry your request", "help.openai.com" and "request id".
func isOpenAITransientProcessingError(upstreamStatusCode int, upstreamMsg string, upstreamBody []byte) bool {
	if upstreamStatusCode != http.StatusBadRequest {
		return false
	}

	looksTransient := func(text string) bool {
		normalized := strings.ToLower(strings.TrimSpace(text))
		switch {
		case normalized == "":
			return false
		case strings.Contains(normalized, "an error occurred while processing your request"):
			return true
		}
		// Fallback: all three retry-hint markers must be present.
		for _, marker := range []string{"you can retry your request", "help.openai.com", "request id"} {
			if !strings.Contains(normalized, marker) {
				return false
			}
		}
		return true
	}

	switch {
	case looksTransient(upstreamMsg):
		return true
	case len(upstreamBody) == 0:
		return false
	case looksTransient(gjson.GetBytes(upstreamBody, "error.message").String()):
		return true
	default:
		return looksTransient(string(upstreamBody))
	}
}

// ExtractSessionID extracts the raw session ID from headers or body without hashing.
// Used by ForwardAsAnthropic to pass as prompt_cache_key for upstream cache.
//
// Lookup order is the session_id header, the conversation_id header, then the
// body's prompt_cache_key; each value is whitespace-trimmed. It returns "" when
// c is nil or no signal is present. The lookup is shared with the session-hash
// generators through explicitOpenAISessionID so the two cannot drift apart.
func (s *OpenAIGatewayService) ExtractSessionID(c *gin.Context, body []byte) string {
	return explicitOpenAISessionID(c, body)
}

// explicitOpenAISessionID returns the first non-empty explicit session signal
// supplied by the client, whitespace-trimmed.
//
// Signals are consulted in order: the session_id header, the conversation_id
// header, then the prompt_cache_key field of the JSON body. It returns "" when
// c is nil or none of the signals is present.
func explicitOpenAISessionID(c *gin.Context, body []byte) string {
	if c == nil {
		return ""
	}

	for _, headerName := range []string{"session_id", "conversation_id"} {
		if value := strings.TrimSpace(c.GetHeader(headerName)); value != "" {
			return value
		}
	}

	if len(body) == 0 {
		return ""
	}
	return strings.TrimSpace(gjson.GetBytes(body, "prompt_cache_key").String())
}

// GenerateExplicitSessionHash derives a sticky-session hash strictly from
// explicit client session signals (see explicitOpenAISessionID). Unlike
// GenerateSessionHash it has no content-derived fallback, which makes it
// suitable for stateless endpoints such as /v1/images.
//
// It returns "" when no explicit signal exists. Otherwise the legacy hash is
// attached to the gin context and the current hash is returned.
func (s *OpenAIGatewayService) GenerateExplicitSessionHash(c *gin.Context, body []byte) string {
	if explicitID := explicitOpenAISessionID(c, body); explicitID != "" {
		hash, legacy := deriveOpenAISessionHashes(explicitID)
		attachOpenAILegacySessionHashToGin(c, legacy)
		return hash
	}
	return ""
}

// GenerateSessionHash produces the sticky-session hash for an OpenAI request.
//
// The seed is taken from the first available source:
//  1. Header: session_id
//  2. Header: conversation_id
//  3. Body:   prompt_cache_key (opencode)
//  4. Body:   content-based fallback (model + system + tools + first user message)
//
// It returns "" when c is nil or no seed can be obtained. Otherwise the legacy
// hash is attached to the gin context and the current hash is returned.
func (s *OpenAIGatewayService) GenerateSessionHash(c *gin.Context, body []byte) string {
	if c == nil {
		return ""
	}

	seed := explicitOpenAISessionID(c, body)
	if seed == "" {
		// No explicit signal: fall back to a seed derived from the body, if any.
		if len(body) == 0 {
			return ""
		}
		if seed = deriveOpenAIContentSessionSeed(body); seed == "" {
			return ""
		}
	}

	hash, legacy := deriveOpenAISessionHashes(seed)
	attachOpenAILegacySessionHashToGin(c, legacy)
	return hash
}

// GenerateSessionHashWithFallback first tries the regular session signals via
// GenerateSessionHash. When that yields nothing, it derives a stable hash from
// the whitespace-trimmed fallbackSeed instead.
//
// Used by WS ingress so that requests lacking session signals do not drift
// across accounts. Returns "" when neither source provides a seed.
func (s *OpenAIGatewayService) GenerateSessionHashWithFallback(c *gin.Context, body []byte, fallbackSeed string) string {
	if hash := s.GenerateSessionHash(c, body); hash != "" {
		return hash
	}

	trimmedSeed := strings.TrimSpace(fallbackSeed)
	if trimmedSeed == "" {
		return ""
	}

	hash, legacy := deriveOpenAISessionHashes(trimmedSeed)
	attachOpenAILegacySessionHashToGin(c, legacy)
	return hash
}

// resolveOpenAIUpstreamOriginator chooses the originator value to send
// upstream. A non-empty (trimmed) client "originator" header wins; otherwise
// official clients get "codex_cli_rs" and everything else gets "opencode".
func resolveOpenAIUpstreamOriginator(c *gin.Context, isOfficialClient bool) string {
	clientOriginator := ""
	if c != nil {
		clientOriginator = strings.TrimSpace(c.GetHeader("originator"))
	}

	switch {
	case clientOriginator != "":
		return clientOriginator
	case isOfficialClient:
		return "codex_cli_rs"
	default:
		return "opencode"
	}
}

// BindStickySession records the session -> account binding.
//
// The binding lives for openaiStickySessionTTL unless the configuration
// provides a positive Gateway.OpenAIWS.StickySessionTTLSeconds, which then
// takes precedence. An empty sessionHash or a non-positive accountID is a
// no-op that returns nil.
func (s *OpenAIGatewayService) BindStickySession(ctx context.Context, groupID *int64, sessionHash string, accountID int64) error {
	if sessionHash == "" || accountID <= 0 {
		return nil
	}

	bindingTTL := openaiStickySessionTTL
	if s != nil && s.cfg != nil {
		if seconds := s.cfg.Gateway.OpenAIWS.StickySessionTTLSeconds; seconds > 0 {
			bindingTTL = time.Duration(seconds) * time.Second
		}
	}
	return s.setStickySessionAccountID(ctx, groupID, sessionHash, accountID, bindingTTL)
}

// SelectAccount picks an OpenAI account with sticky-session support and no
// model constraint. It is shorthand for SelectAccountForModel with an empty
// model name.
func (s *OpenAIGatewayService) SelectAccount(ctx context.Context, groupID *int64, sessionHash string) (*Account, error) {
	const anyModel = ""
	return s.SelectAccountForModel(ctx, groupID, sessionHash, anyModel)
}

// SelectAccountForModel picks an account that supports requestedModel. It is
// shorthand for SelectAccountForModelWithExclusions with no excluded accounts.
func (s *OpenAIGatewayService) SelectAccountForModel(ctx context.Context, groupID *int64, sessionHash string, requestedModel string) (*Account, error) {
	var noExclusions map[int64]struct{}
	return s.SelectAccountForModelWithExclusions(ctx, groupID, sessionHash, requestedModel, noExclusions)
}

// SelectAccountForModelWithExclusions picks an account that supports
// requestedModel while skipping every account whose ID is in excludedIDs.
// Compact support is not required and no sticky account ID is pre-supplied.
func (s *OpenAIGatewayService) SelectAccountForModelWithExclusions(ctx context.Context, groupID *int64, sessionHash string, requestedModel string, excludedIDs map[int64]struct{}) (*Account, error) {
	const (
		requireCompact  = false
		stickyAccountID = int64(0)
	)
	return s.selectAccountForModelWithExclusions(ctx, groupID, sessionHash, requestedModel, excludedIDs, requireCompact, stickyAccountID)
}

// noAvailableOpenAISelectionError returns the error reported when account
// selection comes up empty.
//
// compactBlocked takes precedence and yields ErrNoAvailableCompactAccounts.
// Otherwise the message names requestedModel when one was given.
func noAvailableOpenAISelectionError(requestedModel string, compactBlocked bool) error {
	switch {
	case compactBlocked:
		return ErrNoAvailableCompactAccounts
	case requestedModel == "":
		return errors.New("no available OpenAI accounts")
	default:
		return fmt.Errorf("no available OpenAI accounts supporting model: %s", requestedModel)
	}
}

// openAICompactSupportTier ranks an account by its compact capability:
//
//	0 = explicitly unsupported (also used for nil or non-OpenAI accounts)
//	1 = unknown / not yet probed
//	2 = explicitly supported
func openAICompactSupportTier(account *Account) int {
	if account == nil || !account.IsOpenAI() {
		return 0
	}

	switch supported, known := account.OpenAICompactSupportKnown(); {
	case !known:
		return 1
	case supported:
		return 2
	default:
		return 0
	}
}

// isOpenAIAccountEligibleForRequest is the single place where the
// schedulable / OpenAI / model / compact-support checks for account selection
// are applied.
//
// The model check is skipped for an empty requestedModel; the compact check
// (tier must be non-zero) is skipped unless requireCompact is set.
func isOpenAIAccountEligibleForRequest(account *Account, requestedModel string, requireCompact bool) bool {
	if account == nil {
		return false
	}
	if schedulableOpenAI := account.IsSchedulable() && account.IsOpenAI(); !schedulableOpenAI {
		return false
	}
	if requestedModel != "" && !account.IsModelSupported(requestedModel) {
		return false
	}
	return !requireCompact || openAICompactSupportTier(account) != 0
}

// prioritizeOpenAICompactAccounts returns a new slice in which accounts with
// known compact support come first, then accounts of unknown support, then
// the remaining (unsupported) ones. Order inside each group follows the input.
// An empty input yields nil.
func prioritizeOpenAICompactAccounts(accounts []*Account) []*Account {
	if len(accounts) == 0 {
		return nil
	}

	// Bucket index 0 holds tier 2, index 1 holds tier 1, index 2 everything else.
	var buckets [3][]*Account
	for i := range buckets {
		buckets[i] = make([]*Account, 0, len(accounts))
	}
	for _, acc := range accounts {
		slot := 2
		switch openAICompactSupportTier(acc) {
		case 2:
			slot = 0
		case 1:
			slot = 1
		}
		buckets[slot] = append(buckets[slot], acc)
	}

	ordered := make([]*Account, 0, len(accounts))
	for _, bucket := range buckets {
		ordered = append(ordered, bucket...)
	}
	return ordered
}

// resolveOpenAIAccountUpstreamModelForRequest returns the model name that
// would be sent upstream for this account and request.
//
// The forward model is resolved first; when it is empty, "" is returned. For
// requests on the /responses/compact path (requireCompact) the forward model
// is additionally passed through the compact-specific mapping.
func resolveOpenAIAccountUpstreamModelForRequest(account *Account, requestedModel string, requireCompact bool) string {
	forwardModel := resolveOpenAIForwardModel(account, requestedModel, "")
	if forwardModel != "" && requireCompact {
		return resolveOpenAICompactForwardModel(account, forwardModel)
	}
	return forwardModel
}

// selectAccountForModelWithExclusions selects one account for the request
// without consulting load information.
//
// Steps: reject when channel pricing restricts the model; reuse the sticky
// account when it is still usable; otherwise list schedulable accounts, pick
// the best by priority + LRU, bind it to the session (best effort) and return
// the hydrated account.
func (s *OpenAIGatewayService) selectAccountForModelWithExclusions(ctx context.Context, groupID *int64, sessionHash string, requestedModel string, excludedIDs map[int64]struct{}, requireCompact bool, stickyAccountID int64) (*Account, error) {
	if s.checkChannelPricingRestriction(ctx, groupID, requestedModel) {
		slog.Warn("channel pricing restriction blocked request",
			"group_id", derefGroupID(groupID),
			"model", requestedModel)
		return nil, fmt.Errorf("%w supporting model: %s (channel pricing restriction)", ErrNoAvailableAccounts, requestedModel)
	}

	// Step 1: sticky session hit.
	if sticky := s.tryStickySessionHit(ctx, groupID, sessionHash, requestedModel, excludedIDs, requireCompact, stickyAccountID); sticky != nil {
		return sticky, nil
	}

	// Step 2: load the schedulable OpenAI accounts.
	pool, err := s.listSchedulableAccounts(ctx, groupID)
	if err != nil {
		return nil, fmt.Errorf("query accounts failed: %w", err)
	}

	// Step 3: choose by priority + LRU.
	best, compactBlocked := s.selectBestAccount(ctx, groupID, pool, requestedModel, excludedIDs, requireCompact)
	if best == nil {
		return nil, noAvailableOpenAISelectionError(requestedModel, compactBlocked)
	}

	// Step 4: remember the choice for this session; a failed bind is ignored.
	if sessionHash != "" {
		_ = s.setStickySessionAccountID(ctx, groupID, sessionHash, best.ID, openaiStickySessionTTL)
	}

	return s.hydrateSelectedAccount(ctx, best)
}

// tryStickySessionHit tries to serve the request from the account bound to
// the sticky session.
//
// It returns the account when the binding exists and the account is usable
// for this request, refreshing the binding's TTL. It returns nil otherwise;
// the binding is deleted when shouldClearStickySession says so, when the
// recheck rejects the account, or when the channel restricts the upstream
// model. A positive stickyAccountID is used as the bound account ID instead of
// looking it up.
func (s *OpenAIGatewayService) tryStickySessionHit(ctx context.Context, groupID *int64, sessionHash, requestedModel string, excludedIDs map[int64]struct{}, requireCompact bool, stickyAccountID int64) *Account {
	if sessionHash == "" {
		return nil
	}

	boundID := stickyAccountID
	if boundID <= 0 {
		lookedUp, err := s.getStickySessionAccountID(ctx, groupID, sessionHash)
		if err != nil || lookedUp <= 0 {
			return nil
		}
		boundID = lookedUp
	}
	if _, skip := excludedIDs[boundID]; skip {
		return nil
	}

	bound, err := s.getSchedulableAccount(ctx, boundID)
	if err != nil {
		return nil
	}

	// dropBinding removes the session binding (best effort) and reports a miss.
	dropBinding := func() *Account {
		_ = s.deleteStickySessionAccountID(ctx, groupID, sessionHash)
		return nil
	}

	if shouldClearStickySession(bound, requestedModel) {
		return dropBinding()
	}

	// Compact support is not checked on this copy; the recheck below applies
	// requireCompact.
	if !isOpenAIAccountEligibleForRequest(bound, requestedModel, false) {
		return nil
	}
	bound = s.recheckSelectedOpenAIAccountFromDB(ctx, bound, requestedModel, requireCompact)
	if bound == nil {
		return dropBinding()
	}
	if groupID != nil && s.needsUpstreamChannelRestrictionCheck(ctx, groupID) &&
		s.isUpstreamModelRestrictedByChannel(ctx, *groupID, bound, requestedModel, requireCompact) {
		return dropBinding()
	}

	// Hit: extend the binding's lifetime (best effort).
	_ = s.refreshStickySessionTTL(ctx, groupID, sessionHash, openaiStickySessionTTL)
	return bound
}

// selectBestAccount picks the best account among accounts (priority + LRU).
//
// The first result is nil when no account qualifies. The second result
// reports whether at least one candidate was dropped solely because it lacks
// compact support; it is only meaningful when requireCompact is true.
//
// With requireCompact, a higher compact tier always beats a lower one and
// priority/LRU only break ties inside the same tier.
func (s *OpenAIGatewayService) selectBestAccount(ctx context.Context, groupID *int64, accounts []Account, requestedModel string, excludedIDs map[int64]struct{}, requireCompact bool) (*Account, bool) {
	var (
		best           *Account
		bestTier       = -1
		compactBlocked bool
	)
	checkUpstream := s.needsUpstreamChannelRestrictionCheck(ctx, groupID)

	for idx := range accounts {
		candidate := &accounts[idx]
		if _, skip := excludedIDs[candidate.ID]; skip {
			continue
		}

		// Refresh the candidate and re-validate it; compact support is
		// evaluated separately below so that it can be reported.
		fresh := s.resolveFreshSchedulableOpenAIAccount(ctx, candidate, requestedModel, false)
		if fresh != nil {
			fresh = s.recheckSelectedOpenAIAccountFromDB(ctx, fresh, requestedModel, false)
		}
		if fresh == nil {
			continue
		}
		if checkUpstream && s.isUpstreamModelRestrictedByChannel(ctx, *groupID, fresh, requestedModel, requireCompact) {
			continue
		}

		tier := 0
		if requireCompact {
			if tier = openAICompactSupportTier(fresh); tier == 0 {
				compactBlocked = true
				continue
			}
		}

		switch {
		case best == nil:
			best, bestTier = fresh, tier
		case requireCompact && tier != bestTier:
			// Different tiers: only a strictly higher tier replaces the pick.
			if tier > bestTier {
				best, bestTier = fresh, tier
			}
		case s.isBetterAccount(fresh, best):
			best, bestTier = fresh, tier
		}
	}

	return best, compactBlocked
}

// isBetterAccount reports whether candidate should replace current.
//
// A lower Priority value wins. At equal priority, an account that has never
// been used beats one that has; two never-used accounts keep the current pick;
// otherwise the account used longest ago wins.
func (s *OpenAIGatewayService) isBetterAccount(candidate, current *Account) bool {
	if candidate.Priority != current.Priority {
		return candidate.Priority < current.Priority
	}

	// Same priority: decide on the last-used timestamps.
	if candidate.LastUsedAt == nil {
		// A never-used candidate wins only against a used current.
		return current.LastUsedAt != nil
	}
	if current.LastUsedAt == nil {
		return false
	}
	return candidate.LastUsedAt.Before(*current.LastUsedAt)
}

// SelectAccountWithLoadAwareness picks an account taking current load into
// account and, when no slot could be acquired, returns a wait plan. Compact
// support is not required.
func (s *OpenAIGatewayService) SelectAccountWithLoadAwareness(ctx context.Context, groupID *int64, sessionHash string, requestedModel string, excludedIDs map[int64]struct{}) (*AccountSelectionResult, error) {
	const requireCompact = false
	return s.selectAccountWithLoadAwareness(ctx, groupID, sessionHash, requestedModel, excludedIDs, requireCompact)
}

// selectAccountWithLoadAwareness selects an OpenAI account for a request and
// tries to acquire a concurrency slot on it.
//
// The result either carries an acquired slot (Acquired=true plus ReleaseFunc)
// or a WaitPlan describing how the caller may wait for the chosen account.
//
// Flow:
//   - A channel pricing restriction on requestedModel aborts with an error
//     wrapping ErrNoAvailableAccounts.
//   - When there is no concurrency service or load batching is disabled, the
//     account is chosen by selectAccountForModelWithExclusions and a slot is
//     attempted on it.
//   - Otherwise three layers run in order: sticky session, load-aware
//     selection, fallback wait.
//
// When requireCompact is set and nothing could be selected, the error is
// ErrNoAvailableCompactAccounts; otherwise ErrNoAvailableAccounts.
//
// NOTE(review): *groupID is dereferenced wherever needsUpstreamCheck is true;
// this presumably relies on needsUpstreamChannelRestrictionCheck returning
// false for a nil groupID — confirm.
func (s *OpenAIGatewayService) selectAccountWithLoadAwareness(ctx context.Context, groupID *int64, sessionHash string, requestedModel string, excludedIDs map[int64]struct{}, requireCompact bool) (*AccountSelectionResult, error) {
	if s.checkChannelPricingRestriction(ctx, groupID, requestedModel) {
		slog.Warn("channel pricing restriction blocked request",
			"group_id", derefGroupID(groupID),
			"model", requestedModel)
		return nil, fmt.Errorf("%w supporting model: %s (channel pricing restriction)", ErrNoAvailableAccounts, requestedModel)
	}

	cfg := s.schedulingConfig()
	needsUpstreamCheck := s.needsUpstreamChannelRestrictionCheck(ctx, groupID)
	// Look up the sticky binding once; a lookup error leaves stickyAccountID at 0.
	var stickyAccountID int64
	if sessionHash != "" && s.cache != nil {
		if accountID, err := s.getStickySessionAccountID(ctx, groupID, sessionHash); err == nil {
			stickyAccountID = accountID
		}
	}
	// Simple path: no load information is available or wanted.
	if s.concurrencyService == nil || !cfg.LoadBatchEnabled {
		account, err := s.selectAccountForModelWithExclusions(ctx, groupID, sessionHash, requestedModel, excludedIDs, requireCompact, stickyAccountID)
		if err != nil {
			return nil, err
		}
		result, err := s.tryAcquireAccountSlot(ctx, account.ID, account.Concurrency)
		if err == nil && result.Acquired {
			return s.newSelectionResult(ctx, account, true, result.ReleaseFunc, nil)
		}
		// No slot: the sticky account gets the sticky wait settings as long as
		// its waiting queue is below the sticky limit.
		if stickyAccountID > 0 && stickyAccountID == account.ID && s.concurrencyService != nil {
			waitingCount, _ := s.concurrencyService.GetAccountWaitingCount(ctx, account.ID)
			if waitingCount < cfg.StickySessionMaxWaiting {
				return s.newSelectionResult(ctx, account, false, nil, &AccountWaitPlan{
					AccountID:      account.ID,
					MaxConcurrency: account.Concurrency,
					Timeout:        cfg.StickySessionWaitTimeout,
					MaxWaiting:     cfg.StickySessionMaxWaiting,
				})
			}
		}
		// Otherwise wait with the fallback settings.
		return s.newSelectionResult(ctx, account, false, nil, &AccountWaitPlan{
			AccountID:      account.ID,
			MaxConcurrency: account.Concurrency,
			Timeout:        cfg.FallbackWaitTimeout,
			MaxWaiting:     cfg.FallbackMaxWaiting,
		})
	}

	accounts, err := s.listSchedulableAccounts(ctx, groupID)
	if err != nil {
		return nil, err
	}
	if len(accounts) == 0 {
		return nil, ErrNoAvailableAccounts
	}

	// isExcluded reports whether the caller asked to skip accountID.
	isExcluded := func(accountID int64) bool {
		if excludedIDs == nil {
			return false
		}
		_, excluded := excludedIDs[accountID]
		return excluded
	}

	// ============ Layer 1: Sticky session ============
	// Any outcome other than "slot acquired" or "sticky wait plan" falls
	// through to layer 2.
	if sessionHash != "" {
		accountID := stickyAccountID
		if accountID > 0 && !isExcluded(accountID) {
			account, err := s.getSchedulableAccount(ctx, accountID)
			if err == nil {
				clearSticky := shouldClearStickySession(account, requestedModel)
				if clearSticky {
					_ = s.deleteStickySessionAccountID(ctx, groupID, sessionHash)
				}
				// Compact support is not checked on this copy; the recheck
				// below applies requireCompact.
				if !clearSticky && isOpenAIAccountEligibleForRequest(account, requestedModel, false) {
					account = s.recheckSelectedOpenAIAccountFromDB(ctx, account, requestedModel, requireCompact)
					if account == nil {
						_ = s.deleteStickySessionAccountID(ctx, groupID, sessionHash)
					} else if needsUpstreamCheck && s.isUpstreamModelRestrictedByChannel(ctx, *groupID, account, requestedModel, requireCompact) {
						_ = s.deleteStickySessionAccountID(ctx, groupID, sessionHash)
					} else {
						result, err := s.tryAcquireAccountSlot(ctx, accountID, account.Concurrency)
						if err == nil && result.Acquired {
							_ = s.refreshStickySessionTTL(ctx, groupID, sessionHash, openaiStickySessionTTL)
							return s.newSelectionResult(ctx, account, true, result.ReleaseFunc, nil)
						}

						// Sticky account is busy: wait on it unless its queue
						// already reached the sticky limit.
						waitingCount, _ := s.concurrencyService.GetAccountWaitingCount(ctx, accountID)
						if waitingCount < cfg.StickySessionMaxWaiting {
							return s.newSelectionResult(ctx, account, false, nil, &AccountWaitPlan{
								AccountID:      accountID,
								MaxConcurrency: account.Concurrency,
								Timeout:        cfg.StickySessionWaitTimeout,
								MaxWaiting:     cfg.StickySessionMaxWaiting,
							})
						}
					}
				}
			}
		}
	}

	// ============ Layer 2: Load-aware selection ============
	// baseCandidateCount is incremented together with candidates, so it always
	// equals len(candidates).
	baseCandidateCount := 0
	candidates := make([]*Account, 0, len(accounts))
	for i := range accounts {
		acc := &accounts[i]
		if isExcluded(acc.ID) {
			continue
		}
		// Scheduler snapshots can be temporarily stale (bucket rebuild is throttled);
		// re-check schedulability here so recently rate-limited/overloaded accounts
		// are not selected again before the bucket is rebuilt.
		if !acc.IsSchedulable() {
			continue
		}
		if requestedModel != "" && !acc.IsModelSupported(requestedModel) {
			continue
		}
		if needsUpstreamCheck && s.isUpstreamModelRestrictedByChannel(ctx, *groupID, acc, requestedModel, requireCompact) {
			continue
		}
		baseCandidateCount++
		candidates = append(candidates, acc)
	}

	if len(candidates) == 0 {
		return nil, ErrNoAvailableAccounts
	}

	accountLoads := make([]AccountWithConcurrency, 0, len(candidates))
	for _, acc := range candidates {
		accountLoads = append(accountLoads, AccountWithConcurrency{
			ID:             acc.ID,
			MaxConcurrency: acc.EffectiveLoadFactor(),
		})
	}

	loadMap, err := s.concurrencyService.GetAccountsLoadBatch(ctx, accountLoads)
	if err != nil {
		// Load lookup failed: try candidates in priority / last-used order
		// (compact tiers first when required) and take the first free slot.
		ordered := append([]*Account(nil), candidates...)
		sortAccountsByPriorityAndLastUsed(ordered, false)
		if requireCompact {
			ordered = prioritizeOpenAICompactAccounts(ordered)
		}
		for _, acc := range ordered {
			fresh := s.resolveFreshSchedulableOpenAIAccount(ctx, acc, requestedModel, false)
			if fresh == nil {
				continue
			}
			fresh = s.recheckSelectedOpenAIAccountFromDB(ctx, fresh, requestedModel, requireCompact)
			if fresh == nil {
				continue
			}
			if needsUpstreamCheck && s.isUpstreamModelRestrictedByChannel(ctx, *groupID, fresh, requestedModel, requireCompact) {
				continue
			}
			result, err := s.tryAcquireAccountSlot(ctx, fresh.ID, fresh.Concurrency)
			if err == nil && result.Acquired {
				if sessionHash != "" {
					_ = s.setStickySessionAccountID(ctx, groupID, sessionHash, fresh.ID, openaiStickySessionTTL)
				}
				return s.newSelectionResult(ctx, fresh, true, result.ReleaseFunc, nil)
			}
		}
	} else {
		// Keep only candidates whose load rate is below 100; a candidate
		// missing from loadMap is treated as having a zero-valued load.
		var available []accountWithLoad
		for _, acc := range candidates {
			loadInfo := loadMap[acc.ID]
			if loadInfo == nil {
				loadInfo = &AccountLoadInfo{AccountID: acc.ID}
			}
			if loadInfo.LoadRate < 100 {
				available = append(available, accountWithLoad{
					account:  acc,
					loadInfo: loadInfo,
				})
			}
		}

		if len(available) > 0 {
			// Order: priority (lower first), then load rate (lower first),
			// then never-used before used, then least recently used.
			sort.SliceStable(available, func(i, j int) bool {
				a, b := available[i], available[j]
				if a.account.Priority != b.account.Priority {
					return a.account.Priority < b.account.Priority
				}
				if a.loadInfo.LoadRate != b.loadInfo.LoadRate {
					return a.loadInfo.LoadRate < b.loadInfo.LoadRate
				}
				switch {
				case a.account.LastUsedAt == nil && b.account.LastUsedAt != nil:
					return true
				case a.account.LastUsedAt != nil && b.account.LastUsedAt == nil:
					return false
				case a.account.LastUsedAt == nil && b.account.LastUsedAt == nil:
					return false
				default:
					return a.account.LastUsedAt.Before(*b.account.LastUsedAt)
				}
			})
			shuffleWithinSortGroups(available)

			selectionOrder := make([]accountWithLoad, 0, len(available))
			if requireCompact {
				// appendTier appends, in their current order, the available
				// entries whose compact tier equals tier.
				appendTier := func(out []accountWithLoad, tier int) []accountWithLoad {
					for _, item := range available {
						if openAICompactSupportTier(item.account) == tier {
							out = append(out, item)
						}
					}
					return out
				}
				selectionOrder = appendTier(selectionOrder, 2)
				selectionOrder = appendTier(selectionOrder, 1)
				// Tier-0 candidates are appended as a last resort: if the DB
				// recheck finds that a cached tier-0 account has actually been
				// upgraded to tier 1/2 (a probe just finished and the cache has
				// not been refreshed yet), it can still be selected.
				selectionOrder = appendTier(selectionOrder, 0)
			} else {
				selectionOrder = append(selectionOrder, available...)
			}

			for _, item := range selectionOrder {
				fresh := s.resolveFreshSchedulableOpenAIAccount(ctx, item.account, requestedModel, false)
				if fresh == nil {
					continue
				}
				fresh = s.recheckSelectedOpenAIAccountFromDB(ctx, fresh, requestedModel, requireCompact)
				if fresh == nil {
					continue
				}
				if needsUpstreamCheck && s.isUpstreamModelRestrictedByChannel(ctx, *groupID, fresh, requestedModel, requireCompact) {
					continue
				}
				result, err := s.tryAcquireAccountSlot(ctx, fresh.ID, fresh.Concurrency)
				if err == nil && result.Acquired {
					if sessionHash != "" {
						_ = s.setStickySessionAccountID(ctx, groupID, sessionHash, fresh.ID, openaiStickySessionTTL)
					}
					return s.newSelectionResult(ctx, fresh, true, result.ReleaseFunc, nil)
				}
			}
		}
	}

	// ============ Layer 3: Fallback wait ============
	// No slot could be acquired: return a wait plan for the first candidate
	// that still passes the freshness, recheck and channel checks.
	sortAccountsByPriorityAndLastUsed(candidates, false)
	if requireCompact {
		candidates = prioritizeOpenAICompactAccounts(candidates)
	}
	for _, acc := range candidates {
		fresh := s.resolveFreshSchedulableOpenAIAccount(ctx, acc, requestedModel, false)
		if fresh == nil {
			continue
		}
		fresh = s.recheckSelectedOpenAIAccountFromDB(ctx, fresh, requestedModel, requireCompact)
		if fresh == nil {
			continue
		}
		if needsUpstreamCheck && s.isUpstreamModelRestrictedByChannel(ctx, *groupID, fresh, requestedModel, requireCompact) {
			continue
		}
		return s.newSelectionResult(ctx, fresh, false, nil, &AccountWaitPlan{
			AccountID:      fresh.ID,
			MaxConcurrency: fresh.Concurrency,
			Timeout:        cfg.FallbackWaitTimeout,
			MaxWaiting:     cfg.FallbackMaxWaiting,
		})
	}

	// The empty-candidates case returned earlier, so baseCandidateCount is
	// positive whenever this point is reached.
	if requireCompact && baseCandidateCount > 0 {
		return nil, ErrNoAvailableCompactAccounts
	}
	return nil, ErrNoAvailableAccounts
}

// listSchedulableAccounts returns the schedulable OpenAI accounts for groupID.
//
// The scheduler snapshot is used when configured (its error is returned
// as-is). Otherwise the repository is queried: all platform accounts in
// simple run mode, the group's accounts when groupID is set, and ungrouped
// accounts when it is nil. Repository errors are wrapped with
// "query accounts failed".
func (s *OpenAIGatewayService) listSchedulableAccounts(ctx context.Context, groupID *int64) ([]Account, error) {
	if s.schedulerSnapshot != nil {
		accounts, _, err := s.schedulerSnapshot.ListSchedulableAccounts(ctx, groupID, PlatformOpenAI, false)
		return accounts, err
	}

	var (
		accounts []Account
		err      error
	)
	switch {
	case s.cfg != nil && s.cfg.RunMode == config.RunModeSimple:
		accounts, err = s.accountRepo.ListSchedulableByPlatform(ctx, PlatformOpenAI)
	case groupID != nil:
		accounts, err = s.accountRepo.ListSchedulableByGroupIDAndPlatform(ctx, *groupID, PlatformOpenAI)
	default:
		accounts, err = s.accountRepo.ListSchedulableUngroupedByPlatform(ctx, PlatformOpenAI)
	}
	if err != nil {
		return nil, fmt.Errorf("query accounts failed: %w", err)
	}
	return accounts, nil
}

// tryAcquireAccountSlot asks the concurrency service for a slot on accountID.
// Without a concurrency service every request is treated as acquired and the
// returned ReleaseFunc is a no-op.
func (s *OpenAIGatewayService) tryAcquireAccountSlot(ctx context.Context, accountID int64, maxConcurrency int) (*AcquireResult, error) {
	if svc := s.concurrencyService; svc != nil {
		return svc.AcquireAccountSlot(ctx, accountID, maxConcurrency)
	}
	return &AcquireResult{Acquired: true, ReleaseFunc: func() {}}, nil
}

// resolveFreshSchedulableOpenAIAccount returns an up-to-date copy of account
// if it is still eligible for the request, or nil otherwise.
//
// With a scheduler snapshot configured the account is re-read through
// getSchedulableAccount (a failed or empty read yields nil); without one the
// given account is validated as-is.
func (s *OpenAIGatewayService) resolveFreshSchedulableOpenAIAccount(ctx context.Context, account *Account, requestedModel string, requireCompact bool) *Account {
	if account == nil {
		return nil
	}

	if s.schedulerSnapshot != nil {
		current, err := s.getSchedulableAccount(ctx, account.ID)
		if err != nil || current == nil {
			return nil
		}
		account = current
	}

	if isOpenAIAccountEligibleForRequest(account, requestedModel, requireCompact) {
		return account
	}
	return nil
}

// recheckSelectedOpenAIAccountFromDB re-validates account against the account
// repository before it is used.
//
// When both a scheduler snapshot and an account repository are configured, the
// account is re-read via accountRepo.GetByID and that record is validated and
// returned. Otherwise the given account itself is validated. nil is returned
// when the read fails or the record is not eligible for the request.
func (s *OpenAIGatewayService) recheckSelectedOpenAIAccountFromDB(ctx context.Context, account *Account, requestedModel string, requireCompact bool) *Account {
	if account == nil {
		return nil
	}

	subject := account
	if s.schedulerSnapshot != nil && s.accountRepo != nil {
		latest, err := s.accountRepo.GetByID(ctx, account.ID)
		if err != nil || latest == nil {
			return nil
		}
		subject = latest
	}

	if !isOpenAIAccountEligibleForRequest(subject, requestedModel, requireCompact) {
		return nil
	}
	return subject
}

// getSchedulableAccount loads the account with the given ID from the
// scheduler snapshot when one is configured, and from the account repository
// otherwise.
//
// The lookup's result is returned unchanged, so callers must be prepared for a
// nil account alongside a nil error if the underlying lookup can produce that.
func (s *OpenAIGatewayService) getSchedulableAccount(ctx context.Context, accountID int64) (*Account, error) {
	if s.schedulerSnapshot != nil {
		return s.schedulerSnapshot.GetAccount(ctx, accountID)
	}
	return s.accountRepo.GetByID(ctx, accountID)
}

// hydrateSelectedAccount re-reads the selected account from the scheduler
// snapshot so the caller receives the snapshot's record for it.
//
// A nil account, or a service without a scheduler snapshot, returns the input
// unchanged. A lookup error is returned as-is; a missing record produces a
// "not found during hydration" error.
func (s *OpenAIGatewayService) hydrateSelectedAccount(ctx context.Context, account *Account) (*Account, error) {
	if account == nil || s.schedulerSnapshot == nil {
		return account, nil
	}

	hydrated, err := s.schedulerSnapshot.GetAccount(ctx, account.ID)
	switch {
	case err != nil:
		return nil, err
	case hydrated == nil:
		return nil, fmt.Errorf("selected openai account %d not found during hydration", account.ID)
	}
	return hydrated, nil
}

// newSelectionResult hydrates account and wraps it, together with the slot
// state and optional wait plan, in an AccountSelectionResult. A hydration
// error is returned without a result.
func (s *OpenAIGatewayService) newSelectionResult(ctx context.Context, account *Account, acquired bool, release func(), waitPlan *AccountWaitPlan) (*AccountSelectionResult, error) {
	selection := &AccountSelectionResult{
		Acquired:    acquired,
		ReleaseFunc: release,
		WaitPlan:    waitPlan,
	}

	var err error
	if selection.Account, err = s.hydrateSelectedAccount(ctx, account); err != nil {
		return nil, err
	}
	return selection, nil
}

// schedulingConfig returns the gateway scheduling settings from the service
// configuration, or built-in defaults when no configuration is attached.
func (s *OpenAIGatewayService) schedulingConfig() config.GatewaySchedulingConfig {
	if s.cfg == nil {
		defaults := config.GatewaySchedulingConfig{
			StickySessionMaxWaiting:  3,
			StickySessionWaitTimeout: 45 * time.Second,
			FallbackWaitTimeout:      30 * time.Second,
			FallbackMaxWaiting:       100,
			LoadBatchEnabled:         true,
			SlotCleanupInterval:      30 * time.Second,
		}
		return defaults
	}
	return s.cfg.Gateway.Scheduling
}

// GetAccessToken returns the credential used to call upstream on behalf of
// account, together with its kind.
//
// Returns (token, kind, err) where kind is "oauth" for OAuth accounts and
// "apikey" for API-key accounts. For OAuth accounts the token provider is used
// when configured; otherwise the token stored on the account is read directly.
// An error is returned when account is nil, the credential is missing, the
// token provider fails, or the account type is unsupported.
func (s *OpenAIGatewayService) GetAccessToken(ctx context.Context, account *Account) (string, string, error) {
	// Guard against a nil account instead of panicking on account.Type.
	if account == nil {
		return "", "", errors.New("account is nil")
	}

	switch account.Type {
	case AccountTypeOAuth:
		// Prefer the token provider, which serves cached tokens.
		if s.openAITokenProvider != nil {
			accessToken, err := s.openAITokenProvider.GetAccessToken(ctx, account)
			if err != nil {
				return "", "", err
			}
			return accessToken, "oauth", nil
		}
		// Fallback: no token provider configured, read the token from the account.
		accessToken := account.GetOpenAIAccessToken()
		if accessToken == "" {
			return "", "", errors.New("access_token not found in credentials")
		}
		return accessToken, "oauth", nil
	case AccountTypeAPIKey:
		apiKey := account.GetOpenAIApiKey()
		if apiKey == "" {
			return "", "", errors.New("api_key not found in credentials")
		}
		return apiKey, "apikey", nil
	default:
		return "", "", fmt.Errorf("unsupported account type: %s", account.Type)
	}
}

// shouldFailoverUpstreamError reports whether an upstream HTTP status should
// trigger failover: any status of 500 or above (which includes 529), plus
// 401, 402, 403 and 429.
func (s *OpenAIGatewayService) shouldFailoverUpstreamError(statusCode int) bool {
	if statusCode >= 500 {
		return true
	}
	switch statusCode {
	case 401, 402, 403, 429:
		return true
	}
	return false
}

// shouldFailoverOpenAIUpstreamResponse reports whether an upstream response
// should trigger failover: either the status code alone qualifies (see
// shouldFailoverUpstreamError) or isOpenAITransientProcessingError matches the
// status, message and body.
func (s *OpenAIGatewayService) shouldFailoverOpenAIUpstreamResponse(statusCode int, upstreamMsg string, upstreamBody []byte) bool {
	return s.shouldFailoverUpstreamError(statusCode) ||
		isOpenAITransientProcessingError(statusCode, upstreamMsg, upstreamBody)
}

// handleFailoverSideEffects reads at most 2 MiB of the upstream response body
// and hands it, together with the status code and headers, to the rate-limit
// service. A read error is ignored: whatever bytes were read are still passed
// along.
func (s *OpenAIGatewayService) handleFailoverSideEffects(ctx context.Context, resp *http.Response, account *Account) {
	limited := io.LimitReader(resp.Body, 2<<20)
	payload, _ := io.ReadAll(limited)
	s.rateLimitService.HandleUpstreamError(ctx, account, resp.StatusCode, resp.Header, payload)
}

// Forward forwards a /responses request to the OpenAI upstream on behalf of
// the given account.
//
// Steps, in order:
//   - Enforce the codex_cli_only client restriction (responds 403 on mismatch).
//   - Resolve the upstream transport; a WSv1 decision is rejected with 400.
//   - Accounts with passthrough enabled are delegated to forwardOpenAIPassthrough.
//   - Otherwise the parsed request body is rewritten (default instructions,
//     image_generation tool handling, model mapping/normalization, parameter
//     filtering, fast policy) and re-serialized only when something changed.
//     A change set that reduces to a single set/delete on one JSON path is
//     applied with sjson on the raw bytes instead of a full Marshal.
//   - WSv2 requests go through a bounded reconnect loop; HTTP requests are sent
//     once, with a single retry after an invalid_encrypted_content 400 when
//     encrypted reasoning items could be trimmed.
//
// Parameters:
//   - ctx: request context.
//   - c: gin context of the inbound request.
//   - account: the selected upstream account.
//   - body: raw inbound request body.
//
// Returns the forward result on success. Upstream responses that qualify for
// failover are returned as *UpstreamFailoverError; a fast-policy block is
// returned as *OpenAIFastBlockedError.
func (s *OpenAIGatewayService) Forward(ctx context.Context, c *gin.Context, account *Account, body []byte) (*OpenAIForwardResult, error) {
	startTime := time.Now()

	restrictionResult := s.detectCodexClientRestriction(c, account)
	apiKeyID := getAPIKeyIDFromContext(c)
	logCodexCLIOnlyDetection(ctx, c, account, apiKeyID, restrictionResult, body)
	if restrictionResult.Enabled && !restrictionResult.Matched {
		c.JSON(http.StatusForbidden, gin.H{
			"error": gin.H{
				"type":    "forbidden_error",
				"message": "This account only allows Codex official clients",
			},
		})
		return nil, errors.New("codex_cli_only restriction: only codex official clients are allowed")
	}

	originalBody := body
	reqModel, reqStream, promptCacheKey := extractOpenAIRequestMetaFromBody(body)
	originalModel := reqModel

	isCodexCLI := openai.IsCodexOfficialClientByHeaders(c.GetHeader("User-Agent"), c.GetHeader("originator")) || (s.cfg != nil && s.cfg.Gateway.ForceCodexCLI)
	wsDecision := s.getOpenAIWSProtocolResolver().Resolve(account)
	clientTransport := GetOpenAIClientTransport(c)
	// Only WS inbound requests may use a WS upstream, to avoid mixing
	// HTTP -> WS protocols.
	wsDecision = resolveOpenAIWSDecisionByClientTransport(wsDecision, clientTransport)
	if c != nil {
		c.Set("openai_ws_transport_decision", string(wsDecision.Transport))
		c.Set("openai_ws_transport_reason", wsDecision.Reason)
	}
	if wsDecision.Transport == OpenAIUpstreamTransportResponsesWebsocketV2 {
		logOpenAIWSModeDebug(
			"selected account_id=%d account_type=%s transport=%s reason=%s model=%s stream=%v",
			account.ID,
			account.Type,
			normalizeOpenAIWSLogValue(string(wsDecision.Transport)),
			normalizeOpenAIWSLogValue(wsDecision.Reason),
			reqModel,
			reqStream,
		)
	}
	// Only WSv2 is supported for now; fail fast when WSv1 is resolved so that
	// a setting which can be enabled never yields undefined behavior.
	if wsDecision.Transport == OpenAIUpstreamTransportResponsesWebsocket {
		if c != nil {
			c.JSON(http.StatusBadRequest, gin.H{
				"error": gin.H{
					"type":    "invalid_request_error",
					"message": "OpenAI WSv1 is temporarily unsupported. Please enable responses_websockets_v2.",
				},
			})
		}
		return nil, errors.New("openai ws v1 is temporarily unsupported; use ws v2")
	}
	passthroughEnabled := account.IsOpenAIPassthroughEnabled()
	if passthroughEnabled {
		// The passthrough branch only needs lightweight field extraction,
		// avoiding a full Unmarshal on the hot path.
		reasoningEffort := extractOpenAIReasoningEffortFromBody(body, reqModel)
		return s.forwardOpenAIPassthrough(ctx, c, account, originalBody, reqModel, reasoningEffort, reqStream, startTime)
	}

	reqBody, err := getOpenAIRequestBodyMap(c, body)
	if err != nil {
		return nil, err
	}

	if v, ok := reqBody["model"].(string); ok {
		reqModel = v
		originalModel = reqModel
	}
	if v, ok := reqBody["stream"].(bool); ok {
		reqStream = v
	}
	if promptCacheKey == "" {
		if v, ok := reqBody["prompt_cache_key"].(string); ok {
			promptCacheKey = strings.TrimSpace(v)
		}
	}

	// Track if body needs re-serialization
	bodyModified := false
	// Single-field patch fast path: as long as the whole change set reduces
	// to a set/delete on one and the same path, skip the full Marshal.
	patchDisabled := false
	patchHasOp := false
	patchDelete := false
	patchPath := ""
	var patchValue any
	// markPatchSet records a "set path=value" change. A second operation on a
	// different path, or a set following a delete, disables the fast path.
	markPatchSet := func(path string, value any) {
		if strings.TrimSpace(path) == "" {
			patchDisabled = true
			return
		}
		if patchDisabled {
			return
		}
		if !patchHasOp {
			patchHasOp = true
			patchDelete = false
			patchPath = path
			patchValue = value
			return
		}
		if patchDelete || patchPath != path {
			patchDisabled = true
			return
		}
		patchValue = value
	}
	// markPatchDelete records a "delete path" change. A second operation on a
	// different path, or a delete following a set, disables the fast path.
	markPatchDelete := func(path string) {
		if strings.TrimSpace(path) == "" {
			patchDisabled = true
			return
		}
		if patchDisabled {
			return
		}
		if !patchHasOp {
			patchHasOp = true
			patchDelete = true
			patchPath = path
			return
		}
		if !patchDelete || patchPath != path {
			patchDisabled = true
		}
	}
	// disablePatch forces the full Marshal path for changes that cannot be
	// expressed as a single-path patch.
	disablePatch := func() {
		patchDisabled = true
	}

	// In non-passthrough mode, inject default instructions when the
	// instructions field is empty.
	if isInstructionsEmpty(reqBody) {
		reqBody["instructions"] = "You are a helpful coding assistant."
		bodyModified = true
		markPatchSet("instructions", "You are a helpful coding assistant.")
	}

	if isCodexCLI && ensureOpenAIResponsesImageGenerationTool(reqBody) {
		bodyModified = true
		disablePatch()
		logger.LegacyPrintf("service.openai_gateway", "[OpenAI] Injected /responses image_generation tool for Codex client")
	}

	if normalizeOpenAIResponsesImageGenerationTools(reqBody) {
		bodyModified = true
		disablePatch()
		logger.LegacyPrintf("service.openai_gateway", "[OpenAI] Normalized /responses image_generation tool payload")
	}
	if isCodexCLI && applyCodexImageGenerationBridgeInstructions(reqBody) {
		bodyModified = true
		disablePatch()
		logger.LegacyPrintf("service.openai_gateway", "[OpenAI] Added Codex image_generation bridge instructions")
	}

	// Apply model mapping to all requests (including Codex CLI).
	billingModel := account.GetMappedModel(reqModel)
	if billingModel != reqModel {
		logger.LegacyPrintf("service.openai_gateway", "[OpenAI] Model mapping applied: %s -> %s (account: %s, isCodexCLI: %v)", reqModel, billingModel, account.Name, isCodexCLI)
		reqBody["model"] = billingModel
		bodyModified = true
		markPatchSet("model", billingModel)
	}
	upstreamModel := billingModel
	if normalizeOpenAIResponsesImageOnlyModel(reqBody) {
		bodyModified = true
		disablePatch()
		if model, ok := reqBody["model"].(string); ok {
			upstreamModel = strings.TrimSpace(model)
		}
		logger.LegacyPrintf(
			"service.openai_gateway",
			"[OpenAI] Normalized /responses image-only model request inbound_model=%s image_model=%s upstream_model=%s",
			reqModel,
			billingModel,
			upstreamModel,
		)
	}
	if err := validateOpenAIResponsesImageModel(reqBody, upstreamModel); err != nil {
		setOpsUpstreamError(c, http.StatusBadRequest, err.Error(), "")
		c.JSON(http.StatusBadRequest, gin.H{
			"error": gin.H{
				"type":    "invalid_request_error",
				"message": err.Error(),
				"param":   "model",
			},
		})
		return nil, err
	}
	if hasOpenAIImageGenerationTool(reqBody) {
		logger.LegacyPrintf(
			"service.openai_gateway",
			"[OpenAI] /responses image_generation request inbound_model=%s mapped_model=%s account_type=%s",
			reqModel,
			upstreamModel,
			account.Type,
		)
	}
	if err := validateCodexSparkInput(reqBody, upstreamModel); err != nil {
		setOpsUpstreamError(c, http.StatusBadRequest, err.Error(), "")
		c.JSON(http.StatusBadRequest, gin.H{
			"error": gin.H{
				"type":    "invalid_request_error",
				"message": err.Error(),
				"param":   "input",
			},
		})
		return nil, err
	}

	// Compact-only model mapping: only effective on the /responses/compact
	// path, and takes precedence over OAuth model normalization (so that the
	// OAuth normalization does not override a compact-only custom model).
	isCompactRequest := isOpenAIResponsesCompactPath(c)
	compactMapped := false
	if isCompactRequest {
		compactMappedModel := resolveOpenAICompactForwardModel(account, billingModel)
		if compactMappedModel != "" && compactMappedModel != billingModel {
			compactMapped = true
			upstreamModel = compactMappedModel
			reqBody["model"] = compactMappedModel
			bodyModified = true
			markPatchSet("model", compactMappedModel)
			logger.LegacyPrintf("service.openai_gateway", "[OpenAI] Compact model mapping applied: %s -> %s (account: %s, isCodexCLI: %v)", billingModel, compactMappedModel, account.Name, isCodexCLI)
		}
	}

	// OpenAI OAuth accounts use the ChatGPT internal Codex endpoint, so the
	// model name must be normalized to a Codex/GPT family the upstream
	// recognizes. API Key accounts keep the original/mapped model name to stay
	// compatible with OpenAI-compatible upstreams behind a custom base_url.
	if model, ok := reqBody["model"].(string); ok {
		if !compactMapped {
			upstreamModel = normalizeOpenAIModelForUpstream(account, model)
			if upstreamModel != "" && upstreamModel != model {
				logger.LegacyPrintf("service.openai_gateway", "[OpenAI] Upstream model resolved: %s -> %s (account: %s, type: %s, isCodexCLI: %v)",
					model, upstreamModel, account.Name, account.Type, isCodexCLI)
				reqBody["model"] = upstreamModel
				bodyModified = true
				markPatchSet("model", upstreamModel)
			}
		}

		// Remove the verbosity parameter for versions below gpt-5.2-codex so
		// that mapping a newer model onto an older one does not fail.
		if !SupportsVerbosity(upstreamModel) {
			if text, ok := reqBody["text"].(map[string]any); ok {
				if _, hasVerbosity := text["verbosity"]; hasVerbosity {
					delete(text, "verbosity")
					// Record the removal so the serialized body matches
					// reqBody. Without this, an otherwise-unmodified body or
					// the single-path patch fast path would still send
					// text.verbosity upstream over HTTP.
					bodyModified = true
					markPatchDelete("text.verbosity")
				}
			}
		}
	}

	// Normalize reasoning.effort (minimal -> none) to align with the values
	// the upstream accepts.
	if reasoning, ok := reqBody["reasoning"].(map[string]any); ok {
		if effort, ok := reasoning["effort"].(string); ok && effort == "minimal" {
			reasoning["effort"] = "none"
			bodyModified = true
			markPatchSet("reasoning.effort", "none")
			logger.LegacyPrintf("service.openai_gateway", "[OpenAI] Normalized reasoning.effort: minimal -> none (account: %s)", account.Name)
		}
	}

	if account.Type == AccountTypeOAuth {
		codexResult := applyCodexOAuthTransform(reqBody, isCodexCLI, isCompactRequest)
		if codexResult.Modified {
			bodyModified = true
			disablePatch()
		}
		if codexResult.NormalizedModel != "" {
			upstreamModel = codexResult.NormalizedModel
		}
		if codexResult.PromptCacheKey != "" {
			promptCacheKey = codexResult.PromptCacheKey
		}
	}

	// Handle max_output_tokens based on platform and account type
	if !isCodexCLI {
		if maxOutputTokens, hasMaxOutputTokens := reqBody["max_output_tokens"]; hasMaxOutputTokens {
			switch account.Platform {
			case PlatformOpenAI:
				// For OpenAI API Key, remove max_output_tokens (not supported)
				// For OpenAI OAuth (Responses API), keep it (supported)
				if account.Type == AccountTypeAPIKey {
					delete(reqBody, "max_output_tokens")
					bodyModified = true
					markPatchDelete("max_output_tokens")
				}
			case PlatformAnthropic:
				// For Anthropic (Claude), convert to max_tokens
				delete(reqBody, "max_output_tokens")
				markPatchDelete("max_output_tokens")
				if _, hasMaxTokens := reqBody["max_tokens"]; !hasMaxTokens {
					reqBody["max_tokens"] = maxOutputTokens
					disablePatch()
				}
				bodyModified = true
			case PlatformGemini:
				// For Gemini, remove (will be handled by Gemini-specific transform)
				delete(reqBody, "max_output_tokens")
				bodyModified = true
				markPatchDelete("max_output_tokens")
			default:
				// For unknown platforms, remove to be safe
				delete(reqBody, "max_output_tokens")
				bodyModified = true
				markPatchDelete("max_output_tokens")
			}
		}

		// Also handle max_completion_tokens (similar logic)
		if _, hasMaxCompletionTokens := reqBody["max_completion_tokens"]; hasMaxCompletionTokens {
			if account.Type == AccountTypeAPIKey || account.Platform != PlatformOpenAI {
				delete(reqBody, "max_completion_tokens")
				bodyModified = true
				markPatchDelete("max_completion_tokens")
			}
		}

		// Remove unsupported fields (not supported by upstream OpenAI API)
		unsupportedFields := []string{"prompt_cache_retention", "safety_identifier"}
		for _, unsupportedField := range unsupportedFields {
			if _, has := reqBody[unsupportedField]; has {
				delete(reqBody, unsupportedField)
				bodyModified = true
				markPatchDelete(unsupportedField)
			}
		}
	}

	// Keep previous_response_id only in WSv2 mode; filter it out in every
	// other mode (HTTP/WSv1).
	// Note: this rule also applies to Codex CLI requests, so that WSv1 never
	// passes an unsupported field upstream.
	if wsDecision.Transport != OpenAIUpstreamTransportResponsesWebsocketV2 {
		if _, has := reqBody["previous_response_id"]; has {
			delete(reqBody, "previous_response_id")
			bodyModified = true
			markPatchDelete("previous_response_id")
		}
	}

	if sanitizeEmptyBase64InputImagesInOpenAIRequestBodyMap(reqBody) {
		bodyModified = true
		disablePatch()
	}

	// Apply OpenAI fast policy (modelled on the fast-mode filtering of the
	// Claude BetaPolicy): for the body's service_tier field ("priority" means
	// fast, "flex"), either filter (drop the field) or block (reject the
	// request) according to policy. Blocking fast for models such as gpt-5.5
	// takes effect here.
	//
	// Notes:
	//   1. upstreamModel is used consistently here (already passed through
	//      GetMappedModel + normalizeOpenAIModelForUpstream + Codex OAuth
	//      normalize), matching the chat-completions / messages entry points
	//      so different entry points do not hit the whitelist differently
	//      because of a different model dimension.
	//   2. With action=pass the raw "fast" must still be normalized to
	//      "priority" and written back to the body; otherwise the native
	//      /responses entry point would pass "fast" upstream and be rejected.
	//      The chat-completions entry point does the same through
	//      normalizeResponsesBodyServiceTier; this is the hand-written
	//      equivalent.
	if rawTier, ok := reqBody["service_tier"].(string); ok {
		if normTier := normalizedOpenAIServiceTierValue(rawTier); normTier != "" {
			action, errMsg := s.evaluateOpenAIFastPolicy(ctx, account, upstreamModel, normTier)
			switch action {
			case BetaPolicyActionBlock:
				msg := errMsg
				if msg == "" {
					msg = fmt.Sprintf("openai service_tier=%s is not allowed for model %s", normTier, upstreamModel)
				}
				blocked := &OpenAIFastBlockedError{Message: msg}
				writeOpenAIFastPolicyBlockedResponse(c, blocked)
				return nil, blocked
			case BetaPolicyActionFilter:
				delete(reqBody, "service_tier")
				bodyModified = true
				disablePatch()
			default:
				// pass: if the client sent the alias "fast", normalize it to
				// "priority" and write it back so the upstream receives the
				// canonical value it recognizes.
				if normTier != rawTier {
					reqBody["service_tier"] = normTier
					bodyModified = true
					markPatchSet("service_tier", normTier)
				}
			}
		}
	}

	// Re-serialize body only if modified
	if bodyModified {
		serializedByPatch := false
		if !patchDisabled && patchHasOp {
			var patchErr error
			if patchDelete {
				body, patchErr = sjson.DeleteBytes(body, patchPath)
			} else {
				body, patchErr = sjson.SetBytes(body, patchPath, patchValue)
			}
			if patchErr == nil {
				serializedByPatch = true
			}
		}
		// Fall back to a full Marshal when the fast path is unavailable or
		// the patch itself failed.
		if !serializedByPatch {
			var marshalErr error
			body, marshalErr = json.Marshal(reqBody)
			if marshalErr != nil {
				return nil, fmt.Errorf("serialize request body: %w", marshalErr)
			}
		}
	}

	// Get access token
	token, _, err := s.GetAccessToken(ctx, account)
	if err != nil {
		return nil, err
	}

	// Capture upstream request body for ops retry of this attempt.
	setOpsUpstreamRequestBody(c, body)

	// When WS is selected, use WebSocket Mode only; there is no automatic
	// fallback to HTTP any more.
	if wsDecision.Transport == OpenAIUpstreamTransportResponsesWebsocketV2 {
		// Shallow-copy the top-level map so recovery steps can drop keys from
		// the WS payload without touching reqBody's own key set.
		wsReqBody := reqBody
		if len(reqBody) > 0 {
			wsReqBody = make(map[string]any, len(reqBody))
			for k, v := range reqBody {
				wsReqBody[k] = v
			}
		}
		_, hasPreviousResponseID := wsReqBody["previous_response_id"]
		logOpenAIWSModeDebug(
			"forward_start account_id=%d account_type=%s model=%s stream=%v has_previous_response_id=%v",
			account.ID,
			account.Type,
			upstreamModel,
			reqStream,
			hasPreviousResponseID,
		)
		maxAttempts := openAIWSReconnectRetryLimit + 1
		wsAttempts := 0
		var wsResult *OpenAIForwardResult
		var wsErr error
		wsLastFailureReason := ""
		wsPrevResponseRecoveryTried := false
		wsInvalidEncryptedContentRecoveryTried := false
		// recoverPrevResponseNotFound drops previous_response_id from the WS
		// payload at most once; it reports whether the request should be
		// replayed.
		recoverPrevResponseNotFound := func(attempt int) bool {
			if wsPrevResponseRecoveryTried {
				return false
			}
			previousResponseID := openAIWSPayloadString(wsReqBody, "previous_response_id")
			if previousResponseID == "" {
				logOpenAIWSModeInfo(
					"reconnect_prev_response_recovery_skip account_id=%d attempt=%d reason=missing_previous_response_id previous_response_id_present=false",
					account.ID,
					attempt,
				)
				return false
			}
			if HasFunctionCallOutput(wsReqBody) {
				logOpenAIWSModeInfo(
					"reconnect_prev_response_recovery_skip account_id=%d attempt=%d reason=has_function_call_output previous_response_id_present=true",
					account.ID,
					attempt,
				)
				return false
			}
			delete(wsReqBody, "previous_response_id")
			wsPrevResponseRecoveryTried = true
			logOpenAIWSModeInfo(
				"reconnect_prev_response_recovery account_id=%d attempt=%d action=drop_previous_response_id retry=1 previous_response_id=%s previous_response_id_kind=%s",
				account.ID,
				attempt,
				truncateOpenAIWSLogValue(previousResponseID, openAIWSIDValueMaxLen),
				normalizeOpenAIWSLogValue(ClassifyOpenAIPreviousResponseIDKind(previousResponseID)),
			)
			return true
		}
		// recoverInvalidEncryptedContent trims encrypted reasoning items from
		// the WS payload at most once (also dropping previous_response_id when
		// there is no function_call_output); it reports whether the request
		// should be replayed.
		recoverInvalidEncryptedContent := func(attempt int) bool {
			if wsInvalidEncryptedContentRecoveryTried {
				return false
			}
			removedReasoningItems := trimOpenAIEncryptedReasoningItems(wsReqBody)
			if !removedReasoningItems {
				logOpenAIWSModeInfo(
					"reconnect_invalid_encrypted_content_recovery_skip account_id=%d attempt=%d reason=missing_encrypted_reasoning_items",
					account.ID,
					attempt,
				)
				return false
			}
			previousResponseID := openAIWSPayloadString(wsReqBody, "previous_response_id")
			hasFunctionCallOutput := HasFunctionCallOutput(wsReqBody)
			if previousResponseID != "" && !hasFunctionCallOutput {
				delete(wsReqBody, "previous_response_id")
			}
			wsInvalidEncryptedContentRecoveryTried = true
			logOpenAIWSModeInfo(
				"reconnect_invalid_encrypted_content_recovery account_id=%d attempt=%d action=drop_encrypted_reasoning_items retry=1 previous_response_id_present=%v previous_response_id=%s previous_response_id_kind=%s has_function_call_output=%v dropped_previous_response_id=%v",
				account.ID,
				attempt,
				previousResponseID != "",
				truncateOpenAIWSLogValue(previousResponseID, openAIWSIDValueMaxLen),
				normalizeOpenAIWSLogValue(ClassifyOpenAIPreviousResponseIDKind(previousResponseID)),
				hasFunctionCallOutput,
				previousResponseID != "" && !hasFunctionCallOutput,
			)
			return true
		}
		retryBudget := s.openAIWSRetryTotalBudget()
		retryStartedAt := time.Now()
	wsRetryLoop:
		for attempt := 1; attempt <= maxAttempts; attempt++ {
			wsAttempts = attempt
			wsResult, wsErr = s.forwardOpenAIWSV2(
				ctx,
				c,
				account,
				wsReqBody,
				token,
				wsDecision,
				isCodexCLI,
				reqStream,
				originalModel,
				upstreamModel,
				startTime,
				attempt,
				wsLastFailureReason,
			)
			if wsErr == nil {
				break
			}
			// Once anything has been written to the client, a retry can no
			// longer be performed.
			if c != nil && c.Writer != nil && c.Writer.Written() {
				break
			}

			reason, retryable := classifyOpenAIWSReconnectReason(wsErr)
			if reason != "" {
				wsLastFailureReason = reason
			}
			// previous_response_not_found means the continuation anchor is
			// unavailable: for requests without function_call_output, allow a
			// single replay with previous_response_id removed.
			if reason == "previous_response_not_found" && recoverPrevResponseNotFound(attempt) {
				continue
			}
			if reason == "invalid_encrypted_content" && recoverInvalidEncryptedContent(attempt) {
				continue
			}
			if retryable && attempt < maxAttempts {
				backoff := s.openAIWSRetryBackoff(attempt)
				if retryBudget > 0 && time.Since(retryStartedAt)+backoff > retryBudget {
					s.recordOpenAIWSRetryExhausted()
					logOpenAIWSModeInfo(
						"reconnect_budget_exhausted account_id=%d attempts=%d max_retries=%d reason=%s elapsed_ms=%d budget_ms=%d",
						account.ID,
						attempt,
						openAIWSReconnectRetryLimit,
						normalizeOpenAIWSLogValue(reason),
						time.Since(retryStartedAt).Milliseconds(),
						retryBudget.Milliseconds(),
					)
					break
				}
				s.recordOpenAIWSRetryAttempt(backoff)
				logOpenAIWSModeInfo(
					"reconnect_retry account_id=%d retry=%d max_retries=%d reason=%s backoff_ms=%d",
					account.ID,
					attempt,
					openAIWSReconnectRetryLimit,
					normalizeOpenAIWSLogValue(reason),
					backoff.Milliseconds(),
				)
				if backoff > 0 {
					timer := time.NewTimer(backoff)
					select {
					case <-ctx.Done():
						if !timer.Stop() {
							<-timer.C
						}
						wsErr = wrapOpenAIWSFallback("retry_backoff_canceled", ctx.Err())
						break wsRetryLoop
					case <-timer.C:
					}
				}
				continue
			}
			if retryable {
				s.recordOpenAIWSRetryExhausted()
				logOpenAIWSModeInfo(
					"reconnect_exhausted account_id=%d attempts=%d max_retries=%d reason=%s",
					account.ID,
					attempt,
					openAIWSReconnectRetryLimit,
					normalizeOpenAIWSLogValue(reason),
				)
			} else if reason != "" {
				s.recordOpenAIWSNonRetryableFastFallback()
				logOpenAIWSModeInfo(
					"reconnect_stop account_id=%d attempt=%d reason=%s",
					account.ID,
					attempt,
					normalizeOpenAIWSLogValue(reason),
				)
			}
			break
		}
		if wsErr == nil {
			firstTokenMs := int64(0)
			hasFirstTokenMs := wsResult != nil && wsResult.FirstTokenMs != nil
			if hasFirstTokenMs {
				firstTokenMs = int64(*wsResult.FirstTokenMs)
			}
			requestID := ""
			if wsResult != nil {
				requestID = strings.TrimSpace(wsResult.RequestID)
			}
			logOpenAIWSModeDebug(
				"forward_succeeded account_id=%d request_id=%s stream=%v has_first_token_ms=%v first_token_ms=%d ws_attempts=%d",
				account.ID,
				requestID,
				reqStream,
				hasFirstTokenMs,
				firstTokenMs,
				wsAttempts,
			)
			wsResult.UpstreamModel = upstreamModel
			return wsResult, nil
		}
		s.writeOpenAIWSFallbackErrorResponse(c, account, wsErr)
		return nil, wsErr
	}

	// HTTP path. The loop body runs at most twice: the only continue is the
	// one-shot invalid_encrypted_content retry below.
	httpInvalidEncryptedContentRetryTried := false
	for {
		// Build upstream request
		upstreamCtx, releaseUpstreamCtx := detachStreamUpstreamContext(ctx, reqStream)
		upstreamReq, err := s.buildUpstreamRequest(upstreamCtx, c, account, body, token, reqStream, promptCacheKey, isCodexCLI)
		releaseUpstreamCtx()
		if err != nil {
			return nil, err
		}

		// Get proxy URL
		proxyURL := ""
		if account.ProxyID != nil && account.Proxy != nil {
			proxyURL = account.Proxy.URL()
		}

		// Send request
		upstreamStart := time.Now()
		resp, err := s.httpUpstream.Do(upstreamReq, proxyURL, account.ID, account.Concurrency)
		SetOpsLatencyMs(c, OpsUpstreamLatencyMsKey, time.Since(upstreamStart).Milliseconds())
		if err != nil {
			// Ensure the client receives an error response (handlers assume Forward writes on non-failover errors).
			safeErr := sanitizeUpstreamErrorMessage(err.Error())
			setOpsUpstreamError(c, 0, safeErr, "")
			appendOpsUpstreamError(c, OpsUpstreamErrorEvent{
				Platform:           account.Platform,
				AccountID:          account.ID,
				AccountName:        account.Name,
				UpstreamStatusCode: 0,
				Kind:               "request_error",
				Message:            safeErr,
			})
			c.JSON(http.StatusBadGateway, gin.H{
				"error": gin.H{
					"type":    "upstream_error",
					"message": "Upstream request failed",
				},
			})
			return nil, fmt.Errorf("upstream request failed: %s", safeErr)
		}

		// Handle error response
		if resp.StatusCode >= 400 {
			// Buffer up to 2 MiB of the error body, close the real body, and
			// swap in an in-memory reader so later handlers can re-read it.
			respBody, _ := io.ReadAll(io.LimitReader(resp.Body, 2<<20))
			_ = resp.Body.Close()
			resp.Body = io.NopCloser(bytes.NewReader(respBody))

			upstreamMsg := strings.TrimSpace(extractUpstreamErrorMessage(respBody))
			upstreamMsg = sanitizeUpstreamErrorMessage(upstreamMsg)
			upstreamCode := extractUpstreamErrorCode(respBody)
			if !httpInvalidEncryptedContentRetryTried && resp.StatusCode == http.StatusBadRequest && upstreamCode == "invalid_encrypted_content" {
				if trimOpenAIEncryptedReasoningItems(reqBody) {
					body, err = json.Marshal(reqBody)
					if err != nil {
						return nil, fmt.Errorf("serialize invalid_encrypted_content retry body: %w", err)
					}
					setOpsUpstreamRequestBody(c, body)
					httpInvalidEncryptedContentRetryTried = true
					logger.LegacyPrintf("service.openai_gateway", "[OpenAI] Retrying non-WSv2 request once after invalid_encrypted_content (account: %s)", account.Name)
					continue
				}
				logger.LegacyPrintf("service.openai_gateway", "[OpenAI] Skip non-WSv2 invalid_encrypted_content retry because encrypted reasoning items are missing (account: %s)", account.Name)
			}
			if s.shouldFailoverOpenAIUpstreamResponse(resp.StatusCode, upstreamMsg, respBody) {
				upstreamDetail := ""
				if s.cfg != nil && s.cfg.Gateway.LogUpstreamErrorBody {
					maxBytes := s.cfg.Gateway.LogUpstreamErrorBodyMaxBytes
					if maxBytes <= 0 {
						maxBytes = 2048
					}
					upstreamDetail = truncateString(string(respBody), maxBytes)
				}
				appendOpsUpstreamError(c, OpsUpstreamErrorEvent{
					Platform:           account.Platform,
					AccountID:          account.ID,
					AccountName:        account.Name,
					UpstreamStatusCode: resp.StatusCode,
					UpstreamRequestID:  resp.Header.Get("x-request-id"),
					Kind:               "failover",
					Message:            upstreamMsg,
					Detail:             upstreamDetail,
				})

				s.handleFailoverSideEffects(ctx, resp, account)
				return nil, &UpstreamFailoverError{
					StatusCode:             resp.StatusCode,
					ResponseBody:           respBody,
					RetryableOnSameAccount: account.IsPoolMode() && (isPoolModeRetryableStatus(resp.StatusCode) || isOpenAITransientProcessingError(resp.StatusCode, upstreamMsg, respBody)),
				}
			}
			return s.handleErrorResponse(ctx, resp, c, account, body)
		}
		// Every path below returns from Forward, so this defer runs for the
		// final response only and does not accumulate across iterations.
		defer func() { _ = resp.Body.Close() }()

		// Handle normal response
		var usage *OpenAIUsage
		var firstTokenMs *int
		if reqStream {
			streamResult, err := s.handleStreamingResponse(ctx, resp, c, account, startTime, originalModel, upstreamModel)
			if err != nil {
				return nil, err
			}
			usage = streamResult.usage
			firstTokenMs = streamResult.firstTokenMs
		} else {
			usage, err = s.handleNonStreamingResponse(ctx, resp, c, account, originalModel, upstreamModel)
			if err != nil {
				return nil, err
			}
		}

		// Extract and save Codex usage snapshot from response headers (for OAuth accounts)
		if account.Type == AccountTypeOAuth {
			if snapshot := ParseCodexRateLimitHeaders(resp.Header); snapshot != nil {
				s.updateCodexUsageSnapshot(ctx, account.ID, snapshot)
			}
		}

		if usage == nil {
			usage = &OpenAIUsage{}
		}

		reasoningEffort := extractOpenAIReasoningEffort(reqBody, originalModel)
		serviceTier := extractOpenAIServiceTier(reqBody)

		return &OpenAIForwardResult{
			RequestID:       resp.Header.Get("x-request-id"),
			Usage:           *usage,
			Model:           originalModel,
			UpstreamModel:   upstreamModel,
			ServiceTier:     serviceTier,
			ReasoningEffort: reasoningEffort,
			Stream:          reqStream,
			OpenAIWSMode:    false,
			Duration:        time.Since(startTime),
			FirstTokenMs:    firstTokenMs,
		}, nil
	}
}

// forwardOpenAIPassthrough forwards a request over HTTP for accounts that have
// passthrough enabled, applying only a small set of body adjustments.
//
// The body is adjusted in this order before being sent:
//  1. compact-path model mapping (only on the /responses/compact path),
//  2. for OAuth accounts: local rejection when
//     detectOpenAIPassthroughInstructionsRejectReason reports a reason, then
//     normalizeOpenAIPassthroughOAuthBody,
//  3. sanitizeEmptyBase64InputImagesInOpenAIBody,
//  4. the OpenAI fast policy (service_tier filter/block).
//
// Parameters:
//   - body: raw request body; replaced locally as the adjustments are applied.
//   - reqModel: model taken from the inbound request; reported as Model in
//     the result.
//   - reasoningEffort: pre-extracted reasoning effort, copied into the result.
//   - reqStream: whether the request is streaming; for OAuth accounts it is
//     re-read from the normalized body.
//   - startTime: start of the overall request, used for Duration.
//
// Returns the forward result on success. Upstream statuses >= 400 are handed
// to the passthrough error handlers and their error is returned.
func (s *OpenAIGatewayService) forwardOpenAIPassthrough(
	ctx context.Context,
	c *gin.Context,
	account *Account,
	body []byte,
	reqModel string,
	reasoningEffort *string,
	reqStream bool,
	startTime time.Time,
) (*OpenAIForwardResult, error) {
	// Stays empty unless a compact-path mapping rewrites the model below.
	upstreamPassthroughModel := ""
	if isOpenAIResponsesCompactPath(c) {
		compactMappedModel := resolveOpenAICompactForwardModel(account, reqModel)
		if compactMappedModel != "" && compactMappedModel != reqModel {
			nextBody, setErr := sjson.SetBytes(body, "model", compactMappedModel)
			if setErr != nil {
				return nil, fmt.Errorf("set compact passthrough model: %w", setErr)
			}
			body = nextBody
			upstreamPassthroughModel = compactMappedModel
		}
	}

	if account != nil && account.Type == AccountTypeOAuth {
		// Reject locally, before contacting the upstream, when the helper
		// reports a reason; the client receives a 403.
		if rejectReason := detectOpenAIPassthroughInstructionsRejectReason(reqModel, body); rejectReason != "" {
			rejectMsg := "OpenAI codex passthrough requires a non-empty instructions field"
			setOpsUpstreamError(c, http.StatusForbidden, rejectMsg, "")
			appendOpsUpstreamError(c, OpsUpstreamErrorEvent{
				Platform:           account.Platform,
				AccountID:          account.ID,
				AccountName:        account.Name,
				UpstreamStatusCode: http.StatusForbidden,
				Passthrough:        true,
				Kind:               "request_error",
				Message:            rejectMsg,
				Detail:             rejectReason,
			})
			logOpenAIPassthroughInstructionsRejected(ctx, c, account, reqModel, rejectReason, body)
			c.JSON(http.StatusForbidden, gin.H{
				"error": gin.H{
					"type":    "forbidden_error",
					"message": rejectMsg,
				},
			})
			return nil, fmt.Errorf("openai passthrough rejected before upstream: %s", rejectReason)
		}

		normalizedBody, normalized, err := normalizeOpenAIPassthroughOAuthBody(body, isOpenAIResponsesCompactPath(c))
		if err != nil {
			return nil, err
		}
		if normalized {
			body = normalizedBody
		}
		// Re-read stream from the (possibly normalized) body so the response
		// handling below matches what is actually sent upstream.
		reqStream = gjson.GetBytes(body, "stream").Bool()
	}

	sanitizedBody, sanitized, err := sanitizeEmptyBase64InputImagesInOpenAIBody(body)
	if err != nil {
		return nil, err
	}
	if sanitized {
		body = sanitizedBody
	}

	// Apply OpenAI fast policy to the passthrough body (filter/block by service_tier).
	// Use the upstream-facing model consistently: on the passthrough path the
	// body has already gone through compact mapping + OAuth normalize, so the
	// model field in the body is the slug the upstream will actually see.
	// This keeps it consistent with upstreamModel at the chat-completions /
	// messages / native /responses entry points and avoids whitelist-match
	// differences. Fall back to reqModel when the body has no model field.
	policyModel := strings.TrimSpace(gjson.GetBytes(body, "model").String())
	if policyModel == "" {
		policyModel = reqModel
	}
	updatedBody, policyErr := s.applyOpenAIFastPolicyToBody(ctx, account, policyModel, body)
	if policyErr != nil {
		// Only a policy block writes a response to the client here; any other
		// error is returned without writing.
		var blocked *OpenAIFastBlockedError
		if errors.As(policyErr, &blocked) {
			writeOpenAIFastPolicyBlockedResponse(c, blocked)
		}
		return nil, policyErr
	}
	body = updatedBody

	logger.LegacyPrintf("service.openai_gateway",
		"[OpenAI 自动透传] 命中自动透传分支: account=%d name=%s type=%s model=%s stream=%v",
		account.ID,
		account.Name,
		account.Type,
		reqModel,
		reqStream,
	)
	// For streaming requests, warn when the client sent timeout-related
	// headers; the message differs depending on whether the configuration
	// lets those headers through.
	if reqStream && c != nil && c.Request != nil {
		if timeoutHeaders := collectOpenAIPassthroughTimeoutHeaders(c.Request.Header); len(timeoutHeaders) > 0 {
			streamWarnLogger := logger.FromContext(ctx).With(
				zap.String("component", "service.openai_gateway"),
				zap.Int64("account_id", account.ID),
				zap.Strings("timeout_headers", timeoutHeaders),
			)
			if s.isOpenAIPassthroughTimeoutHeadersAllowed() {
				streamWarnLogger.Warn("OpenAI passthrough 透传请求包含超时相关请求头，且当前配置为放行，可能导致上游提前断流")
			} else {
				streamWarnLogger.Warn("OpenAI passthrough 检测到超时相关请求头，将按配置过滤以降低断流风险")
			}
		}
	}

	// Get access token
	token, _, err := s.GetAccessToken(ctx, account)
	if err != nil {
		return nil, err
	}

	upstreamCtx, releaseUpstreamCtx := detachStreamUpstreamContext(ctx, reqStream)
	upstreamReq, err := s.buildUpstreamRequestOpenAIPassthrough(upstreamCtx, c, account, body, token)
	releaseUpstreamCtx()
	if err != nil {
		return nil, err
	}

	proxyURL := ""
	if account.ProxyID != nil && account.Proxy != nil {
		proxyURL = account.Proxy.URL()
	}

	// Record the final upstream body and mark the request as passthrough on
	// the gin context before sending.
	setOpsUpstreamRequestBody(c, body)
	if c != nil {
		c.Set("openai_passthrough", true)
	}

	upstreamStart := time.Now()
	resp, err := s.httpUpstream.Do(upstreamReq, proxyURL, account.ID, account.Concurrency)
	SetOpsLatencyMs(c, OpsUpstreamLatencyMsKey, time.Since(upstreamStart).Milliseconds())
	if err != nil {
		// Transport-level failure: record a sanitized message and answer the
		// client with a generic 502.
		safeErr := sanitizeUpstreamErrorMessage(err.Error())
		setOpsUpstreamError(c, 0, safeErr, "")
		appendOpsUpstreamError(c, OpsUpstreamErrorEvent{
			Platform:           account.Platform,
			AccountID:          account.ID,
			AccountName:        account.Name,
			UpstreamStatusCode: 0,
			Passthrough:        true,
			Kind:               "request_error",
			Message:            safeErr,
		})
		c.JSON(http.StatusBadGateway, gin.H{
			"error": gin.H{
				"type":    "upstream_error",
				"message": "Upstream request failed",
			},
		})
		return nil, fmt.Errorf("upstream request failed: %s", safeErr)
	}
	defer func() { _ = resp.Body.Close() }()

	if resp.StatusCode >= 400 {
		// Passthrough mode proxies upstream responses as-is by default, but
		// 429/529 are upstream capacity errors the gateway must backstop, so
		// multi-account failover is triggered first to keep a baseline SLA.
		if shouldFailoverOpenAIPassthroughResponse(resp.StatusCode) {
			return nil, s.handleFailoverErrorResponsePassthrough(ctx, resp, c, account, body)
		}
		return nil, s.handleErrorResponsePassthrough(ctx, resp, c, account, body)
	}

	var usage *OpenAIUsage
	var firstTokenMs *int
	if reqStream {
		result, err := s.handleStreamingResponsePassthrough(ctx, resp, c, account, startTime, reqModel, upstreamPassthroughModel)
		if err != nil {
			return nil, err
		}
		usage = result.usage
		firstTokenMs = result.firstTokenMs
	} else {
		usage, err = s.handleNonStreamingResponsePassthrough(ctx, resp, c, reqModel, upstreamPassthroughModel)
		if err != nil {
			return nil, err
		}
	}

	// Persist the Codex rate-limit snapshot when the response headers carry
	// one. Unlike Forward, this is not gated on the account type.
	if snapshot := ParseCodexRateLimitHeaders(resp.Header); snapshot != nil {
		s.updateCodexUsageSnapshot(ctx, account.ID, snapshot)
	}

	// Guarantee a non-nil usage so it can be dereferenced in the result.
	if usage == nil {
		usage = &OpenAIUsage{}
	}

	return &OpenAIForwardResult{
		RequestID:       resp.Header.Get("x-request-id"),
		Usage:           *usage,
		Model:           reqModel,
		UpstreamModel:   upstreamPassthroughModel,
		ServiceTier:     extractOpenAIServiceTierFromBody(body),
		ReasoningEffort: reasoningEffort,
		Stream:          reqStream,
		OpenAIWSMode:    false,
		Duration:        time.Since(startTime),
		FirstTokenMs:    firstTokenMs,
	}, nil
}

// logOpenAIPassthroughInstructionsRejected writes a warning-level structured
// log entry for a passthrough request that the gateway rejected locally
// because the Codex request lacked valid instructions.
//
// A nil ctx is replaced by context.Background() and a nil account is logged
// with zero/empty identity fields. The base fields are extended by
// appendCodexCLIOnlyRejectedRequestFields, which receives c and body.
func logOpenAIPassthroughInstructionsRejected(
	ctx context.Context,
	c *gin.Context,
	account *Account,
	reqModel string,
	rejectReason string,
	body []byte,
) {
	logCtx := ctx
	if logCtx == nil {
		logCtx = context.Background()
	}

	// Identity fields stay at their zero values when no account is supplied.
	var (
		id   int64
		name string
		kind string
	)
	if account != nil {
		id = account.ID
		name = strings.TrimSpace(account.Name)
		kind = strings.TrimSpace(string(account.Type))
	}

	logFields := appendCodexCLIOnlyRejectedRequestFields([]zap.Field{
		zap.String("component", "service.openai_gateway"),
		zap.Int64("account_id", id),
		zap.String("account_name", name),
		zap.String("account_type", kind),
		zap.String("request_model", strings.TrimSpace(reqModel)),
		zap.String("reject_reason", strings.TrimSpace(rejectReason)),
	}, c, body)

	logger.FromContext(logCtx).With(logFields...).Warn("OpenAI passthrough 本地拦截：Codex 请求缺少有效 instructions")
}

// buildUpstreamRequestOpenAIPassthrough builds the upstream POST request used
// by passthrough mode.
//
// The target URL depends on the account type: OAuth accounts use
// chatgptCodexURL, API-key accounts use their validated custom base URL when
// one is configured, and everything else falls back to openaiPlatformAPIURL.
// The request path suffix derived from c is appended in all cases.
//
// Client headers are copied only when they pass the passthrough whitelist;
// inbound credentials are then removed and replaced by "Bearer "+token. For
// OAuth accounts the function also sets the Host, the ChatGPT account id,
// default accept/OpenAI-Beta/originator headers, and rewrites session_id and
// conversation_id through isolateOpenAISessionID. Finally the User-Agent and
// content-type defaults are applied.
//
// It returns an error when the custom base URL fails validation or when the
// request cannot be constructed.
func (s *OpenAIGatewayService) buildUpstreamRequestOpenAIPassthrough(
	ctx context.Context,
	c *gin.Context,
	account *Account,
	body []byte,
	token string,
) (*http.Request, error) {
	// Default to the platform API; the switch below overrides it per account type.
	targetURL := openaiPlatformAPIURL
	switch account.Type {
	case AccountTypeOAuth:
		targetURL = chatgptCodexURL
	case AccountTypeAPIKey:
		baseURL := account.GetOpenAIBaseURL()
		if baseURL != "" {
			validatedURL, err := s.validateUpstreamBaseURL(baseURL)
			if err != nil {
				return nil, err
			}
			targetURL = buildOpenAIResponsesURL(validatedURL)
		}
	}
	targetURL = appendOpenAIResponsesRequestPathSuffix(targetURL, openAIResponsesRequestPathSuffix(c))

	req, err := http.NewRequestWithContext(ctx, http.MethodPost, targetURL, bytes.NewReader(body))
	if err != nil {
		return nil, err
	}

	// Forward client request headers (security whitelist).
	allowTimeoutHeaders := s.isOpenAIPassthroughTimeoutHeadersAllowed()
	if c != nil && c.Request != nil {
		for key, values := range c.Request.Header {
			lower := strings.ToLower(strings.TrimSpace(key))
			if !isOpenAIPassthroughAllowedRequestHeader(lower, allowTimeoutHeaders) {
				continue
			}
			for _, v := range values {
				req.Header.Add(key, v)
			}
		}
	}

	// Drop any inbound credential leftovers, then inject the upstream credential.
	req.Header.Del("authorization")
	req.Header.Del("x-api-key")
	req.Header.Del("x-goog-api-key")
	req.Header.Set("authorization", "Bearer "+token)

	// Fill in the headers required when passing OAuth traffic through to the
	// ChatGPT internal API.
	if account.Type == AccountTypeOAuth {
		promptCacheKey := strings.TrimSpace(gjson.GetBytes(body, "prompt_cache_key").String())
		req.Host = "chatgpt.com"
		if chatgptAccountID := account.GetChatGPTAccountID(); chatgptAccountID != "" {
			req.Header.Set("chatgpt-account-id", chatgptAccountID)
		}
		apiKeyID := getAPIKeyIDFromContext(c)
		// Capture the client's original values first, then apply the compact
		// fallback, so the isolation step below never reads an already
		// processed value.
		clientSessionID := strings.TrimSpace(req.Header.Get("session_id"))
		clientConversationID := strings.TrimSpace(req.Header.Get("conversation_id"))
		if isOpenAIResponsesCompactPath(c) {
			// Compact requests always ask for JSON and default the version header.
			req.Header.Set("accept", "application/json")
			if req.Header.Get("version") == "" {
				req.Header.Set("version", codexCLIVersion)
			}
			if clientSessionID == "" {
				clientSessionID = resolveOpenAICompactSessionID(c)
			}
		} else if req.Header.Get("accept") == "" {
			req.Header.Set("accept", "text/event-stream")
		}
		if req.Header.Get("OpenAI-Beta") == "" {
			req.Header.Set("OpenAI-Beta", "responses=experimental")
		}
		if req.Header.Get("originator") == "" {
			req.Header.Set("originator", "codex_cli_rs")
		}
		// Overwrite the client-supplied values with isolated session
		// identifiers to prevent cross-user session collisions. When the
		// client sent none, prompt_cache_key from the body is the fallback.
		if clientSessionID == "" {
			clientSessionID = promptCacheKey
		}
		if clientConversationID == "" {
			clientConversationID = promptCacheKey
		}
		if clientSessionID != "" {
			req.Header.Set("session_id", isolateOpenAISessionID(apiKeyID, clientSessionID))
		}
		if clientConversationID != "" {
			req.Header.Set("conversation_id", isolateOpenAISessionID(apiKeyID, clientConversationID))
		}
	}

	// Passthrough mode also honors the account's custom User-Agent and the
	// ForceCodexCLI fallback. Later assignments win: ForceCodexCLI overrides
	// the custom UA.
	customUA := account.GetOpenAIUserAgent()
	if customUA != "" {
		req.Header.Set("user-agent", customUA)
	}
	if s.cfg != nil && s.cfg.Gateway.ForceCodexCLI {
		req.Header.Set("user-agent", codexCLIUserAgent)
	}
	// OAuth safe passthrough: fall back to the Codex CLI UA for any non-Codex
	// UA to reduce the chance of being blocked by upstream risk control.
	if account.Type == AccountTypeOAuth && !openai.IsCodexCLIRequest(req.Header.Get("user-agent")) {
		req.Header.Set("user-agent", codexCLIUserAgent)
	}

	if req.Header.Get("content-type") == "" {
		req.Header.Set("content-type", "application/json")
	}

	return req, nil
}

// shouldFailoverOpenAIPassthroughResponse reports whether an upstream status
// code should trigger account failover in passthrough mode. Only 429
// (Too Many Requests) and 529 qualify; every other code returns false.
func shouldFailoverOpenAIPassthroughResponse(statusCode int) bool {
	return statusCode == http.StatusTooManyRequests || statusCode == 529
}

// handleFailoverErrorResponsePassthrough converts an upstream error response
// into an *UpstreamFailoverError without writing anything to the client.
//
// It reads at most 2 MiB of the response body, records the sanitized upstream
// message (and, when LogUpstreamErrorBody is enabled, a truncated copy of the
// body) on the request's ops context, forwards the error to the rate-limit
// service when one is configured, and appends a "failover" ops event. The
// returned error carries the upstream status code, the body that was read and
// a clone of the response headers.
func (s *OpenAIGatewayService) handleFailoverErrorResponsePassthrough(
	ctx context.Context,
	resp *http.Response,
	c *gin.Context,
	account *Account,
	requestBody []byte,
) error {
	// The read error is intentionally ignored; whatever was read is used as is.
	respBody, _ := io.ReadAll(io.LimitReader(resp.Body, 2<<20))

	msg := sanitizeUpstreamErrorMessage(strings.TrimSpace(extractUpstreamErrorMessage(respBody)))

	// The raw body is only retained when upstream error body logging is enabled.
	var detail string
	if s.cfg != nil && s.cfg.Gateway.LogUpstreamErrorBody {
		limit := s.cfg.Gateway.LogUpstreamErrorBodyMaxBytes
		if limit <= 0 {
			limit = 2048
		}
		detail = truncateString(string(respBody), limit)
	}

	setOpsUpstreamError(c, resp.StatusCode, msg, detail)
	logOpenAIInstructionsRequiredDebug(ctx, c, account, resp.StatusCode, msg, requestBody, respBody)
	if s.rateLimitService != nil {
		_ = s.rateLimitService.HandleUpstreamError(ctx, account, resp.StatusCode, resp.Header, respBody)
	}

	opsEvent := OpsUpstreamErrorEvent{
		Platform:             account.Platform,
		AccountID:            account.ID,
		AccountName:          account.Name,
		UpstreamStatusCode:   resp.StatusCode,
		UpstreamRequestID:    resp.Header.Get("x-request-id"),
		Passthrough:          true,
		Kind:                 "failover",
		Message:              msg,
		Detail:               detail,
		UpstreamResponseBody: detail,
	}
	appendOpsUpstreamError(c, opsEvent)

	failover := &UpstreamFailoverError{
		StatusCode:      resp.StatusCode,
		ResponseBody:    respBody,
		ResponseHeaders: resp.Header.Clone(),
	}
	return failover
}

// handleErrorResponsePassthrough relays an upstream error response to the
// client unchanged (status code, filtered headers and body) and returns an
// error describing it.
//
// At most 2 MiB of the upstream body is read. Before the response is written,
// the sanitized upstream message is recorded on the ops context, the
// rate-limit service (when configured) is notified, and an "http_error" ops
// event is appended. The response Content-Type defaults to application/json
// when upstream did not send one.
func (s *OpenAIGatewayService) handleErrorResponsePassthrough(
	ctx context.Context,
	resp *http.Response,
	c *gin.Context,
	account *Account,
	requestBody []byte,
) error {
	// The read error is intentionally ignored; whatever was read is relayed.
	respBody, _ := io.ReadAll(io.LimitReader(resp.Body, 2<<20))

	msg := sanitizeUpstreamErrorMessage(strings.TrimSpace(extractUpstreamErrorMessage(respBody)))

	// The raw body is only retained when upstream error body logging is enabled.
	var detail string
	if s.cfg != nil && s.cfg.Gateway.LogUpstreamErrorBody {
		limit := s.cfg.Gateway.LogUpstreamErrorBodyMaxBytes
		if limit <= 0 {
			limit = 2048
		}
		detail = truncateString(string(respBody), limit)
	}

	setOpsUpstreamError(c, resp.StatusCode, msg, detail)
	logOpenAIInstructionsRequiredDebug(ctx, c, account, resp.StatusCode, msg, requestBody, respBody)
	if s.rateLimitService != nil {
		// Even though passthrough mode hands the raw upstream error back to
		// the client, the account's runtime state must still be refreshed so
		// sticky routing stops picking an account that was just rate limited.
		_ = s.rateLimitService.HandleUpstreamError(ctx, account, resp.StatusCode, resp.Header, respBody)
	}

	opsEvent := OpsUpstreamErrorEvent{
		Platform:             account.Platform,
		AccountID:            account.ID,
		AccountName:          account.Name,
		UpstreamStatusCode:   resp.StatusCode,
		UpstreamRequestID:    resp.Header.Get("x-request-id"),
		Passthrough:          true,
		Kind:                 "http_error",
		Message:              msg,
		Detail:               detail,
		UpstreamResponseBody: detail,
	}
	appendOpsUpstreamError(c, opsEvent)

	writeOpenAIPassthroughResponseHeaders(c.Writer.Header(), resp.Header, s.responseHeaderFilter)
	responseType := "application/json"
	if upstreamType := resp.Header.Get("Content-Type"); upstreamType != "" {
		responseType = upstreamType
	}
	c.Data(resp.StatusCode, responseType, respBody)

	if msg != "" {
		return fmt.Errorf("upstream error: %d message=%s", resp.StatusCode, msg)
	}
	return fmt.Errorf("upstream error: %d", resp.StatusCode)
}

// isOpenAIPassthroughAllowedRequestHeader decides whether a client request
// header may be forwarded upstream in passthrough mode. lowerKey is expected
// to be the lower-cased header name. An empty name is never allowed; timeout
// headers follow allowTimeoutHeaders; everything else is looked up in
// openaiPassthroughAllowedHeaders.
func isOpenAIPassthroughAllowedRequestHeader(lowerKey string, allowTimeoutHeaders bool) bool {
	switch {
	case lowerKey == "":
		return false
	case isOpenAIPassthroughTimeoutHeader(lowerKey):
		return allowTimeoutHeaders
	default:
		return openaiPassthroughAllowedHeaders[lowerKey]
	}
}

// isOpenAIPassthroughTimeoutHeader reports whether lowerKey names one of the
// client timeout headers. The comparison is exact, so callers must pass a
// lower-cased, trimmed header name.
func isOpenAIPassthroughTimeoutHeader(lowerKey string) bool {
	switch lowerKey {
	case "x-stainless-timeout",
		"x-stainless-read-timeout",
		"x-stainless-connect-timeout":
		return true
	case "x-request-timeout",
		"request-timeout",
		"grpc-timeout":
		return true
	}
	return false
}

// isOpenAIPassthroughTimeoutHeadersAllowed returns the
// Gateway.OpenAIPassthroughAllowTimeoutHeaders setting. It is safe to call on
// a nil receiver or with a nil config; both yield false.
func (s *OpenAIGatewayService) isOpenAIPassthroughTimeoutHeadersAllowed() bool {
	if s == nil || s.cfg == nil {
		return false
	}
	return s.cfg.Gateway.OpenAIPassthroughAllowTimeoutHeaders
}

// collectOpenAIPassthroughTimeoutHeaders lists the timeout headers present in
// h. Each entry is the lower-cased header name, followed by "=" and the
// header's values joined with "|" when it has at least one value. The result
// is sorted and is nil when nothing matches.
func collectOpenAIPassthroughTimeoutHeaders(h http.Header) []string {
	if len(h) == 0 {
		return nil
	}

	var found []string
	for name, vals := range h {
		normalized := strings.ToLower(strings.TrimSpace(name))
		if !isOpenAIPassthroughTimeoutHeader(normalized) {
			continue
		}
		if len(vals) == 0 {
			// No values recorded: report the bare header name.
			found = append(found, normalized)
			continue
		}
		found = append(found, fmt.Sprintf("%s=%s", normalized, strings.Join(vals, "|")))
	}

	// Map iteration order is random; sort for deterministic output.
	sort.Strings(found)
	return found
}

// openaiStreamingResultPassthrough is the result returned by
// handleStreamingResponsePassthrough.
//
// usage holds the token usage accumulated from the SSE data payloads seen on
// the upstream stream. firstTokenMs is the number of milliseconds between the
// request start time and the first data line that started client output
// (excluding "[DONE]"); it is nil when no such line was observed.
type openaiStreamingResultPassthrough struct {
	usage        *OpenAIUsage
	firstTokenMs *int
}

// openAIStreamClientOutputStarted reports whether any output has already
// reached the client: either the caller's own flag says so, or the gin
// response writer reports that it has been written to. A nil context or nil
// writer counts as "not started".
func openAIStreamClientOutputStarted(c *gin.Context, localStarted bool) bool {
	if localStarted {
		return true
	}
	if c == nil || c.Writer == nil {
		return false
	}
	return c.Writer.Written()
}

// openAIStreamEventIsPreamble reports whether eventType, after trimming
// surrounding whitespace, is "response.created" or "response.in_progress".
// The comparison is case-sensitive.
func openAIStreamEventIsPreamble(eventType string) bool {
	kind := strings.TrimSpace(eventType)
	return kind == "response.created" || kind == "response.in_progress"
}

// openAIStreamDataStartsClientOutput reports whether an SSE data payload
// counts as the start of client-visible output. Blank payloads,
// "response.failed" events and preamble events (see
// openAIStreamEventIsPreamble) do not; any other non-blank payload does.
func openAIStreamDataStartsClientOutput(data, eventType string) bool {
	switch {
	case strings.TrimSpace(data) == "":
		return false
	case strings.TrimSpace(eventType) == "response.failed":
		return false
	default:
		return !openAIStreamEventIsPreamble(eventType)
	}
}

// openAIStreamFailedEventShouldFailover decides whether a failed stream event
// is worth retrying on another account.
//
// The error code and type are read from payload ("response.error.*", falling
// back to "error.*"), combined with message, and lower-cased. If the combined
// text contains any non-retryable marker (invalid request, policy, safety and
// similar) the function returns false. Otherwise, including when no text is
// available at all, it returns true.
func openAIStreamFailedEventShouldFailover(payload []byte, message string) bool {
	// lookup returns the normalized value at primaryPath, or at fallbackPath
	// when the primary value is empty.
	lookup := func(primaryPath, fallbackPath string) string {
		if v := strings.ToLower(strings.TrimSpace(gjson.GetBytes(payload, primaryPath).String())); v != "" {
			return v
		}
		return strings.ToLower(strings.TrimSpace(gjson.GetBytes(payload, fallbackPath).String()))
	}
	errCode := lookup("response.error.code", "error.code")
	errKind := lookup("response.error.type", "error.type")

	haystack := strings.ToLower(strings.TrimSpace(message + " " + errCode + " " + errKind))
	if haystack == "" {
		return true
	}

	for _, marker := range [...]string{
		"invalid_request",
		"content_policy",
		"policy",
		"safety",
		"high-risk cyber",
		"not allowed",
		"violat",
	} {
		if strings.Contains(haystack, marker) {
			return false
		}
	}
	return true
}

// newOpenAIStreamFailoverError builds the *UpstreamFailoverError returned when
// an upstream stream fails in a way that should trigger failover.
//
// message is trimmed and sanitized, with a generic fallback when it ends up
// empty. When c is non-nil the error is also recorded on the ops context and
// appended as a "failover" ops event (status 502), attributed to account when
// one is given. A truncated copy of payload is attached as detail only when
// LogUpstreamErrorBody is enabled. The returned error has status 502 and a
// JSON body of the form {"error":{"type":"upstream_error","message":...}}.
func (s *OpenAIGatewayService) newOpenAIStreamFailoverError(
	c *gin.Context,
	account *Account,
	passthrough bool,
	upstreamRequestID string,
	payload []byte,
	message string,
) *UpstreamFailoverError {
	msg := sanitizeUpstreamErrorMessage(strings.TrimSpace(message))
	if msg == "" {
		msg = "OpenAI stream disconnected before completion"
	}

	var detail string
	logBody := s != nil && s.cfg != nil && s.cfg.Gateway.LogUpstreamErrorBody
	if logBody && len(payload) > 0 {
		limit := s.cfg.Gateway.LogUpstreamErrorBodyMaxBytes
		if limit <= 0 {
			limit = 2048
		}
		detail = truncateString(string(payload), limit)
	}

	if c != nil {
		setOpsUpstreamError(c, http.StatusBadGateway, msg, detail)

		// Start from platform-level defaults; account details are filled in
		// only when an account is known.
		opsEvent := OpsUpstreamErrorEvent{
			Platform:           PlatformOpenAI,
			UpstreamStatusCode: http.StatusBadGateway,
			UpstreamRequestID:  strings.TrimSpace(upstreamRequestID),
			Passthrough:        passthrough,
			Kind:               "failover",
			Message:            msg,
			Detail:             detail,
		}
		if account != nil {
			opsEvent.Platform = account.Platform
			opsEvent.AccountID = account.ID
			opsEvent.AccountName = account.Name
		}
		appendOpsUpstreamError(c, opsEvent)
	}

	// The marshal error is ignored, as in the rest of this file's error
	// builders; the payload contains only string values.
	errorBody, _ := json.Marshal(gin.H{
		"error": gin.H{
			"type":    "upstream_error",
			"message": msg,
		},
	})
	return &UpstreamFailoverError{
		StatusCode:   http.StatusBadGateway,
		ResponseBody: errorBody,
	}
}

// handleStreamingResponsePassthrough relays an upstream SSE response to the
// client line by line while collecting token usage.
//
// Lines are buffered (not written) until the first line that starts
// client-visible output. If the upstream emits a retryable "response.failed"
// event, or the stream breaks or ends without a terminal event, before any
// output reached the client, the function returns an *UpstreamFailoverError
// so the caller can retry elsewhere. Once output has started, failures are
// returned as plain errors.
//
// When the client disconnects mid-stream the upstream is still read to the
// end so usage can be collected. When originalModel and mappedModel differ,
// occurrences of mappedModel in data lines are rewritten back to
// originalModel.
//
// The returned result is non-nil on every path except when the response
// writer does not implement http.Flusher.
func (s *OpenAIGatewayService) handleStreamingResponsePassthrough(
	ctx context.Context,
	resp *http.Response,
	c *gin.Context,
	account *Account,
	startTime time.Time,
	originalModel string,
	mappedModel string,
) (*openaiStreamingResultPassthrough, error) {
	writeOpenAIPassthroughResponseHeaders(c.Writer.Header(), resp.Header, s.responseHeaderFilter)

	// SSE headers
	c.Header("Content-Type", "text/event-stream")
	c.Header("Cache-Control", "no-cache")
	c.Header("Connection", "keep-alive")
	c.Header("X-Accel-Buffering", "no")
	if v := resp.Header.Get("x-request-id"); v != "" {
		c.Header("x-request-id", v)
	}

	w := c.Writer
	flusher, ok := w.(http.Flusher)
	if !ok {
		return nil, errors.New("streaming not supported")
	}

	usage := &OpenAIUsage{}
	var firstTokenMs *int
	clientDisconnected := false  // a write to the client failed; keep reading upstream only
	sawDone := false             // a "[DONE]" data payload was seen
	sawTerminalEvent := false    // openAIStreamEventIsTerminal matched a data payload
	sawFailedEvent := false      // a "response.failed" event was relayed to the client
	failedMessage := ""          // error message extracted from the last "response.failed" event
	clientOutputStarted := false // at least one line was successfully written to the client
	upstreamRequestID := strings.TrimSpace(resp.Header.Get("x-request-id"))
	// pendingLines holds lines received before client output started.
	pendingLines := make([]string, 0, 8)
	// writePendingLines writes the buffered lines to the client and clears the
	// buffer. It returns false (and marks the client as disconnected) on the
	// first write error.
	writePendingLines := func() bool {
		for _, pending := range pendingLines {
			if _, err := fmt.Fprintln(w, pending); err != nil {
				clientDisconnected = true
				logger.LegacyPrintf("service.openai_gateway", "[OpenAI passthrough] Client disconnected during streaming, continue draining upstream for usage: account=%d", account.ID)
				return false
			}
		}
		pendingLines = pendingLines[:0]
		return true
	}

	scanner := bufio.NewScanner(resp.Body)
	// The maximum SSE line size is configurable; defaultMaxLineSize applies otherwise.
	maxLineSize := defaultMaxLineSize
	if s.cfg != nil && s.cfg.Gateway.MaxLineSize > 0 {
		maxLineSize = s.cfg.Gateway.MaxLineSize
	}
	// The initial scan buffer comes from getSSEScannerBuf64K and is handed
	// back through putSSEScannerBuf64K when the function returns.
	scanBuf := getSSEScannerBuf64K()
	scanner.Buffer(scanBuf[:0], maxLineSize)
	defer putSSEScannerBuf64K(scanBuf)

	needModelReplace := strings.TrimSpace(originalModel) != "" && strings.TrimSpace(mappedModel) != "" && strings.TrimSpace(originalModel) != strings.TrimSpace(mappedModel)

	for scanner.Scan() {
		line := scanner.Text()
		lineStartsClientOutput := false
		forceFlushFailedEvent := false
		if data, ok := extractOpenAISSEDataLine(line); ok {
			dataBytes := []byte(data)
			trimmedData := strings.TrimSpace(data)
			// Rewrite the mapped model name back to the one the client asked
			// for, then re-extract the payload so later checks see the
			// rewritten data.
			if needModelReplace && strings.Contains(data, mappedModel) {
				line = s.replaceModelInSSELine(line, mappedModel, originalModel)
				if replacedData, replaced := extractOpenAISSEDataLine(line); replaced {
					dataBytes = []byte(replacedData)
					trimmedData = strings.TrimSpace(replacedData)
				}
			}
			eventType := strings.TrimSpace(gjson.Get(trimmedData, "type").String())
			if eventType == "response.failed" {
				failedMessage = extractOpenAISSEErrorMessage(dataBytes)
				// Nothing has reached the client yet and the failure looks
				// retryable: hand control back for failover instead of
				// relaying the failed event.
				if !openAIStreamClientOutputStarted(c, clientOutputStarted) && openAIStreamFailedEventShouldFailover(dataBytes, failedMessage) {
					return &openaiStreamingResultPassthrough{usage: usage, firstTokenMs: firstTokenMs},
						s.newOpenAIStreamFailoverError(c, account, true, upstreamRequestID, dataBytes, failedMessage)
				}
				// Otherwise the failed event must be delivered to the client.
				forceFlushFailedEvent = true
				sawFailedEvent = true
			}
			if trimmedData == "[DONE]" {
				sawDone = true
			}
			if openAIStreamEventIsTerminal(trimmedData) {
				sawTerminalEvent = true
			}
			lineStartsClientOutput = forceFlushFailedEvent || openAIStreamDataStartsClientOutput(trimmedData, eventType)
			// Record time-to-first-output once, ignoring the "[DONE]" marker.
			if firstTokenMs == nil && lineStartsClientOutput && trimmedData != "[DONE]" {
				ms := int(time.Since(startTime).Milliseconds())
				firstTokenMs = &ms
			}
			s.parseSSEUsageBytes(dataBytes, usage)
		}

		// After a client disconnect nothing more is written, but the loop
		// keeps reading so usage can still be collected.
		if !clientDisconnected {
			// Hold back everything that precedes the first client-visible line.
			if !clientOutputStarted && !lineStartsClientOutput {
				pendingLines = append(pendingLines, line)
				continue
			}
			// First client-visible line: deliver the buffered lines before it.
			if !clientOutputStarted && len(pendingLines) > 0 {
				if !writePendingLines() {
					continue
				}
			}
			if _, err := fmt.Fprintln(w, line); err != nil {
				clientDisconnected = true
				logger.LegacyPrintf("service.openai_gateway", "[OpenAI passthrough] Client disconnected during streaming, continue draining upstream for usage: account=%d", account.ID)
			} else {
				clientOutputStarted = true
				flusher.Flush()
			}
		}
	}
	if err := scanner.Err(); err != nil {
		// A read error after a successful terminal event is not a failure.
		if sawTerminalEvent && !sawFailedEvent {
			return &openaiStreamingResultPassthrough{usage: usage, firstTokenMs: firstTokenMs}, nil
		}
		if sawFailedEvent {
			return &openaiStreamingResultPassthrough{usage: usage, firstTokenMs: firstTokenMs}, fmt.Errorf("upstream response failed: %s", failedMessage)
		}
		if errors.Is(err, context.Canceled) || errors.Is(err, context.DeadlineExceeded) {
			return &openaiStreamingResultPassthrough{usage: usage, firstTokenMs: firstTokenMs}, fmt.Errorf("stream usage incomplete: %w", err)
		}
		if errors.Is(err, bufio.ErrTooLong) {
			logger.LegacyPrintf("service.openai_gateway", "[OpenAI passthrough] SSE line too long: account=%d max_size=%d error=%v", account.ID, maxLineSize, err)
			return &openaiStreamingResultPassthrough{usage: usage, firstTokenMs: firstTokenMs}, err
		}
		// The stream broke before the client received anything: fail over.
		if !openAIStreamClientOutputStarted(c, clientOutputStarted) {
			msg := "OpenAI stream disconnected before completion"
			if errText := strings.TrimSpace(err.Error()); errText != "" {
				msg += ": " + errText
			}
			return &openaiStreamingResultPassthrough{usage: usage, firstTokenMs: firstTokenMs},
				s.newOpenAIStreamFailoverError(c, account, true, upstreamRequestID, nil, msg)
		}
		if clientDisconnected {
			return &openaiStreamingResultPassthrough{usage: usage, firstTokenMs: firstTokenMs}, fmt.Errorf("stream usage incomplete after disconnect: %w", err)
		}
		logger.LegacyPrintf("service.openai_gateway",
			"[OpenAI passthrough] 流读取异常中断: account=%d request_id=%s err=%v",
			account.ID,
			upstreamRequestID,
			err,
		)
		return &openaiStreamingResultPassthrough{usage: usage, firstTokenMs: firstTokenMs}, fmt.Errorf("stream read error: %w", err)
	}
	if sawFailedEvent {
		return &openaiStreamingResultPassthrough{usage: usage, firstTokenMs: firstTokenMs}, fmt.Errorf("upstream response failed: %s", failedMessage)
	}
	// The upstream closed cleanly but never sent "[DONE]" or a terminal event
	// while the client and the request context were still alive: treat this
	// as a truncated stream.
	if !clientDisconnected && !sawDone && !sawTerminalEvent && ctx.Err() == nil {
		logger.FromContext(ctx).With(
			zap.String("component", "service.openai_gateway"),
			zap.Int64("account_id", account.ID),
			zap.String("upstream_request_id", upstreamRequestID),
		).Info("OpenAI passthrough 上游流在未收到 [DONE] 时结束，疑似断流")
		if !openAIStreamClientOutputStarted(c, clientOutputStarted) {
			return &openaiStreamingResultPassthrough{usage: usage, firstTokenMs: firstTokenMs},
				s.newOpenAIStreamFailoverError(c, account, true, upstreamRequestID, nil, "OpenAI stream ended before a terminal event")
		}
		return &openaiStreamingResultPassthrough{usage: usage, firstTokenMs: firstTokenMs}, errors.New("stream usage incomplete: missing terminal event")
	}

	return &openaiStreamingResultPassthrough{usage: usage, firstTokenMs: firstTokenMs}, nil
}

// handleNonStreamingResponsePassthrough relays a non-streaming upstream
// response to the client and returns the token usage found in it.
//
// If upstream answered with an event stream even though a non-streaming
// response was expected, handling is delegated to handlePassthroughSSEToJSON.
// Otherwise usage is parsed from the JSON body, falling back to SSE-style
// parsing of the body text, and the body is written with the upstream status
// code. When originalModel and mappedModel are both set and differ, the body
// is passed through replaceModelInResponseBody before it is written.
func (s *OpenAIGatewayService) handleNonStreamingResponsePassthrough(
	ctx context.Context,
	resp *http.Response,
	c *gin.Context,
	originalModel string,
	mappedModel string,
) (*OpenAIUsage, error) {
	payload, err := ReadUpstreamResponseBody(resp.Body, s.cfg, c, openAITooLargeError)
	if err != nil {
		return nil, err
	}

	// Some upstreams (for example other sub2api instances) reply with SSE even
	// for stream=false requests. Convert such responses to JSON; otherwise the
	// client would get raw SSE text or a terminal event with empty output.
	if isEventStreamResponse(resp.Header) {
		return s.handlePassthroughSSEToJSON(resp, c, payload, originalModel, mappedModel)
	}

	var usage *OpenAIUsage
	if len(payload) > 0 {
		if parsed, found := extractOpenAIUsageFromJSONBytes(payload); found {
			usage = &parsed
		}
	}
	if usage == nil {
		// Fallback: try to parse usage out of SSE-formatted text.
		usage = s.parseSSEUsageFromBody(string(payload))
	}

	writeOpenAIPassthroughResponseHeaders(c.Writer.Header(), resp.Header, s.responseHeaderFilter)

	responseType := "application/json"
	if upstreamType := resp.Header.Get("Content-Type"); upstreamType != "" {
		responseType = upstreamType
	}

	needsModelRestore := originalModel != "" && mappedModel != "" && originalModel != mappedModel
	if needsModelRestore {
		payload = s.replaceModelInResponseBody(payload, mappedModel, originalModel)
	}
	c.Data(resp.StatusCode, responseType, payload)
	return usage, nil
}

// handlePassthroughSSEToJSON converts an SSE response body into a JSON
// response for the passthrough path. It mirrors handleSSEToJSON while
// preserving passthrough payloads, except compact-only model remapping may
// rewrite model fields back to the original requested model.
//
// When a final response can be extracted from the SSE text, that JSON object
// is returned to the client as "application/json; charset=utf-8". When it
// cannot, a terminal "response.failed" event is turned into a protocol error;
// otherwise the SSE text is relayed with the upstream Content-Type
// (defaulting to "text/event-stream"). In both successful cases the upstream
// status code is reused and the parsed usage is returned.
func (s *OpenAIGatewayService) handlePassthroughSSEToJSON(resp *http.Response, c *gin.Context, body []byte, originalModel string, mappedModel string) (*OpenAIUsage, error) {
	bodyText := string(body)
	finalResponse, ok := extractCodexFinalResponse(bodyText)

	usage := &OpenAIUsage{}
	if ok {
		if parsedUsage, parsed := extractOpenAIUsageFromJSONBytes(finalResponse); parsed {
			*usage = parsedUsage
		}
		// When the terminal event has an empty output array, reconstruct
		// output from accumulated delta events so the client gets full content.
		// A failed patch is ignored and the unpatched final response is used.
		if len(gjson.GetBytes(finalResponse, "output").Array()) == 0 {
			if outputJSON, reconstructed := reconstructResponseOutputFromSSE(bodyText); reconstructed {
				if patched, err := sjson.SetRawBytes(finalResponse, "output", outputJSON); err == nil {
					finalResponse = patched
				}
			}
		}
		body = finalResponse
		if originalModel != "" && mappedModel != "" && originalModel != mappedModel {
			body = s.replaceModelInResponseBody(body, mappedModel, originalModel)
		}
		// Correct tool calls in final response
		body = s.correctToolCallsInResponseBody(body)
	} else {
		// No final response could be extracted: surface an upstream failure
		// as an error, otherwise relay the SSE text itself.
		terminalType, terminalPayload, terminalOK := extractOpenAISSETerminalEvent(bodyText)
		if terminalOK && terminalType == "response.failed" {
			msg := extractOpenAISSEErrorMessage(terminalPayload)
			if msg == "" {
				msg = "Upstream compact response failed"
			}
			return nil, s.writeOpenAINonStreamingProtocolError(resp, c, msg)
		}
		usage = s.parseSSEUsageFromBody(bodyText)
		if originalModel != "" && mappedModel != "" && originalModel != mappedModel {
			bodyText = s.replaceModelInSSEBody(bodyText, mappedModel, originalModel)
		}
		body = []byte(bodyText)
	}

	writeOpenAIPassthroughResponseHeaders(c.Writer.Header(), resp.Header, s.responseHeaderFilter)

	// The converted body is JSON; an unconverted body keeps the upstream type.
	contentType := "application/json; charset=utf-8"
	if !ok {
		contentType = resp.Header.Get("Content-Type")
		if contentType == "" {
			contentType = "text/event-stream"
		}
	}
	c.Data(resp.StatusCode, contentType, body)

	return usage, nil
}

// writeOpenAIPassthroughResponseHeaders copies upstream response headers from
// src into dst for passthrough responses. It does nothing when either header
// map is nil.
//
// With a filter, the copy is delegated to responseheaders.WriteFilteredHeaders.
// Without one, only a non-blank Content-Type is carried over. In both cases
// the x-codex-* rate-limit headers present in src are then forced into dst,
// replacing any values dst already had under the canonical key.
func writeOpenAIPassthroughResponseHeaders(dst http.Header, src http.Header, filter *responseheaders.CompiledHeaderFilter) {
	if dst == nil || src == nil {
		return
	}

	switch {
	case filter != nil:
		responseheaders.WriteFilteredHeaders(dst, src, filter)
	default:
		// Fallback: keep at least the basic content type.
		if contentType := strings.TrimSpace(src.Get("Content-Type")); contentType != "" {
			dst.Set("Content-Type", contentType)
		}
	}

	// Passthrough mode always lets x-codex-* response headers through when the
	// upstream sent them.
	codexHeaders := [...]string{
		"x-codex-primary-used-percent",
		"x-codex-primary-reset-after-seconds",
		"x-codex-primary-window-minutes",
		"x-codex-secondary-used-percent",
		"x-codex-secondary-reset-after-seconds",
		"x-codex-secondary-window-minutes",
		"x-codex-primary-over-secondary-limit-percent",
	}
	for _, name := range codexHeaders {
		// Keys of a real http.Response.Header are normally canonicalized, but
		// tests and hand-built responses may not be, so the lookup is done
		// case-insensitively with EqualFold.
		var found []string
		for srcKey, srcVals := range src {
			if strings.EqualFold(srcKey, name) {
				found = srcVals
				break
			}
		}
		if len(found) == 0 {
			continue
		}

		canonical := http.CanonicalHeaderKey(name)
		dst.Del(canonical)
		for _, value := range found {
			dst.Add(canonical, value)
		}
	}
}

// buildUpstreamRequest builds the upstream POST request for the
// non-passthrough forwarding path.
//
// The target URL depends on the account type: OAuth accounts use
// chatgptCodexURL, API-key accounts use their validated custom base URL when
// one is configured, and everything else uses openaiPlatformAPIURL. The
// request path suffix derived from c is appended in all cases.
//
// The upstream credential is set as "Bearer "+token, and client headers listed
// in openaiAllowedHeaders are copied over. The copy is skipped when c or
// c.Request is nil, matching buildUpstreamRequestOpenAIPassthrough. For OAuth
// accounts the client-supplied session headers are dropped and replaced by
// isolated values derived from the compact session and/or promptCacheKey.
//
// It returns an error when the custom base URL fails validation or when the
// request cannot be constructed.
func (s *OpenAIGatewayService) buildUpstreamRequest(ctx context.Context, c *gin.Context, account *Account, body []byte, token string, isStream bool, promptCacheKey string, isCodexCLI bool) (*http.Request, error) {
	// Determine target URL based on account type
	var targetURL string
	switch account.Type {
	case AccountTypeOAuth:
		// OAuth accounts use ChatGPT internal API
		targetURL = chatgptCodexURL
	case AccountTypeAPIKey:
		// API Key accounts use Platform API or custom base URL
		baseURL := account.GetOpenAIBaseURL()
		if baseURL == "" {
			targetURL = openaiPlatformAPIURL
		} else {
			validatedURL, err := s.validateUpstreamBaseURL(baseURL)
			if err != nil {
				return nil, err
			}
			targetURL = buildOpenAIResponsesURL(validatedURL)
		}
	default:
		targetURL = openaiPlatformAPIURL
	}
	targetURL = appendOpenAIResponsesRequestPathSuffix(targetURL, openAIResponsesRequestPathSuffix(c))

	req, err := http.NewRequestWithContext(ctx, "POST", targetURL, bytes.NewReader(body))
	if err != nil {
		return nil, err
	}

	// Set authentication header
	req.Header.Set("authorization", "Bearer "+token)

	// Set headers specific to OAuth accounts (ChatGPT internal API)
	if account.Type == AccountTypeOAuth {
		// Required: set Host for ChatGPT API (must use req.Host, not Header.Set)
		req.Host = "chatgpt.com"
		// Required: set chatgpt-account-id header
		chatgptAccountID := account.GetChatGPTAccountID()
		if chatgptAccountID != "" {
			req.Header.Set("chatgpt-account-id", chatgptAccountID)
		}
	}

	// Whitelist passthrough headers. Guard against a missing inbound request
	// so a nil context cannot cause a nil-pointer dereference here.
	if c != nil && c.Request != nil {
		for key, values := range c.Request.Header {
			lowerKey := strings.ToLower(key)
			if openaiAllowedHeaders[lowerKey] {
				for _, v := range values {
					req.Header.Add(key, v)
				}
			}
		}
	}
	if account.Type == AccountTypeOAuth {
		// Remove the session headers forwarded from the client; they are set
		// again below with isolated values to prevent cross-user session
		// collisions.
		req.Header.Del("conversation_id")
		req.Header.Del("session_id")

		req.Header.Set("OpenAI-Beta", "responses=experimental")
		req.Header.Set("originator", resolveOpenAIUpstreamOriginator(c, isCodexCLI))
		apiKeyID := getAPIKeyIDFromContext(c)
		if isOpenAIResponsesCompactPath(c) {
			req.Header.Set("accept", "application/json")
			if req.Header.Get("version") == "" {
				req.Header.Set("version", codexCLIVersion)
			}
			compactSession := resolveOpenAICompactSessionID(c)
			req.Header.Set("session_id", isolateOpenAISessionID(apiKeyID, compactSession))
		} else {
			req.Header.Set("accept", "text/event-stream")
		}
		// A prompt cache key, when present, takes over both session headers
		// (including a compact session_id set just above).
		if promptCacheKey != "" {
			isolated := isolateOpenAISessionID(apiKeyID, promptCacheKey)
			req.Header.Set("conversation_id", isolated)
			req.Header.Set("session_id", isolated)
		}
	}

	// Apply custom User-Agent if configured
	customUA := account.GetOpenAIUserAgent()
	if customUA != "" {
		req.Header.Set("user-agent", customUA)
	}

	// When ForceCodexCLI is enabled, force the upstream User-Agent to look
	// like the Codex CLI, so Codex-side detection still matches even if the
	// gateway did not forward or rewrote the User-Agent.
	if s.cfg != nil && s.cfg.Gateway.ForceCodexCLI {
		req.Header.Set("user-agent", codexCLIUserAgent)
	}

	// Ensure required headers exist
	if req.Header.Get("content-type") == "" {
		req.Header.Set("content-type", "application/json")
	}

	return req, nil
}

// handleErrorResponse handles an upstream error response on the
// non-passthrough path. It always returns a nil result and a non-nil error.
//
// Processing order:
//  1. Read at most 2 MiB of the body and record the sanitized upstream message
//     on the ops context (optionally logging the body).
//  2. If an error passthrough rule matches, write the rule's status/type/
//     message to the client and return.
//  3. If the account does not handle this status code, write a generic 500
//     response and return.
//  4. Otherwise notify the rate-limit service; when it reports that the
//     account should be disabled, return an *UpstreamFailoverError without
//     writing a response.
//  5. Otherwise write a status-specific error response (429 stays 429, all
//     other codes become 502) and return a descriptive error.
func (s *OpenAIGatewayService) handleErrorResponse(
	ctx context.Context,
	resp *http.Response,
	c *gin.Context,
	account *Account,
	requestBody []byte,
) (*OpenAIForwardResult, error) {
	// The read error is intentionally ignored; whatever was read is used as is.
	body, _ := io.ReadAll(io.LimitReader(resp.Body, 2<<20))

	upstreamMsg := strings.TrimSpace(extractUpstreamErrorMessage(body))
	upstreamMsg = sanitizeUpstreamErrorMessage(upstreamMsg)
	// The raw body is only retained when upstream error body logging is enabled.
	upstreamDetail := ""
	if s.cfg != nil && s.cfg.Gateway.LogUpstreamErrorBody {
		maxBytes := s.cfg.Gateway.LogUpstreamErrorBodyMaxBytes
		if maxBytes <= 0 {
			maxBytes = 2048
		}
		upstreamDetail = truncateString(string(body), maxBytes)
	}
	setOpsUpstreamError(c, resp.StatusCode, upstreamMsg, upstreamDetail)
	logOpenAIInstructionsRequiredDebug(ctx, c, account, resp.StatusCode, upstreamMsg, requestBody, body)

	if s.cfg != nil && s.cfg.Gateway.LogUpstreamErrorBody {
		logger.LegacyPrintf("service.openai_gateway",
			"OpenAI upstream error %d (account=%d platform=%s type=%s): %s",
			resp.StatusCode,
			account.ID,
			account.Platform,
			account.Type,
			truncateForLog(body, s.cfg.Gateway.LogUpstreamErrorBodyMaxBytes),
		)
	}

	// A matching error passthrough rule decides the client-facing status,
	// type and message; no further handling happens in that case.
	if status, errType, errMsg, matched := applyErrorPassthroughRule(
		c,
		PlatformOpenAI,
		resp.StatusCode,
		body,
		http.StatusBadGateway,
		"upstream_error",
		"Upstream request failed",
	); matched {
		c.JSON(status, gin.H{
			"error": gin.H{
				"type":    errType,
				"message": errMsg,
			},
		})
		if upstreamMsg == "" {
			upstreamMsg = errMsg
		}
		if upstreamMsg == "" {
			return nil, fmt.Errorf("upstream error: %d (passthrough rule matched)", resp.StatusCode)
		}
		return nil, fmt.Errorf("upstream error: %d (passthrough rule matched) message=%s", resp.StatusCode, upstreamMsg)
	}

	// Check custom error codes
	if !account.ShouldHandleErrorCode(resp.StatusCode) {
		appendOpsUpstreamError(c, OpsUpstreamErrorEvent{
			Platform:           account.Platform,
			AccountID:          account.ID,
			AccountName:        account.Name,
			UpstreamStatusCode: resp.StatusCode,
			UpstreamRequestID:  resp.Header.Get("x-request-id"),
			Kind:               "http_error",
			Message:            upstreamMsg,
			Detail:             upstreamDetail,
		})
		c.JSON(http.StatusInternalServerError, gin.H{
			"error": gin.H{
				"type":    "upstream_error",
				"message": "Upstream gateway error",
			},
		})
		if upstreamMsg == "" {
			return nil, fmt.Errorf("upstream error: %d (not in custom error codes)", resp.StatusCode)
		}
		return nil, fmt.Errorf("upstream error: %d (not in custom error codes) message=%s", resp.StatusCode, upstreamMsg)
	}

	// Handle upstream error (mark account status)
	shouldDisable := false
	if s.rateLimitService != nil {
		shouldDisable = s.rateLimitService.HandleUpstreamError(ctx, account, resp.StatusCode, resp.Header, body)
	}
	// The ops event is labeled "failover" when the account is being disabled.
	kind := "http_error"
	if shouldDisable {
		kind = "failover"
	}
	appendOpsUpstreamError(c, OpsUpstreamErrorEvent{
		Platform:           account.Platform,
		AccountID:          account.ID,
		AccountName:        account.Name,
		UpstreamStatusCode: resp.StatusCode,
		UpstreamRequestID:  resp.Header.Get("x-request-id"),
		Kind:               kind,
		Message:            upstreamMsg,
		Detail:             upstreamDetail,
	})
	if shouldDisable {
		// No response is written here; the failover error is returned to the caller.
		return nil, &UpstreamFailoverError{
			StatusCode:             resp.StatusCode,
			ResponseBody:           body,
			RetryableOnSameAccount: account.IsPoolMode() && isPoolModeRetryableStatus(resp.StatusCode),
		}
	}

	// Return appropriate error response
	var errType, errMsg string
	var statusCode int

	switch resp.StatusCode {
	case 401:
		statusCode = http.StatusBadGateway
		errType = "upstream_error"
		errMsg = "Upstream authentication failed, please contact administrator"
	case 402:
		statusCode = http.StatusBadGateway
		errType = "upstream_error"
		errMsg = "Upstream payment required: insufficient balance or billing issue"
	case 403:
		statusCode = http.StatusBadGateway
		errType = "upstream_error"
		errMsg = "Upstream access forbidden, please contact administrator"
	case 429:
		statusCode = http.StatusTooManyRequests
		errType = "rate_limit_error"
		errMsg = "Upstream rate limit exceeded, please retry later"
	default:
		statusCode = http.StatusBadGateway
		errType = "upstream_error"
		errMsg = "Upstream request failed"
	}

	c.JSON(statusCode, gin.H{
		"error": gin.H{
			"type":    errType,
			"message": errMsg,
		},
	})

	if upstreamMsg == "" {
		return nil, fmt.Errorf("upstream error: %d", resp.StatusCode)
	}
	return nil, fmt.Errorf("upstream error: %d message=%s", resp.StatusCode, upstreamMsg)
}

// compatErrorWriter is the signature for format-specific error writers used by
// the compat paths (Chat Completions and Anthropic Messages). An
// implementation receives the gin context, the HTTP status code to send, and
// the error type and message to render in that format's error envelope.
type compatErrorWriter func(c *gin.Context, statusCode int, errType, message string)

// handleCompatErrorResponse handles an upstream error response on the Chat
// Completions and Anthropic Messages compat paths. The steps run in this order:
//
//  1. Read up to 2 MiB of the upstream body, derive a sanitized message and an
//     optional (config-gated, truncated) detail string, and record both via
//     setOpsUpstreamError.
//  2. If an error passthrough rule matches, write the rule's response.
//  3. If the account does not handle this status code, write a generic 500.
//  4. Let the rate-limit service inspect the error; when it asks for the account
//     to be disabled, return an *UpstreamFailoverError without writing anything.
//  5. Otherwise write the upstream status with a mapped error type.
//
// The final write is always delegated to writeError. The returned result is
// always nil; the returned error is always non-nil.
func (s *OpenAIGatewayService) handleCompatErrorResponse(
	resp *http.Response,
	c *gin.Context,
	account *Account,
	writeError compatErrorWriter,
) (*OpenAIForwardResult, error) {
	// A read failure is tolerated: whatever was read is used as the body.
	body, _ := io.ReadAll(io.LimitReader(resp.Body, 2<<20))
	upstreamStatus := resp.StatusCode

	upstreamMsg := strings.TrimSpace(extractUpstreamErrorMessage(body))
	if upstreamMsg == "" {
		upstreamMsg = fmt.Sprintf("Upstream error: %d", upstreamStatus)
	}
	upstreamMsg = sanitizeUpstreamErrorMessage(upstreamMsg)

	var upstreamDetail string
	if s.cfg != nil && s.cfg.Gateway.LogUpstreamErrorBody {
		limit := s.cfg.Gateway.LogUpstreamErrorBodyMaxBytes
		if limit <= 0 {
			limit = 2048
		}
		upstreamDetail = truncateString(string(body), limit)
	}
	setOpsUpstreamError(c, upstreamStatus, upstreamMsg, upstreamDetail)

	// recordEvent appends one ops event of the given kind for this response.
	recordEvent := func(kind string) {
		appendOpsUpstreamError(c, OpsUpstreamErrorEvent{
			Platform:           account.Platform,
			AccountID:          account.ID,
			AccountName:        account.Name,
			UpstreamStatusCode: upstreamStatus,
			UpstreamRequestID:  resp.Header.Get("x-request-id"),
			Kind:               kind,
			Message:            upstreamMsg,
			Detail:             upstreamDetail,
		})
	}
	// qualifiedErr builds the returned error for the early-exit branches; the
	// message suffix is omitted when no upstream message is available.
	qualifiedErr := func(reason string) error {
		if upstreamMsg == "" {
			return fmt.Errorf("upstream error: %d (%s)", upstreamStatus, reason)
		}
		return fmt.Errorf("upstream error: %d (%s) message=%s", upstreamStatus, reason, upstreamMsg)
	}

	// Error passthrough rules take precedence over everything else.
	ruleStatus, ruleType, ruleMsg, ruleMatched := applyErrorPassthroughRule(
		c, account.Platform, upstreamStatus, body,
		http.StatusBadGateway, "api_error", "Upstream request failed",
	)
	if ruleMatched {
		writeError(c, ruleStatus, ruleType, ruleMsg)
		if upstreamMsg == "" {
			upstreamMsg = ruleMsg
		}
		return nil, qualifiedErr("passthrough rule matched")
	}

	// Status codes the account is not configured to handle get a generic error
	// that exposes no upstream details.
	if !account.ShouldHandleErrorCode(upstreamStatus) {
		recordEvent("http_error")
		writeError(c, http.StatusInternalServerError, "api_error", "Upstream gateway error")
		return nil, qualifiedErr("not in custom error codes")
	}

	// Rate-limit tracking decides whether the caller should fail over.
	failover := s.rateLimitService != nil && s.rateLimitService.HandleUpstreamError(
		c.Request.Context(), account, upstreamStatus, resp.Header, body,
	)
	if failover {
		recordEvent("failover")
		return nil, &UpstreamFailoverError{
			StatusCode:             upstreamStatus,
			ResponseBody:           body,
			RetryableOnSameAccount: account.IsPoolMode() && isPoolModeRetryableStatus(upstreamStatus),
		}
	}
	recordEvent("http_error")

	// Map the upstream status to an error type; anything unlisted is "api_error".
	var errType string
	switch upstreamStatus {
	case http.StatusBadRequest:
		errType = "invalid_request_error"
	case http.StatusNotFound:
		errType = "not_found_error"
	case http.StatusTooManyRequests:
		errType = "rate_limit_error"
	default:
		errType = "api_error"
	}

	writeError(c, upstreamStatus, errType, upstreamMsg)
	return nil, fmt.Errorf("upstream error: %d %s", upstreamStatus, upstreamMsg)
}

// openaiStreamingResult is what handleStreamingResponse returns once a stream
// has been relayed (successfully or not).
type openaiStreamingResult struct {
	// usage holds the token counts parsed from the stream's SSE data events.
	usage        *OpenAIUsage
	// firstTokenMs is the elapsed time in milliseconds from the request start
	// time to the first event that starts client output; nil if none was seen.
	firstTokenMs *int
}

// handleStreamingResponse relays an upstream SSE response to the client line by
// line while collecting usage and the time to the first output event.
//
// Behaviour visible in this function:
//   - Response headers are filtered (when a filter is configured) and the SSE
//     headers are set before any body is written.
//   - Output goes through a 4 KiB buffered writer. It is flushed when the
//     upstream queue is drained and client output has started, and always for
//     the first output-starting event.
//   - When a downstream write fails, the client is marked disconnected and the
//     upstream is still read to the end so usage can be collected.
//   - If the stream fails before any client output started (a qualifying
//     response.failed event, a read error, or EOF without a terminal event), the
//     error built by newOpenAIStreamFailoverError is returned.
//   - With neither a data-interval timeout nor a keepalive interval configured,
//     the body is scanned synchronously; otherwise a goroutine feeds lines over a
//     channel so the timers can be serviced.
//
// Apart from the "streaming not supported" case, the returned result is non-nil
// even when an error is returned, carrying whatever usage was collected.
func (s *OpenAIGatewayService) handleStreamingResponse(ctx context.Context, resp *http.Response, c *gin.Context, account *Account, startTime time.Time, originalModel, mappedModel string) (*openaiStreamingResult, error) {
	if s.responseHeaderFilter != nil {
		responseheaders.WriteFilteredHeaders(c.Writer.Header(), resp.Header, s.responseHeaderFilter)
	}

	// Set SSE response headers
	c.Header("Content-Type", "text/event-stream")
	c.Header("Cache-Control", "no-cache")
	c.Header("Connection", "keep-alive")
	c.Header("X-Accel-Buffering", "no")

	// Pass through other headers
	if v := resp.Header.Get("x-request-id"); v != "" {
		c.Header("x-request-id", v)
	}

	w := c.Writer
	flusher, ok := w.(http.Flusher)
	if !ok {
		return nil, errors.New("streaming not supported")
	}
	bufferedWriter := bufio.NewWriterSize(w, 4*1024)
	// flushBuffered pushes buffered bytes to the response writer and then
	// flushes the response writer itself.
	flushBuffered := func() error {
		if err := bufferedWriter.Flush(); err != nil {
			return err
		}
		flusher.Flush()
		return nil
	}

	usage := &OpenAIUsage{}
	var firstTokenMs *int
	scanner := bufio.NewScanner(resp.Body)
	maxLineSize := defaultMaxLineSize
	if s.cfg != nil && s.cfg.Gateway.MaxLineSize > 0 {
		maxLineSize = s.cfg.Gateway.MaxLineSize
	}
	scanBuf := getSSEScannerBuf64K()
	scanner.Buffer(scanBuf[:0], maxLineSize)

	streamInterval := time.Duration(0)
	if s.cfg != nil && s.cfg.Gateway.StreamDataIntervalTimeout > 0 {
		streamInterval = time.Duration(s.cfg.Gateway.StreamDataIntervalTimeout) * time.Second
	}
	// Only monitors the gap between upstream reads; it is not affected by
	// downstream writes blocking.
	var intervalTicker *time.Ticker
	if streamInterval > 0 {
		intervalTicker = time.NewTicker(streamInterval)
		defer intervalTicker.Stop()
	}
	// A nil channel is never ready in select, which disables the case below
	// when no interval is configured.
	var intervalCh <-chan time.Time
	if intervalTicker != nil {
		intervalCh = intervalTicker.C
	}

	keepaliveInterval := time.Duration(0)
	if s.cfg != nil && s.cfg.Gateway.StreamKeepaliveInterval > 0 {
		keepaliveInterval = time.Duration(s.cfg.Gateway.StreamKeepaliveInterval) * time.Second
	}
	// The downstream keepalive only exists to stop proxies from closing an
	// idle connection.
	var keepaliveTicker *time.Ticker
	if keepaliveInterval > 0 {
		keepaliveTicker = time.NewTicker(keepaliveInterval)
		defer keepaliveTicker.Stop()
	}
	var keepaliveCh <-chan time.Time
	if keepaliveTicker != nil {
		keepaliveCh = keepaliveTicker.C
	}
	// Track downstream writes separately from upstream reads: pre-output failover
	// can buffer response.created / response.in_progress, so keepalive must be
	// based on downstream idle time.
	lastDownstreamWriteAt := time.Now()

	// Send the error event at most once so repeated writes cannot corrupt the
	// protocol.
	// Note: OpenAI `/v1/responses` streaming events must conform to the OpenAI
	// Responses schema; otherwise downstream SDKs (for example OpenCode) fail
	// type validation and report an error.
	errorEventSent := false
	clientDisconnected := false // after the client disconnects, keep draining upstream to collect usage
	sawTerminalEvent := false
	sawFailedEvent := false
	failedMessage := ""
	clientOutputStarted := false
	upstreamRequestID := strings.TrimSpace(resp.Header.Get("x-request-id"))
	var streamFailoverErr error
	// sendErrorEvent writes a single `error` SSE event whose message and code
	// are both the given reason. It is a no-op once an error event was sent or
	// the client is gone.
	sendErrorEvent := func(reason string) {
		if errorEventSent || clientDisconnected {
			return
		}
		errorEventSent = true
		payload := `{"type":"error","sequence_number":0,"error":{"type":"upstream_error","message":` + strconv.Quote(reason) + `,"code":` + strconv.Quote(reason) + `}}`
		// Flush anything already buffered first so the error event follows it.
		if err := flushBuffered(); err != nil {
			clientDisconnected = true
			return
		}
		if _, err := bufferedWriter.WriteString("data: " + payload + "\n\n"); err != nil {
			clientDisconnected = true
			return
		}
		if err := flushBuffered(); err != nil {
			clientDisconnected = true
			return
		}
		clientOutputStarted = true
		lastDownstreamWriteAt = time.Now()
	}

	needModelReplace := originalModel != mappedModel
	// resultWithUsage snapshots the usage and first-token timing collected so far.
	resultWithUsage := func() *openaiStreamingResult {
		return &openaiStreamingResult{usage: usage, firstTokenMs: firstTokenMs}
	}
	// finalizeStream is called when the upstream body ended without a scan
	// error. It decides between failover, an "incomplete" error, a "failed"
	// error, and a clean finish with a final flush.
	finalizeStream := func() (*openaiStreamingResult, error) {
		if !sawTerminalEvent {
			// Nothing reached the client yet, so the request can still fail over.
			if !openAIStreamClientOutputStarted(c, clientOutputStarted) {
				return resultWithUsage(), s.newOpenAIStreamFailoverError(
					c,
					account,
					false,
					upstreamRequestID,
					nil,
					"OpenAI stream ended before a terminal event",
				)
			}
			return resultWithUsage(), fmt.Errorf("stream usage incomplete: missing terminal event")
		}
		if sawFailedEvent {
			return resultWithUsage(), fmt.Errorf("upstream response failed: %s", failedMessage)
		}
		if !clientDisconnected {
			hadBufferedData := bufferedWriter.Buffered() > 0
			if err := flushBuffered(); err != nil {
				clientDisconnected = true
				logger.LegacyPrintf("service.openai_gateway", "Client disconnected during final flush, returning collected usage")
			} else if hadBufferedData {
				clientOutputStarted = true
				lastDownstreamWriteAt = time.Now()
			}
		}
		return resultWithUsage(), nil
	}
	// handleScanErr maps a scanner error to the function's return values. The
	// third result reports whether the caller should return immediately; it is
	// false only when scanErr is nil.
	handleScanErr := func(scanErr error) (*openaiStreamingResult, error, bool) {
		if scanErr == nil {
			return nil, nil, false
		}
		// A read error after a successful terminal event is treated as success.
		if sawTerminalEvent && !sawFailedEvent {
			logger.LegacyPrintf("service.openai_gateway", "Upstream scan ended after terminal event: %v", scanErr)
			return resultWithUsage(), nil, true
		}
		if sawFailedEvent {
			return resultWithUsage(), fmt.Errorf("upstream response failed: %s", failedMessage), true
		}
		// When the client disconnects or cancels the request, the upstream read
		// usually returns context canceled.
		// SSE events on /v1/responses must follow the OpenAI protocol, so no custom
		// error event is injected here, to avoid breaking downstream SDK parsing.
		if errors.Is(scanErr, context.Canceled) || errors.Is(scanErr, context.DeadlineExceeded) {
			return resultWithUsage(), fmt.Errorf("stream usage incomplete: %w", scanErr), true
		}
		if errors.Is(scanErr, bufio.ErrTooLong) {
			logger.LegacyPrintf("service.openai_gateway", "SSE line too long: account=%d max_size=%d error=%v", account.ID, maxLineSize, scanErr)
			sendErrorEvent("response_too_large")
			return resultWithUsage(), scanErr, true
		}
		// No client output yet: surface a failover error instead of an SSE error.
		if !openAIStreamClientOutputStarted(c, clientOutputStarted) {
			msg := "OpenAI stream disconnected before completion"
			if errText := strings.TrimSpace(scanErr.Error()); errText != "" {
				msg += ": " + errText
			}
			return resultWithUsage(), s.newOpenAIStreamFailoverError(c, account, false, upstreamRequestID, nil, msg), true
		}
		// With the client already gone, an upstream error only affects the user
		// experience, not billing; return the usage collected so far.
		if clientDisconnected {
			return resultWithUsage(), fmt.Errorf("stream usage incomplete after disconnect: %w", scanErr), true
		}
		sendErrorEvent("stream_read_error")
		return resultWithUsage(), fmt.Errorf("stream read error: %w", scanErr), true
	}
	// processSSELine handles one upstream line: data lines are inspected
	// (terminal/failed detection, model rewrite, tool-call correction, usage
	// parsing) and forwarded; other lines are forwarded unchanged. queueDrained
	// tells it no further lines are immediately pending, which gates flushing.
	processSSELine := func(line string, queueDrained bool) {
		if streamFailoverErr != nil {
			return
		}
		// Extract data from SSE line (supports both "data: " and "data:" formats)
		if data, ok := extractOpenAISSEDataLine(line); ok {

			// Replace model in response if needed.
			// Fast path: most events do not contain model field values.
			if needModelReplace && mappedModel != "" && strings.Contains(data, mappedModel) {
				line = s.replaceModelInSSELine(line, mappedModel, originalModel)
			}

			dataBytes := []byte(data)
			if openAIStreamEventIsTerminal(data) {
				sawTerminalEvent = true
			}
			eventType := strings.TrimSpace(gjson.GetBytes(dataBytes, "type").String())
			forceFlushFailedEvent := false
			if eventType == "response.failed" {
				failedMessage = extractOpenAISSEErrorMessage(dataBytes)
				// Before any client output, a qualifying failure is turned into a
				// failover error and the event is not forwarded.
				if !openAIStreamClientOutputStarted(c, clientOutputStarted) && openAIStreamFailedEventShouldFailover(dataBytes, failedMessage) {
					sawFailedEvent = true
					streamFailoverErr = s.newOpenAIStreamFailoverError(c, account, false, upstreamRequestID, dataBytes, failedMessage)
					return
				}
				forceFlushFailedEvent = true
				sawFailedEvent = true
			}

			// Correct Codex tool calls if needed (apply_patch -> edit, etc.)
			// NOTE(review): line is rebuilt from dataBytes, which was captured
			// before the model replacement above, so a corrected event appears to
			// carry the upstream model name again — confirm this is intended.
			if correctedData, corrected := s.toolCorrector.CorrectToolCallsInSSEBytes(dataBytes); corrected {
				dataBytes = correctedData
				data = string(correctedData)
				line = "data: " + data
				eventType = strings.TrimSpace(gjson.GetBytes(dataBytes, "type").String())
			}
			startsClientOutput := forceFlushFailedEvent || openAIStreamDataStartsClientOutput(data, eventType)

			// Write to the client (after a disconnect, keep draining upstream).
			if !clientDisconnected {
				shouldFlush := queueDrained && (clientOutputStarted || startsClientOutput)
				if firstTokenMs == nil && startsClientOutput {
					// Get the first token event out as early as possible so TTFT is
					// not affected.
					shouldFlush = true
				}
				if _, err := bufferedWriter.WriteString(line); err != nil {
					clientDisconnected = true
					logger.LegacyPrintf("service.openai_gateway", "Client disconnected during streaming, continuing to drain upstream for billing")
				} else if _, err := bufferedWriter.WriteString("\n"); err != nil {
					clientDisconnected = true
					logger.LegacyPrintf("service.openai_gateway", "Client disconnected during streaming, continuing to drain upstream for billing")
				} else if shouldFlush {
					if err := flushBuffered(); err != nil {
						clientDisconnected = true
						logger.LegacyPrintf("service.openai_gateway", "Client disconnected during streaming flush, continuing to drain upstream for billing")
					} else {
						clientOutputStarted = true
						lastDownstreamWriteAt = time.Now()
					}
				}
			}

			// Record first token time
			if firstTokenMs == nil && startsClientOutput {
				ms := int(time.Since(startTime).Milliseconds())
				firstTokenMs = &ms
			}
			s.parseSSEUsageBytes(dataBytes, usage)
			return
		}

		// Forward non-data lines as-is
		if !clientDisconnected {
			if _, err := bufferedWriter.WriteString(line); err != nil {
				clientDisconnected = true
				logger.LegacyPrintf("service.openai_gateway", "Client disconnected during streaming, continuing to drain upstream for billing")
			} else if _, err := bufferedWriter.WriteString("\n"); err != nil {
				clientDisconnected = true
				logger.LegacyPrintf("service.openai_gateway", "Client disconnected during streaming, continuing to drain upstream for billing")
			} else if queueDrained && clientOutputStarted {
				if err := flushBuffered(); err != nil {
					clientDisconnected = true
					logger.LegacyPrintf("service.openai_gateway", "Client disconnected during streaming flush, continuing to drain upstream for billing")
				} else {
					clientOutputStarted = true
					lastDownstreamWriteAt = time.Now()
				}
			}
		}
	}

	// The common path with no timeout and no keepalive scans synchronously to
	// avoid goroutine and channel overhead.
	if streamInterval <= 0 && keepaliveInterval <= 0 {
		defer putSSEScannerBuf64K(scanBuf)
		for scanner.Scan() {
			processSSELine(scanner.Text(), true)
			if streamFailoverErr != nil {
				return resultWithUsage(), streamFailoverErr
			}
		}
		if result, err, done := handleScanErr(scanner.Err()); done {
			return result, err
		}
		return finalizeStream()
	}

	type scanEvent struct {
		line string
		err  error
	}
	// A separate goroutine reads the upstream so a blocking read cannot stall
	// keepalive or timeout handling.
	events := make(chan scanEvent, 16)
	done := make(chan struct{})
	// sendEvent delivers ev unless this function has already returned (done is
	// closed), in which case it reports false so the reader goroutine can exit.
	sendEvent := func(ev scanEvent) bool {
		select {
		case events <- ev:
			return true
		case <-done:
			return false
		}
	}
	// lastReadAt is written by the reader goroutine and read by the interval
	// case below, hence the atomic access.
	var lastReadAt int64
	atomic.StoreInt64(&lastReadAt, time.Now().UnixNano())
	go func(scanBuf *sseScannerBuf64K) {
		defer putSSEScannerBuf64K(scanBuf)
		defer close(events)
		for scanner.Scan() {
			atomic.StoreInt64(&lastReadAt, time.Now().UnixNano())
			if !sendEvent(scanEvent{line: scanner.Text()}) {
				return
			}
		}
		if err := scanner.Err(); err != nil {
			_ = sendEvent(scanEvent{err: err})
		}
	}(scanBuf)
	defer close(done)

	for {
		select {
		case ev, ok := <-events:
			if !ok {
				// The reader closed the channel: upstream ended without a scan error.
				return finalizeStream()
			}
			if result, err, done := handleScanErr(ev.err); done {
				return result, err
			}
			processSSELine(ev.line, len(events) == 0)
			if streamFailoverErr != nil {
				return resultWithUsage(), streamFailoverErr
			}

		case <-intervalCh:
			// Ticks are only a trigger; the real check is the time since the last
			// upstream read.
			lastRead := time.Unix(0, atomic.LoadInt64(&lastReadAt))
			if time.Since(lastRead) < streamInterval {
				continue
			}
			if clientDisconnected {
				return resultWithUsage(), fmt.Errorf("stream usage incomplete after timeout")
			}
			logger.LegacyPrintf("service.openai_gateway", "Stream data interval timeout: account=%d model=%s interval=%s", account.ID, originalModel, streamInterval)
			// Handle the stream timeout; this may mark the account as temporarily
			// unschedulable or in an error state.
			if s.rateLimitService != nil {
				s.rateLimitService.HandleStreamTimeout(ctx, account, originalModel)
			}
			sendErrorEvent("stream_timeout")
			return resultWithUsage(), fmt.Errorf("stream data interval timeout")

		case <-keepaliveCh:
			if clientDisconnected {
				continue
			}
			if time.Since(lastDownstreamWriteAt) < keepaliveInterval {
				continue
			}
			// An SSE comment line serves as the keepalive.
			if _, err := bufferedWriter.WriteString(":\n\n"); err != nil {
				clientDisconnected = true
				logger.LegacyPrintf("service.openai_gateway", "Client disconnected during streaming, continuing to drain upstream for billing")
				continue
			}
			if err := flushBuffered(); err != nil {
				clientDisconnected = true
				logger.LegacyPrintf("service.openai_gateway", "Client disconnected during keepalive flush, continuing to drain upstream for billing")
			} else {
				lastDownstreamWriteAt = time.Now()
			}
		}
	}

}

// extractOpenAISSEDataLine returns the payload of an SSE `data:` line with any
// leading spaces and tabs after the colon removed, so both `data: xxx` and
// `data:xxx` are accepted. The boolean is false when line does not start with
// `data:`; trailing whitespace in the payload is left untouched.
func extractOpenAISSEDataLine(line string) (string, bool) {
	const prefix = "data:"
	if !strings.HasPrefix(line, prefix) {
		return "", false
	}
	return strings.TrimLeft(line[len(prefix):], " \t"), true
}

// replaceModelInSSELine rewrites the model name in a single SSE data line.
//
// The top-level `model` field is checked first, then `response.model`; the
// first one whose string value equals fromModel is set to toModel and the line
// is returned re-serialized as "data: <json>". Lines that are not data lines,
// are empty, are the "[DONE]" sentinel, do not match, or fail to update are
// returned unchanged.
func (s *OpenAIGatewayService) replaceModelInSSELine(line, fromModel, toModel string) string {
	payload, isData := extractOpenAISSEDataLine(line)
	if !isData || payload == "" || payload == "[DONE]" {
		return line
	}

	// gjson looks at just the candidate field, avoiding a full JSON decode.
	for _, path := range [...]string{"model", "response.model"} {
		field := gjson.Get(payload, path)
		if !field.Exists() || field.Str != fromModel {
			continue
		}
		rewritten, err := sjson.Set(payload, path, toModel)
		if err != nil {
			return line
		}
		return "data: " + rewritten
	}
	return line
}

// correctToolCallsInResponseBody runs the tool-call corrector over a response
// body. It returns the corrected bytes when the corrector reports a change and
// the original body otherwise (including when body is empty).
func (s *OpenAIGatewayService) correctToolCallsInResponseBody(body []byte) []byte {
	if len(body) > 0 {
		if fixed, modified := s.toolCorrector.CorrectToolCallsInSSEBytes(body); modified {
			return fixed
		}
	}
	return body
}

// parseSSEUsage is the string-input variant of parseSSEUsageBytes: it converts
// data to bytes and delegates, updating usage in place.
func (s *OpenAIGatewayService) parseSSEUsage(data string, usage *OpenAIUsage) {
	s.parseSSEUsageBytes([]byte(data), usage)
}

// parseSSEUsageBytes copies token usage from one SSE data payload into usage.
//
// Nothing happens when usage is nil, when data is empty or the "[DONE]"
// sentinel, when data is shorter than 72 bytes, or when the event type is not
// one of response.completed, response.done, response.incomplete,
// response.cancelled or response.canceled. For a matching event all four
// counters are overwritten from `response.usage`; fields absent from the
// payload become zero.
func (s *OpenAIGatewayService) parseSSEUsageBytes(data []byte, usage *OpenAIUsage) {
	switch {
	case usage == nil, len(data) == 0, bytes.Equal(data, []byte("[DONE]")):
		return
	case len(data) < 72:
		// Cheap pre-filter applied before any JSON lookup.
		// NOTE(review): presumably 72 is below the size of any terminal event
		// that carries usage — confirm the threshold.
		return
	}

	switch gjson.GetBytes(data, "type").String() {
	case "response.completed", "response.done", "response.incomplete", "response.cancelled", "response.canceled":
		// Terminal event: fall through to the field extraction below.
	default:
		return
	}

	intAt := func(path string) int {
		return int(gjson.GetBytes(data, path).Int())
	}
	usage.InputTokens = intAt("response.usage.input_tokens")
	usage.OutputTokens = intAt("response.usage.output_tokens")
	usage.CacheReadInputTokens = intAt("response.usage.input_tokens_details.cached_tokens")
	usage.ImageOutputTokens = intAt("response.usage.output_tokens_details.image_tokens")
}

// extractOpenAIUsageFromJSONBytes reads token usage from the top-level `usage`
// object of a JSON document. The boolean is false only when body is empty or
// not valid JSON; for valid JSON, missing usage fields are reported as zero.
func extractOpenAIUsageFromJSONBytes(body []byte) (OpenAIUsage, bool) {
	if len(body) == 0 || !gjson.ValidBytes(body) {
		return OpenAIUsage{}, false
	}

	intAt := func(path string) int {
		return int(gjson.GetBytes(body, path).Int())
	}
	var parsed OpenAIUsage
	parsed.InputTokens = intAt("usage.input_tokens")
	parsed.OutputTokens = intAt("usage.output_tokens")
	parsed.CacheReadInputTokens = intAt("usage.input_tokens_details.cached_tokens")
	parsed.ImageOutputTokens = intAt("usage.output_tokens_details.image_tokens")
	return parsed, true
}

// handleNonStreamingResponse forwards a buffered upstream response to the
// client and returns the usage parsed from it.
//
// If the upstream actually answered with SSE, the body is handed to
// handleSSEToJSON. SSE is detected through the Content-Type header for every
// account type, and additionally, for OAuth accounts only, through a "data:" /
// "event:" substring check on the body. Otherwise the body must be valid JSON;
// the model name is mapped back when it differs, filtered headers are written,
// and the body is sent with the upstream status code.
func (s *OpenAIGatewayService) handleNonStreamingResponse(ctx context.Context, resp *http.Response, c *gin.Context, account *Account, originalModel, mappedModel string) (*OpenAIUsage, error) {
	body, err := ReadUpstreamResponseBody(resp.Body, s.cfg, c, openAITooLargeError)
	if err != nil {
		return nil, err
	}

	// Some OpenAI-compatible upstreams (including other sub2api instances) may
	// return SSE even when stream=false was requested.
	treatAsSSE := isEventStreamResponse(resp.Header)
	if !treatAsSSE && account.Type == AccountTypeOAuth {
		// OAuth upstreams may omit the Content-Type header while still sending
		// SSE. The body heuristic is deliberately not applied to API-key
		// accounts, whose JSON text can coincidentally contain these markers.
		treatAsSSE = bytes.Contains(body, []byte("data:")) || bytes.Contains(body, []byte("event:"))
	}
	if treatAsSSE {
		return s.handleSSEToJSON(resp, c, body, originalModel, mappedModel)
	}

	parsedUsage, valid := extractOpenAIUsageFromJSONBytes(body)
	if !valid {
		return nil, fmt.Errorf("parse response: invalid json response")
	}

	// Map the upstream model name back to the one the client asked for.
	if originalModel != mappedModel {
		body = s.replaceModelInResponseBody(body, mappedModel, originalModel)
	}

	responseheaders.WriteFilteredHeaders(c.Writer.Header(), resp.Header, s.responseHeaderFilter)

	// The upstream Content-Type is only echoed when response-header security
	// is configured and disabled; otherwise plain JSON is announced.
	contentType := "application/json"
	if s.cfg != nil && !s.cfg.Security.ResponseHeaders.Enabled {
		if fromUpstream := resp.Header.Get("Content-Type"); fromUpstream != "" {
			contentType = fromUpstream
		}
	}

	c.Data(resp.StatusCode, contentType, body)
	return &parsedUsage, nil
}

// isEventStreamResponse reports whether the Content-Type header names
// text/event-stream. The match is case-insensitive and substring-based, so
// parameters such as "; charset=utf-8" do not matter.
func isEventStreamResponse(header http.Header) bool {
	return strings.Contains(strings.ToLower(header.Get("Content-Type")), "text/event-stream")
}

// handleSSEToJSON answers a non-streaming request whose upstream body is SSE.
//
// When the SSE text contains a final response object (see
// extractCodexFinalResponse), that object is sent as JSON: usage is read from
// it, an empty `output` is rebuilt from the delta events where possible, the
// model name is mapped back, and tool calls are corrected.
//
// Otherwise a terminal `response.failed` event produces a protocol error
// response. In any other case the SSE text is forwarded as-is (with the model
// name mapped back) under the upstream Content-Type, defaulting to
// text/event-stream, with usage gathered from the events.
func (s *OpenAIGatewayService) handleSSEToJSON(resp *http.Response, c *gin.Context, body []byte, originalModel, mappedModel string) (*OpenAIUsage, error) {
	sseText := string(body)
	renameModel := originalModel != mappedModel
	usage := &OpenAIUsage{}

	finalResponse, ok := extractCodexFinalResponse(sseText)
	if !ok {
		terminalType, terminalPayload, hasTerminal := extractOpenAISSETerminalEvent(sseText)
		if hasTerminal && terminalType == "response.failed" {
			failure := extractOpenAISSEErrorMessage(terminalPayload)
			if failure == "" {
				failure = "Upstream compact response failed"
			}
			return nil, s.writeOpenAINonStreamingProtocolError(resp, c, failure)
		}
		usage = s.parseSSEUsageFromBody(sseText)
		if renameModel {
			sseText = s.replaceModelInSSEBody(sseText, mappedModel, originalModel)
		}
		body = []byte(sseText)
	} else {
		if parsedUsage, valid := extractOpenAIUsageFromJSONBytes(finalResponse); valid {
			*usage = parsedUsage
		}
		// The terminal event may carry an empty output array; in that case the
		// output is rebuilt from the accumulated delta events so the client
		// still receives the full content. gjson's Array() yields an empty
		// slice for null, missing, or empty arrays alike.
		if len(gjson.GetBytes(finalResponse, "output").Array()) == 0 {
			if rebuilt, found := reconstructResponseOutputFromSSE(sseText); found {
				if patched, err := sjson.SetRawBytes(finalResponse, "output", rebuilt); err == nil {
					finalResponse = patched
				}
			}
		}
		body = finalResponse
		if renameModel {
			body = s.replaceModelInResponseBody(body, mappedModel, originalModel)
		}
		// Correct tool calls in the final response.
		body = s.correctToolCallsInResponseBody(body)
	}

	responseheaders.WriteFilteredHeaders(c.Writer.Header(), resp.Header, s.responseHeaderFilter)

	var contentType string
	switch {
	case ok:
		contentType = "application/json; charset=utf-8"
	default:
		contentType = resp.Header.Get("Content-Type")
		if contentType == "" {
			contentType = "text/event-stream"
		}
	}
	c.Data(resp.StatusCode, contentType, body)

	return usage, nil
}

// extractOpenAISSETerminalEvent scans SSE text line by line and returns the
// type and raw payload of the first data event whose `type` (whitespace
// trimmed) is one of the terminal types: response.completed, response.done,
// response.failed, response.incomplete, response.cancelled or
// response.canceled. The boolean is false when no such event exists.
func extractOpenAISSETerminalEvent(body string) (string, []byte, bool) {
	for rest, more := body, true; more; {
		var line string
		line, rest, more = strings.Cut(rest, "\n")

		payload, isData := extractOpenAISSEDataLine(line)
		if !isData || payload == "" || payload == "[DONE]" {
			continue
		}
		kind := strings.TrimSpace(gjson.Get(payload, "type").String())
		switch kind {
		case "response.completed", "response.done", "response.failed", "response.incomplete", "response.cancelled", "response.canceled":
			return kind, []byte(payload), true
		}
	}
	return "", nil, false
}

// extractOpenAISSEErrorMessage returns a sanitized error message for an SSE
// event payload. It tries `response.error.message`, `error.message` and
// `message` in that order and uses the first non-blank value; when none is
// set it falls back to extractUpstreamErrorMessage. An empty payload yields "".
func extractOpenAISSEErrorMessage(payload []byte) string {
	if len(payload) == 0 {
		return ""
	}

	candidates := [...]string{"response.error.message", "error.message", "message"}
	for i := range candidates {
		text := strings.TrimSpace(gjson.GetBytes(payload, candidates[i]).String())
		if text == "" {
			continue
		}
		return sanitizeUpstreamErrorMessage(text)
	}

	fallback := strings.TrimSpace(extractUpstreamErrorMessage(payload))
	return sanitizeUpstreamErrorMessage(fallback)
}

// writeOpenAINonStreamingProtocolError responds with 502 Bad Gateway and an
// `upstream_error` JSON body, records the failure via setOpsUpstreamError, and
// returns an error describing it. The message is trimmed and sanitized first;
// a blank result is replaced with a generic description.
func (s *OpenAIGatewayService) writeOpenAINonStreamingProtocolError(resp *http.Response, c *gin.Context, message string) error {
	if message = sanitizeUpstreamErrorMessage(strings.TrimSpace(message)); message == "" {
		message = "Upstream returned an invalid non-streaming response"
	}

	setOpsUpstreamError(c, http.StatusBadGateway, message, "")

	// Filtered upstream headers go first so the JSON Content-Type set afterwards wins.
	respHeader := c.Writer.Header()
	responseheaders.WriteFilteredHeaders(respHeader, resp.Header, s.responseHeaderFilter)
	respHeader.Set("Content-Type", "application/json; charset=utf-8")

	errorBody := gin.H{
		"error": gin.H{
			"type":    "upstream_error",
			"message": message,
		},
	}
	c.JSON(http.StatusBadGateway, errorBody)

	return fmt.Errorf("non-streaming openai protocol error: %s", message)
}

// extractCodexFinalResponse scans SSE text for the first `response.done` or
// `response.completed` data event whose `response` field is a JSON object or
// array, and returns that field's raw JSON. The boolean is false when no such
// event is found.
func extractCodexFinalResponse(body string) ([]byte, bool) {
	for _, line := range strings.Split(body, "\n") {
		payload, isData := extractOpenAISSEDataLine(line)
		if !isData || payload == "" || payload == "[DONE]" {
			continue
		}

		switch gjson.Get(payload, "type").String() {
		case "response.done", "response.completed":
		default:
			continue
		}

		response := gjson.Get(payload, "response")
		if !response.Exists() || response.Type != gjson.JSON || response.Raw == "" {
			continue
		}
		return []byte(response.Raw), true
	}
	return nil, false
}

// reconstructResponseOutputFromSSE rebuilds a response `output` array from raw
// SSE text. Every data event is fed to a buffered response accumulator, and
// image-generation items found in the events are collected separately (each
// one once). The result is the JSON encoding of the accumulator's output
// followed by the image items.
//
// It returns (nil, false) when neither source produced anything or when the
// final encoding fails.
func reconstructResponseOutputFromSSE(bodyText string) ([]byte, bool) {
	accumulator := apicompat.NewBufferedResponseAccumulator()
	images := make([]json.RawMessage, 0, 1)
	seenImages := make(map[string]struct{})

	for _, line := range strings.Split(bodyText, "\n") {
		payload, isData := extractOpenAISSEDataLine(line)
		if !isData || payload == "" || payload == "[DONE]" {
			continue
		}
		raw := []byte(payload)
		if image, found := extractImageGenerationOutputFromSSEData(raw, seenImages); found {
			images = append(images, image)
		}
		// Events that do not decode are skipped rather than aborting the scan.
		var event apicompat.ResponsesStreamEvent
		if json.Unmarshal(raw, &event) == nil {
			accumulator.ProcessEvent(&event)
		}
	}

	hasAccumulated := accumulator.HasContent()
	if !hasAccumulated && len(images) == 0 {
		return nil, false
	}

	var items []json.RawMessage
	if hasAccumulated {
		// Round-trip through JSON to turn the built output into raw items; a
		// failure here simply leaves the accumulated part out.
		if encoded, err := json.Marshal(accumulator.BuildOutput()); err == nil {
			_ = json.Unmarshal(encoded, &items)
		}
	}
	items = append(items, images...)
	if len(items) == 0 {
		return nil, false
	}

	encoded, err := json.Marshal(items)
	if err != nil {
		return nil, false
	}
	return encoded, true
}

// extractImageGenerationOutputFromSSEData returns the raw `item` JSON of a
// `response.output_item.done` event when that item is an
// `image_generation_call` with a non-blank `result`.
//
// Items are de-duplicated through seen (when non-nil): the key is the item's
// trimmed `id`, or "<output_format>|<result>" when the id is blank. An item
// whose key is already present is rejected; otherwise the key is recorded.
func extractImageGenerationOutputFromSSEData(data []byte, seen map[string]struct{}) (json.RawMessage, bool) {
	if len(data) == 0 || !gjson.ValidBytes(data) {
		return nil, false
	}
	if gjson.GetBytes(data, "type").String() != "response.output_item.done" {
		return nil, false
	}

	item := gjson.GetBytes(data, "item")
	isImageCall := item.Exists() && item.IsObject() && item.Get("type").String() == "image_generation_call"
	if !isImageCall {
		return nil, false
	}
	result := strings.TrimSpace(item.Get("result").String())
	if result == "" {
		return nil, false
	}

	dedupKey := strings.TrimSpace(item.Get("id").String())
	if dedupKey == "" {
		dedupKey = strings.TrimSpace(item.Get("output_format").String()) + "|" + result
	}
	if dedupKey != "" && seen != nil {
		if _, duplicate := seen[dedupKey]; duplicate {
			return nil, false
		}
		seen[dedupKey] = struct{}{}
	}
	return json.RawMessage(item.Raw), true
}

// parseSSEUsageFromBody walks every data line of an SSE body and feeds it to
// parseSSEUsageBytes, returning the resulting usage. The returned pointer is
// never nil; it stays zero-valued when no event carried usage.
func (s *OpenAIGatewayService) parseSSEUsageFromBody(body string) *OpenAIUsage {
	collected := &OpenAIUsage{}
	for _, line := range strings.Split(body, "\n") {
		payload, isData := extractOpenAISSEDataLine(line)
		if isData && payload != "" && payload != "[DONE]" {
			s.parseSSEUsageBytes([]byte(payload), collected)
		}
	}
	return collected
}

// replaceModelInSSEBody applies replaceModelInSSELine to every data line of an
// SSE body and returns the re-joined text. Non-data lines and the line
// structure (split on "\n") are preserved.
func (s *OpenAIGatewayService) replaceModelInSSEBody(body, fromModel, toModel string) string {
	segments := strings.Split(body, "\n")
	for idx := range segments {
		if _, isData := extractOpenAISSEDataLine(segments[idx]); isData {
			segments[idx] = s.replaceModelInSSELine(segments[idx], fromModel, toModel)
		}
	}
	return strings.Join(segments, "\n")
}

// validateUpstreamBaseURL validates an account's upstream base URL and returns
// its normalized form.
//
// When the URL allowlist is disabled in the configuration, only the URL format
// is checked (optionally permitting plain HTTP). Otherwise the URL must pass
// the HTTPS + allowlist validation using the configured hosts and private-host
// setting.
//
// When no configuration is attached to the service, the strict path is used
// with an empty allowlist instead of dereferencing the nil config, so the call
// reports a validation result rather than panicking.
//
// Any validation failure is returned wrapped as "invalid base_url: ...".
func (s *OpenAIGatewayService) validateUpstreamBaseURL(raw string) (string, error) {
	if s.cfg != nil && !s.cfg.Security.URLAllowlist.Enabled {
		normalized, err := urlvalidator.ValidateURLFormat(raw, s.cfg.Security.URLAllowlist.AllowInsecureHTTP)
		if err != nil {
			return "", fmt.Errorf("invalid base_url: %w", err)
		}
		return normalized, nil
	}

	// Start from the most restrictive options; the configured allowlist is only
	// applied when a configuration exists.
	opts := urlvalidator.ValidationOptions{RequireAllowlist: true}
	if s.cfg != nil {
		opts.AllowedHosts = s.cfg.Security.URLAllowlist.UpstreamHosts
		opts.AllowPrivate = s.cfg.Security.URLAllowlist.AllowPrivateHosts
	}
	normalized, err := urlvalidator.ValidateHTTPSURL(raw, opts)
	if err != nil {
		return "", fmt.Errorf("invalid base_url: %w", err)
	}
	return normalized, nil
}

// buildOpenAIResponsesURL builds the OpenAI Responses endpoint from a base URL.
// Surrounding whitespace and trailing slashes are removed first, then:
//   - a base already ending in /responses is returned as is;
//   - a base ending in /v1 gets /responses appended;
//   - anything else gets /v1/responses appended.
func buildOpenAIResponsesURL(base string) string {
	trimmed := strings.TrimRight(strings.TrimSpace(base), "/")
	switch {
	case strings.HasSuffix(trimmed, "/responses"):
		return trimmed
	case strings.HasSuffix(trimmed, "/v1"):
		return trimmed + "/responses"
	default:
		return trimmed + "/v1/responses"
	}
}

// trimOpenAIEncryptedReasoningItems strips `encrypted_content` from reasoning
// items found in reqBody["input"] and reports whether reqBody was modified.
//
// The input may be a []any, a []map[string]any, or a single map[string]any;
// any other type is left alone. Each item goes through
// sanitizeEncryptedReasoningInputItem. Items that should not be kept are
// dropped, and when nothing remains the "input" key is deleted. Slices are
// filtered in place, reusing the original backing array.
func trimOpenAIEncryptedReasoningItems(reqBody map[string]any) bool {
	if len(reqBody) == 0 {
		return false
	}
	rawInput, present := reqBody["input"]
	if !present {
		return false
	}

	switch input := rawInput.(type) {
	case []any:
		kept := input[:0]
		modified := false
		for _, item := range input {
			next, touched, retain := sanitizeEncryptedReasoningInputItem(item)
			modified = modified || touched
			if retain {
				kept = append(kept, next)
			}
		}
		switch {
		case !modified:
			return false
		case len(kept) == 0:
			delete(reqBody, "input")
		default:
			reqBody["input"] = kept
		}
		return true

	case []map[string]any:
		kept := input[:0]
		modified := false
		for _, item := range input {
			next, touched, retain := sanitizeEncryptedReasoningInputItem(item)
			modified = modified || touched
			if !retain {
				continue
			}
			// Keep the original entry if the sanitized value is not a map.
			if asMap, isMap := next.(map[string]any); isMap {
				kept = append(kept, asMap)
			} else {
				kept = append(kept, item)
			}
		}
		switch {
		case !modified:
			return false
		case len(kept) == 0:
			delete(reqBody, "input")
		default:
			reqBody["input"] = kept
		}
		return true

	case map[string]any:
		next, touched, retain := sanitizeEncryptedReasoningInputItem(input)
		if !touched {
			return false
		}
		if !retain {
			delete(reqBody, "input")
			return true
		}
		asMap, isMap := next.(map[string]any)
		if !isMap {
			return false
		}
		reqBody["input"] = asMap
		return true
	}
	return false
}

// sanitizeEncryptedReasoningInputItem removes the encrypted_content field from
// a single reasoning input item.
//
// Returns:
//   - next: the item to keep (the same map, mutated in place), or nil when the
//     item should be dropped;
//   - changed: true when encrypted_content was removed;
//   - keep: false when, after removal, only one field is left on the item.
//
// Values that are not map[string]any, items whose trimmed "type" is not
// "reasoning", and reasoning items without encrypted_content are returned
// untouched with changed=false, keep=true.
func sanitizeEncryptedReasoningInputItem(item any) (next any, changed bool, keep bool) {
	fields, isObject := item.(map[string]any)
	if !isObject {
		return item, false, true
	}

	if kind, _ := fields["type"].(string); strings.TrimSpace(kind) != "reasoning" {
		return item, false, true
	}

	if _, encrypted := fields["encrypted_content"]; !encrypted {
		return item, false, true
	}

	delete(fields, "encrypted_content")
	if len(fields) != 1 {
		return fields, true, true
	}
	// A single remaining field means the item carries no payload any more.
	return nil, true, false
}

// IsOpenAIResponsesCompactPathForTest is an exported wrapper that returns the
// result of isOpenAIResponsesCompactPath for c. Judging by its name it is
// meant to be called from tests only.
func IsOpenAIResponsesCompactPathForTest(c *gin.Context) bool {
	return isOpenAIResponsesCompactPath(c)
}

// OpenAICompactSessionSeedKeyForTest returns the unexported
// openAICompactSessionSeedKey constant. Judging by its name it is meant to be
// called from tests only.
func OpenAICompactSessionSeedKeyForTest() string {
	return openAICompactSessionSeedKey
}

// NormalizeOpenAICompactRequestBodyForTest is an exported wrapper that forwards
// body to normalizeOpenAICompactRequestBody and returns its three results
// unchanged. Judging by its name it is meant to be called from tests only.
func NormalizeOpenAICompactRequestBodyForTest(body []byte) ([]byte, bool, error) {
	return normalizeOpenAICompactRequestBody(body)
}

// isOpenAIResponsesCompactPath reports whether the part of the request path
// that follows "/responses" is exactly "/compact" or starts with "/compact/".
func isOpenAIResponsesCompactPath(c *gin.Context) bool {
	switch tail := strings.TrimSpace(openAIResponsesRequestPathSuffix(c)); {
	case tail == "/compact":
		return true
	default:
		return strings.HasPrefix(tail, "/compact/")
	}
}

// normalizeOpenAICompactRequestBody rebuilds a compact request body so that it
// only contains the model, input, instructions and previous_response_id
// fields (each copied as raw JSON, in that order, when present).
//
// It returns the resulting body, whether it differs from the input (compared
// after trimming surrounding whitespace), and any error raised while writing a
// field. An empty body, an unchanged body, and the error path all return the
// original slice with changed=false.
func normalizeOpenAICompactRequestBody(body []byte) ([]byte, bool, error) {
	if len(body) == 0 {
		return body, false, nil
	}

	allowed := [...]string{"model", "input", "instructions", "previous_response_id"}
	compacted := []byte(`{}`)
	for _, key := range allowed {
		field := gjson.GetBytes(body, key)
		if field.Exists() {
			var err error
			compacted, err = sjson.SetRawBytes(compacted, key, []byte(field.Raw))
			if err != nil {
				return body, false, fmt.Errorf("normalize compact body %s: %w", key, err)
			}
		}
	}

	identical := bytes.Equal(bytes.TrimSpace(body), bytes.TrimSpace(compacted))
	if identical {
		return body, false, nil
	}
	return compacted, true, nil
}

// resolveOpenAICompactSessionID picks a session identifier for a compact
// request. Candidates are tried in order and the first non-blank (trimmed)
// value wins:
//  1. the session_id request header;
//  2. the conversation_id request header;
//  3. a string stored on the gin context under openAICompactSessionSeedKey.
//
// When c is nil or no candidate is usable, a fresh UUID string is returned.
func resolveOpenAICompactSessionID(c *gin.Context) string {
	if c == nil {
		return uuid.NewString()
	}

	for _, header := range []string{"session_id", "conversation_id"} {
		if value := strings.TrimSpace(c.GetHeader(header)); value != "" {
			return value
		}
	}

	if raw, found := c.Get(openAICompactSessionSeedKey); found {
		if seed, isString := raw.(string); isString {
			if trimmed := strings.TrimSpace(seed); trimmed != "" {
				return trimmed
			}
		}
	}

	return uuid.NewString()
}

// openAIResponsesRequestPathSuffix returns whatever follows the last
// "/responses" in the request URL path (after trimming whitespace and trailing
// slashes), e.g. "/compact". It returns "" when the context, request or URL is
// nil, when the path has no "/responses" segment, or when the remainder is
// empty or does not start with "/".
func openAIResponsesRequestPathSuffix(c *gin.Context) string {
	const marker = "/responses"

	if c == nil || c.Request == nil || c.Request.URL == nil {
		return ""
	}

	path := strings.TrimRight(strings.TrimSpace(c.Request.URL.Path), "/")
	// An empty path has no marker either, so it is covered by this lookup.
	at := strings.LastIndex(path, marker)
	if at < 0 {
		return ""
	}

	rest := path[at+len(marker):]
	if rest == "/" || !strings.HasPrefix(rest, "/") {
		return ""
	}
	return rest
}

// appendOpenAIResponsesRequestPathSuffix joins a request-path suffix onto a
// base URL. The base is trimmed of whitespace and trailing slashes and the
// suffix of whitespace; if either ends up empty the trimmed base is returned
// on its own.
func appendOpenAIResponsesRequestPathSuffix(baseURL, suffix string) string {
	base := strings.TrimRight(strings.TrimSpace(baseURL), "/")
	if base == "" {
		return base
	}

	tail := strings.TrimSpace(suffix)
	if tail == "" {
		return base
	}
	return base + tail
}

// replaceModelInResponseBody rewrites the top-level "model" field of a JSON
// response body from fromModel to toModel. It edits the field directly with
// gjson/sjson instead of unmarshalling the whole document. The body is
// returned unchanged when the field is missing, holds a different value, or
// the rewrite fails.
func (s *OpenAIGatewayService) replaceModelInResponseBody(body []byte, fromModel, toModel string) []byte {
	current := gjson.GetBytes(body, "model")
	if !current.Exists() || current.Str != fromModel {
		return body
	}

	rewritten, err := sjson.SetBytes(body, "model", toModel)
	if err != nil {
		return body
	}
	return rewritten
}

// OpenAIRecordUsageInput is the input passed to RecordUsage. It carries the
// forward result together with the API key, user, account and optional
// subscription the usage is attributed to, plus request metadata that is
// copied onto the usage log.
type OpenAIRecordUsageInput struct {
	Result             *OpenAIForwardResult
	APIKey             *APIKey
	User               *User
	Account            *Account
	Subscription       *UserSubscription
	InboundEndpoint    string
	UpstreamEndpoint   string
	UserAgent          string // User-Agent of the request
	IPAddress          string // client IP address of the request
	RequestPayloadHash string
	APIKeyService      APIKeyQuotaUpdater
	ChannelUsageFields
}

// RecordUsage records usage for a finished request and deducts balance.
//
// Flow:
//  1. reset the OpenAI 403 counter for the account (when a rate-limit service
//     is configured and the account is an OpenAI account);
//  2. return early when the upstream reported no tokens and no images;
//  3. resolve the rate multiplier and billing model, then compute the cost;
//  4. build the usage log;
//  5. in simple run mode, write the log without billing; otherwise apply
//     billing first and write the log only when billing succeeded.
//
// It returns an error when input or input.Result is nil, or when billing
// fails. A cost-calculation failure is logged and billed as zero cost.
// input.APIKey, input.User and input.Account are dereferenced without checks
// and are expected to be non-nil.
func (s *OpenAIGatewayService) RecordUsage(ctx context.Context, input *OpenAIRecordUsageInput) error {
	// Guard first: everything below dereferences input and input.Result.
	if input == nil {
		return errors.New("record usage: input is nil")
	}
	if s.rateLimitService != nil && input.Account != nil && input.Account.Platform == PlatformOpenAI {
		s.rateLimitService.ResetOpenAI403Counter(ctx, input.Account.ID)
	}
	result := input.Result
	if result == nil {
		return errors.New("record usage: result is nil")
	}

	// Skip records where every counter is zero: when the upstream returned no
	// usage there is nothing worth writing to the database.
	if result.Usage.InputTokens == 0 && result.Usage.OutputTokens == 0 &&
		result.Usage.CacheCreationInputTokens == 0 && result.Usage.CacheReadInputTokens == 0 &&
		result.Usage.ImageOutputTokens == 0 && result.ImageCount == 0 {
		return nil
	}

	apiKey := input.APIKey
	user := input.User
	account := input.Account
	subscription := input.Subscription

	// input_tokens includes cache_read_tokens, and cache reads must not be
	// charged at the input price, so bill only the non-cached part.
	actualInputTokens := result.Usage.InputTokens - result.Usage.CacheReadInputTokens
	if actualInputTokens < 0 {
		actualInputTokens = 0
	}

	// Token counts used for cost calculation.
	tokens := UsageTokens{
		InputTokens:         actualInputTokens,
		OutputTokens:        result.Usage.OutputTokens,
		CacheCreationTokens: result.Usage.CacheCreationInputTokens,
		CacheReadTokens:     result.Usage.CacheReadInputTokens,
		ImageOutputTokens:   result.Usage.ImageOutputTokens,
	}

	// Rate multiplier: config default, overridden per user/group when the API
	// key belongs to a group.
	multiplier := 1.0
	if s.cfg != nil {
		multiplier = s.cfg.Default.RateMultiplier
	}
	if apiKey.GroupID != nil && apiKey.Group != nil {
		resolver := s.userGroupRateResolver
		if resolver == nil {
			resolver = newUserGroupRateResolver(nil, nil, resolveUserGroupRateCacheTTL(s.cfg), nil, "service.openai_gateway")
		}
		multiplier = resolver.Resolve(ctx, user.ID, *apiKey.GroupID, apiKey.Group.RateMultiplier)
	}

	// Billing model precedence (later assignments win): forward-result
	// default, explicit result.BillingModel, channel-mapped model, requested
	// model.
	billingModel := forwardResultBillingModel(result.Model, result.UpstreamModel)
	if result.BillingModel != "" {
		billingModel = strings.TrimSpace(result.BillingModel)
	}
	if input.BillingModelSource == BillingModelSourceChannelMapped && input.ChannelMappedModel != "" && input.ChannelMappedModel != input.OriginalModel {
		billingModel = input.ChannelMappedModel
	}
	if input.BillingModelSource == BillingModelSourceRequested && input.OriginalModel != "" {
		billingModel = input.OriginalModel
	}
	serviceTier := ""
	if result.ServiceTier != nil {
		serviceTier = strings.TrimSpace(*result.ServiceTier)
	}
	cost, err := s.calculateOpenAIRecordUsageCost(ctx, result, apiKey, billingModel, multiplier, tokens, serviceTier)
	if err != nil {
		// Best effort: keep recording usage, but make the failure visible
		// instead of silently falling back to a zero cost.
		logger.LegacyPrintf("service.openai_gateway", "Calculate usage cost failed, recording zero cost: model=%s err=%v", billingModel, err)
		cost = &CostBreakdown{ActualCost: 0}
	}

	// Determine billing type.
	isSubscriptionBilling := subscription != nil && apiKey.Group != nil && apiKey.Group.IsSubscriptionType()
	billingType := BillingTypeBalance
	if isSubscriptionBilling {
		billingType = BillingTypeSubscription
	}

	// Create usage log.
	durationMs := int(result.Duration.Milliseconds())
	accountRateMultiplier := account.BillingRateMultiplier()
	requestID := resolveUsageBillingRequestID(ctx, result.RequestID)

	// RequestedModel is the original model before any channel mapping.
	requestedModel := result.Model
	if input.OriginalModel != "" {
		requestedModel = input.OriginalModel
	}

	usageLog := &UsageLog{
		UserID:              user.ID,
		APIKeyID:            apiKey.ID,
		AccountID:           account.ID,
		RequestID:           requestID,
		Model:               result.Model,
		RequestedModel:      requestedModel,
		UpstreamModel:       optionalNonEqualStringPtr(result.UpstreamModel, result.Model),
		ServiceTier:         result.ServiceTier,
		ReasoningEffort:     result.ReasoningEffort,
		InboundEndpoint:     optionalTrimmedStringPtr(input.InboundEndpoint),
		UpstreamEndpoint:    optionalTrimmedStringPtr(input.UpstreamEndpoint),
		InputTokens:         actualInputTokens,
		OutputTokens:        result.Usage.OutputTokens,
		CacheCreationTokens: result.Usage.CacheCreationInputTokens,
		CacheReadTokens:     result.Usage.CacheReadInputTokens,
		ImageOutputTokens:   result.Usage.ImageOutputTokens,
		ImageCount:          result.ImageCount,
		ImageSize:           optionalTrimmedStringPtr(result.ImageSize),
	}
	if cost != nil {
		usageLog.InputCost = cost.InputCost
		usageLog.OutputCost = cost.OutputCost
		usageLog.ImageOutputCost = cost.ImageOutputCost
		usageLog.CacheCreationCost = cost.CacheCreationCost
		usageLog.CacheReadCost = cost.CacheReadCost
		usageLog.TotalCost = cost.TotalCost
		usageLog.ActualCost = cost.ActualCost
	}
	usageLog.RateMultiplier = multiplier
	usageLog.AccountRateMultiplier = &accountRateMultiplier
	usageLog.BillingType = billingType
	usageLog.Stream = result.Stream
	usageLog.OpenAIWSMode = result.OpenAIWSMode
	usageLog.DurationMs = &durationMs
	usageLog.FirstTokenMs = result.FirstTokenMs
	usageLog.CreatedAt = time.Now()
	// Channel information.
	usageLog.ChannelID = optionalInt64Ptr(input.ChannelID)
	usageLog.ModelMappingChain = optionalTrimmedStringPtr(input.ModelMappingChain)
	// Billing mode: prefer the mode reported by the cost breakdown, then
	// image mode for image results, otherwise token mode.
	if cost != nil && cost.BillingMode != "" {
		billingMode := cost.BillingMode
		usageLog.BillingMode = &billingMode
	} else if result.ImageCount > 0 {
		billingMode := string(BillingModeImage)
		usageLog.BillingMode = &billingMode
	} else {
		billingMode := string(BillingModeToken)
		usageLog.BillingMode = &billingMode
	}
	// Attach the User-Agent when present.
	if input.UserAgent != "" {
		usageLog.UserAgent = &input.UserAgent
	}

	// Attach the client IP address when present.
	if input.IPAddress != "" {
		usageLog.IPAddress = &input.IPAddress
	}

	if apiKey.GroupID != nil {
		usageLog.GroupID = apiKey.GroupID
	}
	if subscription != nil {
		usageLog.SubscriptionID = &subscription.ID
	}

	// Account-stats pricing cost (custom rules are matched against the final
	// upstream model).
	if apiKey.GroupID != nil {
		// cost is nil-checked everywhere else in this function; do the same
		// here so a nil breakdown cannot panic.
		statsCost := cost
		if statsCost == nil {
			statsCost = &CostBreakdown{}
		}
		applyAccountStatsCost(ctx, usageLog, s.channelService, s.billingService,
			account.ID, *apiKey.GroupID, result.UpstreamModel, result.Model,
			tokens, statsCost.TotalCost,
		)
	}

	if s.cfg != nil && s.cfg.RunMode == config.RunModeSimple {
		writeUsageLogBestEffort(ctx, s.usageLogRepo, usageLog, "service.openai_gateway")
		logger.LegacyPrintf("service.openai_gateway", "[SIMPLE MODE] Usage recorded (not billed): user=%d, tokens=%d", usageLog.UserID, usageLog.TotalTokens())
		s.deferredService.ScheduleLastUsedUpdate(account.ID)
		return nil
	}

	if _, err := applyUsageBilling(ctx, requestID, usageLog, &postUsageBillingParams{
		Cost:                  cost,
		User:                  user,
		APIKey:                apiKey,
		Account:               account,
		Subscription:          subscription,
		RequestPayloadHash:    resolveUsageBillingPayloadFingerprint(ctx, input.RequestPayloadHash),
		IsSubscriptionBill:    isSubscriptionBilling,
		AccountRateMultiplier: accountRateMultiplier,
		APIKeyService:         input.APIKeyService,
	}, s.billingDeps(), s.usageBillingRepo); err != nil {
		return err
	}
	writeUsageLogBestEffort(ctx, s.usageLogRepo, usageLog, "service.openai_gateway")

	return nil
}

// calculateOpenAIRecordUsageCost computes the cost breakdown for one usage
// record.
//
//   - Results that produced images (result.ImageCount > 0) are priced by
//     calculateOpenAIImageCost.
//   - Otherwise, when a pricing resolver is configured and the API key has a
//     group, the unified calculator is used with that group's ID.
//   - Otherwise pricing falls back to CalculateCostWithServiceTier.
//
// apiKey may be nil; in that case the group-aware path is skipped.
func (s *OpenAIGatewayService) calculateOpenAIRecordUsageCost(
	ctx context.Context,
	result *OpenAIForwardResult,
	apiKey *APIKey,
	billingModel string,
	multiplier float64,
	tokens UsageTokens,
	serviceTier string,
) (*CostBreakdown, error) {
	if result != nil && result.ImageCount > 0 {
		return s.calculateOpenAIImageCost(ctx, billingModel, apiKey, result, multiplier), nil
	}
	// Guard apiKey as well as its Group, matching the nil handling in
	// calculateOpenAIImageCost and resolveOpenAIChannelPricing.
	if s.resolver != nil && apiKey != nil && apiKey.Group != nil {
		gid := apiKey.Group.ID
		return s.billingService.CalculateCostUnified(CostInput{
			Ctx:            ctx,
			Model:          billingModel,
			GroupID:        &gid,
			Tokens:         tokens,
			RequestCount:   1,
			RateMultiplier: multiplier,
			ServiceTier:    serviceTier,
			Resolver:       s.resolver,
		})
	}
	return s.billingService.CalculateCostWithServiceTier(billingModel, tokens, multiplier, serviceTier)
}

// calculateOpenAIImageCost prices an image-generation result.
//
// When channel pricing resolves for the model/group and its mode is
// per-request or image, the unified calculator is tried first; if it fails the
// error is logged and pricing falls through. The fallback is
// CalculateImageCost, fed with the group's 1K/2K/4K image prices when the API
// key has a group (nil config otherwise).
func (s *OpenAIGatewayService) calculateOpenAIImageCost(
	ctx context.Context,
	billingModel string,
	apiKey *APIKey,
	result *OpenAIForwardResult,
	multiplier float64,
) *CostBreakdown {
	resolved := s.resolveOpenAIChannelPricing(ctx, billingModel, apiKey)
	channelPriced := resolved != nil &&
		(resolved.Mode == BillingModePerRequest || resolved.Mode == BillingModeImage)
	if channelPriced {
		// A non-nil resolved pricing implies apiKey and apiKey.Group are set.
		groupID := apiKey.Group.ID
		breakdown, err := s.billingService.CalculateCostUnified(CostInput{
			Ctx:            ctx,
			Model:          billingModel,
			GroupID:        &groupID,
			RequestCount:   1,
			SizeTier:       result.ImageSize,
			RateMultiplier: multiplier,
			Resolver:       s.resolver,
			Resolved:       resolved,
		})
		if err == nil {
			return breakdown
		}
		logger.LegacyPrintf("service.openai_gateway", "Calculate image channel cost failed: %v", err)
	}

	var groupPrices *ImagePriceConfig
	if apiKey != nil && apiKey.Group != nil {
		group := apiKey.Group
		groupPrices = &ImagePriceConfig{
			Price1K: group.ImagePrice1K,
			Price2K: group.ImagePrice2K,
			Price4K: group.ImagePrice4K,
		}
	}
	return s.billingService.CalculateImageCost(billingModel, result.ImageSize, result.ImageCount, groupPrices, multiplier)
}

// resolveOpenAIChannelPricing resolves pricing for billingModel within the API
// key's group and returns it only when its source is channel pricing. It
// returns nil when no resolver is configured, when apiKey or its group is nil,
// or when the resolved pricing comes from any other source.
func (s *OpenAIGatewayService) resolveOpenAIChannelPricing(ctx context.Context, billingModel string, apiKey *APIKey) *ResolvedPricing {
	if s.resolver == nil || apiKey == nil || apiKey.Group == nil {
		return nil
	}

	groupID := apiKey.Group.ID
	pricing := s.resolver.Resolve(ctx, PricingInput{Model: billingModel, GroupID: &groupID})
	if pricing.Source != PricingSourceChannel {
		return nil
	}
	return pricing
}

// ParseCodexRateLimitHeaders extracts Codex usage limits from response headers.
// Exported for use in ratelimit_service when handling OpenAI 429 responses.
//
// Each x-codex-* header is optional; a missing or unparsable value leaves the
// matching snapshot field nil. When none of the headers yields a value the
// function returns nil. Otherwise UpdatedAt is stamped with the current time
// in RFC 3339 format.
func ParseCodexRateLimitHeaders(headers http.Header) *OpenAICodexUsageSnapshot {
	var (
		snapshot = &OpenAICodexUsageSnapshot{}
		found    bool
	)

	// readFloat stores the header as a float64 when it is present and parses.
	readFloat := func(name string, dst **float64) {
		raw := headers.Get(name)
		if raw == "" {
			return
		}
		parsed, err := strconv.ParseFloat(raw, 64)
		if err != nil {
			return
		}
		*dst = &parsed
		found = true
	}

	// readInt stores the header as an int when it is present and parses.
	readInt := func(name string, dst **int) {
		raw := headers.Get(name)
		if raw == "" {
			return
		}
		parsed, err := strconv.Atoi(raw)
		if err != nil {
			return
		}
		*dst = &parsed
		found = true
	}

	// Primary window.
	readFloat("x-codex-primary-used-percent", &snapshot.PrimaryUsedPercent)
	readInt("x-codex-primary-reset-after-seconds", &snapshot.PrimaryResetAfterSeconds)
	readInt("x-codex-primary-window-minutes", &snapshot.PrimaryWindowMinutes)

	// Secondary window.
	readFloat("x-codex-secondary-used-percent", &snapshot.SecondaryUsedPercent)
	readInt("x-codex-secondary-reset-after-seconds", &snapshot.SecondaryResetAfterSeconds)
	readInt("x-codex-secondary-window-minutes", &snapshot.SecondaryWindowMinutes)

	// Overflow ratio.
	readFloat("x-codex-primary-over-secondary-limit-percent", &snapshot.PrimaryOverSecondaryPercent)

	if !found {
		return nil
	}

	snapshot.UpdatedAt = time.Now().Format(time.RFC3339)
	return snapshot
}

// codexSnapshotBaseTime returns the snapshot's UpdatedAt parsed as RFC 3339.
// It returns fallback when the snapshot is nil, UpdatedAt is empty, or the
// timestamp does not parse.
func codexSnapshotBaseTime(snapshot *OpenAICodexUsageSnapshot, fallback time.Time) time.Time {
	if snapshot == nil || snapshot.UpdatedAt == "" {
		return fallback
	}
	if parsed, err := time.Parse(time.RFC3339, snapshot.UpdatedAt); err == nil {
		return parsed
	}
	return fallback
}

// codexResetAtRFC3339 turns a "reset after N seconds" value into an absolute
// RFC 3339 timestamp relative to base. Negative values are treated as zero.
// It returns nil when resetAfterSeconds is nil.
func codexResetAtRFC3339(base time.Time, resetAfterSeconds *int) *string {
	if resetAfterSeconds == nil {
		return nil
	}

	var offset time.Duration
	if secs := *resetAfterSeconds; secs > 0 {
		offset = time.Duration(secs) * time.Second
	}

	stamp := base.Add(offset).Format(time.RFC3339)
	return &stamp
}

// buildCodexUsageExtraUpdates flattens a Codex usage snapshot into the
// key/value pairs stored in an account's Extra field. It returns nil for a nil
// snapshot.
//
// The result always contains codex_usage_updated_at (the snapshot's UpdatedAt,
// or fallbackNow when that is missing or invalid). Raw primary/secondary
// fields are copied when set, to help troubleshooting. When
// snapshot.Normalize() yields a value, the normalized 5h/7d fields are added
// too, together with absolute reset timestamps derived from the base time.
func buildCodexUsageExtraUpdates(snapshot *OpenAICodexUsageSnapshot, fallbackNow time.Time) map[string]any {
	if snapshot == nil {
		return nil
	}

	anchor := codexSnapshotBaseTime(snapshot, fallbackNow)
	extra := map[string]any{
		"codex_usage_updated_at": anchor.Format(time.RFC3339),
	}

	setFloat := func(key string, value *float64) {
		if value != nil {
			extra[key] = *value
		}
	}
	setInt := func(key string, value *int) {
		if value != nil {
			extra[key] = *value
		}
	}

	// Raw primary/secondary fields, kept for troubleshooting.
	setFloat("codex_primary_used_percent", snapshot.PrimaryUsedPercent)
	setInt("codex_primary_reset_after_seconds", snapshot.PrimaryResetAfterSeconds)
	setInt("codex_primary_window_minutes", snapshot.PrimaryWindowMinutes)
	setFloat("codex_secondary_used_percent", snapshot.SecondaryUsedPercent)
	setInt("codex_secondary_reset_after_seconds", snapshot.SecondaryResetAfterSeconds)
	setInt("codex_secondary_window_minutes", snapshot.SecondaryWindowMinutes)
	setFloat("codex_primary_over_secondary_percent", snapshot.PrimaryOverSecondaryPercent)

	// Canonical 5h/7d fields.
	normalized := snapshot.Normalize()
	if normalized == nil {
		return extra
	}

	if normalized.Used5hPercent != nil {
		extra["codex_5h_used_percent"] = *normalized.Used5hPercent
	}
	if normalized.Window5hMinutes != nil {
		extra["codex_5h_window_minutes"] = *normalized.Window5hMinutes
	}
	if secs := normalized.Reset5hSeconds; secs != nil {
		extra["codex_5h_reset_after_seconds"] = *secs
		if resetAt := codexResetAtRFC3339(anchor, secs); resetAt != nil {
			extra["codex_5h_reset_at"] = *resetAt
		}
	}

	if normalized.Used7dPercent != nil {
		extra["codex_7d_used_percent"] = *normalized.Used7dPercent
	}
	if normalized.Window7dMinutes != nil {
		extra["codex_7d_window_minutes"] = *normalized.Window7dMinutes
	}
	if secs := normalized.Reset7dSeconds; secs != nil {
		extra["codex_7d_reset_after_seconds"] = *secs
		if resetAt := codexResetAtRFC3339(anchor, secs); resetAt != nil {
			extra["codex_7d_reset_at"] = *resetAt
		}
	}

	return extra
}

// updateCodexUsageSnapshot saves the Codex usage snapshot to the account's
// Extra field.
//
// It is a no-op when the snapshot, the service or its account repository is
// nil, when there is nothing to write, or when the per-account throttle denies
// the write. The write runs in a separate goroutine with its own 5-second
// timeout, detached from ctx, and its error is discarded.
func (s *OpenAIGatewayService) updateCodexUsageSnapshot(ctx context.Context, accountID int64, snapshot *OpenAICodexUsageSnapshot) {
	if snapshot == nil || s == nil || s.accountRepo == nil {
		return
	}

	startedAt := time.Now()
	extra := buildCodexUsageExtraUpdates(snapshot, startedAt)
	if len(extra) == 0 {
		return
	}
	// Consult the throttle only once there is something to write.
	if allowed := s.getCodexSnapshotThrottle().Allow(accountID, startedAt); !allowed {
		return
	}

	persist := func() {
		writeCtx, release := context.WithTimeout(context.Background(), 5*time.Second)
		defer release()
		// The snapshot is only used for display/diagnostics, so a failed
		// write is deliberately ignored.
		_ = s.accountRepo.UpdateExtra(writeCtx, accountID, extra)
	}
	go persist()
}

// UpdateCodexUsageSnapshotFromHeaders parses Codex rate-limit headers and, when
// they contain any usage data, hands the snapshot to updateCodexUsageSnapshot.
// It does nothing for a non-positive accountID or nil headers.
func (s *OpenAIGatewayService) UpdateCodexUsageSnapshotFromHeaders(ctx context.Context, accountID int64, headers http.Header) {
	if accountID <= 0 || headers == nil {
		return
	}

	snapshot := ParseCodexRateLimitHeaders(headers)
	if snapshot == nil {
		return
	}
	s.updateCodexUsageSnapshot(ctx, accountID, snapshot)
}

// getOpenAIReasoningEffortFromReqBody reads the reasoning effort from a parsed
// request body. The nested reasoning.effort string takes precedence; the flat
// reasoning_effort string, which some clients may send, is the fallback.
//
// present is true when either field holds a string; value is that string
// passed through normalizeOpenAIReasoningEffort.
func getOpenAIReasoningEffortFromReqBody(reqBody map[string]any) (value string, present bool) {
	// Lookups on a nil map are safe and simply miss.
	if nested, isMap := reqBody["reasoning"].(map[string]any); isMap {
		if raw, isString := nested["effort"].(string); isString {
			return normalizeOpenAIReasoningEffort(raw), true
		}
	}

	if raw, isString := reqBody["reasoning_effort"].(string); isString {
		return normalizeOpenAIReasoningEffort(raw), true
	}

	return "", false
}

// deriveOpenAIReasoningEffortFromModel guesses a reasoning effort from the
// model name. It keeps the part after the last "/", lower-cases it, splits it
// on '-', '_' and ' ', and passes the final token to
// normalizeOpenAIReasoningEffort. A blank model or a name without tokens
// yields "".
func deriveOpenAIReasoningEffortFromModel(model string) string {
	modelID := strings.TrimSpace(model)
	if modelID == "" {
		return ""
	}

	// Drop any "vendor/" style prefix.
	if slash := strings.LastIndex(modelID, "/"); slash >= 0 {
		modelID = modelID[slash+1:]
	}

	isSeparator := func(r rune) bool {
		return r == '-' || r == '_' || r == ' '
	}
	tokens := strings.FieldsFunc(strings.ToLower(modelID), isSeparator)
	if len(tokens) == 0 {
		return ""
	}

	return normalizeOpenAIReasoningEffort(tokens[len(tokens)-1])
}

// extractOpenAIRequestMetaFromBody reads the model, stream and
// prompt_cache_key fields from a raw JSON request body. String fields are
// trimmed. An empty body yields zero values.
func extractOpenAIRequestMetaFromBody(body []byte) (model string, stream bool, promptCacheKey string) {
	if len(body) == 0 {
		return "", false, ""
	}

	trimmedString := func(path string) string {
		return strings.TrimSpace(gjson.GetBytes(body, path).String())
	}

	model = trimmedString("model")
	stream = gjson.GetBytes(body, "stream").Bool()
	promptCacheKey = trimmedString("prompt_cache_key")
	return model, stream, promptCacheKey
}

// normalizeOpenAIPassthroughOAuthBody rewrites a passthrough OAuth request body
// so it matches the behavior of the legacy path:
//   - compact requests: the store and stream fields are removed when present;
//   - all other requests: store is forced to false and stream to true.
//
// It returns the resulting body, whether anything changed, and any rewrite
// error. An empty body is returned untouched; on error the original body is
// returned with changed=false.
func normalizeOpenAIPassthroughOAuthBody(body []byte, compact bool) ([]byte, bool, error) {
	if len(body) == 0 {
		return body, false, nil
	}

	current := body
	modified := false

	if compact {
		for _, field := range []string{"store", "stream"} {
			if !gjson.GetBytes(current, field).Exists() {
				continue
			}
			stripped, err := sjson.DeleteBytes(current, field)
			if err != nil {
				return body, false, fmt.Errorf("normalize passthrough body delete %s: %w", field, err)
			}
			current = stripped
			modified = true
		}
		return current, modified, nil
	}

	forced := []struct {
		field    string
		value    bool
		jsonType gjson.Type
	}{
		{field: "store", value: false, jsonType: gjson.False},
		{field: "stream", value: true, jsonType: gjson.True},
	}
	for _, want := range forced {
		// Already holds the exact literal we want: leave it alone.
		if have := gjson.GetBytes(current, want.field); have.Exists() && have.Type == want.jsonType {
			continue
		}
		updated, err := sjson.SetBytes(current, want.field, want.value)
		if err != nil {
			return body, false, fmt.Errorf("normalize passthrough body %s=%t: %w", want.field, want.value, err)
		}
		current = updated
		modified = true
	}

	return current, modified, nil
}

// detectOpenAIPassthroughInstructionsRejectReason checks the instructions
// field of a passthrough request. The check only applies to models whose
// lower-cased, trimmed name contains "codex"; other models always get "".
//
// Returned reasons: "instructions_missing", "instructions_not_string",
// "instructions_empty", or "" when the field is a non-blank string.
func detectOpenAIPassthroughInstructionsRejectReason(reqModel string, body []byte) string {
	if !strings.Contains(strings.ToLower(strings.TrimSpace(reqModel)), "codex") {
		return ""
	}

	field := gjson.GetBytes(body, "instructions")
	switch {
	case !field.Exists():
		return "instructions_missing"
	case field.Type != gjson.String:
		return "instructions_not_string"
	case strings.TrimSpace(field.String()) == "":
		return "instructions_empty"
	default:
		return ""
	}
}

// extractOpenAIReasoningEffortFromBody determines the reasoning effort for a
// raw JSON request body. It reads reasoning.effort, then reasoning_effort;
// when either is non-blank it is normalized and returned (nil if
// normalization yields ""). When the body carries no effort, the value is
// derived from requestedModel instead. nil means no effort could be
// determined.
func extractOpenAIReasoningEffortFromBody(body []byte, requestedModel string) *string {
	raw := strings.TrimSpace(gjson.GetBytes(body, "reasoning.effort").String())
	if raw == "" {
		raw = strings.TrimSpace(gjson.GetBytes(body, "reasoning_effort").String())
	}

	var effort string
	if raw != "" {
		// An explicit value never falls back to the model name, even when it
		// normalizes to nothing.
		effort = normalizeOpenAIReasoningEffort(raw)
	} else {
		effort = deriveOpenAIReasoningEffortFromModel(requestedModel)
	}

	if effort == "" {
		return nil
	}
	return &effort
}

// extractOpenAIServiceTier returns the normalized service_tier from a parsed
// request body, or nil when the body is nil, the field is absent or not a
// string, or normalizeOpenAIServiceTier rejects the value.
func extractOpenAIServiceTier(reqBody map[string]any) *string {
	// Indexing a nil map is safe and yields a failed type assertion.
	if tier, isString := reqBody["service_tier"].(string); isString {
		return normalizeOpenAIServiceTier(tier)
	}
	return nil
}

func extractOpenAIServiceTierFromBody(body []byte) *string {
	if len(body) == 0 {
		return nil
	}
	return normalizeOpenAIServiceTier(gjson.GetBytes(body, "service_tier").String())
}

// normalizeOpenAIServiceTier canonicalizes a service_tier value. The input is
// trimmed and lower-cased, and the alias "fast" is mapped to "priority".
//
// The accepted values are priority, flex, auto, default and scale; the
// original author's note describes these as the tiers documented by OpenAI.
// Anything else, including a blank value, yields nil.
func normalizeOpenAIServiceTier(raw string) *string {
	tier := strings.ToLower(strings.TrimSpace(raw))

	switch tier {
	case "fast":
		tier = "priority"
	case "priority", "flex", "auto", "default", "scale":
		// Already canonical.
	default:
		return nil
	}
	return &tier
}

// OpenAIFastBlockedError indicates a request was rejected by the OpenAI fast
// policy (action=block). Mirrors BetaBlockedError on the Claude side.
type OpenAIFastBlockedError struct {
	// Message is the text returned by Error.
	Message string
}

// Error implements the error interface by returning Message.
func (e *OpenAIFastBlockedError) Error() string { return e.Message }

// evaluateOpenAIFastPolicy returns the action and error message that should be
// applied for a request with the given account/model/service_tier. When the
// policy service is unavailable, the tier is blank, the settings cannot be
// loaded, or no rule matches, it returns (BetaPolicyActionPass, "") so callers
// can short-circuit safely.
//
// Settings come from the context when a snapshot was attached with
// withOpenAIFastPolicyContext; otherwise they are fetched from the setting
// service. Matching itself is delegated to
// evaluateOpenAIFastPolicyWithSettings:
//   - Scope filters by account type (all / oauth / apikey / bedrock)
//   - ServiceTier must be empty (= any), "all", or equal the normalized tier
//   - ModelWhitelist narrows the rule to specific models; FallbackAction
//     handles the non-matching case (default: pass)
//
// Difference from the Claude BetaPolicy: the first matching rule wins. The
// fast policy acts on a single field (service_tier), so filtering simply
// removes that field and there is nothing to accumulate across rules; when
// model whitelists overlap within the same scope and tier, rule order
// expresses the admin's intent.
func (s *OpenAIGatewayService) evaluateOpenAIFastPolicy(ctx context.Context, account *Account, model, serviceTier string) (action, errMsg string) {
	if s == nil || s.settingService == nil {
		return BetaPolicyActionPass, ""
	}

	tier := strings.ToLower(strings.TrimSpace(serviceTier))
	if tier == "" {
		return BetaPolicyActionPass, ""
	}

	settings := openAIFastPolicySettingsFromContext(ctx)
	if settings == nil {
		var err error
		settings, err = s.settingService.GetOpenAIFastPolicySettings(ctx)
		if err != nil || settings == nil {
			return BetaPolicyActionPass, ""
		}
	}

	return evaluateOpenAIFastPolicyWithSettings(settings, account, model, tier)
}

// evaluateOpenAIFastPolicyWithSettings is the pure-function core of the fast
// policy, split out so long-lived sessions (e.g. WS) can prefetch settings
// once instead of hitting the settingService on every frame.
//
// Rules are scanned in order. The first rule whose scope matches the account
// and whose ServiceTier is blank, equal to OpenAIFastTierAny, or equal to tier
// decides the outcome via resolveRuleAction. Nil settings or no matching rule
// yield (BetaPolicyActionPass, ""). tier is compared as given, against the
// trimmed, lower-cased rule tier.
func evaluateOpenAIFastPolicyWithSettings(settings *OpenAIFastPolicySettings, account *Account, model, tier string) (action, errMsg string) {
	if settings == nil {
		return BetaPolicyActionPass, ""
	}

	oauthAccount := account != nil && account.IsOAuth()
	bedrockAccount := account != nil && account.IsBedrock()

	for _, rule := range settings.Rules {
		if !betaPolicyScopeMatches(rule.Scope, oauthAccount, bedrockAccount) {
			continue
		}

		wantTier := strings.ToLower(strings.TrimSpace(rule.ServiceTier))
		tierMatches := wantTier == "" || wantTier == OpenAIFastTierAny || wantTier == tier
		if !tierMatches {
			continue
		}

		// First match wins: express the rule as a BetaPolicyRule so the
		// shared whitelist/fallback resolution can be reused.
		return resolveRuleAction(BetaPolicyRule{
			Action:               rule.Action,
			ErrorMessage:         rule.ErrorMessage,
			ModelWhitelist:       rule.ModelWhitelist,
			FallbackAction:       rule.FallbackAction,
			FallbackErrorMessage: rule.FallbackErrorMessage,
		}, model)
	}

	return BetaPolicyActionPass, ""
}

// openAIFastPolicyCtxKey is the context key under which a prefetched
// OpenAIFastPolicySettings snapshot is cached. It exists so that the frames of
// a long-lived WebSocket session can reuse one policy snapshot instead of
// hitting the database on every frame.
//
// Trade-off: a policy change does not affect the current WS session, only new
// sessions. This is intentional: for long sessions, policy consistency matters
// more than taking effect immediately, and the gin.Context cache used by the
// Claude BetaPolicy makes the same trade-off. When a hot reload is needed, an
// administrator can force a refresh by disconnecting the session.
type openAIFastPolicyCtxKeyType struct{}

var openAIFastPolicyCtxKey = openAIFastPolicyCtxKeyType{}

// withOpenAIFastPolicyContext binds a settings snapshot to ctx so that calls
// to evaluateOpenAIFastPolicy made with the returned context (or contexts
// derived from it) reuse the snapshot. When ctx or settings is nil, ctx is
// returned unchanged.
func withOpenAIFastPolicyContext(ctx context.Context, settings *OpenAIFastPolicySettings) context.Context {
	if ctx != nil && settings != nil {
		return context.WithValue(ctx, openAIFastPolicyCtxKey, settings)
	}
	return ctx
}

// openAIFastPolicySettingsFromContext returns the settings snapshot stored
// under openAIFastPolicyCtxKey, or nil when ctx is nil or holds no such
// snapshot.
func openAIFastPolicySettingsFromContext(ctx context.Context) *OpenAIFastPolicySettings {
	if ctx == nil {
		return nil
	}
	// A failed assertion leaves settings at its zero value, nil.
	settings, _ := ctx.Value(openAIFastPolicyCtxKey).(*OpenAIFastPolicySettings)
	return settings
}

// applyOpenAIFastPolicyToBody applies the OpenAI fast policy to a raw request
// body and returns the body to forward.
//
//   - block: returns the original body and an *OpenAIFastBlockedError;
//   - filter: returns a body with the service_tier field removed;
//   - pass: rewrites service_tier to its normalized value when the two differ
//     (e.g. client alias "fast" → "priority"), otherwise returns the body
//     unchanged.
//
// Bodies that are empty, carry no service_tier, or whose tier normalizes to ""
// are returned untouched without consulting the policy.
//
// Why normalize on pass: according to the original author's note, the
// chat-completions / messages entry points normalize service_tier before
// calling this function, while the passthrough and native /responses entry
// points do not. Normalizing here keeps an alias such as "fast" from reaching
// the upstream verbatim and makes every entry point behave the same.
func (s *OpenAIGatewayService) applyOpenAIFastPolicyToBody(ctx context.Context, account *Account, model string, body []byte) ([]byte, error) {
	if len(body) == 0 {
		return body, nil
	}

	requested := gjson.GetBytes(body, "service_tier").String()
	if requested == "" {
		return body, nil
	}
	canonical := normalizedOpenAIServiceTierValue(requested)
	if canonical == "" {
		return body, nil
	}

	action, policyMsg := s.evaluateOpenAIFastPolicy(ctx, account, model, canonical)

	if action == BetaPolicyActionBlock {
		if policyMsg == "" {
			policyMsg = fmt.Sprintf("openai service_tier=%s is not allowed for model %s", canonical, model)
		}
		return body, &OpenAIFastBlockedError{Message: policyMsg}
	}

	if action == BetaPolicyActionFilter {
		stripped, err := sjson.DeleteBytes(body, "service_tier")
		if err != nil {
			return body, fmt.Errorf("strip service_tier from body: %w", err)
		}
		return stripped, nil
	}

	// Pass: write the canonical value back only when the client sent an alias.
	if canonical == requested {
		return body, nil
	}
	rewritten, err := sjson.SetBytes(body, "service_tier", canonical)
	if err != nil {
		return body, fmt.Errorf("normalize service_tier on pass: %w", err)
	}
	return rewritten, nil
}

// writeOpenAIFastPolicyBlockedResponse writes a 403 JSON response for a
// request blocked by the OpenAI fast policy. The payload has the shape
// {"error": {"type": "permission_error", "message": <err.Message>}}. It does
// nothing when c or err is nil.
func writeOpenAIFastPolicyBlockedResponse(c *gin.Context, err *OpenAIFastBlockedError) {
	if c == nil || err == nil {
		return
	}

	payload := gin.H{
		"error": gin.H{
			"type":    "permission_error",
			"message": err.Message,
		},
	}
	c.JSON(http.StatusForbidden, payload)
}

// applyOpenAIFastPolicyToWSResponseCreate evaluates the OpenAI fast policy
// against a single client→upstream WebSocket frame whose top-level
// "type" is "response.create". It is the WebSocket counterpart of
// applyOpenAIFastPolicyToBody:
//
//   - pass: returns the frame unchanged (no blocked error)
//   - filter: returns a copy with the top-level service_tier removed
//   - block: returns (frame, *OpenAIFastBlockedError, nil)
//
// Unlike the HTTP helper, the pass path does not rewrite service_tier.
//
// Only frames whose trimmed "type" equals "response.create" are inspected or
// mutated. Empty frames, invalid JSON and every other frame type (including
// an empty type) pass through untouched, so fields are never stripped from
// unrelated client events; rejecting malformed frames is left to the upstream.
// Frames without a service_tier, or whose tier normalizes to "", also pass
// through without consulting the policy.
//
// Only the top-level service_tier field is examined; the original author's
// note states that response.create carries it at the top level, like the
// Responses HTTP body, with no nested form.
//
// The caller is responsible for choosing the upstream model passed in —
// this helper does not re-derive it.
func (s *OpenAIGatewayService) applyOpenAIFastPolicyToWSResponseCreate(
	ctx context.Context,
	account *Account,
	model string,
	frame []byte,
) ([]byte, *OpenAIFastBlockedError, error) {
	if len(frame) == 0 || !gjson.ValidBytes(frame) {
		return frame, nil, nil
	}

	// Strict match on the event type: anything else is not policed here.
	if eventType := strings.TrimSpace(gjson.GetBytes(frame, "type").String()); eventType != "response.create" {
		return frame, nil, nil
	}

	requested := gjson.GetBytes(frame, "service_tier").String()
	if requested == "" {
		return frame, nil, nil
	}
	canonical := normalizedOpenAIServiceTierValue(requested)
	if canonical == "" {
		return frame, nil, nil
	}

	action, policyMsg := s.evaluateOpenAIFastPolicy(ctx, account, model, canonical)

	if action == BetaPolicyActionBlock {
		if policyMsg == "" {
			policyMsg = fmt.Sprintf("openai service_tier=%s is not allowed for model %s", canonical, model)
		}
		return frame, &OpenAIFastBlockedError{Message: policyMsg}, nil
	}

	if action == BetaPolicyActionFilter {
		stripped, err := sjson.DeleteBytes(frame, "service_tier")
		if err != nil {
			return frame, nil, fmt.Errorf("strip service_tier from ws frame: %w", err)
		}
		return stripped, nil, nil
	}

	return frame, nil, nil
}

// newOpenAIFastPolicyWSEventID produces the event_id used on server-emitted
// error events: "evt_" followed by the 32 lowercase hex digits of a random
// UUID (i.e. the canonical UUID text without its dashes). The value is meant
// for client-side log correlation only. If random UUID generation fails, a
// fixed non-empty identifier is returned so the field is never blank.
func newOpenAIFastPolicyWSEventID() string {
	const fallbackID = "evt_openai_fast_policy"

	id, err := uuid.NewRandom()
	if err != nil {
		return fallbackID
	}
	// Hex-encoding the 16 raw bytes yields the same text as the canonical
	// UUID string with the dashes removed.
	return "evt_" + hex.EncodeToString(id[:])
}

// buildOpenAIFastPolicyBlockedWSEvent serializes a WebSocket "error" event
// describing a request rejected by the OpenAI fast policy. The JSON object
// has this logical shape (key order in the output follows encoding/json's
// sorted map encoding):
//
//	{
//	  "event_id": "evt_<random>",
//	  "type": "error",
//	  "error": {
//	    "type": "invalid_request_error",
//	    "code": "policy_violation",
//	    "message": "<err.Message>"
//	  }
//	}
//
// event_id is freshly generated per call so clients can correlate the
// rejection in their logs, and "code" is a stable identifier for
// programmatic handling. A nil err yields a nil slice. Should marshaling
// fail, a hand-written payload with a generic message is returned instead.
func buildOpenAIFastPolicyBlockedWSEvent(err *OpenAIFastBlockedError) []byte {
	if err == nil {
		return nil
	}

	eventID := newOpenAIFastPolicyWSEventID()
	errorDetail := map[string]any{
		"type":    "invalid_request_error",
		"code":    "policy_violation",
		"message": err.Message,
	}
	event := map[string]any{
		"event_id": eventID,
		"type":     "error",
		"error":    errorDetail,
	}

	if encoded, encErr := json.Marshal(event); encErr == nil {
		return encoded
	}
	// Marshaling plain strings is not expected to fail; this static payload
	// only exists so the caller always has something to send.
	return []byte(`{"event_id":"` + eventID + `","type":"error","error":{"type":"invalid_request_error","code":"policy_violation","message":"openai fast policy blocked this request"}}`)
}

// sanitizeEmptyBase64InputImagesInOpenAIBody removes input_image parts whose
// image_url is a base64 data URI with an empty payload from a raw JSON
// request body.
//
// It returns the (possibly rewritten) body, whether anything was removed,
// and an error if the body could not be parsed or re-serialized. On error,
// or when nothing needed removing, the original body slice is returned.
// When a rewrite happens the body is re-encoded from a generic map, so key
// order and formatting of the result may differ from the input.
func sanitizeEmptyBase64InputImagesInOpenAIBody(body []byte) ([]byte, bool, error) {
	// Cheap byte scan first: skip JSON parsing entirely unless the body can
	// possibly contain a base64 image_url.
	candidate := len(body) > 0 &&
		bytes.Contains(body, []byte(`"image_url"`)) &&
		bytes.Contains(body, []byte(`base64,`))
	if !candidate {
		return body, false, nil
	}

	var parsed map[string]any
	if err := json.Unmarshal(body, &parsed); err != nil {
		return body, false, fmt.Errorf("sanitize request body: %w", err)
	}
	if removed := sanitizeEmptyBase64InputImagesInOpenAIRequestBodyMap(parsed); !removed {
		return body, false, nil
	}

	rewritten, err := json.Marshal(parsed)
	if err != nil {
		return body, false, fmt.Errorf("serialize sanitized request body: %w", err)
	}
	return rewritten, true, nil
}

// sanitizeEmptyBase64InputImagesInOpenAIRequestBodyMap sanitizes the "input"
// entry of an already-parsed request body in place. It reports whether the
// entry was replaced; a nil map or a map without "input" is left alone.
func sanitizeEmptyBase64InputImagesInOpenAIRequestBodyMap(reqBody map[string]any) bool {
	// Indexing a nil map is safe and simply reports the key as absent.
	input, present := reqBody["input"]
	if !present {
		return false
	}
	cleaned, changed := sanitizeEmptyBase64InputImagesInOpenAIInput(input)
	if changed {
		reqBody["input"] = cleaned
	}
	return changed
}

// sanitizeEmptyBase64InputImagesInOpenAIInput drops empty-base64 input_image
// entries from a request's "input" value.
//
// Only list-shaped input is processed; anything else is returned unchanged.
// For each list element that is a JSON object:
//   - if the element itself is an empty-base64 input_image, it is dropped;
//   - otherwise, if it has a list-valued "content", empty-base64 input_image
//     parts are removed from that list (the element's map is updated in
//     place), and the element is dropped entirely when no parts remain.
//
// Returns the new list and true when at least one entry or part was
// removed; otherwise returns the original input and false.
func sanitizeEmptyBase64InputImagesInOpenAIInput(input any) (any, bool) {
	entries, isList := input.([]any)
	if !isList {
		return input, false
	}

	kept := make([]any, 0, len(entries))
	dirty := false
	for _, entry := range entries {
		entryMap, isObject := entry.(map[string]any)
		if !isObject {
			kept = append(kept, entry)
			continue
		}
		if shouldDropEmptyBase64InputImagePart(entryMap) {
			dirty = true
			continue
		}

		// A missing "content" key and a non-list "content" are treated the
		// same way: the entry is kept untouched.
		parts, hasParts := entryMap["content"].([]any)
		if !hasParts {
			kept = append(kept, entryMap)
			continue
		}

		remaining := make([]any, 0, len(parts))
		for _, part := range parts {
			if !shouldDropEmptyBase64InputImagePart(part) {
				remaining = append(remaining, part)
			}
		}
		if len(remaining) != len(parts) {
			dirty = true
			if len(remaining) == 0 {
				// Every part was an empty image: drop the whole entry.
				continue
			}
			entryMap["content"] = remaining
		}
		kept = append(kept, entryMap)
	}

	if !dirty {
		return input, false
	}
	return kept, true
}

// shouldDropEmptyBase64InputImagePart reports whether part is a JSON object
// whose "type" (whitespace-trimmed) is "input_image" and whose string
// "image_url" is a base64 data URI with an empty payload. Non-objects and
// parts whose fields are missing or not strings are never dropped.
func shouldDropEmptyBase64InputImagePart(part any) bool {
	fields, isObject := part.(map[string]any)
	if !isObject {
		return false
	}
	if kind, _ := fields["type"].(string); strings.TrimSpace(kind) != "input_image" {
		return false
	}
	// A non-string image_url becomes "" here, which is not a data URI.
	url, _ := fields["image_url"].(string)
	return isEmptyBase64DataURI(url)
}

// isEmptyBase64DataURI reports whether raw is a base64 data URI that carries
// no data, e.g. "data:image/png;base64," (optionally followed by
// whitespace).
//
// Per RFC 2397 a data URI has the form
//
//	data:[<mediatype>][;base64],<data>
//
// where <mediatype> may itself contain ";attribute=value" parameters. The
// header is therefore everything before the first comma, and the URI is
// base64-encoded when that header ends with ";base64". This also recognizes
// URIs such as "data:image/png;charset=utf-8;base64," whose media type
// carries parameters.
//
// Strings that do not start with "data:", have no comma, or are not marked
// as base64 yield false, as does any URI with a non-blank payload.
func isEmptyBase64DataURI(raw string) bool {
	rest, ok := strings.CutPrefix(raw, "data:")
	if !ok {
		return false
	}
	header, payload, ok := strings.Cut(rest, ",")
	if !ok {
		return false
	}
	if !strings.HasSuffix(header, ";base64") {
		return false
	}
	return strings.TrimSpace(payload) == ""
}

// getOpenAIRequestBodyMap returns the request body decoded as a generic JSON
// object, reusing a previously parsed copy when one is available.
//
// If c is non-nil and holds a non-nil map[string]any under
// OpenAIParsedRequestBodyKey, that map is returned and body is not parsed.
// Otherwise body is unmarshaled, the result is stored on c (when c is
// non-nil) for later callers, and then returned. A parse failure is
// returned wrapped, with a nil map. Note that a body consisting of JSON
// null decodes without error into a nil map.
func getOpenAIRequestBodyMap(c *gin.Context, body []byte) (map[string]any, error) {
	if c != nil {
		// A missing key yields a nil value, which fails the assertion below.
		cached, _ := c.Get(OpenAIParsedRequestBodyKey)
		if parsed, isMap := cached.(map[string]any); isMap && parsed != nil {
			return parsed, nil
		}
	}

	var parsed map[string]any
	err := json.Unmarshal(body, &parsed)
	if err != nil {
		return nil, fmt.Errorf("parse request: %w", err)
	}
	if c != nil {
		c.Set(OpenAIParsedRequestBodyKey, parsed)
	}
	return parsed, nil
}

// extractOpenAIReasoningEffort determines the reasoning effort for a
// request. A value present in the request body takes precedence — even when
// it is empty, in which case nil is returned without consulting the model.
// Only when the body carries no value is the effort derived from
// requestedModel. An empty result from either source maps to nil.
func extractOpenAIReasoningEffort(reqBody map[string]any, requestedModel string) *string {
	effort, fromBody := getOpenAIReasoningEffortFromReqBody(reqBody)
	if !fromBody {
		effort = deriveOpenAIReasoningEffortFromModel(requestedModel)
	}
	if effort == "" {
		return nil
	}
	return &effort
}

// normalizeOpenAIReasoningEffort maps a free-form reasoning effort string to
// one of the stored levels "low", "medium", "high" or "xhigh".
//
// Matching ignores case, surrounding whitespace, and any '-', '_' or ' '
// separators, so "X-High", "x_high" and "extra high" all become "xhigh".
// "none", "minimal", blank input and every unrecognized value yield "".
func normalizeOpenAIReasoningEffort(raw string) string {
	lowered := strings.ToLower(strings.TrimSpace(raw))
	if lowered == "" {
		return ""
	}

	// Drop separator characters so that spelling variants collapse to a
	// single key.
	key := strings.Map(func(r rune) rune {
		if r == '-' || r == '_' || r == ' ' {
			return -1
		}
		return r
	}, lowered)

	switch key {
	case "xhigh", "extrahigh":
		return "xhigh"
	case "low", "medium", "high":
		return key
	}
	// "none", "minimal" and anything unknown are intentionally not stored.
	return ""
}
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+								package service
 								import (
 									"bufio"
 									"bytes"
 									"context"
 									"crypto/sha256"
 									"encoding/hex"
 									"encoding/json"
 									"errors"
 									"fmt"
 									"io"
-												fix: resolve 5 audit findings in channel/credits/scheduling

P0-1: Credits degraded response retry + fail-open
- Add isAntigravityDegradedResponse() to detect transient API failures
- Retry up to 3 times with exponential backoff (500ms/1s/2s)
- Invalidate singleflight cache between retries
- Fail-open after exhausting retries instead of 5h circuit break

P1-1: Fix channel restriction pre-check timing conflict
- Swap checkClaudeCodeRestriction before checkChannelPricingRestriction
- Ensures channel restriction is checked against final fallback groupID

P1-2: Add interval pricing validation (frontend + backend)
- Backend: ValidateIntervals() with boundary, price, overlap checks
- Frontend: validateIntervals() with Chinese error messages
- Rules: MinTokens>=0, MaxTokens>MinTokens, prices>=0, no overlap

P2: Fix cross-platform same-model pricing/mapping override
- Store cache keys using original platform instead of group platform
- Lookup across matching platforms (antigravity→anthropic→gemini)
- Prevents anthropic/gemini same-name models from overwriting each other

											
										
										
											2026-04-02 20:28:04 +08:00
+									"log/slog"
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+									"math/rand"
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									"net/http"
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+									"sort"
-												feat: OpenAI OAuth账号显示Codex使用量

从响应头提取x-codex-*使用量信息并保存到账号Extra字段，
前端账号列表展示5h/7d窗口的使用进度条。

											
										
										
											2025-12-23 16:26:07 +08:00
+									"strconv"
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									"strings"
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+									"sync"
-												fix(流式): 以上游读取判定超时并调大事件缓冲

- 以读取时间戳判定流式间隔超时，避免下游阻塞误判
- antigravity 流式读取使用 MaxLineSize 配置
- 事件通道缓冲提升到 16

测试: go test ./...

											
										
										
											2026-01-04 20:19:07 +08:00
+									"sync/atomic"
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									"time"
-												refactor: 重命名 go module

											
										
										
											2025-12-24 21:07:21 +08:00
+									"github.com/Wei-Shaw/sub2api/internal/config"
-												fix: 非流式路径在上游终态事件output为空时从delta事件重建响应内容

上游API近期更新后，response.completed终态SSE事件的output字段可能为空，
实际内容仅通过response.output_text.delta等增量事件下发。流式路径不受影响，
但chat_completions非流式路径和responses OAuth非流式路径只依赖终态事件的
output，导致返回空响应。

新增BufferedResponseAccumulator累积器，在SSE扫描过程中收集delta事件内容
（文本、function_call、reasoning），当终态output为空时补充重建。

同时修复handleChatBufferedStreamingResponse遗漏response.done事件类型的问题。

											
										
										
											2026-04-07 19:30:45 +08:00
+									"github.com/Wei-Shaw/sub2api/internal/pkg/apicompat"
-												chore(logging): 完成后端日志审计与结构化迁移

- 将高密度服务与处理器日志迁移到新日志系统（LegacyPrintf/结构化日志）
- 增加 stdlog bridge 与兼容测试，保留旧日志捕获能力
- 将 OpenAI 断流告警改为结构化 Warn 并改造对应测试为 sink 捕获
- 补齐后端相关文件 logger 引用并通过全量 go test

											
										
										
											2026-02-12 19:01:09 +08:00
+									"github.com/Wei-Shaw/sub2api/internal/pkg/logger"
-												Make Codex CLI passthrough

											
										
										
											2026-01-10 03:12:56 +08:00
+									"github.com/Wei-Shaw/sub2api/internal/pkg/openai"
-												feat(安全): 强化安全策略与配置校验

- 增加 CORS/CSP/安全响应头与代理信任配置

- 引入 URL 白名单与私网开关，校验上游与价格源

- 改善 API Key 处理与网关错误返回

- 管理端设置隐藏敏感字段并优化前端提示

- 增加计费熔断与相关配置示例

测试: go test ./...

											
										
										
											2026-01-02 17:40:57 +08:00
+									"github.com/Wei-Shaw/sub2api/internal/util/responseheaders"
 									"github.com/Wei-Shaw/sub2api/internal/util/urlvalidator"
-												fix(gateway): 防止 OpenAI Codex 跨用户串流

根因：多个用户共享同一 OAuth 账号时，conversation_id/session_id 头
未做用户隔离，导致上游 chatgpt.com 将不同用户的请求关联到同一会话。

HTTP SSE 修复:
- 新增 isolateOpenAISessionID(apiKeyID, raw)，将 API Key ID 混入
  session 标识符（xxhash），确保不同 Key 的用户产生不同上游会话
- buildUpstreamRequest: OAuth 分支先 Del 客户端透传的 session 头，
  再用隔离值覆盖
- buildUpstreamRequestOpenAIPassthrough: 透传路径同样隔离
- ForwardAsAnthropic: Anthropic Messages 兼容路径同步修复
- buildOpenAIWSHeaders: WS 路径的 OAuth session 头同步隔离

											
										
										
											2026-03-16 10:28:11 +08:00
+									"github.com/cespare/xxhash/v2"
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									"github.com/gin-gonic/gin"
-												fix(openai): support remote compact task

											
										
										
											2026-03-06 18:50:28 +08:00
+									"github.com/google/uuid"
-												perf(service): 优化 model 替换函数，用 gjson/sjson 替代全量 JSON 序列化

SSE 热路径中 replaceModelInSSELine 和 replaceModelInResponseBody 原来
使用 json.Unmarshal/Marshal 对每个事件做全量反序列化再序列化，现改为
gjson.Get/sjson.Set 精确字段操作，消除 O(n) 中间 map 分配，保持 JSON
字段顺序不变。涉及 OpenAIGatewayService 和 GatewayService 两个服务。

新增 23 个单元测试覆盖：顶层/嵌套 model 替换、不匹配跳过、空行/[DONE]/
非法 JSON 等边界情况。

Fixes: P1-08

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-07 17:09:55 +08:00
+									"github.com/tidwall/gjson"
 									"github.com/tidwall/sjson"
-												chore(logging): 完成后端日志审计与结构化迁移

- 将高密度服务与处理器日志迁移到新日志系统（LegacyPrintf/结构化日志）
- 增加 stdlog bridge 与兼容测试，保留旧日志捕获能力
- 将 OpenAI 断流告警改为结构化 Warn 并改造对应测试为 sink 捕获
- 补齐后端相关文件 logger 引用并通过全量 go test

											
										
										
											2026-02-12 19:01:09 +08:00
+									"go.uber.org/zap"
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+								)
 								const (
 									// ChatGPT internal API for OAuth accounts
 									chatgptCodexURL = "https://chatgpt.com/backend-api/codex/responses"
 									// OpenAI Platform API for API Key accounts (fallback)
 									openaiPlatformAPIURL   = "https://api.openai.com/v1/responses"
 									openaiStickySessionTTL = time.Hour // 粘性会话TTL
-												fix(openai): bump codex CLI version from 0.104.0 to 0.125.0

The hardcoded codex CLI version (0.104.0) causes upstream rejection
when using gpt-5.5 with compact, as the server treats the request
as an outdated client and returns 400/502.

Update codexCLIVersion, codexCLIUserAgent, and openAICodexProbeVersion
to 0.125.0 to match the current Codex CLI release.

Fixes #1933, #1887, #1865
Related: #1609, #1298, #849

											
										
										
											2026-04-25 05:26:33 +00:00
+									codexCLIUserAgent      = "codex_cli_rs/0.125.0"
-												fix(ops): 修复日志级别过滤并增强OpenAI错误诊断日志

- 移除 warn 级别下 access info 的强制入库补写，确保运行时日志级别真实生效

- 将 OpenAI fallback matched 与 passthrough 断流提示按需求降级为 info

- 为 codex_cli_only 与 instructions required 场景补充请求诊断字段（含 User-Agent）

- 出于安全考虑移除请求体预览，仅保留 request_body_size 与白名单头信息

- 新增/更新回归测试，覆盖 Forward 入口到日志落库链路

											
										
										
											2026-02-13 19:27:07 +08:00
+									// codex_cli_only 拒绝时单个请求头日志长度上限（字符）
 									codexCLIOnlyHeaderValueMaxBytes = 256
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
-												feat(openai): 极致优化 OAuth 链路并补齐性能守护

- 优化 /v1/responses 热路径，减少重复解析与不必要拷贝\n- 优化并发与 token 竞争路径并补齐运行指标\n- 补充 OpenAI/Ops 相关单元测试与回归用例\n- 新增灰度阈值守护与压测脚本，支撑发布验收

											
										
										
											2026-02-12 09:41:37 +08:00
+									// OpenAIParsedRequestBodyKey 缓存 handler 侧已解析的请求体，避免重复解析。
 									OpenAIParsedRequestBodyKey = "openai_parsed_request_body"
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+									// OpenAI WS Mode 失败后的重连次数上限（不含首次尝试）。
 									// 与 Codex 客户端保持一致：失败后最多重连 5 次。
 									openAIWSReconnectRetryLimit = 5
 									// OpenAI WS Mode 重连退避默认值（可由配置覆盖）。
 									openAIWSRetryBackoffInitialDefault = 120 * time.Millisecond
 									openAIWSRetryBackoffMaxDefault     = 2 * time.Second
 									openAIWSRetryJitterRatioDefault    = 0.2
-												fix(openai): support remote compact task

											
										
										
											2026-03-06 18:50:28 +08:00
+									openAICompactSessionSeedKey        = "openai_compact_session_seed"
-												fix(openai): bump codex CLI version from 0.104.0 to 0.125.0

The hardcoded codex CLI version (0.104.0) causes upstream rejection
when using gpt-5.5 with compact, as the server treats the request
as an outdated client and returns 400/502.

Update codexCLIVersion, codexCLIUserAgent, and openAICodexProbeVersion
to 0.125.0 to match the current Codex CLI release.

Fixes #1933, #1887, #1865
Related: #1609, #1298, #849

											
										
										
											2026-04-25 05:26:33 +00:00
+									codexCLIVersion                    = "0.125.0"
-												Reduce DB write amplification on quota and account extra updates

											
										
										
											2026-03-11 13:53:19 +08:00
+									// Codex 限额快照仅用于后台展示/诊断，不需要每个成功请求都立即落库。
 									openAICodexSnapshotPersistMinInterval = 30 * time.Second
-												feat(openai): 极致优化 OAuth 链路并补齐性能守护

- 优化 /v1/responses 热路径，减少重复解析与不必要拷贝\n- 优化并发与 token 竞争路径并补齐运行指标\n- 补充 OpenAI/Ops 相关单元测试与回归用例\n- 新增灰度阈值守护与压测脚本，支撑发布验收

											
										
										
											2026-02-12 09:41:37 +08:00
+								)
-												fix(sse): 修复非标准 SSE 格式解析问题

部分上游 API 返回的 SSE 格式不符合标准规范：
- 标准格式: `data: {...}`（冒号后有空格）
- 非标准格式: `data:{...}`（冒号后无空格）

使用预编译正则 `^data:\s*` 统一处理两种格式。

											
										
										
											2025-12-26 03:49:55 -08:00
-												fix(openai): 收敛自动透传请求头并增强 OAuth 安全兜底

											
										
										
											2026-02-12 20:12:15 +08:00
+								// OpenAI allowed headers whitelist (for non-passthrough).
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+								var openaiAllowedHeaders = map[string]bool{
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+									"accept-language":       true,
 									"content-type":          true,
 									"conversation_id":       true,
 									"user-agent":            true,
 									"originator":            true,
 									"session_id":            true,
 									"x-codex-turn-state":    true,
 									"x-codex-turn-metadata": true,
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+								}
-												fix(openai): 收敛自动透传请求头并增强 OAuth 安全兜底

											
										
										
											2026-02-12 20:12:15 +08:00
+								// OpenAI passthrough allowed headers whitelist.
 								// 透传模式下仅放行这些低风险请求头，避免将非标准/环境噪声头传给上游触发风控。
 								var openaiPassthroughAllowedHeaders = map[string]bool{
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+									"accept":                true,
 									"accept-language":       true,
 									"content-type":          true,
 									"conversation_id":       true,
 									"openai-beta":           true,
 									"user-agent":            true,
 									"originator":            true,
 									"session_id":            true,
 									"x-codex-turn-state":    true,
 									"x-codex-turn-metadata": true,
-												fix(openai): 收敛自动透传请求头并增强 OAuth 安全兜底

											
										
										
											2026-02-12 20:12:15 +08:00
+								}
-												fix(ops): 修复日志级别过滤并增强OpenAI错误诊断日志

- 移除 warn 级别下 access info 的强制入库补写，确保运行时日志级别真实生效

- 将 OpenAI fallback matched 与 passthrough 断流提示按需求降级为 info

- 为 codex_cli_only 与 instructions required 场景补充请求诊断字段（含 User-Agent）

- 出于安全考虑移除请求体预览，仅保留 request_body_size 与白名单头信息

- 新增/更新回归测试，覆盖 Forward 入口到日志落库链路

											
										
										
											2026-02-13 19:27:07 +08:00
+								// codex_cli_only 拒绝时记录的请求头白名单（仅用于诊断日志，不参与上游透传）
 								var codexCLIOnlyDebugHeaderWhitelist = []string{
 									"User-Agent",
 									"Content-Type",
 									"Accept",
 									"Accept-Language",
 									"OpenAI-Beta",
 									"Originator",
 									"Session_ID",
 									"Conversation_ID",
 									"X-Request-ID",
 									"X-Client-Request-ID",
 									"X-Forwarded-For",
 									"X-Real-IP",
 								}
-												feat: OpenAI OAuth账号显示Codex使用量

从响应头提取x-codex-*使用量信息并保存到账号Extra字段，
前端账号列表展示5h/7d窗口的使用进度条。

											
										
										
											2025-12-23 16:26:07 +08:00
+								// OpenAICodexUsageSnapshot represents Codex API usage limits from response headers
 								type OpenAICodexUsageSnapshot struct {
 									PrimaryUsedPercent          *float64 `json:"primary_used_percent,omitempty"`
 									PrimaryResetAfterSeconds    *int     `json:"primary_reset_after_seconds,omitempty"`
 									PrimaryWindowMinutes        *int     `json:"primary_window_minutes,omitempty"`
 									SecondaryUsedPercent        *float64 `json:"secondary_used_percent,omitempty"`
 									SecondaryResetAfterSeconds  *int     `json:"secondary_reset_after_seconds,omitempty"`
 									SecondaryWindowMinutes      *int     `json:"secondary_window_minutes,omitempty"`
 									PrimaryOverSecondaryPercent *float64 `json:"primary_over_secondary_percent,omitempty"`
 									UpdatedAt                   string   `json:"updated_at,omitempty"`
 								}
-												fix(ratelimit): 修复 OpenAI 账号限流倒计时计算错误

- 解析 x-codex-* 响应头获取正确的重置时间
- 7d 限制用尽时使用 codex_7d_reset_after_seconds
- 提取 Normalize() 方法统一窗口规范化逻辑

											
										
										
											2026-01-25 13:32:08 +08:00
+								// NormalizedCodexLimits contains normalized 5h/7d rate limit data
 								type NormalizedCodexLimits struct {
 									Used5hPercent   *float64
 									Reset5hSeconds  *int
 									Window5hMinutes *int
 									Used7dPercent   *float64
 									Reset7dSeconds  *int
 									Window7dMinutes *int
 								}
 								// Normalize maps the snapshot's primary/secondary fields onto canonical
 								// 5h/7d fields and returns nil for a nil snapshot.
 								//
 								// Which side is the 5h window is decided from the window_minutes values:
 								//   - both present: the primary is 5h only if strictly smaller than the secondary;
 								//   - only primary present: the primary is 5h when it is <= 360 minutes;
 								//   - only secondary present: the primary is 5h when the secondary is > 360 minutes;
 								//   - neither present: legacy assumption, primary is 7d and secondary is 5h.
 								func (s *OpenAICodexUsageSnapshot) Normalize() *NormalizedCodexLimits {
 									if s == nil {
 										return nil
 									}
 									var primaryIs5h bool
 									switch {
 									case s.PrimaryWindowMinutes != nil && s.SecondaryWindowMinutes != nil:
 										primaryIs5h = *s.PrimaryWindowMinutes < *s.SecondaryWindowMinutes
 									case s.PrimaryWindowMinutes != nil:
 										primaryIs5h = *s.PrimaryWindowMinutes <= 360
 									case s.SecondaryWindowMinutes != nil:
 										primaryIs5h = *s.SecondaryWindowMinutes > 360
 									default:
 										primaryIs5h = false
 									}
 									if primaryIs5h {
 										return &NormalizedCodexLimits{
 											Used5hPercent:   s.PrimaryUsedPercent,
 											Reset5hSeconds:  s.PrimaryResetAfterSeconds,
 											Window5hMinutes: s.PrimaryWindowMinutes,
 											Used7dPercent:   s.SecondaryUsedPercent,
 											Reset7dSeconds:  s.SecondaryResetAfterSeconds,
 											Window7dMinutes: s.SecondaryWindowMinutes,
 										}
 									}
 									return &NormalizedCodexLimits{
 										Used5hPercent:   s.SecondaryUsedPercent,
 										Reset5hSeconds:  s.SecondaryResetAfterSeconds,
 										Window5hMinutes: s.SecondaryWindowMinutes,
 										Used7dPercent:   s.PrimaryUsedPercent,
 										Reset7dSeconds:  s.PrimaryResetAfterSeconds,
 										Window7dMinutes: s.PrimaryWindowMinutes,
 									}
 								}
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+								// OpenAIUsage represents OpenAI API response usage
 								type OpenAIUsage struct {
 									InputTokens              int `json:"input_tokens"`
 									OutputTokens             int `json:"output_tokens"`
 									CacheCreationInputTokens int `json:"cache_creation_input_tokens,omitempty"`
 									CacheReadInputTokens     int `json:"cache_read_input_tokens,omitempty"`
-												feat: image output token billing, channel-mapped billing source, credits balance precheck

- Parse candidatesTokensDetails from Gemini API to separate image/text output tokens
- Add image_output_tokens and image_output_cost to usage_log (migration 089)
- Support per-image-token pricing via output_cost_per_image_token from model pricing data
- Channel pricing ImageOutputPrice override works in token billing mode
- Auto-fill image_output_price in channel pricing form from model defaults
- Add "channel_mapped" billing model source as new default (migration 088)
- Bills by model name after channel mapping, before account mapping
- Fix channel cache error TTL sign error (115s → 5s)
- Fix Update channel only invalidating new groups, not removed groups
- Fix frontend model_mapping clearing sending undefined instead of {}
- Credits balance precheck via shared AccountUsageService cache before injection
- Skip credits injection for accounts with insufficient balance
- Don't mark credits exhausted for "exhausted your capacity on this model" 429s

											
										
										
											2026-04-01 15:08:57 +08:00
+									ImageOutputTokens        int `json:"image_output_tokens,omitempty"`
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+								}
 								// OpenAIForwardResult represents the result of forwarding
 								type OpenAIForwardResult struct {
-												feat(usage): add reasoning effort column

											
										
										
											2026-02-03 14:36:29 +08:00
+									RequestID string
 									Usage     OpenAIUsage
-												feat: /v1/messages端点适配codex账号池

											
										
										
											2026-03-06 22:39:33 +08:00
+									Model     string // 原始模型（用于响应和日志显示）
 									// BillingModel is the model used for cost calculation.
 									// When non-empty, CalculateCost uses this instead of Model.
 									// This is set by the Anthropic Messages conversion path where
 									// the mapped upstream model differs from the client-facing model.
 									BillingModel string
-												feat(service): record upstream model across all gateway paths

Propagate UpstreamModel through ForwardResult and OpenAIForwardResult in Anthropic direct, API-key passthrough, Bedrock, and OpenAI gateway flows. Extract optionalNonEqualStringPtr and optionalTrimmedStringPtr into usage_log_helpers.go. Store upstream_model only when it differs from the requested model.

Also introduces anthropicPassthroughForwardInput struct to reduce parameter count.

											
										
										
											2026-03-17 19:25:35 +08:00
+									// UpstreamModel is the actual model sent to the upstream provider after mapping.
 									// Empty when no mapping was applied (requested model was used as-is).
 									UpstreamModel string
-												fix(billing): 修复 OpenAI fast 档位计费并补齐展示

- 打通 service_tier 在 OpenAI HTTP、WS、passthrough 与 usage 记录中的传递
- 修正 priority/flex 计费逻辑，并将 fast 归一化为 priority
- 在用户端和管理端补齐服务档位与计费明细展示
- 补齐前后端测试，并修复 WS 限流信号重复持久化导致的全量回归失败

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-03-08 23:22:28 +08:00
+									// ServiceTier records the OpenAI Responses API service tier, e.g. "priority" / "flex".
 									// Nil means the request did not specify a recognized tier.
 									ServiceTier *string
-												feat(usage): add reasoning effort column

											
										
										
											2026-02-03 14:36:29 +08:00
+									// ReasoningEffort is extracted from request body (reasoning.effort) or derived from model suffix.
 									// Stored for usage records display; nil means not provided / not applicable.
 									ReasoningEffort *string
 									Stream          bool
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+									OpenAIWSMode    bool
-												fix(openai): restore ws usage window display

											
										
										
											2026-03-06 20:46:10 +08:00
+									ResponseHeaders http.Header
-												feat(usage): add reasoning effort column

											
										
										
											2026-02-03 14:36:29 +08:00
+									Duration        time.Duration
 									FirstTokenMs    *int
-												feat(openai): 同步生图 API 支持并接入图片计费调度

- 同步 OpenAI 图片生成与编辑接口
- 接入图片请求解析、账号调度、转发与用量记录
- 接入图片计费与图片用量落库
- 限制 OAuth 生图仅支持无显式模型和尺寸的基础请求

											
										
										
											2026-04-22 12:30:08 +08:00
+									ImageCount      int
 									ImageSize       string
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+								}
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+								type OpenAIWSRetryMetricsSnapshot struct {
 									RetryAttemptsTotal            int64 `json:"retry_attempts_total"`
 									RetryBackoffMsTotal           int64 `json:"retry_backoff_ms_total"`
 									RetryExhaustedTotal           int64 `json:"retry_exhausted_total"`
 									NonRetryableFastFallbackTotal int64 `json:"non_retryable_fast_fallback_total"`
 								}
 								// OpenAICompatibilityFallbackMetricsSnapshot is the JSON-serializable view of
 								// the legacy-compatibility fallback counters. It carries the session-hash
 								// legacy read / dual-write totals, a legacy read hit rate, and one counter per
 								// metadata legacy fallback key plus a final total.
 								type OpenAICompatibilityFallbackMetricsSnapshot struct {
 									// Session-hash legacy path: read fallbacks, read hits, dual writes, hit rate.
 									SessionHashLegacyReadFallbackTotal int64   `json:"session_hash_legacy_read_fallback_total"`
 									SessionHashLegacyReadFallbackHit   int64   `json:"session_hash_legacy_read_fallback_hit"`
 									SessionHashLegacyDualWriteTotal    int64   `json:"session_hash_legacy_dual_write_total"`
 									SessionHashLegacyReadHitRate       float64 `json:"session_hash_legacy_read_hit_rate"`
 									// Metadata legacy fallbacks, one counter per metadata key.
 									MetadataLegacyFallbackIsMaxTokensOneHaikuTotal int64 `json:"metadata_legacy_fallback_is_max_tokens_one_haiku_total"`
 									MetadataLegacyFallbackThinkingEnabledTotal     int64 `json:"metadata_legacy_fallback_thinking_enabled_total"`
 									MetadataLegacyFallbackPrefetchedStickyAccount  int64 `json:"metadata_legacy_fallback_prefetched_sticky_account_total"`
 									MetadataLegacyFallbackPrefetchedStickyGroup    int64 `json:"metadata_legacy_fallback_prefetched_sticky_group_total"`
 									MetadataLegacyFallbackSingleAccountRetryTotal  int64 `json:"metadata_legacy_fallback_single_account_retry_total"`
 									MetadataLegacyFallbackAccountSwitchCountTotal  int64 `json:"metadata_legacy_fallback_account_switch_count_total"`
 									// NOTE(review): presumably the sum of the per-key counters above — confirm.
 									MetadataLegacyFallbackTotal int64 `json:"metadata_legacy_fallback_total"`
 								}
 								// openAIWSRetryMetrics groups the OpenAI WS retry counters. Each field is an
 								// atomic.Int64, so counters can be updated without an additional lock; the
 								// zero value is ready to use. Because it holds atomics it should not be copied.
 								type openAIWSRetryMetrics struct {
 									// retryAttempts: number of retry attempts.
 									retryAttempts atomic.Int64
 									// retryBackoffMs: accumulated backoff, in milliseconds per the field name.
 									retryBackoffMs atomic.Int64
 									// retryExhausted: number of times retries were exhausted.
 									retryExhausted atomic.Int64
 									// nonRetryableFastFallback: number of non-retryable fast fallbacks.
 									nonRetryableFastFallback atomic.Int64
 								}
-												Reduce DB write amplification on quota and account extra updates

											
										
										
											2026-03-11 13:53:19 +08:00
+								type accountWriteThrottle struct {
 									minInterval time.Duration
 									mu          sync.Mutex
 									lastByID    map[int64]time.Time
 								}
 								// newAccountWriteThrottle builds a throttle that allows at most one write per
 								// account ID every minInterval. The per-ID timestamp map is allocated up front
 								// so the returned value is immediately usable.
 								func newAccountWriteThrottle(minInterval time.Duration) *accountWriteThrottle {
 									throttle := new(accountWriteThrottle)
 									throttle.minInterval = minInterval
 									throttle.lastByID = map[int64]time.Time{}
 									return throttle
 								}
 								// Allow reports whether a write for account id may proceed at time now, and
 								// records now as the last write time when it does.
 								//
 								// It always returns true (and records nothing) for a nil receiver, a
 								// non-positive id, or a non-positive minInterval. Otherwise it returns false
 								// when the previous allowed write for id is less than minInterval before now.
 								func (t *accountWriteThrottle) Allow(id int64, now time.Time) bool {
 									if t == nil {
 										return true
 									}
 									if id <= 0 || t.minInterval <= 0 {
 										return true
 									}

 									t.mu.Lock()
 									defer t.mu.Unlock()

 									previous, seen := t.lastByID[id]
 									if seen && now.Sub(previous) < t.minInterval {
 										return false
 									}
 									t.lastByID[id] = now

 									// Only sweep once the map has grown past 4096 entries.
 									if len(t.lastByID) <= 4096 {
 										return true
 									}
 									// Drop entries strictly older than four intervals; an entry exactly at
 									// the cutoff is kept.
 									expiry := now.Add(-4 * t.minInterval)
 									for key, stamp := range t.lastByID {
 										if !stamp.Before(expiry) {
 											continue
 										}
 										delete(t.lastByID, key)
 									}
 									return true
 								}
 								// defaultOpenAICodexSnapshotPersistThrottle is a package-level throttle created
 								// with openAICodexSnapshotPersistMinInterval as its per-account minimum interval.
 								// NOTE(review): presumably a fallback for services built without their own
 								// codexSnapshotThrottle — call sites are not visible here, confirm.
 								var defaultOpenAICodexSnapshotPersistThrottle = newAccountWriteThrottle(openAICodexSnapshotPersistMinInterval)
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+								// ErrNoAvailableCompactAccounts indicates the request needs /responses/compact
 								// support but no compatible account is available.
 								var ErrNoAvailableCompactAccounts = errors.New("no available OpenAI accounts support /responses/compact")
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+								// OpenAIGatewayService handles OpenAI API gateway operations
 								type OpenAIGatewayService struct {
-												fix(openai): 统一专属倍率计费链路并补齐回归测试

抽取共享的用户分组专属倍率解析器，统一缓存、singleflight 与回退逻辑。\n\n让 OpenAI 独立计费链路复用专属倍率解析，修复 usage 记录与实际扣费未命中用户专属倍率的问题。\n\n补齐 OpenAI 计费与解析器单元测试，并修复全量回归中暴露的 lint 阻塞项。\n\nCo-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-03-06 14:54:52 +08:00
+									accountRepo           AccountRepository
 									usageLogRepo          UsageLogRepository
-												feat: decouple billing correctness from usage log batching

											
										
										
											2026-03-12 16:53:18 +08:00
+									usageBillingRepo      UsageBillingRepository
-												fix(openai): 统一专属倍率计费链路并补齐回归测试

抽取共享的用户分组专属倍率解析器，统一缓存、singleflight 与回退逻辑。\n\n让 OpenAI 独立计费链路复用专属倍率解析，修复 usage 记录与实际扣费未命中用户专属倍率的问题。\n\n补齐 OpenAI 计费与解析器单元测试，并修复全量回归中暴露的 lint 阻塞项。\n\nCo-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-03-06 14:54:52 +08:00
+									userRepo              UserRepository
 									userSubRepo           UserSubscriptionRepository
 									cache                 GatewayCache
 									cfg                   *config.Config
 									codexDetector         CodexClientRestrictionDetector
 									schedulerSnapshot     *SchedulerSnapshotService
 									concurrencyService    *ConcurrencyService
 									billingService        *BillingService
 									rateLimitService      *RateLimitService
 									billingCacheService   *BillingCacheService
 									userGroupRateResolver *userGroupRateResolver
 									httpUpstream          HTTPUpstream
 									deferredService       *DeferredService
 									openAITokenProvider   *OpenAITokenProvider
 									toolCorrector         *CodexToolCorrector
 									openaiWSResolver      OpenAIWSProtocolResolver
-												feat(billing): 网关计费迁移到 CalculateCostUnified + 模型限制错误统一

- GatewayService/OpenAIGatewayService 注入 ModelPricingResolver
- RecordUsage 从旧路径迁移到 CalculateCostUnified（支持 per_request/image 模式）
- 无渠道时自动回退旧路径，保持原有行为
- 长上下文双倍计费仅在无渠道定价时生效
- CostBreakdown 新增 BillingMode 字段，使用日志记录实际计费模式
- 模型限制错误改为与"无可用账号"相同的 503 响应

											
										
										
											2026-03-30 22:58:28 +08:00
+									resolver              *ModelPricingResolver
-												feat(channel): 通配符定价匹配 + OpenAI BillingModelSource + 按次价格校验 + 用户端计费模式展示

- 定价查找支持通配符(suffix *)，最长前缀优先匹配
- 模型限制(restrict_models)同样支持通配符匹配
- OpenAI 网关接入渠道映射/BillingModelSource/模型限制
- 按次/图片计费模式创建时强制要求价格或层级(前后端)
- 用户使用记录列表增加计费模式 badge 列

											
										
										
											2026-03-31 00:23:45 +08:00
+									channelService        *ChannelService
-												feat(notify): add balance low & account quota notification system

- User balance low notification: email alert when balance drops below
  configurable threshold (user email + verified extra emails)
- Account quota notification: broadcast email to admin-configured
  recipients when daily/weekly/total quota usage exceeds alert threshold
- Admin settings: global enable/disable, default threshold, quota
  notification email list (Email Settings tab)
- User profile: enable/disable, custom threshold, add/remove extra
  notification emails with verification code flow
- Account quota: per-dimension alert toggle and threshold in quota
  control card
- Trigger logic: first-crossing only (old >= threshold && new < threshold
  for balance; old < threshold && new >= threshold for quota), naturally
  prevents duplicate notifications without Redis dedup

											
										
										
											2026-04-12 02:48:57 +08:00
+									balanceNotifyService  *BalanceNotifyService
-												feat(openai): OpenAI Fast/Flex Policy 完整实现（HTTP + WebSocket + Admin）

对称参照 Claude BetaPolicy 的 fast-mode 过滤实现，新增针对 OpenAI 上游
service_tier 字段（priority / flex，含客户端 "fast" → "priority" 归一化）的
pass / filter / block 三态策略，覆盖全部 OpenAI 入口 + admin 配置入口。

后端核心
- 新增 SettingKeyOpenAIFastPolicySettings、OpenAIFastPolicyRule、
  OpenAIFastPolicySettings 配置模型，含规则的 service_tier × action × scope
  × 模型白名单 × fallback action 维度。
- SettingService.Get/SetOpenAIFastPolicySettings；缺失时返回内置默认策略
  （所有模型的 priority 走 filter，whitelist 为空，fallback=pass）。设计
  依据：service_tier=fast 是用户级开关，与 model 字段正交，默认锁定特定
  model slug 会留下"用 gpt-4 + fast 透传 priority 上游"的绕过路径。JSON
  解析失败不再静默 fallback，slog.Warn 记录脏数据，便于运维定位。
- service_tier 归一化（trim + ToLower + fast→priority + 白名单 priority/flex）
  与策略评估（evaluateOpenAIFastPolicy）作为唯一真实来源，HTTP / WS 共用。
  抽出纯函数 evaluateOpenAIFastPolicyWithSettings，配合 ctx-bound settings
  快照（withOpenAIFastPolicyContext / openAIFastPolicySettingsFromContext），
  WS 长会话入口预取一次后所有帧复用，避免每帧打到 settingService。

HTTP 入口（4 个）
- Chat Completions、Anthropic 兼容（Messages，含 BetaFastMode→priority 二次
  命中）、原生 Responses、Passthrough Responses 全部接入
  applyOpenAIFastPolicyToBody，filter 走 sjson 顶层删除 service_tier，block
  返回 403 forbidden_error JSON。
- 4 入口统一使用 upstream 视角的 model（GetMappedModel +
  normalizeOpenAIModelForUpstream + Codex OAuth normalize 后的 slug），
  避免 chat/messages/native /responses/passthrough 因为 model 维度不同
  造成 whitelist 命中差异。
- 在 pass 路径也把客户端 "fast" 别名归一化为 "priority" 写回 body，
  否则 native /responses 与 passthrough 入口会把 "fast" 原样透传给上游
  导致 400/拒绝（chat-completions 入口的 normalizeResponsesBodyServiceTier
  此前已具备同等行为）。

WebSocket 入口
- 新增 applyOpenAIFastPolicyToWSResponseCreate：严格匹配
  type="response.create"，仅处理顶层 service_tier；filter 用 sjson 删字段，
  block 返回 typed *OpenAIFastBlockedError。
- ingress 路径在 parseClientPayload 内调用，block 命中先 Write Realtime
  风格 error event 再返回 OpenAIWSClientCloseError(StatusPolicyViolation
  =1008)，依赖底层 WebSocket Conn.Write 的同步 flush 保证 error 先于
  close。
- passthrough 路径在 RunEntry 前对 firstClientMessage 应用策略，并通过
  openAIWSPolicyEnforcingFrameConn 包装 ReadFrame 对每个 client→upstream
  帧执行策略；后续帧无 model 字段时回退到 capturedSessionModel。
  filter 闭包内同时侦测 session.update / session.created 帧的 session.model
  字段刷新 capturedSessionModel，封堵"首帧 model=gpt-4o（pass）→
  session.update 改为 gpt-5.5 → 不带 model 的 response.create fallback
  到 gpt-4o"的 mid-session 绕过路径。
- passthrough billing：requestServiceTier 在策略 filter 之后再从
  firstClientMessage 提取，filter 命中时 OpenAIForwardResult.ServiceTier
  上报 nil（default tier），与 HTTP 入口（reqBody 来自 post-filter map）
  / WS ingress（payload 来自 post-filter bytes）的语义一致。
- 错误事件 schema：{event_id: "evt_<32hex>", type: "error",
  error: {type: "forbidden_error", code: "policy_violation", message}}，
  与 OpenAI codex 客户端 error event 解析兼容。

Admin / Frontend
- dto.SystemSettings / UpdateSettingsRequest 新增
  openai_fast_policy_settings 字段（omitempty），bulk GET/PUT 接入。
- Settings 页 Gateway 页签新增 Fast/Flex Policy 表单卡片：
  service_tier × action × scope × 模型白名单 × fallback action 全字段配置。
- 前端守门：openaiFastPolicyLoaded 标志仅在 GET 真带回字段时才允许回写，
  避免 rollout/错误把默认规则覆盖成空；saveSettings 回写循环 skip 该字段，
  由专用刷新逻辑处理；仅 action=block 时发送 error_message，匹配后端
  omitempty 行为。

测试
- HTTP 路径：openai_fast_policy_test.go 覆盖默认配置（whitelist=[]，所有
  模型 priority filter）/ block 自定义错误 / scope 区分 / filter 删字段 /
  block 不改 body / block 短路上游 / Anthropic BetaFastMode 触发 OpenAI
  fast policy 等场景。
- WebSocket 路径：openai_fast_policy_ws_test.go 覆盖
    helper 单元（filter / fast→priority 归一化 / flex 透传 / block typed
    error / 无 service_tier 字节不变 / 非 response.create 帧不动 / 空 type
    帧不动 / event_id+code 字段断言 / 非字符串 service_tier 容错）+
    pass 路径 fast 别名归一化回归 +
    ingress 端到端（filter 后上游不含 service_tier / block 后客户端先收
    error event 再收 close 1008 且上游 0 写）+
    passthrough capturedSessionModel fallback 用例（whitelist 策略下首帧
    建立、缺 model 命中 fallback、缺少 fallback 时的 leak 文档化）+
    passthrough session.update / session.created 旋转 capturedSessionModel
    的 mid-session 绕过回归 +
    passthrough billing post-filter ServiceTier 与 idempotent filter 回归。

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>

											
										
										
											2026-04-28 00:34:23 +08:00
+									settingService        *SettingService
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
-												feat(openai-ws): 合并 WS v2 透传模式与前端 ws mode

新增 OpenAI WebSocket v2 passthrough relay 数据面与服务适配层，
支持按账号 ws mode 在 ctx_pool 与 passthrough 间路由。

同步调整前端 OpenAI ws mode 选项为 off/ctx_pool/passthrough，
并补充 i18n 文案与对应单测。

新增 Caddyfile.dmit 与 docker-compose-aicodex.yml 部署配置，
用于宿主机场景下的反向代理与服务编排。

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-03-05 11:50:58 +08:00
+									openaiWSPoolOnce              sync.Once
 									openaiWSStateStoreOnce        sync.Once
 									openaiSchedulerOnce           sync.Once
 									openaiWSPassthroughDialerOnce sync.Once
 									openaiWSPool                  *openAIWSConnPool
 									openaiWSStateStore            OpenAIWSStateStore
 									openaiScheduler               OpenAIAccountScheduler
 									openaiWSPassthroughDialer     openAIWSClientDialer
 									openaiAccountStats            *openAIAccountRuntimeStats
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
 									openaiWSFallbackUntil sync.Map // key: int64(accountID), value: time.Time
 									openaiWSRetryMetrics  openAIWSRetryMetrics
 									responseHeaderFilter  *responseheaders.CompiledHeaderFilter
-												Reduce DB write amplification on quota and account extra updates

											
										
										
											2026-03-11 13:53:19 +08:00
+									codexSnapshotThrottle *accountWriteThrottle
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+								}
 								// NewOpenAIGatewayService creates a new OpenAIGatewayService
 								func NewOpenAIGatewayService(
-												refactor: 删除 ports 目录

											
										
										
											2025-12-25 17:15:01 +08:00
+									accountRepo AccountRepository,
 									usageLogRepo UsageLogRepository,
-												feat: decouple billing correctness from usage log batching

											
										
										
											2026-03-12 16:53:18 +08:00
+									usageBillingRepo UsageBillingRepository,
-												refactor: 删除 ports 目录

											
										
										
											2025-12-25 17:15:01 +08:00
+									userRepo UserRepository,
 									userSubRepo UserSubscriptionRepository,
-												fix(openai): 统一专属倍率计费链路并补齐回归测试

抽取共享的用户分组专属倍率解析器，统一缓存、singleflight 与回退逻辑。\n\n让 OpenAI 独立计费链路复用专属倍率解析，修复 usage 记录与实际扣费未命中用户专属倍率的问题。\n\n补齐 OpenAI 计费与解析器单元测试，并修复全量回归中暴露的 lint 阻塞项。\n\nCo-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-03-06 14:54:52 +08:00
+									userGroupRateRepo UserGroupRateRepository,
-												refactor: 删除 ports 目录

											
										
										
											2025-12-25 17:15:01 +08:00
+									cache GatewayCache,
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									cfg *config.Config,
-												feat(scheduler): 引入调度快照缓存与 outbox 回放

- 调度热路径优先读 Redis 快照，保留分组排序语义
- outbox 回放 + 全量重建纠偏，失败重试不推进水位
- 自动 Atlas 基线对齐并同步调度配置示例

											
										
										
											2026-01-12 14:19:06 +08:00
+									schedulerSnapshot *SchedulerSnapshotService,
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+									concurrencyService *ConcurrencyService,
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									billingService *BillingService,
 									rateLimitService *RateLimitService,
 									billingCacheService *BillingCacheService,
-												refactor: 删除 ports 目录

											
										
										
											2025-12-25 17:15:01 +08:00
+									httpUpstream HTTPUpstream,
-												feat: Schedule batch update for account last_used_at

Implement deferred batch update mechanism to reduce database load:

- Add DeferredService for batching account last_used_at updates
- Add TimingWheelService for efficient recurring task scheduling
- Integrate with GatewayService and OpenAIGatewayService
- Implement BatchUpdateLastUsed repository method using CASE...WHEN SQL
- Fix golangci-lint error: Replace interface{} with any

Benefits:
- Reduces database writes by batching updates (10-second intervals)
- Improves request throughput by deferring non-critical updates
- Maintains accurate account usage tracking for scheduling

											
										
										
											2025-12-28 08:07:15 +08:00
+									deferredService *DeferredService,
-												feat(网关): 引入 OpenAI/Claude OAuth token 缓存

新增 OpenAI/Claude TokenProvider 与缓存键生成
扩展 OAuth 缓存失效覆盖更多平台
统一 OAuth 缓存前缀与依赖注入

											
										
										
											2026-01-15 18:27:06 +08:00
+									openAITokenProvider *OpenAITokenProvider,
-												feat(billing): 网关计费迁移到 CalculateCostUnified + 模型限制错误统一

- GatewayService/OpenAIGatewayService 注入 ModelPricingResolver
- RecordUsage 从旧路径迁移到 CalculateCostUnified（支持 per_request/image 模式）
- 无渠道时自动回退旧路径，保持原有行为
- 长上下文双倍计费仅在无渠道定价时生效
- CostBreakdown 新增 BillingMode 字段，使用日志记录实际计费模式
- 模型限制错误改为与"无可用账号"相同的 503 响应

											
										
										
											2026-03-30 22:58:28 +08:00
+									resolver *ModelPricingResolver,
-												feat(channel): 通配符定价匹配 + OpenAI BillingModelSource + 按次价格校验 + 用户端计费模式展示

- 定价查找支持通配符(suffix *)，最长前缀优先匹配
- 模型限制(restrict_models)同样支持通配符匹配
- OpenAI 网关接入渠道映射/BillingModelSource/模型限制
- 按次/图片计费模式创建时强制要求价格或层级(前后端)
- 用户使用记录列表增加计费模式 badge 列

											
										
										
											2026-03-31 00:23:45 +08:00
+									channelService *ChannelService,
-												feat(notify): add balance low & account quota notification system

- User balance low notification: email alert when balance drops below
  configurable threshold (user email + verified extra emails)
- Account quota notification: broadcast email to admin-configured
  recipients when daily/weekly/total quota usage exceeds alert threshold
- Admin settings: global enable/disable, default threshold, quota
  notification email list (Email Settings tab)
- User profile: enable/disable, custom threshold, add/remove extra
  notification emails with verification code flow
- Account quota: per-dimension alert toggle and threshold in quota
  control card
- Trigger logic: first-crossing only (old >= threshold && new < threshold
  for balance; old < threshold && new >= threshold for quota), naturally
  prevents duplicate notifications without Redis dedup

											
										
										
											2026-04-12 02:48:57 +08:00
+									balanceNotifyService *BalanceNotifyService,
-												feat(openai): OpenAI Fast/Flex Policy 完整实现（HTTP + WebSocket + Admin）

对称参照 Claude BetaPolicy 的 fast-mode 过滤实现，新增针对 OpenAI 上游
service_tier 字段（priority / flex，含客户端 "fast" → "priority" 归一化）的
pass / filter / block 三态策略，覆盖全部 OpenAI 入口 + admin 配置入口。

后端核心
- 新增 SettingKeyOpenAIFastPolicySettings、OpenAIFastPolicyRule、
  OpenAIFastPolicySettings 配置模型，含规则的 service_tier × action × scope
  × 模型白名单 × fallback action 维度。
- SettingService.Get/SetOpenAIFastPolicySettings；缺失时返回内置默认策略
  （所有模型的 priority 走 filter，whitelist 为空，fallback=pass）。设计
  依据：service_tier=fast 是用户级开关，与 model 字段正交，默认锁定特定
  model slug 会留下"用 gpt-4 + fast 透传 priority 上游"的绕过路径。JSON
  解析失败不再静默 fallback，slog.Warn 记录脏数据，便于运维定位。
- service_tier 归一化（trim + ToLower + fast→priority + 白名单 priority/flex）
  与策略评估（evaluateOpenAIFastPolicy）作为唯一真实来源，HTTP / WS 共用。
  抽出纯函数 evaluateOpenAIFastPolicyWithSettings，配合 ctx-bound settings
  快照（withOpenAIFastPolicyContext / openAIFastPolicySettingsFromContext），
  WS 长会话入口预取一次后所有帧复用，避免每帧打到 settingService。

HTTP 入口（4 个）
- Chat Completions、Anthropic 兼容（Messages，含 BetaFastMode→priority 二次
  命中）、原生 Responses、Passthrough Responses 全部接入
  applyOpenAIFastPolicyToBody，filter 走 sjson 顶层删除 service_tier，block
  返回 403 forbidden_error JSON。
- 4 入口统一使用 upstream 视角的 model（GetMappedModel +
  normalizeOpenAIModelForUpstream + Codex OAuth normalize 后的 slug），
  避免 chat/messages/native /responses/passthrough 因为 model 维度不同
  造成 whitelist 命中差异。
- 在 pass 路径也把客户端 "fast" 别名归一化为 "priority" 写回 body，
  否则 native /responses 与 passthrough 入口会把 "fast" 原样透传给上游
  导致 400/拒绝（chat-completions 入口的 normalizeResponsesBodyServiceTier
  此前已具备同等行为）。

WebSocket 入口
- 新增 applyOpenAIFastPolicyToWSResponseCreate：严格匹配
  type="response.create"，仅处理顶层 service_tier；filter 用 sjson 删字段，
  block 返回 typed *OpenAIFastBlockedError。
- ingress 路径在 parseClientPayload 内调用，block 命中先 Write Realtime
  风格 error event 再返回 OpenAIWSClientCloseError(StatusPolicyViolation
  =1008)，依赖底层 WebSocket Conn.Write 的同步 flush 保证 error 先于
  close。
- passthrough 路径在 RunEntry 前对 firstClientMessage 应用策略，并通过
  openAIWSPolicyEnforcingFrameConn 包装 ReadFrame 对每个 client→upstream
  帧执行策略；后续帧无 model 字段时回退到 capturedSessionModel。
  filter 闭包内同时侦测 session.update / session.created 帧的 session.model
  字段刷新 capturedSessionModel，封堵"首帧 model=gpt-4o（pass）→
  session.update 改为 gpt-5.5 → 不带 model 的 response.create fallback
  到 gpt-4o"的 mid-session 绕过路径。
- passthrough billing：requestServiceTier 在策略 filter 之后再从
  firstClientMessage 提取，filter 命中时 OpenAIForwardResult.ServiceTier
  上报 nil（default tier），与 HTTP 入口（reqBody 来自 post-filter map）
  / WS ingress（payload 来自 post-filter bytes）的语义一致。
- 错误事件 schema：{event_id: "evt_<32hex>", type: "error",
  error: {type: "forbidden_error", code: "policy_violation", message}}，
  与 OpenAI codex 客户端 error event 解析兼容。

Admin / Frontend
- dto.SystemSettings / UpdateSettingsRequest 新增
  openai_fast_policy_settings 字段（omitempty），bulk GET/PUT 接入。
- Settings 页 Gateway 页签新增 Fast/Flex Policy 表单卡片：
  service_tier × action × scope × 模型白名单 × fallback action 全字段配置。
- 前端守门：openaiFastPolicyLoaded 标志仅在 GET 真带回字段时才允许回写，
  避免 rollout/错误把默认规则覆盖成空；saveSettings 回写循环 skip 该字段，
  由专用刷新逻辑处理；仅 action=block 时发送 error_message，匹配后端
  omitempty 行为。

测试
- HTTP 路径：openai_fast_policy_test.go 覆盖默认配置（whitelist=[]，所有
  模型 priority filter）/ block 自定义错误 / scope 区分 / filter 删字段 /
  block 不改 body / block 短路上游 / Anthropic BetaFastMode 触发 OpenAI
  fast policy 等场景。
- WebSocket 路径：openai_fast_policy_ws_test.go 覆盖
    helper 单元（filter / fast→priority 归一化 / flex 透传 / block typed
    error / 无 service_tier 字节不变 / 非 response.create 帧不动 / 空 type
    帧不动 / event_id+code 字段断言 / 非字符串 service_tier 容错）+
    pass 路径 fast 别名归一化回归 +
    ingress 端到端（filter 后上游不含 service_tier / block 后客户端先收
    error event 再收 close 1008 且上游 0 写）+
    passthrough capturedSessionModel fallback 用例（whitelist 策略下首帧
    建立、缺 model 命中 fallback、缺少 fallback 时的 leak 文档化）+
    passthrough session.update / session.created 旋转 capturedSessionModel
    的 mid-session 绕过回归 +
    passthrough billing post-filter ServiceTier 与 idempotent filter 回归。

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>

											
										
										
											2026-04-28 00:34:23 +08:00
+									settingService *SettingService,
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+								) *OpenAIGatewayService {
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+									svc := &OpenAIGatewayService{
-												fix(openai): 统一专属倍率计费链路并补齐回归测试

抽取共享的用户分组专属倍率解析器，统一缓存、singleflight 与回退逻辑。\n\n让 OpenAI 独立计费链路复用专属倍率解析，修复 usage 记录与实际扣费未命中用户专属倍率的问题。\n\n补齐 OpenAI 计费与解析器单元测试，并修复全量回归中暴露的 lint 阻塞项。\n\nCo-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-03-06 14:54:52 +08:00
+										accountRepo:         accountRepo,
 										usageLogRepo:        usageLogRepo,
-												feat: decouple billing correctness from usage log batching

											
										
										
											2026-03-12 16:53:18 +08:00
+										usageBillingRepo:    usageBillingRepo,
-												fix(openai): 统一专属倍率计费链路并补齐回归测试

抽取共享的用户分组专属倍率解析器，统一缓存、singleflight 与回退逻辑。\n\n让 OpenAI 独立计费链路复用专属倍率解析，修复 usage 记录与实际扣费未命中用户专属倍率的问题。\n\n补齐 OpenAI 计费与解析器单元测试，并修复全量回归中暴露的 lint 阻塞项。\n\nCo-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-03-06 14:54:52 +08:00
+										userRepo:            userRepo,
 										userSubRepo:         userSubRepo,
 										cache:               cache,
 										cfg:                 cfg,
 										codexDetector:       NewOpenAICodexClientRestrictionDetector(cfg),
 										schedulerSnapshot:   schedulerSnapshot,
 										concurrencyService:  concurrencyService,
 										billingService:      billingService,
 										rateLimitService:    rateLimitService,
 										billingCacheService: billingCacheService,
 										userGroupRateResolver: newUserGroupRateResolver(
 											userGroupRateRepo,
 											nil,
 											resolveUserGroupRateCacheTTL(cfg),
 											nil,
 											"service.openai_gateway",
 										),
-												Reduce DB write amplification on quota and account extra updates

											
										
										
											2026-03-11 13:53:19 +08:00
+										httpUpstream:          httpUpstream,
 										deferredService:       deferredService,
 										openAITokenProvider:   openAITokenProvider,
 										toolCorrector:         NewCodexToolCorrector(),
 										openaiWSResolver:      NewOpenAIWSProtocolResolver(cfg),
-												feat(billing): 网关计费迁移到 CalculateCostUnified + 模型限制错误统一

- GatewayService/OpenAIGatewayService 注入 ModelPricingResolver
- RecordUsage 从旧路径迁移到 CalculateCostUnified（支持 per_request/image 模式）
- 无渠道时自动回退旧路径，保持原有行为
- 长上下文双倍计费仅在无渠道定价时生效
- CostBreakdown 新增 BillingMode 字段，使用日志记录实际计费模式
- 模型限制错误改为与"无可用账号"相同的 503 响应

											
										
										
											2026-03-30 22:58:28 +08:00
+										resolver:              resolver,
-												feat(channel): 通配符定价匹配 + OpenAI BillingModelSource + 按次价格校验 + 用户端计费模式展示

- 定价查找支持通配符(suffix *)，最长前缀优先匹配
- 模型限制(restrict_models)同样支持通配符匹配
- OpenAI 网关接入渠道映射/BillingModelSource/模型限制
- 按次/图片计费模式创建时强制要求价格或层级(前后端)
- 用户使用记录列表增加计费模式 badge 列

											
										
										
											2026-03-31 00:23:45 +08:00
+										channelService:        channelService,
-												feat(notify): add balance low & account quota notification system

- User balance low notification: email alert when balance drops below
  configurable threshold (user email + verified extra emails)
- Account quota notification: broadcast email to admin-configured
  recipients when daily/weekly/total quota usage exceeds alert threshold
- Admin settings: global enable/disable, default threshold, quota
  notification email list (Email Settings tab)
- User profile: enable/disable, custom threshold, add/remove extra
  notification emails with verification code flow
- Account quota: per-dimension alert toggle and threshold in quota
  control card
- Trigger logic: first-crossing only (old >= threshold && new < threshold
  for balance; old < threshold && new >= threshold for quota), naturally
  prevents duplicate notifications without Redis dedup

											
										
										
											2026-04-12 02:48:57 +08:00
+										balanceNotifyService:  balanceNotifyService,
-												feat(openai): OpenAI Fast/Flex Policy 完整实现（HTTP + WebSocket + Admin）

对称参照 Claude BetaPolicy 的 fast-mode 过滤实现，新增针对 OpenAI 上游
service_tier 字段（priority / flex，含客户端 "fast" → "priority" 归一化）的
pass / filter / block 三态策略，覆盖全部 OpenAI 入口 + admin 配置入口。

后端核心
- 新增 SettingKeyOpenAIFastPolicySettings、OpenAIFastPolicyRule、
  OpenAIFastPolicySettings 配置模型，含规则的 service_tier × action × scope
  × 模型白名单 × fallback action 维度。
- SettingService.Get/SetOpenAIFastPolicySettings；缺失时返回内置默认策略
  （所有模型的 priority 走 filter，whitelist 为空，fallback=pass）。设计
  依据：service_tier=fast 是用户级开关，与 model 字段正交，默认锁定特定
  model slug 会留下"用 gpt-4 + fast 透传 priority 上游"的绕过路径。JSON
  解析失败不再静默 fallback，slog.Warn 记录脏数据，便于运维定位。
- service_tier 归一化（trim + ToLower + fast→priority + 白名单 priority/flex）
  与策略评估（evaluateOpenAIFastPolicy）作为唯一真实来源，HTTP / WS 共用。
  抽出纯函数 evaluateOpenAIFastPolicyWithSettings，配合 ctx-bound settings
  快照（withOpenAIFastPolicyContext / openAIFastPolicySettingsFromContext），
  WS 长会话入口预取一次后所有帧复用，避免每帧打到 settingService。

HTTP 入口（4 个）
- Chat Completions、Anthropic 兼容（Messages，含 BetaFastMode→priority 二次
  命中）、原生 Responses、Passthrough Responses 全部接入
  applyOpenAIFastPolicyToBody，filter 走 sjson 顶层删除 service_tier，block
  返回 403 forbidden_error JSON。
- 4 入口统一使用 upstream 视角的 model（GetMappedModel +
  normalizeOpenAIModelForUpstream + Codex OAuth normalize 后的 slug），
  避免 chat/messages/native /responses/passthrough 因为 model 维度不同
  造成 whitelist 命中差异。
- 在 pass 路径也把客户端 "fast" 别名归一化为 "priority" 写回 body，
  否则 native /responses 与 passthrough 入口会把 "fast" 原样透传给上游
  导致 400/拒绝（chat-completions 入口的 normalizeResponsesBodyServiceTier
  此前已具备同等行为）。

WebSocket 入口
- 新增 applyOpenAIFastPolicyToWSResponseCreate：严格匹配
  type="response.create"，仅处理顶层 service_tier；filter 用 sjson 删字段，
  block 返回 typed *OpenAIFastBlockedError。
- ingress 路径在 parseClientPayload 内调用，block 命中先 Write Realtime
  风格 error event 再返回 OpenAIWSClientCloseError(StatusPolicyViolation
  =1008)，依赖底层 WebSocket Conn.Write 的同步 flush 保证 error 先于
  close。
- passthrough 路径在 RunEntry 前对 firstClientMessage 应用策略，并通过
  openAIWSPolicyEnforcingFrameConn 包装 ReadFrame 对每个 client→upstream
  帧执行策略；后续帧无 model 字段时回退到 capturedSessionModel。
  filter 闭包内同时侦测 session.update / session.created 帧的 session.model
  字段刷新 capturedSessionModel，封堵"首帧 model=gpt-4o（pass）→
  session.update 改为 gpt-5.5 → 不带 model 的 response.create fallback
  到 gpt-4o"的 mid-session 绕过路径。
- passthrough billing：requestServiceTier 在策略 filter 之后再从
  firstClientMessage 提取，filter 命中时 OpenAIForwardResult.ServiceTier
  上报 nil（default tier），与 HTTP 入口（reqBody 来自 post-filter map）
  / WS ingress（payload 来自 post-filter bytes）的语义一致。
- 错误事件 schema：{event_id: "evt_<32hex>", type: "error",
  error: {type: "forbidden_error", code: "policy_violation", message}}，
  与 OpenAI codex 客户端 error event 解析兼容。

Admin / Frontend
- dto.SystemSettings / UpdateSettingsRequest 新增
  openai_fast_policy_settings 字段（omitempty），bulk GET/PUT 接入。
- Settings 页 Gateway 页签新增 Fast/Flex Policy 表单卡片：
  service_tier × action × scope × 模型白名单 × fallback action 全字段配置。
- 前端守门：openaiFastPolicyLoaded 标志仅在 GET 真带回字段时才允许回写，
  避免 rollout/错误把默认规则覆盖成空；saveSettings 回写循环 skip 该字段，
  由专用刷新逻辑处理；仅 action=block 时发送 error_message，匹配后端
  omitempty 行为。

测试
- HTTP 路径：openai_fast_policy_test.go 覆盖默认配置（whitelist=[]，所有
  模型 priority filter）/ block 自定义错误 / scope 区分 / filter 删字段 /
  block 不改 body / block 短路上游 / Anthropic BetaFastMode 触发 OpenAI
  fast policy 等场景。
- WebSocket 路径：openai_fast_policy_ws_test.go 覆盖
    helper 单元（filter / fast→priority 归一化 / flex 透传 / block typed
    error / 无 service_tier 字节不变 / 非 response.create 帧不动 / 空 type
    帧不动 / event_id+code 字段断言 / 非字符串 service_tier 容错）+
    pass 路径 fast 别名归一化回归 +
    ingress 端到端（filter 后上游不含 service_tier / block 后客户端先收
    error event 再收 close 1008 且上游 0 写）+
    passthrough capturedSessionModel fallback 用例（whitelist 策略下首帧
    建立、缺 model 命中 fallback、缺少 fallback 时的 leak 文档化）+
    passthrough session.update / session.created 旋转 capturedSessionModel
    的 mid-session 绕过回归 +
    passthrough billing post-filter ServiceTier 与 idempotent filter 回归。

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>

											
										
										
											2026-04-28 00:34:23 +08:00
+										settingService:        settingService,
-												Reduce DB write amplification on quota and account extra updates

											
										
										
											2026-03-11 13:53:19 +08:00
+										responseHeaderFilter:  compileResponseHeaderFilter(cfg),
 										codexSnapshotThrottle: newAccountWriteThrottle(openAICodexSnapshotPersistMinInterval),
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+									}
 									svc.logOpenAIWSModeBootstrap()
 									return svc
 								}
-												feat(channel): 通配符定价匹配 + OpenAI BillingModelSource + 按次价格校验 + 用户端计费模式展示

- 定价查找支持通配符(suffix *)，最长前缀优先匹配
- 模型限制(restrict_models)同样支持通配符匹配
- OpenAI 网关接入渠道映射/BillingModelSource/模型限制
- 按次/图片计费模式创建时强制要求价格或层级(前后端)
- 用户使用记录列表增加计费模式 badge 列

											
										
										
											2026-03-31 00:23:45 +08:00
+								// ResolveChannelMapping 解析渠道级模型映射（代理到 ChannelService）
 								// ResolveChannelMapping resolves the channel-level model mapping for groupID
 								// by delegating to the configured ChannelService. When no ChannelService is
 								// set, it returns a result whose MappedModel is the requested model unchanged.
 								func (s *OpenAIGatewayService) ResolveChannelMapping(ctx context.Context, groupID int64, model string) ChannelMappingResult {
 									if channels := s.channelService; channels != nil {
 										return channels.ResolveChannelMapping(ctx, groupID, model)
 									}
 									// No channel service: identity mapping.
 									return ChannelMappingResult{MappedModel: model}
 								}
 								// IsModelRestricted reports whether the model is restricted by the channel for
 								// groupID, delegating to the configured ChannelService. Without a
 								// ChannelService nothing is restricted and it returns false.
 								func (s *OpenAIGatewayService) IsModelRestricted(ctx context.Context, groupID int64, model string) bool {
 									if channels := s.channelService; channels != nil {
 										return channels.IsModelRestricted(ctx, groupID, model)
 									}
 									return false
 								}
-												fix: address review findings for channel restriction refactoring

- Fix 7 stale comments still mentioning "限制检查" in handlers/services
- Make billingModelForRestriction explicitly list channel_mapped case
- Add slog.Warn for error swallowing in ResolveChannelMapping and
  needsUpstreamChannelRestrictionCheck
- Document sticky session upstream check exemption

											
										
										
											2026-04-02 13:36:58 +08:00
+								// ResolveChannelMappingAndRestrict 解析渠道映射。
 								// 模型限制检查已移至调度阶段，restricted 始终返回 false。
-												refactor(channel): 抽取渠道映射公共函数 + OpenAI映射到body + 空响应修复 + 清理日志

- 抽取 ResolveChannelMappingAndRestrict 统一入口（5处→1个方法）
- 抽取 BuildModelMappingChain 到 ChannelMappingResult 方法（5处→1行调用）
- OpenAI 三入口 Forward 前应用渠道映射到请求体
- OpenAI Responses/Messages 限制检查添加错误响应
- 清理前端 3 处 console.log 调试日志

											
										
										
											2026-03-31 02:11:24 +08:00
+								func (s *OpenAIGatewayService) ResolveChannelMappingAndRestrict(ctx context.Context, groupID *int64, model string) (ChannelMappingResult, bool) {
-												fix(channel): 全平台渠道映射覆盖 + 公共函数抽取 + 死代码清理

- 4个缺失handler入口添加渠道映射+限制检查(ChatCompletions/Responses/Gemini)
- 模型限制错误信息优化，区分"模型不可用"和"无账号"
- OpenAI RecordUsage RequestedModel 改用 OriginalModel
- ResolveChannelMappingAndRestrict/ReplaceModelInBody 抽取到 ChannelService 消除跨service重复
- validateNoDuplicateModels 按 platform:model 去重
- 删除 Channel.ResolveMappedModel 死代码和 CalculateCostWithChannel Deprecated方法
- 移除冗余nil检查，抽取 validatePricingBillingMode 公共校验

											
										
										
											2026-03-31 15:26:20 +08:00
+									if s.channelService == nil {
 										return ChannelMappingResult{MappedModel: model}, false
 									}
 									return s.channelService.ResolveChannelMappingAndRestrict(ctx, groupID, model)
-												refactor(channel): 抽取渠道映射公共函数 + OpenAI映射到body + 空响应修复 + 清理日志

- 抽取 ResolveChannelMappingAndRestrict 统一入口（5处→1个方法）
- 抽取 BuildModelMappingChain 到 ChannelMappingResult 方法（5处→1行调用）
- OpenAI 三入口 Forward 前应用渠道映射到请求体
- OpenAI Responses/Messages 限制检查添加错误响应
- 清理前端 3 处 console.log 调试日志

											
										
										
											2026-03-31 02:11:24 +08:00
+								}
-												fix: resolve 5 audit findings in channel/credits/scheduling

P0-1: Credits degraded response retry + fail-open
- Add isAntigravityDegradedResponse() to detect transient API failures
- Retry up to 3 times with exponential backoff (500ms/1s/2s)
- Invalidate singleflight cache between retries
- Fail-open after exhausting retries instead of 5h circuit break

P1-1: Fix channel restriction pre-check timing conflict
- Swap checkClaudeCodeRestriction before checkChannelPricingRestriction
- Ensures channel restriction is checked against final fallback groupID

P1-2: Add interval pricing validation (frontend + backend)
- Backend: ValidateIntervals() with boundary, price, overlap checks
- Frontend: validateIntervals() with Chinese error messages
- Rules: MinTokens>=0, MaxTokens>MinTokens, prices>=0, no overlap

P2: Fix cross-platform same-model pricing/mapping override
- Store cache keys using original platform instead of group platform
- Lookup across matching platforms (antigravity→anthropic→gemini)
- Prevents anthropic/gemini same-name models from overwriting each other

											
										
										
											2026-04-02 20:28:04 +08:00
+								func (s *OpenAIGatewayService) checkChannelPricingRestriction(ctx context.Context, groupID *int64, requestedModel string) bool {
 									// Reports whether the model used for billing is restricted for the group.
 									// Without a group, a channel service, or a requested model there is nothing to check.
 									if groupID == nil || s.channelService == nil || requestedModel == "" {
 										return false
 									}
 									// Resolve the channel mapping first: billingModelForRestriction picks the model
 									// name to test from the mapping's BillingModelSource, the requested model and
 									// the mapped model.
 									mapping := s.channelService.ResolveChannelMapping(ctx, *groupID, requestedModel)
 									billingModel := billingModelForRestriction(mapping.BillingModelSource, requestedModel, mapping.MappedModel)
 									// An empty billing model is treated as "not restricted".
 									if billingModel == "" {
 										return false
 									}
 									return s.channelService.IsModelRestricted(ctx, *groupID, billingModel)
 								}
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+								func (s *OpenAIGatewayService) isUpstreamModelRestrictedByChannel(ctx context.Context, groupID int64, account *Account, requestedModel string, requireCompact bool) bool {
-												fix: resolve 5 audit findings in channel/credits/scheduling

P0-1: Credits degraded response retry + fail-open
- Add isAntigravityDegradedResponse() to detect transient API failures
- Retry up to 3 times with exponential backoff (500ms/1s/2s)
- Invalidate singleflight cache between retries
- Fail-open after exhausting retries instead of 5h circuit break

P1-1: Fix channel restriction pre-check timing conflict
- Swap checkClaudeCodeRestriction before checkChannelPricingRestriction
- Ensures channel restriction is checked against final fallback groupID

P1-2: Add interval pricing validation (frontend + backend)
- Backend: ValidateIntervals() with boundary, price, overlap checks
- Frontend: validateIntervals() with Chinese error messages
- Rules: MinTokens>=0, MaxTokens>MinTokens, prices>=0, no overlap

P2: Fix cross-platform same-model pricing/mapping override
- Store cache keys using original platform instead of group platform
- Lookup across matching platforms (antigravity→anthropic→gemini)
- Prevents anthropic/gemini same-name models from overwriting each other

											
										
										
											2026-04-02 20:28:04 +08:00
+									if s.channelService == nil {
 										return false
 									}
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+									upstreamModel := resolveOpenAIAccountUpstreamModelForRequest(account, requestedModel, requireCompact)
-												fix: resolve 5 audit findings in channel/credits/scheduling

P0-1: Credits degraded response retry + fail-open
- Add isAntigravityDegradedResponse() to detect transient API failures
- Retry up to 3 times with exponential backoff (500ms/1s/2s)
- Invalidate singleflight cache between retries
- Fail-open after exhausting retries instead of 5h circuit break

P1-1: Fix channel restriction pre-check timing conflict
- Swap checkClaudeCodeRestriction before checkChannelPricingRestriction
- Ensures channel restriction is checked against final fallback groupID

P1-2: Add interval pricing validation (frontend + backend)
- Backend: ValidateIntervals() with boundary, price, overlap checks
- Frontend: validateIntervals() with Chinese error messages
- Rules: MinTokens>=0, MaxTokens>MinTokens, prices>=0, no overlap

P2: Fix cross-platform same-model pricing/mapping override
- Store cache keys using original platform instead of group platform
- Lookup across matching platforms (antigravity→anthropic→gemini)
- Prevents anthropic/gemini same-name models from overwriting each other

											
										
										
											2026-04-02 20:28:04 +08:00
+									if upstreamModel == "" {
 										return false
 									}
 									return s.channelService.IsModelRestricted(ctx, groupID, upstreamModel)
 								}
 								// needsUpstreamChannelRestrictionCheck reports whether the group's channel both
 								// restricts models and bills by the upstream model. It returns false when no
 								// group or channel service is available, when the channel lookup fails (the
 								// failure is logged as a warning), or when no channel is found.
 								func (s *OpenAIGatewayService) needsUpstreamChannelRestrictionCheck(ctx context.Context, groupID *int64) bool {
 									if groupID == nil || s.channelService == nil {
 										return false
 									}
 									gid := *groupID
 									channel, lookupErr := s.channelService.GetChannelForGroup(ctx, gid)
 									switch {
 									case lookupErr != nil:
 										slog.Warn("failed to check openai channel upstream restriction", "group_id", gid, "error", lookupErr)
 										return false
 									case channel == nil || !channel.RestrictModels:
 										return false
 									default:
 										return channel.BillingModelSource == BillingModelSourceUpstream
 									}
 								}
-												refactor(channel): 抽取渠道映射公共函数 + OpenAI映射到body + 空响应修复 + 清理日志

- 抽取 ResolveChannelMappingAndRestrict 统一入口（5处→1个方法）
- 抽取 BuildModelMappingChain 到 ChannelMappingResult 方法（5处→1行调用）
- OpenAI 三入口 Forward 前应用渠道映射到请求体
- OpenAI Responses/Messages 限制检查添加错误响应
- 清理前端 3 处 console.log 调试日志

											
										
										
											2026-03-31 02:11:24 +08:00
+								// ReplaceModelInBody 替换请求体中的 JSON model 字段（通用 gjson/sjson 实现）。
 								func (s *OpenAIGatewayService) ReplaceModelInBody(body []byte, newModel string) []byte {
-												fix(channel): 全平台渠道映射覆盖 + 公共函数抽取 + 死代码清理

- 4个缺失handler入口添加渠道映射+限制检查(ChatCompletions/Responses/Gemini)
- 模型限制错误信息优化，区分"模型不可用"和"无账号"
- OpenAI RecordUsage RequestedModel 改用 OriginalModel
- ResolveChannelMappingAndRestrict/ReplaceModelInBody 抽取到 ChannelService 消除跨service重复
- validateNoDuplicateModels 按 platform:model 去重
- 删除 Channel.ResolveMappedModel 死代码和 CalculateCostWithChannel Deprecated方法
- 移除冗余nil检查，抽取 validatePricingBillingMode 公共校验

											
										
										
											2026-03-31 15:26:20 +08:00
+									return ReplaceModelInBody(body, newModel)
-												refactor(channel): 抽取渠道映射公共函数 + OpenAI映射到body + 空响应修复 + 清理日志

- 抽取 ResolveChannelMappingAndRestrict 统一入口（5处→1个方法）
- 抽取 BuildModelMappingChain 到 ChannelMappingResult 方法（5处→1行调用）
- OpenAI 三入口 Forward 前应用渠道映射到请求体
- OpenAI Responses/Messages 限制检查添加错误响应
- 清理前端 3 处 console.log 调试日志

											
										
										
											2026-03-31 02:11:24 +08:00
+								}
-												Reduce DB write amplification on quota and account extra updates

											
										
										
											2026-03-11 13:53:19 +08:00
+								func (s *OpenAIGatewayService) getCodexSnapshotThrottle() *accountWriteThrottle {
 									// Prefer the throttle held by this service. A nil receiver or an unset field
 									// falls back to the package-level defaultOpenAICodexSnapshotPersistThrottle.
 									if s != nil && s.codexSnapshotThrottle != nil {
 										return s.codexSnapshotThrottle
 									}
 									return defaultOpenAICodexSnapshotPersistThrottle
 								}
-												refactor: unify post-usage billing logic and fix account quota calculation

- Extract postUsageBilling() to consolidate billing logic across
  GatewayService.RecordUsage, RecordUsageWithLongContext, and
  OpenAIGatewayService.RecordUsage, eliminating ~120 lines of
  duplicated code
- Fix account quota to use TotalCost × accountRateMultiplier
  (was using raw TotalCost, inconsistent with account cost stats)
- Fix RecordUsageWithLongContext API Key quota only updating in
  balance mode (now updates regardless of billing type)
- Fix WebSocket client disconnect detection on Windows by adding
  "an established connection was aborted" to known disconnect errors

											
										
										
											2026-03-06 00:37:37 +08:00
+								func (s *OpenAIGatewayService) billingDeps() *billingDeps {
 									return &billingDeps{
-												feat(notify): add balance low & account quota notification system

- User balance low notification: email alert when balance drops below
  configurable threshold (user email + verified extra emails)
- Account quota notification: broadcast email to admin-configured
  recipients when daily/weekly/total quota usage exceeds alert threshold
- Admin settings: global enable/disable, default threshold, quota
  notification email list (Email Settings tab)
- User profile: enable/disable, custom threshold, add/remove extra
  notification emails with verification code flow
- Account quota: per-dimension alert toggle and threshold in quota
  control card
- Trigger logic: first-crossing only (old >= threshold && new < threshold
  for balance; old < threshold && new >= threshold for quota), naturally
  prevents duplicate notifications without Redis dedup

											
										
										
											2026-04-12 02:48:57 +08:00
+										accountRepo:          s.accountRepo,
 										userRepo:             s.userRepo,
 										userSubRepo:          s.userSubRepo,
 										billingCacheService:  s.billingCacheService,
 										deferredService:      s.deferredService,
 										balanceNotifyService: s.balanceNotifyService,
-												refactor: unify post-usage billing logic and fix account quota calculation

- Extract postUsageBilling() to consolidate billing logic across
  GatewayService.RecordUsage, RecordUsageWithLongContext, and
  OpenAIGatewayService.RecordUsage, eliminating ~120 lines of
  duplicated code
- Fix account quota to use TotalCost × accountRateMultiplier
  (was using raw TotalCost, inconsistent with account cost stats)
- Fix RecordUsageWithLongContext API Key quota only updating in
  balance mode (now updates regardless of billing type)
- Fix WebSocket client disconnect detection on Windows by adding
  "an established connection was aborted" to known disconnect errors

											
										
										
											2026-03-06 00:37:37 +08:00
+									}
 								}
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+								// CloseOpenAIWSPool 关闭 OpenAI WebSocket 连接池的后台 worker 和空闲连接。
 								// 应在应用优雅关闭时调用。
 								func (s *OpenAIGatewayService) CloseOpenAIWSPool() {
 									// Safe to call on a nil service or before the pool was created.
 									if s == nil {
 										return
 									}
 									if pool := s.openaiWSPool; pool != nil {
 										pool.Close()
 									}
 								}
 								func (s *OpenAIGatewayService) logOpenAIWSModeBootstrap() {
 									if s == nil || s.cfg == nil {
 										return
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									}
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+									wsCfg := s.cfg.Gateway.OpenAIWS
 									logOpenAIWSModeInfo(
 										"bootstrap enabled=%v oauth_enabled=%v apikey_enabled=%v force_http=%v responses_websockets_v2=%v responses_websockets=%v payload_log_sample_rate=%.3f event_flush_batch_size=%d event_flush_interval_ms=%d prewarm_cooldown_ms=%d retry_backoff_initial_ms=%d retry_backoff_max_ms=%d retry_jitter_ratio=%.3f retry_total_budget_ms=%d ws_read_limit_bytes=%d",
 										wsCfg.Enabled,
 										wsCfg.OAuthEnabled,
 										wsCfg.APIKeyEnabled,
 										wsCfg.ForceHTTP,
 										wsCfg.ResponsesWebsocketsV2,
 										wsCfg.ResponsesWebsockets,
 										wsCfg.PayloadLogSampleRate,
 										wsCfg.EventFlushBatchSize,
 										wsCfg.EventFlushIntervalMS,
 										wsCfg.PrewarmCooldownMS,
 										wsCfg.RetryBackoffInitialMS,
 										wsCfg.RetryBackoffMaxMS,
 										wsCfg.RetryJitterRatio,
 										wsCfg.RetryTotalBudgetMS,
 										openAIWSMessageReadLimitBytes,
 									)
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+								}
-												feat(openai): 增加 OAuth 账号 Codex 官方客户端限制开关

新增 codex_cli_only 开关并默认关闭，关闭时完全绕过限制逻辑。
在 OpenAI 网关引入统一检测入口，集中判定账号类型、开关与客户端族。
开启后仅放行 codex_cli_rs、codex_vscode、codex_app 客户端家族。
补充后端判定与网关分支测试，并在前端创建/编辑页增加开关配置与回显。

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-12 22:32:59 +08:00
+								func (s *OpenAIGatewayService) getCodexClientRestrictionDetector() CodexClientRestrictionDetector {
 									// Reuse the detector stored on the service when there is one.
 									if s != nil && s.codexDetector != nil {
 										return s.codexDetector
 									}
 									// Otherwise build a new detector from the service config; cfg stays nil
 									// when the receiver itself is nil.
 									var cfg *config.Config
 									if s != nil {
 										cfg = s.cfg
 									}
 									return NewOpenAICodexClientRestrictionDetector(cfg)
 								}
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+								func (s *OpenAIGatewayService) getOpenAIWSProtocolResolver() OpenAIWSProtocolResolver {
 									// Reuse the resolver stored on the service when there is one.
 									if s != nil && s.openaiWSResolver != nil {
 										return s.openaiWSResolver
 									}
 									// Otherwise build a new resolver from the service config; cfg stays nil
 									// when the receiver itself is nil.
 									var cfg *config.Config
 									if s != nil {
 										cfg = s.cfg
 									}
 									return NewOpenAIWSProtocolResolver(cfg)
 								}
 								func classifyOpenAIWSReconnectReason(err error) (string, bool) {
 									if err == nil {
 										return "", false
 									}
 									var fallbackErr *openAIWSFallbackError
 									if !errors.As(err, &fallbackErr) || fallbackErr == nil {
 										return "", false
 									}
 									reason := strings.TrimSpace(fallbackErr.Reason)
 									if reason == "" {
 										return "", false
 									}
 									baseReason := strings.TrimPrefix(reason, "prewarm_")
 									switch baseReason {
 									case "policy_violation",
 										"message_too_big",
 										"upgrade_required",
 										"ws_unsupported",
 										"auth_failed",
-												fix: handle invalid encrypted content error and retry logic.

											
										
										
											2026-03-14 11:42:42 +08:00
+										"invalid_encrypted_content",
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+										"previous_response_not_found":
 										return reason, false
 									}
 									switch baseReason {
 									case "read_event",
 										"write_request",
 										"write",
 										"acquire_timeout",
 										"acquire_conn",
 										"conn_queue_full",
 										"dial_failed",
 										"upstream_5xx",
 										"event_error",
 										"error_event",
 										"upstream_error_event",
 										"ws_connection_limit_reached",
 										"missing_final_response":
 										return reason, true
 									default:
 										return reason, false
 									}
 								}
 								func resolveOpenAIWSFallbackErrorResponse(err error) (statusCode int, errType string, clientMessage string, upstreamMessage string, ok bool) {
 									if err == nil {
 										return 0, "", "", "", false
 									}
 									var fallbackErr *openAIWSFallbackError
 									if !errors.As(err, &fallbackErr) || fallbackErr == nil {
 										return 0, "", "", "", false
 									}
 									reason := strings.TrimSpace(fallbackErr.Reason)
 									reason = strings.TrimPrefix(reason, "prewarm_")
 									if reason == "" {
 										return 0, "", "", "", false
 									}
 									var dialErr *openAIWSDialError
 									if fallbackErr.Err != nil && errors.As(fallbackErr.Err, &dialErr) && dialErr != nil {
 										if dialErr.StatusCode > 0 {
 											statusCode = dialErr.StatusCode
 										}
 										if dialErr.Err != nil {
 											upstreamMessage = sanitizeUpstreamErrorMessage(strings.TrimSpace(dialErr.Err.Error()))
 										}
 									}
 									switch reason {
-												fix: handle invalid encrypted content error and retry logic.

											
										
										
											2026-03-14 11:42:42 +08:00
+									case "invalid_encrypted_content":
 										if statusCode == 0 {
 											statusCode = http.StatusBadRequest
 										}
 										errType = "invalid_request_error"
 										if upstreamMessage == "" {
 											upstreamMessage = "encrypted content could not be verified"
 										}
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+									case "previous_response_not_found":
 										if statusCode == 0 {
 											statusCode = http.StatusBadRequest
 										}
 										errType = "invalid_request_error"
 										if upstreamMessage == "" {
 											upstreamMessage = "previous response not found"
 										}
 									case "upgrade_required":
 										if statusCode == 0 {
 											statusCode = http.StatusUpgradeRequired
 										}
 									case "ws_unsupported":
 										if statusCode == 0 {
 											statusCode = http.StatusBadRequest
 										}
 									case "auth_failed":
 										if statusCode == 0 {
 											statusCode = http.StatusUnauthorized
 										}
 									case "upstream_rate_limited":
 										if statusCode == 0 {
 											statusCode = http.StatusTooManyRequests
 										}
 									default:
 										if statusCode == 0 {
 											return 0, "", "", "", false
 										}
 									}
 									if upstreamMessage == "" && fallbackErr.Err != nil {
 										upstreamMessage = sanitizeUpstreamErrorMessage(strings.TrimSpace(fallbackErr.Err.Error()))
 									}
 									if upstreamMessage == "" {
 										switch reason {
 										case "upgrade_required":
 											upstreamMessage = "upstream websocket upgrade required"
 										case "ws_unsupported":
 											upstreamMessage = "upstream websocket not supported"
 										case "auth_failed":
 											upstreamMessage = "upstream authentication failed"
 										case "upstream_rate_limited":
 											upstreamMessage = "upstream rate limit exceeded, please retry later"
 										default:
 											upstreamMessage = "Upstream request failed"
 										}
 									}
 									if errType == "" {
 										if statusCode == http.StatusTooManyRequests {
 											errType = "rate_limit_error"
 										} else {
 											errType = "upstream_error"
 										}
 									}
 									clientMessage = upstreamMessage
 									return statusCode, errType, clientMessage, upstreamMessage, true
 								}
 								// writeOpenAIWSFallbackErrorResponse turns a WebSocket fallback error into a JSON
 								// error response. It returns true when a response was written, and false when
 								// the context is unusable, the response has already been written, or wsErr
 								// cannot be resolved by resolveOpenAIWSFallbackErrorResponse.
 								func (s *OpenAIGatewayService) writeOpenAIWSFallbackErrorResponse(c *gin.Context, account *Account, wsErr error) bool {
 									if c == nil || c.Writer == nil || c.Writer.Written() {
 										return false
 									}
 									status, kind, clientMsg, upstreamMsg, resolved := resolveOpenAIWSFallbackErrorResponse(wsErr)
 									if !resolved {
 										return false
 									}
 									// Guarantee both messages are non-blank before recording or replying.
 									if strings.TrimSpace(clientMsg) == "" {
 										clientMsg = "Upstream request failed"
 									}
 									if strings.TrimSpace(upstreamMsg) == "" {
 										upstreamMsg = clientMsg
 									}
 									setOpsUpstreamError(c, status, upstreamMsg, "")
 									// The per-account upstream error event is only recorded when the account is known.
 									if account != nil {
 										event := OpsUpstreamErrorEvent{
 											Platform:           account.Platform,
 											AccountID:          account.ID,
 											AccountName:        account.Name,
 											UpstreamStatusCode: status,
 											Kind:               "ws_error",
 											Message:            upstreamMsg,
 										}
 										appendOpsUpstreamError(c, event)
 									}
 									errorBody := gin.H{
 										"type":    kind,
 										"message": clientMsg,
 									}
 									c.JSON(status, gin.H{"error": errorBody})
 									return true
 								}
 								// openAIWSRetryBackoff returns the delay to wait before reconnect attempt
 								// number attempt (1-based).
 								//
 								// The delay starts at the initial backoff, doubles for every further attempt and
 								// saturates at the maximum backoff. A symmetric random jitter of up to
 								// jitterRatio*backoff is then added or subtracted. Initial backoff, maximum
 								// backoff and jitter ratio come from the package defaults and are overridden by
 								// s.cfg.Gateway.OpenAIWS when the service and its config are set.
 								//
 								// It returns 0 for attempt <= 0 or a non-positive initial backoff, and never
 								// returns a negative duration.
 								func (s *OpenAIGatewayService) openAIWSRetryBackoff(attempt int) time.Duration {
 									if attempt <= 0 {
 										return 0
 									}
 									initial := openAIWSRetryBackoffInitialDefault
 									maxBackoff := openAIWSRetryBackoffMaxDefault
 									jitterRatio := openAIWSRetryJitterRatioDefault
 									if s != nil && s.cfg != nil {
 										wsCfg := s.cfg.Gateway.OpenAIWS
 										if wsCfg.RetryBackoffInitialMS > 0 {
 											initial = time.Duration(wsCfg.RetryBackoffInitialMS) * time.Millisecond
 										}
 										if wsCfg.RetryBackoffMaxMS > 0 {
 											maxBackoff = time.Duration(wsCfg.RetryBackoffMaxMS) * time.Millisecond
 										}
 										if wsCfg.RetryJitterRatio >= 0 {
 											jitterRatio = wsCfg.RetryJitterRatio
 										}
 									}
 									if initial <= 0 {
 										return 0
 									}
 									// initial is positive here, so this also covers a non-positive maximum.
 									if maxBackoff < initial {
 										maxBackoff = initial
 									}
 									if jitterRatio < 0 {
 										jitterRatio = 0
 									}
 									if jitterRatio > 1 {
 										jitterRatio = 1
 									}
 									// Double once per attempt after the first, saturating at maxBackoff.
 									// Growing step by step avoids the overflow of `initial * (1 << shift)`,
 									// which wrapped to zero or a negative duration for large attempt values.
 									backoff := initial
 									for i := 1; i < attempt && backoff < maxBackoff; i++ {
 										if backoff > maxBackoff/2 {
 											backoff = maxBackoff
 											break
 										}
 										backoff *= 2
 									}
 									if jitterRatio <= 0 {
 										return backoff
 									}
 									jitter := time.Duration(float64(backoff) * jitterRatio)
 									if jitter <= 0 {
 										return backoff
 									}
 									// Pick a uniform offset in [-jitter, +jitter].
 									delta := time.Duration(rand.Int63n(int64(jitter)*2+1)) - jitter
 									withJitter := backoff + delta
 									if withJitter < 0 {
 										return 0
 									}
 									return withJitter
 								}
 								// openAIWSRetryTotalBudget returns the configured RetryTotalBudgetMS as a
 								// duration. It returns 0 when the service or its config is nil, or when the
 								// configured value is not positive.
 								func (s *OpenAIGatewayService) openAIWSRetryTotalBudget() time.Duration {
 									if s == nil || s.cfg == nil {
 										return 0
 									}
 									if budgetMS := s.cfg.Gateway.OpenAIWS.RetryTotalBudgetMS; budgetMS > 0 {
 										return time.Duration(budgetMS) * time.Millisecond
 									}
 									return 0
 								}
 								// recordOpenAIWSRetryAttempt increments the retry-attempt counter and, for a
 								// positive backoff, adds its length in milliseconds to the backoff total.
 								// It is a no-op on a nil service.
 								func (s *OpenAIGatewayService) recordOpenAIWSRetryAttempt(backoff time.Duration) {
 									if s != nil {
 										s.openaiWSRetryMetrics.retryAttempts.Add(1)
 										if backoff > 0 {
 											s.openaiWSRetryMetrics.retryBackoffMs.Add(backoff.Milliseconds())
 										}
 									}
 								}
 								// recordOpenAIWSRetryExhausted increments the retry-exhausted counter.
 								// It is a no-op on a nil service.
 								func (s *OpenAIGatewayService) recordOpenAIWSRetryExhausted() {
 									if s != nil {
 										s.openaiWSRetryMetrics.retryExhausted.Add(1)
 									}
 								}
 								// recordOpenAIWSNonRetryableFastFallback increments the non-retryable
 								// fast-fallback counter. It is a no-op on a nil service.
 								func (s *OpenAIGatewayService) recordOpenAIWSNonRetryableFastFallback() {
 									if s != nil {
 										s.openaiWSRetryMetrics.nonRetryableFastFallback.Add(1)
 									}
 								}
 								// SnapshotOpenAIWSRetryMetrics returns the current values of the WebSocket retry
 								// counters. A nil service yields the zero-value snapshot.
 								func (s *OpenAIGatewayService) SnapshotOpenAIWSRetryMetrics() OpenAIWSRetryMetricsSnapshot {
 									var snapshot OpenAIWSRetryMetricsSnapshot
 									if s == nil {
 										return snapshot
 									}
 									snapshot.RetryAttemptsTotal = s.openaiWSRetryMetrics.retryAttempts.Load()
 									snapshot.RetryBackoffMsTotal = s.openaiWSRetryMetrics.retryBackoffMs.Load()
 									snapshot.RetryExhaustedTotal = s.openaiWSRetryMetrics.retryExhausted.Load()
 									snapshot.NonRetryableFastFallbackTotal = s.openaiWSRetryMetrics.nonRetryableFastFallback.Load()
 									return snapshot
 								}
 								// SnapshotOpenAICompatibilityFallbackMetrics combines the counters returned by
 								// openAIStickyCompatStats and RequestMetadataFallbackStats into one snapshot.
 								// It also derives the legacy read hit rate (0 when there were no fallback reads)
 								// and the sum of all metadata fallback counters.
 								func SnapshotOpenAICompatibilityFallbackMetrics() OpenAICompatibilityFallbackMetricsSnapshot {
 									readTotal, readHit, dualWriteTotal := openAIStickyCompatStats()
 									haiku, thinking, stickyAccount, stickyGroup, singleRetry, switchCount := RequestMetadataFallbackStats()

 									var hitRate float64
 									if readTotal > 0 {
 										hitRate = float64(readHit) / float64(readTotal)
 									}

 									return OpenAICompatibilityFallbackMetricsSnapshot{
 										SessionHashLegacyReadFallbackTotal: readTotal,
 										SessionHashLegacyReadFallbackHit:   readHit,
 										SessionHashLegacyDualWriteTotal:    dualWriteTotal,
 										SessionHashLegacyReadHitRate:       hitRate,
 										MetadataLegacyFallbackIsMaxTokensOneHaikuTotal: haiku,
 										MetadataLegacyFallbackThinkingEnabledTotal:     thinking,
 										MetadataLegacyFallbackPrefetchedStickyAccount:  stickyAccount,
 										MetadataLegacyFallbackPrefetchedStickyGroup:    stickyGroup,
 										MetadataLegacyFallbackSingleAccountRetryTotal:  singleRetry,
 										MetadataLegacyFallbackAccountSwitchCountTotal:  switchCount,
 										MetadataLegacyFallbackTotal:                    haiku + thinking + stickyAccount + stickyGroup + singleRetry + switchCount,
 									}
 								}
-												feat(openai): 增加 OAuth 账号 Codex 官方客户端限制开关

新增 codex_cli_only 开关并默认关闭，关闭时完全绕过限制逻辑。
在 OpenAI 网关引入统一检测入口，集中判定账号类型、开关与客户端族。
开启后仅放行 codex_cli_rs、codex_vscode、codex_app 客户端家族。
补充后端判定与网关分支测试，并在前端创建/编辑页增加开关配置与回显。

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-12 22:32:59 +08:00
+								func (s *OpenAIGatewayService) detectCodexClientRestriction(c *gin.Context, account *Account) CodexClientRestrictionDetectionResult {
 									// Run the detector from getCodexClientRestrictionDetector against this
 									// request and account and return its result unchanged.
 									return s.getCodexClientRestrictionDetector().Detect(c, account)
 								}
 								// getAPIKeyIDFromContext returns the ID of the *APIKey stored in the gin context
 								// under "api_key". It returns 0 when the context is nil, the key is absent, or
 								// the stored value is not a non-nil *APIKey.
 								func getAPIKeyIDFromContext(c *gin.Context) int64 {
 									if c == nil {
 										return 0
 									}
 									if stored, found := c.Get("api_key"); found {
 										if key, isKey := stored.(*APIKey); isKey && key != nil {
 											return key.ID
 										}
 									}
 									return 0
 								}
-												fix(gateway): 防止 OpenAI Codex 跨用户串流

根因：多个用户共享同一 OAuth 账号时，conversation_id/session_id 头
未做用户隔离，导致上游 chatgpt.com 将不同用户的请求关联到同一会话。

HTTP SSE 修复:
- 新增 isolateOpenAISessionID(apiKeyID, raw)，将 API Key ID 混入
  session 标识符（xxhash），确保不同 Key 的用户产生不同上游会话
- buildUpstreamRequest: OAuth 分支先 Del 客户端透传的 session 头，
  再用隔离值覆盖
- buildUpstreamRequestOpenAIPassthrough: 透传路径同样隔离
- ForwardAsAnthropic: Anthropic Messages 兼容路径同步修复
- buildOpenAIWSHeaders: WS 路径的 OAuth session 头同步隔离

											
										
										
											2026-03-16 10:28:11 +08:00
+								// isolateOpenAISessionID 将 apiKeyID 混入 session 标识符，
 								// 确保不同 API Key 的用户即使使用相同的原始 session_id/conversation_id，
 								// 到达上游的标识符也不同，防止跨用户会话碰撞。
 								func isolateOpenAISessionID(apiKeyID int64, raw string) string {
 									trimmed := strings.TrimSpace(raw)
 									// A blank identifier stays blank so callers can tell "no session" apart.
 									if trimmed == "" {
 										return ""
 									}
 									// Hash "k<apiKeyID>:" followed by the trimmed identifier, so the same raw
 									// value yields a different digest for each API key.
 									digest := xxhash.New()
 									_, _ = digest.WriteString("k" + strconv.FormatInt(apiKeyID, 10) + ":")
 									_, _ = digest.WriteString(trimmed)
 									// Render the 64-bit sum as 16 zero-padded lowercase hex digits.
 									return fmt.Sprintf("%016x", digest.Sum64())
 								}
-												fix(ops): 修复日志级别过滤并增强OpenAI错误诊断日志

- 移除 warn 级别下 access info 的强制入库补写，确保运行时日志级别真实生效

- 将 OpenAI fallback matched 与 passthrough 断流提示按需求降级为 info

- 为 codex_cli_only 与 instructions required 场景补充请求诊断字段（含 User-Agent）

- 出于安全考虑移除请求体预览，仅保留 request_body_size 与白名单头信息

- 新增/更新回归测试，覆盖 Forward 入口到日志落库链路

											
										
										
											2026-02-13 19:27:07 +08:00
+								func logCodexCLIOnlyDetection(ctx context.Context, c *gin.Context, account *Account, apiKeyID int64, result CodexClientRestrictionDetectionResult, body []byte) {
-												feat(openai): 增加 OAuth 账号 Codex 官方客户端限制开关

新增 codex_cli_only 开关并默认关闭，关闭时完全绕过限制逻辑。
在 OpenAI 网关引入统一检测入口，集中判定账号类型、开关与客户端族。
开启后仅放行 codex_cli_rs、codex_vscode、codex_app 客户端家族。
补充后端判定与网关分支测试，并在前端创建/编辑页增加开关配置与回显。

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-12 22:32:59 +08:00
+									if !result.Enabled {
 										return
 									}
 									if ctx == nil {
 										ctx = context.Background()
 									}
 									accountID := int64(0)
 									if account != nil {
 										accountID = account.ID
 									}
 									fields := []zap.Field{
 										zap.String("component", "service.openai_gateway"),
 										zap.Int64("account_id", accountID),
 										zap.Bool("codex_cli_only_enabled", result.Enabled),
 										zap.Bool("codex_official_client_match", result.Matched),
 										zap.String("reject_reason", result.Reason),
 									}
 									if apiKeyID > 0 {
 										fields = append(fields, zap.Int64("api_key_id", apiKeyID))
 									}
-												fix(ops): 修复日志级别过滤并增强OpenAI错误诊断日志

- 移除 warn 级别下 access info 的强制入库补写，确保运行时日志级别真实生效

- 将 OpenAI fallback matched 与 passthrough 断流提示按需求降级为 info

- 为 codex_cli_only 与 instructions required 场景补充请求诊断字段（含 User-Agent）

- 出于安全考虑移除请求体预览，仅保留 request_body_size 与白名单头信息

- 新增/更新回归测试，覆盖 Forward 入口到日志落库链路

											
										
										
											2026-02-13 19:27:07 +08:00
+									if !result.Matched {
 										fields = appendCodexCLIOnlyRejectedRequestFields(fields, c, body)
 									}
-												feat(openai): 增加 OAuth 账号 Codex 官方客户端限制开关

新增 codex_cli_only 开关并默认关闭，关闭时完全绕过限制逻辑。
在 OpenAI 网关引入统一检测入口，集中判定账号类型、开关与客户端族。
开启后仅放行 codex_cli_rs、codex_vscode、codex_app 客户端家族。
补充后端判定与网关分支测试，并在前端创建/编辑页增加开关配置与回显。

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-12 22:32:59 +08:00
+									log := logger.FromContext(ctx).With(fields...)
 									if result.Matched {
 										return
 									}
 									log.Warn("OpenAI codex_cli_only 拒绝非官方客户端请求")
 								}
-												fix(ops): 修复日志级别过滤并增强OpenAI错误诊断日志

- 移除 warn 级别下 access info 的强制入库补写，确保运行时日志级别真实生效

- 将 OpenAI fallback matched 与 passthrough 断流提示按需求降级为 info

- 为 codex_cli_only 与 instructions required 场景补充请求诊断字段（含 User-Agent）

- 出于安全考虑移除请求体预览，仅保留 request_body_size 与白名单头信息

- 新增/更新回归测试，覆盖 Forward 入口到日志落库链路

											
										
										
											2026-02-13 19:27:07 +08:00
+								func appendCodexCLIOnlyRejectedRequestFields(fields []zap.Field, c *gin.Context, body []byte) []zap.Field {
 									if c == nil || c.Request == nil {
 										return fields
 									}
 									req := c.Request
 									requestModel, requestStream, promptCacheKey := extractOpenAIRequestMetaFromBody(body)
 									fields = append(fields,
 										zap.String("request_method", strings.TrimSpace(req.Method)),
 										zap.String("request_path", strings.TrimSpace(req.URL.Path)),
 										zap.String("request_query", strings.TrimSpace(req.URL.RawQuery)),
 										zap.String("request_host", strings.TrimSpace(req.Host)),
 										zap.String("request_client_ip", strings.TrimSpace(c.ClientIP())),
 										zap.String("request_remote_addr", strings.TrimSpace(req.RemoteAddr)),
-												fix(openai): 拒绝日志记录原始 User-Agent 便于攻击研判

											
										
										
											2026-02-14 09:59:19 +08:00
+										zap.String("request_user_agent", strings.TrimSpace(req.Header.Get("User-Agent"))),
-												fix(ops): 修复日志级别过滤并增强OpenAI错误诊断日志

- 移除 warn 级别下 access info 的强制入库补写，确保运行时日志级别真实生效

- 将 OpenAI fallback matched 与 passthrough 断流提示按需求降级为 info

- 为 codex_cli_only 与 instructions required 场景补充请求诊断字段（含 User-Agent）

- 出于安全考虑移除请求体预览，仅保留 request_body_size 与白名单头信息

- 新增/更新回归测试，覆盖 Forward 入口到日志落库链路

											
										
										
											2026-02-13 19:27:07 +08:00
+										zap.String("request_content_type", strings.TrimSpace(req.Header.Get("Content-Type"))),
 										zap.Int64("request_content_length", req.ContentLength),
 										zap.Bool("request_stream", requestStream),
 									)
 									if requestModel != "" {
 										fields = append(fields, zap.String("request_model", requestModel))
 									}
 									if promptCacheKey != "" {
 										fields = append(fields, zap.String("request_prompt_cache_key_sha256", hashSensitiveValueForLog(promptCacheKey)))
 									}
 									if headers := snapshotCodexCLIOnlyHeaders(req.Header); len(headers) > 0 {
 										fields = append(fields, zap.Any("request_headers", headers))
 									}
 									fields = append(fields, zap.Int("request_body_size", len(body)))
 									return fields
 								}
 								// snapshotCodexCLIOnlyHeaders collects the non-empty request headers named in
 								// codexCLIOnlyDebugHeaderWhitelist for diagnostic logging. Keys are lower-cased;
 								// values are trimmed and then passed through truncateString with
 								// codexCLIOnlyHeaderValueMaxBytes as the limit. It returns nil when header is
 								// empty, and a (possibly empty) map otherwise.
 								func snapshotCodexCLIOnlyHeaders(header http.Header) map[string]string {
 									if len(header) == 0 {
 										return nil
 									}
 									snapshot := make(map[string]string, len(codexCLIOnlyDebugHeaderWhitelist))
 									for _, name := range codexCLIOnlyDebugHeaderWhitelist {
 										// Headers that are absent or blank are left out of the snapshot.
 										if trimmed := strings.TrimSpace(header.Get(name)); trimmed != "" {
 											snapshot[strings.ToLower(name)] = truncateString(trimmed, codexCLIOnlyHeaderValueMaxBytes)
 										}
 									}
 									return snapshot
 								}
 								// hashSensitiveValueForLog returns a short, log-safe fingerprint of raw: the
 								// first 8 bytes of the SHA-256 digest of the whitespace-trimmed value, encoded
 								// as 16 lower-case hex characters. A blank input yields "".
 								func hashSensitiveValueForLog(raw string) string {
 									trimmed := strings.TrimSpace(raw)
 									if len(trimmed) == 0 {
 										return ""
 									}
 									// Only a prefix of the digest is kept; it is enough to correlate log lines.
 									const prefixLen = 8
 									digest := sha256.Sum256([]byte(trimmed))
 									return hex.EncodeToString(digest[:prefixLen])
 								}
 								func logOpenAIInstructionsRequiredDebug(
 									ctx context.Context,
 									c *gin.Context,
 									account *Account,
 									upstreamStatusCode int,
 									upstreamMsg string,
 									requestBody []byte,
 									upstreamBody []byte,
 								) {
 									msg := strings.TrimSpace(upstreamMsg)
 									if !isOpenAIInstructionsRequiredError(upstreamStatusCode, msg, upstreamBody) {
 										return
 									}
 									if ctx == nil {
 										ctx = context.Background()
 									}
 									accountID := int64(0)
 									accountName := ""
 									if account != nil {
 										accountID = account.ID
 										accountName = strings.TrimSpace(account.Name)
 									}
 									userAgent := ""
-												fix(openai): detect official codex client by headers

											
										
										
											2026-03-07 14:12:38 +08:00
+									originator := ""
-												fix(ops): 修复日志级别过滤并增强OpenAI错误诊断日志

- 移除 warn 级别下 access info 的强制入库补写，确保运行时日志级别真实生效

- 将 OpenAI fallback matched 与 passthrough 断流提示按需求降级为 info

- 为 codex_cli_only 与 instructions required 场景补充请求诊断字段（含 User-Agent）

- 出于安全考虑移除请求体预览，仅保留 request_body_size 与白名单头信息

- 新增/更新回归测试，覆盖 Forward 入口到日志落库链路

											
										
										
											2026-02-13 19:27:07 +08:00
+									if c != nil {
 										userAgent = strings.TrimSpace(c.GetHeader("User-Agent"))
-												fix(openai): detect official codex client by headers

											
										
										
											2026-03-07 14:12:38 +08:00
+										originator = strings.TrimSpace(c.GetHeader("originator"))
-												fix(ops): 修复日志级别过滤并增强OpenAI错误诊断日志

- 移除 warn 级别下 access info 的强制入库补写，确保运行时日志级别真实生效

- 将 OpenAI fallback matched 与 passthrough 断流提示按需求降级为 info

- 为 codex_cli_only 与 instructions required 场景补充请求诊断字段（含 User-Agent）

- 出于安全考虑移除请求体预览，仅保留 request_body_size 与白名单头信息

- 新增/更新回归测试，覆盖 Forward 入口到日志落库链路

											
										
										
											2026-02-13 19:27:07 +08:00
+									}
 									fields := []zap.Field{
 										zap.String("component", "service.openai_gateway"),
 										zap.Int64("account_id", accountID),
 										zap.String("account_name", accountName),
 										zap.Int("upstream_status_code", upstreamStatusCode),
 										zap.String("upstream_error_message", msg),
 										zap.String("request_user_agent", userAgent),
-												fix(openai): detect official codex client by headers

											
										
										
											2026-03-07 14:12:38 +08:00
+										zap.Bool("codex_official_client_match", openai.IsCodexOfficialClientByHeaders(userAgent, originator)),
-												fix(ops): 修复日志级别过滤并增强OpenAI错误诊断日志

- 移除 warn 级别下 access info 的强制入库补写，确保运行时日志级别真实生效

- 将 OpenAI fallback matched 与 passthrough 断流提示按需求降级为 info

- 为 codex_cli_only 与 instructions required 场景补充请求诊断字段（含 User-Agent）

- 出于安全考虑移除请求体预览，仅保留 request_body_size 与白名单头信息

- 新增/更新回归测试，覆盖 Forward 入口到日志落库链路

											
										
										
											2026-02-13 19:27:07 +08:00
+									}
 									fields = appendCodexCLIOnlyRejectedRequestFields(fields, c, requestBody)
 									logger.FromContext(ctx).With(fields...).Warn("OpenAI 上游返回 Instructions are required，已记录请求详情用于排查")
 								}
 								// isOpenAIInstructionsRequiredError reports whether an upstream HTTP 400 response
 								// says that the "instructions" parameter is missing. upstreamMsg is inspected
 								// first; if it does not match, the error.param, error.message, error.code and
 								// error.type fields of upstreamBody are consulted. Any other status code yields
 								// false.
 								func isOpenAIInstructionsRequiredError(upstreamStatusCode int, upstreamMsg string, upstreamBody []byte) bool {
 									if upstreamStatusCode != http.StatusBadRequest {
 										return false
 									}
 									knownPhrases := [...]string{
 										"instructions are required",
 										"required parameter: 'instructions'",
 										"required parameter: instructions",
 									}
 									mentionsRequiredInstructions := func(text string) bool {
 										normalized := strings.ToLower(strings.TrimSpace(text))
 										if normalized == "" {
 											return false
 										}
 										for _, phrase := range knownPhrases {
 											if strings.Contains(normalized, phrase) {
 												return true
 											}
 										}
 										if strings.Contains(normalized, "missing required parameter") && strings.Contains(normalized, "instructions") {
 											return true
 										}
 										// Loose fallback: any wording that pairs "instruction" with "required".
 										return strings.Contains(normalized, "instruction") && strings.Contains(normalized, "required")
 									}
 									if mentionsRequiredInstructions(upstreamMsg) {
 										return true
 									}
 									if len(upstreamBody) == 0 {
 										return false
 									}
 									// bodyField reads one string field of the upstream JSON, trimmed and lower-cased.
 									bodyField := func(path string) string {
 										return strings.ToLower(strings.TrimSpace(gjson.GetBytes(upstreamBody, path).String()))
 									}
 									if bodyField("error.param") == "instructions" {
 										return true
 									}
 									message := bodyField("error.message")
 									if mentionsRequiredInstructions(message) {
 										return true
 									}
 									// Both remaining checks need the message to mention "instructions".
 									if !strings.Contains(message, "instructions") {
 										return false
 									}
 									if strings.Contains(bodyField("error.code"), "missing_required_parameter") {
 										return true
 									}
 									return strings.Contains(bodyField("error.type"), "invalid_request") && strings.Contains(message, "required")
 								}
-												fix: OpenAI临时性400错误支持池模式同账号重试 & HelpTooltip层级修复

1. 识别OpenAI "An error occurred while processing your request" 临时性400错误
   并触发failover，同时在池模式下标记RetryableOnSameAccount，允许同账号重试
2. ForwardAsAnthropic路径同步支持临时性400错误的识别和同账号重试
3. HelpTooltip组件使用Teleport渲染到body，修复在dialog内被裁切的问题

											
										
										
											2026-03-10 03:00:58 +08:00
+								// isOpenAITransientProcessingError reports whether an upstream HTTP 400 response
 								// carries the generic "An error occurred while processing your request" failure,
 								// or a text that contains all of "you can retry your request", "help.openai.com"
 								// and "request id". upstreamMsg is checked first, then error.message of
 								// upstreamBody, and finally the raw body text. Any other status code yields false.
 								func isOpenAITransientProcessingError(upstreamStatusCode int, upstreamMsg string, upstreamBody []byte) bool {
 									if upstreamStatusCode != http.StatusBadRequest {
 										return false
 									}
 									looksTransient := func(text string) bool {
 										normalized := strings.ToLower(strings.TrimSpace(text))
 										switch {
 										case normalized == "":
 											return false
 										case strings.Contains(normalized, "an error occurred while processing your request"):
 											return true
 										}
 										// Otherwise every one of the retry-hint markers must be present.
 										for _, marker := range [...]string{"you can retry your request", "help.openai.com", "request id"} {
 											if !strings.Contains(normalized, marker) {
 												return false
 											}
 										}
 										return true
 									}
 									if looksTransient(upstreamMsg) {
 										return true
 									}
 									if len(upstreamBody) == 0 {
 										return false
 									}
 									return looksTransient(gjson.GetBytes(upstreamBody, "error.message").String()) ||
 										looksTransient(string(upstreamBody))
 								}
-												feat(openai): add /v1/messages endpoint and API compatibility layer

Add Anthropic Messages API support for OpenAI platform groups, enabling
clients using Claude-style /v1/messages format to access OpenAI accounts
through automatic protocol conversion.

- Add apicompat package with type definitions and bidirectional converters
  (Anthropic ↔ Chat, Chat ↔ Responses, Anthropic ↔ Responses)
- Implement /v1/messages endpoint for OpenAI gateway with streaming support
- Add model mapping UI for OpenAI OAuth accounts (whitelist + mapping modes)
- Support prompt caching fields and codex OAuth transforms
- Fix tool call ID conversion for Responses API (fc_ prefix)
- Ensure function_call_output has non-empty output field

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-03-06 14:29:22 +08:00
+								// ExtractSessionID extracts the raw session ID from headers or body without hashing.
 								// Used by ForwardAsAnthropic to pass as prompt_cache_key for upstream cache.
 								//
 								// Lookup order: the session_id header, then the conversation_id header, then the
 								// prompt_cache_key field of body. Each candidate is whitespace-trimmed, and the
 								// first non-empty one wins. A nil c yields "".
 								func (s *OpenAIGatewayService) ExtractSessionID(c *gin.Context, body []byte) string {
 									if c == nil {
 										return ""
 									}
 									if fromSession := strings.TrimSpace(c.GetHeader("session_id")); fromSession != "" {
 										return fromSession
 									}
 									if fromConversation := strings.TrimSpace(c.GetHeader("conversation_id")); fromConversation != "" {
 										return fromConversation
 									}
 									if len(body) == 0 {
 										return ""
 									}
 									return strings.TrimSpace(gjson.GetBytes(body, "prompt_cache_key").String())
 								}
-												fix(openai): avoid implicit image sticky sessions

											
										
										
											2026-04-26 17:05:19 +00:00
+								// explicitOpenAISessionID returns the session identifier the client supplied
 								// explicitly: the session_id header, else the conversation_id header, else the
 								// prompt_cache_key field of body. Values are whitespace-trimmed; "" is returned
 								// when c is nil or no candidate is set.
 								func explicitOpenAISessionID(c *gin.Context, body []byte) string {
 									if c == nil {
 										return ""
 									}
 									// Headers are consulted in priority order before falling back to the body.
 									for _, headerName := range [...]string{"session_id", "conversation_id"} {
 										if candidate := strings.TrimSpace(c.GetHeader(headerName)); candidate != "" {
 											return candidate
 										}
 									}
 									if len(body) == 0 {
 										return ""
 									}
 									return strings.TrimSpace(gjson.GetBytes(body, "prompt_cache_key").String())
 								}
 								// GenerateExplicitSessionHash derives a sticky-session hash solely from explicit
 								// client session signals (see explicitOpenAISessionID). Unlike GenerateSessionHash
 								// it never falls back to a content-derived seed, which is why stateless endpoints
 								// such as /v1/images use it. It returns "" when no explicit signal is present;
 								// otherwise the legacy hash is attached to c and the current hash is returned.
 								func (s *OpenAIGatewayService) GenerateExplicitSessionHash(c *gin.Context, body []byte) string {
 									if explicitID := explicitOpenAISessionID(c, body); explicitID != "" {
 										hash, legacy := deriveOpenAISessionHashes(explicitID)
 										attachOpenAILegacySessionHashToGin(c, legacy)
 										return hash
 									}
 									return ""
 								}
-												fix(openai): 使用 prompt_cache_key 兜底粘性会话

opencode 请求不带 session_id/conversation_id，导致粘性会话失效。现在按 header 优先、prompt_cache_key 兜底生成 session hash，并补充单测验证优先级。

											
										
										
											2026-01-17 02:31:16 +08:00
+								// GenerateSessionHash generates a sticky-session hash for OpenAI requests.
 								//
 								// Priority:
 								//  1. Header: session_id
 								//  2. Header: conversation_id
 								//  3. Body:   prompt_cache_key (opencode)
-												fix(gateway): add content-based session hash fallback for non-Codex clients

When no explicit session signals (session_id, conversation_id, prompt_cache_key)
are provided, derive a stable session seed from the request body content
(model + tools + system prompt + first user message) to enable sticky routing
and prompt caching for non-Codex clients using the Chat Completions API.

This mirrors the content-based fallback already present in GatewayService.
GenerateSessionHash, adapted for the OpenAI gateway's request formats (both
Chat Completions messages and Responses API input).

JSON fragments are canonicalized via normalizeCompatSeedJSON to ensure
semantically identical requests produce the same seed regardless of
whitespace or key ordering.

Closes #1421

											
										
										
											2026-04-02 00:11:06 +08:00
+								//  4. Body:   content-based fallback (model + system + tools + first user message)
-												perf(backend): 使用 gjson/sjson 优化热路径 JSON 处理

将 API 网关热路径中的 json.Unmarshal+json.Marshal 替换为 gjson 零拷贝查询和 sjson 精准写入：
- unwrapV1InternalResponse 性能提升 22x（4009ns→182ns），内存分配减少 28.5x
- unwrapGeminiResponse、extractGeminiUsage、estimateGeminiCountTokens、ParseGeminiRateLimitResetTime 改为接收 []byte 使用 gjson 提取
- ParseGatewayRequest 的 model/stream/metadata/thinking/max_tokens 改用 gjson 类型安全提取
- Handler 层（sora/openai）改用 gjson 提取字段、sjson 注入/修改字段，移除 map[string]any 中间变量
- Sora Client 响应解析改用 gjson ForEach 遍历，减少内存分配
- 新增约 100 个单元测试用例，所有改动函数覆盖率 >85%

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-10 08:59:30 +08:00
+								func (s *OpenAIGatewayService) GenerateSessionHash(c *gin.Context, body []byte) string {
-												fix(openai): 使用 prompt_cache_key 兜底粘性会话

opencode 请求不带 session_id/conversation_id，导致粘性会话失效。现在按 header 优先、prompt_cache_key 兜底生成 session hash，并补充单测验证优先级。

											
										
										
											2026-01-17 02:31:16 +08:00
+									if c == nil {
 										return ""
 									}
-												fix(openai): avoid implicit image sticky sessions

											
										
										
											2026-04-26 17:05:19 +00:00
+									sessionID := explicitOpenAISessionID(c, body)
-												fix(gateway): add content-based session hash fallback for non-Codex clients

When no explicit session signals (session_id, conversation_id, prompt_cache_key)
are provided, derive a stable session seed from the request body content
(model + tools + system prompt + first user message) to enable sticky routing
and prompt caching for non-Codex clients using the Chat Completions API.

This mirrors the content-based fallback already present in GatewayService.
GenerateSessionHash, adapted for the OpenAI gateway's request formats (both
Chat Completions messages and Responses API input).

JSON fragments are canonicalized via normalizeCompatSeedJSON to ensure
semantically identical requests produce the same seed regardless of
whitespace or key ordering.

Closes #1421

											
										
										
											2026-04-02 00:11:06 +08:00
+									if sessionID == "" && len(body) > 0 {
 										sessionID = deriveOpenAIContentSessionSeed(body)
 									}
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									if sessionID == "" {
 										return ""
 									}
-												fix(openai): 使用 prompt_cache_key 兜底粘性会话

opencode 请求不带 session_id/conversation_id，导致粘性会话失效。现在按 header 优先、prompt_cache_key 兜底生成 session hash，并补充单测验证优先级。

											
										
										
											2026-01-17 02:31:16 +08:00
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+									currentHash, legacyHash := deriveOpenAISessionHashes(sessionID)
 									attachOpenAILegacySessionHashToGin(c, legacyHash)
 									return currentHash
 								}
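 								// GenerateSessionHashWithFallback first derives the session hash through
 								// GenerateSessionHash (explicit session_id / conversation_id / prompt_cache_key
 								// signals, then the content-derived seed). Only when that yields an empty hash is
 								// fallbackSeed used to build a stable hash instead.
 								// It is used by WS ingress so that requests lacking session signals do not drift
 								// across accounts.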
 								func (s *OpenAIGatewayService) GenerateSessionHashWithFallback(c *gin.Context, body []byte, fallbackSeed string) string {
 									sessionHash := s.GenerateSessionHash(c, body)
 									if sessionHash != "" {
 										return sessionHash
 									}
 									seed := strings.TrimSpace(fallbackSeed)
 									if seed == "" {
 										return ""
 									}
 									currentHash, legacyHash := deriveOpenAISessionHashes(seed)
 									attachOpenAILegacySessionHashToGin(c, legacyHash)
 									return currentHash
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+								}
-												fix(openai): detect official codex client by headers

											
										
										
											2026-03-07 14:12:38 +08:00
+								// resolveOpenAIUpstreamOriginator returns the originator value to use: the
 								// trimmed "originator" request header when c is non-nil and the header is
 								// non-empty, otherwise "codex_cli_rs" for official clients and "opencode" for
 								// all others.
 								func resolveOpenAIUpstreamOriginator(c *gin.Context, isOfficialClient bool) string {
 									fromHeader := ""
 									if c != nil {
 										fromHeader = strings.TrimSpace(c.GetHeader("originator"))
 									}
 									switch {
 									case fromHeader != "":
 										return fromHeader
 									case isOfficialClient:
 										return "codex_cli_rs"
 									default:
 										return "opencode"
 									}
 								}
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+								// BindStickySession sets session -> account binding with standard TTL.
-												feat(groups): add Claude Code client restriction and session isolation

- Add claude_code_only field to restrict groups to Claude Code clients only
- Add fallback_group_id for non-Claude Code requests to use alternate group
- Implement ClaudeCodeValidator for User-Agent detection
- Add group-level session binding isolation (groupID in Redis key)
- Prevent cross-group sticky session pollution
- Update frontend with Claude Code restriction controls

											
										
										
											2026-01-08 23:07:00 +08:00
+								func (s *OpenAIGatewayService) BindStickySession(ctx context.Context, groupID *int64, sessionHash string, accountID int64) error {
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+									if sessionHash == "" || accountID <= 0 {
 										return nil
 									}
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+									ttl := openaiStickySessionTTL
 									if s != nil && s.cfg != nil && s.cfg.Gateway.OpenAIWS.StickySessionTTLSeconds > 0 {
 										ttl = time.Duration(s.cfg.Gateway.OpenAIWS.StickySessionTTLSeconds) * time.Second
 									}
 									return s.setStickySessionAccountID(ctx, groupID, sessionHash, accountID, ttl)
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+								}
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+								// SelectAccount selects an OpenAI account with sticky session support
-												refactor: 调整项目结构为单向依赖

											
										
										
											2025-12-26 15:40:24 +08:00
+								func (s *OpenAIGatewayService) SelectAccount(ctx context.Context, groupID *int64, sessionHash string) (*Account, error) {
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									return s.SelectAccountForModel(ctx, groupID, sessionHash, "")
 								}
 								// SelectAccountForModel selects an account supporting the requested model
-												refactor: 调整项目结构为单向依赖

											
										
										
											2025-12-26 15:40:24 +08:00
+								func (s *OpenAIGatewayService) SelectAccountForModel(ctx context.Context, groupID *int64, sessionHash string, requestedModel string) (*Account, error) {
-												feat: cc/codex support account retry

											
										
										
											2025-12-27 11:44:00 +08:00
+									return s.SelectAccountForModelWithExclusions(ctx, groupID, sessionHash, requestedModel, nil)
 								}
 								// SelectAccountForModelWithExclusions selects an account supporting the requested model while excluding specified accounts.
-												fix(调度): 完善粘性会话清理与账号调度刷新

- Update/BulkUpdate 按不可调度字段触发缓存刷新
- GatewayCache 支持多前缀会话键清理
- 模型路由与混合调度优化粘性会话处理
- 补充调度与缓存相关测试覆盖

											
										
										
											2026-01-20 11:19:32 +08:00
+								// SelectAccountForModelWithExclusions 选择支持指定模型的账号，同时排除指定的账号。
-												feat: cc/codex support account retry

											
										
										
											2025-12-27 11:44:00 +08:00
+								func (s *OpenAIGatewayService) SelectAccountForModelWithExclusions(ctx context.Context, groupID *int64, sessionHash string, requestedModel string, excludedIDs map[int64]struct{}) (*Account, error) {
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+									return s.selectAccountForModelWithExclusions(ctx, groupID, sessionHash, requestedModel, excludedIDs, false, 0)
 								}
 								// noAvailableOpenAISelectionError returns the error reported when account
 								// selection finds nothing usable. compactBlocked takes precedence and yields
 								// ErrNoAvailableCompactAccounts; otherwise the message names requestedModel when
 								// one was given and falls back to a generic message when it is empty.
 								func noAvailableOpenAISelectionError(requestedModel string, compactBlocked bool) error {
 									switch {
 									case compactBlocked:
 										return ErrNoAvailableCompactAccounts
 									case requestedModel == "":
 										return errors.New("no available OpenAI accounts")
 									default:
 										return fmt.Errorf("no available OpenAI accounts supporting model: %s", requestedModel)
 									}
 								}
 								// openAICompactSupportTier ranks an account by its compact capability:
 								//
 								//	2 = compact support is known and positive
 								//	1 = compact support is not known
 								//	0 = compact support is known and negative, or the account is nil / not OpenAI
 								func openAICompactSupportTier(account *Account) int {
 									if account == nil || !account.IsOpenAI() {
 										return 0
 									}
 									supported, known := account.OpenAICompactSupportKnown()
 									switch {
 									case !known:
 										return 1
 									case supported:
 										return 2
 									default:
 										return 0
 									}
 								}
 								// isOpenAIAccountEligibleForRequest centralises the schedulable / OpenAI / model /
 								// compact-support checks used during account selection.
 								func isOpenAIAccountEligibleForRequest(account *Account, requestedModel string, requireCompact bool) bool {
 									if account == nil || !account.IsSchedulable() || !account.IsOpenAI() {
 										return false
 									}
 									if requestedModel != "" && !account.IsModelSupported(requestedModel) {
 										return false
 									}
 									if requireCompact && openAICompactSupportTier(account) == 0 {
 										return false
 									}
 									return true
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+								}
-												fix(调度): 完善粘性会话清理与账号调度刷新

- Update/BulkUpdate 按不可调度字段触发缓存刷新
- GatewayCache 支持多前缀会话键清理
- 模型路由与混合调度优化粘性会话处理
- 补充调度与缓存相关测试覆盖

											
										
										
											2026-01-20 11:19:32 +08:00
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+								// prioritizeOpenAICompactAccounts re-orders a slice so that accounts with known
 								// compact support are tried first, followed by unknown, then explicitly unsupported.
 								// The relative order within each tier is preserved.
 								// An empty input yields nil; otherwise a newly allocated slice is returned and
 								// the input slice is left untouched.
 								func prioritizeOpenAICompactAccounts(accounts []*Account) []*Account {
 									if len(accounts) == 0 {
 										return nil
 									}
 									// Bucket accounts by tier; anything that is not tier 1 or 2 lands in bucket 0.
 									var byTier [3][]*Account
 									for _, candidate := range accounts {
 										tier := openAICompactSupportTier(candidate)
 										if tier != 1 && tier != 2 {
 											tier = 0
 										}
 										byTier[tier] = append(byTier[tier], candidate)
 									}
 									// Concatenate from the highest tier down so supported accounts come first.
 									ordered := make([]*Account, 0, len(accounts))
 									for tier := len(byTier) - 1; tier >= 0; tier-- {
 										ordered = append(ordered, byTier[tier]...)
 									}
 									return ordered
 								}
 								// resolveOpenAIAccountUpstreamModelForRequest returns the upstream model name for
 								// a request on the given account. The model is first resolved with
 								// resolveOpenAIForwardModel; when requireCompact is set and that result is
 								// non-empty, it is additionally passed through resolveOpenAICompactForwardModel.
 								// An empty string is returned when the first resolution yields nothing.
 								func resolveOpenAIAccountUpstreamModelForRequest(account *Account, requestedModel string, requireCompact bool) string {
 									forwardModel := resolveOpenAIForwardModel(account, requestedModel, "")
 									if forwardModel == "" || !requireCompact {
 										return forwardModel
 									}
 									return resolveOpenAICompactForwardModel(account, forwardModel)
 								}
 								func (s *OpenAIGatewayService) selectAccountForModelWithExclusions(ctx context.Context, groupID *int64, sessionHash string, requestedModel string, excludedIDs map[int64]struct{}, requireCompact bool, stickyAccountID int64) (*Account, error) {
-												fix: resolve 5 audit findings in channel/credits/scheduling

P0-1: Credits degraded response retry + fail-open
- Add isAntigravityDegradedResponse() to detect transient API failures
- Retry up to 3 times with exponential backoff (500ms/1s/2s)
- Invalidate singleflight cache between retries
- Fail-open after exhausting retries instead of 5h circuit break

P1-1: Fix channel restriction pre-check timing conflict
- Swap checkClaudeCodeRestriction before checkChannelPricingRestriction
- Ensures channel restriction is checked against final fallback groupID

P1-2: Add interval pricing validation (frontend + backend)
- Backend: ValidateIntervals() with boundary, price, overlap checks
- Frontend: validateIntervals() with Chinese error messages
- Rules: MinTokens>=0, MaxTokens>MinTokens, prices>=0, no overlap

P2: Fix cross-platform same-model pricing/mapping override
- Store cache keys using original platform instead of group platform
- Lookup across matching platforms (antigravity→anthropic→gemini)
- Prevents anthropic/gemini same-name models from overwriting each other

											
										
										
											2026-04-02 20:28:04 +08:00
+									if s.checkChannelPricingRestriction(ctx, groupID, requestedModel) {
-												feat(channel): improve cache strategy and add restriction logging

- Change channel cache TTL from 60s to 10min (reduce unnecessary DB queries)
- Actively rebuild cache after CRUD instead of lazy invalidation
- Add slog.Warn logging for channel pricing restriction blocks (4 places)

											
										
										
											2026-04-03 13:54:18 +08:00
+										slog.Warn("channel pricing restriction blocked request",
 											"group_id", derefGroupID(groupID),
 											"model", requestedModel)
-												fix: resolve 5 audit findings in channel/credits/scheduling

P0-1: Credits degraded response retry + fail-open
- Add isAntigravityDegradedResponse() to detect transient API failures
- Retry up to 3 times with exponential backoff (500ms/1s/2s)
- Invalidate singleflight cache between retries
- Fail-open after exhausting retries instead of 5h circuit break

P1-1: Fix channel restriction pre-check timing conflict
- Swap checkClaudeCodeRestriction before checkChannelPricingRestriction
- Ensures channel restriction is checked against final fallback groupID

P1-2: Add interval pricing validation (frontend + backend)
- Backend: ValidateIntervals() with boundary, price, overlap checks
- Frontend: validateIntervals() with Chinese error messages
- Rules: MinTokens>=0, MaxTokens>MinTokens, prices>=0, no overlap

P2: Fix cross-platform same-model pricing/mapping override
- Store cache keys using original platform instead of group platform
- Lookup across matching platforms (antigravity→anthropic→gemini)
- Prevents anthropic/gemini same-name models from overwriting each other

											
										
										
											2026-04-02 20:28:04 +08:00
+										return nil, fmt.Errorf("%w supporting model: %s (channel pricing restriction)", ErrNoAvailableAccounts, requestedModel)
 									}
-												fix(调度): 完善粘性会话清理与账号调度刷新

- Update/BulkUpdate 按不可调度字段触发缓存刷新
- GatewayCache 支持多前缀会话键清理
- 模型路由与混合调度优化粘性会话处理
- 补充调度与缓存相关测试覆盖

											
										
										
											2026-01-20 11:19:32 +08:00
+									// 1. 尝试粘性会话命中
 									// Try sticky session hit
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+									if account := s.tryStickySessionHit(ctx, groupID, sessionHash, requestedModel, excludedIDs, requireCompact, stickyAccountID); account != nil {
-												fix(调度): 完善粘性会话清理与账号调度刷新

- Update/BulkUpdate 按不可调度字段触发缓存刷新
- GatewayCache 支持多前缀会话键清理
- 模型路由与混合调度优化粘性会话处理
- 补充调度与缓存相关测试覆盖

											
										
										
											2026-01-20 11:19:32 +08:00
+										return account, nil
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									}
-												fix(调度): 完善粘性会话清理与账号调度刷新

- Update/BulkUpdate 按不可调度字段触发缓存刷新
- GatewayCache 支持多前缀会话键清理
- 模型路由与混合调度优化粘性会话处理
- 补充调度与缓存相关测试覆盖

											
										
										
											2026-01-20 11:19:32 +08:00
+									// 2. 获取可调度的 OpenAI 账号
 									// Get schedulable OpenAI accounts
-												feat(scheduler): 引入调度快照缓存与 outbox 回放

- 调度热路径优先读 Redis 快照，保留分组排序语义
- outbox 回放 + 全量重建纠偏，失败重试不推进水位
- 自动 Atlas 基线对齐并同步调度配置示例

											
										
										
											2026-01-12 14:19:06 +08:00
+									accounts, err := s.listSchedulableAccounts(ctx, groupID)
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									if err != nil {
 										return nil, fmt.Errorf("query accounts failed: %w", err)
 									}
-												fix(调度): 完善粘性会话清理与账号调度刷新

- Update/BulkUpdate 按不可调度字段触发缓存刷新
- GatewayCache 支持多前缀会话键清理
- 模型路由与混合调度优化粘性会话处理
- 补充调度与缓存相关测试覆盖

											
										
										
											2026-01-20 11:19:32 +08:00
+									// 3. 按优先级 + LRU 选择最佳账号
 									// Select by priority + LRU
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+									selected, compactBlocked := s.selectBestAccount(ctx, groupID, accounts, requestedModel, excludedIDs, requireCompact)
-												fix(调度): 完善粘性会话清理与账号调度刷新

- Update/BulkUpdate 按不可调度字段触发缓存刷新
- GatewayCache 支持多前缀会话键清理
- 模型路由与混合调度优化粘性会话处理
- 补充调度与缓存相关测试覆盖

											
										
										
											2026-01-20 11:19:32 +08:00
 									if selected == nil {
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+										return nil, noAvailableOpenAISelectionError(requestedModel, compactBlocked)
-												fix(调度): 完善粘性会话清理与账号调度刷新

- Update/BulkUpdate 按不可调度字段触发缓存刷新
- GatewayCache 支持多前缀会话键清理
- 模型路由与混合调度优化粘性会话处理
- 补充调度与缓存相关测试覆盖

											
										
										
											2026-01-20 11:19:32 +08:00
+									}
 									// 4. 设置粘性会话绑定
 									// Set sticky session binding
 									if sessionHash != "" {
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+										_ = s.setStickySessionAccountID(ctx, groupID, sessionHash, selected.ID, openaiStickySessionTTL)
-												fix(调度): 完善粘性会话清理与账号调度刷新

- Update/BulkUpdate 按不可调度字段触发缓存刷新
- GatewayCache 支持多前缀会话键清理
- 模型路由与混合调度优化粘性会话处理
- 补充调度与缓存相关测试覆盖

											
										
										
											2026-01-20 11:19:32 +08:00
+									}
-												fix: 优化调度快照缓存以避免 Redis 大 MGET

											
										
										
											2026-04-08 10:10:15 -07:00
+									return s.hydrateSelectedAccount(ctx, selected)
-												fix(调度): 完善粘性会话清理与账号调度刷新

- Update/BulkUpdate 按不可调度字段触发缓存刷新
- GatewayCache 支持多前缀会话键清理
- 模型路由与混合调度优化粘性会话处理
- 补充调度与缓存相关测试覆盖

											
										
										
											2026-01-20 11:19:32 +08:00
+								}
 								// tryStickySessionHit 尝试从粘性会话获取账号。
 								// 如果命中且账号可用则返回账号；如果账号不可用则清理会话并返回 nil。
 								//
 								// tryStickySessionHit attempts to get account from sticky session.
 								// Returns account if hit and usable; clears session and returns nil if account is unavailable.
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+								func (s *OpenAIGatewayService) tryStickySessionHit(ctx context.Context, groupID *int64, sessionHash, requestedModel string, excludedIDs map[int64]struct{}, requireCompact bool, stickyAccountID int64) *Account {
-												fix(调度): 完善粘性会话清理与账号调度刷新

- Update/BulkUpdate 按不可调度字段触发缓存刷新
- GatewayCache 支持多前缀会话键清理
- 模型路由与混合调度优化粘性会话处理
- 补充调度与缓存相关测试覆盖

											
										
										
											2026-01-20 11:19:32 +08:00
+									if sessionHash == "" {
 										return nil
 									}
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+									accountID := stickyAccountID
 									if accountID <= 0 {
 										var err error
 										accountID, err = s.getStickySessionAccountID(ctx, groupID, sessionHash)
 										if err != nil || accountID <= 0 {
 											return nil
 										}
-												fix(调度): 完善粘性会话清理与账号调度刷新

- Update/BulkUpdate 按不可调度字段触发缓存刷新
- GatewayCache 支持多前缀会话键清理
- 模型路由与混合调度优化粘性会话处理
- 补充调度与缓存相关测试覆盖

											
										
										
											2026-01-20 11:19:32 +08:00
+									}
 									if _, excluded := excludedIDs[accountID]; excluded {
 										return nil
 									}
 									account, err := s.getSchedulableAccount(ctx, accountID)
 									if err != nil {
 										return nil
 									}
 									// 检查账号是否需要清理粘性会话
 									// Check if sticky session should be cleared
-												feat(antigravity): comprehensive enhancements - model mapping, rate limiting, scheduling & ops

Key changes:
- Upgrade model mapping: Opus 4.5 → Opus 4.6-thinking with precise matching
- Unified rate limiting: scope-level → model-level with Redis snapshot sync
- Load-balanced scheduling by call count with smart retry mechanism
- Force cache billing support
- Model identity injection in prompts with leak prevention
- Thinking mode auto-handling (max_tokens/budget_tokens fix)
- Frontend: whitelist mode toggle, model mapping validation, status indicators
- Gemini session fallback with Redis Trie O(L) matching
- Ops: enhanced concurrency monitoring, account availability, retry logic
- Migration scripts: 049-051 for model mapping unification

											
										
										
											2026-02-07 12:31:10 +08:00
+									if shouldClearStickySession(account, requestedModel) {
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+										_ = s.deleteStickySessionAccountID(ctx, groupID, sessionHash)
-												fix(调度): 完善粘性会话清理与账号调度刷新

- Update/BulkUpdate 按不可调度字段触发缓存刷新
- GatewayCache 支持多前缀会话键清理
- 模型路由与混合调度优化粘性会话处理
- 补充调度与缓存相关测试覆盖

											
										
										
											2026-01-20 11:19:32 +08:00
+										return nil
 									}
 									// 验证账号是否可用于当前请求
 									// Verify account is usable for current request
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+									if !isOpenAIAccountEligibleForRequest(account, requestedModel, false) {
-												fix(调度): 完善粘性会话清理与账号调度刷新

- Update/BulkUpdate 按不可调度字段触发缓存刷新
- GatewayCache 支持多前缀会话键清理
- 模型路由与混合调度优化粘性会话处理
- 补充调度与缓存相关测试覆盖

											
										
										
											2026-01-20 11:19:32 +08:00
+										return nil
 									}
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+									account = s.recheckSelectedOpenAIAccountFromDB(ctx, account, requestedModel, requireCompact)
-												fix(openai): recheck runtime state from db before final account selection

											
										
										
											2026-03-23 03:50:03 +08:00
+									if account == nil {
 										_ = s.deleteStickySessionAccountID(ctx, groupID, sessionHash)
 										return nil
 									}
-												fix: resolve 5 audit findings in channel/credits/scheduling

P0-1: Credits degraded response retry + fail-open
- Add isAntigravityDegradedResponse() to detect transient API failures
- Retry up to 3 times with exponential backoff (500ms/1s/2s)
- Invalidate singleflight cache between retries
- Fail-open after exhausting retries instead of 5h circuit break

P1-1: Fix channel restriction pre-check timing conflict
- Swap checkClaudeCodeRestriction before checkChannelPricingRestriction
- Ensures channel restriction is checked against final fallback groupID

P1-2: Add interval pricing validation (frontend + backend)
- Backend: ValidateIntervals() with boundary, price, overlap checks
- Frontend: validateIntervals() with Chinese error messages
- Rules: MinTokens>=0, MaxTokens>MinTokens, prices>=0, no overlap

P2: Fix cross-platform same-model pricing/mapping override
- Store cache keys using original platform instead of group platform
- Lookup across matching platforms (antigravity→anthropic→gemini)
- Prevents anthropic/gemini same-name models from overwriting each other

											
										
										
											2026-04-02 20:28:04 +08:00
+									if groupID != nil && s.needsUpstreamChannelRestrictionCheck(ctx, groupID) &&
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+										s.isUpstreamModelRestrictedByChannel(ctx, *groupID, account, requestedModel, requireCompact) {
-												fix: resolve 5 audit findings in channel/credits/scheduling

P0-1: Credits degraded response retry + fail-open
- Add isAntigravityDegradedResponse() to detect transient API failures
- Retry up to 3 times with exponential backoff (500ms/1s/2s)
- Invalidate singleflight cache between retries
- Fail-open after exhausting retries instead of 5h circuit break

P1-1: Fix channel restriction pre-check timing conflict
- Swap checkClaudeCodeRestriction before checkChannelPricingRestriction
- Ensures channel restriction is checked against final fallback groupID

P1-2: Add interval pricing validation (frontend + backend)
- Backend: ValidateIntervals() with boundary, price, overlap checks
- Frontend: validateIntervals() with Chinese error messages
- Rules: MinTokens>=0, MaxTokens>MinTokens, prices>=0, no overlap

P2: Fix cross-platform same-model pricing/mapping override
- Store cache keys using original platform instead of group platform
- Lookup across matching platforms (antigravity→anthropic→gemini)
- Prevents anthropic/gemini same-name models from overwriting each other

											
										
										
											2026-04-02 20:28:04 +08:00
+										_ = s.deleteStickySessionAccountID(ctx, groupID, sessionHash)
 										return nil
 									}
-												fix(调度): 完善粘性会话清理与账号调度刷新

- Update/BulkUpdate 按不可调度字段触发缓存刷新
- GatewayCache 支持多前缀会话键清理
- 模型路由与混合调度优化粘性会话处理
- 补充调度与缓存相关测试覆盖

											
										
										
											2026-01-20 11:19:32 +08:00
 									// 刷新会话 TTL 并返回账号
 									// Refresh session TTL and return account
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+									_ = s.refreshStickySessionTTL(ctx, groupID, sessionHash, openaiStickySessionTTL)
-												fix(调度): 完善粘性会话清理与账号调度刷新

- Update/BulkUpdate 按不可调度字段触发缓存刷新
- GatewayCache 支持多前缀会话键清理
- 模型路由与混合调度优化粘性会话处理
- 补充调度与缓存相关测试覆盖

											
										
										
											2026-01-20 11:19:32 +08:00
+									return account
 								}
 								// selectBestAccount 从候选账号中选择最佳账号（优先级 + LRU）。
 								// 返回 nil 表示无可用账号。
 								//
 								// selectBestAccount selects the best account from candidates (priority + LRU).
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+								// Returns nil if no available account. The second return reports whether at
 								// least one candidate was filtered out solely because it lacks compact support
 								// (only meaningful when requireCompact=true).
 								func (s *OpenAIGatewayService) selectBestAccount(ctx context.Context, groupID *int64, accounts []Account, requestedModel string, excludedIDs map[int64]struct{}, requireCompact bool) (*Account, bool) {
-												refactor: 调整项目结构为单向依赖

											
										
										
											2025-12-26 15:40:24 +08:00
+									var selected *Account
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+									selectedCompactTier := -1
 									compactBlocked := false
-												fix: resolve 5 audit findings in channel/credits/scheduling

P0-1: Credits degraded response retry + fail-open
- Add isAntigravityDegradedResponse() to detect transient API failures
- Retry up to 3 times with exponential backoff (500ms/1s/2s)
- Invalidate singleflight cache between retries
- Fail-open after exhausting retries instead of 5h circuit break

P1-1: Fix channel restriction pre-check timing conflict
- Swap checkClaudeCodeRestriction before checkChannelPricingRestriction
- Ensures channel restriction is checked against final fallback groupID

P1-2: Add interval pricing validation (frontend + backend)
- Backend: ValidateIntervals() with boundary, price, overlap checks
- Frontend: validateIntervals() with Chinese error messages
- Rules: MinTokens>=0, MaxTokens>MinTokens, prices>=0, no overlap

P2: Fix cross-platform same-model pricing/mapping override
- Store cache keys using original platform instead of group platform
- Lookup across matching platforms (antigravity→anthropic→gemini)
- Prevents anthropic/gemini same-name models from overwriting each other

											
										
										
											2026-04-02 20:28:04 +08:00
+									needsUpstreamCheck := s.needsUpstreamChannelRestrictionCheck(ctx, groupID)
-												fix(调度): 完善粘性会话清理与账号调度刷新

- Update/BulkUpdate 按不可调度字段触发缓存刷新
- GatewayCache 支持多前缀会话键清理
- 模型路由与混合调度优化粘性会话处理
- 补充调度与缓存相关测试覆盖

											
										
										
											2026-01-20 11:19:32 +08:00
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									for i := range accounts {
 										acc := &accounts[i]
-												fix(调度): 完善粘性会话清理与账号调度刷新

- Update/BulkUpdate 按不可调度字段触发缓存刷新
- GatewayCache 支持多前缀会话键清理
- 模型路由与混合调度优化粘性会话处理
- 补充调度与缓存相关测试覆盖

											
										
										
											2026-01-20 11:19:32 +08:00
 										// 跳过被排除的账号
 										// Skip excluded accounts
-												feat: cc/codex support account retry

											
										
										
											2025-12-27 11:44:00 +08:00
+										if _, excluded := excludedIDs[acc.ID]; excluded {
 											continue
 										}
-												fix(调度): 完善粘性会话清理与账号调度刷新

- Update/BulkUpdate 按不可调度字段触发缓存刷新
- GatewayCache 支持多前缀会话键清理
- 模型路由与混合调度优化粘性会话处理
- 补充调度与缓存相关测试覆盖

											
										
										
											2026-01-20 11:19:32 +08:00
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+										fresh := s.resolveFreshSchedulableOpenAIAccount(ctx, acc, requestedModel, false)
-												fix: 限流账号自动退出调度并优化提示文案

											
										
										
											2026-03-07 20:59:17 +08:00
+										if fresh == nil {
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+											continue
 										}
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+										fresh = s.recheckSelectedOpenAIAccountFromDB(ctx, fresh, requestedModel, false)
-												fix(openai): recheck runtime state from db before final account selection

											
										
										
											2026-03-23 03:50:03 +08:00
+										if fresh == nil {
 											continue
 										}
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+										if needsUpstreamCheck && s.isUpstreamModelRestrictedByChannel(ctx, *groupID, fresh, requestedModel, requireCompact) {
-												fix: resolve 5 audit findings in channel/credits/scheduling

P0-1: Credits degraded response retry + fail-open
- Add isAntigravityDegradedResponse() to detect transient API failures
- Retry up to 3 times with exponential backoff (500ms/1s/2s)
- Invalidate singleflight cache between retries
- Fail-open after exhausting retries instead of 5h circuit break

P1-1: Fix channel restriction pre-check timing conflict
- Swap checkClaudeCodeRestriction before checkChannelPricingRestriction
- Ensures channel restriction is checked against final fallback groupID

P1-2: Add interval pricing validation (frontend + backend)
- Backend: ValidateIntervals() with boundary, price, overlap checks
- Frontend: validateIntervals() with Chinese error messages
- Rules: MinTokens>=0, MaxTokens>MinTokens, prices>=0, no overlap

P2: Fix cross-platform same-model pricing/mapping override
- Store cache keys using original platform instead of group platform
- Lookup across matching platforms (antigravity→anthropic→gemini)
- Prevents anthropic/gemini same-name models from overwriting each other

											
										
										
											2026-04-02 20:28:04 +08:00
+											continue
 										}
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+										compactTier := 0
 										if requireCompact {
 											compactTier = openAICompactSupportTier(fresh)
 											if compactTier == 0 {
 												compactBlocked = true
 												continue
 											}
 										}
-												fix(调度): 完善粘性会话清理与账号调度刷新

- Update/BulkUpdate 按不可调度字段触发缓存刷新
- GatewayCache 支持多前缀会话键清理
- 模型路由与混合调度优化粘性会话处理
- 补充调度与缓存相关测试覆盖

											
										
										
											2026-01-20 11:19:32 +08:00
 										// 选择优先级最高且最久未使用的账号
 										// Select highest priority and least recently used
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+										if selected == nil {
-												fix: 限流账号自动退出调度并优化提示文案

											
										
										
											2026-03-07 20:59:17 +08:00
+											selected = fresh
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+											selectedCompactTier = compactTier
 											continue
 										}
 										// compact 模式下高 tier 优先；同 tier 内才比较 priority/LRU。
 										if requireCompact && compactTier != selectedCompactTier {
 											if compactTier > selectedCompactTier {
 												selected = fresh
 												selectedCompactTier = compactTier
 											}
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+											continue
 										}
-												fix(调度): 完善粘性会话清理与账号调度刷新

- Update/BulkUpdate 按不可调度字段触发缓存刷新
- GatewayCache 支持多前缀会话键清理
- 模型路由与混合调度优化粘性会话处理
- 补充调度与缓存相关测试覆盖

											
										
										
											2026-01-20 11:19:32 +08:00
-												fix: 限流账号自动退出调度并优化提示文案

											
										
										
											2026-03-07 20:59:17 +08:00
+										if s.isBetterAccount(fresh, selected) {
 											selected = fresh
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+											selectedCompactTier = compactTier
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+										}
 									}
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+									return selected, compactBlocked
-												fix(调度): 完善粘性会话清理与账号调度刷新

- Update/BulkUpdate 按不可调度字段触发缓存刷新
- GatewayCache 支持多前缀会话键清理
- 模型路由与混合调度优化粘性会话处理
- 补充调度与缓存相关测试覆盖

											
										
										
											2026-01-20 11:19:32 +08:00
+								}
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
-												fix(调度): 完善粘性会话清理与账号调度刷新

- Update/BulkUpdate 按不可调度字段触发缓存刷新
- GatewayCache 支持多前缀会话键清理
- 模型路由与混合调度优化粘性会话处理
- 补充调度与缓存相关测试覆盖

											
										
										
											2026-01-20 11:19:32 +08:00
+								// isBetterAccount 判断 candidate 是否比 current 更优。
 								// 规则：优先级更高（数值更小）优先；同优先级时，未使用过的优先，其次是最久未使用的。
 								//
 								// isBetterAccount checks if candidate is better than current.
 								// Rules: higher priority (lower value) wins; same priority: never used > least recently used.
 								func (s *OpenAIGatewayService) isBetterAccount(candidate, current *Account) bool {
 									// 优先级更高（数值更小）
 									// Higher priority (lower value)
 									if candidate.Priority < current.Priority {
 										return true
 									}
 									if candidate.Priority > current.Priority {
 										return false
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									}
-												fix(调度): 完善粘性会话清理与账号调度刷新

- Update/BulkUpdate 按不可调度字段触发缓存刷新
- GatewayCache 支持多前缀会话键清理
- 模型路由与混合调度优化粘性会话处理
- 补充调度与缓存相关测试覆盖

											
										
										
											2026-01-20 11:19:32 +08:00
+									// 同优先级，比较最后使用时间
 									// Same priority, compare last used time
 									switch {
 									case candidate.LastUsedAt == nil && current.LastUsedAt != nil:
 										// candidate 从未使用，优先
 										return true
 									case candidate.LastUsedAt != nil && current.LastUsedAt == nil:
 										// current 从未使用，保持
 										return false
 									case candidate.LastUsedAt == nil && current.LastUsedAt == nil:
 										// 都未使用，保持
 										return false
 									default:
 										// 都使用过，选择最久未使用的
 										return candidate.LastUsedAt.Before(*current.LastUsedAt)
 									}
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+								}
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+								// SelectAccountWithLoadAwareness selects an account with load-awareness and wait plan.
 								func (s *OpenAIGatewayService) SelectAccountWithLoadAwareness(ctx context.Context, groupID *int64, sessionHash string, requestedModel string, excludedIDs map[int64]struct{}) (*AccountSelectionResult, error) {
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+									return s.selectAccountWithLoadAwareness(ctx, groupID, sessionHash, requestedModel, excludedIDs, false)
 								}
 								func (s *OpenAIGatewayService) selectAccountWithLoadAwareness(ctx context.Context, groupID *int64, sessionHash string, requestedModel string, excludedIDs map[int64]struct{}, requireCompact bool) (*AccountSelectionResult, error) {
-												fix: resolve 5 audit findings in channel/credits/scheduling

P0-1: Credits degraded response retry + fail-open
- Add isAntigravityDegradedResponse() to detect transient API failures
- Retry up to 3 times with exponential backoff (500ms/1s/2s)
- Invalidate singleflight cache between retries
- Fail-open after exhausting retries instead of 5h circuit break

P1-1: Fix channel restriction pre-check timing conflict
- Swap checkClaudeCodeRestriction before checkChannelPricingRestriction
- Ensures channel restriction is checked against final fallback groupID

P1-2: Add interval pricing validation (frontend + backend)
- Backend: ValidateIntervals() with boundary, price, overlap checks
- Frontend: validateIntervals() with Chinese error messages
- Rules: MinTokens>=0, MaxTokens>MinTokens, prices>=0, no overlap

P2: Fix cross-platform same-model pricing/mapping override
- Store cache keys using original platform instead of group platform
- Lookup across matching platforms (antigravity→anthropic→gemini)
- Prevents anthropic/gemini same-name models from overwriting each other

											
										
										
											2026-04-02 20:28:04 +08:00
+									if s.checkChannelPricingRestriction(ctx, groupID, requestedModel) {
-												feat(channel): improve cache strategy and add restriction logging

- Change channel cache TTL from 60s to 10min (reduce unnecessary DB queries)
- Actively rebuild cache after CRUD instead of lazy invalidation
- Add slog.Warn logging for channel pricing restriction blocks (4 places)

											
										
										
											2026-04-03 13:54:18 +08:00
+										slog.Warn("channel pricing restriction blocked request",
 											"group_id", derefGroupID(groupID),
 											"model", requestedModel)
-												fix: resolve 5 audit findings in channel/credits/scheduling

P0-1: Credits degraded response retry + fail-open
- Add isAntigravityDegradedResponse() to detect transient API failures
- Retry up to 3 times with exponential backoff (500ms/1s/2s)
- Invalidate singleflight cache between retries
- Fail-open after exhausting retries instead of 5h circuit break

P1-1: Fix channel restriction pre-check timing conflict
- Swap checkClaudeCodeRestriction before checkChannelPricingRestriction
- Ensures channel restriction is checked against final fallback groupID

P1-2: Add interval pricing validation (frontend + backend)
- Backend: ValidateIntervals() with boundary, price, overlap checks
- Frontend: validateIntervals() with Chinese error messages
- Rules: MinTokens>=0, MaxTokens>MinTokens, prices>=0, no overlap

P2: Fix cross-platform same-model pricing/mapping override
- Store cache keys using original platform instead of group platform
- Lookup across matching platforms (antigravity→anthropic→gemini)
- Prevents anthropic/gemini same-name models from overwriting each other

											
										
										
											2026-04-02 20:28:04 +08:00
+										return nil, fmt.Errorf("%w supporting model: %s (channel pricing restriction)", ErrNoAvailableAccounts, requestedModel)
 									}
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+									cfg := s.schedulingConfig()
-												fix: resolve 5 audit findings in channel/credits/scheduling

P0-1: Credits degraded response retry + fail-open
- Add isAntigravityDegradedResponse() to detect transient API failures
- Retry up to 3 times with exponential backoff (500ms/1s/2s)
- Invalidate singleflight cache between retries
- Fail-open after exhausting retries instead of 5h circuit break

P1-1: Fix channel restriction pre-check timing conflict
- Swap checkClaudeCodeRestriction before checkChannelPricingRestriction
- Ensures channel restriction is checked against final fallback groupID

P1-2: Add interval pricing validation (frontend + backend)
- Backend: ValidateIntervals() with boundary, price, overlap checks
- Frontend: validateIntervals() with Chinese error messages
- Rules: MinTokens>=0, MaxTokens>MinTokens, prices>=0, no overlap

P2: Fix cross-platform same-model pricing/mapping override
- Store cache keys using original platform instead of group platform
- Lookup across matching platforms (antigravity→anthropic→gemini)
- Prevents anthropic/gemini same-name models from overwriting each other

											
										
										
											2026-04-02 20:28:04 +08:00
+									needsUpstreamCheck := s.needsUpstreamChannelRestrictionCheck(ctx, groupID)
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+									var stickyAccountID int64
 									if sessionHash != "" && s.cache != nil {
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+										if accountID, err := s.getStickySessionAccountID(ctx, groupID, sessionHash); err == nil {
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+											stickyAccountID = accountID
 										}
 									}
 									if s.concurrencyService == nil || !cfg.LoadBatchEnabled {
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+										account, err := s.selectAccountForModelWithExclusions(ctx, groupID, sessionHash, requestedModel, excludedIDs, requireCompact, stickyAccountID)
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+										if err != nil {
 											return nil, err
 										}
 										result, err := s.tryAcquireAccountSlot(ctx, account.ID, account.Concurrency)
 										if err == nil && result.Acquired {
-												fix: 优化调度快照缓存以避免 Redis 大 MGET

											
										
										
											2026-04-08 10:10:15 -07:00
+											return s.newSelectionResult(ctx, account, true, result.ReleaseFunc, nil)
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+										}
 										if stickyAccountID > 0 && stickyAccountID == account.ID && s.concurrencyService != nil {
 											waitingCount, _ := s.concurrencyService.GetAccountWaitingCount(ctx, account.ID)
 											if waitingCount < cfg.StickySessionMaxWaiting {
-												fix: 优化调度快照缓存以避免 Redis 大 MGET

											
										
										
											2026-04-08 10:10:15 -07:00
+												return s.newSelectionResult(ctx, account, false, nil, &AccountWaitPlan{
 													AccountID:      account.ID,
 													MaxConcurrency: account.Concurrency,
 													Timeout:        cfg.StickySessionWaitTimeout,
 													MaxWaiting:     cfg.StickySessionMaxWaiting,
 												})
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+											}
 										}
-												fix: 优化调度快照缓存以避免 Redis 大 MGET

											
										
										
											2026-04-08 10:10:15 -07:00
+										return s.newSelectionResult(ctx, account, false, nil, &AccountWaitPlan{
 											AccountID:      account.ID,
 											MaxConcurrency: account.Concurrency,
 											Timeout:        cfg.FallbackWaitTimeout,
 											MaxWaiting:     cfg.FallbackMaxWaiting,
 										})
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+									}
 									accounts, err := s.listSchedulableAccounts(ctx, groupID)
 									if err != nil {
 										return nil, err
 									}
 									if len(accounts) == 0 {
-												feat(ops): add ignore insufficient balance errors toggle and extract error constants

- Add 5th error filter switch IgnoreInsufficientBalanceErrors to suppress
  upstream insufficient balance / insufficient_quota errors from ops log
- Extract hardcoded error strings into package-level constants for
  shouldSkipOpsErrorLog, normalizeOpsErrorType, classifyOpsPhase, and
  classifyOpsIsBusinessLimited
- Define ErrNoAvailableAccounts sentinel error and replace all
  errors.New("no available accounts") call sites
- Update tests to use require.ErrorIs with the sentinel error

											
										
										
											2026-03-15 17:25:35 +08:00
+										return nil, ErrNoAvailableAccounts
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+									}
 									isExcluded := func(accountID int64) bool {
 										if excludedIDs == nil {
 											return false
 										}
 										_, excluded := excludedIDs[accountID]
 										return excluded
 									}
 									// ============ Layer 1: Sticky session ============
 									if sessionHash != "" {
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+										accountID := stickyAccountID
 										if accountID > 0 && !isExcluded(accountID) {
-												feat(scheduler): 引入调度快照缓存与 outbox 回放

- 调度热路径优先读 Redis 快照，保留分组排序语义
- outbox 回放 + 全量重建纠偏，失败重试不推进水位
- 自动 Atlas 基线对齐并同步调度配置示例

											
										
										
											2026-01-12 14:19:06 +08:00
+											account, err := s.getSchedulableAccount(ctx, accountID)
-												fix(调度): 完善粘性会话清理与账号调度刷新

- Update/BulkUpdate 按不可调度字段触发缓存刷新
- GatewayCache 支持多前缀会话键清理
- 模型路由与混合调度优化粘性会话处理
- 补充调度与缓存相关测试覆盖

											
										
										
											2026-01-20 11:19:32 +08:00
+											if err == nil {
-												feat(antigravity): comprehensive enhancements - model mapping, rate limiting, scheduling & ops

Key changes:
- Upgrade model mapping: Opus 4.5 → Opus 4.6-thinking with precise matching
- Unified rate limiting: scope-level → model-level with Redis snapshot sync
- Load-balanced scheduling by call count with smart retry mechanism
- Force cache billing support
- Model identity injection in prompts with leak prevention
- Thinking mode auto-handling (max_tokens/budget_tokens fix)
- Frontend: whitelist mode toggle, model mapping validation, status indicators
- Gemini session fallback with Redis Trie O(L) matching
- Ops: enhanced concurrency monitoring, account availability, retry logic
- Migration scripts: 049-051 for model mapping unification

											
										
										
											2026-02-07 12:31:10 +08:00
+												clearSticky := shouldClearStickySession(account, requestedModel)
-												fix(调度): 完善粘性会话清理与账号调度刷新

- Update/BulkUpdate 按不可调度字段触发缓存刷新
- GatewayCache 支持多前缀会话键清理
- 模型路由与混合调度优化粘性会话处理
- 补充调度与缓存相关测试覆盖

											
										
										
											2026-01-20 11:19:32 +08:00
+												if clearSticky {
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+													_ = s.deleteStickySessionAccountID(ctx, groupID, sessionHash)
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+												}
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+												if !clearSticky && isOpenAIAccountEligibleForRequest(account, requestedModel, false) {
 													account = s.recheckSelectedOpenAIAccountFromDB(ctx, account, requestedModel, requireCompact)
-												fix(openai): recheck runtime state from db before final account selection

											
										
										
											2026-03-23 03:50:03 +08:00
+													if account == nil {
 														_ = s.deleteStickySessionAccountID(ctx, groupID, sessionHash)
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+													} else if needsUpstreamCheck && s.isUpstreamModelRestrictedByChannel(ctx, *groupID, account, requestedModel, requireCompact) {
-												fix: resolve 5 audit findings in channel/credits/scheduling

P0-1: Credits degraded response retry + fail-open
- Add isAntigravityDegradedResponse() to detect transient API failures
- Retry up to 3 times with exponential backoff (500ms/1s/2s)
- Invalidate singleflight cache between retries
- Fail-open after exhausting retries instead of 5h circuit break

P1-1: Fix channel restriction pre-check timing conflict
- Swap checkClaudeCodeRestriction before checkChannelPricingRestriction
- Ensures channel restriction is checked against final fallback groupID

P1-2: Add interval pricing validation (frontend + backend)
- Backend: ValidateIntervals() with boundary, price, overlap checks
- Frontend: validateIntervals() with Chinese error messages
- Rules: MinTokens>=0, MaxTokens>MinTokens, prices>=0, no overlap

P2: Fix cross-platform same-model pricing/mapping override
- Store cache keys using original platform instead of group platform
- Lookup across matching platforms (antigravity→anthropic→gemini)
- Prevents anthropic/gemini same-name models from overwriting each other

											
										
										
											2026-04-02 20:28:04 +08:00
+														_ = s.deleteStickySessionAccountID(ctx, groupID, sessionHash)
-												fix(openai): recheck runtime state from db before final account selection

											
										
										
											2026-03-23 03:50:03 +08:00
+													} else {
 														result, err := s.tryAcquireAccountSlot(ctx, accountID, account.Concurrency)
 														if err == nil && result.Acquired {
 															_ = s.refreshStickySessionTTL(ctx, groupID, sessionHash, openaiStickySessionTTL)
-												fix: 优化调度快照缓存以避免 Redis 大 MGET

											
										
										
											2026-04-08 10:10:15 -07:00
+															return s.newSelectionResult(ctx, account, true, result.ReleaseFunc, nil)
-												fix(openai): recheck runtime state from db before final account selection

											
										
										
											2026-03-23 03:50:03 +08:00
+														}
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
-												fix(openai): recheck runtime state from db before final account selection

											
										
										
											2026-03-23 03:50:03 +08:00
+														waitingCount, _ := s.concurrencyService.GetAccountWaitingCount(ctx, accountID)
 														if waitingCount < cfg.StickySessionMaxWaiting {
-												fix: 优化调度快照缓存以避免 Redis 大 MGET

											
										
										
											2026-04-08 10:10:15 -07:00
+															return s.newSelectionResult(ctx, account, false, nil, &AccountWaitPlan{
 																AccountID:      accountID,
 																MaxConcurrency: account.Concurrency,
 																Timeout:        cfg.StickySessionWaitTimeout,
 																MaxWaiting:     cfg.StickySessionMaxWaiting,
 															})
-												fix(openai): recheck runtime state from db before final account selection

											
										
										
											2026-03-23 03:50:03 +08:00
+														}
-												fix(调度): 完善粘性会话清理与账号调度刷新

- Update/BulkUpdate 按不可调度字段触发缓存刷新
- GatewayCache 支持多前缀会话键清理
- 模型路由与混合调度优化粘性会话处理
- 补充调度与缓存相关测试覆盖

											
										
										
											2026-01-20 11:19:32 +08:00
+													}
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+												}
 											}
 										}
 									}
 									// ============ Layer 2: Load-aware selection ============
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+									baseCandidateCount := 0
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+									candidates := make([]*Account, 0, len(accounts))
 									for i := range accounts {
 										acc := &accounts[i]
 										if isExcluded(acc.ID) {
 											continue
 										}
-												fix(网关): 修复账号选择中的调度器快照延迟问题

## 问题描述
调度器快照更新存在0.5-1秒的延迟（Outbox轮询间隔），导致在账号被限流或过载后的短时间窗口内，
可能仍会被选中，造成请求失败。

## 根本原因
账号选择逻辑依赖调度器快照（listSchedulableAccounts），但快照更新有延迟：
- Outbox轮询: 每1秒检查一次变更事件
- 全量重建: 每300秒重建一次
- 时间窗口: 账号状态变更后0.5-1秒内，快照可能未更新

## 解决方案
在账号选择循环中添加IsSchedulable()实时检查，作为第二道防线：
1. 第一道防线: 调度器快照过滤（可能有延迟）
2. 第二道防线: IsSchedulable()实时检查（本次修复）

IsSchedulable()会检查：
- RateLimitResetAt: 限流重置时间
- OverloadUntil: 过载持续时间
- TempUnschedulableUntil: 临时不可调度时间
- Status: 账号状态
- Schedulable: 可调度标志

## 修改范围
### OpenAI Gateway Service
- SelectAccountForModelWithExclusions: 添加IsSchedulable()检查
- SelectAccountWithLoadAwareness: 添加IsSchedulable()检查

### Gateway Service (Claude/Gemini/Antigravity)
- 负载感知选择候选账号筛选: 添加IsSchedulable()检查
- selectAccountForModelWithPlatform: 添加IsSchedulable()检查
- selectAccountWithMixedScheduling: 添加IsSchedulable()检查

### 测试用例
- OpenAI: 添加2个测试用例验证限流账号过滤
- Gateway: 添加2个测试用例验证限流和过载账号过滤

### 其他修复
- ops_repo_preagg.go: 修复platform为NULL时的聚合问题

## 测试结果
所有单元测试通过 ✅

											
										
										
											2026-01-13 22:49:26 -08:00
+										// Scheduler snapshots can be temporarily stale (bucket rebuild is throttled);
 										// re-check schedulability here so recently rate-limited/overloaded accounts
 										// are not selected again before the bucket is rebuilt.
 										if !acc.IsSchedulable() {
 											continue
 										}
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+										if requestedModel != "" && !acc.IsModelSupported(requestedModel) {
 											continue
 										}
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+										if needsUpstreamCheck && s.isUpstreamModelRestrictedByChannel(ctx, *groupID, acc, requestedModel, requireCompact) {
-												fix: resolve 5 audit findings in channel/credits/scheduling

P0-1: Credits degraded response retry + fail-open
- Add isAntigravityDegradedResponse() to detect transient API failures
- Retry up to 3 times with exponential backoff (500ms/1s/2s)
- Invalidate singleflight cache between retries
- Fail-open after exhausting retries instead of 5h circuit break

P1-1: Fix channel restriction pre-check timing conflict
- Swap checkClaudeCodeRestriction before checkChannelPricingRestriction
- Ensures channel restriction is checked against final fallback groupID

P1-2: Add interval pricing validation (frontend + backend)
- Backend: ValidateIntervals() with boundary, price, overlap checks
- Frontend: validateIntervals() with Chinese error messages
- Rules: MinTokens>=0, MaxTokens>MinTokens, prices>=0, no overlap

P2: Fix cross-platform same-model pricing/mapping override
- Store cache keys using original platform instead of group platform
- Lookup across matching platforms (antigravity→anthropic→gemini)
- Prevents anthropic/gemini same-name models from overwriting each other

											
										
										
											2026-04-02 20:28:04 +08:00
+											continue
 										}
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+										baseCandidateCount++
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+										candidates = append(candidates, acc)
 									}
 									if len(candidates) == 0 {
-												feat(ops): add ignore insufficient balance errors toggle and extract error constants

- Add 5th error filter switch IgnoreInsufficientBalanceErrors to suppress
  upstream insufficient balance / insufficient_quota errors from ops log
- Extract hardcoded error strings into package-level constants for
  shouldSkipOpsErrorLog, normalizeOpsErrorType, classifyOpsPhase, and
  classifyOpsIsBusinessLimited
- Define ErrNoAvailableAccounts sentinel error and replace all
  errors.New("no available accounts") call sites
- Update tests to use require.ErrorIs with the sentinel error

											
										
										
											2026-03-15 17:25:35 +08:00
+										return nil, ErrNoAvailableAccounts
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+									}
 									accountLoads := make([]AccountWithConcurrency, 0, len(candidates))
 									for _, acc := range candidates {
 										accountLoads = append(accountLoads, AccountWithConcurrency{
 											ID:             acc.ID,
-												feat: add independent load_factor field for scheduling load calculation

											
										
										
											2026-03-06 05:07:10 +08:00
+											MaxConcurrency: acc.EffectiveLoadFactor(),
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+										})
 									}
 									loadMap, err := s.concurrencyService.GetAccountsLoadBatch(ctx, accountLoads)
 									if err != nil {
 										ordered := append([]*Account(nil), candidates...)
 										sortAccountsByPriorityAndLastUsed(ordered, false)
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+										if requireCompact {
 											ordered = prioritizeOpenAICompactAccounts(ordered)
 										}
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+										for _, acc := range ordered {
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+											fresh := s.resolveFreshSchedulableOpenAIAccount(ctx, acc, requestedModel, false)
-												fix: 限流账号自动退出调度并优化提示文案

											
										
										
											2026-03-07 20:59:17 +08:00
+											if fresh == nil {
 												continue
 											}
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+											fresh = s.recheckSelectedOpenAIAccountFromDB(ctx, fresh, requestedModel, requireCompact)
 											if fresh == nil {
 												continue
 											}
 											if needsUpstreamCheck && s.isUpstreamModelRestrictedByChannel(ctx, *groupID, fresh, requestedModel, requireCompact) {
-												fix: resolve 5 audit findings in channel/credits/scheduling

P0-1: Credits degraded response retry + fail-open
- Add isAntigravityDegradedResponse() to detect transient API failures
- Retry up to 3 times with exponential backoff (500ms/1s/2s)
- Invalidate singleflight cache between retries
- Fail-open after exhausting retries instead of 5h circuit break

P1-1: Fix channel restriction pre-check timing conflict
- Swap checkClaudeCodeRestriction before checkChannelPricingRestriction
- Ensures channel restriction is checked against final fallback groupID

P1-2: Add interval pricing validation (frontend + backend)
- Backend: ValidateIntervals() with boundary, price, overlap checks
- Frontend: validateIntervals() with Chinese error messages
- Rules: MinTokens>=0, MaxTokens>MinTokens, prices>=0, no overlap

P2: Fix cross-platform same-model pricing/mapping override
- Store cache keys using original platform instead of group platform
- Lookup across matching platforms (antigravity→anthropic→gemini)
- Prevents anthropic/gemini same-name models from overwriting each other

											
										
										
											2026-04-02 20:28:04 +08:00
+												continue
 											}
-												fix: 限流账号自动退出调度并优化提示文案

											
										
										
											2026-03-07 20:59:17 +08:00
+											result, err := s.tryAcquireAccountSlot(ctx, fresh.ID, fresh.Concurrency)
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+											if err == nil && result.Acquired {
 												if sessionHash != "" {
-												fix: 限流账号自动退出调度并优化提示文案

											
										
										
											2026-03-07 20:59:17 +08:00
+													_ = s.setStickySessionAccountID(ctx, groupID, sessionHash, fresh.ID, openaiStickySessionTTL)
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+												}
-												fix: 优化调度快照缓存以避免 Redis 大 MGET

											
										
										
											2026-04-08 10:10:15 -07:00
+												return s.newSelectionResult(ctx, fresh, true, result.ReleaseFunc, nil)
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+											}
 										}
 									} else {
 										var available []accountWithLoad
 										for _, acc := range candidates {
 											loadInfo := loadMap[acc.ID]
 											if loadInfo == nil {
 												loadInfo = &AccountLoadInfo{AccountID: acc.ID}
 											}
 											if loadInfo.LoadRate < 100 {
 												available = append(available, accountWithLoad{
 													account:  acc,
 													loadInfo: loadInfo,
 												})
 											}
 										}
 										if len(available) > 0 {
 											sort.SliceStable(available, func(i, j int) bool {
 												a, b := available[i], available[j]
 												if a.account.Priority != b.account.Priority {
 													return a.account.Priority < b.account.Priority
 												}
 												if a.loadInfo.LoadRate != b.loadInfo.LoadRate {
 													return a.loadInfo.LoadRate < b.loadInfo.LoadRate
 												}
 												switch {
 												case a.account.LastUsedAt == nil && b.account.LastUsedAt != nil:
 													return true
 												case a.account.LastUsedAt != nil && b.account.LastUsedAt == nil:
 													return false
 												case a.account.LastUsedAt == nil && b.account.LastUsedAt == nil:
 													return false
 												default:
 													return a.account.LastUsedAt.Before(*b.account.LastUsedAt)
 												}
 											})
-												feat: shuffle accounts within same sort group to prevent thundering herd

Add post-sort shuffle for accounts with identical (priority, loadRate,
lastUsedAt) to break deterministic ordering when concurrent requests
read the same scheduler snapshot. Applies to both Antigravity and
OpenAI scheduling paths, plus the sortAccountsByPriorityAndLastUsed
helper.

Keeps upstream CallCount/ModelLoadInfo scheduling intact; shuffle is
additive and only randomises within equivalent-rank groups.

											
										
										
											2026-02-09 07:33:17 +08:00
+											shuffleWithinSortGroups(available)
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+											selectionOrder := make([]accountWithLoad, 0, len(available))
 											if requireCompact {
 												appendTier := func(out []accountWithLoad, tier int) []accountWithLoad {
 													for _, item := range available {
 														if openAICompactSupportTier(item.account) == tier {
 															out = append(out, item)
 														}
 													}
 													return out
 												}
 												selectionOrder = appendTier(selectionOrder, 2)
 												selectionOrder = appendTier(selectionOrder, 1)
 												// tier 0 候选作为兜底追加：DB recheck 时若发现 cache tier 0 实际
 												// 已升级为 1/2（探测刚跑完，cache 尚未刷新），仍可正常命中。
 												selectionOrder = appendTier(selectionOrder, 0)
 											} else {
 												selectionOrder = append(selectionOrder, available...)
 											}
 											for _, item := range selectionOrder {
 												fresh := s.resolveFreshSchedulableOpenAIAccount(ctx, item.account, requestedModel, false)
 												if fresh == nil {
 													continue
 												}
 												fresh = s.recheckSelectedOpenAIAccountFromDB(ctx, fresh, requestedModel, requireCompact)
-												fix: 限流账号自动退出调度并优化提示文案

											
										
										
											2026-03-07 20:59:17 +08:00
+												if fresh == nil {
 													continue
 												}
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+												if needsUpstreamCheck && s.isUpstreamModelRestrictedByChannel(ctx, *groupID, fresh, requestedModel, requireCompact) {
-												fix: resolve 5 audit findings in channel/credits/scheduling

P0-1: Credits degraded response retry + fail-open
- Add isAntigravityDegradedResponse() to detect transient API failures
- Retry up to 3 times with exponential backoff (500ms/1s/2s)
- Invalidate singleflight cache between retries
- Fail-open after exhausting retries instead of 5h circuit break

P1-1: Fix channel restriction pre-check timing conflict
- Swap checkClaudeCodeRestriction before checkChannelPricingRestriction
- Ensures channel restriction is checked against final fallback groupID

P1-2: Add interval pricing validation (frontend + backend)
- Backend: ValidateIntervals() with boundary, price, overlap checks
- Frontend: validateIntervals() with Chinese error messages
- Rules: MinTokens>=0, MaxTokens>MinTokens, prices>=0, no overlap

P2: Fix cross-platform same-model pricing/mapping override
- Store cache keys using original platform instead of group platform
- Lookup across matching platforms (antigravity→anthropic→gemini)
- Prevents anthropic/gemini same-name models from overwriting each other

											
										
										
											2026-04-02 20:28:04 +08:00
+													continue
 												}
-												fix: 限流账号自动退出调度并优化提示文案

											
										
										
											2026-03-07 20:59:17 +08:00
+												result, err := s.tryAcquireAccountSlot(ctx, fresh.ID, fresh.Concurrency)
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+												if err == nil && result.Acquired {
 													if sessionHash != "" {
-												fix: 限流账号自动退出调度并优化提示文案

											
										
										
											2026-03-07 20:59:17 +08:00
+														_ = s.setStickySessionAccountID(ctx, groupID, sessionHash, fresh.ID, openaiStickySessionTTL)
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+													}
-												fix: 优化调度快照缓存以避免 Redis 大 MGET

											
										
										
											2026-04-08 10:10:15 -07:00
+													return s.newSelectionResult(ctx, fresh, true, result.ReleaseFunc, nil)
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+												}
 											}
 										}
 									}
 									// ============ Layer 3: Fallback wait ============
 									sortAccountsByPriorityAndLastUsed(candidates, false)
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+									if requireCompact {
 										candidates = prioritizeOpenAICompactAccounts(candidates)
 									}
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+									for _, acc := range candidates {
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+										fresh := s.resolveFreshSchedulableOpenAIAccount(ctx, acc, requestedModel, false)
-												fix: 限流账号自动退出调度并优化提示文案

											
										
										
											2026-03-07 20:59:17 +08:00
+										if fresh == nil {
 											continue
 										}
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+										fresh = s.recheckSelectedOpenAIAccountFromDB(ctx, fresh, requestedModel, requireCompact)
 										if fresh == nil {
 											continue
 										}
 										if needsUpstreamCheck && s.isUpstreamModelRestrictedByChannel(ctx, *groupID, fresh, requestedModel, requireCompact) {
-												fix: resolve 5 audit findings in channel/credits/scheduling

P0-1: Credits degraded response retry + fail-open
- Add isAntigravityDegradedResponse() to detect transient API failures
- Retry up to 3 times with exponential backoff (500ms/1s/2s)
- Invalidate singleflight cache between retries
- Fail-open after exhausting retries instead of 5h circuit break

P1-1: Fix channel restriction pre-check timing conflict
- Swap checkClaudeCodeRestriction before checkChannelPricingRestriction
- Ensures channel restriction is checked against final fallback groupID

P1-2: Add interval pricing validation (frontend + backend)
- Backend: ValidateIntervals() with boundary, price, overlap checks
- Frontend: validateIntervals() with Chinese error messages
- Rules: MinTokens>=0, MaxTokens>MinTokens, prices>=0, no overlap

P2: Fix cross-platform same-model pricing/mapping override
- Store cache keys using original platform instead of group platform
- Lookup across matching platforms (antigravity→anthropic→gemini)
- Prevents anthropic/gemini same-name models from overwriting each other

											
										
										
											2026-04-02 20:28:04 +08:00
+											continue
 										}
-												fix: 优化调度快照缓存以避免 Redis 大 MGET

											
										
										
											2026-04-08 10:10:15 -07:00
+										return s.newSelectionResult(ctx, fresh, false, nil, &AccountWaitPlan{
 											AccountID:      fresh.ID,
 											MaxConcurrency: fresh.Concurrency,
 											Timeout:        cfg.FallbackWaitTimeout,
 											MaxWaiting:     cfg.FallbackMaxWaiting,
 										})
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+									}
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+									if requireCompact && baseCandidateCount > 0 {
 										return nil, ErrNoAvailableCompactAccounts
 									}
-												feat(ops): add ignore insufficient balance errors toggle and extract error constants

- Add 5th error filter switch IgnoreInsufficientBalanceErrors to suppress
  upstream insufficient balance / insufficient_quota errors from ops log
- Extract hardcoded error strings into package-level constants for
  shouldSkipOpsErrorLog, normalizeOpsErrorType, classifyOpsPhase, and
  classifyOpsIsBusinessLimited
- Define ErrNoAvailableAccounts sentinel error and replace all
  errors.New("no available accounts") call sites
- Update tests to use require.ErrorIs with the sentinel error

											
										
										
											2026-03-15 17:25:35 +08:00
+									return nil, ErrNoAvailableAccounts
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+								}
 								func (s *OpenAIGatewayService) listSchedulableAccounts(ctx context.Context, groupID *int64) ([]Account, error) {
-												feat(scheduler): 引入调度快照缓存与 outbox 回放

- 调度热路径优先读 Redis 快照，保留分组排序语义
- outbox 回放 + 全量重建纠偏，失败重试不推进水位
- 自动 Atlas 基线对齐并同步调度配置示例

											
										
										
											2026-01-12 14:19:06 +08:00
+									if s.schedulerSnapshot != nil {
 										accounts, _, err := s.schedulerSnapshot.ListSchedulableAccounts(ctx, groupID, PlatformOpenAI, false)
 										return accounts, err
 									}
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+									var accounts []Account
 									var err error
 									if s.cfg != nil && s.cfg.RunMode == config.RunModeSimple {
 										accounts, err = s.accountRepo.ListSchedulableByPlatform(ctx, PlatformOpenAI)
 									} else if groupID != nil {
 										accounts, err = s.accountRepo.ListSchedulableByGroupIDAndPlatform(ctx, *groupID, PlatformOpenAI)
 									} else {
-												fix(gateway): 分组隔离 — 禁止未分组账号被跨组调度

当 API Key 无分组时，调度仅从未分组账号池中选取。
修复 isAccountInGroup 在 groupID==nil 时的逻辑，
同时补全 scheduler_snapshot_service 和 gemini_compat_service
中的 SimpleMode 保护，确保分组隔离在所有调度路径生效。

新增 ListSchedulableUngroupedByPlatform/s 方法，
使用 Ent 的 Not(HasAccountGroups()) 谓词实现未分组账号隔离。
新增 17 个单元和端到端隔离测试，覆盖所有分支和边界条件。

											
										
										
											2026-03-03 13:10:26 +08:00
+										accounts, err = s.accountRepo.ListSchedulableUngroupedByPlatform(ctx, PlatformOpenAI)
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+									}
 									if err != nil {
 										return nil, fmt.Errorf("query accounts failed: %w", err)
 									}
 									return accounts, nil
 								}
 								// tryAcquireAccountSlot attempts to take one concurrency slot for accountID,
 								// bounded by maxConcurrency. When no concurrency service is configured it
 								// reports the slot as acquired and supplies a release function that does
 								// nothing.
 								func (s *OpenAIGatewayService) tryAcquireAccountSlot(ctx context.Context, accountID int64, maxConcurrency int) (*AcquireResult, error) {
 									if s.concurrencyService != nil {
 										return s.concurrencyService.AcquireAccountSlot(ctx, accountID, maxConcurrency)
 									}
 									// No limiter configured: hand back an always-acquired result.
 									noop := func() {}
 									return &AcquireResult{Acquired: true, ReleaseFunc: noop}, nil
 								}
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+								func (s *OpenAIGatewayService) resolveFreshSchedulableOpenAIAccount(ctx context.Context, account *Account, requestedModel string, requireCompact bool) *Account {
-												fix: 限流账号自动退出调度并优化提示文案

											
										
										
											2026-03-07 20:59:17 +08:00
+									if account == nil {
 										return nil
 									}
 									fresh := account
 									if s.schedulerSnapshot != nil {
 										current, err := s.getSchedulableAccount(ctx, account.ID)
 										if err != nil || current == nil {
 											return nil
 										}
 										fresh = current
 									}
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+									if !isOpenAIAccountEligibleForRequest(fresh, requestedModel, requireCompact) {
-												fix: 限流账号自动退出调度并优化提示文案

											
										
										
											2026-03-07 20:59:17 +08:00
+										return nil
 									}
 									return fresh
 								}
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+								func (s *OpenAIGatewayService) recheckSelectedOpenAIAccountFromDB(ctx context.Context, account *Account, requestedModel string, requireCompact bool) *Account {
-												fix(openai): recheck runtime state from db before final account selection

											
										
										
											2026-03-23 03:50:03 +08:00
+									if account == nil {
 										return nil
 									}
 									if s.schedulerSnapshot == nil || s.accountRepo == nil {
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+										if !isOpenAIAccountEligibleForRequest(account, requestedModel, requireCompact) {
 											return nil
 										}
-												fix(openai): recheck runtime state from db before final account selection

											
										
										
											2026-03-23 03:50:03 +08:00
+										return account
 									}
 									latest, err := s.accountRepo.GetByID(ctx, account.ID)
 									if err != nil || latest == nil {
 										return nil
 									}
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+									if !isOpenAIAccountEligibleForRequest(latest, requestedModel, requireCompact) {
-												fix(openai): recheck runtime state from db before final account selection

											
										
										
											2026-03-23 03:50:03 +08:00
+										return nil
 									}
 									return latest
 								}
-												feat(scheduler): 引入调度快照缓存与 outbox 回放

- 调度热路径优先读 Redis 快照，保留分组排序语义
- outbox 回放 + 全量重建纠偏，失败重试不推进水位
- 自动 Atlas 基线对齐并同步调度配置示例

											
										
										
											2026-01-12 14:19:06 +08:00
+								func (s *OpenAIGatewayService) getSchedulableAccount(ctx context.Context, accountID int64) (*Account, error) {
-												fix: 补齐旧账号的 OpenAI 限流补偿

											
										
										
											2026-03-08 00:14:15 +08:00
+									var (
 										account *Account
 										err     error
 									)
-												feat(scheduler): 引入调度快照缓存与 outbox 回放

- 调度热路径优先读 Redis 快照，保留分组排序语义
- outbox 回放 + 全量重建纠偏，失败重试不推进水位
- 自动 Atlas 基线对齐并同步调度配置示例

											
										
										
											2026-01-12 14:19:06 +08:00
+									if s.schedulerSnapshot != nil {
-												fix: 补齐旧账号的 OpenAI 限流补偿

											
										
										
											2026-03-08 00:14:15 +08:00
+										account, err = s.schedulerSnapshot.GetAccount(ctx, accountID)
 									} else {
 										account, err = s.accountRepo.GetByID(ctx, accountID)
 									}
 									if err != nil || account == nil {
 										return account, err
-												feat(scheduler): 引入调度快照缓存与 outbox 回放

- 调度热路径优先读 Redis 快照，保留分组排序语义
- outbox 回放 + 全量重建纠偏，失败重试不推进水位
- 自动 Atlas 基线对齐并同步调度配置示例

											
										
										
											2026-01-12 14:19:06 +08:00
+									}
-												fix: 补齐旧账号的 OpenAI 限流补偿

											
										
										
											2026-03-08 00:14:15 +08:00
+									return account, nil
-												feat(scheduler): 引入调度快照缓存与 outbox 回放

- 调度热路径优先读 Redis 快照，保留分组排序语义
- outbox 回放 + 全量重建纠偏，失败重试不推进水位
- 自动 Atlas 基线对齐并同步调度配置示例

											
										
										
											2026-01-12 14:19:06 +08:00
+								}
-												fix: 优化调度快照缓存以避免 Redis 大 MGET

											
										
										
											2026-04-08 10:10:15 -07:00
+								func (s *OpenAIGatewayService) hydrateSelectedAccount(ctx context.Context, account *Account) (*Account, error) {
 									// hydrateSelectedAccount re-reads the chosen account from the scheduler
 									// snapshot by ID and returns that copy in place of the caller's value.
 									// With a nil account or no snapshot configured there is nothing to
 									// reload, so the input is returned unchanged.
 									if account == nil || s.schedulerSnapshot == nil {
 										return account, nil
 									}
 									hydrated, err := s.schedulerSnapshot.GetAccount(ctx, account.ID)
 									if err != nil {
 										return nil, err
 									}
 									// A nil result without an error is reported as an error rather than
 									// handing a nil account back to the caller.
 									if hydrated == nil {
 										return nil, fmt.Errorf("selected openai account %d not found during hydration", account.ID)
 									}
 									return hydrated, nil
 								}
 								// newSelectionResult builds the AccountSelectionResult returned by account
 								// selection. The account is first passed through hydrateSelectedAccount; if
 								// that fails, the error is returned and no result is produced. The acquired
 								// flag, release callback and wait plan are stored as given.
 								func (s *OpenAIGatewayService) newSelectionResult(ctx context.Context, account *Account, acquired bool, release func(), waitPlan *AccountWaitPlan) (*AccountSelectionResult, error) {
 									selected, hydrateErr := s.hydrateSelectedAccount(ctx, account)
 									if hydrateErr != nil {
 										return nil, hydrateErr
 									}
 									result := new(AccountSelectionResult)
 									result.Account = selected
 									result.Acquired = acquired
 									result.ReleaseFunc = release
 									result.WaitPlan = waitPlan
 									return result, nil
 								}
-												feat(gateway): 实现负载感知的账号调度优化

- 新增调度配置：粘性会话排队、兜底排队、负载计算、槽位清理
- 实现账号级等待队列和批量负载查询（Redis Lua 脚本）
- 三层选择策略：粘性会话优先 → 负载感知选择 → 兜底排队
- 后台定期清理过期槽位，防止资源泄漏
- 集成到所有网关处理器（Claude/Gemini/OpenAI）

											
										
										
											2026-01-01 04:01:51 +08:00
+								func (s *OpenAIGatewayService) schedulingConfig() config.GatewaySchedulingConfig {
 									// schedulingConfig returns the gateway scheduling settings from the
 									// service configuration when one is present.
 									if s.cfg != nil {
 										return s.cfg.Gateway.Scheduling
 									}
 									// No configuration loaded: fall back to the built-in defaults below.
 									return config.GatewaySchedulingConfig{
 										StickySessionMaxWaiting:  3,
 										StickySessionWaitTimeout: 45 * time.Second,
 										FallbackWaitTimeout:      30 * time.Second,
 										FallbackMaxWaiting:       100,
 										LoadBatchEnabled:         true,
 										SlotCleanupInterval:      30 * time.Second,
 									}
 								}
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+								// GetAccessToken gets the access token for an OpenAI account
-												refactor: 调整项目结构为单向依赖

											
										
										
											2025-12-26 15:40:24 +08:00
+								func (s *OpenAIGatewayService) GetAccessToken(ctx context.Context, account *Account) (string, string, error) {
-												fix: 修复golangci-lint检查问题

- 移除OpenAIGatewayHandler中未使用的userService字段
- 将账号类型判断的if-else链改为switch语句

											
										
										
											2025-12-23 10:25:32 +08:00
+									switch account.Type {
-												refactor: 调整项目结构为单向依赖

											
										
										
											2025-12-26 15:40:24 +08:00
+									case AccountTypeOAuth:
-												feat(网关): 引入 OpenAI/Claude OAuth token 缓存

新增 OpenAI/Claude TokenProvider 与缓存键生成
扩展 OAuth 缓存失效覆盖更多平台
统一 OAuth 缓存前缀与依赖注入

											
										
										
											2026-01-15 18:27:06 +08:00
+										// 使用 TokenProvider 获取缓存的 token
 										if s.openAITokenProvider != nil {
 											accessToken, err := s.openAITokenProvider.GetAccessToken(ctx, account)
 											if err != nil {
 												return "", "", err
 											}
 											return accessToken, "oauth", nil
 										}
 										// 降级：TokenProvider 未配置时直接从账号读取
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+										accessToken := account.GetOpenAIAccessToken()
 										if accessToken == "" {
 											return "", "", errors.New("access_token not found in credentials")
 										}
 										return accessToken, "oauth", nil
-												fix(lint): 修复所有 Go 命名规范问题

- 全局替换 ApiKey → APIKey（类型、字段、方法、变量）
- 修复所有 initialism 命名（API, SMTP, HTML, URL 等）
- 添加所有缺失的包注释
- 修复导出符号的注释格式

主要修改：
- ApiKey → APIKey（所有出现的地方）
- ApiKeyID → APIKeyID
- ApiKeyIDs → APIKeyIDs
- TestSmtpConnection → TestSMTPConnection
- HtmlURL → HTMLURL
- 添加 20+ 个包注释
- 修复 10+ 个导出符号注释格式

验证结果：
- ✓ golangci-lint: 0 issues
- ✓ 单元测试: 通过
- ✓ 集成测试: 通过

											
										
										
											2026-01-04 19:27:53 +08:00
+									case AccountTypeAPIKey:
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+										apiKey := account.GetOpenAIApiKey()
 										if apiKey == "" {
 											return "", "", errors.New("api_key not found in credentials")
 										}
 										return apiKey, "apikey", nil
-												fix: 修复golangci-lint检查问题

- 移除OpenAIGatewayHandler中未使用的userService字段
- 将账号类型判断的if-else链改为switch语句

											
										
										
											2025-12-23 10:25:32 +08:00
+									default:
 										return "", "", fmt.Errorf("unsupported account type: %s", account.Type)
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									}
 								}
-												feat: cc/codex support account retry

											
										
										
											2025-12-27 11:44:00 +08:00
+								func (s *OpenAIGatewayService) shouldFailoverUpstreamError(statusCode int) bool {
 									switch statusCode {
-												feat: 修复 OpenAI 402 报错自动切换问题

											
										
										
											2025-12-31 11:46:53 +08:00
+									case 401, 402, 403, 429, 529:
-												feat: cc/codex support account retry

											
										
										
											2025-12-27 11:44:00 +08:00
+										return true
 									default:
 										return statusCode >= 500
 									}
 								}
-												fix: OpenAI临时性400错误支持池模式同账号重试 & HelpTooltip层级修复

1. 识别OpenAI "An error occurred while processing your request" 临时性400错误
   并触发failover，同时在池模式下标记RetryableOnSameAccount，允许同账号重试
2. ForwardAsAnthropic路径同步支持临时性400错误的识别和同账号重试
3. HelpTooltip组件使用Teleport渲染到body，修复在dialog内被裁切的问题

											
										
										
											2026-03-10 03:00:58 +08:00
+								func (s *OpenAIGatewayService) shouldFailoverOpenAIUpstreamResponse(statusCode int, upstreamMsg string, upstreamBody []byte) bool {
 									// shouldFailoverOpenAIUpstreamResponse reports whether an upstream
 									// response should trigger failover. The status-code-only rule is
 									// checked first.
 									if s.shouldFailoverUpstreamError(statusCode) {
 										return true
 									}
 									// Otherwise the decision is delegated to the transient-processing-error
 									// check, which also receives the upstream message and body.
 									return isOpenAITransientProcessingError(statusCode, upstreamMsg, upstreamBody)
 								}
-												feat: cc/codex support account retry

											
										
										
											2025-12-27 11:44:00 +08:00
+								func (s *OpenAIGatewayService) handleFailoverSideEffects(ctx context.Context, resp *http.Response, account *Account) {
-												feat(ops): 实现上游错误事件记录与查询功能

**新增功能**:
- 新建ops_upstream_error_events表存储上游服务错误详情
- 支持记录上游429/529/5xx错误的详细上下文信息
- 提供按时间范围查询上游错误事件的API

**后端改动**:
1. 模型层（ops_models.go, ops_port.go）:
   - 新增UpstreamErrorEvent结构体
   - 扩展Repository接口支持上游错误事件CRUD

2. 仓储层（ops_repo.go）:
   - 实现InsertUpstreamErrorEvent写入上游错误
   - 实现GetUpstreamErrorEvents按时间范围查询

3. 服务层（ops_service.go, ops_upstream_context.go）:
   - ops_service: 新增GetUpstreamErrorEvents查询方法
   - ops_upstream_context: 封装上游错误上下文构建逻辑

4. Handler层（ops_error_logger.go）:
   - 新增GetUpstreamErrorsHandler处理上游错误查询请求

5. Gateway层集成:
   - antigravity_gateway_service.go: 429/529错误时记录上游事件
   - gateway_service.go: OpenAI 429/5xx错误时记录
   - gemini_messages_compat_service.go: Gemini 429/5xx错误时记录
   - openai_gateway_service.go: OpenAI 429/5xx错误时记录
   - ratelimit_service.go: 429限流错误时记录

**数据记录字段**:
- request_id: 关联ops_logs主记录
- platform/model: 上游服务标识
- status_code/error_message: 错误详情
- request_headers/response_body: 调试信息（可选）
- created_at: 错误发生时间

											
										
										
											2026-01-11 15:30:27 +08:00
+									body, _ := io.ReadAll(io.LimitReader(resp.Body, 2<<20))
-												feat: cc/codex support account retry

											
										
										
											2025-12-27 11:44:00 +08:00
+									s.rateLimitService.HandleUpstreamError(ctx, account, resp.StatusCode, resp.Header, body)
 								}
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+								// Forward forwards request to OpenAI API
-												refactor: 调整项目结构为单向依赖

											
										
										
											2025-12-26 15:40:24 +08:00
+								func (s *OpenAIGatewayService) Forward(ctx context.Context, c *gin.Context, account *Account, body []byte) (*OpenAIForwardResult, error) {
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									startTime := time.Now()
-												feat(openai): 增加 OAuth 账号 Codex 官方客户端限制开关

新增 codex_cli_only 开关并默认关闭，关闭时完全绕过限制逻辑。
在 OpenAI 网关引入统一检测入口，集中判定账号类型、开关与客户端族。
开启后仅放行 codex_cli_rs、codex_vscode、codex_app 客户端家族。
补充后端判定与网关分支测试，并在前端创建/编辑页增加开关配置与回显。

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-12 22:32:59 +08:00
+									restrictionResult := s.detectCodexClientRestriction(c, account)
 									apiKeyID := getAPIKeyIDFromContext(c)
-												fix(ops): 修复日志级别过滤并增强OpenAI错误诊断日志

- 移除 warn 级别下 access info 的强制入库补写，确保运行时日志级别真实生效

- 将 OpenAI fallback matched 与 passthrough 断流提示按需求降级为 info

- 为 codex_cli_only 与 instructions required 场景补充请求诊断字段（含 User-Agent）

- 出于安全考虑移除请求体预览，仅保留 request_body_size 与白名单头信息

- 新增/更新回归测试，覆盖 Forward 入口到日志落库链路

											
										
										
											2026-02-13 19:27:07 +08:00
+									logCodexCLIOnlyDetection(ctx, c, account, apiKeyID, restrictionResult, body)
-												feat(openai): 增加 OAuth 账号 Codex 官方客户端限制开关

新增 codex_cli_only 开关并默认关闭，关闭时完全绕过限制逻辑。
在 OpenAI 网关引入统一检测入口，集中判定账号类型、开关与客户端族。
开启后仅放行 codex_cli_rs、codex_vscode、codex_app 客户端家族。
补充后端判定与网关分支测试，并在前端创建/编辑页增加开关配置与回显。

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-12 22:32:59 +08:00
+									if restrictionResult.Enabled && !restrictionResult.Matched {
 										c.JSON(http.StatusForbidden, gin.H{
 											"error": gin.H{
 												"type":    "forbidden_error",
 												"message": "This account only allows Codex official clients",
 											},
 										})
 										return nil, errors.New("codex_cli_only restriction: only codex official clients are allowed")
 									}
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
+									originalBody := body
-												feat(openai): 极致优化 OAuth 链路并补齐性能守护

- 优化 /v1/responses 热路径，减少重复解析与不必要拷贝\n- 优化并发与 token 竞争路径并补齐运行指标\n- 补充 OpenAI/Ops 相关单元测试与回归用例\n- 新增灰度阈值守护与压测脚本，支撑发布验收

											
										
										
											2026-02-12 09:41:37 +08:00
+									reqModel, reqStream, promptCacheKey := extractOpenAIRequestMetaFromBody(body)
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									originalModel := reqModel
-												fix(openai): detect official codex client by headers

											
										
										
											2026-03-07 14:12:38 +08:00
+									isCodexCLI := openai.IsCodexOfficialClientByHeaders(c.GetHeader("User-Agent"), c.GetHeader("originator")) || (s.cfg != nil && s.cfg.Gateway.ForceCodexCLI)
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+									wsDecision := s.getOpenAIWSProtocolResolver().Resolve(account)
 									clientTransport := GetOpenAIClientTransport(c)
 									// 仅允许 WS 入站请求走 WS 上游，避免出现 HTTP -> WS 协议混用。
 									wsDecision = resolveOpenAIWSDecisionByClientTransport(wsDecision, clientTransport)
 									if c != nil {
 										c.Set("openai_ws_transport_decision", string(wsDecision.Transport))
 										c.Set("openai_ws_transport_reason", wsDecision.Reason)
 									}
 									if wsDecision.Transport == OpenAIUpstreamTransportResponsesWebsocketV2 {
 										logOpenAIWSModeDebug(
 											"selected account_id=%d account_type=%s transport=%s reason=%s model=%s stream=%v",
 											account.ID,
 											account.Type,
 											normalizeOpenAIWSLogValue(string(wsDecision.Transport)),
 											normalizeOpenAIWSLogValue(wsDecision.Reason),
 											reqModel,
 											reqStream,
 										)
 									}
 									// 当前仅支持 WSv2；WSv1 命中时直接返回错误，避免出现“配置可开但行为不确定”。
 									if wsDecision.Transport == OpenAIUpstreamTransportResponsesWebsocket {
 										if c != nil {
 											c.JSON(http.StatusBadRequest, gin.H{
 												"error": gin.H{
 													"type":    "invalid_request_error",
 													"message": "OpenAI WSv1 is temporarily unsupported. Please enable responses_websockets_v2.",
 												},
 											})
 										}
 										return nil, errors.New("openai ws v1 is temporarily unsupported; use ws v2")
 									}
-												feat(openai): 支持自动透传开关并透传 User-Agent

- OpenAI OAuth/API Key 统一支持自动透传开关，编辑页可开关\n- 透传模式仅替换认证并保留计费/并发/审计，修复 API Key responses 端点拼接\n- Usage 页面显示原始 User-Agent 且不截断，补充回归测试与清单

											
										
										
											2026-02-12 10:56:07 +08:00
+									passthroughEnabled := account.IsOpenAIPassthroughEnabled()
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
+									if passthroughEnabled {
-												feat(openai): 极致优化 OAuth 链路并补齐性能守护

- 优化 /v1/responses 热路径，减少重复解析与不必要拷贝\n- 优化并发与 token 竞争路径并补齐运行指标\n- 补充 OpenAI/Ops 相关单元测试与回归用例\n- 新增灰度阈值守护与压测脚本，支撑发布验收

											
										
										
											2026-02-12 09:41:37 +08:00
+										// 透传分支只需要轻量提取字段，避免热路径全量 Unmarshal。
 										reasoningEffort := extractOpenAIReasoningEffortFromBody(body, reqModel)
-												feat(openai): 支持自动透传开关并透传 User-Agent

- OpenAI OAuth/API Key 统一支持自动透传开关，编辑页可开关\n- 透传模式仅替换认证并保留计费/并发/审计，修复 API Key responses 端点拼接\n- Usage 页面显示原始 User-Agent 且不截断，补充回归测试与清单

											
										
										
											2026-02-12 10:56:07 +08:00
+										return s.forwardOpenAIPassthrough(ctx, c, account, originalBody, reqModel, reasoningEffort, reqStream, startTime)
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
+									}
-												feat(openai): 极致优化 OAuth 链路并补齐性能守护

- 优化 /v1/responses 热路径，减少重复解析与不必要拷贝\n- 优化并发与 token 竞争路径并补齐运行指标\n- 补充 OpenAI/Ops 相关单元测试与回归用例\n- 新增灰度阈值守护与压测脚本，支撑发布验收

											
										
										
											2026-02-12 09:41:37 +08:00
+									reqBody, err := getOpenAIRequestBodyMap(c, body)
 									if err != nil {
 										return nil, err
 									}
 									if v, ok := reqBody["model"].(string); ok {
 										reqModel = v
 										originalModel = reqModel
 									}
 									if v, ok := reqBody["stream"].(bool); ok {
 										reqStream = v
 									}
 									if promptCacheKey == "" {
 										if v, ok := reqBody["prompt_cache_key"].(string); ok {
 											promptCacheKey = strings.TrimSpace(v)
 										}
 									}
 									// Track if body needs re-serialization
 									bodyModified := false
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+									// 单字段补丁快速路径：只要整个变更集最终可归约为同一路径的 set/delete，就避免全量 Marshal。
 									patchDisabled := false
 									patchHasOp := false
 									patchDelete := false
 									patchPath := ""
 									var patchValue any
 									markPatchSet := func(path string, value any) {
 										if strings.TrimSpace(path) == "" {
 											patchDisabled = true
 											return
 										}
 										if patchDisabled {
 											return
 										}
 										if !patchHasOp {
 											patchHasOp = true
 											patchDelete = false
 											patchPath = path
 											patchValue = value
 											return
 										}
 										if patchDelete || patchPath != path {
 											patchDisabled = true
 											return
 										}
 										patchValue = value
 									}
 									markPatchDelete := func(path string) {
 										if strings.TrimSpace(path) == "" {
 											patchDisabled = true
 											return
 										}
 										if patchDisabled {
 											return
 										}
 										if !patchHasOp {
 											patchHasOp = true
 											patchDelete = true
 											patchPath = path
 											return
 										}
 										if !patchDelete || patchPath != path {
 											patchDisabled = true
 										}
 									}
 									disablePatch := func() {
 										patchDisabled = true
 									}
-												feat(openai): 极致优化 OAuth 链路并补齐性能守护

- 优化 /v1/responses 热路径，减少重复解析与不必要拷贝\n- 优化并发与 token 竞争路径并补齐运行指标\n- 补充 OpenAI/Ops 相关单元测试与回归用例\n- 新增灰度阈值守护与压测脚本，支撑发布验收

											
										
										
											2026-02-12 09:41:37 +08:00
-												fix: /response端点移除强制注入大量instructions内容

											
										
										
											2026-03-07 13:39:47 +08:00
+									// 非透传模式下，instructions 为空时注入默认指令。
 									if isInstructionsEmpty(reqBody) {
 										reqBody["instructions"] = "You are a helpful coding assistant."
 										bodyModified = true
 										markPatchSet("instructions", "You are a helpful coding assistant.")
-												feat(openai): 支持自动透传开关并透传 User-Agent

- OpenAI OAuth/API Key 统一支持自动透传开关，编辑页可开关\n- 透传模式仅替换认证并保留计费/并发/审计，修复 API Key responses 端点拼接\n- Usage 页面显示原始 User-Agent 且不截断，补充回归测试与清单

											
										
										
											2026-02-12 10:56:07 +08:00
+									}
-												fix: bridge codex image generation over responses

											
										
										
											2026-04-23 15:13:57 +00:00
+									if isCodexCLI && ensureOpenAIResponsesImageGenerationTool(reqBody) {
 										bodyModified = true
 										disablePatch()
 										logger.LegacyPrintf("service.openai_gateway", "[OpenAI] Injected /responses image_generation tool for Codex client")
 									}
-												fix openai image request handling

											
										
										
											2026-04-23 09:53:57 +08:00
+									if normalizeOpenAIResponsesImageGenerationTools(reqBody) {
 										bodyModified = true
 										disablePatch()
 										logger.LegacyPrintf("service.openai_gateway", "[OpenAI] Normalized /responses image_generation tool payload")
 									}
-												fix: bridge codex image generation over responses

											
										
										
											2026-04-23 15:13:57 +00:00
+									if isCodexCLI && applyCodexImageGenerationBridgeInstructions(reqBody) {
 										bodyModified = true
 										disablePatch()
 										logger.LegacyPrintf("service.openai_gateway", "[OpenAI] Added Codex image_generation bridge instructions")
 									}
-												fix openai image request handling

											
										
										
											2026-04-23 09:53:57 +08:00
-												fix(网关): 补齐Codex指令回退与输入过滤

											
										
										
											2026-01-13 17:01:21 +08:00
+									// 对所有请求执行模型映射（包含 Codex CLI）。
-												refactor: improve model resolution and normalization logic for OpenAI integration

											
										
										
											2026-03-24 19:20:15 +08:00
+									billingModel := account.GetMappedModel(reqModel)
 									if billingModel != reqModel {
 										logger.LegacyPrintf("service.openai_gateway", "[OpenAI] Model mapping applied: %s -> %s (account: %s, isCodexCLI: %v)", reqModel, billingModel, account.Name, isCodexCLI)
 										reqBody["model"] = billingModel
-												feat(gateway): 对所有请求（包括 Codex CLI）应用模型映射

- 移除 Codex CLI 的模型映射跳过逻辑
- 添加详细的模型映射日志，包含账号名称和请求类型
- 确保所有 OpenAI 请求都能正确应用账号配置的模型映射

											
										
										
											2026-01-12 13:23:05 -08:00
+										bodyModified = true
-												refactor: improve model resolution and normalization logic for OpenAI integration

											
										
										
											2026-03-24 19:20:15 +08:00
+										markPatchSet("model", billingModel)
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									}
-												refactor: improve model resolution and normalization logic for OpenAI integration

											
										
										
											2026-03-24 19:20:15 +08:00
+									upstreamModel := billingModel
-												fix: bridge codex image generation over responses

											
										
										
											2026-04-23 15:13:57 +00:00
+									if normalizeOpenAIResponsesImageOnlyModel(reqBody) {
 										bodyModified = true
 										disablePatch()
 										if model, ok := reqBody["model"].(string); ok {
 											upstreamModel = strings.TrimSpace(model)
 										}
 										logger.LegacyPrintf(
 											"service.openai_gateway",
 											"[OpenAI] Normalized /responses image-only model request inbound_model=%s image_model=%s upstream_model=%s",
 											reqModel,
 											billingModel,
 											upstreamModel,
 										)
 									}
-												fix openai image request handling

											
										
										
											2026-04-23 09:53:57 +08:00
+									if err := validateOpenAIResponsesImageModel(reqBody, upstreamModel); err != nil {
 										setOpsUpstreamError(c, http.StatusBadRequest, err.Error(), "")
 										c.JSON(http.StatusBadRequest, gin.H{
 											"error": gin.H{
 												"type":    "invalid_request_error",
 												"message": err.Error(),
 												"param":   "model",
 											},
 										})
 										return nil, err
 									}
 									if hasOpenAIImageGenerationTool(reqBody) {
 										logger.LegacyPrintf(
 											"service.openai_gateway",
 											"[OpenAI] /responses image_generation request inbound_model=%s mapped_model=%s account_type=%s",
 											reqModel,
 											upstreamModel,
 											account.Type,
 										)
 									}
-												fix(openai): handle codex spark model limitations

											
										
										
											2026-04-24 07:42:31 +00:00
+									if err := validateCodexSparkInput(reqBody, upstreamModel); err != nil {
 										setOpsUpstreamError(c, http.StatusBadRequest, err.Error(), "")
 										c.JSON(http.StatusBadRequest, gin.H{
 											"error": gin.H{
 												"type":    "invalid_request_error",
 												"message": err.Error(),
 												"param":   "input",
 											},
 										})
 										return nil, err
 									}
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+									// Compact-only model 映射：仅在 /responses/compact 路径生效，且优先级高于
 									// OAuth 模型规范化（避免 OAuth 规范化覆盖 compact-only 自定义模型）。
 									isCompactRequest := isOpenAIResponsesCompactPath(c)
 									compactMapped := false
 									if isCompactRequest {
 										compactMappedModel := resolveOpenAICompactForwardModel(account, billingModel)
 										if compactMappedModel != "" && compactMappedModel != billingModel {
 											compactMapped = true
 											upstreamModel = compactMappedModel
 											reqBody["model"] = compactMappedModel
 											bodyModified = true
 											markPatchSet("model", compactMappedModel)
 											logger.LegacyPrintf("service.openai_gateway", "[OpenAI] Compact model mapping applied: %s -> %s (account: %s, isCodexCLI: %v)", billingModel, compactMappedModel, account.Name, isCodexCLI)
 										}
 									}
-												fix(openai): do not normalize API token based accounts

											
										
										
											2026-04-07 11:27:57 +03:00
+									// OpenAI OAuth 账号走 ChatGPT internal Codex endpoint，需要将模型名规范化为
 									// 上游可识别的 Codex/GPT 系列。API Key 账号则应保留原始/映射后的模型名，
 									// 以兼容自定义 base_url 的 OpenAI-compatible 上游。
-												fix(openai): 增强 OpenCode 兼容性和模型规范化

## 主要改动

1. **模型规范化扩展到所有账号**
   - 将 Codex 模型规范化（如 gpt-5-nano → gpt-5.1）应用到所有 OpenAI 账号类型
   - 不再仅限于 OAuth 非 CLI 请求
   - 解决 Codex CLI 使用 ChatGPT 账号时的模型兼容性问题

2. **reasoning.effort 参数规范化**
   - 自动将 `minimal` 转换为 `none`
   - 解决 gpt-5.1 模型不支持 `minimal` 值的问题

3. **Session/Conversation ID fallback 机制**
   - 从请求体多个字段提取 session_id/conversation_id
   - 优先级：prompt_cache_key → session_id → conversation_id → previous_response_id
   - 支持 Codex CLI 的会话保持

4. **Tool Call ID fallback**
   - 当 call_id 为空时使用 id 字段作为 fallback
   - 确保 tool call 输出能正确匹配
   - 保留 item_reference 类型的 items

5. **Header 优化**
   - 添加 conversation_id 到允许的 headers
   - 移除删除 session headers 的逻辑

## 相关 Issue
- 参考 OpenCode issue #3118 关于 item_reference 的讨论

											
										
										
											2026-01-12 20:18:53 -08:00
+									if model, ok := reqBody["model"].(string); ok {
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+										if !compactMapped {
 											upstreamModel = normalizeOpenAIModelForUpstream(account, model)
 											if upstreamModel != "" && upstreamModel != model {
 												logger.LegacyPrintf("service.openai_gateway", "[OpenAI] Upstream model resolved: %s -> %s (account: %s, type: %s, isCodexCLI: %v)",
 													model, upstreamModel, account.Name, account.Type, isCodexCLI)
 												reqBody["model"] = upstreamModel
 												bodyModified = true
 												markPatchSet("model", upstreamModel)
 											}
-												fix(openai): 增强 OpenCode 兼容性和模型规范化

## 主要改动

1. **模型规范化扩展到所有账号**
   - 将 Codex 模型规范化（如 gpt-5-nano → gpt-5.1）应用到所有 OpenAI 账号类型
   - 不再仅限于 OAuth 非 CLI 请求
   - 解决 Codex CLI 使用 ChatGPT 账号时的模型兼容性问题

2. **reasoning.effort 参数规范化**
   - 自动将 `minimal` 转换为 `none`
   - 解决 gpt-5.1 模型不支持 `minimal` 值的问题

3. **Session/Conversation ID fallback 机制**
   - 从请求体多个字段提取 session_id/conversation_id
   - 优先级：prompt_cache_key → session_id → conversation_id → previous_response_id
   - 支持 Codex CLI 的会话保持

4. **Tool Call ID fallback**
   - 当 call_id 为空时使用 id 字段作为 fallback
   - 确保 tool call 输出能正确匹配
   - 保留 item_reference 类型的 items

5. **Header 优化**
   - 添加 conversation_id 到允许的 headers
   - 移除删除 session headers 的逻辑

## 相关 Issue
- 参考 OpenCode issue #3118 关于 item_reference 的讨论

											
										
										
											2026-01-12 20:18:53 -08:00
+										}
-												fix: 修复gpt-5.2以上模型映射到gpt-5.2以下时verbosity参数引发的报错

											
										
										
											2026-03-11 21:12:07 +08:00
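 										// Drop text.verbosity when the resolved upstream model does not support it
 										// (versions below gpt-5.2-codex), so that mapping a newer model onto an
 										// older one does not cause an upstream error.
 										// NOTE(review): this branch neither sets bodyModified nor calls disablePatch();
 										// confirm the serialized request body actually omits text.verbosity.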
-												refactor: improve model resolution and normalization logic for OpenAI integration

											
										
										
											2026-03-24 19:20:15 +08:00
+										if !SupportsVerbosity(upstreamModel) {
-												fix: 修复gpt-5.2以上模型映射到gpt-5.2以下时verbosity参数引发的报错

											
										
										
											2026-03-11 21:12:07 +08:00
+											if text, ok := reqBody["text"].(map[string]any); ok {
-												fix: 修复流水线golangci-lint 的 errcheck

											
										
										
											2026-03-11 22:56:20 +08:00
+												delete(text, "verbosity")
-												fix: 修复gpt-5.2以上模型映射到gpt-5.2以下时verbosity参数引发的报错

											
										
										
											2026-03-11 21:12:07 +08:00
+											}
 										}
-												fix(openai): 增强 OpenCode 兼容性和模型规范化

## 主要改动

1. **模型规范化扩展到所有账号**
   - 将 Codex 模型规范化（如 gpt-5-nano → gpt-5.1）应用到所有 OpenAI 账号类型
   - 不再仅限于 OAuth 非 CLI 请求
   - 解决 Codex CLI 使用 ChatGPT 账号时的模型兼容性问题

2. **reasoning.effort 参数规范化**
   - 自动将 `minimal` 转换为 `none`
   - 解决 gpt-5.1 模型不支持 `minimal` 值的问题

3. **Session/Conversation ID fallback 机制**
   - 从请求体多个字段提取 session_id/conversation_id
   - 优先级：prompt_cache_key → session_id → conversation_id → previous_response_id
   - 支持 Codex CLI 的会话保持

4. **Tool Call ID fallback**
   - 当 call_id 为空时使用 id 字段作为 fallback
   - 确保 tool call 输出能正确匹配
   - 保留 item_reference 类型的 items

5. **Header 优化**
   - 添加 conversation_id 到允许的 headers
   - 移除删除 session headers 的逻辑

## 相关 Issue
- 参考 OpenCode issue #3118 关于 item_reference 的讨论

											
										
										
											2026-01-12 20:18:53 -08:00
+									}
-												fix(网关): 补齐Codex指令回退与输入过滤

											
										
										
											2026-01-13 17:01:21 +08:00
+									// 规范化 reasoning.effort 参数（minimal -> none），与上游允许值对齐。
-												fix(openai): 增强 OpenCode 兼容性和模型规范化

## 主要改动

1. **模型规范化扩展到所有账号**
   - 将 Codex 模型规范化（如 gpt-5-nano → gpt-5.1）应用到所有 OpenAI 账号类型
   - 不再仅限于 OAuth 非 CLI 请求
   - 解决 Codex CLI 使用 ChatGPT 账号时的模型兼容性问题

2. **reasoning.effort 参数规范化**
   - 自动将 `minimal` 转换为 `none`
   - 解决 gpt-5.1 模型不支持 `minimal` 值的问题

3. **Session/Conversation ID fallback 机制**
   - 从请求体多个字段提取 session_id/conversation_id
   - 优先级：prompt_cache_key → session_id → conversation_id → previous_response_id
   - 支持 Codex CLI 的会话保持

4. **Tool Call ID fallback**
   - 当 call_id 为空时使用 id 字段作为 fallback
   - 确保 tool call 输出能正确匹配
   - 保留 item_reference 类型的 items

5. **Header 优化**
   - 添加 conversation_id 到允许的 headers
   - 移除删除 session headers 的逻辑

## 相关 Issue
- 参考 OpenCode issue #3118 关于 item_reference 的讨论

											
										
										
											2026-01-12 20:18:53 -08:00
+									if reasoning, ok := reqBody["reasoning"].(map[string]any); ok {
 										if effort, ok := reasoning["effort"].(string); ok && effort == "minimal" {
 											reasoning["effort"] = "none"
 											bodyModified = true
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+											markPatchSet("reasoning.effort", "none")
-												chore(logging): 完成后端日志审计与结构化迁移

- 将高密度服务与处理器日志迁移到新日志系统（LegacyPrintf/结构化日志）
- 增加 stdlog bridge 与兼容测试，保留旧日志捕获能力
- 将 OpenAI 断流告警改为结构化 Warn 并改造对应测试为 sink 捕获
- 补齐后端相关文件 logger 引用并通过全量 go test

											
										
										
											2026-02-12 19:01:09 +08:00
+											logger.LegacyPrintf("service.openai_gateway", "[OpenAI] Normalized reasoning.effort: minimal -> none (account: %s)", account.Name)
-												fix(openai): 增强 OpenCode 兼容性和模型规范化

## 主要改动

1. **模型规范化扩展到所有账号**
   - 将 Codex 模型规范化（如 gpt-5-nano → gpt-5.1）应用到所有 OpenAI 账号类型
   - 不再仅限于 OAuth 非 CLI 请求
   - 解决 Codex CLI 使用 ChatGPT 账号时的模型兼容性问题

2. **reasoning.effort 参数规范化**
   - 自动将 `minimal` 转换为 `none`
   - 解决 gpt-5.1 模型不支持 `minimal` 值的问题

3. **Session/Conversation ID fallback 机制**
   - 从请求体多个字段提取 session_id/conversation_id
   - 优先级：prompt_cache_key → session_id → conversation_id → previous_response_id
   - 支持 Codex CLI 的会话保持

4. **Tool Call ID fallback**
   - 当 call_id 为空时使用 id 字段作为 fallback
   - 确保 tool call 输出能正确匹配
   - 保留 item_reference 类型的 items

5. **Header 优化**
   - 添加 conversation_id 到允许的 headers
   - 移除删除 session headers 的逻辑

## 相关 Issue
- 参考 OpenCode issue #3118 关于 item_reference 的讨论

											
										
										
											2026-01-12 20:18:53 -08:00
+										}
 									}
-												fix(openai): 统一 OAuth instructions 处理逻辑，修复 Codex CLI 400 错误

- 修改 applyCodexOAuthTransform 函数签名，增加 isCodexCLI 参数
- 移除 && !isCodexCLI 条件，对所有 OAuth 请求统一处理
- 新增 applyInstructions/applyCodexCLIInstructions/applyOpenCodeInstructions 辅助函数
- 新增 isInstructionsEmpty 函数检查 instructions 字段是否为空
- 添加 Codex CLI 和非 Codex CLI 场景的测试用例

逻辑说明：
- Codex CLI + 有 instructions: 保持不变
- Codex CLI + 无 instructions: 补充 opencode 指令
- 非 Codex CLI: 使用 opencode 指令覆盖

											
										
										
											2026-02-03 21:22:33 +08:00
+									if account.Type == AccountTypeOAuth {
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+										codexResult := applyCodexOAuthTransform(reqBody, isCodexCLI, isCompactRequest)
-												Fix Codex OAuth tool mapping

											
										
										
											2026-01-09 18:35:58 +08:00
+										if codexResult.Modified {
-												feat(openai): add AI SDK content format compatibility for OAuth accounts

- Add normalizeInputForCodexAPI function to convert AI SDK multi-part
  content format to simplified format expected by ChatGPT Codex API
- AI SDK sends: {"content": [{"type": "input_text", "text": "..."}]}
- Codex API expects: {"content": "..."}
- Only applies to OAuth accounts (ChatGPT internal API)
- API Key accounts remain unchanged (OpenAI Platform API supports both)

											
										
										
											2026-01-09 00:34:49 +08:00
+											bodyModified = true
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+											disablePatch()
-												feat(openai): add AI SDK content format compatibility for OAuth accounts

- Add normalizeInputForCodexAPI function to convert AI SDK multi-part
  content format to simplified format expected by ChatGPT Codex API
- AI SDK sends: {"content": [{"type": "input_text", "text": "..."}]}
- Codex API expects: {"content": "..."}
- Only applies to OAuth accounts (ChatGPT internal API)
- API Key accounts remain unchanged (OpenAI Platform API supports both)

											
										
										
											2026-01-09 00:34:49 +08:00
+										}
-												Fix Codex OAuth tool mapping

											
										
										
											2026-01-09 18:35:58 +08:00
+										if codexResult.NormalizedModel != "" {
-												refactor: improve model resolution and normalization logic for OpenAI integration

											
										
										
											2026-03-24 19:20:15 +08:00
+											upstreamModel = codexResult.NormalizedModel
-												Fix Codex OAuth tool mapping

											
										
										
											2026-01-09 18:35:58 +08:00
+										}
 										if codexResult.PromptCacheKey != "" {
 											promptCacheKey = codexResult.PromptCacheKey
 										}
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									}
-												fix(gateway): 完善 max_output_tokens 参数处理逻辑

根据不同平台和账号类型处理 max_output_tokens 参数：
- OpenAI OAuth (Responses API): 保留 max_output_tokens（支持）
- OpenAI API Key: 删除 max_output_tokens（不支持）
- Anthropic (Claude): 转换 max_output_tokens 为 max_tokens
- Gemini: 删除 max_output_tokens（由 Gemini 专用转换处理）
- 其他平台: 删除（安全起见）

同时处理 max_completion_tokens 参数，仅在 OpenAI OAuth 时保留。

修复客户端（如 OpenCode）发送不支持参数导致上游返回 400 错误的问题。

Related-to: #231

											
										
										
											2026-01-12 11:08:28 -08:00
+									// Handle max_output_tokens based on platform and account type
 									if !isCodexCLI {
 										if maxOutputTokens, hasMaxOutputTokens := reqBody["max_output_tokens"]; hasMaxOutputTokens {
 											switch account.Platform {
 											case PlatformOpenAI:
 												// For OpenAI API Key, remove max_output_tokens (not supported)
 												// For OpenAI OAuth (Responses API), keep it (supported)
 												if account.Type == AccountTypeAPIKey {
 													delete(reqBody, "max_output_tokens")
 													bodyModified = true
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+													markPatchDelete("max_output_tokens")
-												fix(gateway): 完善 max_output_tokens 参数处理逻辑

根据不同平台和账号类型处理 max_output_tokens 参数：
- OpenAI OAuth (Responses API): 保留 max_output_tokens（支持）
- OpenAI API Key: 删除 max_output_tokens（不支持）
- Anthropic (Claude): 转换 max_output_tokens 为 max_tokens
- Gemini: 删除 max_output_tokens（由 Gemini 专用转换处理）
- 其他平台: 删除（安全起见）

同时处理 max_completion_tokens 参数，仅在 OpenAI OAuth 时保留。

修复客户端（如 OpenCode）发送不支持参数导致上游返回 400 错误的问题。

Related-to: #231

											
										
										
											2026-01-12 11:08:28 -08:00
+												}
 											case PlatformAnthropic:
 												// For Anthropic (Claude), convert to max_tokens
 												delete(reqBody, "max_output_tokens")
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+												markPatchDelete("max_output_tokens")
-												fix(gateway): 完善 max_output_tokens 参数处理逻辑

根据不同平台和账号类型处理 max_output_tokens 参数：
- OpenAI OAuth (Responses API): 保留 max_output_tokens（支持）
- OpenAI API Key: 删除 max_output_tokens（不支持）
- Anthropic (Claude): 转换 max_output_tokens 为 max_tokens
- Gemini: 删除 max_output_tokens（由 Gemini 专用转换处理）
- 其他平台: 删除（安全起见）

同时处理 max_completion_tokens 参数，仅在 OpenAI OAuth 时保留。

修复客户端（如 OpenCode）发送不支持参数导致上游返回 400 错误的问题。

Related-to: #231

											
										
										
											2026-01-12 11:08:28 -08:00
+												if _, hasMaxTokens := reqBody["max_tokens"]; !hasMaxTokens {
 													reqBody["max_tokens"] = maxOutputTokens
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+													disablePatch()
-												fix(gateway): 完善 max_output_tokens 参数处理逻辑

根据不同平台和账号类型处理 max_output_tokens 参数：
- OpenAI OAuth (Responses API): 保留 max_output_tokens（支持）
- OpenAI API Key: 删除 max_output_tokens（不支持）
- Anthropic (Claude): 转换 max_output_tokens 为 max_tokens
- Gemini: 删除 max_output_tokens（由 Gemini 专用转换处理）
- 其他平台: 删除（安全起见）

同时处理 max_completion_tokens 参数，仅在 OpenAI OAuth 时保留。

修复客户端（如 OpenCode）发送不支持参数导致上游返回 400 错误的问题。

Related-to: #231

											
										
										
											2026-01-12 11:08:28 -08:00
+												}
 												bodyModified = true
 											case PlatformGemini:
 												// For Gemini, remove (will be handled by Gemini-specific transform)
 												delete(reqBody, "max_output_tokens")
 												bodyModified = true
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+												markPatchDelete("max_output_tokens")
-												fix(gateway): 完善 max_output_tokens 参数处理逻辑

根据不同平台和账号类型处理 max_output_tokens 参数：
- OpenAI OAuth (Responses API): 保留 max_output_tokens（支持）
- OpenAI API Key: 删除 max_output_tokens（不支持）
- Anthropic (Claude): 转换 max_output_tokens 为 max_tokens
- Gemini: 删除 max_output_tokens（由 Gemini 专用转换处理）
- 其他平台: 删除（安全起见）

同时处理 max_completion_tokens 参数，仅在 OpenAI OAuth 时保留。

修复客户端（如 OpenCode）发送不支持参数导致上游返回 400 错误的问题。

Related-to: #231

											
										
										
											2026-01-12 11:08:28 -08:00
+											default:
 												// For unknown platforms, remove to be safe
 												delete(reqBody, "max_output_tokens")
 												bodyModified = true
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+												markPatchDelete("max_output_tokens")
-												fix(gateway): 完善 max_output_tokens 参数处理逻辑

根据不同平台和账号类型处理 max_output_tokens 参数：
- OpenAI OAuth (Responses API): 保留 max_output_tokens（支持）
- OpenAI API Key: 删除 max_output_tokens（不支持）
- Anthropic (Claude): 转换 max_output_tokens 为 max_tokens
- Gemini: 删除 max_output_tokens（由 Gemini 专用转换处理）
- 其他平台: 删除（安全起见）

同时处理 max_completion_tokens 参数，仅在 OpenAI OAuth 时保留。

修复客户端（如 OpenCode）发送不支持参数导致上游返回 400 错误的问题。

Related-to: #231

											
										
										
											2026-01-12 11:08:28 -08:00
+											}
 										}
 										// Also handle max_completion_tokens (similar logic)
 										if _, hasMaxCompletionTokens := reqBody["max_completion_tokens"]; hasMaxCompletionTokens {
 											if account.Type == AccountTypeAPIKey || account.Platform != PlatformOpenAI {
 												delete(reqBody, "max_completion_tokens")
 												bodyModified = true
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+												markPatchDelete("max_completion_tokens")
-												fix(gateway): 完善 max_output_tokens 参数处理逻辑

根据不同平台和账号类型处理 max_output_tokens 参数：
- OpenAI OAuth (Responses API): 保留 max_output_tokens（支持）
- OpenAI API Key: 删除 max_output_tokens（不支持）
- Anthropic (Claude): 转换 max_output_tokens 为 max_tokens
- Gemini: 删除 max_output_tokens（由 Gemini 专用转换处理）
- 其他平台: 删除（安全起见）

同时处理 max_completion_tokens 参数，仅在 OpenAI OAuth 时保留。

修复客户端（如 OpenCode）发送不支持参数导致上游返回 400 错误的问题。

Related-to: #231

											
										
										
											2026-01-12 11:08:28 -08:00
+											}
 										}
-												fix: 添加混合渠道警告确认框和过滤 prompt_cache_retention 参数

- 前端: EditAccountModal 和 CreateAccountModal 添加 409 mixed_channel_warning 处理
- 前端: 弹出确认框让用户确认混合渠道风险
- 后端: 过滤 OpenAI 请求中的 prompt_cache_retention 参数（上游不支持）
- 添加中英文翻译

Co-authored-by: factory-droid[bot] <138933559+factory-droid[bot]@users.noreply.github.com>

											
										
										
											2026-01-17 16:06:44 +08:00
-												fix: remove unsupported safety_identifier and previous_response_id fields from upstream requests

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>

											
										
										
											2026-02-04 15:56:01 +08:00
+										// Remove fields that the upstream OpenAI API does not support
+										// (this runs only for non-Codex-CLI requests).
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+										unsupportedFields := []string{"prompt_cache_retention", "safety_identifier"}
 										for _, unsupportedField := range unsupportedFields {
-												fix: remove unsupported safety_identifier and previous_response_id fields from upstream requests

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>

											
										
										
											2026-02-04 15:56:01 +08:00
+											if _, has := reqBody[unsupportedField]; has {
 												delete(reqBody, unsupportedField)
 												bodyModified = true
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+												markPatchDelete(unsupportedField)
-												fix: remove unsupported safety_identifier and previous_response_id fields from upstream requests

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>

											
										
										
											2026-02-04 15:56:01 +08:00
+											}
-												fix: 添加混合渠道警告确认框和过滤 prompt_cache_retention 参数

- 前端: EditAccountModal 和 CreateAccountModal 添加 409 mixed_channel_warning 处理
- 前端: 弹出确认框让用户确认混合渠道风险
- 后端: 过滤 OpenAI 请求中的 prompt_cache_retention 参数（上游不支持）
- 添加中英文翻译

Co-authored-by: factory-droid[bot] <138933559+factory-droid[bot]@users.noreply.github.com>

											
										
										
											2026-01-17 16:06:44 +08:00
+										}
-												fix(gateway): 完善 max_output_tokens 参数处理逻辑

根据不同平台和账号类型处理 max_output_tokens 参数：
- OpenAI OAuth (Responses API): 保留 max_output_tokens（支持）
- OpenAI API Key: 删除 max_output_tokens（不支持）
- Anthropic (Claude): 转换 max_output_tokens 为 max_tokens
- Gemini: 删除 max_output_tokens（由 Gemini 专用转换处理）
- 其他平台: 删除（安全起见）

同时处理 max_completion_tokens 参数，仅在 OpenAI OAuth 时保留。

修复客户端（如 OpenCode）发送不支持参数导致上游返回 400 错误的问题。

Related-to: #231

											
										
										
											2026-01-12 11:08:28 -08:00
+									}
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+									// 仅在 WSv2 模式保留 previous_response_id，其他模式（HTTP/WSv1）统一过滤。
 									// 注意：该规则同样适用于 Codex CLI 请求，避免 WSv1 向上游透传不支持字段。
 									if wsDecision.Transport != OpenAIUpstreamTransportResponsesWebsocketV2 {
 										if _, has := reqBody["previous_response_id"]; has {
 											delete(reqBody, "previous_response_id")
 											bodyModified = true
 											markPatchDelete("previous_response_id")
 										}
 									}
-												fix(openai): sanitize empty base64 input images

											
										
										
											2026-04-01 00:46:38 +08:00
+									if sanitizeEmptyBase64InputImagesInOpenAIRequestBodyMap(reqBody) {
 										bodyModified = true
 										disablePatch()
 									}
-												feat(openai): OpenAI Fast/Flex Policy 完整实现（HTTP + WebSocket + Admin）

对称参照 Claude BetaPolicy 的 fast-mode 过滤实现，新增针对 OpenAI 上游
service_tier 字段（priority / flex，含客户端 "fast" → "priority" 归一化）的
pass / filter / block 三态策略，覆盖全部 OpenAI 入口 + admin 配置入口。

后端核心
- 新增 SettingKeyOpenAIFastPolicySettings、OpenAIFastPolicyRule、
  OpenAIFastPolicySettings 配置模型，含规则的 service_tier × action × scope
  × 模型白名单 × fallback action 维度。
- SettingService.Get/SetOpenAIFastPolicySettings；缺失时返回内置默认策略
  （所有模型的 priority 走 filter，whitelist 为空，fallback=pass）。设计
  依据：service_tier=fast 是用户级开关，与 model 字段正交，默认锁定特定
  model slug 会留下"用 gpt-4 + fast 透传 priority 上游"的绕过路径。JSON
  解析失败不再静默 fallback，slog.Warn 记录脏数据，便于运维定位。
- service_tier 归一化（trim + ToLower + fast→priority + 白名单 priority/flex）
  与策略评估（evaluateOpenAIFastPolicy）作为唯一真实来源，HTTP / WS 共用。
  抽出纯函数 evaluateOpenAIFastPolicyWithSettings，配合 ctx-bound settings
  快照（withOpenAIFastPolicyContext / openAIFastPolicySettingsFromContext），
  WS 长会话入口预取一次后所有帧复用，避免每帧打到 settingService。

HTTP 入口（4 个）
- Chat Completions、Anthropic 兼容（Messages，含 BetaFastMode→priority 二次
  命中）、原生 Responses、Passthrough Responses 全部接入
  applyOpenAIFastPolicyToBody，filter 走 sjson 顶层删除 service_tier，block
  返回 403 forbidden_error JSON。
- 4 入口统一使用 upstream 视角的 model（GetMappedModel +
  normalizeOpenAIModelForUpstream + Codex OAuth normalize 后的 slug），
  避免 chat/messages/native /responses/passthrough 因为 model 维度不同
  造成 whitelist 命中差异。
- 在 pass 路径也把客户端 "fast" 别名归一化为 "priority" 写回 body，
  否则 native /responses 与 passthrough 入口会把 "fast" 原样透传给上游
  导致 400/拒绝（chat-completions 入口的 normalizeResponsesBodyServiceTier
  此前已具备同等行为）。

WebSocket 入口
- 新增 applyOpenAIFastPolicyToWSResponseCreate：严格匹配
  type="response.create"，仅处理顶层 service_tier；filter 用 sjson 删字段，
  block 返回 typed *OpenAIFastBlockedError。
- ingress 路径在 parseClientPayload 内调用，block 命中先 Write Realtime
  风格 error event 再返回 OpenAIWSClientCloseError(StatusPolicyViolation
  =1008)，依赖底层 WebSocket Conn.Write 的同步 flush 保证 error 先于
  close。
- passthrough 路径在 RunEntry 前对 firstClientMessage 应用策略，并通过
  openAIWSPolicyEnforcingFrameConn 包装 ReadFrame 对每个 client→upstream
  帧执行策略；后续帧无 model 字段时回退到 capturedSessionModel。
  filter 闭包内同时侦测 session.update / session.created 帧的 session.model
  字段刷新 capturedSessionModel，封堵"首帧 model=gpt-4o（pass）→
  session.update 改为 gpt-5.5 → 不带 model 的 response.create fallback
  到 gpt-4o"的 mid-session 绕过路径。
- passthrough billing：requestServiceTier 在策略 filter 之后再从
  firstClientMessage 提取，filter 命中时 OpenAIForwardResult.ServiceTier
  上报 nil（default tier），与 HTTP 入口（reqBody 来自 post-filter map）
  / WS ingress（payload 来自 post-filter bytes）的语义一致。
- 错误事件 schema：{event_id: "evt_<32hex>", type: "error",
  error: {type: "forbidden_error", code: "policy_violation", message}}，
  与 OpenAI codex 客户端 error event 解析兼容。

Admin / Frontend
- dto.SystemSettings / UpdateSettingsRequest 新增
  openai_fast_policy_settings 字段（omitempty），bulk GET/PUT 接入。
- Settings 页 Gateway 页签新增 Fast/Flex Policy 表单卡片：
  service_tier × action × scope × 模型白名单 × fallback action 全字段配置。
- 前端守门：openaiFastPolicyLoaded 标志仅在 GET 真带回字段时才允许回写，
  避免 rollout/错误把默认规则覆盖成空；saveSettings 回写循环 skip 该字段，
  由专用刷新逻辑处理；仅 action=block 时发送 error_message，匹配后端
  omitempty 行为。

测试
- HTTP 路径：openai_fast_policy_test.go 覆盖默认配置（whitelist=[]，所有
  模型 priority filter）/ block 自定义错误 / scope 区分 / filter 删字段 /
  block 不改 body / block 短路上游 / Anthropic BetaFastMode 触发 OpenAI
  fast policy 等场景。
- WebSocket 路径：openai_fast_policy_ws_test.go 覆盖
    helper 单元（filter / fast→priority 归一化 / flex 透传 / block typed
    error / 无 service_tier 字节不变 / 非 response.create 帧不动 / 空 type
    帧不动 / event_id+code 字段断言 / 非字符串 service_tier 容错）+
    pass 路径 fast 别名归一化回归 +
    ingress 端到端（filter 后上游不含 service_tier / block 后客户端先收
    error event 再收 close 1008 且上游 0 写）+
    passthrough capturedSessionModel fallback 用例（whitelist 策略下首帧
    建立、缺 model 命中 fallback、缺少 fallback 时的 leak 文档化）+
    passthrough session.update / session.created 旋转 capturedSessionModel
    的 mid-session 绕过回归 +
    passthrough billing post-filter ServiceTier 与 idempotent filter 回归。

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>

											
										
										
											2026-04-28 00:34:23 +08:00
+									// Apply OpenAI fast policy (参照 Claude BetaPolicy 的 fast-mode 过滤)：
 									// 针对 body 的 service_tier 字段（"priority" 即 fast，"flex"），按策略
 									// 执行 filter（删除字段）或 block（拒绝请求）。对 gpt-5.5 等模型屏蔽
 									// fast 时在此生效。
 									//
 									// 注意：
 									//   1. 此处统一使用 upstreamModel（已经过 GetMappedModel +
 									//      normalizeOpenAIModelForUpstream + Codex OAuth normalize），与
 									//      chat-completions / messages 入口保持一致，避免不同入口因为模型
 									//      维度不同而出现 whitelist 命中差异。
 									//   2. action=pass 时也要把 raw "fast" 归一化为 "priority" 写回 body，
 									//      否则 native /responses 入口透传 "fast" 给上游会被拒。chat-
 									//      completions 入口由 normalizeResponsesBodyServiceTier 完成同一
 									//      行为，这里手工实现等效逻辑。
 									if rawTier, ok := reqBody["service_tier"].(string); ok {
 										if normTier := normalizedOpenAIServiceTierValue(rawTier); normTier != "" {
 											action, errMsg := s.evaluateOpenAIFastPolicy(ctx, account, upstreamModel, normTier)
 											switch action {
 											case BetaPolicyActionBlock:
 												msg := errMsg
 												if msg == "" {
 													msg = fmt.Sprintf("openai service_tier=%s is not allowed for model %s", normTier, upstreamModel)
 												}
 												blocked := &OpenAIFastBlockedError{Message: msg}
 												writeOpenAIFastPolicyBlockedResponse(c, blocked)
 												return nil, blocked
 											case BetaPolicyActionFilter:
 												delete(reqBody, "service_tier")
 												bodyModified = true
 												disablePatch()
 											default:
 												// pass：若客户端传的是别名 "fast"，归一化为 "priority"
 												// 后写回 body，确保上游收到的是其能识别的规范值。
 												if normTier != rawTier {
 													reqBody["service_tier"] = normTier
 													bodyModified = true
 													markPatchSet("service_tier", normTier)
 												}
 											}
 										}
 									}
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									// Re-serialize body only if modified
 									if bodyModified {
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+										serializedByPatch := false
 										if !patchDisabled && patchHasOp {
 											var patchErr error
 											if patchDelete {
 												body, patchErr = sjson.DeleteBytes(body, patchPath)
 											} else {
 												body, patchErr = sjson.SetBytes(body, patchPath, patchValue)
 											}
 											if patchErr == nil {
 												serializedByPatch = true
 											}
 										}
 										if !serializedByPatch {
 											var marshalErr error
 											body, marshalErr = json.Marshal(reqBody)
 											if marshalErr != nil {
 												return nil, fmt.Errorf("serialize request body: %w", marshalErr)
 											}
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+										}
 									}
 									// Get access token
 									token, _, err := s.GetAccessToken(ctx, account)
 									if err != nil {
 										return nil, err
 									}
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+									// Capture upstream request body for ops retry of this attempt.
 									setOpsUpstreamRequestBody(c, body)
 									// 命中 WS 时仅走 WebSocket Mode；不再自动回退 HTTP。
 									if wsDecision.Transport == OpenAIUpstreamTransportResponsesWebsocketV2 {
 										wsReqBody := reqBody
 										if len(reqBody) > 0 {
 											wsReqBody = make(map[string]any, len(reqBody))
 											for k, v := range reqBody {
 												wsReqBody[k] = v
 											}
 										}
 										_, hasPreviousResponseID := wsReqBody["previous_response_id"]
 										logOpenAIWSModeDebug(
 											"forward_start account_id=%d account_type=%s model=%s stream=%v has_previous_response_id=%v",
 											account.ID,
 											account.Type,
-												refactor: improve model resolution and normalization logic for OpenAI integration

											
										
										
											2026-03-24 19:20:15 +08:00
+											upstreamModel,
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+											reqStream,
 											hasPreviousResponseID,
 										)
 										maxAttempts := openAIWSReconnectRetryLimit + 1
 										wsAttempts := 0
 										var wsResult *OpenAIForwardResult
 										var wsErr error
 										wsLastFailureReason := ""
 										wsPrevResponseRecoveryTried := false
-												fix: handle invalid encrypted content error and retry logic.

											
										
										
											2026-03-14 11:42:42 +08:00
+										wsInvalidEncryptedContentRecoveryTried := false
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+										recoverPrevResponseNotFound := func(attempt int) bool {
 											if wsPrevResponseRecoveryTried {
 												return false
 											}
 											previousResponseID := openAIWSPayloadString(wsReqBody, "previous_response_id")
 											if previousResponseID == "" {
 												logOpenAIWSModeInfo(
 													"reconnect_prev_response_recovery_skip account_id=%d attempt=%d reason=missing_previous_response_id previous_response_id_present=false",
 													account.ID,
 													attempt,
 												)
 												return false
 											}
 											if HasFunctionCallOutput(wsReqBody) {
 												logOpenAIWSModeInfo(
 													"reconnect_prev_response_recovery_skip account_id=%d attempt=%d reason=has_function_call_output previous_response_id_present=true",
 													account.ID,
 													attempt,
 												)
 												return false
 											}
 											delete(wsReqBody, "previous_response_id")
 											wsPrevResponseRecoveryTried = true
 											logOpenAIWSModeInfo(
 												"reconnect_prev_response_recovery account_id=%d attempt=%d action=drop_previous_response_id retry=1 previous_response_id=%s previous_response_id_kind=%s",
 												account.ID,
 												attempt,
 												truncateOpenAIWSLogValue(previousResponseID, openAIWSIDValueMaxLen),
 												normalizeOpenAIWSLogValue(ClassifyOpenAIPreviousResponseIDKind(previousResponseID)),
 											)
 											return true
 										}
-												fix: handle invalid encrypted content error and retry logic.

											
										
										
											2026-03-14 11:42:42 +08:00
+										recoverInvalidEncryptedContent := func(attempt int) bool {
 											if wsInvalidEncryptedContentRecoveryTried {
 												return false
 											}
 											removedReasoningItems := trimOpenAIEncryptedReasoningItems(wsReqBody)
 											if !removedReasoningItems {
 												logOpenAIWSModeInfo(
 													"reconnect_invalid_encrypted_content_recovery_skip account_id=%d attempt=%d reason=missing_encrypted_reasoning_items",
 													account.ID,
 													attempt,
 												)
 												return false
 											}
 											previousResponseID := openAIWSPayloadString(wsReqBody, "previous_response_id")
 											hasFunctionCallOutput := HasFunctionCallOutput(wsReqBody)
 											if previousResponseID != "" && !hasFunctionCallOutput {
 												delete(wsReqBody, "previous_response_id")
 											}
 											wsInvalidEncryptedContentRecoveryTried = true
 											logOpenAIWSModeInfo(
 												"reconnect_invalid_encrypted_content_recovery account_id=%d attempt=%d action=drop_encrypted_reasoning_items retry=1 previous_response_id_present=%v previous_response_id=%s previous_response_id_kind=%s has_function_call_output=%v dropped_previous_response_id=%v",
 												account.ID,
 												attempt,
 												previousResponseID != "",
 												truncateOpenAIWSLogValue(previousResponseID, openAIWSIDValueMaxLen),
 												normalizeOpenAIWSLogValue(ClassifyOpenAIPreviousResponseIDKind(previousResponseID)),
 												hasFunctionCallOutput,
 												previousResponseID != "" && !hasFunctionCallOutput,
 											)
 											return true
 										}
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+										retryBudget := s.openAIWSRetryTotalBudget()
 										retryStartedAt := time.Now()
 									wsRetryLoop:
 										for attempt := 1; attempt <= maxAttempts; attempt++ {
 											wsAttempts = attempt
 											wsResult, wsErr = s.forwardOpenAIWSV2(
 												ctx,
 												c,
 												account,
 												wsReqBody,
 												token,
 												wsDecision,
 												isCodexCLI,
 												reqStream,
 												originalModel,
-												refactor: improve model resolution and normalization logic for OpenAI integration

											
										
										
											2026-03-24 19:20:15 +08:00
+												upstreamModel,
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+												startTime,
 												attempt,
 												wsLastFailureReason,
 											)
 											if wsErr == nil {
 												break
 											}
 											if c != nil && c.Writer != nil && c.Writer.Written() {
 												break
 											}
 											reason, retryable := classifyOpenAIWSReconnectReason(wsErr)
 											if reason != "" {
 												wsLastFailureReason = reason
 											}
 											// previous_response_not_found 说明续链锚点不可用：
 											// 对非 function_call_output 场景，允许一次“去掉 previous_response_id 后重放”。
 											if reason == "previous_response_not_found" && recoverPrevResponseNotFound(attempt) {
 												continue
 											}
-												fix: handle invalid encrypted content error and retry logic.

											
										
										
											2026-03-14 11:42:42 +08:00
+											if reason == "invalid_encrypted_content" && recoverInvalidEncryptedContent(attempt) {
 												continue
 											}
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+											if retryable && attempt < maxAttempts {
 												backoff := s.openAIWSRetryBackoff(attempt)
 												if retryBudget > 0 && time.Since(retryStartedAt)+backoff > retryBudget {
 													s.recordOpenAIWSRetryExhausted()
 													logOpenAIWSModeInfo(
 														"reconnect_budget_exhausted account_id=%d attempts=%d max_retries=%d reason=%s elapsed_ms=%d budget_ms=%d",
 														account.ID,
 														attempt,
 														openAIWSReconnectRetryLimit,
 														normalizeOpenAIWSLogValue(reason),
 														time.Since(retryStartedAt).Milliseconds(),
 														retryBudget.Milliseconds(),
 													)
 													break
 												}
 												s.recordOpenAIWSRetryAttempt(backoff)
 												logOpenAIWSModeInfo(
 													"reconnect_retry account_id=%d retry=%d max_retries=%d reason=%s backoff_ms=%d",
 													account.ID,
 													attempt,
 													openAIWSReconnectRetryLimit,
 													normalizeOpenAIWSLogValue(reason),
 													backoff.Milliseconds(),
 												)
 												if backoff > 0 {
 													timer := time.NewTimer(backoff)
 													select {
 													case <-ctx.Done():
 														if !timer.Stop() {
 															<-timer.C
 														}
 														wsErr = wrapOpenAIWSFallback("retry_backoff_canceled", ctx.Err())
 														break wsRetryLoop
 													case <-timer.C:
 													}
 												}
 												continue
 											}
 											if retryable {
 												s.recordOpenAIWSRetryExhausted()
 												logOpenAIWSModeInfo(
 													"reconnect_exhausted account_id=%d attempts=%d max_retries=%d reason=%s",
 													account.ID,
 													attempt,
 													openAIWSReconnectRetryLimit,
 													normalizeOpenAIWSLogValue(reason),
 												)
 											} else if reason != "" {
 												s.recordOpenAIWSNonRetryableFastFallback()
 												logOpenAIWSModeInfo(
 													"reconnect_stop account_id=%d attempt=%d reason=%s",
 													account.ID,
 													attempt,
 													normalizeOpenAIWSLogValue(reason),
 												)
 											}
 											break
 										}
 										if wsErr == nil {
 											firstTokenMs := int64(0)
 											hasFirstTokenMs := wsResult != nil && wsResult.FirstTokenMs != nil
 											if hasFirstTokenMs {
 												firstTokenMs = int64(*wsResult.FirstTokenMs)
 											}
 											requestID := ""
 											if wsResult != nil {
 												requestID = strings.TrimSpace(wsResult.RequestID)
 											}
 											logOpenAIWSModeDebug(
 												"forward_succeeded account_id=%d request_id=%s stream=%v has_first_token_ms=%v first_token_ms=%d ws_attempts=%d",
 												account.ID,
 												requestID,
 												reqStream,
 												hasFirstTokenMs,
 												firstTokenMs,
 												wsAttempts,
 											)
-												refactor: improve model resolution and normalization logic for OpenAI integration

											
										
										
											2026-03-24 19:20:15 +08:00
+											wsResult.UpstreamModel = upstreamModel
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+											return wsResult, nil
 										}
 										s.writeOpenAIWSFallbackErrorResponse(c, account, wsErr)
 										return nil, wsErr
 									}
-												fix: handle invalid encrypted content error and retry logic.

											
										
										
											2026-03-14 11:42:42 +08:00
+									httpInvalidEncryptedContentRetryTried := false
 									for {
 										// Build upstream request
-												Merge remote-tracking branch 'origin/main' into fix/enc_coot

# Conflicts:
#	backend/internal/service/openai_gateway_service.go

											
										
										
											2026-03-14 13:04:24 +08:00
+										upstreamCtx, releaseUpstreamCtx := detachStreamUpstreamContext(ctx, reqStream)
 										upstreamReq, err := s.buildUpstreamRequest(upstreamCtx, c, account, body, token, reqStream, promptCacheKey, isCodexCLI)
 										releaseUpstreamCtx()
-												fix: handle invalid encrypted content error and retry logic.

											
										
										
											2026-03-14 11:42:42 +08:00
+										if err != nil {
 											return nil, err
 										}
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
-												fix: handle invalid encrypted content error and retry logic.

											
										
										
											2026-03-14 11:42:42 +08:00
+										// Get proxy URL
 										proxyURL := ""
 										if account.ProxyID != nil && account.Proxy != nil {
 											proxyURL = account.Proxy.URL()
 										}
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
-												fix: handle invalid encrypted content error and retry logic.

											
										
										
											2026-03-14 11:42:42 +08:00
+										// Send request
 										upstreamStart := time.Now()
 										resp, err := s.httpUpstream.Do(upstreamReq, proxyURL, account.ID, account.Concurrency)
 										SetOpsLatencyMs(c, OpsUpstreamLatencyMsKey, time.Since(upstreamStart).Milliseconds())
 										if err != nil {
 											// Ensure the client receives an error response (handlers assume Forward writes on non-failover errors).
 											safeErr := sanitizeUpstreamErrorMessage(err.Error())
 											setOpsUpstreamError(c, 0, safeErr, "")
-												feat(ops): 实现上游错误事件记录与查询功能

**新增功能**:
- 新建ops_upstream_error_events表存储上游服务错误详情
- 支持记录上游429/529/5xx错误的详细上下文信息
- 提供按时间范围查询上游错误事件的API

**后端改动**:
1. 模型层（ops_models.go, ops_port.go）:
   - 新增UpstreamErrorEvent结构体
   - 扩展Repository接口支持上游错误事件CRUD

2. 仓储层（ops_repo.go）:
   - 实现InsertUpstreamErrorEvent写入上游错误
   - 实现GetUpstreamErrorEvents按时间范围查询

3. 服务层（ops_service.go, ops_upstream_context.go）:
   - ops_service: 新增GetUpstreamErrorEvents查询方法
   - ops_upstream_context: 封装上游错误上下文构建逻辑

4. Handler层（ops_error_logger.go）:
   - 新增GetUpstreamErrorsHandler处理上游错误查询请求

5. Gateway层集成:
   - antigravity_gateway_service.go: 429/529错误时记录上游事件
   - gateway_service.go: OpenAI 429/5xx错误时记录
   - gemini_messages_compat_service.go: Gemini 429/5xx错误时记录
   - openai_gateway_service.go: OpenAI 429/5xx错误时记录
   - ratelimit_service.go: 429限流错误时记录

**数据记录字段**:
- request_id: 关联ops_logs主记录
- platform/model: 上游服务标识
- status_code/error_message: 错误详情
- request_headers/response_body: 调试信息（可选）
- created_at: 错误发生时间

											
										
										
											2026-01-11 15:30:27 +08:00
+											appendOpsUpstreamError(c, OpsUpstreamErrorEvent{
 												Platform:           account.Platform,
 												AccountID:          account.ID,
-												feat: merge dev

											
										
										
											2026-01-15 15:14:44 +08:00
+												AccountName:        account.Name,
-												fix: handle invalid encrypted content error and retry logic.

											
										
										
											2026-03-14 11:42:42 +08:00
+												UpstreamStatusCode: 0,
 												Kind:               "request_error",
 												Message:            safeErr,
 											})
 											c.JSON(http.StatusBadGateway, gin.H{
 												"error": gin.H{
 													"type":    "upstream_error",
 													"message": "Upstream request failed",
 												},
-												feat(ops): 实现上游错误事件记录与查询功能

**新增功能**:
- 新建ops_upstream_error_events表存储上游服务错误详情
- 支持记录上游429/529/5xx错误的详细上下文信息
- 提供按时间范围查询上游错误事件的API

**后端改动**:
1. 模型层（ops_models.go, ops_port.go）:
   - 新增UpstreamErrorEvent结构体
   - 扩展Repository接口支持上游错误事件CRUD

2. 仓储层（ops_repo.go）:
   - 实现InsertUpstreamErrorEvent写入上游错误
   - 实现GetUpstreamErrorEvents按时间范围查询

3. 服务层（ops_service.go, ops_upstream_context.go）:
   - ops_service: 新增GetUpstreamErrorEvents查询方法
   - ops_upstream_context: 封装上游错误上下文构建逻辑

4. Handler层（ops_error_logger.go）:
   - 新增GetUpstreamErrorsHandler处理上游错误查询请求

5. Gateway层集成:
   - antigravity_gateway_service.go: 429/529错误时记录上游事件
   - gateway_service.go: OpenAI 429/5xx错误时记录
   - gemini_messages_compat_service.go: Gemini 429/5xx错误时记录
   - openai_gateway_service.go: OpenAI 429/5xx错误时记录
   - ratelimit_service.go: 429限流错误时记录

**数据记录字段**:
- request_id: 关联ops_logs主记录
- platform/model: 上游服务标识
- status_code/error_message: 错误详情
- request_headers/response_body: 调试信息（可选）
- created_at: 错误发生时间

											
										
										
											2026-01-11 15:30:27 +08:00
+											})
-												fix: handle invalid encrypted content error and retry logic.

											
										
										
											2026-03-14 11:42:42 +08:00
+											return nil, fmt.Errorf("upstream request failed: %s", safeErr)
 										}
 										// Handle error response
 										if resp.StatusCode >= 400 {
 											respBody, _ := io.ReadAll(io.LimitReader(resp.Body, 2<<20))
 											_ = resp.Body.Close()
 											resp.Body = io.NopCloser(bytes.NewReader(respBody))
 											upstreamMsg := strings.TrimSpace(extractUpstreamErrorMessage(respBody))
 											upstreamMsg = sanitizeUpstreamErrorMessage(upstreamMsg)
 											upstreamCode := extractUpstreamErrorCode(respBody)
 											if !httpInvalidEncryptedContentRetryTried && resp.StatusCode == http.StatusBadRequest && upstreamCode == "invalid_encrypted_content" {
 												if trimOpenAIEncryptedReasoningItems(reqBody) {
 													body, err = json.Marshal(reqBody)
 													if err != nil {
 														return nil, fmt.Errorf("serialize invalid_encrypted_content retry body: %w", err)
 													}
 													setOpsUpstreamRequestBody(c, body)
 													httpInvalidEncryptedContentRetryTried = true
 													logger.LegacyPrintf("service.openai_gateway", "[OpenAI] Retrying non-WSv2 request once after invalid_encrypted_content (account: %s)", account.Name)
 													continue
 												}
 												logger.LegacyPrintf("service.openai_gateway", "[OpenAI] Skip non-WSv2 invalid_encrypted_content retry because encrypted reasoning items are missing (account: %s)", account.Name)
 											}
 											if s.shouldFailoverOpenAIUpstreamResponse(resp.StatusCode, upstreamMsg, respBody) {
 												upstreamDetail := ""
 												if s.cfg != nil && s.cfg.Gateway.LogUpstreamErrorBody {
 													maxBytes := s.cfg.Gateway.LogUpstreamErrorBodyMaxBytes
 													if maxBytes <= 0 {
 														maxBytes = 2048
 													}
 													upstreamDetail = truncateString(string(respBody), maxBytes)
 												}
 												appendOpsUpstreamError(c, OpsUpstreamErrorEvent{
 													Platform:           account.Platform,
 													AccountID:          account.ID,
 													AccountName:        account.Name,
 													UpstreamStatusCode: resp.StatusCode,
 													UpstreamRequestID:  resp.Header.Get("x-request-id"),
 													Kind:               "failover",
 													Message:            upstreamMsg,
 													Detail:             upstreamDetail,
 												})
-												feat(ops): 实现上游错误事件记录与查询功能

**新增功能**:
- 新建ops_upstream_error_events表存储上游服务错误详情
- 支持记录上游429/529/5xx错误的详细上下文信息
- 提供按时间范围查询上游错误事件的API

**后端改动**:
1. 模型层（ops_models.go, ops_port.go）:
   - 新增UpstreamErrorEvent结构体
   - 扩展Repository接口支持上游错误事件CRUD

2. 仓储层（ops_repo.go）:
   - 实现InsertUpstreamErrorEvent写入上游错误
   - 实现GetUpstreamErrorEvents按时间范围查询

3. 服务层（ops_service.go, ops_upstream_context.go）:
   - ops_service: 新增GetUpstreamErrorEvents查询方法
   - ops_upstream_context: 封装上游错误上下文构建逻辑

4. Handler层（ops_error_logger.go）:
   - 新增GetUpstreamErrorsHandler处理上游错误查询请求

5. Gateway层集成:
   - antigravity_gateway_service.go: 429/529错误时记录上游事件
   - gateway_service.go: OpenAI 429/5xx错误时记录
   - gemini_messages_compat_service.go: Gemini 429/5xx错误时记录
   - openai_gateway_service.go: OpenAI 429/5xx错误时记录
   - ratelimit_service.go: 429限流错误时记录

**数据记录字段**:
- request_id: 关联ops_logs主记录
- platform/model: 上游服务标识
- status_code/error_message: 错误详情
- request_headers/response_body: 调试信息（可选）
- created_at: 错误发生时间

											
										
										
											2026-01-11 15:30:27 +08:00
-												fix: handle invalid encrypted content error and retry logic.

											
										
										
											2026-03-14 11:42:42 +08:00
+												s.handleFailoverSideEffects(ctx, resp, account)
 												return nil, &UpstreamFailoverError{
 													StatusCode:             resp.StatusCode,
 													ResponseBody:           respBody,
 													RetryableOnSameAccount: account.IsPoolMode() && (isPoolModeRetryableStatus(resp.StatusCode) || isOpenAITransientProcessingError(resp.StatusCode, upstreamMsg, respBody)),
 												}
-												feat: 支持 API Key 上游池模式同账号重试次数配置与自定义错误策略

											
										
										
											2026-03-08 13:57:23 +08:00
+											}
-												fix: handle invalid encrypted content error and retry logic.

											
										
										
											2026-03-14 11:42:42 +08:00
+											return s.handleErrorResponse(ctx, resp, c, account, body)
-												feat: cc/codex support account retry

											
										
										
											2025-12-27 11:44:00 +08:00
+										}
-												fix: handle invalid encrypted content error and retry logic.

											
										
										
											2026-03-14 11:42:42 +08:00
+										defer func() { _ = resp.Body.Close() }()
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
-												fix: handle invalid encrypted content error and retry logic.

											
										
										
											2026-03-14 11:42:42 +08:00
+										// Handle normal response
 										var usage *OpenAIUsage
 										var firstTokenMs *int
 										if reqStream {
-												refactor: improve model resolution and normalization logic for OpenAI integration

											
										
										
											2026-03-24 19:20:15 +08:00
+											streamResult, err := s.handleStreamingResponse(ctx, resp, c, account, startTime, originalModel, upstreamModel)
-												fix: handle invalid encrypted content error and retry logic.

											
										
										
											2026-03-14 11:42:42 +08:00
+											if err != nil {
 												return nil, err
 											}
 											usage = streamResult.usage
 											firstTokenMs = streamResult.firstTokenMs
 										} else {
-												refactor: improve model resolution and normalization logic for OpenAI integration

											
										
										
											2026-03-24 19:20:15 +08:00
+											usage, err = s.handleNonStreamingResponse(ctx, resp, c, account, originalModel, upstreamModel)
-												fix: handle invalid encrypted content error and retry logic.

											
										
										
											2026-03-14 11:42:42 +08:00
+											if err != nil {
 												return nil, err
 											}
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+										}
-												fix: handle invalid encrypted content error and retry logic.

											
										
										
											2026-03-14 11:42:42 +08:00
+										// Extract and save Codex usage snapshot from response headers (for OAuth accounts)
 										if account.Type == AccountTypeOAuth {
 											if snapshot := ParseCodexRateLimitHeaders(resp.Header); snapshot != nil {
 												s.updateCodexUsageSnapshot(ctx, account.ID, snapshot)
 											}
-												feat: OpenAI OAuth账号显示Codex使用量

从响应头提取x-codex-*使用量信息并保存到账号Extra字段，
前端账号列表展示5h/7d窗口的使用进度条。

											
										
										
											2025-12-23 16:26:07 +08:00
+										}
-												fix: handle invalid encrypted content error and retry logic.

											
										
										
											2026-03-14 11:42:42 +08:00
+										if usage == nil {
 											usage = &OpenAIUsage{}
 										}
-												fix(openai): 修复 usage 为空导致 panic（P0-02）

											
										
										
											2026-02-07 16:15:30 +08:00
-												fix: handle invalid encrypted content error and retry logic.

											
										
										
											2026-03-14 11:42:42 +08:00
+										reasoningEffort := extractOpenAIReasoningEffort(reqBody, originalModel)
 										serviceTier := extractOpenAIServiceTier(reqBody)
-												feat(usage): add reasoning effort column

											
										
										
											2026-02-03 14:36:29 +08:00
-												fix: handle invalid encrypted content error and retry logic.

											
										
										
											2026-03-14 11:42:42 +08:00
+										return &OpenAIForwardResult{
 											RequestID:       resp.Header.Get("x-request-id"),
 											Usage:           *usage,
 											Model:           originalModel,
-												refactor: improve model resolution and normalization logic for OpenAI integration

											
										
										
											2026-03-24 19:20:15 +08:00
+											UpstreamModel:   upstreamModel,
-												fix: handle invalid encrypted content error and retry logic.

											
										
										
											2026-03-14 11:42:42 +08:00
+											ServiceTier:     serviceTier,
 											ReasoningEffort: reasoningEffort,
 											Stream:          reqStream,
 											OpenAIWSMode:    false,
 											Duration:        time.Since(startTime),
 											FirstTokenMs:    firstTokenMs,
 										}, nil
 									}
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+								}
-												feat(openai): 支持自动透传开关并透传 User-Agent

- OpenAI OAuth/API Key 统一支持自动透传开关，编辑页可开关
- 透传模式仅替换认证并保留计费/并发/审计，修复 API Key responses 端点拼接
- Usage 页面显示原始 User-Agent 且不截断，补充回归测试与清单

											
										
										
											2026-02-12 10:56:07 +08:00
+								func (s *OpenAIGatewayService) forwardOpenAIPassthrough(
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
+									ctx context.Context,
 									c *gin.Context,
 									account *Account,
 									body []byte,
 									reqModel string,
 									reasoningEffort *string,
 									reqStream bool,
 									startTime time.Time,
 								) (*OpenAIForwardResult, error) {
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+									upstreamPassthroughModel := ""
 									if isOpenAIResponsesCompactPath(c) {
 										compactMappedModel := resolveOpenAICompactForwardModel(account, reqModel)
 										if compactMappedModel != "" && compactMappedModel != reqModel {
 											nextBody, setErr := sjson.SetBytes(body, "model", compactMappedModel)
 											if setErr != nil {
 												return nil, fmt.Errorf("set compact passthrough model: %w", setErr)
 											}
 											body = nextBody
 											upstreamPassthroughModel = compactMappedModel
 										}
 									}
-												fix(openai): 透传OAuth强制store/stream并修复Codex识别

											
										
										
											2026-02-12 21:02:52 +08:00
+									if account != nil && account.Type == AccountTypeOAuth {
-												fix(openai): 自动透传预检 instructions 并本地 403 拦截

											
										
										
											2026-02-14 10:49:01 +08:00
+										if rejectReason := detectOpenAIPassthroughInstructionsRejectReason(reqModel, body); rejectReason != "" {
 											rejectMsg := "OpenAI codex passthrough requires a non-empty instructions field"
 											setOpsUpstreamError(c, http.StatusForbidden, rejectMsg, "")
 											appendOpsUpstreamError(c, OpsUpstreamErrorEvent{
 												Platform:           account.Platform,
 												AccountID:          account.ID,
 												AccountName:        account.Name,
 												UpstreamStatusCode: http.StatusForbidden,
 												Passthrough:        true,
 												Kind:               "request_error",
 												Message:            rejectMsg,
 												Detail:             rejectReason,
 											})
 											logOpenAIPassthroughInstructionsRejected(ctx, c, account, reqModel, rejectReason, body)
 											c.JSON(http.StatusForbidden, gin.H{
 												"error": gin.H{
 													"type":    "forbidden_error",
 													"message": rejectMsg,
 												},
 											})
 											return nil, fmt.Errorf("openai passthrough rejected before upstream: %s", rejectReason)
 										}
-												fix(openai): support remote compact task

											
										
										
											2026-03-06 18:50:28 +08:00
+										normalizedBody, normalized, err := normalizeOpenAIPassthroughOAuthBody(body, isOpenAIResponsesCompactPath(c))
-												fix(openai): 透传OAuth强制store/stream并修复Codex识别

											
										
										
											2026-02-12 21:02:52 +08:00
+										if err != nil {
 											return nil, err
 										}
 										if normalized {
 											body = normalizedBody
 										}
-												fix(openai): support remote compact task

											
										
										
											2026-03-06 18:50:28 +08:00
+										reqStream = gjson.GetBytes(body, "stream").Bool()
-												fix(openai): 透传OAuth强制store/stream并修复Codex识别

											
										
										
											2026-02-12 21:02:52 +08:00
+									}
-												fix(openai): sanitize empty base64 input images

											
										
										
											2026-04-01 00:46:38 +08:00
+									sanitizedBody, sanitized, err := sanitizeEmptyBase64InputImagesInOpenAIBody(body)
 									if err != nil {
 										return nil, err
 									}
 									if sanitized {
 										body = sanitizedBody
 									}
-												feat(openai): OpenAI Fast/Flex Policy 完整实现（HTTP + WebSocket + Admin）

对称参照 Claude BetaPolicy 的 fast-mode 过滤实现，新增针对 OpenAI 上游
service_tier 字段（priority / flex，含客户端 "fast" → "priority" 归一化）的
pass / filter / block 三态策略，覆盖全部 OpenAI 入口 + admin 配置入口。

后端核心
- 新增 SettingKeyOpenAIFastPolicySettings、OpenAIFastPolicyRule、
  OpenAIFastPolicySettings 配置模型，含规则的 service_tier × action × scope
  × 模型白名单 × fallback action 维度。
- SettingService.Get/SetOpenAIFastPolicySettings；缺失时返回内置默认策略
  （所有模型的 priority 走 filter，whitelist 为空，fallback=pass）。设计
  依据：service_tier=fast 是用户级开关，与 model 字段正交，默认锁定特定
  model slug 会留下"用 gpt-4 + fast 透传 priority 上游"的绕过路径。JSON
  解析失败不再静默 fallback，slog.Warn 记录脏数据，便于运维定位。
- service_tier 归一化（trim + ToLower + fast→priority + 白名单 priority/flex）
  与策略评估（evaluateOpenAIFastPolicy）作为唯一真实来源，HTTP / WS 共用。
  抽出纯函数 evaluateOpenAIFastPolicyWithSettings，配合 ctx-bound settings
  快照（withOpenAIFastPolicyContext / openAIFastPolicySettingsFromContext），
  WS 长会话入口预取一次后所有帧复用，避免每帧打到 settingService。

HTTP 入口（4 个）
- Chat Completions、Anthropic 兼容（Messages，含 BetaFastMode→priority 二次
  命中）、原生 Responses、Passthrough Responses 全部接入
  applyOpenAIFastPolicyToBody，filter 走 sjson 顶层删除 service_tier，block
  返回 403 forbidden_error JSON。
- 4 入口统一使用 upstream 视角的 model（GetMappedModel +
  normalizeOpenAIModelForUpstream + Codex OAuth normalize 后的 slug），
  避免 chat/messages/native /responses/passthrough 因为 model 维度不同
  造成 whitelist 命中差异。
- 在 pass 路径也把客户端 "fast" 别名归一化为 "priority" 写回 body，
  否则 native /responses 与 passthrough 入口会把 "fast" 原样透传给上游
  导致 400/拒绝（chat-completions 入口的 normalizeResponsesBodyServiceTier
  此前已具备同等行为）。

WebSocket 入口
- 新增 applyOpenAIFastPolicyToWSResponseCreate：严格匹配
  type="response.create"，仅处理顶层 service_tier；filter 用 sjson 删字段，
  block 返回 typed *OpenAIFastBlockedError。
- ingress 路径在 parseClientPayload 内调用，block 命中先 Write Realtime
  风格 error event 再返回 OpenAIWSClientCloseError(StatusPolicyViolation
  =1008)，依赖底层 WebSocket Conn.Write 的同步 flush 保证 error 先于
  close。
- passthrough 路径在 RunEntry 前对 firstClientMessage 应用策略，并通过
  openAIWSPolicyEnforcingFrameConn 包装 ReadFrame 对每个 client→upstream
  帧执行策略；后续帧无 model 字段时回退到 capturedSessionModel。
  filter 闭包内同时侦测 session.update / session.created 帧的 session.model
  字段刷新 capturedSessionModel，封堵"首帧 model=gpt-4o（pass）→
  session.update 改为 gpt-5.5 → 不带 model 的 response.create fallback
  到 gpt-4o"的 mid-session 绕过路径。
- passthrough billing：requestServiceTier 在策略 filter 之后再从
  firstClientMessage 提取，filter 命中时 OpenAIForwardResult.ServiceTier
  上报 nil（default tier），与 HTTP 入口（reqBody 来自 post-filter map）
  / WS ingress（payload 来自 post-filter bytes）的语义一致。
- 错误事件 schema：{event_id: "evt_<32hex>", type: "error",
  error: {type: "forbidden_error", code: "policy_violation", message}}，
  与 OpenAI codex 客户端 error event 解析兼容。

Admin / Frontend
- dto.SystemSettings / UpdateSettingsRequest 新增
  openai_fast_policy_settings 字段（omitempty），bulk GET/PUT 接入。
- Settings 页 Gateway 页签新增 Fast/Flex Policy 表单卡片：
  service_tier × action × scope × 模型白名单 × fallback action 全字段配置。
- 前端守门：openaiFastPolicyLoaded 标志仅在 GET 真带回字段时才允许回写，
  避免 rollout/错误把默认规则覆盖成空；saveSettings 回写循环 skip 该字段，
  由专用刷新逻辑处理；仅 action=block 时发送 error_message，匹配后端
  omitempty 行为。

测试
- HTTP 路径：openai_fast_policy_test.go 覆盖默认配置（whitelist=[]，所有
  模型 priority filter）/ block 自定义错误 / scope 区分 / filter 删字段 /
  block 不改 body / block 短路上游 / Anthropic BetaFastMode 触发 OpenAI
  fast policy 等场景。
- WebSocket 路径：openai_fast_policy_ws_test.go 覆盖
    helper 单元（filter / fast→priority 归一化 / flex 透传 / block typed
    error / 无 service_tier 字节不变 / 非 response.create 帧不动 / 空 type
    帧不动 / event_id+code 字段断言 / 非字符串 service_tier 容错）+
    pass 路径 fast 别名归一化回归 +
    ingress 端到端（filter 后上游不含 service_tier / block 后客户端先收
    error event 再收 close 1008 且上游 0 写）+
    passthrough capturedSessionModel fallback 用例（whitelist 策略下首帧
    建立、缺 model 命中 fallback、缺少 fallback 时的 leak 文档化）+
    passthrough session.update / session.created 旋转 capturedSessionModel
    的 mid-session 绕过回归 +
    passthrough billing post-filter ServiceTier 与 idempotent filter 回归。

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>

											
										
										
											2026-04-28 00:34:23 +08:00
+									// Apply OpenAI fast policy to the passthrough body (filter/block by service_tier).
 									// 统一使用 upstream 视角的 model：透传路径下 body 已经过 compact 映射 +
 									// OAuth normalize，body 中的 model 字段即上游真正会看到的 slug。
 									// 这样可以与 chat-completions / messages / native /responses 入口的
 									// upstreamModel 保持一致，避免 whitelist 命中差异。当 body 中没有
 									// model 字段时退回 reqModel。
 									policyModel := strings.TrimSpace(gjson.GetBytes(body, "model").String())
 									if policyModel == "" {
 										policyModel = reqModel
 									}
 									updatedBody, policyErr := s.applyOpenAIFastPolicyToBody(ctx, account, policyModel, body)
 									if policyErr != nil {
 										var blocked *OpenAIFastBlockedError
 										if errors.As(policyErr, &blocked) {
 											writeOpenAIFastPolicyBlockedResponse(c, blocked)
 										}
 										return nil, policyErr
 									}
 									body = updatedBody
-												chore(logging): 完成后端日志审计与结构化迁移

- 将高密度服务与处理器日志迁移到新日志系统（LegacyPrintf/结构化日志）
- 增加 stdlog bridge 与兼容测试，保留旧日志捕获能力
- 将 OpenAI 断流告警改为结构化 Warn 并改造对应测试为 sink 捕获
- 补齐后端相关文件 logger 引用并通过全量 go test

											
										
										
											2026-02-12 19:01:09 +08:00
+									logger.LegacyPrintf("service.openai_gateway",
-												fix(openai): 增强自动透传命中日志

											
										
										
											2026-02-12 11:41:06 +08:00
+										"[OpenAI 自动透传] 命中自动透传分支: account=%d name=%s type=%s model=%s stream=%v",
 										account.ID,
 										account.Name,
 										account.Type,
 										reqModel,
 										reqStream,
 									)
-												fix(gateway): 默认过滤OpenAI透传超时头并补充断流告警

											
										
										
											2026-02-12 14:16:18 +08:00
+									if reqStream && c != nil && c.Request != nil {
 										if timeoutHeaders := collectOpenAIPassthroughTimeoutHeaders(c.Request.Header); len(timeoutHeaders) > 0 {
-												chore(logging): 完成后端日志审计与结构化迁移

- 将高密度服务与处理器日志迁移到新日志系统（LegacyPrintf/结构化日志）
- 增加 stdlog bridge 与兼容测试，保留旧日志捕获能力
- 将 OpenAI 断流告警改为结构化 Warn 并改造对应测试为 sink 捕获
- 补齐后端相关文件 logger 引用并通过全量 go test

											
										
										
											2026-02-12 19:01:09 +08:00
+											streamWarnLogger := logger.FromContext(ctx).With(
 												zap.String("component", "service.openai_gateway"),
 												zap.Int64("account_id", account.ID),
 												zap.Strings("timeout_headers", timeoutHeaders),
 											)
-												fix(gateway): 默认过滤OpenAI透传超时头并补充断流告警

											
										
										
											2026-02-12 14:16:18 +08:00
+											if s.isOpenAIPassthroughTimeoutHeadersAllowed() {
-												chore(logging): 完成后端日志审计与结构化迁移

- 将高密度服务与处理器日志迁移到新日志系统（LegacyPrintf/结构化日志）
- 增加 stdlog bridge 与兼容测试，保留旧日志捕获能力
- 将 OpenAI 断流告警改为结构化 Warn 并改造对应测试为 sink 捕获
- 补齐后端相关文件 logger 引用并通过全量 go test

											
										
										
											2026-02-12 19:01:09 +08:00
+												streamWarnLogger.Warn("OpenAI passthrough 透传请求包含超时相关请求头，且当前配置为放行，可能导致上游提前断流")
-												fix(gateway): 默认过滤OpenAI透传超时头并补充断流告警

											
										
										
											2026-02-12 14:16:18 +08:00
+											} else {
-												chore(logging): 完成后端日志审计与结构化迁移

- 将高密度服务与处理器日志迁移到新日志系统（LegacyPrintf/结构化日志）
- 增加 stdlog bridge 与兼容测试，保留旧日志捕获能力
- 将 OpenAI 断流告警改为结构化 Warn 并改造对应测试为 sink 捕获
- 补齐后端相关文件 logger 引用并通过全量 go test

											
										
										
											2026-02-12 19:01:09 +08:00
+												streamWarnLogger.Warn("OpenAI passthrough 检测到超时相关请求头，将按配置过滤以降低断流风险")
-												fix(gateway): 默认过滤OpenAI透传超时头并补充断流告警

											
										
										
											2026-02-12 14:16:18 +08:00
+											}
 										}
 									}
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
 									// Get access token
 									token, _, err := s.GetAccessToken(ctx, account)
 									if err != nil {
 										return nil, err
 									}
-												feat: decouple billing correctness from usage log batching

											
										
										
											2026-03-12 16:53:18 +08:00
+									upstreamCtx, releaseUpstreamCtx := detachStreamUpstreamContext(ctx, reqStream)
 									upstreamReq, err := s.buildUpstreamRequestOpenAIPassthrough(upstreamCtx, c, account, body, token)
 									releaseUpstreamCtx()
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
+									if err != nil {
 										return nil, err
 									}
 									proxyURL := ""
 									if account.ProxyID != nil && account.Proxy != nil {
 										proxyURL = account.Proxy.URL()
 									}
-												feat(openai): 极致优化 OAuth 链路并补齐性能守护

- 优化 /v1/responses 热路径，减少重复解析与不必要拷贝
- 优化并发与 token 竞争路径并补齐运行指标
- 补充 OpenAI/Ops 相关单元测试与回归用例
- 新增灰度阈值守护与压测脚本，支撑发布验收

											
										
										
											2026-02-12 09:41:37 +08:00
+									setOpsUpstreamRequestBody(c, body)
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
+									if c != nil {
 										c.Set("openai_passthrough", true)
 									}
-												feat(openai): 极致优化 OAuth 链路并补齐性能守护

- 优化 /v1/responses 热路径，减少重复解析与不必要拷贝
- 优化并发与 token 竞争路径并补齐运行指标
- 补充 OpenAI/Ops 相关单元测试与回归用例
- 新增灰度阈值守护与压测脚本，支撑发布验收

											
										
										
											2026-02-12 09:41:37 +08:00
+									upstreamStart := time.Now()
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
+									resp, err := s.httpUpstream.Do(upstreamReq, proxyURL, account.ID, account.Concurrency)
-												feat(openai): 极致优化 OAuth 链路并补齐性能守护

- 优化 /v1/responses 热路径，减少重复解析与不必要拷贝
- 优化并发与 token 竞争路径并补齐运行指标
- 补充 OpenAI/Ops 相关单元测试与回归用例
- 新增灰度阈值守护与压测脚本，支撑发布验收

											
										
										
											2026-02-12 09:41:37 +08:00
+									SetOpsLatencyMs(c, OpsUpstreamLatencyMsKey, time.Since(upstreamStart).Milliseconds())
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
+									if err != nil {
 										safeErr := sanitizeUpstreamErrorMessage(err.Error())
 										setOpsUpstreamError(c, 0, safeErr, "")
 										appendOpsUpstreamError(c, OpsUpstreamErrorEvent{
 											Platform:           account.Platform,
 											AccountID:          account.ID,
 											AccountName:        account.Name,
 											UpstreamStatusCode: 0,
 											Passthrough:        true,
 											Kind:               "request_error",
 											Message:            safeErr,
 										})
 										c.JSON(http.StatusBadGateway, gin.H{
 											"error": gin.H{
 												"type":    "upstream_error",
 												"message": "Upstream request failed",
 											},
 										})
 										return nil, fmt.Errorf("upstream request failed: %s", safeErr)
 									}
 									defer func() { _ = resp.Body.Close() }()
 									if resp.StatusCode >= 400 {
-												fix(openai): fail over passthrough 429 and 529

											
										
										
											2026-03-30 22:29:26 +08:00
+										// 透传模式默认保持原样代理；但 429/529 属于网关必须兜底的
 										// 上游容量类错误，应先触发多账号 failover 以维持基础 SLA。
 										if shouldFailoverOpenAIPassthroughResponse(resp.StatusCode) {
 											return nil, s.handleFailoverErrorResponsePassthrough(ctx, resp, c, account, body)
 										}
-												fix(ops): 修复日志级别过滤并增强OpenAI错误诊断日志

- 移除 warn 级别下 access info 的强制入库补写，确保运行时日志级别真实生效

- 将 OpenAI fallback matched 与 passthrough 断流提示按需求降级为 info

- 为 codex_cli_only 与 instructions required 场景补充请求诊断字段（含 User-Agent）

- 出于安全考虑移除请求体预览，仅保留 request_body_size 与白名单头信息

- 新增/更新回归测试，覆盖 Forward 入口到日志落库链路

											
										
										
											2026-02-13 19:27:07 +08:00
+										return nil, s.handleErrorResponsePassthrough(ctx, resp, c, account, body)
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
+									}
 									var usage *OpenAIUsage
 									var firstTokenMs *int
 									if reqStream {
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+										result, err := s.handleStreamingResponsePassthrough(ctx, resp, c, account, startTime, reqModel, upstreamPassthroughModel)
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
+										if err != nil {
 											return nil, err
 										}
 										usage = result.usage
 										firstTokenMs = result.firstTokenMs
 									} else {
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+										usage, err = s.handleNonStreamingResponsePassthrough(ctx, resp, c, reqModel, upstreamPassthroughModel)
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
+										if err != nil {
 											return nil, err
 										}
 									}
 									if snapshot := ParseCodexRateLimitHeaders(resp.Header); snapshot != nil {
 										s.updateCodexUsageSnapshot(ctx, account.ID, snapshot)
 									}
 									if usage == nil {
 										usage = &OpenAIUsage{}
 									}
 									return &OpenAIForwardResult{
 										RequestID:       resp.Header.Get("x-request-id"),
 										Usage:           *usage,
 										Model:           reqModel,
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+										UpstreamModel:   upstreamPassthroughModel,
-												fix(billing): 修复 OpenAI fast 档位计费并补齐展示

- 打通 service_tier 在 OpenAI HTTP、WS、passthrough 与 usage 记录中的传递
- 修正 priority/flex 计费逻辑，并将 fast 归一化为 priority
- 在用户端和管理端补齐服务档位与计费明细展示
- 补齐前后端测试，并修复 WS 限流信号重复持久化导致的全量回归失败

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-03-08 23:22:28 +08:00
+										ServiceTier:     extractOpenAIServiceTierFromBody(body),
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
+										ReasoningEffort: reasoningEffort,
 										Stream:          reqStream,
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+										OpenAIWSMode:    false,
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
+										Duration:        time.Since(startTime),
 										FirstTokenMs:    firstTokenMs,
 									}, nil
 								}
-												fix(openai): 自动透传预检 instructions 并本地 403 拦截

											
										
										
											2026-02-14 10:49:01 +08:00
+								func logOpenAIPassthroughInstructionsRejected(
 									ctx context.Context,
 									c *gin.Context,
 									account *Account,
 									reqModel string,
 									rejectReason string,
 									body []byte,
 								) {
 									if ctx == nil {
 										ctx = context.Background()
 									}
 									accountID := int64(0)
 									accountName := ""
 									accountType := ""
 									if account != nil {
 										accountID = account.ID
 										accountName = strings.TrimSpace(account.Name)
 										accountType = strings.TrimSpace(string(account.Type))
 									}
 									fields := []zap.Field{
 										zap.String("component", "service.openai_gateway"),
 										zap.Int64("account_id", accountID),
 										zap.String("account_name", accountName),
 										zap.String("account_type", accountType),
 										zap.String("request_model", strings.TrimSpace(reqModel)),
 										zap.String("reject_reason", strings.TrimSpace(rejectReason)),
 									}
 									fields = appendCodexCLIOnlyRejectedRequestFields(fields, c, body)
 									logger.FromContext(ctx).With(fields...).Warn("OpenAI passthrough 本地拦截：Codex 请求缺少有效 instructions")
 								}
-												feat(openai): 支持自动透传开关并透传 User-Agent

- OpenAI OAuth/API Key 统一支持自动透传开关，编辑页可开关
- 透传模式仅替换认证并保留计费/并发/审计，修复 API Key responses 端点拼接
- Usage 页面显示原始 User-Agent 且不截断，补充回归测试与清单

											
										
										
											2026-02-12 10:56:07 +08:00
+								func (s *OpenAIGatewayService) buildUpstreamRequestOpenAIPassthrough(
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
+									ctx context.Context,
 									c *gin.Context,
 									account *Account,
 									body []byte,
 									token string,
 								) (*http.Request, error) {
-												feat(openai): 支持自动透传开关并透传 User-Agent

- OpenAI OAuth/API Key 统一支持自动透传开关，编辑页可开关
- 透传模式仅替换认证并保留计费/并发/审计，修复 API Key responses 端点拼接
- Usage 页面显示原始 User-Agent 且不截断，补充回归测试与清单

											
										
										
											2026-02-12 10:56:07 +08:00
+									targetURL := openaiPlatformAPIURL
 									switch account.Type {
 									case AccountTypeOAuth:
 										targetURL = chatgptCodexURL
 									case AccountTypeAPIKey:
 										baseURL := account.GetOpenAIBaseURL()
 										if baseURL != "" {
 											validatedURL, err := s.validateUpstreamBaseURL(baseURL)
 											if err != nil {
 												return nil, err
 											}
 											targetURL = buildOpenAIResponsesURL(validatedURL)
 										}
 									}
-												fix(openai): support remote compact task

											
										
										
											2026-03-06 18:50:28 +08:00
+									targetURL = appendOpenAIResponsesRequestPathSuffix(targetURL, openAIResponsesRequestPathSuffix(c))
-												feat(openai): 支持自动透传开关并透传 User-Agent

- OpenAI OAuth/API Key 统一支持自动透传开关，编辑页可开关
- 透传模式仅替换认证并保留计费/并发/审计，修复 API Key responses 端点拼接
- Usage 页面显示原始 User-Agent 且不截断，补充回归测试与清单

											
										
										
											2026-02-12 10:56:07 +08:00
 									req, err := http.NewRequestWithContext(ctx, http.MethodPost, targetURL, bytes.NewReader(body))
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
+									if err != nil {
 										return nil, err
 									}
-												fix(openai): 收敛自动透传请求头并增强 OAuth 安全兜底

											
										
										
											2026-02-12 20:12:15 +08:00
+									// 透传客户端请求头（安全白名单）。
-												fix(gateway): 默认过滤OpenAI透传超时头并补充断流告警

											
										
										
											2026-02-12 14:16:18 +08:00
+									allowTimeoutHeaders := s.isOpenAIPassthroughTimeoutHeadersAllowed()
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
+									if c != nil && c.Request != nil {
 										for key, values := range c.Request.Header {
-												fix(openai): 收敛自动透传请求头并增强 OAuth 安全兜底

											
										
										
											2026-02-12 20:12:15 +08:00
+											lower := strings.ToLower(strings.TrimSpace(key))
 											if !isOpenAIPassthroughAllowedRequestHeader(lower, allowTimeoutHeaders) {
-												fix(gateway): 默认过滤OpenAI透传超时头并补充断流告警

											
										
										
											2026-02-12 14:16:18 +08:00
+												continue
 											}
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
+											for _, v := range values {
 												req.Header.Add(key, v)
 											}
 										}
 									}
 									// 覆盖入站鉴权残留，并注入上游认证
 									req.Header.Del("authorization")
 									req.Header.Del("x-api-key")
 									req.Header.Del("x-goog-api-key")
 									req.Header.Set("authorization", "Bearer "+token)
-												feat(openai): 支持自动透传开关并透传 User-Agent

- OpenAI OAuth/API Key 统一支持自动透传开关，编辑页可开关
- 透传模式仅替换认证并保留计费/并发/审计，修复 API Key responses 端点拼接
- Usage 页面显示原始 User-Agent 且不截断，补充回归测试与清单

											
										
										
											2026-02-12 10:56:07 +08:00
+									// OAuth 透传到 ChatGPT internal API 时补齐必要头。
 									if account.Type == AccountTypeOAuth {
-												fix(openai): 收敛自动透传请求头并增强 OAuth 安全兜底

											
										
										
											2026-02-12 20:12:15 +08:00
+										promptCacheKey := strings.TrimSpace(gjson.GetBytes(body, "prompt_cache_key").String())
-												feat(openai): 支持自动透传开关并透传 User-Agent

- OpenAI OAuth/API Key 统一支持自动透传开关，编辑页可开关
- 透传模式仅替换认证并保留计费/并发/审计，修复 API Key responses 端点拼接
- Usage 页面显示原始 User-Agent 且不截断，补充回归测试与清单

											
										
										
											2026-02-12 10:56:07 +08:00
+										req.Host = "chatgpt.com"
 										if chatgptAccountID := account.GetChatGPTAccountID(); chatgptAccountID != "" {
 											req.Header.Set("chatgpt-account-id", chatgptAccountID)
 										}
-												fix(gateway): 防止 OpenAI Codex 跨用户串流

根因：多个用户共享同一 OAuth 账号时，conversation_id/session_id 头
未做用户隔离，导致上游 chatgpt.com 将不同用户的请求关联到同一会话。

HTTP SSE 修复:
- 新增 isolateOpenAISessionID(apiKeyID, raw)，将 API Key ID 混入
  session 标识符（xxhash），确保不同 Key 的用户产生不同上游会话
- buildUpstreamRequest: OAuth 分支先 Del 客户端透传的 session 头，
  再用隔离值覆盖
- buildUpstreamRequestOpenAIPassthrough: 透传路径同样隔离
- ForwardAsAnthropic: Anthropic Messages 兼容路径同步修复
- buildOpenAIWSHeaders: WS 路径的 OAuth session 头同步隔离

											
										
										
											2026-03-16 10:28:11 +08:00
+										apiKeyID := getAPIKeyIDFromContext(c)
 										// 先保存客户端原始值，再做 compact 补充，避免后续统一隔离时读到已处理的值。
 										clientSessionID := strings.TrimSpace(req.Header.Get("session_id"))
 										clientConversationID := strings.TrimSpace(req.Header.Get("conversation_id"))
-												fix(openai): support remote compact task

											
										
										
											2026-03-06 18:50:28 +08:00
+										if isOpenAIResponsesCompactPath(c) {
 											req.Header.Set("accept", "application/json")
 											if req.Header.Get("version") == "" {
 												req.Header.Set("version", codexCLIVersion)
 											}
-												fix(gateway): 防止 OpenAI Codex 跨用户串流

根因：多个用户共享同一 OAuth 账号时，conversation_id/session_id 头
未做用户隔离，导致上游 chatgpt.com 将不同用户的请求关联到同一会话。

HTTP SSE 修复:
- 新增 isolateOpenAISessionID(apiKeyID, raw)，将 API Key ID 混入
  session 标识符（xxhash），确保不同 Key 的用户产生不同上游会话
- buildUpstreamRequest: OAuth 分支先 Del 客户端透传的 session 头，
  再用隔离值覆盖
- buildUpstreamRequestOpenAIPassthrough: 透传路径同样隔离
- ForwardAsAnthropic: Anthropic Messages 兼容路径同步修复
- buildOpenAIWSHeaders: WS 路径的 OAuth session 头同步隔离

											
										
										
											2026-03-16 10:28:11 +08:00
+											if clientSessionID == "" {
 												clientSessionID = resolveOpenAICompactSessionID(c)
-												fix(openai): support remote compact task

											
										
										
											2026-03-06 18:50:28 +08:00
+											}
 										} else if req.Header.Get("accept") == "" {
-												fix(openai): 收敛自动透传请求头并增强 OAuth 安全兜底

											
										
										
											2026-02-12 20:12:15 +08:00
+											req.Header.Set("accept", "text/event-stream")
 										}
-												feat(openai): 支持自动透传开关并透传 User-Agent

- OpenAI OAuth/API Key 统一支持自动透传开关，编辑页可开关
- 透传模式仅替换认证并保留计费/并发/审计，修复 API Key responses 端点拼接
- Usage 页面显示原始 User-Agent 且不截断，补充回归测试与清单

											
										
										
											2026-02-12 10:56:07 +08:00
+										if req.Header.Get("OpenAI-Beta") == "" {
 											req.Header.Set("OpenAI-Beta", "responses=experimental")
 										}
 										if req.Header.Get("originator") == "" {
 											req.Header.Set("originator", "codex_cli_rs")
 										}
-												fix(gateway): 防止 OpenAI Codex 跨用户串流

根因：多个用户共享同一 OAuth 账号时，conversation_id/session_id 头
未做用户隔离，导致上游 chatgpt.com 将不同用户的请求关联到同一会话。

HTTP SSE 修复:
- 新增 isolateOpenAISessionID(apiKeyID, raw)，将 API Key ID 混入
  session 标识符（xxhash），确保不同 Key 的用户产生不同上游会话
- buildUpstreamRequest: OAuth 分支先 Del 客户端透传的 session 头，
  再用隔离值覆盖
- buildUpstreamRequestOpenAIPassthrough: 透传路径同样隔离
- ForwardAsAnthropic: Anthropic Messages 兼容路径同步修复
- buildOpenAIWSHeaders: WS 路径的 OAuth session 头同步隔离

											
										
										
											2026-03-16 10:28:11 +08:00
+										// 用隔离后的 session 标识符覆盖客户端透传值，防止跨用户会话碰撞。
 										if clientSessionID == "" {
 											clientSessionID = promptCacheKey
 										}
 										if clientConversationID == "" {
 											clientConversationID = promptCacheKey
 										}
 										if clientSessionID != "" {
 											req.Header.Set("session_id", isolateOpenAISessionID(apiKeyID, clientSessionID))
 										}
 										if clientConversationID != "" {
 											req.Header.Set("conversation_id", isolateOpenAISessionID(apiKeyID, clientConversationID))
-												fix(openai): 收敛自动透传请求头并增强 OAuth 安全兜底

											
										
										
											2026-02-12 20:12:15 +08:00
+										}
 									}
 									// 透传模式也支持账户自定义 User-Agent 与 ForceCodexCLI 兜底。
 									customUA := account.GetOpenAIUserAgent()
 									if customUA != "" {
 										req.Header.Set("user-agent", customUA)
 									}
 									if s.cfg != nil && s.cfg.Gateway.ForceCodexCLI {
 										req.Header.Set("user-agent", codexCLIUserAgent)
 									}
 									// OAuth 安全透传：对非 Codex UA 统一兜底，降低被上游风控拦截概率。
 									if account.Type == AccountTypeOAuth && !openai.IsCodexCLIRequest(req.Header.Get("user-agent")) {
 										req.Header.Set("user-agent", codexCLIUserAgent)
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
+									}
 									if req.Header.Get("content-type") == "" {
 										req.Header.Set("content-type", "application/json")
 									}
 									return req, nil
 								}
-												fix(openai): fail over passthrough 429 and 529

											
										
										
											2026-03-30 22:29:26 +08:00
+								func shouldFailoverOpenAIPassthroughResponse(statusCode int) bool {
 									switch statusCode {
 									case http.StatusTooManyRequests, 529:
 										return true
 									default:
 										return false
 									}
 								}
 								// handleFailoverErrorResponsePassthrough records an upstream error response
 								// seen on the passthrough path and converts it into an *UpstreamFailoverError.
 								//
 								// It reads at most 2 MiB of resp.Body, extracts and sanitizes the upstream
 								// error message, and (only when Gateway.LogUpstreamErrorBody is enabled) keeps
 								// a truncated copy of the raw body as detail. The status, message and detail
 								// are stored via setOpsUpstreamError, passed to the instructions-required
 								// debug logger, reported to the rate-limit service when one is configured,
 								// and appended as an ops event of kind "failover".
 								//
 								// The returned error carries the status code, the body bytes that were read
 								// and a clone of the response headers.
 								func (s *OpenAIGatewayService) handleFailoverErrorResponsePassthrough(
 									ctx context.Context,
 									resp *http.Response,
 									c *gin.Context,
 									account *Account,
 									requestBody []byte,
 								) error {
 									// Best effort: a read error still leaves the bytes read so far.
 									respBody, _ := io.ReadAll(io.LimitReader(resp.Body, 2<<20))
 									msg := sanitizeUpstreamErrorMessage(strings.TrimSpace(extractUpstreamErrorMessage(respBody)))

 									// The raw body is only retained when explicitly enabled in config.
 									var detail string
 									if s.cfg != nil && s.cfg.Gateway.LogUpstreamErrorBody {
 										limit := s.cfg.Gateway.LogUpstreamErrorBodyMaxBytes
 										if limit <= 0 {
 											limit = 2048
 										}
 										detail = truncateString(string(respBody), limit)
 									}

 									status := resp.StatusCode
 									setOpsUpstreamError(c, status, msg, detail)
 									logOpenAIInstructionsRequiredDebug(ctx, c, account, status, msg, requestBody, respBody)
 									if s.rateLimitService != nil {
 										_ = s.rateLimitService.HandleUpstreamError(ctx, account, status, resp.Header, respBody)
 									}

 									event := OpsUpstreamErrorEvent{
 										Platform:             account.Platform,
 										AccountID:            account.ID,
 										AccountName:          account.Name,
 										UpstreamStatusCode:   status,
 										UpstreamRequestID:    resp.Header.Get("x-request-id"),
 										Passthrough:          true,
 										Kind:                 "failover",
 										Message:              msg,
 										Detail:               detail,
 										UpstreamResponseBody: detail,
 									}
 									appendOpsUpstreamError(c, event)

 									return &UpstreamFailoverError{
 										StatusCode:      status,
 										ResponseBody:    respBody,
 										ResponseHeaders: resp.Header.Clone(),
 									}
 								}
-												fix(ops): 修复日志级别过滤并增强OpenAI错误诊断日志

- 移除 warn 级别下 access info 的强制入库补写，确保运行时日志级别真实生效

- 将 OpenAI fallback matched 与 passthrough 断流提示按需求降级为 info

- 为 codex_cli_only 与 instructions required 场景补充请求诊断字段（含 User-Agent）

- 出于安全考虑移除请求体预览，仅保留 request_body_size 与白名单头信息

- 新增/更新回归测试，覆盖 Forward 入口到日志落库链路

											
										
										
											2026-02-13 19:27:07 +08:00
+								func (s *OpenAIGatewayService) handleErrorResponsePassthrough(
 									ctx context.Context,
 									resp *http.Response,
 									c *gin.Context,
 									account *Account,
 									requestBody []byte,
 								) error {
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
+									body, _ := io.ReadAll(io.LimitReader(resp.Body, 2<<20))
 									upstreamMsg := strings.TrimSpace(extractUpstreamErrorMessage(body))
 									upstreamMsg = sanitizeUpstreamErrorMessage(upstreamMsg)
 									upstreamDetail := ""
 									if s.cfg != nil && s.cfg.Gateway.LogUpstreamErrorBody {
 										maxBytes := s.cfg.Gateway.LogUpstreamErrorBodyMaxBytes
 										if maxBytes <= 0 {
 											maxBytes = 2048
 										}
 										upstreamDetail = truncateString(string(body), maxBytes)
 									}
 									setOpsUpstreamError(c, resp.StatusCode, upstreamMsg, upstreamDetail)
-												fix(ops): 修复日志级别过滤并增强OpenAI错误诊断日志

- 移除 warn 级别下 access info 的强制入库补写，确保运行时日志级别真实生效

- 将 OpenAI fallback matched 与 passthrough 断流提示按需求降级为 info

- 为 codex_cli_only 与 instructions required 场景补充请求诊断字段（含 User-Agent）

- 出于安全考虑移除请求体预览，仅保留 request_body_size 与白名单头信息

- 新增/更新回归测试，覆盖 Forward 入口到日志落库链路

											
										
										
											2026-02-13 19:27:07 +08:00
+									logOpenAIInstructionsRequiredDebug(ctx, c, account, resp.StatusCode, upstreamMsg, requestBody, body)
-												fix(openai): persist passthrough 429 rate limits

											
										
										
											2026-03-24 01:24:30 +08:00
+									if s.rateLimitService != nil {
 										// Passthrough mode preserves the raw upstream error response, but runtime
 										// account state still needs to be updated so sticky routing can stop
 										// reusing a freshly rate-limited account.
 										_ = s.rateLimitService.HandleUpstreamError(ctx, account, resp.StatusCode, resp.Header, body)
 									}
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
+									appendOpsUpstreamError(c, OpsUpstreamErrorEvent{
 										Platform:             account.Platform,
 										AccountID:            account.ID,
 										AccountName:          account.Name,
 										UpstreamStatusCode:   resp.StatusCode,
 										UpstreamRequestID:    resp.Header.Get("x-request-id"),
 										Passthrough:          true,
 										Kind:                 "http_error",
 										Message:              upstreamMsg,
 										Detail:               upstreamDetail,
 										UpstreamResponseBody: upstreamDetail,
 									})
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+									writeOpenAIPassthroughResponseHeaders(c.Writer.Header(), resp.Header, s.responseHeaderFilter)
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
+									contentType := resp.Header.Get("Content-Type")
 									if contentType == "" {
 										contentType = "application/json"
 									}
 									c.Data(resp.StatusCode, contentType, body)
 									if upstreamMsg == "" {
 										return fmt.Errorf("upstream error: %d", resp.StatusCode)
 									}
 									return fmt.Errorf("upstream error: %d message=%s", resp.StatusCode, upstreamMsg)
 								}
-												fix(openai): 收敛自动透传请求头并增强 OAuth 安全兜底

											
										
										
											2026-02-12 20:12:15 +08:00
+								func isOpenAIPassthroughAllowedRequestHeader(lowerKey string, allowTimeoutHeaders bool) bool {
 									if lowerKey == "" {
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
+										return false
 									}
-												fix(openai): 收敛自动透传请求头并增强 OAuth 安全兜底

											
										
										
											2026-02-12 20:12:15 +08:00
+									if isOpenAIPassthroughTimeoutHeader(lowerKey) {
 										return allowTimeoutHeaders
 									}
 									return openaiPassthroughAllowedHeaders[lowerKey]
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
+								}
-												fix(gateway): 默认过滤OpenAI透传超时头并补充断流告警

											
										
										
											2026-02-12 14:16:18 +08:00
 								// isOpenAIPassthroughTimeoutHeader reports whether lowerKey is one of the
 								// timeout-related header names enumerated in the switch below.
 								//
 								// The comparison is an exact string match, so the caller has to pass a key
 								// that is already lower-cased and trimmed.
+								func isOpenAIPassthroughTimeoutHeader(lowerKey string) bool {
 									switch lowerKey {
 									case "x-stainless-timeout", "x-stainless-read-timeout", "x-stainless-connect-timeout", "x-request-timeout", "request-timeout", "grpc-timeout":
 										return true
 									default:
 										return false
 									}
 								}
 								// isOpenAIPassthroughTimeoutHeadersAllowed returns the value of the
 								// Gateway.OpenAIPassthroughAllowTimeoutHeaders config flag.
 								//
 								// It is safe to call on a nil service or a service without configuration; in
 								// both cases it reports false.
 								func (s *OpenAIGatewayService) isOpenAIPassthroughTimeoutHeadersAllowed() bool {
 									if s == nil || s.cfg == nil {
 										return false
 									}
 									return s.cfg.Gateway.OpenAIPassthroughAllowTimeoutHeaders
 								}
 								// collectOpenAIPassthroughTimeoutHeaders lists every header in h whose
 								// lower-cased, trimmed name is accepted by isOpenAIPassthroughTimeoutHeader.
 								//
 								// Each entry is rendered as "name=v1|v2|..." (or just "name" when the header
 								// has no values). The result is sorted so that it does not depend on map
 								// iteration order. A nil h, or an h without any match, yields nil.
 								func collectOpenAIPassthroughTimeoutHeaders(h http.Header) []string {
 									if h == nil {
 										return nil
 									}
 									var hits []string
 									for name, vals := range h {
 										normalized := strings.ToLower(strings.TrimSpace(name))
 										if !isOpenAIPassthroughTimeoutHeader(normalized) {
 											continue
 										}
 										if len(vals) == 0 {
 											// No values recorded for this header: report the bare name.
 											hits = append(hits, normalized)
 											continue
 										}
 										hits = append(hits, fmt.Sprintf("%s=%s", normalized, strings.Join(vals, "|")))
 									}
 									sort.Strings(hits)
 									return hits
 								}
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
 								// openaiStreamingResultPassthrough is the result value returned by
 								// handleStreamingResponsePassthrough after it has relayed an upstream SSE
 								// stream.
+								type openaiStreamingResultPassthrough struct {
 									// usage is the usage record that parseSSEUsageBytes fills in from the
 									// stream's data lines.
 									usage        *OpenAIUsage
 									// firstTokenMs is the elapsed time in milliseconds from startTime to the
 									// first data line counted as client output; it stays nil when no such
 									// line was seen.
 									firstTokenMs *int
 								}
-												fix(openai): fail over before responses stream output

											
										
										
											2026-04-25 15:09:40 +08:00
 								// openAIStreamClientOutputStarted reports whether response output has
 								// already been started towards the client.
 								//
 								// It returns true when the caller's own bookkeeping flag localStarted is set,
 								// or otherwise when c.Writer.Written() reports true. A nil c or a nil
 								// c.Writer is tolerated and counts as "not started".
+								func openAIStreamClientOutputStarted(c *gin.Context, localStarted bool) bool {
 									if localStarted {
 										return true
 									}
 									// Fall back to the writer's own state so output produced outside the
 									// caller's bookkeeping is detected as well.
 									return c != nil && c.Writer != nil && c.Writer.Written()
 								}
 								// openAIStreamEventIsPreamble reports whether eventType, ignoring surrounding
 								// whitespace, is exactly "response.created" or "response.in_progress".
 								func openAIStreamEventIsPreamble(eventType string) bool {
 									kind := strings.TrimSpace(eventType)
 									return kind == "response.created" || kind == "response.in_progress"
 								}
 								// openAIStreamDataStartsClientOutput decides whether an SSE data payload
 								// counts as the start of client-visible output.
 								//
 								// It returns false for blank data, for a "response.failed" event, and for
 								// preamble events as defined by openAIStreamEventIsPreamble; every other
 								// payload returns true.
 								func openAIStreamDataStartsClientOutput(data, eventType string) bool {
 									switch {
 									case strings.TrimSpace(data) == "":
 										return false
 									case strings.TrimSpace(eventType) == "response.failed":
 										return false
 									default:
 										return !openAIStreamEventIsPreamble(eventType)
 									}
 								}
 								// openAIStreamFailedEventShouldFailover decides whether a failed stream event
 								// may be retried through failover.
 								//
 								// It reads the error code and error type from payload (first under
 								// "response.error.*", then under "error.*"), joins them with message, and
 								// returns false as soon as the lower-cased text contains one of the
 								// non-retryable markers below. When nothing matches, or when there is no
 								// text to inspect at all, it returns true.
 								func openAIStreamFailedEventShouldFailover(payload []byte, message string) bool {
 									// lookup returns the normalized string at primary, or the one at fallback
 									// when primary is missing or blank.
 									lookup := func(primary, fallback string) string {
 										value := strings.ToLower(strings.TrimSpace(gjson.GetBytes(payload, primary).String()))
 										if value != "" {
 											return value
 										}
 										return strings.ToLower(strings.TrimSpace(gjson.GetBytes(payload, fallback).String()))
 									}
 									code := lookup("response.error.code", "error.code")
 									errType := lookup("response.error.type", "error.type")

 									haystack := strings.ToLower(strings.TrimSpace(message + " " + code + " " + errType))
 									if haystack == "" {
 										return true
 									}
 									for _, marker := range [...]string{
 										"invalid_request",
 										"content_policy",
 										"policy",
 										"safety",
 										"high-risk cyber",
 										"not allowed",
 										"violat",
 									} {
 										if strings.Contains(haystack, marker) {
 											return false
 										}
 									}
 									return true
 								}
 								// newOpenAIStreamFailoverError builds the *UpstreamFailoverError returned
 								// when a stream has to be failed over, and records the failure on the
 								// request context.
 								//
 								// message is trimmed and sanitized; if nothing is left, a generic
 								// "disconnected" message is used. When payload is non-empty and
 								// Gateway.LogUpstreamErrorBody is enabled, a truncated copy of payload
 								// (Gateway.LogUpstreamErrorBodyMaxBytes, or 2048 when that is not positive)
 								// is attached as detail. With a non-nil c the error is stored through
 								// setOpsUpstreamError and appended as a "failover" ops event; account, when
 								// non-nil, overrides the event's platform and supplies the account id and name.
 								//
 								// The returned error always carries HTTP 502 and a JSON body of the form
 								// {"error":{"type":"upstream_error","message":...}}.
 								func (s *OpenAIGatewayService) newOpenAIStreamFailoverError(
 									c *gin.Context,
 									account *Account,
 									passthrough bool,
 									upstreamRequestID string,
 									payload []byte,
 									message string,
 								) *UpstreamFailoverError {
 									if message = sanitizeUpstreamErrorMessage(strings.TrimSpace(message)); message == "" {
 										message = "OpenAI stream disconnected before completion"
 									}

 									var detail string
 									if len(payload) > 0 && s != nil && s.cfg != nil && s.cfg.Gateway.LogUpstreamErrorBody {
 										limit := s.cfg.Gateway.LogUpstreamErrorBodyMaxBytes
 										if limit <= 0 {
 											limit = 2048
 										}
 										detail = truncateString(string(payload), limit)
 									}

 									if c != nil {
 										setOpsUpstreamError(c, http.StatusBadGateway, message, detail)

 										opsEvent := OpsUpstreamErrorEvent{
 											Platform:           PlatformOpenAI,
 											UpstreamStatusCode: http.StatusBadGateway,
 											UpstreamRequestID:  strings.TrimSpace(upstreamRequestID),
 											Passthrough:        passthrough,
 											Kind:               "failover",
 											Message:            message,
 											Detail:             detail,
 										}
 										if account != nil {
 											// Prefer the account's own platform over the OpenAI default.
 											opsEvent.Platform = account.Platform
 											opsEvent.AccountID = account.ID
 											opsEvent.AccountName = account.Name
 										}
 										appendOpsUpstreamError(c, opsEvent)
 									}

 									// The marshal error is ignored: the value is a map holding only strings.
 									errorBody, _ := json.Marshal(gin.H{
 										"error": gin.H{
 											"type":    "upstream_error",
 											"message": message,
 										},
 									})
 									failover := &UpstreamFailoverError{
 										StatusCode:   http.StatusBadGateway,
 										ResponseBody: errorBody,
 									}
 									return failover
 								}
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
+								func (s *OpenAIGatewayService) handleStreamingResponsePassthrough(
 									ctx context.Context,
 									resp *http.Response,
 									c *gin.Context,
 									account *Account,
 									startTime time.Time,
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+									originalModel string,
 									mappedModel string,
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
+								) (*openaiStreamingResultPassthrough, error) {
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+									writeOpenAIPassthroughResponseHeaders(c.Writer.Header(), resp.Header, s.responseHeaderFilter)
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
 									// SSE headers
 									c.Header("Content-Type", "text/event-stream")
 									c.Header("Cache-Control", "no-cache")
 									c.Header("Connection", "keep-alive")
 									c.Header("X-Accel-Buffering", "no")
 									if v := resp.Header.Get("x-request-id"); v != "" {
 										c.Header("x-request-id", v)
 									}
 									w := c.Writer
 									flusher, ok := w.(http.Flusher)
 									if !ok {
 										return nil, errors.New("streaming not supported")
 									}
 									usage := &OpenAIUsage{}
 									var firstTokenMs *int
-												fix(openai): 修复 OAuth 透传流式断开与压缩头问题

- 透传流式在客户端断开后继续 drain 上游并解析 usage，避免计费信息丢失

- 阻断透传 accept-encoding，避免压缩响应影响 SSE/usage 解析

- 阻断 proxy-authorization，避免透传代理鉴权信息

- 补充回归测试：请求头阻断与断流后 usage 采集

											
										
										
											2026-02-11 22:17:38 +08:00
+									clientDisconnected := false
-												fix(gateway): 默认过滤OpenAI透传超时头并补充断流告警

											
										
										
											2026-02-12 14:16:18 +08:00
+									sawDone := false
-												feat: decouple billing correctness from usage log batching

											
										
										
											2026-03-12 16:53:18 +08:00
+									sawTerminalEvent := false
-												fix(openai): fail over before responses stream output

											
										
										
											2026-04-25 15:09:40 +08:00
+									sawFailedEvent := false
 									failedMessage := ""
 									clientOutputStarted := false
-												fix(gateway): 默认过滤OpenAI透传超时头并补充断流告警

											
										
										
											2026-02-12 14:16:18 +08:00
+									upstreamRequestID := strings.TrimSpace(resp.Header.Get("x-request-id"))
-												fix(openai): fail over before responses stream output

											
										
										
											2026-04-25 15:09:40 +08:00
+									pendingLines := make([]string, 0, 8)
 									writePendingLines := func() bool {
 										for _, pending := range pendingLines {
 											if _, err := fmt.Fprintln(w, pending); err != nil {
 												clientDisconnected = true
 												logger.LegacyPrintf("service.openai_gateway", "[OpenAI passthrough] Client disconnected during streaming, continue draining upstream for usage: account=%d", account.ID)
 												return false
 											}
 										}
 										pendingLines = pendingLines[:0]
 										return true
 									}
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
 									scanner := bufio.NewScanner(resp.Body)
 									maxLineSize := defaultMaxLineSize
 									if s.cfg != nil && s.cfg.Gateway.MaxLineSize > 0 {
 										maxLineSize = s.cfg.Gateway.MaxLineSize
 									}
 									scanBuf := getSSEScannerBuf64K()
 									scanner.Buffer(scanBuf[:0], maxLineSize)
 									defer putSSEScannerBuf64K(scanBuf)
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+									needModelReplace := strings.TrimSpace(originalModel) != "" && strings.TrimSpace(mappedModel) != "" && strings.TrimSpace(originalModel) != strings.TrimSpace(mappedModel)
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
+									for scanner.Scan() {
 										line := scanner.Text()
-												fix(openai): fail over before responses stream output

											
										
										
											2026-04-25 15:09:40 +08:00
+										lineStartsClientOutput := false
 										forceFlushFailedEvent := false
-												feat(openai): 极致优化 OAuth 链路并补齐性能守护

- 优化 /v1/responses 热路径，减少重复解析与不必要拷贝\n- 优化并发与 token 竞争路径并补齐运行指标\n- 补充 OpenAI/Ops 相关单元测试与回归用例\n- 新增灰度阈值守护与压测脚本，支撑发布验收

											
										
										
											2026-02-12 09:41:37 +08:00
+										if data, ok := extractOpenAISSEDataLine(line); ok {
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+											dataBytes := []byte(data)
-												fix(gateway): 默认过滤OpenAI透传超时头并补充断流告警

											
										
										
											2026-02-12 14:16:18 +08:00
+											trimmedData := strings.TrimSpace(data)
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+											if needModelReplace && strings.Contains(data, mappedModel) {
 												line = s.replaceModelInSSELine(line, mappedModel, originalModel)
 												if replacedData, replaced := extractOpenAISSEDataLine(line); replaced {
 													dataBytes = []byte(replacedData)
 													trimmedData = strings.TrimSpace(replacedData)
 												}
 											}
-												fix(openai): fail over before responses stream output

											
										
										
											2026-04-25 15:09:40 +08:00
+											eventType := strings.TrimSpace(gjson.Get(trimmedData, "type").String())
 											if eventType == "response.failed" {
 												failedMessage = extractOpenAISSEErrorMessage(dataBytes)
 												if !openAIStreamClientOutputStarted(c, clientOutputStarted) && openAIStreamFailedEventShouldFailover(dataBytes, failedMessage) {
 													return &openaiStreamingResultPassthrough{usage: usage, firstTokenMs: firstTokenMs},
 														s.newOpenAIStreamFailoverError(c, account, true, upstreamRequestID, dataBytes, failedMessage)
 												}
 												forceFlushFailedEvent = true
 												sawFailedEvent = true
 											}
-												fix(gateway): 默认过滤OpenAI透传超时头并补充断流告警

											
										
										
											2026-02-12 14:16:18 +08:00
+											if trimmedData == "[DONE]" {
 												sawDone = true
 											}
-												feat: decouple billing correctness from usage log batching

											
										
										
											2026-03-12 16:53:18 +08:00
+											if openAIStreamEventIsTerminal(trimmedData) {
 												sawTerminalEvent = true
 											}
-												fix(openai): fail over before responses stream output

											
										
										
											2026-04-25 15:09:40 +08:00
+											lineStartsClientOutput = forceFlushFailedEvent || openAIStreamDataStartsClientOutput(trimmedData, eventType)
 											if firstTokenMs == nil && lineStartsClientOutput && trimmedData != "[DONE]" {
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
+												ms := int(time.Since(startTime).Milliseconds())
 												firstTokenMs = &ms
 											}
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+											s.parseSSEUsageBytes(dataBytes, usage)
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
+										}
-												fix(openai): 修复 OAuth 透传流式断开与压缩头问题

- 透传流式在客户端断开后继续 drain 上游并解析 usage，避免计费信息丢失

- 阻断透传 accept-encoding，避免压缩响应影响 SSE/usage 解析

- 阻断 proxy-authorization，避免透传代理鉴权信息

- 补充回归测试：请求头阻断与断流后 usage 采集

											
										
										
											2026-02-11 22:17:38 +08:00
+										if !clientDisconnected {
-												fix(openai): fail over before responses stream output

											
										
										
											2026-04-25 15:09:40 +08:00
+											if !clientOutputStarted && !lineStartsClientOutput {
 												pendingLines = append(pendingLines, line)
 												continue
 											}
 											if !clientOutputStarted && len(pendingLines) > 0 {
 												if !writePendingLines() {
 													continue
 												}
 											}
-												fix(openai): 修复 OAuth 透传流式断开与压缩头问题

- 透传流式在客户端断开后继续 drain 上游并解析 usage，避免计费信息丢失

- 阻断透传 accept-encoding，避免压缩响应影响 SSE/usage 解析

- 阻断 proxy-authorization，避免透传代理鉴权信息

- 补充回归测试：请求头阻断与断流后 usage 采集

											
										
										
											2026-02-11 22:17:38 +08:00
+											if _, err := fmt.Fprintln(w, line); err != nil {
 												clientDisconnected = true
-												chore(logging): 完成后端日志审计与结构化迁移

- 将高密度服务与处理器日志迁移到新日志系统（LegacyPrintf/结构化日志）
- 增加 stdlog bridge 与兼容测试，保留旧日志捕获能力
- 将 OpenAI 断流告警改为结构化 Warn 并改造对应测试为 sink 捕获
- 补齐后端相关文件 logger 引用并通过全量 go test

											
										
										
											2026-02-12 19:01:09 +08:00
+												logger.LegacyPrintf("service.openai_gateway", "[OpenAI passthrough] Client disconnected during streaming, continue draining upstream for usage: account=%d", account.ID)
-												fix(openai): 修复 OAuth 透传流式断开与压缩头问题

- 透传流式在客户端断开后继续 drain 上游并解析 usage，避免计费信息丢失

- 阻断透传 accept-encoding，避免压缩响应影响 SSE/usage 解析

- 阻断 proxy-authorization，避免透传代理鉴权信息

- 补充回归测试：请求头阻断与断流后 usage 采集

											
										
										
											2026-02-11 22:17:38 +08:00
+											} else {
-												fix(openai): fail over before responses stream output

											
										
										
											2026-04-25 15:09:40 +08:00
+												clientOutputStarted = true
-												fix(openai): 修复 OAuth 透传流式断开与压缩头问题

- 透传流式在客户端断开后继续 drain 上游并解析 usage，避免计费信息丢失

- 阻断透传 accept-encoding，避免压缩响应影响 SSE/usage 解析

- 阻断 proxy-authorization，避免透传代理鉴权信息

- 补充回归测试：请求头阻断与断流后 usage 采集

											
										
										
											2026-02-11 22:17:38 +08:00
+												flusher.Flush()
 											}
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
+										}
 									}
 									if err := scanner.Err(); err != nil {
-												fix(openai): fail over before responses stream output

											
										
										
											2026-04-25 15:09:40 +08:00
+										if sawTerminalEvent && !sawFailedEvent {
-												fix(openai): 修复 OAuth 透传流式断开与压缩头问题

- 透传流式在客户端断开后继续 drain 上游并解析 usage，避免计费信息丢失

- 阻断透传 accept-encoding，避免压缩响应影响 SSE/usage 解析

- 阻断 proxy-authorization，避免透传代理鉴权信息

- 补充回归测试：请求头阻断与断流后 usage 采集

											
										
										
											2026-02-11 22:17:38 +08:00
+											return &openaiStreamingResultPassthrough{usage: usage, firstTokenMs: firstTokenMs}, nil
 										}
-												fix(openai): fail over before responses stream output

											
										
										
											2026-04-25 15:09:40 +08:00
+										if sawFailedEvent {
 											return &openaiStreamingResultPassthrough{usage: usage, firstTokenMs: firstTokenMs}, fmt.Errorf("upstream response failed: %s", failedMessage)
-												feat: decouple billing correctness from usage log batching

											
										
										
											2026-03-12 16:53:18 +08:00
+										}
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
+										if errors.Is(err, context.Canceled) || errors.Is(err, context.DeadlineExceeded) {
-												feat: decouple billing correctness from usage log batching

											
										
										
											2026-03-12 16:53:18 +08:00
+											return &openaiStreamingResultPassthrough{usage: usage, firstTokenMs: firstTokenMs}, fmt.Errorf("stream usage incomplete: %w", err)
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
+										}
 										if errors.Is(err, bufio.ErrTooLong) {
-												chore(logging): 完成后端日志审计与结构化迁移

- 将高密度服务与处理器日志迁移到新日志系统（LegacyPrintf/结构化日志）
- 增加 stdlog bridge 与兼容测试，保留旧日志捕获能力
- 将 OpenAI 断流告警改为结构化 Warn 并改造对应测试为 sink 捕获
- 补齐后端相关文件 logger 引用并通过全量 go test

											
										
										
											2026-02-12 19:01:09 +08:00
+											logger.LegacyPrintf("service.openai_gateway", "[OpenAI passthrough] SSE line too long: account=%d max_size=%d error=%v", account.ID, maxLineSize, err)
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
+											return &openaiStreamingResultPassthrough{usage: usage, firstTokenMs: firstTokenMs}, err
 										}
-												fix(openai): fail over before responses stream output

											
										
										
											2026-04-25 15:09:40 +08:00
+										if !openAIStreamClientOutputStarted(c, clientOutputStarted) {
 											msg := "OpenAI stream disconnected before completion"
 											if errText := strings.TrimSpace(err.Error()); errText != "" {
 												msg += ": " + errText
 											}
 											return &openaiStreamingResultPassthrough{usage: usage, firstTokenMs: firstTokenMs},
 												s.newOpenAIStreamFailoverError(c, account, true, upstreamRequestID, nil, msg)
 										}
 										if clientDisconnected {
 											return &openaiStreamingResultPassthrough{usage: usage, firstTokenMs: firstTokenMs}, fmt.Errorf("stream usage incomplete after disconnect: %w", err)
 										}
-												chore(logging): 完成后端日志审计与结构化迁移

- 将高密度服务与处理器日志迁移到新日志系统（LegacyPrintf/结构化日志）
- 增加 stdlog bridge 与兼容测试，保留旧日志捕获能力
- 将 OpenAI 断流告警改为结构化 Warn 并改造对应测试为 sink 捕获
- 补齐后端相关文件 logger 引用并通过全量 go test

											
										
										
											2026-02-12 19:01:09 +08:00
+										logger.LegacyPrintf("service.openai_gateway",
-												fix(ops): 修复日志级别过滤并增强OpenAI错误诊断日志

- 移除 warn 级别下 access info 的强制入库补写，确保运行时日志级别真实生效

- 将 OpenAI fallback matched 与 passthrough 断流提示按需求降级为 info

- 为 codex_cli_only 与 instructions required 场景补充请求诊断字段（含 User-Agent）

- 出于安全考虑移除请求体预览，仅保留 request_body_size 与白名单头信息

- 新增/更新回归测试，覆盖 Forward 入口到日志落库链路

											
										
										
											2026-02-13 19:27:07 +08:00
+											"[OpenAI passthrough] 流读取异常中断: account=%d request_id=%s err=%v",
-												fix(gateway): 默认过滤OpenAI透传超时头并补充断流告警

											
										
										
											2026-02-12 14:16:18 +08:00
+											account.ID,
 											upstreamRequestID,
 											err,
 										)
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
+										return &openaiStreamingResultPassthrough{usage: usage, firstTokenMs: firstTokenMs}, fmt.Errorf("stream read error: %w", err)
 									}
-												fix(openai): fail over before responses stream output

											
										
										
											2026-04-25 15:09:40 +08:00
+									if sawFailedEvent {
 										return &openaiStreamingResultPassthrough{usage: usage, firstTokenMs: firstTokenMs}, fmt.Errorf("upstream response failed: %s", failedMessage)
 									}
-												feat: decouple billing correctness from usage log batching

											
										
										
											2026-03-12 16:53:18 +08:00
+									if !clientDisconnected && !sawDone && !sawTerminalEvent && ctx.Err() == nil {
-												chore(logging): 完成后端日志审计与结构化迁移

- 将高密度服务与处理器日志迁移到新日志系统（LegacyPrintf/结构化日志）
- 增加 stdlog bridge 与兼容测试，保留旧日志捕获能力
- 将 OpenAI 断流告警改为结构化 Warn 并改造对应测试为 sink 捕获
- 补齐后端相关文件 logger 引用并通过全量 go test

											
										
										
											2026-02-12 19:01:09 +08:00
+										logger.FromContext(ctx).With(
 											zap.String("component", "service.openai_gateway"),
 											zap.Int64("account_id", account.ID),
 											zap.String("upstream_request_id", upstreamRequestID),
-												fix(ops): 修复日志级别过滤并增强OpenAI错误诊断日志

- 移除 warn 级别下 access info 的强制入库补写，确保运行时日志级别真实生效

- 将 OpenAI fallback matched 与 passthrough 断流提示按需求降级为 info

- 为 codex_cli_only 与 instructions required 场景补充请求诊断字段（含 User-Agent）

- 出于安全考虑移除请求体预览，仅保留 request_body_size 与白名单头信息

- 新增/更新回归测试，覆盖 Forward 入口到日志落库链路

											
										
										
											2026-02-13 19:27:07 +08:00
+										).Info("OpenAI passthrough 上游流在未收到 [DONE] 时结束，疑似断流")
-												fix(openai): fail over before responses stream output

											
										
										
											2026-04-25 15:09:40 +08:00
+										if !openAIStreamClientOutputStarted(c, clientOutputStarted) {
 											return &openaiStreamingResultPassthrough{usage: usage, firstTokenMs: firstTokenMs},
 												s.newOpenAIStreamFailoverError(c, account, true, upstreamRequestID, nil, "OpenAI stream ended before a terminal event")
 										}
-												feat: decouple billing correctness from usage log batching

											
										
										
											2026-03-12 16:53:18 +08:00
+										return &openaiStreamingResultPassthrough{usage: usage, firstTokenMs: firstTokenMs}, errors.New("stream usage incomplete: missing terminal event")
-												fix(gateway): 默认过滤OpenAI透传超时头并补充断流告警

											
										
										
											2026-02-12 14:16:18 +08:00
+									}
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
 									return &openaiStreamingResultPassthrough{usage: usage, firstTokenMs: firstTokenMs}, nil
 								}
 								func (s *OpenAIGatewayService) handleNonStreamingResponsePassthrough(
 									ctx context.Context,
 									resp *http.Response,
 									c *gin.Context,
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+									originalModel string,
 									mappedModel string,
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
+								) (*OpenAIUsage, error) {
-												refactor: extract ReadUpstreamResponseBody to deduplicate upstream response read + too-large error handling

Consolidates 9 call sites of resolveUpstreamResponseReadLimit + readUpstreamResponseBodyLimited + ErrUpstreamResponseBodyTooLarge error handling into a single ReadUpstreamResponseBody function with TooLargeWriter callback for API-format-specific error responses (Anthropic, OpenAI, countTokens).

											
										
										
											2026-04-16 01:53:22 +08:00
+									body, err := ReadUpstreamResponseBody(resp.Body, s.cfg, c, openAITooLargeError)
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
+									if err != nil {
 										return nil, err
 									}
-												fix: 非流式响应路径扩展SSE检测至所有账号类型 (#1493)

当上游返回SSE格式响应(如sub2api链路)时，API Key账号的非流式路径
未检测SSE，导致终态事件中空output直接透传给客户端。

- 将Content-Type SSE检测从仅OAuth扩展至所有账号类型
- 重命名handleOAuthSSEToJSON为handleSSEToJSON（无OAuth专属逻辑）
- 为透传路径新增handlePassthroughSSEToJSON，支持SSE转JSON及空output重建

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

											
										
										
											2026-04-07 22:49:14 +08:00
+									// Detect SSE responses from upstream and convert to JSON.
 									// Some upstreams (e.g. other sub2api instances) may return SSE even when
 									// stream=false was requested. Without this conversion the client would
 									// receive raw SSE text or a terminal event with empty output.
 									if isEventStreamResponse(resp.Header) {
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+										return s.handlePassthroughSSEToJSON(resp, c, body, originalModel, mappedModel)
-												fix: 非流式响应路径扩展SSE检测至所有账号类型 (#1493)

当上游返回SSE格式响应(如sub2api链路)时，API Key账号的非流式路径
未检测SSE，导致终态事件中空output直接透传给客户端。

- 将Content-Type SSE检测从仅OAuth扩展至所有账号类型
- 重命名handleOAuthSSEToJSON为handleSSEToJSON（无OAuth专属逻辑）
- 为透传路径新增handlePassthroughSSEToJSON，支持SSE转JSON及空output重建

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

											
										
										
											2026-04-07 22:49:14 +08:00
+									}
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
+									usage := &OpenAIUsage{}
 									usageParsed := false
 									if len(body) > 0 {
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+										if parsedUsage, ok := extractOpenAIUsageFromJSONBytes(body); ok {
 											*usage = parsedUsage
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
+											usageParsed = true
 										}
 									}
 									if !usageParsed {
 										// 兜底：尝试从 SSE 文本中解析 usage
 										usage = s.parseSSEUsageFromBody(string(body))
 									}
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+									writeOpenAIPassthroughResponseHeaders(c.Writer.Header(), resp.Header, s.responseHeaderFilter)
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
 									contentType := resp.Header.Get("Content-Type")
 									if contentType == "" {
 										contentType = "application/json"
 									}
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+									if originalModel != "" && mappedModel != "" && originalModel != mappedModel {
 										body = s.replaceModelInResponseBody(body, mappedModel, originalModel)
 									}
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
+									c.Data(resp.StatusCode, contentType, body)
 									return usage, nil
 								}
-												fix: 非流式响应路径扩展SSE检测至所有账号类型 (#1493)

当上游返回SSE格式响应(如sub2api链路)时，API Key账号的非流式路径
未检测SSE，导致终态事件中空output直接透传给客户端。

- 将Content-Type SSE检测从仅OAuth扩展至所有账号类型
- 重命名handleOAuthSSEToJSON为handleSSEToJSON（无OAuth专属逻辑）
- 为透传路径新增handlePassthroughSSEToJSON，支持SSE转JSON及空output重建

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

											
										
										
											2026-04-07 22:49:14 +08:00
+								// handlePassthroughSSEToJSON converts an SSE response body into a JSON
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+								// response for the passthrough path. It mirrors handleSSEToJSON while
 								// preserving passthrough payloads, except compact-only model remapping may
 								// rewrite model fields back to the original requested model.
 								func (s *OpenAIGatewayService) handlePassthroughSSEToJSON(resp *http.Response, c *gin.Context, body []byte, originalModel string, mappedModel string) (*OpenAIUsage, error) {
-												fix: 非流式响应路径扩展SSE检测至所有账号类型 (#1493)

当上游返回SSE格式响应(如sub2api链路)时，API Key账号的非流式路径
未检测SSE，导致终态事件中空output直接透传给客户端。

- 将Content-Type SSE检测从仅OAuth扩展至所有账号类型
- 重命名handleOAuthSSEToJSON为handleSSEToJSON（无OAuth专属逻辑）
- 为透传路径新增handlePassthroughSSEToJSON，支持SSE转JSON及空output重建

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

											
										
										
											2026-04-07 22:49:14 +08:00
+									bodyText := string(body)
 									finalResponse, ok := extractCodexFinalResponse(bodyText)
 									usage := &OpenAIUsage{}
 									if ok {
 										if parsedUsage, parsed := extractOpenAIUsageFromJSONBytes(finalResponse); parsed {
 											*usage = parsedUsage
 										}
 										// When the terminal event has an empty output array, reconstruct
 										// output from accumulated delta events so the client gets full content.
 										if len(gjson.GetBytes(finalResponse, "output").Array()) == 0 {
 											if outputJSON, reconstructed := reconstructResponseOutputFromSSE(bodyText); reconstructed {
 												if patched, err := sjson.SetRawBytes(finalResponse, "output", outputJSON); err == nil {
 													finalResponse = patched
 												}
 											}
 										}
 										body = finalResponse
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+										if originalModel != "" && mappedModel != "" && originalModel != mappedModel {
 											body = s.replaceModelInResponseBody(body, mappedModel, originalModel)
 										}
-												fix: 非流式响应路径扩展SSE检测至所有账号类型 (#1493)

当上游返回SSE格式响应(如sub2api链路)时，API Key账号的非流式路径
未检测SSE，导致终态事件中空output直接透传给客户端。

- 将Content-Type SSE检测从仅OAuth扩展至所有账号类型
- 重命名handleOAuthSSEToJSON为handleSSEToJSON（无OAuth专属逻辑）
- 为透传路径新增handlePassthroughSSEToJSON，支持SSE转JSON及空output重建

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

											
										
										
											2026-04-07 22:49:14 +08:00
+										// Correct tool calls in final response
 										body = s.correctToolCallsInResponseBody(body)
 									} else {
 										terminalType, terminalPayload, terminalOK := extractOpenAISSETerminalEvent(bodyText)
 										if terminalOK && terminalType == "response.failed" {
 											msg := extractOpenAISSEErrorMessage(terminalPayload)
 											if msg == "" {
 												msg = "Upstream compact response failed"
 											}
 											return nil, s.writeOpenAINonStreamingProtocolError(resp, c, msg)
 										}
 										usage = s.parseSSEUsageFromBody(bodyText)
-												feat(openai): port /responses/compact account support flow (PR #1555)

将 vansour/sub2api#1555 的 OpenAI compact 能力建模手工移植到当前 main：账号
级 compact 状态/auto-force_on-force_off 模式、compact-only 模型映射、调度器
tier 分层（已支持 > 未知 > 已知不支持）、管理后台 compact 主动探测，以及对应
i18n/状态徽章。普通 /responses 流量行为不变，无数据库迁移。

											
										
										
											2026-04-25 14:40:03 +08:00
+										if originalModel != "" && mappedModel != "" && originalModel != mappedModel {
 											bodyText = s.replaceModelInSSEBody(bodyText, mappedModel, originalModel)
 										}
 										body = []byte(bodyText)
-												fix: 非流式响应路径扩展SSE检测至所有账号类型 (#1493)

当上游返回SSE格式响应(如sub2api链路)时，API Key账号的非流式路径
未检测SSE，导致终态事件中空output直接透传给客户端。

- 将Content-Type SSE检测从仅OAuth扩展至所有账号类型
- 重命名handleOAuthSSEToJSON为handleSSEToJSON（无OAuth专属逻辑）
- 为透传路径新增handlePassthroughSSEToJSON，支持SSE转JSON及空output重建

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

											
										
										
											2026-04-07 22:49:14 +08:00
+									}
 									writeOpenAIPassthroughResponseHeaders(c.Writer.Header(), resp.Header, s.responseHeaderFilter)
 									contentType := "application/json; charset=utf-8"
 									if !ok {
 										contentType = resp.Header.Get("Content-Type")
 										if contentType == "" {
 											contentType = "text/event-stream"
 										}
 									}
 									c.Data(resp.StatusCode, contentType, body)
 									return usage, nil
 								}
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+								func writeOpenAIPassthroughResponseHeaders(dst http.Header, src http.Header, filter *responseheaders.CompiledHeaderFilter) {
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
+									if dst == nil || src == nil {
 										return
 									}
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+									if filter != nil {
 										responseheaders.WriteFilteredHeaders(dst, src, filter)
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
+									} else {
 										// 兜底：尽量保留最基础的 content-type
 										if v := strings.TrimSpace(src.Get("Content-Type")); v != "" {
 											dst.Set("Content-Type", v)
 										}
 									}
 									// 透传模式强制放行 x-codex-* 响应头（若上游返回）。
 									// 注意：真实 http.Response.Header 的 key 一般会被 canonicalize；但为了兼容测试/自建响应，
 									// 这里用 EqualFold 做一次大小写不敏感的查找。
 									getCaseInsensitiveValues := func(h http.Header, want string) []string {
 										if h == nil {
 											return nil
 										}
 										for k, vals := range h {
 											if strings.EqualFold(k, want) {
 												return vals
 											}
 										}
 										return nil
 									}
 									for _, rawKey := range []string{
 										"x-codex-primary-used-percent",
 										"x-codex-primary-reset-after-seconds",
 										"x-codex-primary-window-minutes",
 										"x-codex-secondary-used-percent",
 										"x-codex-secondary-reset-after-seconds",
 										"x-codex-secondary-window-minutes",
 										"x-codex-primary-over-secondary-limit-percent",
 									} {
 										vals := getCaseInsensitiveValues(src, rawKey)
 										if len(vals) == 0 {
 											continue
 										}
 										key := http.CanonicalHeaderKey(rawKey)
 										dst.Del(key)
 										for _, v := range vals {
 											dst.Add(key, v)
 										}
 									}
 								}
-												Align OAuth transform with OpenCode instructions

											
										
										
											2026-01-10 20:53:16 +08:00
+								func (s *OpenAIGatewayService) buildUpstreamRequest(ctx context.Context, c *gin.Context, account *Account, body []byte, token string, isStream bool, promptCacheKey string, isCodexCLI bool) (*http.Request, error) {
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									// Determine target URL based on account type
 									var targetURL string
-												fix: 修复golangci-lint检查问题

- 移除OpenAIGatewayHandler中未使用的userService字段
- 将账号类型判断的if-else链改为switch语句

											
										
										
											2025-12-23 10:25:32 +08:00
+									switch account.Type {
-												refactor: 调整项目结构为单向依赖

											
										
										
											2025-12-26 15:40:24 +08:00
+									case AccountTypeOAuth:
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+										// OAuth accounts use ChatGPT internal API
 										targetURL = chatgptCodexURL
-												fix(lint): 修复所有 Go 命名规范问题

- 全局替换 ApiKey → APIKey（类型、字段、方法、变量）
- 修复所有 initialism 命名（API, SMTP, HTML, URL 等）
- 添加所有缺失的包注释
- 修复导出符号的注释格式

主要修改：
- ApiKey → APIKey（所有出现的地方）
- ApiKeyID → APIKeyID
- ApiKeyIDs → APIKeyIDs
- TestSmtpConnection → TestSMTPConnection
- HtmlURL → HTMLURL
- 添加 20+ 个包注释
- 修复 10+ 个导出符号注释格式

验证结果：
- ✓ golangci-lint: 0 issues
- ✓ 单元测试: 通过
- ✓ 集成测试: 通过

											
										
										
											2026-01-04 19:27:53 +08:00
+									case AccountTypeAPIKey:
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+										// API Key accounts use Platform API or custom base URL
 										baseURL := account.GetOpenAIBaseURL()
-												feat(安全): 强化安全策略与配置校验

- 增加 CORS/CSP/安全响应头与代理信任配置

- 引入 URL 白名单与私网开关，校验上游与价格源

- 改善 API Key 处理与网关错误返回

- 管理端设置隐藏敏感字段并优化前端提示

- 增加计费熔断与相关配置示例

测试: go test ./...

											
										
										
											2026-01-02 17:40:57 +08:00
+										if baseURL == "" {
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+											targetURL = openaiPlatformAPIURL
-												feat(安全): 强化安全策略与配置校验

- 增加 CORS/CSP/安全响应头与代理信任配置

- 引入 URL 白名单与私网开关，校验上游与价格源

- 改善 API Key 处理与网关错误返回

- 管理端设置隐藏敏感字段并优化前端提示

- 增加计费熔断与相关配置示例

测试: go test ./...

											
										
										
											2026-01-02 17:40:57 +08:00
+										} else {
 											validatedURL, err := s.validateUpstreamBaseURL(baseURL)
 											if err != nil {
 												return nil, err
 											}
-												feat(openai): 支持自动透传开关并透传 User-Agent

- OpenAI OAuth/API Key 统一支持自动透传开关，编辑页可开关\n- 透传模式仅替换认证并保留计费/并发/审计，修复 API Key responses 端点拼接\n- Usage 页面显示原始 User-Agent 且不截断，补充回归测试与清单

											
										
										
											2026-02-12 10:56:07 +08:00
+											targetURL = buildOpenAIResponsesURL(validatedURL)
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+										}
-												fix: 修复golangci-lint检查问题

- 移除OpenAIGatewayHandler中未使用的userService字段
- 将账号类型判断的if-else链改为switch语句

											
										
										
											2025-12-23 10:25:32 +08:00
+									default:
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+										targetURL = openaiPlatformAPIURL
 									}
-												fix(openai): support remote compact task

											
										
										
											2026-03-06 18:50:28 +08:00
+									targetURL = appendOpenAIResponsesRequestPathSuffix(targetURL, openAIResponsesRequestPathSuffix(c))
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
 									req, err := http.NewRequestWithContext(ctx, "POST", targetURL, bytes.NewReader(body))
 									if err != nil {
 										return nil, err
 									}
 									// Set authentication header
 									req.Header.Set("authorization", "Bearer "+token)
 									// Set headers specific to OAuth accounts (ChatGPT internal API)
-												refactor: 调整项目结构为单向依赖

											
										
										
											2025-12-26 15:40:24 +08:00
+									if account.Type == AccountTypeOAuth {
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+										// Required: set Host for ChatGPT API (must use req.Host, not Header.Set)
 										req.Host = "chatgpt.com"
 										// Required: set chatgpt-account-id header
 										chatgptAccountID := account.GetChatGPTAccountID()
 										if chatgptAccountID != "" {
 											req.Header.Set("chatgpt-account-id", chatgptAccountID)
 										}
 									}
 									// Whitelist passthrough headers
 									for key, values := range c.Request.Header {
 										lowerKey := strings.ToLower(key)
 										if openaiAllowedHeaders[lowerKey] {
 											for _, v := range values {
 												req.Header.Add(key, v)
 											}
 										}
 									}
-												Fix Codex OAuth tool mapping

											
										
										
											2026-01-09 18:35:58 +08:00
+									if account.Type == AccountTypeOAuth {
-												fix(gateway): 防止 OpenAI Codex 跨用户串流

根因：多个用户共享同一 OAuth 账号时，conversation_id/session_id 头
未做用户隔离，导致上游 chatgpt.com 将不同用户的请求关联到同一会话。

HTTP SSE 修复:
- 新增 isolateOpenAISessionID(apiKeyID, raw)，将 API Key ID 混入
  session 标识符（xxhash），确保不同 Key 的用户产生不同上游会话
- buildUpstreamRequest: OAuth 分支先 Del 客户端透传的 session 头，
  再用隔离值覆盖
- buildUpstreamRequestOpenAIPassthrough: 透传路径同样隔离
- ForwardAsAnthropic: Anthropic Messages 兼容路径同步修复
- buildOpenAIWSHeaders: WS 路径的 OAuth session 头同步隔离

											
										
										
											2026-03-16 10:28:11 +08:00
+										// 清除客户端透传的 session 头，后续用隔离后的值重新设置，防止跨用户会话碰撞。
 										req.Header.Del("conversation_id")
 										req.Header.Del("session_id")
-												Fix Codex OAuth tool mapping

											
										
										
											2026-01-09 18:35:58 +08:00
+										req.Header.Set("OpenAI-Beta", "responses=experimental")
-												fix(openai): detect official codex client by headers

											
										
										
											2026-03-07 14:12:38 +08:00
+										req.Header.Set("originator", resolveOpenAIUpstreamOriginator(c, isCodexCLI))
-												fix(gateway): 防止 OpenAI Codex 跨用户串流

根因：多个用户共享同一 OAuth 账号时，conversation_id/session_id 头
未做用户隔离，导致上游 chatgpt.com 将不同用户的请求关联到同一会话。

HTTP SSE 修复:
- 新增 isolateOpenAISessionID(apiKeyID, raw)，将 API Key ID 混入
  session 标识符（xxhash），确保不同 Key 的用户产生不同上游会话
- buildUpstreamRequest: OAuth 分支先 Del 客户端透传的 session 头，
  再用隔离值覆盖
- buildUpstreamRequestOpenAIPassthrough: 透传路径同样隔离
- ForwardAsAnthropic: Anthropic Messages 兼容路径同步修复
- buildOpenAIWSHeaders: WS 路径的 OAuth session 头同步隔离

											
										
										
											2026-03-16 10:28:11 +08:00
+										apiKeyID := getAPIKeyIDFromContext(c)
-												fix(openai): support remote compact task

											
										
										
											2026-03-06 18:50:28 +08:00
+										if isOpenAIResponsesCompactPath(c) {
 											req.Header.Set("accept", "application/json")
 											if req.Header.Get("version") == "" {
 												req.Header.Set("version", codexCLIVersion)
 											}
-												fix(gateway): 防止 OpenAI Codex 跨用户串流

根因：多个用户共享同一 OAuth 账号时，conversation_id/session_id 头
未做用户隔离，导致上游 chatgpt.com 将不同用户的请求关联到同一会话。

HTTP SSE 修复:
- 新增 isolateOpenAISessionID(apiKeyID, raw)，将 API Key ID 混入
  session 标识符（xxhash），确保不同 Key 的用户产生不同上游会话
- buildUpstreamRequest: OAuth 分支先 Del 客户端透传的 session 头，
  再用隔离值覆盖
- buildUpstreamRequestOpenAIPassthrough: 透传路径同样隔离
- ForwardAsAnthropic: Anthropic Messages 兼容路径同步修复
- buildOpenAIWSHeaders: WS 路径的 OAuth session 头同步隔离

											
										
										
											2026-03-16 10:28:11 +08:00
+											compactSession := resolveOpenAICompactSessionID(c)
 											req.Header.Set("session_id", isolateOpenAISessionID(apiKeyID, compactSession))
-												fix(openai): support remote compact task

											
										
										
											2026-03-06 18:50:28 +08:00
+										} else {
 											req.Header.Set("accept", "text/event-stream")
 										}
-												Fix Codex OAuth tool mapping

											
										
										
											2026-01-09 18:35:58 +08:00
+										if promptCacheKey != "" {
-												fix(gateway): 防止 OpenAI Codex 跨用户串流

根因：多个用户共享同一 OAuth 账号时，conversation_id/session_id 头
未做用户隔离，导致上游 chatgpt.com 将不同用户的请求关联到同一会话。

HTTP SSE 修复:
- 新增 isolateOpenAISessionID(apiKeyID, raw)，将 API Key ID 混入
  session 标识符（xxhash），确保不同 Key 的用户产生不同上游会话
- buildUpstreamRequest: OAuth 分支先 Del 客户端透传的 session 头，
  再用隔离值覆盖
- buildUpstreamRequestOpenAIPassthrough: 透传路径同样隔离
- ForwardAsAnthropic: Anthropic Messages 兼容路径同步修复
- buildOpenAIWSHeaders: WS 路径的 OAuth session 头同步隔离

											
										
										
											2026-03-16 10:28:11 +08:00
+											isolated := isolateOpenAISessionID(apiKeyID, promptCacheKey)
 											req.Header.Set("conversation_id", isolated)
 											req.Header.Set("session_id", isolated)
-												Fix Codex OAuth tool mapping

											
										
										
											2026-01-09 18:35:58 +08:00
+										}
 									}
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
 									// Apply custom User-Agent if configured
 									customUA := account.GetOpenAIUserAgent()
 									if customUA != "" {
 										req.Header.Set("user-agent", customUA)
 									}
-												feat(gateway): 支持强制 Codex CLI 模式并伪装 UA

- Codex CLI 请求仅使用内置 instructions，不再读取 opencode 缓存/回源\n- 新增 gateway.force_codex_cli（环境变量 GATEWAY_FORCE_CODEX_CLI）\n- ForceCodexCLI=true 时转发上游强制 User-Agent=codex_cli_rs/0.0.0\n- 更新 deploy 示例配置

											
										
										
											2026-02-07 09:21:15 +08:00
+									// 若开启 ForceCodexCLI，则强制将上游 User-Agent 伪装为 Codex CLI。
 									// 用于网关未透传/改写 User-Agent 时，仍能命中 Codex 侧识别逻辑。
 									if s.cfg != nil && s.cfg.Gateway.ForceCodexCLI {
-												fix(openai): 收敛自动透传请求头并增强 OAuth 安全兜底

											
										
										
											2026-02-12 20:12:15 +08:00
+										req.Header.Set("user-agent", codexCLIUserAgent)
-												feat(gateway): 支持强制 Codex CLI 模式并伪装 UA

- Codex CLI 请求仅使用内置 instructions，不再读取 opencode 缓存/回源\n- 新增 gateway.force_codex_cli（环境变量 GATEWAY_FORCE_CODEX_CLI）\n- ForceCodexCLI=true 时转发上游强制 User-Agent=codex_cli_rs/0.0.0\n- 更新 deploy 示例配置

											
										
										
											2026-02-07 09:21:15 +08:00
+									}
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									// Ensure required headers exist
 									if req.Header.Get("content-type") == "" {
 										req.Header.Set("content-type", "application/json")
 									}
 									return req, nil
 								}
-												fix(ops): 修复日志级别过滤并增强OpenAI错误诊断日志

- 移除 warn 级别下 access info 的强制入库补写，确保运行时日志级别真实生效

- 将 OpenAI fallback matched 与 passthrough 断流提示按需求降级为 info

- 为 codex_cli_only 与 instructions required 场景补充请求诊断字段（含 User-Agent）

- 出于安全考虑移除请求体预览，仅保留 request_body_size 与白名单头信息

- 新增/更新回归测试，覆盖 Forward 入口到日志落库链路

											
										
										
											2026-02-13 19:27:07 +08:00
+								func (s *OpenAIGatewayService) handleErrorResponse(
 									ctx context.Context,
 									resp *http.Response,
 									c *gin.Context,
 									account *Account,
 									requestBody []byte,
 								) (*OpenAIForwardResult, error) {
-												feat(ops): 添加QPS脉搏线图并优化指标布局

- 添加实时QPS/TPS历史数据追踪（最近60个数据点）
- 在平均QPS/TPS上方添加SVG脉搏线图（sparkline）
- 将延迟和TTFT卡片的指标布局从2列改为3列
- 恢复Max指标显示（P95/P90/P50/Avg/Max）

											
										
										
											2026-01-11 11:49:34 +08:00
+									body, _ := io.ReadAll(io.LimitReader(resp.Body, 2<<20))
 									upstreamMsg := strings.TrimSpace(extractUpstreamErrorMessage(body))
 									upstreamMsg = sanitizeUpstreamErrorMessage(upstreamMsg)
 									upstreamDetail := ""
 									if s.cfg != nil && s.cfg.Gateway.LogUpstreamErrorBody {
 										maxBytes := s.cfg.Gateway.LogUpstreamErrorBodyMaxBytes
 										if maxBytes <= 0 {
 											maxBytes = 2048
 										}
 										upstreamDetail = truncateString(string(body), maxBytes)
 									}
 									setOpsUpstreamError(c, resp.StatusCode, upstreamMsg, upstreamDetail)
-												fix(ops): 修复日志级别过滤并增强OpenAI错误诊断日志

- 移除 warn 级别下 access info 的强制入库补写，确保运行时日志级别真实生效

- 将 OpenAI fallback matched 与 passthrough 断流提示按需求降级为 info

- 为 codex_cli_only 与 instructions required 场景补充请求诊断字段（含 User-Agent）

- 出于安全考虑移除请求体预览，仅保留 request_body_size 与白名单头信息

- 新增/更新回归测试，覆盖 Forward 入口到日志落库链路

											
										
										
											2026-02-13 19:27:07 +08:00
+									logOpenAIInstructionsRequiredDebug(ctx, c, account, resp.StatusCode, upstreamMsg, requestBody, body)
-												feat(ops): 添加QPS脉搏线图并优化指标布局

- 添加实时QPS/TPS历史数据追踪（最近60个数据点）
- 在平均QPS/TPS上方添加SVG脉搏线图（sparkline）
- 将延迟和TTFT卡片的指标布局从2列改为3列
- 恢复Max指标显示（P95/P90/P50/Avg/Max）

											
										
										
											2026-01-11 11:49:34 +08:00
 									if s.cfg != nil && s.cfg.Gateway.LogUpstreamErrorBody {
-												chore(logging): 完成后端日志审计与结构化迁移

- 将高密度服务与处理器日志迁移到新日志系统（LegacyPrintf/结构化日志）
- 增加 stdlog bridge 与兼容测试，保留旧日志捕获能力
- 将 OpenAI 断流告警改为结构化 Warn 并改造对应测试为 sink 捕获
- 补齐后端相关文件 logger 引用并通过全量 go test

											
										
										
											2026-02-12 19:01:09 +08:00
+										logger.LegacyPrintf("service.openai_gateway",
-												feat(ops): 添加QPS脉搏线图并优化指标布局

- 添加实时QPS/TPS历史数据追踪（最近60个数据点）
- 在平均QPS/TPS上方添加SVG脉搏线图（sparkline）
- 将延迟和TTFT卡片的指标布局从2列改为3列
- 恢复Max指标显示（P95/P90/P50/Avg/Max）

											
										
										
											2026-01-11 11:49:34 +08:00
+											"OpenAI upstream error %d (account=%d platform=%s type=%s): %s",
 											resp.StatusCode,
 											account.ID,
 											account.Platform,
 											account.Type,
 											truncateForLog(body, s.cfg.Gateway.LogUpstreamErrorBodyMaxBytes),
 										)
 									}
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
-												fix: restore non-failover error passthrough from 7b156489

											
										
										
											2026-02-07 14:24:55 +08:00
+									if status, errType, errMsg, matched := applyErrorPassthroughRule(
 										c,
 										PlatformOpenAI,
 										resp.StatusCode,
 										body,
 										http.StatusBadGateway,
 										"upstream_error",
 										"Upstream request failed",
 									); matched {
 										c.JSON(status, gin.H{
 											"error": gin.H{
 												"type":    errType,
 												"message": errMsg,
 											},
 										})
 										if upstreamMsg == "" {
 											upstreamMsg = errMsg
 										}
 										if upstreamMsg == "" {
 											return nil, fmt.Errorf("upstream error: %d (passthrough rule matched)", resp.StatusCode)
 										}
 										return nil, fmt.Errorf("upstream error: %d (passthrough rule matched) message=%s", resp.StatusCode, upstreamMsg)
 									}
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									// Check custom error codes
 									if !account.ShouldHandleErrorCode(resp.StatusCode) {
-												feat(ops): 实现上游错误事件记录与查询功能

**新增功能**:
- 新建ops_upstream_error_events表存储上游服务错误详情
- 支持记录上游429/529/5xx错误的详细上下文信息
- 提供按时间范围查询上游错误事件的API

**后端改动**:
1. 模型层（ops_models.go, ops_port.go）:
   - 新增UpstreamErrorEvent结构体
   - 扩展Repository接口支持上游错误事件CRUD

2. 仓储层（ops_repo.go）:
   - 实现InsertUpstreamErrorEvent写入上游错误
   - 实现GetUpstreamErrorEvents按时间范围查询

3. 服务层（ops_service.go, ops_upstream_context.go）:
   - ops_service: 新增GetUpstreamErrorEvents查询方法
   - ops_upstream_context: 封装上游错误上下文构建逻辑

4. Handler层（ops_error_logger.go）:
   - 新增GetUpstreamErrorsHandler处理上游错误查询请求

5. Gateway层集成:
   - antigravity_gateway_service.go: 429/529错误时记录上游事件
   - gateway_service.go: OpenAI 429/5xx错误时记录
   - gemini_messages_compat_service.go: Gemini 429/5xx错误时记录
   - openai_gateway_service.go: OpenAI 429/5xx错误时记录
   - ratelimit_service.go: 429限流错误时记录

**数据记录字段**:
- request_id: 关联ops_logs主记录
- platform/model: 上游服务标识
- status_code/error_message: 错误详情
- request_headers/response_body: 调试信息（可选）
- created_at: 错误发生时间

											
										
										
											2026-01-11 15:30:27 +08:00
+										appendOpsUpstreamError(c, OpsUpstreamErrorEvent{
 											Platform:           account.Platform,
 											AccountID:          account.ID,
-												feat: merge dev

											
										
										
											2026-01-15 15:14:44 +08:00
+											AccountName:        account.Name,
-												feat(ops): 实现上游错误事件记录与查询功能

**新增功能**:
- 新建ops_upstream_error_events表存储上游服务错误详情
- 支持记录上游429/529/5xx错误的详细上下文信息
- 提供按时间范围查询上游错误事件的API

**后端改动**:
1. 模型层（ops_models.go, ops_port.go）:
   - 新增UpstreamErrorEvent结构体
   - 扩展Repository接口支持上游错误事件CRUD

2. 仓储层（ops_repo.go）:
   - 实现InsertUpstreamErrorEvent写入上游错误
   - 实现GetUpstreamErrorEvents按时间范围查询

3. 服务层（ops_service.go, ops_upstream_context.go）:
   - ops_service: 新增GetUpstreamErrorEvents查询方法
   - ops_upstream_context: 封装上游错误上下文构建逻辑

4. Handler层（ops_error_logger.go）:
   - 新增GetUpstreamErrorsHandler处理上游错误查询请求

5. Gateway层集成:
   - antigravity_gateway_service.go: 429/529错误时记录上游事件
   - gateway_service.go: OpenAI 429/5xx错误时记录
   - gemini_messages_compat_service.go: Gemini 429/5xx错误时记录
   - openai_gateway_service.go: OpenAI 429/5xx错误时记录
   - ratelimit_service.go: 429限流错误时记录

**数据记录字段**:
- request_id: 关联ops_logs主记录
- platform/model: 上游服务标识
- status_code/error_message: 错误详情
- request_headers/response_body: 调试信息（可选）
- created_at: 错误发生时间

											
										
										
											2026-01-11 15:30:27 +08:00
+											UpstreamStatusCode: resp.StatusCode,
 											UpstreamRequestID:  resp.Header.Get("x-request-id"),
 											Kind:               "http_error",
 											Message:            upstreamMsg,
 											Detail:             upstreamDetail,
 										})
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+										c.JSON(http.StatusInternalServerError, gin.H{
 											"error": gin.H{
 												"type":    "upstream_error",
 												"message": "Upstream gateway error",
 											},
 										})
-												feat(ops): 添加QPS脉搏线图并优化指标布局

- 添加实时QPS/TPS历史数据追踪（最近60个数据点）
- 在平均QPS/TPS上方添加SVG脉搏线图（sparkline）
- 将延迟和TTFT卡片的指标布局从2列改为3列
- 恢复Max指标显示（P95/P90/P50/Avg/Max）

											
										
										
											2026-01-11 11:49:34 +08:00
+										if upstreamMsg == "" {
 											return nil, fmt.Errorf("upstream error: %d (not in custom error codes)", resp.StatusCode)
 										}
 										return nil, fmt.Errorf("upstream error: %d (not in custom error codes) message=%s", resp.StatusCode, upstreamMsg)
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									}
 									// Handle upstream error (mark account status)
-												chore: 更新依赖、配置和代码生成

主要更新：
- 更新 go.mod/go.sum 依赖
- 重新生成 Ent ORM 代码
- 更新 Wire 依赖注入配置
- 添加 docker-compose.override.yml 到 .gitignore
- 更新 README 文档（Simple Mode 说明和已知问题）
- 清理调试日志
- 其他代码优化和格式修复

											
										
										
											2026-01-03 06:37:08 -08:00
+									shouldDisable := false
 									if s.rateLimitService != nil {
 										shouldDisable = s.rateLimitService.HandleUpstreamError(ctx, account, resp.StatusCode, resp.Header, body)
 									}
-												feat(ops): 实现上游错误事件记录与查询功能

**新增功能**:
- 新建ops_upstream_error_events表存储上游服务错误详情
- 支持记录上游429/529/5xx错误的详细上下文信息
- 提供按时间范围查询上游错误事件的API

**后端改动**:
1. 模型层（ops_models.go, ops_port.go）:
   - 新增UpstreamErrorEvent结构体
   - 扩展Repository接口支持上游错误事件CRUD

2. 仓储层（ops_repo.go）:
   - 实现InsertUpstreamErrorEvent写入上游错误
   - 实现GetUpstreamErrorEvents按时间范围查询

3. 服务层（ops_service.go, ops_upstream_context.go）:
   - ops_service: 新增GetUpstreamErrorEvents查询方法
   - ops_upstream_context: 封装上游错误上下文构建逻辑

4. Handler层（ops_error_logger.go）:
   - 新增GetUpstreamErrorsHandler处理上游错误查询请求

5. Gateway层集成:
   - antigravity_gateway_service.go: 429/529错误时记录上游事件
   - gateway_service.go: OpenAI 429/5xx错误时记录
   - gemini_messages_compat_service.go: Gemini 429/5xx错误时记录
   - openai_gateway_service.go: OpenAI 429/5xx错误时记录
   - ratelimit_service.go: 429限流错误时记录

**数据记录字段**:
- request_id: 关联ops_logs主记录
- platform/model: 上游服务标识
- status_code/error_message: 错误详情
- request_headers/response_body: 调试信息（可选）
- created_at: 错误发生时间

											
										
										
											2026-01-11 15:30:27 +08:00
+									kind := "http_error"
 									if shouldDisable {
 										kind = "failover"
 									}
 									appendOpsUpstreamError(c, OpsUpstreamErrorEvent{
 										Platform:           account.Platform,
 										AccountID:          account.ID,
-												feat: merge dev

											
										
										
											2026-01-15 15:14:44 +08:00
+										AccountName:        account.Name,
-												feat(ops): 实现上游错误事件记录与查询功能

**新增功能**:
- 新建ops_upstream_error_events表存储上游服务错误详情
- 支持记录上游429/529/5xx错误的详细上下文信息
- 提供按时间范围查询上游错误事件的API

**后端改动**:
1. 模型层（ops_models.go, ops_port.go）:
   - 新增UpstreamErrorEvent结构体
   - 扩展Repository接口支持上游错误事件CRUD

2. 仓储层（ops_repo.go）:
   - 实现InsertUpstreamErrorEvent写入上游错误
   - 实现GetUpstreamErrorEvents按时间范围查询

3. 服务层（ops_service.go, ops_upstream_context.go）:
   - ops_service: 新增GetUpstreamErrorEvents查询方法
   - ops_upstream_context: 封装上游错误上下文构建逻辑

4. Handler层（ops_error_logger.go）:
   - 新增GetUpstreamErrorsHandler处理上游错误查询请求

5. Gateway层集成:
   - antigravity_gateway_service.go: 429/529错误时记录上游事件
   - gateway_service.go: OpenAI 429/5xx错误时记录
   - gemini_messages_compat_service.go: Gemini 429/5xx错误时记录
   - openai_gateway_service.go: OpenAI 429/5xx错误时记录
   - ratelimit_service.go: 429限流错误时记录

**数据记录字段**:
- request_id: 关联ops_logs主记录
- platform/model: 上游服务标识
- status_code/error_message: 错误详情
- request_headers/response_body: 调试信息（可选）
- created_at: 错误发生时间

											
										
										
											2026-01-11 15:30:27 +08:00
+										UpstreamStatusCode: resp.StatusCode,
 										UpstreamRequestID:  resp.Header.Get("x-request-id"),
 										Kind:               kind,
 										Message:            upstreamMsg,
 										Detail:             upstreamDetail,
 									})
-												chore: 更新依赖、配置和代码生成

主要更新：
- 更新 go.mod/go.sum 依赖
- 重新生成 Ent ORM 代码
- 更新 Wire 依赖注入配置
- 添加 docker-compose.override.yml 到 .gitignore
- 更新 README 文档（Simple Mode 说明和已知问题）
- 清理调试日志
- 其他代码优化和格式修复

											
										
										
											2026-01-03 06:37:08 -08:00
+									if shouldDisable {
-												feat: 支持 API Key 上游池模式同账号重试次数配置与自定义错误策略

											
										
										
											2026-03-08 13:57:23 +08:00
+										return nil, &UpstreamFailoverError{
 											StatusCode:             resp.StatusCode,
 											ResponseBody:           body,
 											RetryableOnSameAccount: account.IsPoolMode() && isPoolModeRetryableStatus(resp.StatusCode),
 										}
-												chore: 更新依赖、配置和代码生成

主要更新：
- 更新 go.mod/go.sum 依赖
- 重新生成 Ent ORM 代码
- 更新 Wire 依赖注入配置
- 添加 docker-compose.override.yml 到 .gitignore
- 更新 README 文档（Simple Mode 说明和已知问题）
- 清理调试日志
- 其他代码优化和格式修复

											
										
										
											2026-01-03 06:37:08 -08:00
+									}
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
 									// Return appropriate error response
 									var errType, errMsg string
 									var statusCode int
 									switch resp.StatusCode {
 									case 401:
 										statusCode = http.StatusBadGateway
 										errType = "upstream_error"
 										errMsg = "Upstream authentication failed, please contact administrator"
-												feat: 修复 OpenAI 402 报错自动切换问题

											
										
										
											2025-12-31 11:46:53 +08:00
+									case 402:
 										statusCode = http.StatusBadGateway
 										errType = "upstream_error"
 										errMsg = "Upstream payment required: insufficient balance or billing issue"
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									case 403:
 										statusCode = http.StatusBadGateway
 										errType = "upstream_error"
 										errMsg = "Upstream access forbidden, please contact administrator"
 									case 429:
 										statusCode = http.StatusTooManyRequests
 										errType = "rate_limit_error"
 										errMsg = "Upstream rate limit exceeded, please retry later"
 									default:
 										statusCode = http.StatusBadGateway
 										errType = "upstream_error"
 										errMsg = "Upstream request failed"
 									}
 									c.JSON(statusCode, gin.H{
 										"error": gin.H{
 											"type":    errType,
 											"message": errMsg,
 										},
 									})
-												feat(ops): 添加QPS脉搏线图并优化指标布局

- 添加实时QPS/TPS历史数据追踪（最近60个数据点）
- 在平均QPS/TPS上方添加SVG脉搏线图（sparkline）
- 将延迟和TTFT卡片的指标布局从2列改为3列
- 恢复Max指标显示（P95/P90/P50/Avg/Max）

											
										
										
											2026-01-11 11:49:34 +08:00
+									if upstreamMsg == "" {
 										return nil, fmt.Errorf("upstream error: %d", resp.StatusCode)
 									}
 									return nil, fmt.Errorf("upstream error: %d message=%s", resp.StatusCode, upstreamMsg)
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+								}
-												refactor: 重构 Chat Completions 端点，采用类型安全的 Responses API 转换

将 /v1/chat/completions 端点从 ResponseWriter 劫持模式重构为独立的
类型安全转换路径，与 Anthropic Messages 端点架构对齐：

- 在 apicompat 包新增 Chat Completions 完整类型定义和双向转换器
- 新增 ForwardAsChatCompletions service 方法，走 Responses API 上游
- Handler 改为独立的账号选择/failover 循环，不再劫持 Responses handler
- 提取 handleCompatErrorResponse 为 Chat Completions 和 Messages 共用
- 删除旧的 forwardChatCompletions 直传路径及相关死代码

											
										
										
											2026-03-11 22:10:22 +08:00
+								// compatErrorWriter is the signature for format-specific error writers used by
 								// the compat paths (Chat Completions and Anthropic Messages).
 								//
 								// A writer receives the request context, the HTTP status code to send to the
 								// client, and the error type and human-readable message for the response.
 								// How those values are rendered is up to each implementation; the writers
 								// themselves are defined elsewhere.
 								type compatErrorWriter func(c *gin.Context, statusCode int, errType, message string)
 								// handleCompatErrorResponse converts a failed upstream response into a
 								// client-facing error for the Chat Completions and Anthropic Messages compat
 								// paths. The final write always goes through writeError so each path keeps its
 								// own wire format.
 								//
 								// Processing order:
 								//  1. Read at most 2 MiB of the upstream body, derive a sanitized message and
 								//     record it with setOpsUpstreamError.
 								//  2. If an error passthrough rule matches, write the rule's response.
 								//  3. If the account does not handle this status code, record an ops event
 								//     and write a generic 500 that hides upstream details.
 								//  4. Otherwise hand the error to the rate-limit service (when configured);
 								//     if it asks for failover, return *UpstreamFailoverError without writing
 								//     to the client.
 								//  5. Else write the upstream status code and message to the client.
 								//
 								// The returned *OpenAIForwardResult is always nil and the error is always
 								// non-nil.
 								func (s *OpenAIGatewayService) handleCompatErrorResponse(
 									resp *http.Response,
 									c *gin.Context,
 									account *Account,
 									writeError compatErrorWriter,
 								) (*OpenAIForwardResult, error) {
 									code := resp.StatusCode
 									// A read error is ignored on purpose: whatever was read is still used.
 									payload, _ := io.ReadAll(io.LimitReader(resp.Body, 2<<20))

 									msg := strings.TrimSpace(extractUpstreamErrorMessage(payload))
 									if msg == "" {
 										msg = fmt.Sprintf("Upstream error: %d", code)
 									}
 									msg = sanitizeUpstreamErrorMessage(msg)

 									// The raw body is only kept for ops diagnostics when explicitly enabled.
 									var detail string
 									if s.cfg != nil && s.cfg.Gateway.LogUpstreamErrorBody {
 										limit := s.cfg.Gateway.LogUpstreamErrorBodyMaxBytes
 										if limit <= 0 {
 											limit = 2048
 										}
 										detail = truncateString(string(payload), limit)
 									}
 									setOpsUpstreamError(c, code, msg, detail)

 									// recordEvent appends one upstream error event of the given kind.
 									recordEvent := func(kind string) {
 										appendOpsUpstreamError(c, OpsUpstreamErrorEvent{
 											Platform:           account.Platform,
 											AccountID:          account.ID,
 											AccountName:        account.Name,
 											UpstreamStatusCode: code,
 											UpstreamRequestID:  resp.Header.Get("x-request-id"),
 											Kind:               kind,
 											Message:            msg,
 											Detail:             detail,
 										})
 									}

 									// Error passthrough rules take precedence over everything else.
 									ruleStatus, ruleType, ruleMsg, ruleHit := applyErrorPassthroughRule(
 										c, account.Platform, code, payload,
 										http.StatusBadGateway, "api_error", "Upstream request failed",
 									)
 									if ruleHit {
 										writeError(c, ruleStatus, ruleType, ruleMsg)
 										reported := msg
 										if reported == "" {
 											reported = ruleMsg
 										}
 										if reported == "" {
 											return nil, fmt.Errorf("upstream error: %d (passthrough rule matched)", code)
 										}
 										return nil, fmt.Errorf("upstream error: %d (passthrough rule matched) message=%s", code, reported)
 									}

 									// Status codes outside the account's custom error codes get a generic
 									// response so upstream details are not exposed.
 									if !account.ShouldHandleErrorCode(code) {
 										recordEvent("http_error")
 										writeError(c, http.StatusInternalServerError, "api_error", "Upstream gateway error")
 										if msg == "" {
 											return nil, fmt.Errorf("upstream error: %d (not in custom error codes)", code)
 										}
 										return nil, fmt.Errorf("upstream error: %d (not in custom error codes) message=%s", code, msg)
 									}

 									// Let the rate-limit service track the error and decide on failover.
 									failover := s.rateLimitService != nil &&
 										s.rateLimitService.HandleUpstreamError(c.Request.Context(), account, code, resp.Header, payload)
 									if failover {
 										recordEvent("failover")
 										return nil, &UpstreamFailoverError{
 											StatusCode:             code,
 											ResponseBody:           payload,
 											RetryableOnSameAccount: account.IsPoolMode() && isPoolModeRetryableStatus(code),
 										}
 									}
 									recordEvent("http_error")

 									// Pick the error type for the upstream status; anything unlisted is api_error.
 									var errType string
 									switch code {
 									case http.StatusBadRequest:
 										errType = "invalid_request_error"
 									case http.StatusNotFound:
 										errType = "not_found_error"
 									case http.StatusTooManyRequests:
 										errType = "rate_limit_error"
 									default:
 										errType = "api_error"
 									}
 									writeError(c, code, errType, msg)
 									return nil, fmt.Errorf("upstream error: %d %s", code, msg)
 								}
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+								// openaiStreamingResult streaming response result
 								type openaiStreamingResult struct {
 									// usage is the usage collected while reading the upstream stream.
 									usage        *OpenAIUsage
 									// firstTokenMs stays nil until the first client-visible output is seen.
 									// NOTE(review): presumably milliseconds from request start to first
 									// token (TTFT) — confirm where it is assigned.
 									firstTokenMs *int
 								}
-												refactor: 调整项目结构为单向依赖

											
										
										
											2025-12-26 15:40:24 +08:00
+								func (s *OpenAIGatewayService) handleStreamingResponse(ctx context.Context, resp *http.Response, c *gin.Context, account *Account, startTime time.Time, originalModel, mappedModel string) (*openaiStreamingResult, error) {
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+									if s.responseHeaderFilter != nil {
 										responseheaders.WriteFilteredHeaders(c.Writer.Header(), resp.Header, s.responseHeaderFilter)
-												feat(安全): 添加安全开关并完善测试流程

实现安全开关默认关闭与响应头透传逻辑
- URL 校验与响应头过滤支持开关并覆盖流式路径
- 非流式 Content-Type 透传/默认值按配置生效
- 接入 go test、golangci-lint 与前端 lint/typecheck
- 补充相关测试与配置/文档说明

											
										
										
											2026-01-05 13:54:43 +08:00
+									}
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									// Set SSE response headers
 									c.Header("Content-Type", "text/event-stream")
 									c.Header("Cache-Control", "no-cache")
 									c.Header("Connection", "keep-alive")
 									c.Header("X-Accel-Buffering", "no")
 									// Pass through other headers
 									if v := resp.Header.Get("x-request-id"); v != "" {
 										c.Header("x-request-id", v)
 									}
 									w := c.Writer
 									flusher, ok := w.(http.Flusher)
 									if !ok {
 										return nil, errors.New("streaming not supported")
 									}
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+									bufferedWriter := bufio.NewWriterSize(w, 4*1024)
 									flushBuffered := func() error {
 										if err := bufferedWriter.Flush(); err != nil {
 											return err
 										}
 										flusher.Flush()
 										return nil
 									}
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
 									usage := &OpenAIUsage{}
 									var firstTokenMs *int
 									scanner := bufio.NewScanner(resp.Body)
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
+									maxLineSize := defaultMaxLineSize
 									if s.cfg != nil && s.cfg.Gateway.MaxLineSize > 0 {
 										maxLineSize = s.cfg.Gateway.MaxLineSize
 									}
-												perf(service): SSE Scanner buffer 改用 sync.Pool 复用，减少高并发 GC 压力

将流式响应中 bufio.Scanner 的 64KB buffer 从每次 make 分配改为
sync.Pool 复用，统一切片表达式为 [:0]、变量命名为 scanBuf，
并补充对应的单元测试。

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-06 22:55:12 +08:00
+									scanBuf := getSSEScannerBuf64K()
 									scanner.Buffer(scanBuf[:0], maxLineSize)
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
 									streamInterval := time.Duration(0)
 									if s.cfg != nil && s.cfg.Gateway.StreamDataIntervalTimeout > 0 {
 										streamInterval = time.Duration(s.cfg.Gateway.StreamDataIntervalTimeout) * time.Second
 									}
-												fix(流式): 以上游读取判定超时并调大事件缓冲

- 以读取时间戳判定流式间隔超时，避免下游阻塞误判
- antigravity 流式读取使用 MaxLineSize 配置
- 事件通道缓冲提升到 16

测试: go test ./...

											
										
										
											2026-01-04 20:19:07 +08:00
+									// 仅监控上游数据间隔超时，不被下游写入阻塞影响
 									var intervalTicker *time.Ticker
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
+									if streamInterval > 0 {
-												fix(流式): 以上游读取判定超时并调大事件缓冲

- 以读取时间戳判定流式间隔超时，避免下游阻塞误判
- antigravity 流式读取使用 MaxLineSize 配置
- 事件通道缓冲提升到 16

测试: go test ./...

											
										
										
											2026-01-04 20:19:07 +08:00
+										intervalTicker = time.NewTicker(streamInterval)
 										defer intervalTicker.Stop()
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
+									}
 									var intervalCh <-chan time.Time
-												fix(流式): 以上游读取判定超时并调大事件缓冲

- 以读取时间戳判定流式间隔超时，避免下游阻塞误判
- antigravity 流式读取使用 MaxLineSize 配置
- 事件通道缓冲提升到 16

测试: go test ./...

											
										
										
											2026-01-04 20:19:07 +08:00
+									if intervalTicker != nil {
 										intervalCh = intervalTicker.C
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
+									}
 									keepaliveInterval := time.Duration(0)
 									if s.cfg != nil && s.cfg.Gateway.StreamKeepaliveInterval > 0 {
 										keepaliveInterval = time.Duration(s.cfg.Gateway.StreamKeepaliveInterval) * time.Second
 									}
 									// 下游 keepalive 仅用于防止代理空闲断开
 									var keepaliveTicker *time.Ticker
 									if keepaliveInterval > 0 {
 										keepaliveTicker = time.NewTicker(keepaliveInterval)
 										defer keepaliveTicker.Stop()
 									}
 									var keepaliveCh <-chan time.Time
 									if keepaliveTicker != nil {
 										keepaliveCh = keepaliveTicker.C
 									}
-												fix(openai): keep responses stream alive during pre-output failover

											
										
										
											2026-04-25 12:11:27 +00:00
+									// Track downstream writes separately from upstream reads: pre-output failover
 									// can buffer response.created / response.in_progress, so keepalive must be
 									// based on downstream idle time.
 									lastDownstreamWriteAt := time.Now()
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
-												fix(openai): emit OpenAI-compatible SSE error events

											
										
										
											2026-01-19 13:53:39 +08:00
+									// 仅发送一次错误事件，避免多次写入导致协议混乱。
 									// 注意：OpenAI `/v1/responses` streaming 事件必须符合 OpenAI Responses schema；
 									// 否则下游 SDK（例如 OpenCode）会因为类型校验失败而报错。
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
+									errorEventSent := false
-												fix(gateway): drain upstream after client disconnect

											
										
										
											2026-01-15 21:51:14 +08:00
+									clientDisconnected := false // 客户端断开后继续 drain 上游以收集 usage
-												feat: decouple billing correctness from usage log batching

											
										
										
											2026-03-12 16:53:18 +08:00
+									sawTerminalEvent := false
-												fix(openai): fail over before responses stream output

											
										
										
											2026-04-25 15:09:40 +08:00
+									sawFailedEvent := false
 									failedMessage := ""
 									clientOutputStarted := false
 									upstreamRequestID := strings.TrimSpace(resp.Header.Get("x-request-id"))
 									var streamFailoverErr error
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
+									sendErrorEvent := func(reason string) {
-												fix(gateway): drain upstream after client disconnect

											
										
										
											2026-01-15 21:51:14 +08:00
+										if errorEventSent || clientDisconnected {
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
+											return
 										}
 										errorEventSent = true
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+										payload := `{"type":"error","sequence_number":0,"error":{"type":"upstream_error","message":` + strconv.Quote(reason) + `,"code":` + strconv.Quote(reason) + `}}`
 										if err := flushBuffered(); err != nil {
 											clientDisconnected = true
 											return
 										}
 										if _, err := bufferedWriter.WriteString("data: " + payload + "\n\n"); err != nil {
 											clientDisconnected = true
 											return
-												fix(openai): emit OpenAI-compatible SSE error events

											
										
										
											2026-01-19 13:53:39 +08:00
+										}
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+										if err := flushBuffered(); err != nil {
 											clientDisconnected = true
-												fix(openai): fail over before responses stream output

											
										
										
											2026-04-25 15:09:40 +08:00
+											return
-												fix(openai): emit OpenAI-compatible SSE error events

											
										
										
											2026-01-19 13:53:39 +08:00
+										}
-												fix(openai): fail over before responses stream output

											
										
										
											2026-04-25 15:09:40 +08:00
+										clientOutputStarted = true
-												fix(openai): keep responses stream alive during pre-output failover

											
										
										
											2026-04-25 12:11:27 +00:00
+										lastDownstreamWriteAt = time.Now()
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
+									}
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
 									needModelReplace := originalModel != mappedModel
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+									resultWithUsage := func() *openaiStreamingResult {
 										return &openaiStreamingResult{usage: usage, firstTokenMs: firstTokenMs}
 									}
 									finalizeStream := func() (*openaiStreamingResult, error) {
-												fix(openai): fail over before responses stream output

											
										
										
											2026-04-25 15:09:40 +08:00
+										if !sawTerminalEvent {
 											if !openAIStreamClientOutputStarted(c, clientOutputStarted) {
 												return resultWithUsage(), s.newOpenAIStreamFailoverError(
 													c,
 													account,
 													false,
 													upstreamRequestID,
 													nil,
 													"OpenAI stream ended before a terminal event",
 												)
 											}
 											return resultWithUsage(), fmt.Errorf("stream usage incomplete: missing terminal event")
 										}
 										if sawFailedEvent {
 											return resultWithUsage(), fmt.Errorf("upstream response failed: %s", failedMessage)
 										}
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+										if !clientDisconnected {
-												fix(openai): fail over before responses stream output

											
										
										
											2026-04-25 15:09:40 +08:00
+											hadBufferedData := bufferedWriter.Buffered() > 0
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+											if err := flushBuffered(); err != nil {
 												clientDisconnected = true
 												logger.LegacyPrintf("service.openai_gateway", "Client disconnected during final flush, returning collected usage")
-												fix(openai): fail over before responses stream output

											
										
										
											2026-04-25 15:09:40 +08:00
+											} else if hadBufferedData {
 												clientOutputStarted = true
-												fix(openai): keep responses stream alive during pre-output failover

											
										
										
											2026-04-25 12:11:27 +00:00
+												lastDownstreamWriteAt = time.Now()
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
+											}
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+										}
 										return resultWithUsage(), nil
 									}
 									handleScanErr := func(scanErr error) (*openaiStreamingResult, error, bool) {
 										if scanErr == nil {
 											return nil, nil, false
 										}
-												fix(openai): fail over before responses stream output

											
										
										
											2026-04-25 15:09:40 +08:00
+										if sawTerminalEvent && !sawFailedEvent {
-												feat: decouple billing correctness from usage log batching

											
										
										
											2026-03-12 16:53:18 +08:00
+											logger.LegacyPrintf("service.openai_gateway", "Upstream scan ended after terminal event: %v", scanErr)
 											return resultWithUsage(), nil, true
 										}
-												fix(openai): fail over before responses stream output

											
										
										
											2026-04-25 15:09:40 +08:00
+										if sawFailedEvent {
 											return resultWithUsage(), fmt.Errorf("upstream response failed: %s", failedMessage), true
 										}
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+										// 客户端断开/取消请求时，上游读取往往会返回 context canceled。
 										// /v1/responses 的 SSE 事件必须符合 OpenAI 协议；这里不注入自定义 error event，避免下游 SDK 解析失败。
 										if errors.Is(scanErr, context.Canceled) || errors.Is(scanErr, context.DeadlineExceeded) {
-												feat: decouple billing correctness from usage log batching

											
										
										
											2026-03-12 16:53:18 +08:00
+											return resultWithUsage(), fmt.Errorf("stream usage incomplete: %w", scanErr), true
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+										}
 										if errors.Is(scanErr, bufio.ErrTooLong) {
 											logger.LegacyPrintf("service.openai_gateway", "SSE line too long: account=%d max_size=%d error=%v", account.ID, maxLineSize, scanErr)
 											sendErrorEvent("response_too_large")
 											return resultWithUsage(), scanErr, true
 										}
-												fix(openai): fail over before responses stream output

											
										
										
											2026-04-25 15:09:40 +08:00
+										if !openAIStreamClientOutputStarted(c, clientOutputStarted) {
 											msg := "OpenAI stream disconnected before completion"
 											if errText := strings.TrimSpace(scanErr.Error()); errText != "" {
 												msg += ": " + errText
 											}
 											return resultWithUsage(), s.newOpenAIStreamFailoverError(c, account, false, upstreamRequestID, nil, msg), true
 										}
 										// 客户端已断开时，上游出错仅影响体验，不影响计费；返回已收集 usage
 										if clientDisconnected {
 											return resultWithUsage(), fmt.Errorf("stream usage incomplete after disconnect: %w", scanErr), true
 										}
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+										sendErrorEvent("stream_read_error")
 										return resultWithUsage(), fmt.Errorf("stream read error: %w", scanErr), true
 									}
 									processSSELine := func(line string, queueDrained bool) {
-												fix(openai): fail over before responses stream output

											
										
										
											2026-04-25 15:09:40 +08:00
+										if streamFailoverErr != nil {
 											return
 										}
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+										// Extract data from SSE line (supports both "data: " and "data:" formats)
 										if data, ok := extractOpenAISSEDataLine(line); ok {
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+											// Replace model in response if needed.
 											// Fast path: most events do not contain model field values.
 											if needModelReplace && mappedModel != "" && strings.Contains(data, mappedModel) {
 												line = s.replaceModelInSSELine(line, mappedModel, originalModel)
 											}
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+											dataBytes := []byte(data)
-												feat: decouple billing correctness from usage log batching

											
										
										
											2026-03-12 16:53:18 +08:00
+											if openAIStreamEventIsTerminal(data) {
 												sawTerminalEvent = true
 											}
-												fix(openai): fail over before responses stream output

											
										
										
											2026-04-25 15:09:40 +08:00
+											eventType := strings.TrimSpace(gjson.GetBytes(dataBytes, "type").String())
 											forceFlushFailedEvent := false
 											if eventType == "response.failed" {
 												failedMessage = extractOpenAISSEErrorMessage(dataBytes)
 												if !openAIStreamClientOutputStarted(c, clientOutputStarted) && openAIStreamFailedEventShouldFailover(dataBytes, failedMessage) {
 													sawFailedEvent = true
 													streamFailoverErr = s.newOpenAIStreamFailoverError(c, account, false, upstreamRequestID, dataBytes, failedMessage)
 													return
 												}
 												forceFlushFailedEvent = true
 												sawFailedEvent = true
 											}
-												feat(openai): 添加Codex工具调用自动修正功能

实现了完整的Codex工具调用拦截和自动修正系统，解决OpenCode使用Codex模型时的工具调用兼容性问题。

**核心功能:**

1. **工具名称自动映射**
   - apply_patch/applyPatch → edit
   - update_plan/updatePlan → todowrite
   - read_plan/readPlan → todoread
   - search_files/searchFiles → grep
   - list_files/listFiles → glob
   - read_file/readFile → read
   - write_file/writeFile → write
   - execute_bash/executeBash/exec_bash/execBash → bash

2. **工具参数自动修正**
   - bash: 自动移除不支持的 workdir/work_dir 参数
   - edit: 自动将 path 参数重命名为 file_path
   - 支持 JSON 字符串和对象两种参数格式

3. **流式响应集成**
   - 在 SSE 数据流中实时修正工具调用
   - 支持多种 JSON 结构（tool_calls, function_call, delta, choices等）
   - 不影响响应性能和用户体验

4. **统计和监控**
   - 记录每次工具修正的详细信息
   - 提供修正统计数据查询
   - 便于问题排查和性能优化

**实现文件:**
- `openai_tool_corrector.go`: 工具修正核心逻辑（250行）
- `openai_tool_corrector_test.go`: 完整的单元测试（380+行）
- `openai_gateway_service.go`: 流式响应集成
- `openai_gateway_service_tool_correction_test.go`: 集成测试

**测试覆盖:**
- 工具名称映射测试（18个映射规则）
- 参数修正测试（bash workdir、edit path等）
- SSE数据修正测试（多种JSON结构）
- 统计功能测试
- 所有测试通过 ✅

**解决的问题:**
修复了 OpenCode 使用 sub2api 中转 Codex 时，因工具名称和参数不兼容导致的工具调用失败问题。
Codex 模型有时会忽略指令文件中的工具映射说明，导致调用不存在的工具（如 apply_patch）。
现在通过流式响应拦截，自动将错误的工具调用修正为 OpenCode 兼容的格式。

**参考文档:**
- OpenCode 工具规范: https://opencode.ai/docs/
- Codex Bridge 指令: backend/internal/service/prompts/codex_opencode_bridge.txt

											
										
										
											2026-01-15 23:52:50 +08:00
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+											// Correct Codex tool calls if needed (apply_patch -> edit, etc.)
 											if correctedData, corrected := s.toolCorrector.CorrectToolCallsInSSEBytes(dataBytes); corrected {
 												dataBytes = correctedData
 												data = string(correctedData)
 												line = "data: " + data
-												fix(openai): fail over before responses stream output

											
										
										
											2026-04-25 15:09:40 +08:00
+												eventType = strings.TrimSpace(gjson.GetBytes(dataBytes, "type").String())
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+											}
-												fix(openai): fail over before responses stream output

											
										
										
											2026-04-25 15:09:40 +08:00
+											startsClientOutput := forceFlushFailedEvent || openAIStreamDataStartsClientOutput(data, eventType)
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+											// 写入客户端（客户端断开后继续 drain 上游）
 											if !clientDisconnected {
-												fix(openai): fail over before responses stream output

											
										
										
											2026-04-25 15:09:40 +08:00
+												shouldFlush := queueDrained && (clientOutputStarted || startsClientOutput)
 												if firstTokenMs == nil && startsClientOutput {
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+													// 保证首个 token 事件尽快出站，避免影响 TTFT。
 													shouldFlush = true
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
+												}
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+												if _, err := bufferedWriter.WriteString(line); err != nil {
 													clientDisconnected = true
 													logger.LegacyPrintf("service.openai_gateway", "Client disconnected during streaming, continuing to drain upstream for billing")
 												} else if _, err := bufferedWriter.WriteString("\n"); err != nil {
 													clientDisconnected = true
 													logger.LegacyPrintf("service.openai_gateway", "Client disconnected during streaming, continuing to drain upstream for billing")
 												} else if shouldFlush {
 													if err := flushBuffered(); err != nil {
-												fix(gateway): drain upstream after client disconnect

											
										
										
											2026-01-15 21:51:14 +08:00
+														clientDisconnected = true
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+														logger.LegacyPrintf("service.openai_gateway", "Client disconnected during streaming flush, continuing to drain upstream for billing")
-												fix(openai): fail over before responses stream output

											
										
										
											2026-04-25 15:09:40 +08:00
+													} else {
 														clientOutputStarted = true
-												fix(openai): keep responses stream alive during pre-output failover

											
										
										
											2026-04-25 12:11:27 +00:00
+														lastDownstreamWriteAt = time.Now()
-												fix(gateway): drain upstream after client disconnect

											
										
										
											2026-01-15 21:51:14 +08:00
+													}
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
+												}
-												fix(sse): 修复非标准 SSE 格式解析问题

部分上游 API 返回的 SSE 格式不符合标准规范：
- 标准格式: `data: {...}`（冒号后有空格）
- 非标准格式: `data:{...}`（冒号后无空格）

使用预编译正则 `^data:\s*` 统一处理两种格式。

											
										
										
											2025-12-26 03:49:55 -08:00
+											}
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+											// Record first token time
-												fix(openai): fail over before responses stream output

											
										
										
											2026-04-25 15:09:40 +08:00
+											if firstTokenMs == nil && startsClientOutput {
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+												ms := int(time.Since(startTime).Milliseconds())
 												firstTokenMs = &ms
 											}
 											s.parseSSEUsageBytes(dataBytes, usage)
 											return
 										}
 										// Forward non-data lines as-is
 										if !clientDisconnected {
 											if _, err := bufferedWriter.WriteString(line); err != nil {
 												clientDisconnected = true
 												logger.LegacyPrintf("service.openai_gateway", "Client disconnected during streaming, continuing to drain upstream for billing")
 											} else if _, err := bufferedWriter.WriteString("\n"); err != nil {
 												clientDisconnected = true
 												logger.LegacyPrintf("service.openai_gateway", "Client disconnected during streaming, continuing to drain upstream for billing")
-												fix(openai): fail over before responses stream output

											
										
										
											2026-04-25 15:09:40 +08:00
+											} else if queueDrained && clientOutputStarted {
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+												if err := flushBuffered(); err != nil {
 													clientDisconnected = true
 													logger.LegacyPrintf("service.openai_gateway", "Client disconnected during streaming flush, continuing to drain upstream for billing")
-												fix(openai): fail over before responses stream output

											
										
										
											2026-04-25 15:09:40 +08:00
+												} else {
 													clientOutputStarted = true
-												fix(openai): keep responses stream alive during pre-output failover

											
										
										
											2026-04-25 12:11:27 +00:00
+													lastDownstreamWriteAt = time.Now()
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+												}
 											}
 										}
 									}
 									// 无超时/无 keepalive 的常见路径走同步扫描，减少 goroutine 与 channel 开销。
 									if streamInterval <= 0 && keepaliveInterval <= 0 {
 										defer putSSEScannerBuf64K(scanBuf)
 										for scanner.Scan() {
 											processSSELine(scanner.Text(), true)
-												fix(openai): fail over before responses stream output

											
										
										
											2026-04-25 15:09:40 +08:00
+											if streamFailoverErr != nil {
 												return resultWithUsage(), streamFailoverErr
 											}
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+										}
 										if result, err, done := handleScanErr(scanner.Err()); done {
 											return result, err
 										}
 										return finalizeStream()
 									}
 									type scanEvent struct {
 										line string
 										err  error
 									}
 									// 独立 goroutine 读取上游，避免读取阻塞影响 keepalive/超时处理
 									events := make(chan scanEvent, 16)
 									done := make(chan struct{})
 									sendEvent := func(ev scanEvent) bool {
 										select {
 										case events <- ev:
 											return true
 										case <-done:
 											return false
 										}
 									}
 									var lastReadAt int64
 									atomic.StoreInt64(&lastReadAt, time.Now().UnixNano())
 									go func(scanBuf *sseScannerBuf64K) {
 										defer putSSEScannerBuf64K(scanBuf)
 										defer close(events)
 										for scanner.Scan() {
 											atomic.StoreInt64(&lastReadAt, time.Now().UnixNano())
 											if !sendEvent(scanEvent{line: scanner.Text()}) {
 												return
 											}
 										}
 										if err := scanner.Err(); err != nil {
 											_ = sendEvent(scanEvent{err: err})
 										}
 									}(scanBuf)
 									defer close(done)
 									for {
 										select {
 										case ev, ok := <-events:
 											if !ok {
 												return finalizeStream()
 											}
 											if result, err, done := handleScanErr(ev.err); done {
 												return result, err
 											}
 											processSSELine(ev.line, len(events) == 0)
-												fix(openai): fail over before responses stream output

											
										
										
											2026-04-25 15:09:40 +08:00
+											if streamFailoverErr != nil {
 												return resultWithUsage(), streamFailoverErr
 											}
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
+										case <-intervalCh:
-												fix(流式): 以上游读取判定超时并调大事件缓冲

- 以读取时间戳判定流式间隔超时，避免下游阻塞误判
- antigravity 流式读取使用 MaxLineSize 配置
- 事件通道缓冲提升到 16

测试: go test ./...

											
										
										
											2026-01-04 20:19:07 +08:00
+											lastRead := time.Unix(0, atomic.LoadInt64(&lastReadAt))
 											if time.Since(lastRead) < streamInterval {
 												continue
 											}
-												fix(gateway): drain upstream after client disconnect

											
										
										
											2026-01-15 21:51:14 +08:00
+											if clientDisconnected {
-												feat: decouple billing correctness from usage log batching

											
										
										
											2026-03-12 16:53:18 +08:00
+												return resultWithUsage(), fmt.Errorf("stream usage incomplete after timeout")
-												fix(gateway): drain upstream after client disconnect

											
										
										
											2026-01-15 21:51:14 +08:00
+											}
-												chore(logging): 完成后端日志审计与结构化迁移

- 将高密度服务与处理器日志迁移到新日志系统（LegacyPrintf/结构化日志）
- 增加 stdlog bridge 与兼容测试，保留旧日志捕获能力
- 将 OpenAI 断流告警改为结构化 Warn 并改造对应测试为 sink 捕获
- 补齐后端相关文件 logger 引用并通过全量 go test

											
										
										
											2026-02-12 19:01:09 +08:00
+											logger.LegacyPrintf("service.openai_gateway", "Stream data interval timeout: account=%d model=%s interval=%s", account.ID, originalModel, streamInterval)
-												feat(gateway): 添加流超时处理机制

- 添加 StreamTimeoutSettings 配置结构体和系统设置
- 实现 TimeoutCounterCache Redis 计数器用于累计超时次数
- 在 RateLimitService 添加 HandleStreamTimeout 方法
- 在 gateway_service、openai_gateway_service、antigravity_gateway_service 中调用超时处理
- 添加后端 API 端点 GET/PUT /admin/settings/stream-timeout
- 添加前端配置界面到系统设置页面
- 支持配置：启用开关、超时阈值、处理方式、暂停时长、触发阈值、阈值窗口

默认配置：
- 启用：true
- 超时阈值：60秒
- 处理方式：临时不可调度
- 暂停时长：5分钟
- 触发阈值：3次
- 阈值窗口：10分钟

											
										
										
											2026-01-11 21:54:52 -08:00
+											// 处理流超时，可能标记账户为临时不可调度或错误状态
 											if s.rateLimitService != nil {
 												s.rateLimitService.HandleStreamTimeout(ctx, account, originalModel)
 											}
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
+											sendErrorEvent("stream_timeout")
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+											return resultWithUsage(), fmt.Errorf("stream data interval timeout")
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
 										case <-keepaliveCh:
-												fix(gateway): drain upstream after client disconnect

											
										
										
											2026-01-15 21:51:14 +08:00
+											if clientDisconnected {
 												continue
 											}
-												fix(openai): keep responses stream alive during pre-output failover

											
										
										
											2026-04-25 12:11:27 +00:00
+											if time.Since(lastDownstreamWriteAt) < keepaliveInterval {
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
+												continue
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+											}
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+											if _, err := bufferedWriter.WriteString(":\n\n"); err != nil {
-												fix(gateway): drain upstream after client disconnect

											
										
										
											2026-01-15 21:51:14 +08:00
+												clientDisconnected = true
-												chore(logging): 完成后端日志审计与结构化迁移

- 将高密度服务与处理器日志迁移到新日志系统（LegacyPrintf/结构化日志）
- 增加 stdlog bridge 与兼容测试，保留旧日志捕获能力
- 将 OpenAI 断流告警改为结构化 Warn 并改造对应测试为 sink 捕获
- 补齐后端相关文件 logger 引用并通过全量 go test

											
										
										
											2026-02-12 19:01:09 +08:00
+												logger.LegacyPrintf("service.openai_gateway", "Client disconnected during streaming, continuing to drain upstream for billing")
-												fix(gateway): drain upstream after client disconnect

											
										
										
											2026-01-15 21:51:14 +08:00
+												continue
-												fix(sse): 修复非标准 SSE 格式解析问题

部分上游 API 返回的 SSE 格式不符合标准规范：
- 标准格式: `data: {...}`（冒号后有空格）
- 非标准格式: `data:{...}`（冒号后无空格）

使用预编译正则 `^data:\s*` 统一处理两种格式。

											
										
										
											2025-12-26 03:49:55 -08:00
+											}
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+											if err := flushBuffered(); err != nil {
 												clientDisconnected = true
 												logger.LegacyPrintf("service.openai_gateway", "Client disconnected during keepalive flush, continuing to drain upstream for billing")
-												fix(openai): keep responses stream alive during pre-output failover

											
										
										
											2026-04-25 12:11:27 +00:00
+											} else {
 												lastDownstreamWriteAt = time.Now()
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+											}
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+										}
 									}
 								}
-												feat(openai): 极致优化 OAuth 链路并补齐性能守护

- 优化 /v1/responses 热路径，减少重复解析与不必要拷贝\n- 优化并发与 token 竞争路径并补齐运行指标\n- 补充 OpenAI/Ops 相关单元测试与回归用例\n- 新增灰度阈值守护与压测脚本，支撑发布验收

											
										
										
											2026-02-12 09:41:37 +08:00
+								// extractOpenAISSEDataLine 低开销提取 SSE `data:` 行内容。
 								// 兼容 `data: xxx` 与 `data:xxx` 两种格式。
 								func extractOpenAISSEDataLine(line string) (string, bool) {
 									if !strings.HasPrefix(line, "data:") {
 										return "", false
 									}
 									start := len("data:")
 									for start < len(line) {
 										if line[start] != ' ' && line[start] != '	' {
 											break
 										}
 										start++
 									}
 									return line[start:], true
 								}
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+								func (s *OpenAIGatewayService) replaceModelInSSELine(line, fromModel, toModel string) string {
-												feat(openai): 极致优化 OAuth 链路并补齐性能守护

- 优化 /v1/responses 热路径，减少重复解析与不必要拷贝\n- 优化并发与 token 竞争路径并补齐运行指标\n- 补充 OpenAI/Ops 相关单元测试与回归用例\n- 新增灰度阈值守护与压测脚本，支撑发布验收

											
										
										
											2026-02-12 09:41:37 +08:00
+									data, ok := extractOpenAISSEDataLine(line)
 									if !ok {
-												fix(sse): 修复非标准 SSE 格式解析问题

部分上游 API 返回的 SSE 格式不符合标准规范：
- 标准格式: `data: {...}`（冒号后有空格）
- 非标准格式: `data:{...}`（冒号后无空格）

使用预编译正则 `^data:\s*` 统一处理两种格式。

											
										
										
											2025-12-26 03:49:55 -08:00
+										return line
 									}
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									if data == "" || data == "[DONE]" {
 										return line
 									}
-												perf(service): 优化 model 替换函数，用 gjson/sjson 替代全量 JSON 序列化

SSE 热路径中 replaceModelInSSELine 和 replaceModelInResponseBody 原来
使用 json.Unmarshal/Marshal 对每个事件做全量反序列化再序列化，现改为
gjson.Get/sjson.Set 精确字段操作，消除 O(n) 中间 map 分配，保持 JSON
字段顺序不变。涉及 OpenAIGatewayService 和 GatewayService 两个服务。

新增 23 个单元测试覆盖：顶层/嵌套 model 替换、不匹配跳过、空行/[DONE]/
非法 JSON 等边界情况。

Fixes: P1-08

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-07 17:09:55 +08:00
+									// 使用 gjson 精确检查 model 字段，避免全量 JSON 反序列化
 									if m := gjson.Get(data, "model"); m.Exists() && m.Str == fromModel {
 										newData, err := sjson.Set(data, "model", toModel)
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+										if err != nil {
 											return line
 										}
-												perf(service): 优化 model 替换函数，用 gjson/sjson 替代全量 JSON 序列化

SSE 热路径中 replaceModelInSSELine 和 replaceModelInResponseBody 原来
使用 json.Unmarshal/Marshal 对每个事件做全量反序列化再序列化，现改为
gjson.Get/sjson.Set 精确字段操作，消除 O(n) 中间 map 分配，保持 JSON
字段顺序不变。涉及 OpenAIGatewayService 和 GatewayService 两个服务。

新增 23 个单元测试覆盖：顶层/嵌套 model 替换、不匹配跳过、空行/[DONE]/
非法 JSON 等边界情况。

Fixes: P1-08

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-07 17:09:55 +08:00
+										return "data: " + newData
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									}
-												perf(service): 优化 model 替换函数，用 gjson/sjson 替代全量 JSON 序列化

SSE 热路径中 replaceModelInSSELine 和 replaceModelInResponseBody 原来
使用 json.Unmarshal/Marshal 对每个事件做全量反序列化再序列化，现改为
gjson.Get/sjson.Set 精确字段操作，消除 O(n) 中间 map 分配，保持 JSON
字段顺序不变。涉及 OpenAIGatewayService 和 GatewayService 两个服务。

新增 23 个单元测试覆盖：顶层/嵌套 model 替换、不匹配跳过、空行/[DONE]/
非法 JSON 等边界情况。

Fixes: P1-08

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-07 17:09:55 +08:00
+									// 检查嵌套的 response.model 字段
 									if m := gjson.Get(data, "response.model"); m.Exists() && m.Str == fromModel {
 										newData, err := sjson.Set(data, "response.model", toModel)
 										if err != nil {
 											return line
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+										}
-												perf(service): 优化 model 替换函数，用 gjson/sjson 替代全量 JSON 序列化

SSE 热路径中 replaceModelInSSELine 和 replaceModelInResponseBody 原来
使用 json.Unmarshal/Marshal 对每个事件做全量反序列化再序列化，现改为
gjson.Get/sjson.Set 精确字段操作，消除 O(n) 中间 map 分配，保持 JSON
字段顺序不变。涉及 OpenAIGatewayService 和 GatewayService 两个服务。

新增 23 个单元测试覆盖：顶层/嵌套 model 替换、不匹配跳过、空行/[DONE]/
非法 JSON 等边界情况。

Fixes: P1-08

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-07 17:09:55 +08:00
+										return "data: " + newData
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									}
 									return line
 								}
-												feat(openai): 添加Codex工具调用自动修正功能

实现了完整的Codex工具调用拦截和自动修正系统，解决OpenCode使用Codex模型时的工具调用兼容性问题。

**核心功能:**

1. **工具名称自动映射**
   - apply_patch/applyPatch → edit
   - update_plan/updatePlan → todowrite
   - read_plan/readPlan → todoread
   - search_files/searchFiles → grep
   - list_files/listFiles → glob
   - read_file/readFile → read
   - write_file/writeFile → write
   - execute_bash/executeBash/exec_bash/execBash → bash

2. **工具参数自动修正**
   - bash: 自动移除不支持的 workdir/work_dir 参数
   - edit: 自动将 path 参数重命名为 file_path
   - 支持 JSON 字符串和对象两种参数格式

3. **流式响应集成**
   - 在 SSE 数据流中实时修正工具调用
   - 支持多种 JSON 结构（tool_calls, function_call, delta, choices等）
   - 不影响响应性能和用户体验

4. **统计和监控**
   - 记录每次工具修正的详细信息
   - 提供修正统计数据查询
   - 便于问题排查和性能优化

**实现文件:**
- `openai_tool_corrector.go`: 工具修正核心逻辑（250行）
- `openai_tool_corrector_test.go`: 完整的单元测试（380+行）
- `openai_gateway_service.go`: 流式响应集成
- `openai_gateway_service_tool_correction_test.go`: 集成测试

**测试覆盖:**
- 工具名称映射测试（18个映射规则）
- 参数修正测试（bash workdir、edit path等）
- SSE数据修正测试（多种JSON结构）
- 统计功能测试
- 所有测试通过 ✅

**解决的问题:**
修复了 OpenCode 使用 sub2api 中转 Codex 时，因工具名称和参数不兼容导致的工具调用失败问题。
Codex 模型有时会忽略指令文件中的工具映射说明，导致调用不存在的工具（如 apply_patch）。
现在通过流式响应拦截，自动将错误的工具调用修正为 OpenCode 兼容的格式。

**参考文档:**
- OpenCode 工具规范: https://opencode.ai/docs/
- Codex Bridge 指令: backend/internal/service/prompts/codex_opencode_bridge.txt

											
										
										
											2026-01-15 23:52:50 +08:00
+								// correctToolCallsInResponseBody 修正响应体中的工具调用
 								func (s *OpenAIGatewayService) correctToolCallsInResponseBody(body []byte) []byte {
 									if len(body) == 0 {
 										return body
 									}
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+									corrected, changed := s.toolCorrector.CorrectToolCallsInSSEBytes(body)
-												feat(openai): 添加Codex工具调用自动修正功能

实现了完整的Codex工具调用拦截和自动修正系统，解决OpenCode使用Codex模型时的工具调用兼容性问题。

**核心功能:**

1. **工具名称自动映射**
   - apply_patch/applyPatch → edit
   - update_plan/updatePlan → todowrite
   - read_plan/readPlan → todoread
   - search_files/searchFiles → grep
   - list_files/listFiles → glob
   - read_file/readFile → read
   - write_file/writeFile → write
   - execute_bash/executeBash/exec_bash/execBash → bash

2. **工具参数自动修正**
   - bash: 自动移除不支持的 workdir/work_dir 参数
   - edit: 自动将 path 参数重命名为 file_path
   - 支持 JSON 字符串和对象两种参数格式

3. **流式响应集成**
   - 在 SSE 数据流中实时修正工具调用
   - 支持多种 JSON 结构（tool_calls, function_call, delta, choices等）
   - 不影响响应性能和用户体验

4. **统计和监控**
   - 记录每次工具修正的详细信息
   - 提供修正统计数据查询
   - 便于问题排查和性能优化

**实现文件:**
- `openai_tool_corrector.go`: 工具修正核心逻辑（250行）
- `openai_tool_corrector_test.go`: 完整的单元测试（380+行）
- `openai_gateway_service.go`: 流式响应集成
- `openai_gateway_service_tool_correction_test.go`: 集成测试

**测试覆盖:**
- 工具名称映射测试（18个映射规则）
- 参数修正测试（bash workdir、edit path等）
- SSE数据修正测试（多种JSON结构）
- 统计功能测试
- 所有测试通过 ✅

**解决的问题:**
修复了 OpenCode 使用 sub2api 中转 Codex 时，因工具名称和参数不兼容导致的工具调用失败问题。
Codex 模型有时会忽略指令文件中的工具映射说明，导致调用不存在的工具（如 apply_patch）。
现在通过流式响应拦截，自动将错误的工具调用修正为 OpenCode 兼容的格式。

**参考文档:**
- OpenCode 工具规范: https://opencode.ai/docs/
- Codex Bridge 指令: backend/internal/service/prompts/codex_opencode_bridge.txt

											
										
										
											2026-01-15 23:52:50 +08:00
+									if changed {
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+										return corrected
-												feat(openai): 添加Codex工具调用自动修正功能

实现了完整的Codex工具调用拦截和自动修正系统，解决OpenCode使用Codex模型时的工具调用兼容性问题。

**核心功能:**

1. **工具名称自动映射**
   - apply_patch/applyPatch → edit
   - update_plan/updatePlan → todowrite
   - read_plan/readPlan → todoread
   - search_files/searchFiles → grep
   - list_files/listFiles → glob
   - read_file/readFile → read
   - write_file/writeFile → write
   - execute_bash/executeBash/exec_bash/execBash → bash

2. **工具参数自动修正**
   - bash: 自动移除不支持的 workdir/work_dir 参数
   - edit: 自动将 path 参数重命名为 file_path
   - 支持 JSON 字符串和对象两种参数格式

3. **流式响应集成**
   - 在 SSE 数据流中实时修正工具调用
   - 支持多种 JSON 结构（tool_calls, function_call, delta, choices等）
   - 不影响响应性能和用户体验

4. **统计和监控**
   - 记录每次工具修正的详细信息
   - 提供修正统计数据查询
   - 便于问题排查和性能优化

**实现文件:**
- `openai_tool_corrector.go`: 工具修正核心逻辑（250行）
- `openai_tool_corrector_test.go`: 完整的单元测试（380+行）
- `openai_gateway_service.go`: 流式响应集成
- `openai_gateway_service_tool_correction_test.go`: 集成测试

**测试覆盖:**
- 工具名称映射测试（18个映射规则）
- 参数修正测试（bash workdir、edit path等）
- SSE数据修正测试（多种JSON结构）
- 统计功能测试
- 所有测试通过 ✅

**解决的问题:**
修复了 OpenCode 使用 sub2api 中转 Codex 时，因工具名称和参数不兼容导致的工具调用失败问题。
Codex 模型有时会忽略指令文件中的工具映射说明，导致调用不存在的工具（如 apply_patch）。
现在通过流式响应拦截，自动将错误的工具调用修正为 OpenCode 兼容的格式。

**参考文档:**
- OpenCode 工具规范: https://opencode.ai/docs/
- Codex Bridge 指令: backend/internal/service/prompts/codex_opencode_bridge.txt

											
										
										
											2026-01-15 23:52:50 +08:00
+									}
 									return body
 								}
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+								func (s *OpenAIGatewayService) parseSSEUsage(data string, usage *OpenAIUsage) {
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+									s.parseSSEUsageBytes([]byte(data), usage)
 								}
 								func (s *OpenAIGatewayService) parseSSEUsageBytes(data []byte, usage *OpenAIUsage) {
 									if usage == nil || len(data) == 0 || bytes.Equal(data, []byte("[DONE]")) {
-												feat(openai): 极致优化 OAuth 链路并补齐性能守护

- 优化 /v1/responses 热路径，减少重复解析与不必要拷贝\n- 优化并发与 token 竞争路径并补齐运行指标\n- 补充 OpenAI/Ops 相关单元测试与回归用例\n- 新增灰度阈值守护与压测脚本，支撑发布验收

											
										
										
											2026-02-12 09:41:37 +08:00
+										return
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									}
-												feat: decouple billing correctness from usage log batching

											
										
										
											2026-03-12 16:53:18 +08:00
+									// 选择性解析：仅在数据中包含终止事件标识时才进入字段提取。
 									if len(data) < 72 {
-												feat(openai): 极致优化 OAuth 链路并补齐性能守护

- 优化 /v1/responses 热路径，减少重复解析与不必要拷贝\n- 优化并发与 token 竞争路径并补齐运行指标\n- 补充 OpenAI/Ops 相关单元测试与回归用例\n- 新增灰度阈值守护与压测脚本，支撑发布验收

											
										
										
											2026-02-12 09:41:37 +08:00
+										return
 									}
-												feat: decouple billing correctness from usage log batching

											
										
										
											2026-03-12 16:53:18 +08:00
+									eventType := gjson.GetBytes(data, "type").String()
-												fix(openai): tighten responses stream account tests

											
										
										
											2026-04-25 16:56:50 +08:00
+									if eventType != "response.completed" && eventType != "response.done" &&
 										eventType != "response.incomplete" && eventType != "response.cancelled" && eventType != "response.canceled" {
-												feat(openai): 极致优化 OAuth 链路并补齐性能守护

- 优化 /v1/responses 热路径，减少重复解析与不必要拷贝\n- 优化并发与 token 竞争路径并补齐运行指标\n- 补充 OpenAI/Ops 相关单元测试与回归用例\n- 新增灰度阈值守护与压测脚本，支撑发布验收

											
										
										
											2026-02-12 09:41:37 +08:00
+										return
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									}
-												feat(openai): 极致优化 OAuth 链路并补齐性能守护

- 优化 /v1/responses 热路径，减少重复解析与不必要拷贝\n- 优化并发与 token 竞争路径并补齐运行指标\n- 补充 OpenAI/Ops 相关单元测试与回归用例\n- 新增灰度阈值守护与压测脚本，支撑发布验收

											
										
										
											2026-02-12 09:41:37 +08:00
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+									usage.InputTokens = int(gjson.GetBytes(data, "response.usage.input_tokens").Int())
 									usage.OutputTokens = int(gjson.GetBytes(data, "response.usage.output_tokens").Int())
 									usage.CacheReadInputTokens = int(gjson.GetBytes(data, "response.usage.input_tokens_details.cached_tokens").Int())
-												feat(openai): 同步生图 API 支持并接入图片计费调度

- 同步 OpenAI 图片生成与编辑接口
- 接入图片请求解析、账号调度、转发与用量记录
- 接入图片计费与图片用量落库
- 限制 OAuth 生图仅支持无显式模型和尺寸的基础请求

											
										
										
											2026-04-22 12:30:08 +08:00
+									usage.ImageOutputTokens = int(gjson.GetBytes(data, "response.usage.output_tokens_details.image_tokens").Int())
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+								}
 								func extractOpenAIUsageFromJSONBytes(body []byte) (OpenAIUsage, bool) {
 									if len(body) == 0 || !gjson.ValidBytes(body) {
 										return OpenAIUsage{}, false
 									}
 									values := gjson.GetManyBytes(
 										body,
 										"usage.input_tokens",
 										"usage.output_tokens",
 										"usage.input_tokens_details.cached_tokens",
-												feat(openai): 同步生图 API 支持并接入图片计费调度

- 同步 OpenAI 图片生成与编辑接口
- 接入图片请求解析、账号调度、转发与用量记录
- 接入图片计费与图片用量落库
- 限制 OAuth 生图仅支持无显式模型和尺寸的基础请求

											
										
										
											2026-04-22 12:30:08 +08:00
+										"usage.output_tokens_details.image_tokens",
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+									)
 									return OpenAIUsage{
 										InputTokens:          int(values[0].Int()),
 										OutputTokens:         int(values[1].Int()),
 										CacheReadInputTokens: int(values[2].Int()),
-												feat(openai): 同步生图 API 支持并接入图片计费调度

- 同步 OpenAI 图片生成与编辑接口
- 接入图片请求解析、账号调度、转发与用量记录
- 接入图片计费与图片用量落库
- 限制 OAuth 生图仅支持无显式模型和尺寸的基础请求

											
										
										
											2026-04-22 12:30:08 +08:00
+										ImageOutputTokens:    int(values[3].Int()),
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+									}, true
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+								}
-												refactor: 调整项目结构为单向依赖

											
										
										
											2025-12-26 15:40:24 +08:00
+								func (s *OpenAIGatewayService) handleNonStreamingResponse(ctx context.Context, resp *http.Response, c *gin.Context, account *Account, originalModel, mappedModel string) (*OpenAIUsage, error) {
-												refactor: extract ReadUpstreamResponseBody to deduplicate upstream response read + too-large error handling

Consolidates 9 call sites of resolveUpstreamResponseReadLimit + readUpstreamResponseBodyLimited + ErrUpstreamResponseBodyTooLarge error handling into a single ReadUpstreamResponseBody function with TooLargeWriter callback for API-format-specific error responses (Anthropic, OpenAI, countTokens).

											
										
										
											2026-04-16 01:53:22 +08:00
+									body, err := ReadUpstreamResponseBody(resp.Body, s.cfg, c, openAITooLargeError)
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									if err != nil {
 										return nil, err
 									}
-												fix: 非流式响应路径扩展SSE检测至所有账号类型 (#1493)

当上游返回SSE格式响应(如sub2api链路)时，API Key账号的非流式路径
未检测SSE，导致终态事件中空output直接透传给客户端。

- 将Content-Type SSE检测从仅OAuth扩展至所有账号类型
- 重命名handleOAuthSSEToJSON为handleSSEToJSON（无OAuth专属逻辑）
- 为透传路径新增handlePassthroughSSEToJSON，支持SSE转JSON及空output重建

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

											
										
										
											2026-04-07 22:49:14 +08:00
+									// Detect SSE responses for ALL account types via Content-Type header.
 									// Some OpenAI-compatible upstreams (including other sub2api instances)
 									// may return SSE even when stream=false was requested.
 									if isEventStreamResponse(resp.Header) {
 										return s.handleSSEToJSON(resp, c, body, originalModel, mappedModel)
 									}
 									// For OAuth accounts, also fall back to a body-content heuristic because
 									// the upstream may omit the Content-Type header while still sending SSE.
 									// This heuristic is NOT applied to API-key accounts to avoid false
 									// positives on JSON responses that coincidentally contain "data:" or
 									// "event:" in their text content.
-												Fix Codex OAuth tool mapping

											
										
										
											2026-01-09 18:35:58 +08:00
+									if account.Type == AccountTypeOAuth {
 										bodyLooksLikeSSE := bytes.Contains(body, []byte("data:")) || bytes.Contains(body, []byte("event:"))
-												fix: 非流式响应路径扩展SSE检测至所有账号类型 (#1493)

当上游返回SSE格式响应(如sub2api链路)时，API Key账号的非流式路径
未检测SSE，导致终态事件中空output直接透传给客户端。

- 将Content-Type SSE检测从仅OAuth扩展至所有账号类型
- 重命名handleOAuthSSEToJSON为handleSSEToJSON（无OAuth专属逻辑）
- 为透传路径新增handlePassthroughSSEToJSON，支持SSE转JSON及空output重建

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

											
										
										
											2026-04-07 22:49:14 +08:00
+										if bodyLooksLikeSSE {
 											return s.handleSSEToJSON(resp, c, body, originalModel, mappedModel)
-												Fix Codex OAuth tool mapping

											
										
										
											2026-01-09 18:35:58 +08:00
+										}
 									}
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+									usageValue, usageOK := extractOpenAIUsageFromJSONBytes(body)
 									if !usageOK {
 										return nil, fmt.Errorf("parse response: invalid json response")
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									}
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+									usage := &usageValue
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
 									// Replace model in response if needed
 									if originalModel != mappedModel {
 										body = s.replaceModelInResponseBody(body, mappedModel, originalModel)
 									}
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+									responseheaders.WriteFilteredHeaders(c.Writer.Header(), resp.Header, s.responseHeaderFilter)
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
-												feat(安全): 添加安全开关并完善测试流程

实现安全开关默认关闭与响应头透传逻辑
- URL 校验与响应头过滤支持开关并覆盖流式路径
- 非流式 Content-Type 透传/默认值按配置生效
- 接入 go test、golangci-lint 与前端 lint/typecheck
- 补充相关测试与配置/文档说明

											
										
										
											2026-01-05 13:54:43 +08:00
+									contentType := "application/json"
 									if s.cfg != nil && !s.cfg.Security.ResponseHeaders.Enabled {
 										if upstreamType := resp.Header.Get("Content-Type"); upstreamType != "" {
 											contentType = upstreamType
 										}
 									}
 									c.Data(resp.StatusCode, contentType, body)
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
 									return usage, nil
 								}
-												Fix Codex OAuth tool mapping

											
										
										
											2026-01-09 18:35:58 +08:00
 								// isEventStreamResponse reports whether the Content-Type value in header
 								// contains "text/event-stream". The header value is lowercased first, so the
 								// match is case-insensitive and tolerates trailing parameters such as a charset.
+								func isEventStreamResponse(header http.Header) bool {
 									contentType := strings.ToLower(header.Get("Content-Type"))
 									return strings.Contains(contentType, "text/event-stream")
 								}
-												fix: 非流式响应路径扩展SSE检测至所有账号类型 (#1493)

当上游返回SSE格式响应(如sub2api链路)时，API Key账号的非流式路径
未检测SSE，导致终态事件中空output直接透传给客户端。

- 将Content-Type SSE检测从仅OAuth扩展至所有账号类型
- 重命名handleOAuthSSEToJSON为handleSSEToJSON（无OAuth专属逻辑）
- 为透传路径新增handlePassthroughSSEToJSON，支持SSE转JSON及空output重建

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

											
										
										
											2026-04-07 22:49:14 +08:00
+								func (s *OpenAIGatewayService) handleSSEToJSON(resp *http.Response, c *gin.Context, body []byte, originalModel, mappedModel string) (*OpenAIUsage, error) {
-												Fix Codex OAuth tool mapping

											
										
										
											2026-01-09 18:35:58 +08:00
+									bodyText := string(body)
 									finalResponse, ok := extractCodexFinalResponse(bodyText)
 									usage := &OpenAIUsage{}
 									if ok {
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+										if parsedUsage, parsed := extractOpenAIUsageFromJSONBytes(finalResponse); parsed {
 											*usage = parsedUsage
-												Fix Codex OAuth tool mapping

											
										
										
											2026-01-09 18:35:58 +08:00
+										}
-												fix: 非流式路径在上游终态事件output为空时从delta事件重建响应内容

上游API近期更新后，response.completed终态SSE事件的output字段可能为空，
实际内容仅通过response.output_text.delta等增量事件下发。流式路径不受影响，
但chat_completions非流式路径和responses OAuth非流式路径只依赖终态事件的
output，导致返回空响应。

新增BufferedResponseAccumulator累积器，在SSE扫描过程中收集delta事件内容
（文本、function_call、reasoning），当终态output为空时补充重建。

同时修复handleChatBufferedStreamingResponse遗漏response.done事件类型的问题。

											
										
										
											2026-04-07 19:30:45 +08:00
+										// When the terminal event has an empty output array, reconstruct
 										// output from accumulated delta events so the client gets full content.
 										// gjson Array() returns empty slice for null, missing, or empty arrays.
 										if len(gjson.GetBytes(finalResponse, "output").Array()) == 0 {
 											if outputJSON, reconstructed := reconstructResponseOutputFromSSE(bodyText); reconstructed {
 												if patched, err := sjson.SetRawBytes(finalResponse, "output", outputJSON); err == nil {
 													finalResponse = patched
 												}
 											}
 										}
-												Fix Codex OAuth tool mapping

											
										
										
											2026-01-09 18:35:58 +08:00
+										body = finalResponse
 										if originalModel != mappedModel {
 											body = s.replaceModelInResponseBody(body, mappedModel, originalModel)
 										}
-												feat(openai): 添加Codex工具调用自动修正功能

实现了完整的Codex工具调用拦截和自动修正系统，解决OpenCode使用Codex模型时的工具调用兼容性问题。

**核心功能:**

1. **工具名称自动映射**
   - apply_patch/applyPatch → edit
   - update_plan/updatePlan → todowrite
   - read_plan/readPlan → todoread
   - search_files/searchFiles → grep
   - list_files/listFiles → glob
   - read_file/readFile → read
   - write_file/writeFile → write
   - execute_bash/executeBash/exec_bash/execBash → bash

2. **工具参数自动修正**
   - bash: 自动移除不支持的 workdir/work_dir 参数
   - edit: 自动将 path 参数重命名为 file_path
   - 支持 JSON 字符串和对象两种参数格式

3. **流式响应集成**
   - 在 SSE 数据流中实时修正工具调用
   - 支持多种 JSON 结构（tool_calls, function_call, delta, choices等）
   - 不影响响应性能和用户体验

4. **统计和监控**
   - 记录每次工具修正的详细信息
   - 提供修正统计数据查询
   - 便于问题排查和性能优化

**实现文件:**
- `openai_tool_corrector.go`: 工具修正核心逻辑（250行）
- `openai_tool_corrector_test.go`: 完整的单元测试（380+行）
- `openai_gateway_service.go`: 流式响应集成
- `openai_gateway_service_tool_correction_test.go`: 集成测试

**测试覆盖:**
- 工具名称映射测试（18个映射规则）
- 参数修正测试（bash workdir、edit path等）
- SSE数据修正测试（多种JSON结构）
- 统计功能测试
- 所有测试通过 ✅

**解决的问题:**
修复了 OpenCode 使用 sub2api 中转 Codex 时，因工具名称和参数不兼容导致的工具调用失败问题。
Codex 模型有时会忽略指令文件中的工具映射说明，导致调用不存在的工具（如 apply_patch）。
现在通过流式响应拦截，自动将错误的工具调用修正为 OpenCode 兼容的格式。

**参考文档:**
- OpenCode 工具规范: https://opencode.ai/docs/
- Codex Bridge 指令: backend/internal/service/prompts/codex_opencode_bridge.txt

											
										
										
											2026-01-15 23:52:50 +08:00
+										// Correct tool calls in final response
 										body = s.correctToolCallsInResponseBody(body)
-												Fix Codex OAuth tool mapping

											
										
										
											2026-01-09 18:35:58 +08:00
+									} else {
-												fix(openai): 统一专属倍率计费链路并补齐回归测试

抽取共享的用户分组专属倍率解析器，统一缓存、singleflight 与回退逻辑。\n\n让 OpenAI 独立计费链路复用专属倍率解析，修复 usage 记录与实际扣费未命中用户专属倍率的问题。\n\n补齐 OpenAI 计费与解析器单元测试，并修复全量回归中暴露的 lint 阻塞项。\n\nCo-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-03-06 14:54:52 +08:00
+										terminalType, terminalPayload, terminalOK := extractOpenAISSETerminalEvent(bodyText)
 										if terminalOK && terminalType == "response.failed" {
 											msg := extractOpenAISSEErrorMessage(terminalPayload)
 											if msg == "" {
 												msg = "Upstream compact response failed"
 											}
 											return nil, s.writeOpenAINonStreamingProtocolError(resp, c, msg)
 										}
-												Fix Codex OAuth tool mapping

											
										
										
											2026-01-09 18:35:58 +08:00
+										usage = s.parseSSEUsageFromBody(bodyText)
 										if originalModel != mappedModel {
 											bodyText = s.replaceModelInSSEBody(bodyText, mappedModel, originalModel)
 										}
 										body = []byte(bodyText)
 									}
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+									responseheaders.WriteFilteredHeaders(c.Writer.Header(), resp.Header, s.responseHeaderFilter)
-												Fix Codex OAuth tool mapping

											
										
										
											2026-01-09 18:35:58 +08:00
 									contentType := "application/json; charset=utf-8"
 									if !ok {
 										contentType = resp.Header.Get("Content-Type")
 										if contentType == "" {
 											contentType = "text/event-stream"
 										}
 									}
 									c.Data(resp.StatusCode, contentType, body)
 									return usage, nil
 								}
-												fix(openai): 统一专属倍率计费链路并补齐回归测试

抽取共享的用户分组专属倍率解析器，统一缓存、singleflight 与回退逻辑。\n\n让 OpenAI 独立计费链路复用专属倍率解析，修复 usage 记录与实际扣费未命中用户专属倍率的问题。\n\n补齐 OpenAI 计费与解析器单元测试，并修复全量回归中暴露的 lint 阻塞项。\n\nCo-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-03-06 14:54:52 +08:00
+								func extractOpenAISSETerminalEvent(body string) (string, []byte, bool) {
 									lines := strings.Split(body, "\n")
 									for _, line := range lines {
 										data, ok := extractOpenAISSEDataLine(line)
 										if !ok || data == "" || data == "[DONE]" {
 											continue
 										}
 										eventType := strings.TrimSpace(gjson.Get(data, "type").String())
 										switch eventType {
-												fix(openai): tighten responses stream account tests

											
										
										
											2026-04-25 16:56:50 +08:00
+										case "response.completed", "response.done", "response.failed", "response.incomplete", "response.cancelled", "response.canceled":
-												fix(openai): 统一专属倍率计费链路并补齐回归测试

抽取共享的用户分组专属倍率解析器，统一缓存、singleflight 与回退逻辑。\n\n让 OpenAI 独立计费链路复用专属倍率解析，修复 usage 记录与实际扣费未命中用户专属倍率的问题。\n\n补齐 OpenAI 计费与解析器单元测试，并修复全量回归中暴露的 lint 阻塞项。\n\nCo-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-03-06 14:54:52 +08:00
+											return eventType, []byte(data), true
 										}
 									}
 									return "", nil, false
 								}
 								// extractOpenAISSEErrorMessage pulls an error message out of an SSE event
 								// payload. It probes a fixed list of JSON paths in priority order and returns
 								// the first non-blank value; when none match it defers to
 								// extractUpstreamErrorMessage. Any message found is passed through
 								// sanitizeUpstreamErrorMessage. An empty payload yields "".
 								func extractOpenAISSEErrorMessage(payload []byte) string {
 									if len(payload) == 0 {
 										return ""
 									}
 									candidatePaths := [...]string{"response.error.message", "error.message", "message"}
 									for i := range candidatePaths {
 										found := gjson.GetBytes(payload, candidatePaths[i]).String()
 										found = strings.TrimSpace(found)
 										if found == "" {
 											continue
 										}
 										return sanitizeUpstreamErrorMessage(found)
 									}
 									// None of the known paths carried a message: use the generic extractor.
 									fallback := strings.TrimSpace(extractUpstreamErrorMessage(payload))
 									return sanitizeUpstreamErrorMessage(fallback)
 								}
 								// writeOpenAINonStreamingProtocolError reports a protocol-level failure of a
 								// non-streaming upstream response to the client as HTTP 502 with an
 								// "upstream_error" JSON body, and returns an error carrying the same message.
 								//
 								// The message is trimmed and sanitized first; a blank result is replaced by a
 								// generic default. The failure is recorded via setOpsUpstreamError, and the
 								// filtered upstream headers are copied before Content-Type is set to JSON.
 								func (s *OpenAIGatewayService) writeOpenAINonStreamingProtocolError(resp *http.Response, c *gin.Context, message string) error {
 									const fallbackMessage = "Upstream returned an invalid non-streaming response"
 
 									message = sanitizeUpstreamErrorMessage(strings.TrimSpace(message))
 									if message == "" {
 										message = fallbackMessage
 									}
 									errorBody := gin.H{
 										"error": gin.H{
 											"type":    "upstream_error",
 											"message": message,
 										},
 									}
 
 									setOpsUpstreamError(c, http.StatusBadGateway, message, "")
 									header := c.Writer.Header()
 									responseheaders.WriteFilteredHeaders(header, resp.Header, s.responseHeaderFilter)
 									// Set after copying upstream headers so the JSON content type wins.
 									header.Set("Content-Type", "application/json; charset=utf-8")
 									c.JSON(http.StatusBadGateway, errorBody)
 									return fmt.Errorf("non-streaming openai protocol error: %s", message)
 								}
-												Fix Codex OAuth tool mapping

											
										
										
											2026-01-09 18:35:58 +08:00
+								func extractCodexFinalResponse(body string) ([]byte, bool) {
 									lines := strings.Split(body, "\n")
 									for _, line := range lines {
-												feat(openai): 极致优化 OAuth 链路并补齐性能守护

- 优化 /v1/responses 热路径，减少重复解析与不必要拷贝\n- 优化并发与 token 竞争路径并补齐运行指标\n- 补充 OpenAI/Ops 相关单元测试与回归用例\n- 新增灰度阈值守护与压测脚本，支撑发布验收

											
										
										
											2026-02-12 09:41:37 +08:00
+										data, ok := extractOpenAISSEDataLine(line)
 										if !ok {
-												Fix Codex OAuth tool mapping

											
										
										
											2026-01-09 18:35:58 +08:00
+											continue
 										}
 										if data == "" || data == "[DONE]" {
 											continue
 										}
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+										eventType := gjson.Get(data, "type").String()
 										if eventType == "response.done" || eventType == "response.completed" {
 											if response := gjson.Get(data, "response"); response.Exists() && response.Type == gjson.JSON && response.Raw != "" {
 												return []byte(response.Raw), true
-												Fix Codex OAuth tool mapping

											
										
										
											2026-01-09 18:35:58 +08:00
+											}
 										}
 									}
 									return nil, false
 								}
-												fix: 非流式路径在上游终态事件output为空时从delta事件重建响应内容

上游API近期更新后，response.completed终态SSE事件的output字段可能为空，
实际内容仅通过response.output_text.delta等增量事件下发。流式路径不受影响，
但chat_completions非流式路径和responses OAuth非流式路径只依赖终态事件的
output，导致返回空响应。

新增BufferedResponseAccumulator累积器，在SSE扫描过程中收集delta事件内容
（文本、function_call、reasoning），当终态output为空时补充重建。

同时修复handleChatBufferedStreamingResponse遗漏response.done事件类型的问题。

											
										
										
											2026-04-07 19:30:45 +08:00
+								// reconstructResponseOutputFromSSE scans raw SSE body text for delta events and
 								// returns a JSON-encoded output array reconstructed from accumulated deltas.
 								// Returns (nil, false) if no content was found in deltas.
 								func reconstructResponseOutputFromSSE(bodyText string) ([]byte, bool) {
 									acc := apicompat.NewBufferedResponseAccumulator()
-												fix: bridge codex image generation over responses

											
										
										
											2026-04-23 15:13:57 +00:00
+									imageOutputs := make([]json.RawMessage, 0, 1)
 									seenImages := make(map[string]struct{})
-												fix: 非流式路径在上游终态事件output为空时从delta事件重建响应内容

上游API近期更新后，response.completed终态SSE事件的output字段可能为空，
实际内容仅通过response.output_text.delta等增量事件下发。流式路径不受影响，
但chat_completions非流式路径和responses OAuth非流式路径只依赖终态事件的
output，导致返回空响应。

新增BufferedResponseAccumulator累积器，在SSE扫描过程中收集delta事件内容
（文本、function_call、reasoning），当终态output为空时补充重建。

同时修复handleChatBufferedStreamingResponse遗漏response.done事件类型的问题。

											
										
										
											2026-04-07 19:30:45 +08:00
+									lines := strings.Split(bodyText, "\n")
 									for _, line := range lines {
 										data, ok := extractOpenAISSEDataLine(line)
 										if !ok || data == "" || data == "[DONE]" {
 											continue
 										}
-												fix: bridge codex image generation over responses

											
										
										
											2026-04-23 15:13:57 +00:00
+										if imageOutput, ok := extractImageGenerationOutputFromSSEData([]byte(data), seenImages); ok {
 											imageOutputs = append(imageOutputs, imageOutput)
 										}
-												fix: 非流式路径在上游终态事件output为空时从delta事件重建响应内容

上游API近期更新后，response.completed终态SSE事件的output字段可能为空，
实际内容仅通过response.output_text.delta等增量事件下发。流式路径不受影响，
但chat_completions非流式路径和responses OAuth非流式路径只依赖终态事件的
output，导致返回空响应。

新增BufferedResponseAccumulator累积器，在SSE扫描过程中收集delta事件内容
（文本、function_call、reasoning），当终态output为空时补充重建。

同时修复handleChatBufferedStreamingResponse遗漏response.done事件类型的问题。

											
										
										
											2026-04-07 19:30:45 +08:00
+										var event apicompat.ResponsesStreamEvent
 										if err := json.Unmarshal([]byte(data), &event); err != nil {
 											continue
 										}
 										acc.ProcessEvent(&event)
 									}
-												fix: bridge codex image generation over responses

											
										
										
											2026-04-23 15:13:57 +00:00
+									if !acc.HasContent() && len(imageOutputs) == 0 {
-												fix: 非流式路径在上游终态事件output为空时从delta事件重建响应内容

上游API近期更新后，response.completed终态SSE事件的output字段可能为空，
实际内容仅通过response.output_text.delta等增量事件下发。流式路径不受影响，
但chat_completions非流式路径和responses OAuth非流式路径只依赖终态事件的
output，导致返回空响应。

新增BufferedResponseAccumulator累积器，在SSE扫描过程中收集delta事件内容
（文本、function_call、reasoning），当终态output为空时补充重建。

同时修复handleChatBufferedStreamingResponse遗漏response.done事件类型的问题。

											
										
										
											2026-04-07 19:30:45 +08:00
+										return nil, false
 									}
-												fix: bridge codex image generation over responses

											
										
										
											2026-04-23 15:13:57 +00:00
 									var output []json.RawMessage
 									if acc.HasContent() {
 										outputJSON, err := json.Marshal(acc.BuildOutput())
-												fix(openai): preserve image outputs when text content serialization fails

In reconstructResponseOutputFromSSE, text content Marshal/Unmarshal
failure previously caused an early return that silently discarded
already-extracted image_generation_call outputs. Now serialization
errors are tolerated so image results still reach the client.

											
										
										
											2026-04-24 08:58:51 +08:00
+										if err == nil {
 											_ = json.Unmarshal(outputJSON, &output)
-												fix: bridge codex image generation over responses

											
										
										
											2026-04-23 15:13:57 +00:00
+										}
 									}
 									output = append(output, imageOutputs...)
-												fix(openai): preserve image outputs when text content serialization fails

In reconstructResponseOutputFromSSE, text content Marshal/Unmarshal
failure previously caused an early return that silently discarded
already-extracted image_generation_call outputs. Now serialization
errors are tolerated so image results still reach the client.

											
										
										
											2026-04-24 08:58:51 +08:00
+									if len(output) == 0 {
 										return nil, false
 									}
-												fix: bridge codex image generation over responses

											
										
										
											2026-04-23 15:13:57 +00:00
-												fix: 非流式路径在上游终态事件output为空时从delta事件重建响应内容

上游API近期更新后，response.completed终态SSE事件的output字段可能为空，
实际内容仅通过response.output_text.delta等增量事件下发。流式路径不受影响，
但chat_completions非流式路径和responses OAuth非流式路径只依赖终态事件的
output，导致返回空响应。

新增BufferedResponseAccumulator累积器，在SSE扫描过程中收集delta事件内容
（文本、function_call、reasoning），当终态output为空时补充重建。

同时修复handleChatBufferedStreamingResponse遗漏response.done事件类型的问题。

											
										
										
											2026-04-07 19:30:45 +08:00
+									outputJSON, err := json.Marshal(output)
 									if err != nil {
 										return nil, false
 									}
 									return outputJSON, true
 								}
-												fix: bridge codex image generation over responses

											
										
										
											2026-04-23 15:13:57 +00:00
 								// extractImageGenerationOutputFromSSEData returns the raw "item" object of a
 								// "response.output_item.done" SSE event when that item is an
 								// "image_generation_call" with a non-blank "result".
 								//
 								// It returns (nil, false) when data is empty or not valid JSON, when the event
 								// type or item type does not match, when the result is blank, or when the item
 								// was already recorded in seen. A nil seen map disables de-duplication.
+								func extractImageGenerationOutputFromSSEData(data []byte, seen map[string]struct{}) (json.RawMessage, bool) {
 									if len(data) == 0 || !gjson.ValidBytes(data) {
 										return nil, false
 									}
 									if gjson.GetBytes(data, "type").String() != "response.output_item.done" {
 										return nil, false
 									}
 									item := gjson.GetBytes(data, "item")
 									if !item.Exists() || !item.IsObject() || item.Get("type").String() != "image_generation_call" {
 										return nil, false
 									}
 									if strings.TrimSpace(item.Get("result").String()) == "" {
 										return nil, false
 									}
 									// De-duplication key: the item id when present, otherwise the
 									// output format combined with the result payload itself.
 									key := strings.TrimSpace(item.Get("id").String())
 									if key == "" {
 										key = strings.TrimSpace(item.Get("output_format").String()) + "|" + strings.TrimSpace(item.Get("result").String())
 									}
 									if key != "" && seen != nil {
 										if _, exists := seen[key]; exists {
 											return nil, false
 										}
 										seen[key] = struct{}{}
 									}
 									return json.RawMessage(item.Raw), true
 								}
-												Fix Codex OAuth tool mapping

											
										
										
											2026-01-09 18:35:58 +08:00
+								func (s *OpenAIGatewayService) parseSSEUsageFromBody(body string) *OpenAIUsage {
 									usage := &OpenAIUsage{}
 									lines := strings.Split(body, "\n")
 									for _, line := range lines {
-												feat(openai): 极致优化 OAuth 链路并补齐性能守护

- 优化 /v1/responses 热路径，减少重复解析与不必要拷贝\n- 优化并发与 token 竞争路径并补齐运行指标\n- 补充 OpenAI/Ops 相关单元测试与回归用例\n- 新增灰度阈值守护与压测脚本，支撑发布验收

											
										
										
											2026-02-12 09:41:37 +08:00
+										data, ok := extractOpenAISSEDataLine(line)
 										if !ok {
-												Fix Codex OAuth tool mapping

											
										
										
											2026-01-09 18:35:58 +08:00
+											continue
 										}
 										if data == "" || data == "[DONE]" {
 											continue
 										}
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+										s.parseSSEUsageBytes([]byte(data), usage)
-												Fix Codex OAuth tool mapping

											
										
										
											2026-01-09 18:35:58 +08:00
+									}
 									return usage
 								}
 								func (s *OpenAIGatewayService) replaceModelInSSEBody(body, fromModel, toModel string) string {
 									lines := strings.Split(body, "\n")
 									for i, line := range lines {
-												feat(openai): 极致优化 OAuth 链路并补齐性能守护

- 优化 /v1/responses 热路径，减少重复解析与不必要拷贝\n- 优化并发与 token 竞争路径并补齐运行指标\n- 补充 OpenAI/Ops 相关单元测试与回归用例\n- 新增灰度阈值守护与压测脚本，支撑发布验收

											
										
										
											2026-02-12 09:41:37 +08:00
+										if _, ok := extractOpenAISSEDataLine(line); !ok {
-												Fix Codex OAuth tool mapping

											
										
										
											2026-01-09 18:35:58 +08:00
+											continue
 										}
 										lines[i] = s.replaceModelInSSELine(line, fromModel, toModel)
 									}
 									return strings.Join(lines, "\n")
 								}
-												feat(安全): 强化安全策略与配置校验

- 增加 CORS/CSP/安全响应头与代理信任配置

- 引入 URL 白名单与私网开关，校验上游与价格源

- 改善 API Key 处理与网关错误返回

- 管理端设置隐藏敏感字段并优化前端提示

- 增加计费熔断与相关配置示例

测试: go test ./...

											
										
										
											2026-01-02 17:40:57 +08:00
+								func (s *OpenAIGatewayService) validateUpstreamBaseURL(raw string) (string, error) {
-												feat(安全): 添加安全开关并完善测试流程

实现安全开关默认关闭与响应头透传逻辑
- URL 校验与响应头过滤支持开关并覆盖流式路径
- 非流式 Content-Type 透传/默认值按配置生效
- 接入 go test、golangci-lint 与前端 lint/typecheck
- 补充相关测试与配置/文档说明

											
										
										
											2026-01-05 13:54:43 +08:00
+									if s.cfg != nil && !s.cfg.Security.URLAllowlist.Enabled {
-												fix(安全): 关闭白名单时保留最小校验与默认白名单

实现 allow_insecure_http 并在关闭校验时执行最小格式验证
- 关闭 allowlist 时要求 URL 可解析且 scheme 合规
- 响应头过滤关闭时使用默认白名单策略
- 更新相关文档、示例与测试覆盖

											
										
										
											2026-01-05 14:41:08 +08:00
+										normalized, err := urlvalidator.ValidateURLFormat(raw, s.cfg.Security.URLAllowlist.AllowInsecureHTTP)
 										if err != nil {
 											return "", fmt.Errorf("invalid base_url: %w", err)
 										}
 										return normalized, nil
-												feat(安全): 添加安全开关并完善测试流程

实现安全开关默认关闭与响应头透传逻辑
- URL 校验与响应头过滤支持开关并覆盖流式路径
- 非流式 Content-Type 透传/默认值按配置生效
- 接入 go test、golangci-lint 与前端 lint/typecheck
- 补充相关测试与配置/文档说明

											
										
										
											2026-01-05 13:54:43 +08:00
+									}
-												feat(安全): 强化安全策略与配置校验

- 增加 CORS/CSP/安全响应头与代理信任配置

- 引入 URL 白名单与私网开关，校验上游与价格源

- 改善 API Key 处理与网关错误返回

- 管理端设置隐藏敏感字段并优化前端提示

- 增加计费熔断与相关配置示例

测试: go test ./...

											
										
										
											2026-01-02 17:40:57 +08:00
+									normalized, err := urlvalidator.ValidateHTTPSURL(raw, urlvalidator.ValidationOptions{
 										AllowedHosts:     s.cfg.Security.URLAllowlist.UpstreamHosts,
 										RequireAllowlist: true,
 										AllowPrivate:     s.cfg.Security.URLAllowlist.AllowPrivateHosts,
 									})
 									if err != nil {
 										return "", fmt.Errorf("invalid base_url: %w", err)
 									}
 									return normalized, nil
 								}
-												feat(openai): 支持自动透传开关并透传 User-Agent

- OpenAI OAuth/API Key 统一支持自动透传开关，编辑页可开关\n- 透传模式仅替换认证并保留计费/并发/审计，修复 API Key responses 端点拼接\n- Usage 页面显示原始 User-Agent 且不截断，补充回归测试与清单

											
										
										
											2026-02-12 10:56:07 +08:00
+								// buildOpenAIResponsesURL 组装 OpenAI Responses 端点。
 								// - base 以 /v1 结尾：追加 /responses
 								// - base 已是 /responses：原样返回
 								// - 其他情况：追加 /v1/responses
 								func buildOpenAIResponsesURL(base string) string {
 									endpoint := strings.TrimSpace(base)
 									endpoint = strings.TrimRight(endpoint, "/")
 									switch {
 									case strings.HasSuffix(endpoint, "/responses"):
 										// Already points at the Responses endpoint: return it untouched.
 										return endpoint
 									case strings.HasSuffix(endpoint, "/v1"):
 										// Versioned base: only the resource segment is missing.
 										return endpoint + "/responses"
 									default:
 										// Bare host or any other path: append version and resource.
 										return endpoint + "/v1/responses"
 									}
 								}
-												fix: handle invalid encrypted content error and retry logic.

											
										
										
											2026-03-14 11:42:42 +08:00
 								// trimOpenAIEncryptedReasoningItems strips "encrypted_content" from reasoning
 								// items found under reqBody["input"], using
 								// sanitizeEncryptedReasoningInputItem for each item.
 								//
 								// The input may be a []any, a []map[string]any, or a single map[string]any;
 								// any other type is left alone. Items the sanitizer asks to drop are removed,
 								// and if nothing remains the "input" key itself is deleted from reqBody.
 								//
 								// Returns true when reqBody was modified, false otherwise (including an empty
 								// reqBody or a missing "input" key).
+								func trimOpenAIEncryptedReasoningItems(reqBody map[string]any) bool {
 									if len(reqBody) == 0 {
 										return false
 									}
 									inputValue, has := reqBody["input"]
 									if !has {
 										return false
 									}
 									switch input := inputValue.(type) {
 									case []any:
 										// Filter in place: filtered shares input's backing array.
 										filtered := input[:0]
 										changed := false
 										for _, item := range input {
 											nextItem, itemChanged, keep := sanitizeEncryptedReasoningInputItem(item)
 											if itemChanged {
 												changed = true
 											}
 											if !keep {
 												continue
 											}
 											filtered = append(filtered, nextItem)
 										}
 										if !changed {
 											return false
 										}
 										if len(filtered) == 0 {
 											// Every item was dropped: remove the key entirely.
 											delete(reqBody, "input")
 											return true
 										}
 										reqBody["input"] = filtered
 										return true
 									case []map[string]any:
 										// Same in-place filtering as above, for the typed slice form.
 										filtered := input[:0]
 										changed := false
 										for _, item := range input {
 											nextItem, itemChanged, keep := sanitizeEncryptedReasoningInputItem(item)
 											if itemChanged {
 												changed = true
 											}
 											if !keep {
 												continue
 											}
 											nextMap, ok := nextItem.(map[string]any)
 											if !ok {
 												// Sanitizer returned a non-map value: keep the original item.
 												filtered = append(filtered, item)
 												continue
 											}
 											filtered = append(filtered, nextMap)
 										}
 										if !changed {
 											return false
 										}
 										if len(filtered) == 0 {
 											delete(reqBody, "input")
 											return true
 										}
 										reqBody["input"] = filtered
 										return true
 									case map[string]any:
 										// A single input object is treated as a one-item list.
 										nextItem, changed, keep := sanitizeEncryptedReasoningInputItem(input)
 										if !changed {
 											return false
 										}
 										if !keep {
 											delete(reqBody, "input")
 											return true
 										}
 										nextMap, ok := nextItem.(map[string]any)
 										if !ok {
 											return false
 										}
 										reqBody["input"] = nextMap
 										return true
 									default:
 										return false
 									}
 								}
 								// sanitizeEncryptedReasoningInputItem removes the "encrypted_content" key from
 								// a single input item when that item is a map[string]any whose "type"
 								// (whitespace-trimmed) is "reasoning".
 								//
 								// Results:
 								//   - next:    the item to keep (the same map, mutated in place), or nil when dropped
 								//   - changed: true when "encrypted_content" was removed
 								//   - keep:    false when exactly one key is left after the removal
 								//
 								// Items of any other shape are returned untouched with changed=false, keep=true.
 								func sanitizeEncryptedReasoningInputItem(item any) (next any, changed bool, keep bool) {
 									obj, isObject := item.(map[string]any)
 									if !isObject {
 										return item, false, true
 									}
 									kind, _ := obj["type"].(string)
 									_, encrypted := obj["encrypted_content"]
 									if strings.TrimSpace(kind) != "reasoning" || !encrypted {
 										return item, false, true
 									}
 									delete(obj, "encrypted_content")
 									switch len(obj) {
 									case 1:
 										// A single remaining key means the item carries no other payload.
 										return nil, true, false
 									default:
 										return obj, true, true
 									}
 								}
-												fix(openai): support remote compact task

											
										
										
											2026-03-06 18:50:28 +08:00
 								// IsOpenAIResponsesCompactPathForTest is an exported pass-through to
 								// isOpenAIResponsesCompactPath. The ForTest suffix suggests it exists so code
 								// outside this package (presumably tests) can call the unexported helper.
+								func IsOpenAIResponsesCompactPathForTest(c *gin.Context) bool {
 									return isOpenAIResponsesCompactPath(c)
 								}
 								// OpenAICompactSessionSeedKeyForTest returns the value of the unexported
 								// openAICompactSessionSeedKey constant. The ForTest suffix suggests it exists
 								// so code outside this package (presumably tests) can read the key.
 								func OpenAICompactSessionSeedKeyForTest() string {
 									return openAICompactSessionSeedKey
 								}
 								// NormalizeOpenAICompactRequestBodyForTest is an exported pass-through to
 								// normalizeOpenAICompactRequestBody and returns its results unchanged. The
 								// ForTest suffix suggests it exists for callers outside this package
 								// (presumably tests).
 								func NormalizeOpenAICompactRequestBodyForTest(body []byte) ([]byte, bool, error) {
 									return normalizeOpenAICompactRequestBody(body)
 								}
 								// isOpenAIResponsesCompactPath reports whether the part of the request path
 								// after "/responses" (as computed by openAIResponsesRequestPathSuffix) is
 								// exactly "/compact" or begins with "/compact/".
 								func isOpenAIResponsesCompactPath(c *gin.Context) bool {
 									tail := strings.TrimSpace(openAIResponsesRequestPathSuffix(c))
 									if tail == "/compact" {
 										return true
 									}
 									return strings.HasPrefix(tail, "/compact/")
 								}
 								// normalizeOpenAICompactRequestBody rebuilds a request body so that it contains
 								// only the top-level fields "model", "input", "instructions" and
 								// "previous_response_id" (those present in body, copied as raw JSON).
 								//
 								// Returns the body to use, whether it differs from the original (compared after
 								// trimming surrounding whitespace), and an error if a field could not be set.
 								// An empty body is returned untouched; on error the original body is returned.
 								func normalizeOpenAICompactRequestBody(body []byte) ([]byte, bool, error) {
 									if len(body) == 0 {
 										return body, false, nil
 									}
 									allowedFields := [...]string{"model", "input", "instructions", "previous_response_id"}
 									compact := []byte(`{}`)
 									for _, name := range allowedFields {
 										src := gjson.GetBytes(body, name)
 										if src.Exists() {
 											patched, err := sjson.SetRawBytes(compact, name, []byte(src.Raw))
 											if err != nil {
 												return body, false, fmt.Errorf("normalize compact body %s: %w", name, err)
 											}
 											compact = patched
 										}
 									}
 									// Report "unchanged" when the rebuilt body is byte-equal to the input.
 									unchanged := bytes.Equal(bytes.TrimSpace(body), bytes.TrimSpace(compact))
 									if unchanged {
 										return body, false, nil
 									}
 									return compact, true, nil
 								}
 								// resolveOpenAICompactSessionID picks a session identifier for the request.
 								// Sources are tried in order, each whitespace-trimmed and skipped when blank:
 								// the "session_id" header, the "conversation_id" header, then a string stored
 								// in the gin context under openAICompactSessionSeedKey. If none applies, or c
 								// is nil, a freshly generated UUID string is returned.
 								func resolveOpenAICompactSessionID(c *gin.Context) string {
 									if c == nil {
 										return uuid.NewString()
 									}
 									for _, headerName := range [...]string{"session_id", "conversation_id"} {
 										if value := strings.TrimSpace(c.GetHeader(headerName)); value != "" {
 											return value
 										}
 									}
 									if raw, found := c.Get(openAICompactSessionSeedKey); found {
 										if seed, isString := raw.(string); isString {
 											if trimmed := strings.TrimSpace(seed); trimmed != "" {
 												return trimmed
 											}
 										}
 									}
 									return uuid.NewString()
 								}
 								// openAIResponsesRequestPathSuffix returns whatever follows the last
 								// "/responses" in the request URL path, after trimming surrounding whitespace
 								// and trailing slashes from the path. The result is "" when the context,
 								// request or URL is nil, when "/responses" does not occur, when nothing follows
 								// it, or when what follows does not start with "/".
 								func openAIResponsesRequestPathSuffix(c *gin.Context) string {
 									const marker = "/responses"
 									if c == nil || c.Request == nil || c.Request.URL == nil {
 										return ""
 									}
 									path := strings.TrimRight(strings.TrimSpace(c.Request.URL.Path), "/")
 									// An empty path has no marker either, so LastIndex covers that case.
 									pos := strings.LastIndex(path, marker)
 									if pos < 0 {
 										return ""
 									}
 									tail := path[pos+len(marker):]
 									switch {
 									case tail == "", tail == "/":
 										return ""
 									case !strings.HasPrefix(tail, "/"):
 										// The marker was only a prefix of a longer segment.
 										return ""
 									}
 									return tail
 								}
 								// appendOpenAIResponsesRequestPathSuffix concatenates suffix onto baseURL.
 								// baseURL is whitespace-trimmed and stripped of trailing slashes; suffix is
 								// whitespace-trimmed and appended verbatim (no separator is inserted). When
 								// either part is empty after trimming, the trimmed base alone is returned.
 								func appendOpenAIResponsesRequestPathSuffix(baseURL, suffix string) string {
 									root := strings.TrimSpace(baseURL)
 									root = strings.TrimRight(root, "/")
 									if root == "" {
 										return root
 									}
 									if tail := strings.TrimSpace(suffix); tail != "" {
 										return root + tail
 									}
 									return root
 								}
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+								func (s *OpenAIGatewayService) replaceModelInResponseBody(body []byte, fromModel, toModel string) []byte {
-												perf(service): 优化 model 替换函数，用 gjson/sjson 替代全量 JSON 序列化

SSE 热路径中 replaceModelInSSELine 和 replaceModelInResponseBody 原来
使用 json.Unmarshal/Marshal 对每个事件做全量反序列化再序列化，现改为
gjson.Get/sjson.Set 精确字段操作，消除 O(n) 中间 map 分配，保持 JSON
字段顺序不变。涉及 OpenAIGatewayService 和 GatewayService 两个服务。

新增 23 个单元测试覆盖：顶层/嵌套 model 替换、不匹配跳过、空行/[DONE]/
非法 JSON 等边界情况。

Fixes: P1-08

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-07 17:09:55 +08:00
+									// 使用 gjson/sjson 精确替换 model 字段，避免全量 JSON 反序列化
 									if m := gjson.GetBytes(body, "model"); m.Exists() && m.Str == fromModel {
 										newBody, err := sjson.SetBytes(body, "model", toModel)
 										if err != nil {
 											return body
 										}
 										return newBody
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									}
-												perf(service): 优化 model 替换函数，用 gjson/sjson 替代全量 JSON 序列化

SSE 热路径中 replaceModelInSSELine 和 replaceModelInResponseBody 原来
使用 json.Unmarshal/Marshal 对每个事件做全量反序列化再序列化，现改为
gjson.Get/sjson.Set 精确字段操作，消除 O(n) 中间 map 分配，保持 JSON
字段顺序不变。涉及 OpenAIGatewayService 和 GatewayService 两个服务。

新增 23 个单元测试覆盖：顶层/嵌套 model 替换、不匹配跳过、空行/[DONE]/
非法 JSON 等边界情况。

Fixes: P1-08

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-07 17:09:55 +08:00
+									return body
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+								}
 								// OpenAIRecordUsageInput input for recording usage
 								type OpenAIRecordUsageInput struct {
-												feat: decouple billing correctness from usage log batching

											
										
										
											2026-03-12 16:53:18 +08:00
+									Result             *OpenAIForwardResult
 									APIKey             *APIKey
 									User               *User
 									Account            *Account
 									Subscription       *UserSubscription
-												feat: 完善使用记录端点可观测性与分布统计

将入站、上游与路径三类端点分布统一到使用记录页的一致化卡片交互中，并补齐端点元数据与统计链路，提升排障与流量分析效率。

											
										
										
											2026-03-15 11:26:42 +08:00
+									InboundEndpoint    string
 									UpstreamEndpoint   string
-												feat: decouple billing correctness from usage log batching

											
										
										
											2026-03-12 16:53:18 +08:00
+									UserAgent          string // 请求的 User-Agent
 									IPAddress          string // 请求的客户端 IP 地址
 									RequestPayloadHash string
 									APIKeyService      APIKeyQuotaUpdater
-												feat(channel): 渠道管理全链路集成 — 模型映射、定价、限制、用量统计

- 渠道模型映射：支持精确匹配和通配符映射，按平台隔离
- 渠道模型定价：支持 token/按次/图片三种计费模式，区间分层定价
- 模型限制：渠道可限制仅允许定价列表中的模型
- 计费模型来源：支持 requested/upstream 两种计费模型选择
- 用量统计：usage_logs 新增 channel_id/model_mapping_chain/billing_tier/billing_mode 字段
- Dashboard 支持 model_source 维度（requested/upstream/mapping）查看模型统计
- 全部 gateway handler 统一接入 ResolveChannelMappingAndRestrict
- 修复测试：同步 SoraGenerationRepository 接口、SQL INSERT 参数、scan 字段

											
										
										
											2026-04-01 01:51:19 +08:00
+									ChannelUsageFields
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+								}
 								// RecordUsage records usage and deducts balance
 								func (s *OpenAIGatewayService) RecordUsage(ctx context.Context, input *OpenAIRecordUsageInput) error {
 									result := input.Result
-												修改403逻辑:  先临时冷却，再根据连续次数决定是否判坏号

											
										
										
											2026-04-23 12:58:13 +08:00
+									if s.rateLimitService != nil && input != nil && input.Account != nil && input.Account.Platform == PlatformOpenAI {
 										s.rateLimitService.ResetOpenAI403Counter(ctx, input.Account.ID)
 									}
-												fix: 修复gpt->claude转换无法命中codex缓存问题

											
										
										
											2026-03-09 15:08:37 +08:00
 									// 跳过所有 token 均为零的用量记录——上游未返回 usage 时不应写入数据库
 									if result.Usage.InputTokens == 0 && result.Usage.OutputTokens == 0 &&
-												feat(openai): 同步生图 API 支持并接入图片计费调度

- 同步 OpenAI 图片生成与编辑接口
- 接入图片请求解析、账号调度、转发与用量记录
- 接入图片计费与图片用量落库
- 限制 OAuth 生图仅支持无显式模型和尺寸的基础请求

											
										
										
											2026-04-22 12:30:08 +08:00
+										result.Usage.CacheCreationInputTokens == 0 && result.Usage.CacheReadInputTokens == 0 &&
 										result.Usage.ImageOutputTokens == 0 && result.ImageCount == 0 {
-												fix: 修复gpt->claude转换无法命中codex缓存问题

											
										
										
											2026-03-09 15:08:37 +08:00
+										return nil
 									}
-												fix(lint): 修复所有 Go 命名规范问题

- 全局替换 ApiKey → APIKey（类型、字段、方法、变量）
- 修复所有 initialism 命名（API, SMTP, HTML, URL 等）
- 添加所有缺失的包注释
- 修复导出符号的注释格式

主要修改：
- ApiKey → APIKey（所有出现的地方）
- ApiKeyID → APIKeyID
- ApiKeyIDs → APIKeyIDs
- TestSmtpConnection → TestSMTPConnection
- HtmlURL → HTMLURL
- 添加 20+ 个包注释
- 修复 10+ 个导出符号注释格式

验证结果：
- ✓ golangci-lint: 0 issues
- ✓ 单元测试: 通过
- ✓ 集成测试: 通过

											
										
										
											2026-01-04 19:27:53 +08:00
+									apiKey := input.APIKey
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									user := input.User
 									account := input.Account
 									subscription := input.Subscription
-												feat: 平台图标与计费修复

- fix(billing): 修复 OpenAI 兼容 API 缓存 token 重复计费问题
- fix(auth): 隐藏数据库错误详情，返回通用服务不可用错误
- feat(ui): 新增 PlatformIcon 组件，GroupBadge 支持平台颜色区分
- feat(ui): 账号管理新增重置状态按钮，重授权后自动清除错误
- feat(ui): 分组管理新增计费类型列，显示订阅限额信息
- ui: 首页 GPT 状态改为已支持

											
										
										
											2025-12-23 10:01:58 +08:00
+									// 计算实际的新输入token（减去缓存读取的token）
 									// 因为 input_tokens 包含了 cache_read_tokens，而缓存读取的token不应按输入价格计费
 									actualInputTokens := result.Usage.InputTokens - result.Usage.CacheReadInputTokens
 									if actualInputTokens < 0 {
 										actualInputTokens = 0
 									}
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									// Calculate cost
 									tokens := UsageTokens{
-												feat: 平台图标与计费修复

- fix(billing): 修复 OpenAI 兼容 API 缓存 token 重复计费问题
- fix(auth): 隐藏数据库错误详情，返回通用服务不可用错误
- feat(ui): 新增 PlatformIcon 组件，GroupBadge 支持平台颜色区分
- feat(ui): 账号管理新增重置状态按钮，重授权后自动清除错误
- feat(ui): 分组管理新增计费类型列，显示订阅限额信息
- ui: 首页 GPT 状态改为已支持

											
										
										
											2025-12-23 10:01:58 +08:00
+										InputTokens:         actualInputTokens,
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+										OutputTokens:        result.Usage.OutputTokens,
 										CacheCreationTokens: result.Usage.CacheCreationInputTokens,
 										CacheReadTokens:     result.Usage.CacheReadInputTokens,
-												feat: image output token billing, channel-mapped billing source, credits balance precheck

- Parse candidatesTokensDetails from Gemini API to separate image/text output tokens
- Add image_output_tokens and image_output_cost to usage_log (migration 089)
- Support per-image-token pricing via output_cost_per_image_token from model pricing data
- Channel pricing ImageOutputPrice override works in token billing mode
- Auto-fill image_output_price in channel pricing form from model defaults
- Add "channel_mapped" billing model source as new default (migration 088)
- Bills by model name after channel mapping, before account mapping
- Fix channel cache error TTL sign error (115s → 5s)
- Fix Update channel only invalidating new groups, not removed groups
- Fix frontend model_mapping clearing sending undefined instead of {}
- Credits balance precheck via shared AccountUsageService cache before injection
- Skip credits injection for accounts with insufficient balance
- Don't mark credits exhausted for "exhausted your capacity on this model" 429s

											
										
										
											2026-04-01 15:08:57 +08:00
+										ImageOutputTokens:   result.Usage.ImageOutputTokens,
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									}
 									// Get rate multiplier
-												fix: address audit findings - cache sync, validation, consistency

- clearCreditsExhausted: sync Redis scheduler cache after DB update
- Image billing mode UI: write to per_request_price instead of image_output_price
- OpenAI RecordUsage: use BillingModelSourceRequested constant, add s.cfg nil guard
- Fix i18n key path: admin.channels.perRequestPriceRequired → admin.channels.form.perRequestPriceRequired

											
										
										
											2026-04-01 23:13:58 +08:00
+									multiplier := 1.0
 									if s.cfg != nil {
 										multiplier = s.cfg.Default.RateMultiplier
 									}
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									if apiKey.GroupID != nil && apiKey.Group != nil {
-												fix(openai): 统一专属倍率计费链路并补齐回归测试

抽取共享的用户分组专属倍率解析器，统一缓存、singleflight 与回退逻辑。\n\n让 OpenAI 独立计费链路复用专属倍率解析，修复 usage 记录与实际扣费未命中用户专属倍率的问题。\n\n补齐 OpenAI 计费与解析器单元测试，并修复全量回归中暴露的 lint 阻塞项。\n\nCo-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-03-06 14:54:52 +08:00
+										resolver := s.userGroupRateResolver
 										if resolver == nil {
 											resolver = newUserGroupRateResolver(nil, nil, resolveUserGroupRateCacheTTL(s.cfg), nil, "service.openai_gateway")
 										}
 										multiplier = resolver.Resolve(ctx, user.ID, *apiKey.GroupID, apiKey.Group.RateMultiplier)
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									}
-												feat(billing): 网关计费迁移到 CalculateCostUnified + 模型限制错误统一

- GatewayService/OpenAIGatewayService 注入 ModelPricingResolver
- RecordUsage 从旧路径迁移到 CalculateCostUnified（支持 per_request/image 模式）
- 无渠道时自动回退旧路径，保持原有行为
- 长上下文双倍计费仅在无渠道定价时生效
- CostBreakdown 新增 BillingMode 字段，使用日志记录实际计费模式
- 模型限制错误改为与"无可用账号"相同的 503 响应

											
										
										
											2026-03-30 22:58:28 +08:00
+									var cost *CostBreakdown
 									var err error
-												fix(usage): preserve requested model in gateway billing paths

Ultraworked with [Sisyphus](https://github.com/code-yeongyu/oh-my-openagent)

Co-authored-by: Sisyphus <clio-agent@sisyphuslabs.ai>

											
										
										
											2026-03-21 01:23:54 +08:00
+									billingModel := forwardResultBillingModel(result.Model, result.UpstreamModel)
-												feat(channel): 通配符定价匹配 + OpenAI BillingModelSource + 按次价格校验 + 用户端计费模式展示

- 定价查找支持通配符(suffix *)，最长前缀优先匹配
- 模型限制(restrict_models)同样支持通配符匹配
- OpenAI 网关接入渠道映射/BillingModelSource/模型限制
- 按次/图片计费模式创建时强制要求价格或层级(前后端)
- 用户使用记录列表增加计费模式 badge 列

											
										
										
											2026-03-31 00:23:45 +08:00
+									if result.BillingModel != "" {
 										billingModel = strings.TrimSpace(result.BillingModel)
 									}
-												fix(billing): prevent channel_mapped override from reverting BillingModel when channel did not map

When a channel has no model mapping for the requested model, ChannelMappedModel
equals OriginalModel (the user's arbitrary input). Combined with the default
BillingModelSource="channel_mapped", this incorrectly overrides the BillingModel
set by the OpenAI format conversion layer (e.g., gpt-5.4 from DefaultMappedModel)
back to the unmapped original model (e.g., glm) which has no pricing — resulting
in zero-cost billing.

Add guard condition so the channel_mapped override only fires when the channel
actually changed the model (ChannelMappedModel != OriginalModel).

											
										
										
											2026-04-05 17:22:59 +08:00
+									if input.BillingModelSource == BillingModelSourceChannelMapped && input.ChannelMappedModel != "" && input.ChannelMappedModel != input.OriginalModel {
-												feat: image output token billing, channel-mapped billing source, credits balance precheck

- Parse candidatesTokensDetails from Gemini API to separate image/text output tokens
- Add image_output_tokens and image_output_cost to usage_log (migration 089)
- Support per-image-token pricing via output_cost_per_image_token from model pricing data
- Channel pricing ImageOutputPrice override works in token billing mode
- Auto-fill image_output_price in channel pricing form from model defaults
- Add "channel_mapped" billing model source as new default (migration 088)
- Bills by model name after channel mapping, before account mapping
- Fix channel cache error TTL sign error (115s → 5s)
- Fix Update channel only invalidating new groups, not removed groups
- Fix frontend model_mapping clearing sending undefined instead of {}
- Credits balance precheck via shared AccountUsageService cache before injection
- Skip credits injection for accounts with insufficient balance
- Don't mark credits exhausted for "exhausted your capacity on this model" 429s

											
										
										
											2026-04-01 15:08:57 +08:00
+										billingModel = input.ChannelMappedModel
 									}
-												fix: address audit findings - cache sync, validation, consistency

- clearCreditsExhausted: sync Redis scheduler cache after DB update
- Image billing mode UI: write to per_request_price instead of image_output_price
- OpenAI RecordUsage: use BillingModelSourceRequested constant, add s.cfg nil guard
- Fix i18n key path: admin.channels.perRequestPriceRequired → admin.channels.form.perRequestPriceRequired

											
										
										
											2026-04-01 23:13:58 +08:00
+									if input.BillingModelSource == BillingModelSourceRequested && input.OriginalModel != "" {
-												feat(channel): 通配符定价匹配 + OpenAI BillingModelSource + 按次价格校验 + 用户端计费模式展示

- 定价查找支持通配符(suffix *)，最长前缀优先匹配
- 模型限制(restrict_models)同样支持通配符匹配
- OpenAI 网关接入渠道映射/BillingModelSource/模型限制
- 按次/图片计费模式创建时强制要求价格或层级(前后端)
- 用户使用记录列表增加计费模式 badge 列

											
										
										
											2026-03-31 00:23:45 +08:00
+										billingModel = input.OriginalModel
 									}
-												fix(billing): 修复 OpenAI fast 档位计费并补齐展示

- 打通 service_tier 在 OpenAI HTTP、WS、passthrough 与 usage 记录中的传递
- 修正 priority/flex 计费逻辑，并将 fast 归一化为 priority
- 在用户端和管理端补齐服务档位与计费明细展示
- 补齐前后端测试，并修复 WS 限流信号重复持久化导致的全量回归失败

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-03-08 23:22:28 +08:00
+									serviceTier := ""
 									if result.ServiceTier != nil {
 										serviceTier = strings.TrimSpace(*result.ServiceTier)
 									}
-												feat(openai): 同步生图 API 支持并接入图片计费调度

- 同步 OpenAI 图片生成与编辑接口
- 接入图片请求解析、账号调度、转发与用量记录
- 接入图片计费与图片用量落库
- 限制 OAuth 生图仅支持无显式模型和尺寸的基础请求

											
										
										
											2026-04-22 12:30:08 +08:00
+									cost, err = s.calculateOpenAIRecordUsageCost(ctx, result, apiKey, billingModel, multiplier, tokens, serviceTier)
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									if err != nil {
 										cost = &CostBreakdown{ActualCost: 0}
 									}
 									// Determine billing type
 									isSubscriptionBilling := subscription != nil && apiKey.Group != nil && apiKey.Group.IsSubscriptionType()
-												refactor: 调整项目结构为单向依赖

											
										
										
											2025-12-26 15:40:24 +08:00
+									billingType := BillingTypeBalance
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									if isSubscriptionBilling {
-												refactor: 调整项目结构为单向依赖

											
										
										
											2025-12-26 15:40:24 +08:00
+										billingType = BillingTypeSubscription
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									}
 									// Create usage log
 									durationMs := int(result.Duration.Milliseconds())
-												feat: merge dev

											
										
										
											2026-01-15 15:14:44 +08:00
+									accountRateMultiplier := account.BillingRateMultiplier()
-												feat: decouple billing correctness from usage log batching

											
										
										
											2026-03-12 16:53:18 +08:00
+									requestID := resolveUsageBillingRequestID(ctx, result.RequestID)
-												fix(channel): 全平台渠道映射覆盖 + 公共函数抽取 + 死代码清理

- 4个缺失handler入口添加渠道映射+限制检查(ChatCompletions/Responses/Gemini)
- 模型限制错误信息优化，区分"模型不可用"和"无账号"
- OpenAI RecordUsage RequestedModel 改用 OriginalModel
- ResolveChannelMappingAndRestrict/ReplaceModelInBody 抽取到 ChannelService 消除跨service重复
- validateNoDuplicateModels 按 platform:model 去重
- 删除 Channel.ResolveMappedModel 死代码和 CalculateCostWithChannel Deprecated方法
- 移除冗余nil检查，抽取 validatePricingBillingMode 公共校验

											
										
										
											2026-03-31 15:26:20 +08:00
 									// 确定 RequestedModel（渠道映射前的原始模型）
 									requestedModel := result.Model
 									if input.OriginalModel != "" {
 										requestedModel = input.OriginalModel
 									}
-												refactor: 调整项目结构为单向依赖

											
										
										
											2025-12-26 15:40:24 +08:00
+									usageLog := &UsageLog{
-												fix: golangci-lint test assertion and gofmt

											
										
										
											2026-04-01 16:39:38 +08:00
+										UserID:              user.ID,
 										APIKeyID:            apiKey.ID,
 										AccountID:           account.ID,
 										RequestID:           requestID,
 										Model:               result.Model,
 										RequestedModel:      requestedModel,
 										UpstreamModel:       optionalNonEqualStringPtr(result.UpstreamModel, result.Model),
 										ServiceTier:         result.ServiceTier,
 										ReasoningEffort:     result.ReasoningEffort,
 										InboundEndpoint:     optionalTrimmedStringPtr(input.InboundEndpoint),
 										UpstreamEndpoint:    optionalTrimmedStringPtr(input.UpstreamEndpoint),
 										InputTokens:         actualInputTokens,
 										OutputTokens:        result.Usage.OutputTokens,
 										CacheCreationTokens: result.Usage.CacheCreationInputTokens,
 										CacheReadTokens:     result.Usage.CacheReadInputTokens,
 										ImageOutputTokens:   result.Usage.ImageOutputTokens,
-												feat(openai): 同步生图 API 支持并接入图片计费调度

- 同步 OpenAI 图片生成与编辑接口
- 接入图片请求解析、账号调度、转发与用量记录
- 接入图片计费与图片用量落库
- 限制 OAuth 生图仅支持无显式模型和尺寸的基础请求

											
										
										
											2026-04-22 12:30:08 +08:00
+										ImageCount:          result.ImageCount,
 										ImageSize:           optionalTrimmedStringPtr(result.ImageSize),
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									}
-												fix: resolve golangci-lint issues

- Fix errcheck: defer rows.Close() with nolint
- Fix errcheck: type assertion with ok check in channel cache
- Fix staticcheck ST1005: lowercase error string
- Fix staticcheck SA5011: nil check cost before use in openai gateway
- Fix gofmt: format chatcompletions_to_responses.go

											
										
										
											2026-04-01 16:30:47 +08:00
+									if cost != nil {
 										usageLog.InputCost = cost.InputCost
 										usageLog.OutputCost = cost.OutputCost
 										usageLog.ImageOutputCost = cost.ImageOutputCost
 										usageLog.CacheCreationCost = cost.CacheCreationCost
 										usageLog.CacheReadCost = cost.CacheReadCost
 										usageLog.TotalCost = cost.TotalCost
 										usageLog.ActualCost = cost.ActualCost
 									}
 									usageLog.RateMultiplier = multiplier
 									usageLog.AccountRateMultiplier = &accountRateMultiplier
 									usageLog.BillingType = billingType
 									usageLog.Stream = result.Stream
 									usageLog.OpenAIWSMode = result.OpenAIWSMode
 									usageLog.DurationMs = &durationMs
 									usageLog.FirstTokenMs = result.FirstTokenMs
 									usageLog.CreatedAt = time.Now()
-												feat(channel): 通配符定价匹配 + OpenAI BillingModelSource + 按次价格校验 + 用户端计费模式展示

- 定价查找支持通配符(suffix *)，最长前缀优先匹配
- 模型限制(restrict_models)同样支持通配符匹配
- OpenAI 网关接入渠道映射/BillingModelSource/模型限制
- 按次/图片计费模式创建时强制要求价格或层级(前后端)
- 用户使用记录列表增加计费模式 badge 列

											
										
										
											2026-03-31 00:23:45 +08:00
+									// 设置渠道信息
 									usageLog.ChannelID = optionalInt64Ptr(input.ChannelID)
 									usageLog.ModelMappingChain = optionalTrimmedStringPtr(input.ModelMappingChain)
-												feat(billing): 网关计费迁移到 CalculateCostUnified + 模型限制错误统一

- GatewayService/OpenAIGatewayService 注入 ModelPricingResolver
- RecordUsage 从旧路径迁移到 CalculateCostUnified（支持 per_request/image 模式）
- 无渠道时自动回退旧路径，保持原有行为
- 长上下文双倍计费仅在无渠道定价时生效
- CostBreakdown 新增 BillingMode 字段，使用日志记录实际计费模式
- 模型限制错误改为与"无可用账号"相同的 503 响应

											
										
										
											2026-03-30 22:58:28 +08:00
+									// 设置计费模式
 									if cost != nil && cost.BillingMode != "" {
 										billingMode := cost.BillingMode
 										usageLog.BillingMode = &billingMode
-												feat(openai): 同步生图 API 支持并接入图片计费调度

- 同步 OpenAI 图片生成与编辑接口
- 接入图片请求解析、账号调度、转发与用量记录
- 接入图片计费与图片用量落库
- 限制 OAuth 生图仅支持无显式模型和尺寸的基础请求

											
										
										
											2026-04-22 12:30:08 +08:00
+									} else if result.ImageCount > 0 {
 										billingMode := string(BillingModeImage)
 										usageLog.BillingMode = &billingMode
-												feat(billing): 网关计费迁移到 CalculateCostUnified + 模型限制错误统一

- GatewayService/OpenAIGatewayService 注入 ModelPricingResolver
- RecordUsage 从旧路径迁移到 CalculateCostUnified（支持 per_request/image 模式）
- 无渠道时自动回退旧路径，保持原有行为
- 长上下文双倍计费仅在无渠道定价时生效
- CostBreakdown 新增 BillingMode 字段，使用日志记录实际计费模式
- 模型限制错误改为与"无可用账号"相同的 503 响应

											
										
										
											2026-03-30 22:58:28 +08:00
+									} else {
-												refactor: replace magic strings with named constants

- PricingSourceChannel/LiteLLM/Fallback for resolver source
- MediaTypeImage/Video/Prompt for result.MediaType
- Reuse BillingModeToken/BillingModeImage for billing mode
- Reuse BillingModelSourceChannelMapped/PlatformAnthropic in handler

											
										
										
											2026-04-02 02:22:15 +08:00
+										billingMode := string(BillingModeToken)
-												feat(usage): 使用记录增加计费模式字段 — 记录/展示/筛选 token/按次/图片

- DB: usage_logs 表新增 billing_mode VARCHAR(20) 列
- 后端: RecordUsage 写入时根据 image_count 判定计费模式
- 前端: 使用记录表格新增计费模式 badge 列 + 筛选下拉

											
										
										
											2026-03-30 22:13:16 +08:00
+										usageLog.BillingMode = &billingMode
 									}
-												feat(usage-log): 增加请求 User-Agent 记录

在使用记录中添加 user_agent 字段，用于记录 API 请求的 User-Agent 头信息，
便于分析客户端类型和调试。

变更内容：
- 新增数据库迁移 028_add_usage_logs_user_agent.sql
- 更新 UsageLog 模型和 Ent Schema 添加 user_agent 字段
- 更新 Repository 层的 Create 和 scanUsageLog 方法
- 更新 RecordUsageInput 结构体支持传入 UserAgent
- 更新 Claude/OpenAI/Gemini 三个网关 Handler 传递 UserAgent

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>

											
										
										
											2026-01-06 16:23:56 +08:00
+									// 添加 UserAgent
 									if input.UserAgent != "" {
 										usageLog.UserAgent = &input.UserAgent
 									}
-												feat(api-key): 添加 IP 白名单/黑名单限制功能 (#221)

* feat(api-key): add IP whitelist/blacklist restriction and usage log IP tracking

- Add IP restriction feature for API keys (whitelist/blacklist with CIDR support)
- Add IP address logging to usage logs (admin-only visibility)
- Remove billing_type column from usage logs UI (redundant)
- Use generic "Access denied" error message for security

Backend:
- New ip package with IP/CIDR validation and matching utilities
- Database migrations for ip_whitelist, ip_blacklist (api_keys) and ip_address (usage_logs)
- Middleware IP restriction check after API key validation
- Input validation for IP/CIDR patterns on create/update

Frontend:
- API key form with enable toggle for IP restriction
- Shield icon indicator in table for keys with IP restriction
- Removed billing_type filter and column from usage views

* fix: update API contract tests for ip_whitelist/ip_blacklist fields

Add ip_whitelist and ip_blacklist fields to expected JSON responses
in API contract tests to match the new API key schema.
											
										
										
											2026-01-09 21:59:32 +08:00
+									// 添加 IPAddress
 									if input.IPAddress != "" {
 										usageLog.IPAddress = &input.IPAddress
 									}
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									if apiKey.GroupID != nil {
 										usageLog.GroupID = apiKey.GroupID
 									}
 									if subscription != nil {
 										usageLog.SubscriptionID = &subscription.ID
 									}
-												fix(channel): use upstream model for account stats pricing and remove channel pricing fallback

- resolveAccountStatsCost now uses the final upstream model (after
  account-level mapping) to match custom pricing rules, fixing the
  issue where requested model (e.g. claude-sonnet-4-5) didn't match
  rules configured for upstream model (e.g. claude-opus-4-6)
- Remove tryChannelPricing fallback — only custom rules are applied,
  unmatched requests use default formula (total_cost × rate)
- Remove unused billingService and serviceTier parameters
- Update description: "启用后将支持自定义账号统计的模型价格"

											
										
										
											2026-04-13 02:28:31 +08:00
+									// 计算账号统计定价费用（使用最终上游模型匹配自定义规则）
-												feat(channels): add custom account stats pricing rules

Allow channels to configure independent model pricing for account
statistics cost calculation, decoupled from user billing.

Backend:
- Migration 101: channels.apply_pricing_to_account_stats toggle,
  channel_account_stats_pricing_rules/model_pricing tables,
  usage_logs.account_stats_cost column
- resolveAccountStatsCost: match rules by group/account, then channel
  pricing, fallback to original formula when unconfigured
- Integrate into both GatewayService.recordUsageCore and
  OpenAIGatewayService.RecordUsage
- Update 8 account stats SQL queries to use
  COALESCE(account_stats_cost, total_cost) * account_rate_multiplier
- 23 unit tests for matching, pricing lookup, and cost calculation

Frontend:
- Channel edit dialog: toggle + custom rules UI with group/account
  multi-select and pricing entry cards
- API types and i18n (zh/en)

											
										
										
											2026-04-11 23:39:49 +08:00
+									if apiKey.GroupID != nil {
-												fix: merge general improvements from release branch

Backend:
- gateway_handler: pass subject.UserID instead of int64(0) for user-level routing
- setting_handler: add missing BalanceLowNotifyRechargeURL to UpdateSettings response
- openai_gateway_service: use applyAccountStatsCost for account stats pricing integration
- embed_on: add local file override (data/public/) for embedded frontend assets

Frontend:
- useTableSelection: add batchUpdate method for batch operations
- AccountsView: virtual scrolling params, Set-based isSelected, swipe virtualization
- ProxiesView: add batchUpdate to selection and swipe-select
- BulkEditAccountModal: fix submit handler to prevent event object as argument
- SettingsView: move payload construction outside try block
- i18n: add general translation keys (saved, deleted, view, validation, allowUserRefund)
- api/client: reorder error fields for consistency
- stores/payment: clarify pollOrderStatus JSDoc

											
										
										
											2026-04-14 19:29:37 +08:00
+										applyAccountStatsCost(ctx, usageLog, s.channelService, s.billingService,
 											account.ID, *apiKey.GroupID, result.UpstreamModel, result.Model,
 											tokens, cost.TotalCost,
-												feat(channels): add custom account stats pricing rules

Allow channels to configure independent model pricing for account
statistics cost calculation, decoupled from user billing.

Backend:
- Migration 101: channels.apply_pricing_to_account_stats toggle,
  channel_account_stats_pricing_rules/model_pricing tables,
  usage_logs.account_stats_cost column
- resolveAccountStatsCost: match rules by group/account, then channel
  pricing, fallback to original formula when unconfigured
- Integrate into both GatewayService.recordUsageCore and
  OpenAIGatewayService.RecordUsage
- Update 8 account stats SQL queries to use
  COALESCE(account_stats_cost, total_cost) * account_rate_multiplier
- 23 unit tests for matching, pricing lookup, and cost calculation

Frontend:
- Channel edit dialog: toggle + custom rules UI with group/account
  multi-select and pricing entry cards
- API types and i18n (zh/en)

											
										
										
											2026-04-11 23:39:49 +08:00
+										)
 									}
-												feat(全栈): 实现简易模式核心功能

**功能概述**：
实现简易模式(Simple Mode)，为个人用户和小团队提供简化的使用体验，隐藏复杂的分组、订阅、配额等概念。

**后端改动**：
1. 配置系统
   - 新增 run_mode 配置项（standard/simple）
   - 支持环境变量 RUN_MODE
   - 默认值为 standard

2. 数据库初始化
   - 自动创建3个默认分组：anthropic-default、openai-default、gemini-default
   - 默认分组配置：无并发限制、active状态、非独占
   - 幂等性保证：重复启动不会重复创建

3. 账号管理
   - 创建账号时自动绑定对应平台的默认分组
   - 如果未指定分组，自动查找并绑定默认分组

**前端改动**：
1. 状态管理
   - authStore 新增 isSimpleMode 计算属性
   - 从后端API获取并同步运行模式

2. UI隐藏
   - 侧边栏：隐藏分组管理、订阅管理、兑换码菜单
   - 账号管理页面：隐藏分组列
   - 创建/编辑账号对话框：隐藏分组选择器

3. 路由守卫
   - 限制访问分组、订阅、兑换码相关页面
   - 访问受限页面时自动重定向到仪表板

**配置示例**：
```yaml
run_mode: simple

run_mode: standard
```

**影响范围**：
- 后端：配置、数据库迁移、账号服务
- 前端：认证状态、路由、UI组件
- 部署：配置文件示例

**兼容性**：
- 简易模式和标准模式可无缝切换
- 不需要数据迁移
- 现有数据不受影响

											
										
										
											2025-12-29 03:17:25 +08:00
+									if s.cfg != nil && s.cfg.RunMode == config.RunModeSimple {
-												feat: decouple billing correctness from usage log batching

											
										
										
											2026-03-12 16:53:18 +08:00
+										writeUsageLogBestEffort(ctx, s.usageLogRepo, usageLog, "service.openai_gateway")
-												chore(logging): 完成后端日志审计与结构化迁移

- 将高密度服务与处理器日志迁移到新日志系统（LegacyPrintf/结构化日志）
- 增加 stdlog bridge 与兼容测试，保留旧日志捕获能力
- 将 OpenAI 断流告警改为结构化 Warn 并改造对应测试为 sink 捕获
- 补齐后端相关文件 logger 引用并通过全量 go test

											
										
										
											2026-02-12 19:01:09 +08:00
+										logger.LegacyPrintf("service.openai_gateway", "[SIMPLE MODE] Usage recorded (not billed): user=%d, tokens=%d", usageLog.UserID, usageLog.TotalTokens())
-												feat(全栈): 实现简易模式核心功能

**功能概述**：
实现简易模式(Simple Mode)，为个人用户和小团队提供简化的使用体验，隐藏复杂的分组、订阅、配额等概念。

**后端改动**：
1. 配置系统
   - 新增 run_mode 配置项（standard/simple）
   - 支持环境变量 RUN_MODE
   - 默认值为 standard

2. 数据库初始化
   - 自动创建3个默认分组：anthropic-default、openai-default、gemini-default
   - 默认分组配置：无并发限制、active状态、非独占
   - 幂等性保证：重复启动不会重复创建

3. 账号管理
   - 创建账号时自动绑定对应平台的默认分组
   - 如果未指定分组，自动查找并绑定默认分组

**前端改动**：
1. 状态管理
   - authStore 新增 isSimpleMode 计算属性
   - 从后端API获取并同步运行模式

2. UI隐藏
   - 侧边栏：隐藏分组管理、订阅管理、兑换码菜单
   - 账号管理页面：隐藏分组列
   - 创建/编辑账号对话框：隐藏分组选择器

3. 路由守卫
   - 限制访问分组、订阅、兑换码相关页面
   - 访问受限页面时自动重定向到仪表板

**配置示例**：
```yaml
run_mode: simple

run_mode: standard
```

**影响范围**：
- 后端：配置、数据库迁移、账号服务
- 前端：认证状态、路由、UI组件
- 部署：配置文件示例

**兼容性**：
- 简易模式和标准模式可无缝切换
- 不需要数据迁移
- 现有数据不受影响

											
										
										
											2025-12-29 03:17:25 +08:00
+										s.deferredService.ScheduleLastUsedUpdate(account.ID)
 										return nil
 									}
-												feat: decouple billing correctness from usage log batching

											
										
										
											2026-03-12 16:53:18 +08:00
+									billingErr := func() error {
 										_, err := applyUsageBilling(ctx, requestID, usageLog, &postUsageBillingParams{
-												refactor: unify post-usage billing logic and fix account quota calculation

- Extract postUsageBilling() to consolidate billing logic across
  GatewayService.RecordUsage, RecordUsageWithLongContext, and
  OpenAIGatewayService.RecordUsage, eliminating ~120 lines of
  duplicated code
- Fix account quota to use TotalCost × accountRateMultiplier
  (was using raw TotalCost, inconsistent with account cost stats)
- Fix RecordUsageWithLongContext API Key quota only updating in
  balance mode (now updates regardless of billing type)
- Fix WebSocket client disconnect detection on Windows by adding
  "an established connection was aborted" to known disconnect errors

											
										
										
											2026-03-06 00:37:37 +08:00
+											Cost:                  cost,
 											User:                  user,
 											APIKey:                apiKey,
 											Account:               account,
 											Subscription:          subscription,
-												feat: decouple billing correctness from usage log batching

											
										
										
											2026-03-12 16:53:18 +08:00
+											RequestPayloadHash:    resolveUsageBillingPayloadFingerprint(ctx, input.RequestPayloadHash),
-												refactor: unify post-usage billing logic and fix account quota calculation

- Extract postUsageBilling() to consolidate billing logic across
  GatewayService.RecordUsage, RecordUsageWithLongContext, and
  OpenAIGatewayService.RecordUsage, eliminating ~120 lines of
  duplicated code
- Fix account quota to use TotalCost × accountRateMultiplier
  (was using raw TotalCost, inconsistent with account cost stats)
- Fix RecordUsageWithLongContext API Key quota only updating in
  balance mode (now updates regardless of billing type)
- Fix WebSocket client disconnect detection on Windows by adding
  "an established connection was aborted" to known disconnect errors

											
										
										
											2026-03-06 00:37:37 +08:00
+											IsSubscriptionBill:    isSubscriptionBilling,
 											AccountRateMultiplier: accountRateMultiplier,
 											APIKeyService:         input.APIKeyService,
-												feat: decouple billing correctness from usage log batching

											
										
										
											2026-03-12 16:53:18 +08:00
+										}, s.billingDeps(), s.usageBillingRepo)
 										return err
 									}()
 									if billingErr != nil {
 										return billingErr
-												feat: add quota limit for API key accounts

- Add configurable spending limit (quota_limit) for apikey-type accounts
- Atomic quota accumulation via PostgreSQL JSONB operations on TotalCost
- Scheduler filters out over-quota accounts with outbox-triggered snapshot refresh
- Display quota usage ($used / $limit) in account capacity column
- Add "Reset Quota" action in account menu to reset usage to zero
- Editing account settings preserves quota_used (no accidental reset)
- Covers all 3 billing paths: Anthropic, Gemini, OpenAI RecordUsage

chore: bump version to 0.1.90.4

											
										
										
											2026-03-05 20:54:37 +08:00
+									}
-												feat: decouple billing correctness from usage log batching

											
										
										
											2026-03-12 16:53:18 +08:00
+									writeUsageLogBestEffort(ctx, s.usageLogRepo, usageLog, "service.openai_gateway")
-												feat: add quota limit for API key accounts

- Add configurable spending limit (quota_limit) for apikey-type accounts
- Atomic quota accumulation via PostgreSQL JSONB operations on TotalCost
- Scheduler filters out over-quota accounts with outbox-triggered snapshot refresh
- Display quota usage ($used / $limit) in account capacity column
- Add "Reset Quota" action in account menu to reset usage to zero
- Editing account settings preserves quota_used (no accidental reset)
- Covers all 3 billing paths: Anthropic, Gemini, OpenAI RecordUsage

chore: bump version to 0.1.90.4

											
										
										
											2026-03-05 20:54:37 +08:00
-												feat: 新增支持codex转发

											
										
										
											2025-12-22 22:58:31 +08:00
+									return nil
 								}
-												feat: OpenAI OAuth账号显示Codex使用量

从响应头提取x-codex-*使用量信息并保存到账号Extra字段，
前端账号列表展示5h/7d窗口的使用进度条。

											
										
										
											2025-12-23 16:26:07 +08:00
-												feat(openai): 同步生图 API 支持并接入图片计费调度

- 同步 OpenAI 图片生成与编辑接口
- 接入图片请求解析、账号调度、转发与用量记录
- 接入图片计费与图片用量落库
- 限制 OAuth 生图仅支持无显式模型和尺寸的基础请求

											
										
										
											2026-04-22 12:30:08 +08:00
+								func (s *OpenAIGatewayService) calculateOpenAIRecordUsageCost(
 									ctx context.Context,
 									result *OpenAIForwardResult,
 									apiKey *APIKey,
 									billingModel string,
 									multiplier float64,
 									tokens UsageTokens,
 									serviceTier string,
 								) (*CostBreakdown, error) {
 									if result != nil && result.ImageCount > 0 {
 										return s.calculateOpenAIImageCost(ctx, billingModel, apiKey, result, multiplier), nil
 									}
 									if s.resolver != nil && apiKey.Group != nil {
 										gid := apiKey.Group.ID
 										return s.billingService.CalculateCostUnified(CostInput{
 											Ctx:            ctx,
 											Model:          billingModel,
 											GroupID:        &gid,
 											Tokens:         tokens,
 											RequestCount:   1,
 											RateMultiplier: multiplier,
 											ServiceTier:    serviceTier,
 											Resolver:       s.resolver,
 										})
 									}
 									return s.billingService.CalculateCostWithServiceTier(billingModel, tokens, multiplier, serviceTier)
 								}
 								func (s *OpenAIGatewayService) calculateOpenAIImageCost(
 									ctx context.Context,
 									billingModel string,
 									apiKey *APIKey,
 									result *OpenAIForwardResult,
 									multiplier float64,
 								) *CostBreakdown {
-												修复计费问题以及模型回显

											
										
										
											2026-04-23 15:09:47 +08:00
+									if resolved := s.resolveOpenAIChannelPricing(ctx, billingModel, apiKey); resolved != nil &&
 										(resolved.Mode == BillingModePerRequest || resolved.Mode == BillingModeImage) {
-												feat(openai): 同步生图 API 支持并接入图片计费调度

- 同步 OpenAI 图片生成与编辑接口
- 接入图片请求解析、账号调度、转发与用量记录
- 接入图片计费与图片用量落库
- 限制 OAuth 生图仅支持无显式模型和尺寸的基础请求

											
										
										
											2026-04-22 12:30:08 +08:00
+										gid := apiKey.Group.ID
 										cost, err := s.billingService.CalculateCostUnified(CostInput{
 											Ctx:            ctx,
 											Model:          billingModel,
 											GroupID:        &gid,
 											RequestCount:   1,
 											SizeTier:       result.ImageSize,
 											RateMultiplier: multiplier,
 											Resolver:       s.resolver,
 											Resolved:       resolved,
 										})
 										if err == nil {
 											return cost
 										}
 										logger.LegacyPrintf("service.openai_gateway", "Calculate image channel cost failed: %v", err)
 									}
 									var groupConfig *ImagePriceConfig
 									if apiKey != nil && apiKey.Group != nil {
 										groupConfig = &ImagePriceConfig{
 											Price1K: apiKey.Group.ImagePrice1K,
 											Price2K: apiKey.Group.ImagePrice2K,
 											Price4K: apiKey.Group.ImagePrice4K,
 										}
 									}
 									return s.billingService.CalculateImageCost(billingModel, result.ImageSize, result.ImageCount, groupConfig, multiplier)
 								}
 								// resolveOpenAIChannelPricing looks up pricing for billingModel within the API
 								// key's group and returns it only when the resolver reports the source as
 								// PricingSourceChannel. It returns nil when no resolver is configured, when the
 								// key or its group is missing, or when the pricing comes from any other source.
 								func (s *OpenAIGatewayService) resolveOpenAIChannelPricing(ctx context.Context, billingModel string, apiKey *APIKey) *ResolvedPricing {
 									if s.resolver == nil {
 										return nil
 									}
 									if apiKey == nil || apiKey.Group == nil {
 										return nil
 									}
 									groupID := apiKey.Group.ID
 									pricing := s.resolver.Resolve(ctx, PricingInput{Model: billingModel, GroupID: &groupID})
 									if pricing.Source != PricingSourceChannel {
 										return nil
 									}
 									return pricing
 								}
-												fix(ratelimit): 修复 OpenAI 账号限流倒计时计算错误

- 解析 x-codex-* 响应头获取正确的重置时间
- 7d 限制用尽时使用 codex_7d_reset_after_seconds
- 提取 Normalize() 方法统一窗口规范化逻辑

											
										
										
											2026-01-25 13:32:08 +08:00
+								// ParseCodexRateLimitHeaders extracts Codex usage limits from response headers.
 								// Exported for use in ratelimit_service when handling OpenAI 429 responses.
 								func ParseCodexRateLimitHeaders(headers http.Header) *OpenAICodexUsageSnapshot {
-												feat: OpenAI OAuth账号显示Codex使用量

从响应头提取x-codex-*使用量信息并保存到账号Extra字段，
前端账号列表展示5h/7d窗口的使用进度条。

											
										
										
											2025-12-23 16:26:07 +08:00
+									snapshot := &OpenAICodexUsageSnapshot{}
 									hasData := false
 									// Helper to parse float64 from header
 									parseFloat := func(key string) *float64 {
 										if v := headers.Get(key); v != "" {
 											if f, err := strconv.ParseFloat(v, 64); err == nil {
 												return &f
 											}
 										}
 										return nil
 									}
 									// Helper to parse int from header
 									parseInt := func(key string) *int {
 										if v := headers.Get(key); v != "" {
 											if i, err := strconv.Atoi(v); err == nil {
 												return &i
 											}
 										}
 										return nil
 									}
 									// Primary (weekly) limits
 									if v := parseFloat("x-codex-primary-used-percent"); v != nil {
 										snapshot.PrimaryUsedPercent = v
 										hasData = true
 									}
 									if v := parseInt("x-codex-primary-reset-after-seconds"); v != nil {
 										snapshot.PrimaryResetAfterSeconds = v
 										hasData = true
 									}
 									if v := parseInt("x-codex-primary-window-minutes"); v != nil {
 										snapshot.PrimaryWindowMinutes = v
 										hasData = true
 									}
 									// Secondary (5h) limits
 									if v := parseFloat("x-codex-secondary-used-percent"); v != nil {
 										snapshot.SecondaryUsedPercent = v
 										hasData = true
 									}
 									if v := parseInt("x-codex-secondary-reset-after-seconds"); v != nil {
 										snapshot.SecondaryResetAfterSeconds = v
 										hasData = true
 									}
 									if v := parseInt("x-codex-secondary-window-minutes"); v != nil {
 										snapshot.SecondaryWindowMinutes = v
 										hasData = true
 									}
 									// Overflow ratio
 									if v := parseFloat("x-codex-primary-over-secondary-limit-percent"); v != nil {
 										snapshot.PrimaryOverSecondaryPercent = v
 										hasData = true
 									}
 									if !hasData {
 										return nil
 									}
 									snapshot.UpdatedAt = time.Now().Format(time.RFC3339)
 									return snapshot
 								}
-												fix(codex): 修复额度窗口过期展示并补齐高覆盖测试

- 后端新增绝对重置时间字段计算（codex_5h_reset_at/codex_7d_reset_at）

- 前端统一窗口解析逻辑：绝对时间优先，updated_at+seconds 回退，过期自动归零

- 新增后端与前端单元测试，覆盖关键边界与异常场景

											
										
										
											2026-02-22 21:04:52 +08:00
+								func codexSnapshotBaseTime(snapshot *OpenAICodexUsageSnapshot, fallback time.Time) time.Time {
-												feat: OpenAI OAuth账号显示Codex使用量

从响应头提取x-codex-*使用量信息并保存到账号Extra字段，
前端账号列表展示5h/7d窗口的使用进度条。

											
										
										
											2025-12-23 16:26:07 +08:00
+									if snapshot == nil {
-												fix(codex): 修复额度窗口过期展示并补齐高覆盖测试

- 后端新增绝对重置时间字段计算（codex_5h_reset_at/codex_7d_reset_at）

- 前端统一窗口解析逻辑：绝对时间优先，updated_at+seconds 回退，过期自动归零

- 新增后端与前端单元测试，覆盖关键边界与异常场景

											
										
										
											2026-02-22 21:04:52 +08:00
+										return fallback
-												feat: OpenAI OAuth账号显示Codex使用量

从响应头提取x-codex-*使用量信息并保存到账号Extra字段，
前端账号列表展示5h/7d窗口的使用进度条。

											
										
										
											2025-12-23 16:26:07 +08:00
+									}
-												fix(codex): 修复额度窗口过期展示并补齐高覆盖测试

- 后端新增绝对重置时间字段计算（codex_5h_reset_at/codex_7d_reset_at）

- 前端统一窗口解析逻辑：绝对时间优先，updated_at+seconds 回退，过期自动归零

- 新增后端与前端单元测试，覆盖关键边界与异常场景

											
										
										
											2026-02-22 21:04:52 +08:00
+									if snapshot.UpdatedAt == "" {
 										return fallback
 									}
 									base, err := time.Parse(time.RFC3339, snapshot.UpdatedAt)
 									if err != nil {
 										return fallback
 									}
 									return base
 								}
 								// codexResetAtRFC3339 converts a "reset after N seconds" countdown into an
 								// absolute RFC3339 timestamp relative to base. It returns nil when
 								// resetAfterSeconds is nil; negative countdowns are treated as zero, so the
 								// result is never earlier than base.
 								func codexResetAtRFC3339(base time.Time, resetAfterSeconds *int) *string {
 									if resetAfterSeconds == nil {
 										return nil
 									}
 									var offset time.Duration
 									if *resetAfterSeconds > 0 {
 										offset = time.Duration(*resetAfterSeconds) * time.Second
 									}
 									formatted := base.Add(offset).Format(time.RFC3339)
 									return &formatted
 								}
 								func buildCodexUsageExtraUpdates(snapshot *OpenAICodexUsageSnapshot, fallbackNow time.Time) map[string]any {
 									if snapshot == nil {
 										return nil
-												feat(openai): 增加 OAuth 透传开关

- 仅对 Codex CLI 且账号开启时走原样透传（只替换认证）

- 透传模式禁用工具修正/模型替换，并旁路解析 usage 用于计费

- 管理后台增加开关与文案，ops upstream error 记录 passthrough 标记

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-11 00:59:39 +08:00
+									}
-												feat: OpenAI OAuth账号显示Codex使用量

从响应头提取x-codex-*使用量信息并保存到账号Extra字段，
前端账号列表展示5h/7d窗口的使用进度条。

											
										
										
											2025-12-23 16:26:07 +08:00
-												fix(codex): 修复额度窗口过期展示并补齐高覆盖测试

- 后端新增绝对重置时间字段计算（codex_5h_reset_at/codex_7d_reset_at）

- 前端统一窗口解析逻辑：绝对时间优先，updated_at+seconds 回退，过期自动归零

- 新增后端与前端单元测试，覆盖关键边界与异常场景

											
										
										
											2026-02-22 21:04:52 +08:00
+									baseTime := codexSnapshotBaseTime(snapshot, fallbackNow)
-												feat: OpenAI OAuth账号显示Codex使用量

从响应头提取x-codex-*使用量信息并保存到账号Extra字段，
前端账号列表展示5h/7d窗口的使用进度条。

											
										
										
											2025-12-23 16:26:07 +08:00
+									updates := make(map[string]any)
-												fix(ratelimit): 修复 OpenAI 账号限流倒计时计算错误

- 解析 x-codex-* 响应头获取正确的重置时间
- 7d 限制用尽时使用 codex_7d_reset_after_seconds
- 提取 Normalize() 方法统一窗口规范化逻辑

											
										
										
											2026-01-25 13:32:08 +08:00
-												fix(codex): 修复额度窗口过期展示并补齐高覆盖测试

- 后端新增绝对重置时间字段计算（codex_5h_reset_at/codex_7d_reset_at）

- 前端统一窗口解析逻辑：绝对时间优先，updated_at+seconds 回退，过期自动归零

- 新增后端与前端单元测试，覆盖关键边界与异常场景

											
										
										
											2026-02-22 21:04:52 +08:00
+									// 保存原始 primary/secondary 字段，便于排查问题
-												feat: OpenAI OAuth账号显示Codex使用量

从响应头提取x-codex-*使用量信息并保存到账号Extra字段，
前端账号列表展示5h/7d窗口的使用进度条。

											
										
										
											2025-12-23 16:26:07 +08:00
+									if snapshot.PrimaryUsedPercent != nil {
 										updates["codex_primary_used_percent"] = *snapshot.PrimaryUsedPercent
 									}
 									if snapshot.PrimaryResetAfterSeconds != nil {
 										updates["codex_primary_reset_after_seconds"] = *snapshot.PrimaryResetAfterSeconds
 									}
 									if snapshot.PrimaryWindowMinutes != nil {
 										updates["codex_primary_window_minutes"] = *snapshot.PrimaryWindowMinutes
 									}
 									if snapshot.SecondaryUsedPercent != nil {
 										updates["codex_secondary_used_percent"] = *snapshot.SecondaryUsedPercent
 									}
 									if snapshot.SecondaryResetAfterSeconds != nil {
 										updates["codex_secondary_reset_after_seconds"] = *snapshot.SecondaryResetAfterSeconds
 									}
 									if snapshot.SecondaryWindowMinutes != nil {
 										updates["codex_secondary_window_minutes"] = *snapshot.SecondaryWindowMinutes
 									}
 									if snapshot.PrimaryOverSecondaryPercent != nil {
 										updates["codex_primary_over_secondary_percent"] = *snapshot.PrimaryOverSecondaryPercent
 									}
-												fix(codex): 修复额度窗口过期展示并补齐高覆盖测试

- 后端新增绝对重置时间字段计算（codex_5h_reset_at/codex_7d_reset_at）

- 前端统一窗口解析逻辑：绝对时间优先，updated_at+seconds 回退，过期自动归零

- 新增后端与前端单元测试，覆盖关键边界与异常场景

											
										
										
											2026-02-22 21:04:52 +08:00
+									updates["codex_usage_updated_at"] = baseTime.Format(time.RFC3339)
-												feat: OpenAI OAuth账号显示Codex使用量

从响应头提取x-codex-*使用量信息并保存到账号Extra字段，
前端账号列表展示5h/7d窗口的使用进度条。

											
										
										
											2025-12-23 16:26:07 +08:00
-												fix(codex): 修复额度窗口过期展示并补齐高覆盖测试

- 后端新增绝对重置时间字段计算（codex_5h_reset_at/codex_7d_reset_at）

- 前端统一窗口解析逻辑：绝对时间优先，updated_at+seconds 回退，过期自动归零

- 新增后端与前端单元测试，覆盖关键边界与异常场景

											
										
										
											2026-02-22 21:04:52 +08:00
+									// 归一化到 5h/7d 规范字段
-												fix(ratelimit): 修复 OpenAI 账号限流倒计时计算错误

- 解析 x-codex-* 响应头获取正确的重置时间
- 7d 限制用尽时使用 codex_7d_reset_after_seconds
- 提取 Normalize() 方法统一窗口规范化逻辑

											
										
										
											2026-01-25 13:32:08 +08:00
+									if normalized := snapshot.Normalize(); normalized != nil {
 										if normalized.Used5hPercent != nil {
 											updates["codex_5h_used_percent"] = *normalized.Used5hPercent
-												fix: 修复 OpenAI 账号 5h/7d 使用限制显示错误的问题 (#30)

* fix: 修复 OpenAI 账号 5h/7d 使用限制显示错误的问题

问题描述:
- 账号管理页面中,OpenAI OAuth 账号的 5h 列显示 7 天的剩余时间
- 7d 列却显示几小时的剩余时间
- 根本原因: OpenAI 响应头中 primary/secondary 的实际含义与代码假设相反

修复方案:
1. 后端归一化 (openai_gateway_service.go):
   - 根据 window_minutes 动态判断哪个是 5h/7d 限制
   - 新增规范字段 codex_5h_* 和 codex_7d_*
   - 保留旧字段以兼容性

2. 前端适配 (AccountUsageCell.vue):
   - 优先使用新的规范字段
   - Fallback 到旧字段时基于 window_minutes 动态判断
   - 更新 computed 属性命名

3. 类型定义更新 (types/index.ts):
   - 添加新的规范字段定义
   - 更新注释说明实际语义由 window_minutes 决定

🤖 Generated with Claude Code and Codex collaboration

Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com>
Co-Authored-By: OpenAI Codex <noreply@openai.com>

* fix: 改进窗口判断逻辑，修复两个窗口都小于阈值时的bug

问题：
当两个窗口都小于360分钟时（如 primary=180分钟，secondary=300分钟），
之前的逻辑会导致：
- primary5h = true, secondary5h = true
- 5h 字段会使用 primary（错误）
- 7d 字段没有数据（bug）

修复方案：
改用比较策略：
1. 当两个窗口都存在时：较小的分配给5h，较大的分配给7d
2. 当只有一个窗口时：根据大小（<=360分钟）判断是5h还是7d
3. 确保数据不会丢失，逻辑更健壮

示例：
- Primary: 180分钟, Secondary: 300分钟
  → 5h 使用 Primary(180分钟), 7d 使用 Secondary(300分钟) ✓

🤖 Generated with Claude Code

Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com>

* fix: 修正窗口大小判断逻辑 - 不能用剩余时间判断窗口类型

**严重bug修复：**
之前的 fallback 逻辑错误地使用 reset_after_seconds 来判断窗口大小。

问题示例：
- 周限制（7d）剩余 2h → reset_after_seconds = 7200秒
- 5h限制 剩余 4h → reset_after_seconds = 14400秒
- 错误逻辑：7200/60 < 14400/60，把周限制当成5h ❌

根本问题：
- window_minutes = 窗口的总大小（300 or 10080）
- reset_after_seconds = 距离重置的剩余时间（变化的）
- 不能用剩余时间来判断窗口类型！

修复方案：
1. **只使用 window_minutes** 来判断窗口大小
2. 移除错误的 reset_after_seconds fallback
3. 如果 window_minutes 都不存在，使用传统假设
4. 添加详细注释说明这个陷阱

🤖 Generated with Claude Code

Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com>

* fix: 修复 lint 问题 - 改进 fallback 逻辑的变量赋值

问题：
第882-883行的简单布尔赋值可能触发 ineffassign 或 staticcheck 警告：
  use5hFromSecondary = snapshot.SecondaryUsedPercent != nil
  use7dFromPrimary = snapshot.PrimaryUsedPercent != nil

修复：
改用明确的 if 语句检查任意字段是否存在，更符合代码意图：
- 如果 secondary 的任意字段存在，将其视为 5h
- 如果 primary 的任意字段存在，将其视为 7d

这样逻辑更清晰，也避免了 lint 警告。

---------

Co-authored-by: Claude Sonnet 4.5 <noreply@anthropic.com>
Co-authored-by: OpenAI Codex <noreply@openai.com>
											
										
										
											2025-12-25 17:00:02 +08:00
+										}
-												fix(ratelimit): 修复 OpenAI 账号限流倒计时计算错误

- 解析 x-codex-* 响应头获取正确的重置时间
- 7d 限制用尽时使用 codex_7d_reset_after_seconds
- 提取 Normalize() 方法统一窗口规范化逻辑

											
										
										
											2026-01-25 13:32:08 +08:00
+										if normalized.Reset5hSeconds != nil {
 											updates["codex_5h_reset_after_seconds"] = *normalized.Reset5hSeconds
-												fix: 修复 OpenAI 账号 5h/7d 使用限制显示错误的问题 (#30)

* fix: 修复 OpenAI 账号 5h/7d 使用限制显示错误的问题

问题描述:
- 账号管理页面中,OpenAI OAuth 账号的 5h 列显示 7 天的剩余时间
- 7d 列却显示几小时的剩余时间
- 根本原因: OpenAI 响应头中 primary/secondary 的实际含义与代码假设相反

修复方案:
1. 后端归一化 (openai_gateway_service.go):
   - 根据 window_minutes 动态判断哪个是 5h/7d 限制
   - 新增规范字段 codex_5h_* 和 codex_7d_*
   - 保留旧字段以兼容性

2. 前端适配 (AccountUsageCell.vue):
   - 优先使用新的规范字段
   - Fallback 到旧字段时基于 window_minutes 动态判断
   - 更新 computed 属性命名

3. 类型定义更新 (types/index.ts):
   - 添加新的规范字段定义
   - 更新注释说明实际语义由 window_minutes 决定

🤖 Generated with Claude Code and Codex collaboration

Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com>
Co-Authored-By: OpenAI Codex <noreply@openai.com>

* fix: 改进窗口判断逻辑，修复两个窗口都小于阈值时的bug

问题：
当两个窗口都小于360分钟时（如 primary=180分钟，secondary=300分钟），
之前的逻辑会导致：
- primary5h = true, secondary5h = true
- 5h 字段会使用 primary（错误）
- 7d 字段没有数据（bug）

修复方案：
改用比较策略：
1. 当两个窗口都存在时：较小的分配给5h，较大的分配给7d
2. 当只有一个窗口时：根据大小（<=360分钟）判断是5h还是7d
3. 确保数据不会丢失，逻辑更健壮

示例：
- Primary: 180分钟, Secondary: 300分钟
  → 5h 使用 Primary(180分钟), 7d 使用 Secondary(300分钟) ✓

🤖 Generated with Claude Code

Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com>

* fix: 修正窗口大小判断逻辑 - 不能用剩余时间判断窗口类型

**严重bug修复：**
之前的 fallback 逻辑错误地使用 reset_after_seconds 来判断窗口大小。

问题示例：
- 周限制（7d）剩余 2h → reset_after_seconds = 7200秒
- 5h限制 剩余 4h → reset_after_seconds = 14400秒
- 错误逻辑：7200/60 < 14400/60，把周限制当成5h ❌

根本问题：
- window_minutes = 窗口的总大小（300 or 10080）
- reset_after_seconds = 距离重置的剩余时间（变化的）
- 不能用剩余时间来判断窗口类型！

修复方案：
1. **只使用 window_minutes** 来判断窗口大小
2. 移除错误的 reset_after_seconds fallback
3. 如果 window_minutes 都不存在，使用传统假设
4. 添加详细注释说明这个陷阱

🤖 Generated with Claude Code

Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com>

* fix: 修复 lint 问题 - 改进 fallback 逻辑的变量赋值

问题：
第882-883行的简单布尔赋值可能触发 ineffassign 或 staticcheck 警告：
  use5hFromSecondary = snapshot.SecondaryUsedPercent != nil
  use7dFromPrimary = snapshot.PrimaryUsedPercent != nil

修复：
改用明确的 if 语句检查任意字段是否存在，更符合代码意图：
- 如果 secondary 的任意字段存在，将其视为 5h
- 如果 primary 的任意字段存在，将其视为 7d

这样逻辑更清晰，也避免了 lint 警告。

---------

Co-authored-by: Claude Sonnet 4.5 <noreply@anthropic.com>
Co-authored-by: OpenAI Codex <noreply@openai.com>
											
										
										
											2025-12-25 17:00:02 +08:00
+										}
-												fix(ratelimit): 修复 OpenAI 账号限流倒计时计算错误

- 解析 x-codex-* 响应头获取正确的重置时间
- 7d 限制用尽时使用 codex_7d_reset_after_seconds
- 提取 Normalize() 方法统一窗口规范化逻辑

											
										
										
											2026-01-25 13:32:08 +08:00
+										if normalized.Window5hMinutes != nil {
 											updates["codex_5h_window_minutes"] = *normalized.Window5hMinutes
-												fix: 修复 OpenAI 账号 5h/7d 使用限制显示错误的问题 (#30)

* fix: 修复 OpenAI 账号 5h/7d 使用限制显示错误的问题

问题描述:
- 账号管理页面中,OpenAI OAuth 账号的 5h 列显示 7 天的剩余时间
- 7d 列却显示几小时的剩余时间
- 根本原因: OpenAI 响应头中 primary/secondary 的实际含义与代码假设相反

修复方案:
1. 后端归一化 (openai_gateway_service.go):
   - 根据 window_minutes 动态判断哪个是 5h/7d 限制
   - 新增规范字段 codex_5h_* 和 codex_7d_*
   - 保留旧字段以兼容性

2. 前端适配 (AccountUsageCell.vue):
   - 优先使用新的规范字段
   - Fallback 到旧字段时基于 window_minutes 动态判断
   - 更新 computed 属性命名

3. 类型定义更新 (types/index.ts):
   - 添加新的规范字段定义
   - 更新注释说明实际语义由 window_minutes 决定

🤖 Generated with Claude Code and Codex collaboration

Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com>
Co-Authored-By: OpenAI Codex <noreply@openai.com>

* fix: 改进窗口判断逻辑，修复两个窗口都小于阈值时的bug

问题：
当两个窗口都小于360分钟时（如 primary=180分钟，secondary=300分钟），
之前的逻辑会导致：
- primary5h = true, secondary5h = true
- 5h 字段会使用 primary（错误）
- 7d 字段没有数据（bug）

修复方案：
改用比较策略：
1. 当两个窗口都存在时：较小的分配给5h，较大的分配给7d
2. 当只有一个窗口时：根据大小（<=360分钟）判断是5h还是7d
3. 确保数据不会丢失，逻辑更健壮

示例：
- Primary: 180分钟, Secondary: 300分钟
  → 5h 使用 Primary(180分钟), 7d 使用 Secondary(300分钟) ✓

🤖 Generated with Claude Code

Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com>

* fix: 修正窗口大小判断逻辑 - 不能用剩余时间判断窗口类型

**严重bug修复：**
之前的 fallback 逻辑错误地使用 reset_after_seconds 来判断窗口大小。

问题示例：
- 周限制（7d）剩余 2h → reset_after_seconds = 7200秒
- 5h限制 剩余 4h → reset_after_seconds = 14400秒
- 错误逻辑：7200/60 < 14400/60，把周限制当成5h ❌

根本问题：
- window_minutes = 窗口的总大小（300 or 10080）
- reset_after_seconds = 距离重置的剩余时间（变化的）
- 不能用剩余时间来判断窗口类型！

修复方案：
1. **只使用 window_minutes** 来判断窗口大小
2. 移除错误的 reset_after_seconds fallback
3. 如果 window_minutes 都不存在，使用传统假设
4. 添加详细注释说明这个陷阱

🤖 Generated with Claude Code

Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com>

* fix: 修复 lint 问题 - 改进 fallback 逻辑的变量赋值

问题：
第882-883行的简单布尔赋值可能触发 ineffassign 或 staticcheck 警告：
  use5hFromSecondary = snapshot.SecondaryUsedPercent != nil
  use7dFromPrimary = snapshot.PrimaryUsedPercent != nil

修复：
改用明确的 if 语句检查任意字段是否存在，更符合代码意图：
- 如果 secondary 的任意字段存在，将其视为 5h
- 如果 primary 的任意字段存在，将其视为 7d

这样逻辑更清晰，也避免了 lint 警告。

---------

Co-authored-by: Claude Sonnet 4.5 <noreply@anthropic.com>
Co-authored-by: OpenAI Codex <noreply@openai.com>
											
										
										
											2025-12-25 17:00:02 +08:00
+										}
-												fix(ratelimit): 修复 OpenAI 账号限流倒计时计算错误

- 解析 x-codex-* 响应头获取正确的重置时间
- 7d 限制用尽时使用 codex_7d_reset_after_seconds
- 提取 Normalize() 方法统一窗口规范化逻辑

											
										
										
											2026-01-25 13:32:08 +08:00
+										if normalized.Used7dPercent != nil {
 											updates["codex_7d_used_percent"] = *normalized.Used7dPercent
-												fix: 修复 OpenAI 账号 5h/7d 使用限制显示错误的问题 (#30)

* fix: 修复 OpenAI 账号 5h/7d 使用限制显示错误的问题

问题描述:
- 账号管理页面中,OpenAI OAuth 账号的 5h 列显示 7 天的剩余时间
- 7d 列却显示几小时的剩余时间
- 根本原因: OpenAI 响应头中 primary/secondary 的实际含义与代码假设相反

修复方案:
1. 后端归一化 (openai_gateway_service.go):
   - 根据 window_minutes 动态判断哪个是 5h/7d 限制
   - 新增规范字段 codex_5h_* 和 codex_7d_*
   - 保留旧字段以兼容性

2. 前端适配 (AccountUsageCell.vue):
   - 优先使用新的规范字段
   - Fallback 到旧字段时基于 window_minutes 动态判断
   - 更新 computed 属性命名

3. 类型定义更新 (types/index.ts):
   - 添加新的规范字段定义
   - 更新注释说明实际语义由 window_minutes 决定

🤖 Generated with Claude Code and Codex collaboration

Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com>
Co-Authored-By: OpenAI Codex <noreply@openai.com>

* fix: 改进窗口判断逻辑，修复两个窗口都小于阈值时的bug

问题：
当两个窗口都小于360分钟时（如 primary=180分钟，secondary=300分钟），
之前的逻辑会导致：
- primary5h = true, secondary5h = true
- 5h 字段会使用 primary（错误）
- 7d 字段没有数据（bug）

修复方案：
改用比较策略：
1. 当两个窗口都存在时：较小的分配给5h，较大的分配给7d
2. 当只有一个窗口时：根据大小（<=360分钟）判断是5h还是7d
3. 确保数据不会丢失，逻辑更健壮

示例：
- Primary: 180分钟, Secondary: 300分钟
  → 5h 使用 Primary(180分钟), 7d 使用 Secondary(300分钟) ✓

🤖 Generated with Claude Code

Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com>

* fix: 修正窗口大小判断逻辑 - 不能用剩余时间判断窗口类型

**严重bug修复：**
之前的 fallback 逻辑错误地使用 reset_after_seconds 来判断窗口大小。

问题示例：
- 周限制（7d）剩余 2h → reset_after_seconds = 7200秒
- 5h限制 剩余 4h → reset_after_seconds = 14400秒
- 错误逻辑：7200/60 < 14400/60，把周限制当成5h ❌

根本问题：
- window_minutes = 窗口的总大小（300 or 10080）
- reset_after_seconds = 距离重置的剩余时间（变化的）
- 不能用剩余时间来判断窗口类型！

修复方案：
1. **只使用 window_minutes** 来判断窗口大小
2. 移除错误的 reset_after_seconds fallback
3. 如果 window_minutes 都不存在，使用传统假设
4. 添加详细注释说明这个陷阱

🤖 Generated with Claude Code

Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com>

* fix: 修复 lint 问题 - 改进 fallback 逻辑的变量赋值

问题：
第882-883行的简单布尔赋值可能触发 ineffassign 或 staticcheck 警告：
  use5hFromSecondary = snapshot.SecondaryUsedPercent != nil
  use7dFromPrimary = snapshot.PrimaryUsedPercent != nil

修复：
改用明确的 if 语句检查任意字段是否存在，更符合代码意图：
- 如果 secondary 的任意字段存在，将其视为 5h
- 如果 primary 的任意字段存在，将其视为 7d

这样逻辑更清晰，也避免了 lint 警告。

---------

Co-authored-by: Claude Sonnet 4.5 <noreply@anthropic.com>
Co-authored-by: OpenAI Codex <noreply@openai.com>
											
										
										
											2025-12-25 17:00:02 +08:00
+										}
-												fix(ratelimit): 修复 OpenAI 账号限流倒计时计算错误

- 解析 x-codex-* 响应头获取正确的重置时间
- 7d 限制用尽时使用 codex_7d_reset_after_seconds
- 提取 Normalize() 方法统一窗口规范化逻辑

											
										
										
											2026-01-25 13:32:08 +08:00
+										if normalized.Reset7dSeconds != nil {
 											updates["codex_7d_reset_after_seconds"] = *normalized.Reset7dSeconds
-												fix: 修复 OpenAI 账号 5h/7d 使用限制显示错误的问题 (#30)

* fix: 修复 OpenAI 账号 5h/7d 使用限制显示错误的问题

问题描述:
- 账号管理页面中,OpenAI OAuth 账号的 5h 列显示 7 天的剩余时间
- 7d 列却显示几小时的剩余时间
- 根本原因: OpenAI 响应头中 primary/secondary 的实际含义与代码假设相反

修复方案:
1. 后端归一化 (openai_gateway_service.go):
   - 根据 window_minutes 动态判断哪个是 5h/7d 限制
   - 新增规范字段 codex_5h_* 和 codex_7d_*
   - 保留旧字段以兼容性

2. 前端适配 (AccountUsageCell.vue):
   - 优先使用新的规范字段
   - Fallback 到旧字段时基于 window_minutes 动态判断
   - 更新 computed 属性命名

3. 类型定义更新 (types/index.ts):
   - 添加新的规范字段定义
   - 更新注释说明实际语义由 window_minutes 决定

🤖 Generated with Claude Code and Codex collaboration

Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com>
Co-Authored-By: OpenAI Codex <noreply@openai.com>

* fix: 改进窗口判断逻辑，修复两个窗口都小于阈值时的bug

问题：
当两个窗口都小于360分钟时（如 primary=180分钟，secondary=300分钟），
之前的逻辑会导致：
- primary5h = true, secondary5h = true
- 5h 字段会使用 primary（错误）
- 7d 字段没有数据（bug）

修复方案：
改用比较策略：
1. 当两个窗口都存在时：较小的分配给5h，较大的分配给7d
2. 当只有一个窗口时：根据大小（<=360分钟）判断是5h还是7d
3. 确保数据不会丢失，逻辑更健壮

示例：
- Primary: 180分钟, Secondary: 300分钟
  → 5h 使用 Primary(180分钟), 7d 使用 Secondary(300分钟) ✓

🤖 Generated with Claude Code

Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com>

* fix: 修正窗口大小判断逻辑 - 不能用剩余时间判断窗口类型

**严重bug修复：**
之前的 fallback 逻辑错误地使用 reset_after_seconds 来判断窗口大小。

问题示例：
- 周限制（7d）剩余 2h → reset_after_seconds = 7200秒
- 5h限制 剩余 4h → reset_after_seconds = 14400秒
- 错误逻辑：7200/60 < 14400/60，把周限制当成5h ❌

根本问题：
- window_minutes = 窗口的总大小（300 or 10080）
- reset_after_seconds = 距离重置的剩余时间（变化的）
- 不能用剩余时间来判断窗口类型！

修复方案：
1. **只使用 window_minutes** 来判断窗口大小
2. 移除错误的 reset_after_seconds fallback
3. 如果 window_minutes 都不存在，使用传统假设
4. 添加详细注释说明这个陷阱

🤖 Generated with Claude Code

Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com>

* fix: 修复 lint 问题 - 改进 fallback 逻辑的变量赋值

问题：
第882-883行的简单布尔赋值可能触发 ineffassign 或 staticcheck 警告：
  use5hFromSecondary = snapshot.SecondaryUsedPercent != nil
  use7dFromPrimary = snapshot.PrimaryUsedPercent != nil

修复：
改用明确的 if 语句检查任意字段是否存在，更符合代码意图：
- 如果 secondary 的任意字段存在，将其视为 5h
- 如果 primary 的任意字段存在，将其视为 7d

这样逻辑更清晰，也避免了 lint 警告。

---------

Co-authored-by: Claude Sonnet 4.5 <noreply@anthropic.com>
Co-authored-by: OpenAI Codex <noreply@openai.com>
											
										
										
											2025-12-25 17:00:02 +08:00
+										}
-												fix(ratelimit): 修复 OpenAI 账号限流倒计时计算错误

- 解析 x-codex-* 响应头获取正确的重置时间
- 7d 限制用尽时使用 codex_7d_reset_after_seconds
- 提取 Normalize() 方法统一窗口规范化逻辑

											
										
										
											2026-01-25 13:32:08 +08:00
+										if normalized.Window7dMinutes != nil {
 											updates["codex_7d_window_minutes"] = *normalized.Window7dMinutes
-												fix: 修复 OpenAI 账号 5h/7d 使用限制显示错误的问题 (#30)

* fix: 修复 OpenAI 账号 5h/7d 使用限制显示错误的问题

问题描述:
- 账号管理页面中,OpenAI OAuth 账号的 5h 列显示 7 天的剩余时间
- 7d 列却显示几小时的剩余时间
- 根本原因: OpenAI 响应头中 primary/secondary 的实际含义与代码假设相反

修复方案:
1. 后端归一化 (openai_gateway_service.go):
   - 根据 window_minutes 动态判断哪个是 5h/7d 限制
   - 新增规范字段 codex_5h_* 和 codex_7d_*
   - 保留旧字段以兼容性

2. 前端适配 (AccountUsageCell.vue):
   - 优先使用新的规范字段
   - Fallback 到旧字段时基于 window_minutes 动态判断
   - 更新 computed 属性命名

3. 类型定义更新 (types/index.ts):
   - 添加新的规范字段定义
   - 更新注释说明实际语义由 window_minutes 决定

🤖 Generated with Claude Code and Codex collaboration

Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com>
Co-Authored-By: OpenAI Codex <noreply@openai.com>

* fix: 改进窗口判断逻辑，修复两个窗口都小于阈值时的bug

问题：
当两个窗口都小于360分钟时（如 primary=180分钟，secondary=300分钟），
之前的逻辑会导致：
- primary5h = true, secondary5h = true
- 5h 字段会使用 primary（错误）
- 7d 字段没有数据（bug）

修复方案：
改用比较策略：
1. 当两个窗口都存在时：较小的分配给5h，较大的分配给7d
2. 当只有一个窗口时：根据大小（<=360分钟）判断是5h还是7d
3. 确保数据不会丢失，逻辑更健壮

示例：
- Primary: 180分钟, Secondary: 300分钟
  → 5h 使用 Primary(180分钟), 7d 使用 Secondary(300分钟) ✓

🤖 Generated with Claude Code

Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com>

* fix: 修正窗口大小判断逻辑 - 不能用剩余时间判断窗口类型

**严重bug修复：**
之前的 fallback 逻辑错误地使用 reset_after_seconds 来判断窗口大小。

问题示例：
- 周限制（7d）剩余 2h → reset_after_seconds = 7200秒
- 5h限制 剩余 4h → reset_after_seconds = 14400秒
- 错误逻辑：7200/60 < 14400/60，把周限制当成5h ❌

根本问题：
- window_minutes = 窗口的总大小（300 or 10080）
- reset_after_seconds = 距离重置的剩余时间（变化的）
- 不能用剩余时间来判断窗口类型！

修复方案：
1. **只使用 window_minutes** 来判断窗口大小
2. 移除错误的 reset_after_seconds fallback
3. 如果 window_minutes 都不存在，使用传统假设
4. 添加详细注释说明这个陷阱

🤖 Generated with Claude Code

Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com>

* fix: 修复 lint 问题 - 改进 fallback 逻辑的变量赋值

问题：
第882-883行的简单布尔赋值可能触发 ineffassign 或 staticcheck 警告：
  use5hFromSecondary = snapshot.SecondaryUsedPercent != nil
  use7dFromPrimary = snapshot.PrimaryUsedPercent != nil

修复：
改用明确的 if 语句检查任意字段是否存在，更符合代码意图：
- 如果 secondary 的任意字段存在，将其视为 5h
- 如果 primary 的任意字段存在，将其视为 7d

这样逻辑更清晰，也避免了 lint 警告。

---------

Co-authored-by: Claude Sonnet 4.5 <noreply@anthropic.com>
Co-authored-by: OpenAI Codex <noreply@openai.com>
											
										
										
											2025-12-25 17:00:02 +08:00
+										}
-												fix(codex): 修复额度窗口过期展示并补齐高覆盖测试

- 后端新增绝对重置时间字段计算（codex_5h_reset_at/codex_7d_reset_at）

- 前端统一窗口解析逻辑：绝对时间优先，updated_at+seconds 回退，过期自动归零

- 新增后端与前端单元测试，覆盖关键边界与异常场景

											
										
										
											2026-02-22 21:04:52 +08:00
+										if reset5hAt := codexResetAtRFC3339(baseTime, normalized.Reset5hSeconds); reset5hAt != nil {
 											updates["codex_5h_reset_at"] = *reset5hAt
 										}
 										if reset7dAt := codexResetAtRFC3339(baseTime, normalized.Reset7dSeconds); reset7dAt != nil {
 											updates["codex_7d_reset_at"] = *reset7dAt
 										}
 									}
 									return updates
 								}
 								// updateCodexUsageSnapshot saves the Codex usage snapshot to account's Extra field
 								func (s *OpenAIGatewayService) updateCodexUsageSnapshot(ctx context.Context, accountID int64, snapshot *OpenAICodexUsageSnapshot) {
 									if snapshot == nil {
 										return
 									}
 									if s == nil || s.accountRepo == nil {
 										return
 									}
-												fix: 修复 OpenAI WS 限流状态与调度同步

											
										
										
											2026-03-07 23:59:39 +08:00
+									now := time.Now()
 									updates := buildCodexUsageExtraUpdates(snapshot, now)
-												修复 OpenAI 账号限流回流误判：7d 窗口可用时不因 5h 窗口为 0 回写 429

											
										
										
											2026-04-15 15:29:52 +08:00
+									if len(updates) == 0 {
-												fix(codex): 修复额度窗口过期展示并补齐高覆盖测试

- 后端新增绝对重置时间字段计算（codex_5h_reset_at/codex_7d_reset_at）

- 前端统一窗口解析逻辑：绝对时间优先，updated_at+seconds 回退，过期自动归零

- 新增后端与前端单元测试，覆盖关键边界与异常场景

											
										
										
											2026-02-22 21:04:52 +08:00
+										return
-												fix: 修复 OpenAI 账号 5h/7d 使用限制显示错误的问题 (#30)

* fix: 修复 OpenAI 账号 5h/7d 使用限制显示错误的问题

问题描述:
- 账号管理页面中,OpenAI OAuth 账号的 5h 列显示 7 天的剩余时间
- 7d 列却显示几小时的剩余时间
- 根本原因: OpenAI 响应头中 primary/secondary 的实际含义与代码假设相反

修复方案:
1. 后端归一化 (openai_gateway_service.go):
   - 根据 window_minutes 动态判断哪个是 5h/7d 限制
   - 新增规范字段 codex_5h_* 和 codex_7d_*
   - 保留旧字段以兼容性

2. 前端适配 (AccountUsageCell.vue):
   - 优先使用新的规范字段
   - Fallback 到旧字段时基于 window_minutes 动态判断
   - 更新 computed 属性命名

3. 类型定义更新 (types/index.ts):
   - 添加新的规范字段定义
   - 更新注释说明实际语义由 window_minutes 决定

🤖 Generated with Claude Code and Codex collaboration

Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com>
Co-Authored-By: OpenAI Codex <noreply@openai.com>

* fix: 改进窗口判断逻辑，修复两个窗口都小于阈值时的bug

问题：
当两个窗口都小于360分钟时（如 primary=180分钟，secondary=300分钟），
之前的逻辑会导致：
- primary5h = true, secondary5h = true
- 5h 字段会使用 primary（错误）
- 7d 字段没有数据（bug）

修复方案：
改用比较策略：
1. 当两个窗口都存在时：较小的分配给5h，较大的分配给7d
2. 当只有一个窗口时：根据大小（<=360分钟）判断是5h还是7d
3. 确保数据不会丢失，逻辑更健壮

示例：
- Primary: 180分钟, Secondary: 300分钟
  → 5h 使用 Primary(180分钟), 7d 使用 Secondary(300分钟) ✓

🤖 Generated with Claude Code

Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com>

* fix: 修正窗口大小判断逻辑 - 不能用剩余时间判断窗口类型

**严重bug修复：**
之前的 fallback 逻辑错误地使用 reset_after_seconds 来判断窗口大小。

问题示例：
- 周限制（7d）剩余 2h → reset_after_seconds = 7200秒
- 5h限制 剩余 4h → reset_after_seconds = 14400秒
- 错误逻辑：7200/60 < 14400/60，把周限制当成5h ❌

根本问题：
- window_minutes = 窗口的总大小（300 or 10080）
- reset_after_seconds = 距离重置的剩余时间（变化的）
- 不能用剩余时间来判断窗口类型！

修复方案：
1. **只使用 window_minutes** 来判断窗口大小
2. 移除错误的 reset_after_seconds fallback
3. 如果 window_minutes 都不存在，使用传统假设
4. 添加详细注释说明这个陷阱

🤖 Generated with Claude Code

Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com>

* fix: 修复 lint 问题 - 改进 fallback 逻辑的变量赋值

问题：
第882-883行的简单布尔赋值可能触发 ineffassign 或 staticcheck 警告：
  use5hFromSecondary = snapshot.SecondaryUsedPercent != nil
  use7dFromPrimary = snapshot.PrimaryUsedPercent != nil

修复：
改用明确的 if 语句检查任意字段是否存在，更符合代码意图：
- 如果 secondary 的任意字段存在，将其视为 5h
- 如果 primary 的任意字段存在，将其视为 7d

这样逻辑更清晰，也避免了 lint 警告。

---------

Co-authored-by: Claude Sonnet 4.5 <noreply@anthropic.com>
Co-authored-by: OpenAI Codex <noreply@openai.com>
											
										
										
											2025-12-25 17:00:02 +08:00
+									}
-												修复 OpenAI 账号限流回流误判：7d 窗口可用时不因 5h 窗口为 0 回写 429

											
										
										
											2026-04-15 15:29:52 +08:00
+									if !s.getCodexSnapshotThrottle().Allow(accountID, now) {
-												Fix Codex exhausted snapshot propagation

											
										
										
											2026-03-11 15:47:39 +08:00
+										return
 									}
-												fix: 修复 OpenAI 账号 5h/7d 使用限制显示错误的问题 (#30)

* fix: 修复 OpenAI 账号 5h/7d 使用限制显示错误的问题

问题描述:
- 账号管理页面中,OpenAI OAuth 账号的 5h 列显示 7 天的剩余时间
- 7d 列却显示几小时的剩余时间
- 根本原因: OpenAI 响应头中 primary/secondary 的实际含义与代码假设相反

修复方案:
1. 后端归一化 (openai_gateway_service.go):
   - 根据 window_minutes 动态判断哪个是 5h/7d 限制
   - 新增规范字段 codex_5h_* 和 codex_7d_*
   - 保留旧字段以兼容性

2. 前端适配 (AccountUsageCell.vue):
   - 优先使用新的规范字段
   - Fallback 到旧字段时基于 window_minutes 动态判断
   - 更新 computed 属性命名

3. 类型定义更新 (types/index.ts):
   - 添加新的规范字段定义
   - 更新注释说明实际语义由 window_minutes 决定

🤖 Generated with Claude Code and Codex collaboration

Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com>
Co-Authored-By: OpenAI Codex <noreply@openai.com>

* fix: 改进窗口判断逻辑，修复两个窗口都小于阈值时的bug

问题：
当两个窗口都小于360分钟时（如 primary=180分钟，secondary=300分钟），
之前的逻辑会导致：
- primary5h = true, secondary5h = true
- 5h 字段会使用 primary（错误）
- 7d 字段没有数据（bug）

修复方案：
改用比较策略：
1. 当两个窗口都存在时：较小的分配给5h，较大的分配给7d
2. 当只有一个窗口时：根据大小（<=360分钟）判断是5h还是7d
3. 确保数据不会丢失，逻辑更健壮

示例：
- Primary: 180分钟, Secondary: 300分钟
  → 5h 使用 Primary(180分钟), 7d 使用 Secondary(300分钟) ✓

🤖 Generated with Claude Code

Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com>

* fix: 修正窗口大小判断逻辑 - 不能用剩余时间判断窗口类型

**严重bug修复：**
之前的 fallback 逻辑错误地使用 reset_after_seconds 来判断窗口大小。

问题示例：
- 周限制（7d）剩余 2h → reset_after_seconds = 7200秒
- 5h限制 剩余 4h → reset_after_seconds = 14400秒
- 错误逻辑：7200/60 < 14400/60，把周限制当成5h ❌

根本问题：
- window_minutes = 窗口的总大小（300 or 10080）
- reset_after_seconds = 距离重置的剩余时间（变化的）
- 不能用剩余时间来判断窗口类型！

修复方案：
1. **只使用 window_minutes** 来判断窗口大小
2. 移除错误的 reset_after_seconds fallback
3. 如果 window_minutes 都不存在，使用传统假设
4. 添加详细注释说明这个陷阱

🤖 Generated with Claude Code

Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com>

* fix: 修复 lint 问题 - 改进 fallback 逻辑的变量赋值

问题：
第882-883行的简单布尔赋值可能触发 ineffassign 或 staticcheck 警告：
  use5hFromSecondary = snapshot.SecondaryUsedPercent != nil
  use7dFromPrimary = snapshot.PrimaryUsedPercent != nil

修复：
改用明确的 if 语句检查任意字段是否存在，更符合代码意图：
- 如果 secondary 的任意字段存在，将其视为 5h
- 如果 primary 的任意字段存在，将其视为 7d

这样逻辑更清晰，也避免了 lint 警告。

---------

Co-authored-by: Claude Sonnet 4.5 <noreply@anthropic.com>
Co-authored-by: OpenAI Codex <noreply@openai.com>
											
										
										
											2025-12-25 17:00:02 +08:00
-												feat: OpenAI OAuth账号显示Codex使用量

从响应头提取x-codex-*使用量信息并保存到账号Extra字段，
前端账号列表展示5h/7d窗口的使用进度条。

											
										
										
											2025-12-23 16:26:07 +08:00
+									go func() {
 										updateCtx, cancel := context.WithTimeout(context.Background(), 5*time.Second)
 										defer cancel()
-												修复 OpenAI 账号限流回流误判：7d 窗口可用时不因 5h 窗口为 0 回写 429

											
										
										
											2026-04-15 15:29:52 +08:00
+										_ = s.accountRepo.UpdateExtra(updateCtx, accountID, updates)
-												feat: OpenAI OAuth账号显示Codex使用量

从响应头提取x-codex-*使用量信息并保存到账号Extra字段，
前端账号列表展示5h/7d窗口的使用进度条。

											
										
										
											2025-12-23 16:26:07 +08:00
+									}()
 								}
-												feat(usage): add reasoning effort column

											
										
										
											2026-02-03 14:36:29 +08:00
-												fix(openai): restore ws usage window display

											
										
										
											2026-03-06 20:46:10 +08:00
+								func (s *OpenAIGatewayService) UpdateCodexUsageSnapshotFromHeaders(ctx context.Context, accountID int64, headers http.Header) {
 									if accountID <= 0 || headers == nil {
 										return
 									}
 									if snapshot := ParseCodexRateLimitHeaders(headers); snapshot != nil {
 										s.updateCodexUsageSnapshot(ctx, accountID, snapshot)
 									}
 								}
-												feat(usage): add reasoning effort column

											
										
										
											2026-02-03 14:36:29 +08:00
+								func getOpenAIReasoningEffortFromReqBody(reqBody map[string]any) (value string, present bool) {
 									if reqBody == nil {
 										return "", false
 									}
 									// Primary: reasoning.effort
 									if reasoning, ok := reqBody["reasoning"].(map[string]any); ok {
 										if effort, ok := reasoning["effort"].(string); ok {
 											return normalizeOpenAIReasoningEffort(effort), true
 										}
 									}
 									// Fallback: some clients may use a flat field.
 									if effort, ok := reqBody["reasoning_effort"].(string); ok {
 										return normalizeOpenAIReasoningEffort(effort), true
 									}
 									return "", false
 								}
 								// deriveOpenAIReasoningEffortFromModel guesses a reasoning effort from the
 								// model name. It keeps only the text after the last "/", lowercases it,
 								// splits on '-', '_' and ' ', and passes the final token through
 								// normalizeOpenAIReasoningEffort. A blank model, or a name with no tokens,
 								// yields "".
 								func deriveOpenAIReasoningEffortFromModel(model string) string {
 									name := strings.TrimSpace(model)
 									if name == "" {
 										return ""
 									}
 									// Drop any "vendor/" style prefix: only the last path segment matters.
 									if slash := strings.LastIndex(name, "/"); slash >= 0 {
 										name = name[slash+1:]
 									}
 									isSeparator := func(r rune) bool {
 										return r == '-' || r == '_' || r == ' '
 									}
 									tokens := strings.FieldsFunc(strings.ToLower(name), isSeparator)
 									if len(tokens) == 0 {
 										return ""
 									}
 									suffix := tokens[len(tokens)-1]
 									return normalizeOpenAIReasoningEffort(suffix)
 								}
-												feat(openai): 极致优化 OAuth 链路并补齐性能守护

- 优化 /v1/responses 热路径，减少重复解析与不必要拷贝\n- 优化并发与 token 竞争路径并补齐运行指标\n- 补充 OpenAI/Ops 相关单元测试与回归用例\n- 新增灰度阈值守护与压测脚本，支撑发布验收

											
										
										
											2026-02-12 09:41:37 +08:00
+								func extractOpenAIRequestMetaFromBody(body []byte) (model string, stream bool, promptCacheKey string) {
 									if len(body) == 0 {
 										return "", false, ""
 									}
 									model = strings.TrimSpace(gjson.GetBytes(body, "model").String())
 									stream = gjson.GetBytes(body, "stream").Bool()
 									promptCacheKey = strings.TrimSpace(gjson.GetBytes(body, "prompt_cache_key").String())
 									return model, stream, promptCacheKey
 								}
-												fix(openai): 透传OAuth强制store/stream并修复Codex识别

											
										
										
											2026-02-12 21:02:52 +08:00
+								// normalizeOpenAIPassthroughOAuthBody 将透传 OAuth 请求体收敛为旧链路关键行为：
-												fix(openai): support remote compact task

											
										
										
											2026-03-06 18:50:28 +08:00
 								// 1) non-compact: force store=false and stream=true  2) compact: remove both the store and stream fields
 								func normalizeOpenAIPassthroughOAuthBody(body []byte, compact bool) ([]byte, bool, error) {
-												fix(openai): 透传OAuth强制store/stream并修复Codex识别

											
										
										
											2026-02-12 21:02:52 +08:00
+									if len(body) == 0 {
 										return body, false, nil
 									}
 									normalized := body
 									changed := false
-												fix(openai): support remote compact task

											
										
										
											2026-03-06 18:50:28 +08:00
+									if compact {
 										if store := gjson.GetBytes(normalized, "store"); store.Exists() {
 											next, err := sjson.DeleteBytes(normalized, "store")
 											if err != nil {
 												return body, false, fmt.Errorf("normalize passthrough body delete store: %w", err)
 											}
 											normalized = next
 											changed = true
-												fix(openai): 透传OAuth强制store/stream并修复Codex识别

											
										
										
											2026-02-12 21:02:52 +08:00
+										}
-												fix(openai): support remote compact task

											
										
										
											2026-03-06 18:50:28 +08:00
+										if stream := gjson.GetBytes(normalized, "stream"); stream.Exists() {
 											next, err := sjson.DeleteBytes(normalized, "stream")
 											if err != nil {
 												return body, false, fmt.Errorf("normalize passthrough body delete stream: %w", err)
 											}
 											normalized = next
 											changed = true
 										}
 									} else {
 										if store := gjson.GetBytes(normalized, "store"); !store.Exists() || store.Type != gjson.False {
 											next, err := sjson.SetBytes(normalized, "store", false)
 											if err != nil {
 												return body, false, fmt.Errorf("normalize passthrough body store=false: %w", err)
 											}
 											normalized = next
 											changed = true
 										}
 										if stream := gjson.GetBytes(normalized, "stream"); !stream.Exists() || stream.Type != gjson.True {
 											next, err := sjson.SetBytes(normalized, "stream", true)
 											if err != nil {
 												return body, false, fmt.Errorf("normalize passthrough body stream=true: %w", err)
 											}
 											normalized = next
 											changed = true
-												fix(openai): 透传OAuth强制store/stream并修复Codex识别

											
										
										
											2026-02-12 21:02:52 +08:00
+										}
 									}
 									return normalized, changed, nil
 								}
-												feat(backend): 提交后端审计修复与配套测试改动

											
										
										
											2026-02-14 11:23:10 +08:00
+								func detectOpenAIPassthroughInstructionsRejectReason(reqModel string, body []byte) string {
 									model := strings.ToLower(strings.TrimSpace(reqModel))
 									if !strings.Contains(model, "codex") {
 										return ""
 									}
 									instructions := gjson.GetBytes(body, "instructions")
 									if !instructions.Exists() {
 										return "instructions_missing"
 									}
 									if instructions.Type != gjson.String {
 										return "instructions_not_string"
 									}
 									if strings.TrimSpace(instructions.String()) == "" {
 										return "instructions_empty"
 									}
 									return ""
 								}
-												feat(openai): 极致优化 OAuth 链路并补齐性能守护

- 优化 /v1/responses 热路径，减少重复解析与不必要拷贝\n- 优化并发与 token 竞争路径并补齐运行指标\n- 补充 OpenAI/Ops 相关单元测试与回归用例\n- 新增灰度阈值守护与压测脚本，支撑发布验收

											
										
										
											2026-02-12 09:41:37 +08:00
+								func extractOpenAIReasoningEffortFromBody(body []byte, requestedModel string) *string {
 									reasoningEffort := strings.TrimSpace(gjson.GetBytes(body, "reasoning.effort").String())
 									if reasoningEffort == "" {
 										reasoningEffort = strings.TrimSpace(gjson.GetBytes(body, "reasoning_effort").String())
 									}
 									if reasoningEffort != "" {
 										normalized := normalizeOpenAIReasoningEffort(reasoningEffort)
 										if normalized == "" {
 											return nil
 										}
 										return &normalized
 									}
 									value := deriveOpenAIReasoningEffortFromModel(requestedModel)
 									if value == "" {
 										return nil
 									}
 									return &value
 								}
-												fix(billing): 修复 OpenAI fast 档位计费并补齐展示

- 打通 service_tier 在 OpenAI HTTP、WS、passthrough 与 usage 记录中的传递
- 修正 priority/flex 计费逻辑，并将 fast 归一化为 priority
- 在用户端和管理端补齐服务档位与计费明细展示
- 补齐前后端测试，并修复 WS 限流信号重复持久化导致的全量回归失败

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-03-08 23:22:28 +08:00
+								func extractOpenAIServiceTier(reqBody map[string]any) *string {
 									if reqBody == nil {
 										return nil
 									}
 									raw, ok := reqBody["service_tier"].(string)
 									if !ok {
 										return nil
 									}
 									return normalizeOpenAIServiceTier(raw)
 								}
 								func extractOpenAIServiceTierFromBody(body []byte) *string {
 									if len(body) == 0 {
 										return nil
 									}
 									return normalizeOpenAIServiceTier(gjson.GetBytes(body, "service_tier").String())
 								}
 								func normalizeOpenAIServiceTier(raw string) *string {
 									value := strings.ToLower(strings.TrimSpace(raw))
 									if value == "" {
 										return nil
 									}
 									if value == "fast" {
 										value = "priority"
 									}
-												feat(openai): OpenAI Fast/Flex Policy 完整实现（HTTP + WebSocket + Admin）

对称参照 Claude BetaPolicy 的 fast-mode 过滤实现，新增针对 OpenAI 上游
service_tier 字段（priority / flex，含客户端 "fast" → "priority" 归一化）的
pass / filter / block 三态策略，覆盖全部 OpenAI 入口 + admin 配置入口。

后端核心
- 新增 SettingKeyOpenAIFastPolicySettings、OpenAIFastPolicyRule、
  OpenAIFastPolicySettings 配置模型，含规则的 service_tier × action × scope
  × 模型白名单 × fallback action 维度。
- SettingService.Get/SetOpenAIFastPolicySettings；缺失时返回内置默认策略
  （所有模型的 priority 走 filter，whitelist 为空，fallback=pass）。设计
  依据：service_tier=fast 是用户级开关，与 model 字段正交，默认锁定特定
  model slug 会留下"用 gpt-4 + fast 透传 priority 上游"的绕过路径。JSON
  解析失败不再静默 fallback，slog.Warn 记录脏数据，便于运维定位。
- service_tier 归一化（trim + ToLower + fast→priority + 白名单 priority/flex）
  与策略评估（evaluateOpenAIFastPolicy）作为唯一真实来源，HTTP / WS 共用。
  抽出纯函数 evaluateOpenAIFastPolicyWithSettings，配合 ctx-bound settings
  快照（withOpenAIFastPolicyContext / openAIFastPolicySettingsFromContext），
  WS 长会话入口预取一次后所有帧复用，避免每帧打到 settingService。

HTTP 入口（4 个）
- Chat Completions、Anthropic 兼容（Messages，含 BetaFastMode→priority 二次
  命中）、原生 Responses、Passthrough Responses 全部接入
  applyOpenAIFastPolicyToBody，filter 走 sjson 顶层删除 service_tier，block
  返回 403 forbidden_error JSON。
- 4 入口统一使用 upstream 视角的 model（GetMappedModel +
  normalizeOpenAIModelForUpstream + Codex OAuth normalize 后的 slug），
  避免 chat/messages/native /responses/passthrough 因为 model 维度不同
  造成 whitelist 命中差异。
- 在 pass 路径也把客户端 "fast" 别名归一化为 "priority" 写回 body，
  否则 native /responses 与 passthrough 入口会把 "fast" 原样透传给上游
  导致 400/拒绝（chat-completions 入口的 normalizeResponsesBodyServiceTier
  此前已具备同等行为）。

WebSocket 入口
- 新增 applyOpenAIFastPolicyToWSResponseCreate：严格匹配
  type="response.create"，仅处理顶层 service_tier；filter 用 sjson 删字段，
  block 返回 typed *OpenAIFastBlockedError。
- ingress 路径在 parseClientPayload 内调用，block 命中先 Write Realtime
  风格 error event 再返回 OpenAIWSClientCloseError(StatusPolicyViolation
  =1008)，依赖底层 WebSocket Conn.Write 的同步 flush 保证 error 先于
  close。
- passthrough 路径在 RunEntry 前对 firstClientMessage 应用策略，并通过
  openAIWSPolicyEnforcingFrameConn 包装 ReadFrame 对每个 client→upstream
  帧执行策略；后续帧无 model 字段时回退到 capturedSessionModel。
  filter 闭包内同时侦测 session.update / session.created 帧的 session.model
  字段刷新 capturedSessionModel，封堵"首帧 model=gpt-4o（pass）→
  session.update 改为 gpt-5.5 → 不带 model 的 response.create fallback
  到 gpt-4o"的 mid-session 绕过路径。
- passthrough billing：requestServiceTier 在策略 filter 之后再从
  firstClientMessage 提取，filter 命中时 OpenAIForwardResult.ServiceTier
  上报 nil（default tier），与 HTTP 入口（reqBody 来自 post-filter map）
  / WS ingress（payload 来自 post-filter bytes）的语义一致。
- 错误事件 schema：{event_id: "evt_<32hex>", type: "error",
  error: {type: "forbidden_error", code: "policy_violation", message}}，
  与 OpenAI codex 客户端 error event 解析兼容。

Admin / Frontend
- dto.SystemSettings / UpdateSettingsRequest 新增
  openai_fast_policy_settings 字段（omitempty），bulk GET/PUT 接入。
- Settings 页 Gateway 页签新增 Fast/Flex Policy 表单卡片：
  service_tier × action × scope × 模型白名单 × fallback action 全字段配置。
- 前端守门：openaiFastPolicyLoaded 标志仅在 GET 真带回字段时才允许回写，
  避免 rollout/错误把默认规则覆盖成空；saveSettings 回写循环 skip 该字段，
  由专用刷新逻辑处理；仅 action=block 时发送 error_message，匹配后端
  omitempty 行为。

测试
- HTTP 路径：openai_fast_policy_test.go 覆盖默认配置（whitelist=[]，所有
  模型 priority filter）/ block 自定义错误 / scope 区分 / filter 删字段 /
  block 不改 body / block 短路上游 / Anthropic BetaFastMode 触发 OpenAI
  fast policy 等场景。
- WebSocket 路径：openai_fast_policy_ws_test.go 覆盖
    helper 单元（filter / fast→priority 归一化 / flex 透传 / block typed
    error / 无 service_tier 字节不变 / 非 response.create 帧不动 / 空 type
    帧不动 / event_id+code 字段断言 / 非字符串 service_tier 容错）+
    pass 路径 fast 别名归一化回归 +
    ingress 端到端（filter 后上游不含 service_tier / block 后客户端先收
    error event 再收 close 1008 且上游 0 写）+
    passthrough capturedSessionModel fallback 用例（whitelist 策略下首帧
    建立、缺 model 命中 fallback、缺少 fallback 时的 leak 文档化）+
    passthrough session.update / session.created 旋转 capturedSessionModel
    的 mid-session 绕过回归 +
    passthrough billing post-filter ServiceTier 与 idempotent filter 回归。

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>

											
										
										
											2026-04-28 00:34:23 +08:00
+									// 放过 OpenAI 官方文档定义的所有合法 tier 值：priority/flex/auto/default/scale。
 									// 对 Codex 客户端零影响（Codex 只发 priority 或 flex，见 codex-rs/core/src/client.rs），
 									// 但能让直连 OpenAI SDK 的用户透传 auto/default/scale 以便抓包/调试。
 									// 真未知值仍返回 nil，由 normalizeResponsesBodyServiceTier 从 body 中删除。
-												fix(billing): 修复 OpenAI fast 档位计费并补齐展示

- 打通 service_tier 在 OpenAI HTTP、WS、passthrough 与 usage 记录中的传递
- 修正 priority/flex 计费逻辑，并将 fast 归一化为 priority
- 在用户端和管理端补齐服务档位与计费明细展示
- 补齐前后端测试，并修复 WS 限流信号重复持久化导致的全量回归失败

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-03-08 23:22:28 +08:00
+									switch value {
-												feat(openai): OpenAI Fast/Flex Policy 完整实现（HTTP + WebSocket + Admin）

对称参照 Claude BetaPolicy 的 fast-mode 过滤实现，新增针对 OpenAI 上游
service_tier 字段（priority / flex，含客户端 "fast" → "priority" 归一化）的
pass / filter / block 三态策略，覆盖全部 OpenAI 入口 + admin 配置入口。

后端核心
- 新增 SettingKeyOpenAIFastPolicySettings、OpenAIFastPolicyRule、
  OpenAIFastPolicySettings 配置模型，含规则的 service_tier × action × scope
  × 模型白名单 × fallback action 维度。
- SettingService.Get/SetOpenAIFastPolicySettings；缺失时返回内置默认策略
  （所有模型的 priority 走 filter，whitelist 为空，fallback=pass）。设计
  依据：service_tier=fast 是用户级开关，与 model 字段正交，默认锁定特定
  model slug 会留下"用 gpt-4 + fast 透传 priority 上游"的绕过路径。JSON
  解析失败不再静默 fallback，slog.Warn 记录脏数据，便于运维定位。
- service_tier 归一化（trim + ToLower + fast→priority + 白名单 priority/flex）
  与策略评估（evaluateOpenAIFastPolicy）作为唯一真实来源，HTTP / WS 共用。
  抽出纯函数 evaluateOpenAIFastPolicyWithSettings，配合 ctx-bound settings
  快照（withOpenAIFastPolicyContext / openAIFastPolicySettingsFromContext），
  WS 长会话入口预取一次后所有帧复用，避免每帧打到 settingService。

HTTP 入口（4 个）
- Chat Completions、Anthropic 兼容（Messages，含 BetaFastMode→priority 二次
  命中）、原生 Responses、Passthrough Responses 全部接入
  applyOpenAIFastPolicyToBody，filter 走 sjson 顶层删除 service_tier，block
  返回 403 forbidden_error JSON。
- 4 入口统一使用 upstream 视角的 model（GetMappedModel +
  normalizeOpenAIModelForUpstream + Codex OAuth normalize 后的 slug），
  避免 chat/messages/native /responses/passthrough 因为 model 维度不同
  造成 whitelist 命中差异。
- 在 pass 路径也把客户端 "fast" 别名归一化为 "priority" 写回 body，
  否则 native /responses 与 passthrough 入口会把 "fast" 原样透传给上游
  导致 400/拒绝（chat-completions 入口的 normalizeResponsesBodyServiceTier
  此前已具备同等行为）。

WebSocket 入口
- 新增 applyOpenAIFastPolicyToWSResponseCreate：严格匹配
  type="response.create"，仅处理顶层 service_tier；filter 用 sjson 删字段，
  block 返回 typed *OpenAIFastBlockedError。
- ingress 路径在 parseClientPayload 内调用，block 命中先 Write Realtime
  风格 error event 再返回 OpenAIWSClientCloseError(StatusPolicyViolation
  =1008)，依赖底层 WebSocket Conn.Write 的同步 flush 保证 error 先于
  close。
- passthrough 路径在 RunEntry 前对 firstClientMessage 应用策略，并通过
  openAIWSPolicyEnforcingFrameConn 包装 ReadFrame 对每个 client→upstream
  帧执行策略；后续帧无 model 字段时回退到 capturedSessionModel。
  filter 闭包内同时侦测 session.update / session.created 帧的 session.model
  字段刷新 capturedSessionModel，封堵"首帧 model=gpt-4o（pass）→
  session.update 改为 gpt-5.5 → 不带 model 的 response.create fallback
  到 gpt-4o"的 mid-session 绕过路径。
- passthrough billing：requestServiceTier 在策略 filter 之后再从
  firstClientMessage 提取，filter 命中时 OpenAIForwardResult.ServiceTier
  上报 nil（default tier），与 HTTP 入口（reqBody 来自 post-filter map）
  / WS ingress（payload 来自 post-filter bytes）的语义一致。
- 错误事件 schema：{event_id: "evt_<32hex>", type: "error",
  error: {type: "forbidden_error", code: "policy_violation", message}}，
  与 OpenAI codex 客户端 error event 解析兼容。

Admin / Frontend
- dto.SystemSettings / UpdateSettingsRequest 新增
  openai_fast_policy_settings 字段（omitempty），bulk GET/PUT 接入。
- Settings 页 Gateway 页签新增 Fast/Flex Policy 表单卡片：
  service_tier × action × scope × 模型白名单 × fallback action 全字段配置。
- 前端守门：openaiFastPolicyLoaded 标志仅在 GET 真带回字段时才允许回写，
  避免 rollout/错误把默认规则覆盖成空；saveSettings 回写循环 skip 该字段，
  由专用刷新逻辑处理；仅 action=block 时发送 error_message，匹配后端
  omitempty 行为。

测试
- HTTP 路径：openai_fast_policy_test.go 覆盖默认配置（whitelist=[]，所有
  模型 priority filter）/ block 自定义错误 / scope 区分 / filter 删字段 /
  block 不改 body / block 短路上游 / Anthropic BetaFastMode 触发 OpenAI
  fast policy 等场景。
- WebSocket 路径：openai_fast_policy_ws_test.go 覆盖
    helper 单元（filter / fast→priority 归一化 / flex 透传 / block typed
    error / 无 service_tier 字节不变 / 非 response.create 帧不动 / 空 type
    帧不动 / event_id+code 字段断言 / 非字符串 service_tier 容错）+
    pass 路径 fast 别名归一化回归 +
    ingress 端到端（filter 后上游不含 service_tier / block 后客户端先收
    error event 再收 close 1008 且上游 0 写）+
    passthrough capturedSessionModel fallback 用例（whitelist 策略下首帧
    建立、缺 model 命中 fallback、缺少 fallback 时的 leak 文档化）+
    passthrough session.update / session.created 旋转 capturedSessionModel
    的 mid-session 绕过回归 +
    passthrough billing post-filter ServiceTier 与 idempotent filter 回归。

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>

											
										
										
											2026-04-28 00:34:23 +08:00
+									case "priority", "flex", "auto", "default", "scale":
-												fix(billing): 修复 OpenAI fast 档位计费并补齐展示

- 打通 service_tier 在 OpenAI HTTP、WS、passthrough 与 usage 记录中的传递
- 修正 priority/flex 计费逻辑，并将 fast 归一化为 priority
- 在用户端和管理端补齐服务档位与计费明细展示
- 补齐前后端测试，并修复 WS 限流信号重复持久化导致的全量回归失败

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-03-08 23:22:28 +08:00
+										return &value
 									default:
 										return nil
 									}
 								}
-												feat(openai): OpenAI Fast/Flex Policy 完整实现（HTTP + WebSocket + Admin）

对称参照 Claude BetaPolicy 的 fast-mode 过滤实现，新增针对 OpenAI 上游
service_tier 字段（priority / flex，含客户端 "fast" → "priority" 归一化）的
pass / filter / block 三态策略，覆盖全部 OpenAI 入口 + admin 配置入口。

后端核心
- 新增 SettingKeyOpenAIFastPolicySettings、OpenAIFastPolicyRule、
  OpenAIFastPolicySettings 配置模型，含规则的 service_tier × action × scope
  × 模型白名单 × fallback action 维度。
- SettingService.Get/SetOpenAIFastPolicySettings；缺失时返回内置默认策略
  （所有模型的 priority 走 filter，whitelist 为空，fallback=pass）。设计
  依据：service_tier=fast 是用户级开关，与 model 字段正交，默认锁定特定
  model slug 会留下"用 gpt-4 + fast 透传 priority 上游"的绕过路径。JSON
  解析失败不再静默 fallback，slog.Warn 记录脏数据，便于运维定位。
- service_tier 归一化（trim + ToLower + fast→priority + 白名单 priority/flex）
  与策略评估（evaluateOpenAIFastPolicy）作为唯一真实来源，HTTP / WS 共用。
  抽出纯函数 evaluateOpenAIFastPolicyWithSettings，配合 ctx-bound settings
  快照（withOpenAIFastPolicyContext / openAIFastPolicySettingsFromContext），
  WS 长会话入口预取一次后所有帧复用，避免每帧打到 settingService。

HTTP 入口（4 个）
- Chat Completions、Anthropic 兼容（Messages，含 BetaFastMode→priority 二次
  命中）、原生 Responses、Passthrough Responses 全部接入
  applyOpenAIFastPolicyToBody，filter 走 sjson 顶层删除 service_tier，block
  返回 403 forbidden_error JSON。
- 4 入口统一使用 upstream 视角的 model（GetMappedModel +
  normalizeOpenAIModelForUpstream + Codex OAuth normalize 后的 slug），
  避免 chat/messages/native /responses/passthrough 因为 model 维度不同
  造成 whitelist 命中差异。
- 在 pass 路径也把客户端 "fast" 别名归一化为 "priority" 写回 body，
  否则 native /responses 与 passthrough 入口会把 "fast" 原样透传给上游
  导致 400/拒绝（chat-completions 入口的 normalizeResponsesBodyServiceTier
  此前已具备同等行为）。

WebSocket 入口
- 新增 applyOpenAIFastPolicyToWSResponseCreate：严格匹配
  type="response.create"，仅处理顶层 service_tier；filter 用 sjson 删字段，
  block 返回 typed *OpenAIFastBlockedError。
- ingress 路径在 parseClientPayload 内调用，block 命中先 Write Realtime
  风格 error event 再返回 OpenAIWSClientCloseError(StatusPolicyViolation
  =1008)，依赖底层 WebSocket Conn.Write 的同步 flush 保证 error 先于
  close。
- passthrough 路径在 RunEntry 前对 firstClientMessage 应用策略，并通过
  openAIWSPolicyEnforcingFrameConn 包装 ReadFrame 对每个 client→upstream
  帧执行策略；后续帧无 model 字段时回退到 capturedSessionModel。
  filter 闭包内同时侦测 session.update / session.created 帧的 session.model
  字段刷新 capturedSessionModel，封堵"首帧 model=gpt-4o（pass）→
  session.update 改为 gpt-5.5 → 不带 model 的 response.create fallback
  到 gpt-4o"的 mid-session 绕过路径。
- passthrough billing：requestServiceTier 在策略 filter 之后再从
  firstClientMessage 提取，filter 命中时 OpenAIForwardResult.ServiceTier
  上报 nil（default tier），与 HTTP 入口（reqBody 来自 post-filter map）
  / WS ingress（payload 来自 post-filter bytes）的语义一致。
- 错误事件 schema：{event_id: "evt_<32hex>", type: "error",
  error: {type: "forbidden_error", code: "policy_violation", message}}，
  与 OpenAI codex 客户端 error event 解析兼容。

Admin / Frontend
- dto.SystemSettings / UpdateSettingsRequest 新增
  openai_fast_policy_settings 字段（omitempty），bulk GET/PUT 接入。
- Settings 页 Gateway 页签新增 Fast/Flex Policy 表单卡片：
  service_tier × action × scope × 模型白名单 × fallback action 全字段配置。
- 前端守门：openaiFastPolicyLoaded 标志仅在 GET 真带回字段时才允许回写，
  避免 rollout/错误把默认规则覆盖成空；saveSettings 回写循环 skip 该字段，
  由专用刷新逻辑处理；仅 action=block 时发送 error_message，匹配后端
  omitempty 行为。

测试
- HTTP 路径：openai_fast_policy_test.go 覆盖默认配置（whitelist=[]，所有
  模型 priority filter）/ block 自定义错误 / scope 区分 / filter 删字段 /
  block 不改 body / block 短路上游 / Anthropic BetaFastMode 触发 OpenAI
  fast policy 等场景。
- WebSocket 路径：openai_fast_policy_ws_test.go 覆盖
    helper 单元（filter / fast→priority 归一化 / flex 透传 / block typed
    error / 无 service_tier 字节不变 / 非 response.create 帧不动 / 空 type
    帧不动 / event_id+code 字段断言 / 非字符串 service_tier 容错）+
    pass 路径 fast 别名归一化回归 +
    ingress 端到端（filter 后上游不含 service_tier / block 后客户端先收
    error event 再收 close 1008 且上游 0 写）+
    passthrough capturedSessionModel fallback 用例（whitelist 策略下首帧
    建立、缺 model 命中 fallback、缺少 fallback 时的 leak 文档化）+
    passthrough session.update / session.created 旋转 capturedSessionModel
    的 mid-session 绕过回归 +
    passthrough billing post-filter ServiceTier 与 idempotent filter 回归。

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>

											
										
										
											2026-04-28 00:34:23 +08:00
+								// OpenAIFastBlockedError indicates a request was rejected by the OpenAI fast
 								// policy (action=block). Mirrors BetaBlockedError on the Claude side.
 								type OpenAIFastBlockedError struct {
 									Message string
 								}
 								func (e *OpenAIFastBlockedError) Error() string { return e.Message }
 								// evaluateOpenAIFastPolicy decides which policy action applies to a request
 								// with the given account, model and service_tier, and returns it together
 								// with the configured error message. It returns (BetaPolicyActionPass, "")
 								// when the service or its settingService is nil, when the tier is blank,
 								// when settings cannot be loaded, or when no rule matches, so callers can
 								// short-circuit safely.
 								//
 								// Settings come from the context snapshot when one is attached; otherwise
 								// they are fetched from settingService.
 								//
 								// Matching rules:
 								//   - Scope filters by account type (all / oauth / apikey / bedrock)
 								//   - ServiceTier must be empty (= any), "all", or equal the normalized tier
 								//   - ModelWhitelist narrows the rule to specific models; FallbackAction
 								//     handles the non-matching case (default: pass)
 								//
 								// Difference from the Claude BetaPolicy (first-match short-circuit is kept):
 								//   - BetaPolicy works on the set of tokens in the anthropic-beta header;
 								//     different rules may target different tokens, so filter results are
 								//     accumulated into a set while block is first-match.
 								//   - The OpenAI fast policy operates on the single service_tier field:
 								//     filtering means deleting the field, so there is nothing to accumulate.
 								//     A request carries exactly one service_tier, which makes the tier
 								//     dimension of the rules mutually exclusive; if several rules for the
 								//     same (scope, tier) have overlapping model whitelists, the admin
 								//     expresses intent through rule order. Hence first-match is used rather
 								//     than BetaPolicy's "block overrides filter overrides pass" semantics.
 								func (s *OpenAIGatewayService) evaluateOpenAIFastPolicy(ctx context.Context, account *Account, model, serviceTier string) (action, errMsg string) {
 									if s == nil || s.settingService == nil {
 										return BetaPolicyActionPass, ""
 									}
 									normalizedTier := strings.ToLower(strings.TrimSpace(serviceTier))
 									if normalizedTier == "" {
 										return BetaPolicyActionPass, ""
 									}
 									// Prefer the snapshot bound to the context over a settings lookup.
 									if cached := openAIFastPolicySettingsFromContext(ctx); cached != nil {
 										return evaluateOpenAIFastPolicyWithSettings(cached, account, model, normalizedTier)
 									}
 									loaded, err := s.settingService.GetOpenAIFastPolicySettings(ctx)
 									if err != nil || loaded == nil {
 										return BetaPolicyActionPass, ""
 									}
 									return evaluateOpenAIFastPolicyWithSettings(loaded, account, model, normalizedTier)
 								}
 								// evaluateOpenAIFastPolicyWithSettings is the pure-function core of the
 								// policy evaluation, split out so long-lived sessions (e.g. WS) can prefetch
 								// settings once instead of hitting the settingService on every frame.
 								//
 								// Rules are scanned in order. The first rule whose scope matches the account
 								// and whose tier is empty, OpenAIFastTierAny, or equal to tier decides the
 								// outcome via resolveRuleAction. With nil settings or no matching rule the
 								// result is (BetaPolicyActionPass, "").
 								func evaluateOpenAIFastPolicyWithSettings(settings *OpenAIFastPolicySettings, account *Account, model, tier string) (action, errMsg string) {
 									if settings == nil {
 										return BetaPolicyActionPass, ""
 									}
 									// A nil account counts as neither OAuth nor Bedrock.
 									var oauthAccount, bedrockAccount bool
 									if account != nil {
 										oauthAccount = account.IsOAuth()
 										bedrockAccount = account.IsBedrock()
 									}
 									for _, rule := range settings.Rules {
 										if !betaPolicyScopeMatches(rule.Scope, oauthAccount, bedrockAccount) {
 											continue
 										}
 										wantTier := strings.ToLower(strings.TrimSpace(rule.ServiceTier))
 										tierMatches := wantTier == "" || wantTier == OpenAIFastTierAny || wantTier == tier
 										if !tierMatches {
 											continue
 										}
 										// First match wins: reuse the BetaPolicy whitelist/fallback resolution.
 										return resolveRuleAction(BetaPolicyRule{
 											Action:               rule.Action,
 											ErrorMessage:         rule.ErrorMessage,
 											ModelWhitelist:       rule.ModelWhitelist,
 											FallbackAction:       rule.FallbackAction,
 											FallbackErrorMessage: rule.FallbackErrorMessage,
 										}, model)
 									}
 									return BetaPolicyActionPass, ""
 								}
 								// openAIFastPolicyCtxKey is the context key under which a prefetched
 								// OpenAIFastPolicySettings snapshot is cached. It exists only so that the
 								// frames of one long-lived WebSocket session can reuse the same policy
 								// snapshot instead of hitting the DB on every frame.
 								//
 								// Trade-off: a policy change does not affect the current WS session (only
 								// new sessions). This is intentional: for a long session, policy consistency
 								// matters more than taking effect immediately, and the gin.Context cache of
 								// the Claude BetaPolicy makes the same trade-off. When a hot reload is
 								// needed, an admin can force a refresh by kicking the session.
 								type openAIFastPolicyCtxKeyType struct{}
 								var openAIFastPolicyCtxKey = openAIFastPolicyCtxKeyType{}
 								// withOpenAIFastPolicyContext binds a settings snapshot to ctx so that
 								// evaluateOpenAIFastPolicy calls made with the derived context can reuse it.
 								// When ctx or settings is nil the context is returned unchanged.
 								func withOpenAIFastPolicyContext(ctx context.Context, settings *OpenAIFastPolicySettings) context.Context {
 									if ctx != nil && settings != nil {
 										return context.WithValue(ctx, openAIFastPolicyCtxKey, settings)
 									}
 									return ctx
 								}
 								// openAIFastPolicySettingsFromContext returns the settings snapshot stored
 								// under openAIFastPolicyCtxKey, or nil when ctx is nil or holds no value of
 								// type *OpenAIFastPolicySettings under that key.
 								func openAIFastPolicySettingsFromContext(ctx context.Context) *OpenAIFastPolicySettings {
 									if ctx == nil {
 										return nil
 									}
 									// A failed assertion leaves snapshot as the nil pointer.
 									snapshot, _ := ctx.Value(openAIFastPolicyCtxKey).(*OpenAIFastPolicySettings)
 									return snapshot
 								}
 								// applyOpenAIFastPolicyToBody enforces the OpenAI fast policy on a raw
 								// request body and returns the body to send upstream.
 								//
 								//   - block:  the body is returned untouched with an *OpenAIFastBlockedError.
 								//   - filter: the top-level service_tier field is removed.
 								//   - pass:   the service_tier value is rewritten to its normalized form
 								//     (e.g. client alias "fast" → "priority") when the two differ.
 								//
 								// Bodies that are empty, carry no service_tier, or carry a tier that
 								// normalizes to "" are returned unchanged without evaluating the policy.
 								//
 								// Rationale for normalize-on-pass: the chat-completions / messages entry
 								// points already run normalizeResponsesBodyServiceTier before calling this
 								// function, but passthrough and native /responses do not. Without
 								// normalizing here, "fast" would reach the OpenAI upstream verbatim on the
 								// pass path and be rejected. Doing it in this function keeps every entry
 								// point consistent.
 								func (s *OpenAIGatewayService) applyOpenAIFastPolicyToBody(ctx context.Context, account *Account, model string, body []byte) ([]byte, error) {
 									if len(body) == 0 {
 										return body, nil
 									}
 									clientTier := gjson.GetBytes(body, "service_tier").String()
 									if clientTier == "" {
 										return body, nil
 									}
 									canonicalTier := normalizedOpenAIServiceTierValue(clientTier)
 									if canonicalTier == "" {
 										return body, nil
 									}
 									decision, policyMsg := s.evaluateOpenAIFastPolicy(ctx, account, model, canonicalTier)
 									if decision == BetaPolicyActionBlock {
 										if policyMsg == "" {
 											policyMsg = fmt.Sprintf("openai service_tier=%s is not allowed for model %s", canonicalTier, model)
 										}
 										return body, &OpenAIFastBlockedError{Message: policyMsg}
 									}
 									if decision == BetaPolicyActionFilter {
 										stripped, err := sjson.DeleteBytes(body, "service_tier")
 										if err != nil {
 											return body, fmt.Errorf("strip service_tier from body: %w", err)
 										}
 										return stripped, nil
 									}
 									// Pass: only rewrite when the client sent an alias such as "fast".
 									if canonicalTier == clientTier {
 										return body, nil
 									}
 									rewritten, err := sjson.SetBytes(body, "service_tier", canonicalTier)
 									if err != nil {
 										return body, fmt.Errorf("normalize service_tier on pass: %w", err)
 									}
 									return rewritten, nil
 								}
 								// writeOpenAIFastPolicyBlockedResponse replies with HTTP 403 and a JSON error
 								// body of type "permission_error" carrying err.Message. It is a no-op when
 								// either the gin context or the error is nil.
 								func writeOpenAIFastPolicyBlockedResponse(c *gin.Context, err *OpenAIFastBlockedError) {
 									if c != nil && err != nil {
 										detail := gin.H{
 											"type":    "permission_error",
 											"message": err.Message,
 										}
 										c.JSON(http.StatusForbidden, gin.H{"error": detail})
 									}
 								}
 								// applyOpenAIFastPolicyToWSResponseCreate evaluates the OpenAI fast policy
 								// against one client→upstream WebSocket frame. It follows the same contract
 								// as the HTTP-side applyOpenAIFastPolicyToBody, applied to a
 								// Realtime/Responses WS payload:
 								//
 								//   - pass:   returns frame unchanged, with a nil blocked error
 								//   - filter: returns a copy with the top-level service_tier removed
 								//   - block:  returns (frame, *OpenAIFastBlockedError, nil)
 								//
 								// Only frames whose "type" (after trimming surrounding whitespace) equals
 								// "response.create" are inspected or mutated. Every other type, the empty
 								// string included, passes through untouched so that fields are never
 								// stripped from response.cancel, conversation.item.create, or any client
 								// event added later. The Realtime client-event spec requires "type", so an
 								// empty one is malformed input that the upstream, not this layer, rejects.
 								// Empty frames and frames that are not valid JSON pass through as well.
 								//
 								// service_tier sits at the top level of response.create, the same shape as
 								// the Responses HTTP body (see openai_gateway_chat_completions.go,
 								// extractOpenAIServiceTierFromBody, and the fixture in
 								// openai_ws_forwarder_ingress_session_test.go), so only the top-level field
 								// is checked; the schema has no nested form today.
 								//
 								// The caller chooses the upstream model passed in; it is not re-derived here.
 								//
 								// NOTE(review): unlike applyOpenAIFastPolicyToBody, the pass path does not
 								// rewrite an alias tier to its normalized value — confirm this is intended.
 								func (s *OpenAIGatewayService) applyOpenAIFastPolicyToWSResponseCreate(
 									ctx context.Context,
 									account *Account,
 									model string,
 									frame []byte,
 								) ([]byte, *OpenAIFastBlockedError, error) {
 									if len(frame) == 0 || !gjson.ValidBytes(frame) {
 										return frame, nil, nil
 									}
 									if strings.TrimSpace(gjson.GetBytes(frame, "type").String()) != "response.create" {
 										return frame, nil, nil
 									}
 									requested := gjson.GetBytes(frame, "service_tier").String()
 									if requested == "" {
 										return frame, nil, nil
 									}
 									canonical := normalizedOpenAIServiceTierValue(requested)
 									if canonical == "" {
 										return frame, nil, nil
 									}
 									action, policyMsg := s.evaluateOpenAIFastPolicy(ctx, account, model, canonical)
 									if action == BetaPolicyActionBlock {
 										// Fall back to a generic message when the rule supplies none.
 										if policyMsg == "" {
 											policyMsg = fmt.Sprintf("openai service_tier=%s is not allowed for model %s", canonical, model)
 										}
 										return frame, &OpenAIFastBlockedError{Message: policyMsg}, nil
 									}
 									if action != BetaPolicyActionFilter {
 										// Pass (or any other action): forward the frame as received.
 										return frame, nil, nil
 									}
 									stripped, err := sjson.DeleteBytes(frame, "service_tier")
 									if err != nil {
 										return frame, nil, fmt.Errorf("strip service_tier from ws frame: %w", err)
 									}
 									return stripped, nil, nil
 								}
 								// newOpenAIFastPolicyWSEventID produces a Realtime-style event_id for an
 								// error event emitted by this server. It follows the loose "evt_<rand>"
 								// convention of upstream Realtime servers; the exact value carries no
 								// meaning beyond client-side log correlation. The random part comes from the
 								// google/uuid dependency the file already uses.
 								func newOpenAIFastPolicyWSEventID() string {
 									random, err := uuid.NewRandom()
 									if err == nil {
 										// Remove the dashes so the ID reads as "evt_<hex>" rather than
 										// the canonical dashed UUID form.
 										compact := strings.ReplaceAll(random.String(), "-", "")
 										return "evt_" + compact
 									}
 									// Extremely unlikely; use a fixed ID so the field stays non-empty and
 									// the event schema remains self-consistent.
 									return "evt_openai_fast_policy"
 								}
 								// buildOpenAIFastPolicyBlockedWSEvent serializes an OpenAI Realtime/Responses
 								// style "error" event for a request blocked by the OpenAI fast policy. It
 								// returns nil when err is nil. The payload has this shape:
 								//
 								//	{
 								//	  "event_id": "evt_<random>",
 								//	  "type": "error",
 								//	  "error": {
 								//	    "type": "invalid_request_error",
 								//	    "code": "policy_violation",
 								//	    "message": "..."
 								//	  }
 								//	}
 								//
 								// event_id lets clients correlate the rejection in their logs, and "code"
 								// gives programmatic clients a stable identifier (the HTTP-side equivalent
 								// is the 403 permission_error JSON body).
 								func buildOpenAIFastPolicyBlockedWSEvent(err *OpenAIFastBlockedError) []byte {
 									if err == nil {
 										return nil
 									}
 									eventID := newOpenAIFastPolicyWSEventID()
 									detail := map[string]any{
 										"type":    "invalid_request_error",
 										"code":    "policy_violation",
 										"message": err.Message,
 									}
 									event := map[string]any{
 										"event_id": eventID,
 										"type":     "error",
 										"error":    detail,
 									}
 									if encoded, marshalErr := json.Marshal(event); marshalErr == nil {
 										return encoded
 									}
 									// Marshalling the literal shape above should never fail in practice;
 									// if it does, emit a minimal hand-written payload with a generic message.
 									return []byte(`{"event_id":"` + eventID + `","type":"error","error":{"type":"invalid_request_error","code":"policy_violation","message":"openai fast policy blocked this request"}}`)
 								}
-												fix(openai): sanitize empty base64 input images

											
										
										
											2026-04-01 00:46:38 +08:00
+								func sanitizeEmptyBase64InputImagesInOpenAIBody(body []byte) ([]byte, bool, error) {
 									if len(body) == 0 || !bytes.Contains(body, []byte(`"image_url"`)) || !bytes.Contains(body, []byte(`base64,`)) {
 										return body, false, nil
 									}
 									var reqBody map[string]any
 									if err := json.Unmarshal(body, &reqBody); err != nil {
 										return body, false, fmt.Errorf("sanitize request body: %w", err)
 									}
 									if !sanitizeEmptyBase64InputImagesInOpenAIRequestBodyMap(reqBody) {
 										return body, false, nil
 									}
 									normalized, err := json.Marshal(reqBody)
 									if err != nil {
 										return body, false, fmt.Errorf("serialize sanitized request body: %w", err)
 									}
 									return normalized, true, nil
 								}
 								// sanitizeEmptyBase64InputImagesInOpenAIRequestBodyMap sanitizes the "input"
 								// entry of a decoded request body in place and reports whether it changed.
 								// A nil map or a map without "input" is left alone and reports false.
 								func sanitizeEmptyBase64InputImagesInOpenAIRequestBodyMap(reqBody map[string]any) bool {
 									// Indexing a nil map is safe and reports the key as absent, so this
 									// lookup also covers the nil-map case.
 									input, present := reqBody["input"]
 									if !present {
 										return false
 									}
 									cleaned, changed := sanitizeEmptyBase64InputImagesInOpenAIInput(input)
 									if changed {
 										reqBody["input"] = cleaned
 									}
 									return changed
 								}
 								// sanitizeEmptyBase64InputImagesInOpenAIInput filters a decoded "input"
 								// value. When input is a []any it drops:
 								//
 								//   - items that are themselves empty-base64 input_image parts,
 								//   - such parts inside an item's "content" array, and
 								//   - items whose "content" array becomes empty as a result.
 								//
 								// It returns the filtered slice and true when anything was dropped;
 								// otherwise it returns input itself and false. Item maps whose content was
 								// filtered are updated in place.
 								func sanitizeEmptyBase64InputImagesInOpenAIInput(input any) (any, bool) {
 									entries, isList := input.([]any)
 									if !isList {
 										return input, false
 									}
 									kept := make([]any, 0, len(entries))
 									dropped := false
 									for _, entry := range entries {
 										message, isMap := entry.(map[string]any)
 										if !isMap {
 											kept = append(kept, entry)
 											continue
 										}
 										if shouldDropEmptyBase64InputImagePart(message) {
 											dropped = true
 											continue
 										}
 										// A missing "content" key and a non-array content both fail this
 										// assertion, and in both cases the item is kept as-is.
 										parts, hasParts := message["content"].([]any)
 										if !hasParts {
 											kept = append(kept, message)
 											continue
 										}
 										remaining := make([]any, 0, len(parts))
 										for _, part := range parts {
 											if !shouldDropEmptyBase64InputImagePart(part) {
 												remaining = append(remaining, part)
 											}
 										}
 										if len(remaining) != len(parts) {
 											dropped = true
 											if len(remaining) == 0 {
 												// Every part was an empty image: drop the whole item.
 												continue
 											}
 											message["content"] = remaining
 										}
 										kept = append(kept, message)
 									}
 									if !dropped {
 										return input, false
 									}
 									return kept, true
 								}
 								// shouldDropEmptyBase64InputImagePart reports whether part is a JSON object
 								// whose "type" (ignoring surrounding whitespace) is "input_image" and whose
 								// "image_url" string is a base64 data URI with an empty payload.
 								func shouldDropEmptyBase64InputImagePart(part any) bool {
 									fields, isMap := part.(map[string]any)
 									if !isMap {
 										return false
 									}
 									// Non-string or missing values fall back to "" and fail the checks.
 									kind, _ := fields["type"].(string)
 									imageURL, _ := fields["image_url"].(string)
 									return strings.TrimSpace(kind) == "input_image" && isEmptyBase64DataURI(imageURL)
 								}
 								// isEmptyBase64DataURI reports whether raw is a base64 data URI whose payload
 								// is empty or whitespace-only, e.g. "data:image/png;base64,".
 								//
 								// The URI is parsed along the RFC 2397 shape
 								// "data:[<mediatype>][;base64],<data>": everything between "data:" and the
 								// first comma is the header, which must end in ";base64". Media-type
 								// parameters ahead of the marker (such as ";charset=utf-8") are therefore
 								// accepted; previously only a marker directly after the first semicolon
 								// was recognized, so such URIs were never detected as empty.
 								func isEmptyBase64DataURI(raw string) bool {
 									const scheme = "data:"
 									if !strings.HasPrefix(raw, scheme) {
 										return false
 									}
 									header, payload, found := strings.Cut(raw[len(scheme):], ",")
 									if !found || !strings.HasSuffix(header, ";base64") {
 										return false
 									}
 									return strings.TrimSpace(payload) == ""
 								}
-												feat(openai): 极致优化 OAuth 链路并补齐性能守护

- 优化 /v1/responses 热路径，减少重复解析与不必要拷贝\n- 优化并发与 token 竞争路径并补齐运行指标\n- 补充 OpenAI/Ops 相关单元测试与回归用例\n- 新增灰度阈值守护与压测脚本，支撑发布验收

											
										
										
											2026-02-12 09:41:37 +08:00
+								func getOpenAIRequestBodyMap(c *gin.Context, body []byte) (map[string]any, error) {
 									if c != nil {
 										if cached, ok := c.Get(OpenAIParsedRequestBodyKey); ok {
 											if reqBody, ok := cached.(map[string]any); ok && reqBody != nil {
 												return reqBody, nil
 											}
 										}
 									}
 									var reqBody map[string]any
 									if err := json.Unmarshal(body, &reqBody); err != nil {
 										return nil, fmt.Errorf("parse request: %w", err)
 									}
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+									if c != nil {
 										c.Set(OpenAIParsedRequestBodyKey, reqBody)
 									}
-												feat(openai): 极致优化 OAuth 链路并补齐性能守护

- 优化 /v1/responses 热路径，减少重复解析与不必要拷贝\n- 优化并发与 token 竞争路径并补齐运行指标\n- 补充 OpenAI/Ops 相关单元测试与回归用例\n- 新增灰度阈值守护与压测脚本，支撑发布验收

											
										
										
											2026-02-12 09:41:37 +08:00
+									return reqBody, nil
 								}
-												feat(usage): add reasoning effort column

											
										
										
											2026-02-03 14:36:29 +08:00
+								func extractOpenAIReasoningEffort(reqBody map[string]any, requestedModel string) *string {
 									if value, present := getOpenAIReasoningEffortFromReqBody(reqBody); present {
 										if value == "" {
 											return nil
 										}
 										return &value
 									}
 									value := deriveOpenAIReasoningEffortFromModel(requestedModel)
 									if value == "" {
 										return nil
 									}
 									return &value
 								}
 								// normalizeOpenAIReasoningEffort maps a raw reasoning-effort string to one of
 								// the stored levels "low", "medium", "high" or "xhigh". Matching ignores
 								// case, surrounding whitespace, and any '-', '_' or ' ' separators, so
 								// "x-high", "X_HIGH" and "extra high" all become "xhigh". Everything else —
 								// including "", "none" and "minimal" — yields "".
 								func normalizeOpenAIReasoningEffort(raw string) string {
 									// Drop separator characters so the "x-high" / "x_high" variants collapse.
 									compact := strings.Map(func(r rune) rune {
 										switch r {
 										case '-', '_', ' ':
 											return -1
 										}
 										return r
 									}, strings.ToLower(strings.TrimSpace(raw)))
 									switch compact {
 									case "low", "medium", "high":
 										return compact
 									case "xhigh", "extrahigh":
 										return "xhigh"
 									default:
 										// Only known effort levels are stored, to keep the UI consistent.
 										return ""
 									}
 								}