// backend/internal/service/openai_gateway_service_test.go

package service

import (
	"bufio"
	"bytes"
	"context"
	"errors"
	"fmt"
	"io"
	"net/http"
	"net/http/httptest"
	"strings"
	"testing"
	"time"

	"github.com/Wei-Shaw/sub2api/internal/config"
	"github.com/Wei-Shaw/sub2api/internal/pkg/openai"
	"github.com/cespare/xxhash/v2"
	"github.com/gin-gonic/gin"
	"github.com/stretchr/testify/require"
)

// Compile-time interface assertions: the build fails if a stub stops
// satisfying the interface it stands in for.
var _ AccountRepository = (*stubOpenAIAccountRepo)(nil)
var _ GatewayCache = (*stubGatewayCache)(nil)

// stubOpenAIAccountRepo is an in-memory AccountRepository test double backed
// by a fixed slice of accounts. The tests in this file build it without
// setting the embedded interface, so only the methods declared on the stub
// itself are usable.
type stubOpenAIAccountRepo struct {
	AccountRepository
	accounts []Account
}

// snapshotUpdateAccountRepo embeds stubOpenAIAccountRepo and adds a channel,
// updateExtraCalls, on which its UpdateExtra method publishes a copy of every
// update map it receives.
type snapshotUpdateAccountRepo struct {
	stubOpenAIAccountRepo
	updateExtraCalls chan map[string]any
}

// UpdateExtra records the call by sending a shallow copy of updates on
// updateExtraCalls. When the channel is nil the call is ignored. It always
// returns nil.
func (r *snapshotUpdateAccountRepo) UpdateExtra(ctx context.Context, id int64, updates map[string]any) error {
	if r.updateExtraCalls == nil {
		return nil
	}

	// Copy the map so later mutations by the caller cannot change what the
	// receiving side observes.
	snapshot := make(map[string]any, len(updates))
	for key, value := range updates {
		snapshot[key] = value
	}
	r.updateExtraCalls <- snapshot
	return nil
}

// GetByID returns a pointer to the stored account whose ID equals id, or an
// "account not found" error when no stored account matches.
func (r stubOpenAIAccountRepo) GetByID(ctx context.Context, id int64) (*Account, error) {
	for idx := range r.accounts {
		candidate := &r.accounts[idx]
		if candidate.ID != id {
			continue
		}
		return candidate, nil
	}
	return nil, errors.New("account not found")
}

// ListSchedulableByGroupIDAndPlatform returns copies of every stored account
// on the given platform. The groupID argument is ignored by this stub, and a
// nil slice is returned when nothing matches.
func (r stubOpenAIAccountRepo) ListSchedulableByGroupIDAndPlatform(ctx context.Context, groupID int64, platform string) ([]Account, error) {
	var matched []Account
	for idx := range r.accounts {
		if r.accounts[idx].Platform != platform {
			continue
		}
		matched = append(matched, r.accounts[idx])
	}
	return matched, nil
}

// ListSchedulableByPlatform returns copies of every stored account on the
// given platform, or a nil slice when nothing matches.
func (r stubOpenAIAccountRepo) ListSchedulableByPlatform(ctx context.Context, platform string) ([]Account, error) {
	var matched []Account
	for idx := range r.accounts {
		if r.accounts[idx].Platform != platform {
			continue
		}
		matched = append(matched, r.accounts[idx])
	}
	return matched, nil
}

// ListSchedulableUngroupedByPlatform delegates to ListSchedulableByPlatform;
// the stub makes no distinction between grouped and ungrouped accounts.
func (r stubOpenAIAccountRepo) ListSchedulableUngroupedByPlatform(ctx context.Context, platform string) ([]Account, error) {
	matched, err := r.ListSchedulableByPlatform(ctx, platform)
	return matched, err
}

// stubConcurrencyCache is a scriptable ConcurrencyCache test double.
//
//   - loadBatchErr, when non-nil, is returned by GetAccountsLoadBatch.
//   - loadMap supplies per-account load info for GetAccountsLoadBatch.
//   - acquireResults scripts AcquireAccountSlot per account ID (default: true).
//   - waitCounts scripts GetAccountWaitingCount per account ID (default: 0).
//   - skipDefaultLoad, together with a non-nil loadMap, makes
//     GetAccountsLoadBatch omit accounts that have no loadMap entry.
type stubConcurrencyCache struct {
	ConcurrencyCache
	loadBatchErr    error
	loadMap         map[int64]*AccountLoadInfo
	acquireResults  map[int64]bool
	waitCounts      map[int64]int
	skipDefaultLoad bool
}

// cancelReadCloser is a response body stand-in whose every read fails with
// context.Canceled.
type cancelReadCloser struct{}

// Read never produces data; it reports zero bytes and context.Canceled.
func (cancelReadCloser) Read([]byte) (int, error) {
	return 0, context.Canceled
}

// Close is a no-op that always succeeds.
func (cancelReadCloser) Close() error {
	return nil
}

// failingGinWriter wraps a gin.ResponseWriter and makes Write fail once
// failAfter writes have gone through; writes counts the successful
// pass-through attempts so far.
type failingGinWriter struct {
	gin.ResponseWriter
	failAfter int
	writes    int
}

// Write forwards p to the wrapped writer for the first failAfter calls and
// returns a "write failed" error on every call after that.
func (w *failingGinWriter) Write(p []byte) (int, error) {
	if w.writes < w.failAfter {
		w.writes++
		return w.ResponseWriter.Write(p)
	}
	return 0, errors.New("write failed")
}

// AcquireAccountSlot returns the scripted result for accountID from
// acquireResults, or true when the account has no scripted entry.
func (c stubConcurrencyCache) AcquireAccountSlot(ctx context.Context, accountID int64, maxConcurrency int, requestID string) (bool, error) {
	// Indexing a nil map is safe and reports "not present", so no separate
	// nil guard is required.
	granted, scripted := c.acquireResults[accountID]
	if !scripted {
		return true, nil
	}
	return granted, nil
}

// ReleaseAccountSlot is a no-op in this stub and always returns nil.
func (c stubConcurrencyCache) ReleaseAccountSlot(ctx context.Context, accountID int64, requestID string) error {
	return nil
}

// GetAccountsLoadBatch returns load info for the requested accounts.
//
// If loadBatchErr is set it is returned with a nil map. Otherwise each account
// gets its loadMap entry when one exists. Accounts without an entry receive a
// zero-load default, unless skipDefaultLoad is set and loadMap is non-nil, in
// which case they are left out of the result.
func (c stubConcurrencyCache) GetAccountsLoadBatch(ctx context.Context, accounts []AccountWithConcurrency) (map[int64]*AccountLoadInfo, error) {
	if c.loadBatchErr != nil {
		return nil, c.loadBatchErr
	}

	loads := make(map[int64]*AccountLoadInfo, len(accounts))
	omitUnknown := c.skipDefaultLoad && c.loadMap != nil
	for _, account := range accounts {
		// A lookup on a nil loadMap simply reports "not present".
		info, known := c.loadMap[account.ID]
		switch {
		case known:
			loads[account.ID] = info
		case !omitUnknown:
			loads[account.ID] = &AccountLoadInfo{AccountID: account.ID, LoadRate: 0}
		}
	}
	return loads, nil
}

// TestOpenAIGatewayService_GenerateSessionHash_Priority removes the session
// signals one at a time (session_id header, conversation_id header, then the
// prompt_cache_key body field) and checks that each step yields a non-empty
// hash different from the previous step, and that no signal yields no hash.
func TestOpenAIGatewayService_GenerateSessionHash_Priority(t *testing.T) {
	gin.SetMode(gin.TestMode)
	ginCtx, _ := gin.CreateTestContext(httptest.NewRecorder())
	ginCtx.Request = httptest.NewRequest(http.MethodPost, "/openai/v1/responses", nil)

	gateway := &OpenAIGatewayService{}
	keyedBody := []byte(`{"prompt_cache_key":"ses_aaa"}`)

	// hashOrFail hashes keyedBody against the current request headers and
	// aborts the test when no hash comes back.
	hashOrFail := func() string {
		t.Helper()
		hash := gateway.GenerateSessionHash(ginCtx, keyedBody)
		if hash == "" {
			t.Fatalf("expected non-empty hash")
		}
		return hash
	}

	// Step 1: both headers and the body key are present.
	ginCtx.Request.Header.Set("session_id", "sess-123")
	ginCtx.Request.Header.Set("conversation_id", "conv-456")
	withSession := hashOrFail()

	// Step 2: session_id removed; conversation_id and the body key remain.
	ginCtx.Request.Header.Del("session_id")
	withConversation := hashOrFail()
	if withConversation == withSession {
		t.Fatalf("expected different hashes for different keys")
	}

	// Step 3: both headers removed; only prompt_cache_key remains.
	ginCtx.Request.Header.Del("conversation_id")
	withCacheKey := hashOrFail()
	if withCacheKey == withConversation {
		t.Fatalf("expected different hashes for different keys")
	}

	// Step 4: no signal at all.
	if none := gateway.GenerateSessionHash(ginCtx, []byte(`{}`)); none != "" {
		t.Fatalf("expected empty hash when no signals")
	}
}

// TestOpenAIGatewayService_GenerateSessionHash_UsesXXHash64 pins the hash
// format: the 16-digit, zero-padded hex form of xxhash64 over the session_id
// header value.
func TestOpenAIGatewayService_GenerateSessionHash_UsesXXHash64(t *testing.T) {
	const sessionID = "sess-fixed-value"

	gin.SetMode(gin.TestMode)
	ginCtx, _ := gin.CreateTestContext(httptest.NewRecorder())
	req := httptest.NewRequest(http.MethodPost, "/openai/v1/responses", nil)
	req.Header.Set("session_id", sessionID)
	ginCtx.Request = req

	gateway := &OpenAIGatewayService{}
	expected := fmt.Sprintf("%016x", xxhash.Sum64String(sessionID))
	require.Equal(t, expected, gateway.GenerateSessionHash(ginCtx, nil))
}

// TestOpenAIGatewayService_GenerateSessionHash_AttachesLegacyHashToContext
// checks that, after hashing, the request held by the gin context carries a
// non-empty legacy session hash in its context.
func TestOpenAIGatewayService_GenerateSessionHash_AttachesLegacyHashToContext(t *testing.T) {
	gin.SetMode(gin.TestMode)
	ginCtx, _ := gin.CreateTestContext(httptest.NewRecorder())
	req := httptest.NewRequest(http.MethodPost, "/openai/v1/responses", nil)
	req.Header.Set("session_id", "sess-legacy-check")
	ginCtx.Request = req

	gateway := &OpenAIGatewayService{}
	require.NotEmpty(t, gateway.GenerateSessionHash(ginCtx, nil))

	// Read the request back from the gin context rather than reusing req.
	require.NotNil(t, ginCtx.Request)
	reqCtx := ginCtx.Request.Context()
	require.NotNil(t, reqCtx)
	require.NotEmpty(t, openAILegacySessionHashFromContext(reqCtx))
}

// TestOpenAIGatewayService_GenerateSessionHashWithFallback checks that, with
// no session signals in the request, the fallback seed is hashed with
// xxhash64 and a legacy hash is attached to the request context, while a
// whitespace-only seed yields an empty hash.
func TestOpenAIGatewayService_GenerateSessionHashWithFallback(t *testing.T) {
	const fallbackSeed = "openai_ws_ingress:9:100:200"

	gin.SetMode(gin.TestMode)
	ginCtx, _ := gin.CreateTestContext(httptest.NewRecorder())
	ginCtx.Request = httptest.NewRequest(http.MethodPost, "/openai/v1/responses", nil)

	gateway := &OpenAIGatewayService{}

	seeded := gateway.GenerateSessionHashWithFallback(ginCtx, []byte(`{}`), fallbackSeed)
	require.Equal(t, fmt.Sprintf("%016x", xxhash.Sum64String(fallbackSeed)), seeded)
	require.NotEmpty(t, openAILegacySessionHashFromContext(ginCtx.Request.Context()))

	blankSeeded := gateway.GenerateSessionHashWithFallback(ginCtx, []byte(`{}`), "   ")
	require.Equal(t, "", blankSeeded)
}

// GetAccountWaitingCount returns the scripted waiting count for accountID
// from waitCounts, or 0 when the account has no scripted entry.
func (c stubConcurrencyCache) GetAccountWaitingCount(ctx context.Context, accountID int64) (int, error) {
	// Indexing a nil map is safe and reports "not present".
	waiting, scripted := c.waitCounts[accountID]
	if !scripted {
		return 0, nil
	}
	return waiting, nil
}

// stubGatewayCache is an in-memory sticky-session cache used by the tests.
// sessionBindings maps a session hash to the bound account ID, and
// deletedSessions counts how many times each hash has been deleted. The
// groupID and ttl arguments of its methods are ignored.
type stubGatewayCache struct {
	sessionBindings map[string]int64
	deletedSessions map[string]int
}

// GetSessionAccountID returns the account bound to sessionHash, or a
// "not found" error when there is no binding.
func (c *stubGatewayCache) GetSessionAccountID(ctx context.Context, groupID int64, sessionHash string) (int64, error) {
	accountID, bound := c.sessionBindings[sessionHash]
	if !bound {
		return 0, errors.New("not found")
	}
	return accountID, nil
}

// SetSessionAccountID binds sessionHash to accountID, allocating the binding
// map on first use.
func (c *stubGatewayCache) SetSessionAccountID(ctx context.Context, groupID int64, sessionHash string, accountID int64, ttl time.Duration) error {
	if c.sessionBindings == nil {
		c.sessionBindings = map[string]int64{}
	}
	c.sessionBindings[sessionHash] = accountID
	return nil
}

// RefreshSessionTTL is a no-op; the stub does not model expiry.
func (c *stubGatewayCache) RefreshSessionTTL(ctx context.Context, groupID int64, sessionHash string, ttl time.Duration) error {
	return nil
}

// DeleteSessionAccountID removes the binding for sessionHash and bumps its
// deletion counter. When the binding map was never allocated the call is
// ignored and nothing is counted.
func (c *stubGatewayCache) DeleteSessionAccountID(ctx context.Context, groupID int64, sessionHash string) error {
	if c.sessionBindings != nil {
		if c.deletedSessions == nil {
			c.deletedSessions = map[string]int{}
		}
		c.deletedSessions[sessionHash]++
		delete(c.sessionBindings, sessionHash)
	}
	return nil
}

// TestOpenAISelectAccountWithLoadAwareness_FiltersUnschedulable checks that
// an account whose rate-limit reset time lies in the future is skipped in
// favor of the other account, with a concurrency service configured.
func TestOpenAISelectAccountWithLoadAwareness_FiltersUnschedulable(t *testing.T) {
	const wantID = int64(2)
	groupID := int64(1)
	rateLimitedUntil := time.Now().Add(10 * time.Minute)

	accounts := []Account{
		{
			ID:               1,
			Platform:         PlatformOpenAI,
			Type:             AccountTypeAPIKey,
			Status:           StatusActive,
			Schedulable:      true,
			Concurrency:      1,
			Priority:         0,
			RateLimitResetAt: &rateLimitedUntil,
		},
		{
			ID:          2,
			Platform:    PlatformOpenAI,
			Type:        AccountTypeAPIKey,
			Status:      StatusActive,
			Schedulable: true,
			Concurrency: 1,
			Priority:    1,
		},
	}

	gateway := &OpenAIGatewayService{
		accountRepo:        stubOpenAIAccountRepo{accounts: accounts},
		concurrencyService: NewConcurrencyService(stubConcurrencyCache{}),
	}

	picked, err := gateway.SelectAccountWithLoadAwareness(context.Background(), &groupID, "", "gpt-5.2", nil)
	switch {
	case err != nil:
		t.Fatalf("SelectAccountWithLoadAwareness error: %v", err)
	case picked == nil || picked.Account == nil:
		t.Fatalf("expected selection with account")
	case picked.Account.ID != wantID:
		t.Fatalf("expected account %d, got %d", wantID, picked.Account.ID)
	}
	if release := picked.ReleaseFunc; release != nil {
		release()
	}
}

// TestOpenAISelectAccountWithLoadAwareness_FiltersUnschedulableWhenNoConcurrencyService
// repeats the rate-limit filtering check with no concurrency service
// configured on the gateway.
func TestOpenAISelectAccountWithLoadAwareness_FiltersUnschedulableWhenNoConcurrencyService(t *testing.T) {
	const wantID = int64(2)
	groupID := int64(1)
	rateLimitedUntil := time.Now().Add(10 * time.Minute)

	accounts := []Account{
		{
			ID:               1,
			Platform:         PlatformOpenAI,
			Type:             AccountTypeAPIKey,
			Status:           StatusActive,
			Schedulable:      true,
			Concurrency:      1,
			Priority:         0,
			RateLimitResetAt: &rateLimitedUntil,
		},
		{
			ID:          2,
			Platform:    PlatformOpenAI,
			Type:        AccountTypeAPIKey,
			Status:      StatusActive,
			Schedulable: true,
			Concurrency: 1,
			Priority:    1,
		},
	}

	gateway := &OpenAIGatewayService{
		accountRepo: stubOpenAIAccountRepo{accounts: accounts},
		// concurrencyService is nil, forcing the non-load-batch selection path.
	}

	picked, err := gateway.SelectAccountWithLoadAwareness(context.Background(), &groupID, "", "gpt-5.2", nil)
	switch {
	case err != nil:
		t.Fatalf("SelectAccountWithLoadAwareness error: %v", err)
	case picked == nil || picked.Account == nil:
		t.Fatalf("expected selection with account")
	case picked.Account.ID != wantID:
		t.Fatalf("expected account %d, got %d", wantID, picked.Account.ID)
	}
	if release := picked.ReleaseFunc; release != nil {
		release()
	}
}

// TestOpenAISelectAccountForModelWithExclusions_StickyUnschedulableClearsSession
// starts with a sticky binding to a disabled account and expects the binding
// to be deleted once and then re-created for the active account.
func TestOpenAISelectAccountForModelWithExclusions_StickyUnschedulableClearsSession(t *testing.T) {
	const sessionHash = "session-1"
	stickyKey := "openai:" + sessionHash

	store := stubOpenAIAccountRepo{
		accounts: []Account{
			{ID: 1, Platform: PlatformOpenAI, Status: StatusDisabled, Schedulable: true, Concurrency: 1},
			{ID: 2, Platform: PlatformOpenAI, Status: StatusActive, Schedulable: true, Concurrency: 1},
		},
	}
	sessions := &stubGatewayCache{
		sessionBindings: map[string]int64{stickyKey: 1},
	}
	gateway := &OpenAIGatewayService{
		accountRepo: store,
		cache:       sessions,
	}

	picked, err := gateway.SelectAccountForModelWithExclusions(context.Background(), nil, sessionHash, "gpt-4", nil)
	if err != nil {
		t.Fatalf("SelectAccountForModelWithExclusions error: %v", err)
	}
	if picked == nil || picked.ID != 2 {
		t.Fatalf("expected account 2, got %+v", picked)
	}
	if deletions := sessions.deletedSessions[stickyKey]; deletions != 1 {
		t.Fatalf("expected sticky session to be deleted")
	}
	if bound := sessions.sessionBindings[stickyKey]; bound != 2 {
		t.Fatalf("expected sticky session to bind to account 2")
	}
}

// TestOpenAISelectAccountWithLoadAwareness_StickyUnschedulableClearsSession
// is the load-aware variant: a sticky binding to a disabled account must be
// deleted once and replaced by a binding to the active account.
func TestOpenAISelectAccountWithLoadAwareness_StickyUnschedulableClearsSession(t *testing.T) {
	const sessionHash = "session-2"
	stickyKey := "openai:" + sessionHash
	groupID := int64(1)

	store := stubOpenAIAccountRepo{
		accounts: []Account{
			{ID: 1, Platform: PlatformOpenAI, Status: StatusDisabled, Schedulable: true, Concurrency: 1},
			{ID: 2, Platform: PlatformOpenAI, Status: StatusActive, Schedulable: true, Concurrency: 1},
		},
	}
	sessions := &stubGatewayCache{
		sessionBindings: map[string]int64{stickyKey: 1},
	}
	gateway := &OpenAIGatewayService{
		accountRepo:        store,
		cache:              sessions,
		concurrencyService: NewConcurrencyService(stubConcurrencyCache{}),
	}

	picked, err := gateway.SelectAccountWithLoadAwareness(context.Background(), &groupID, sessionHash, "gpt-4", nil)
	if err != nil {
		t.Fatalf("SelectAccountWithLoadAwareness error: %v", err)
	}
	if picked == nil || picked.Account == nil || picked.Account.ID != 2 {
		t.Fatalf("expected account 2, got %+v", picked)
	}
	if deletions := sessions.deletedSessions[stickyKey]; deletions != 1 {
		t.Fatalf("expected sticky session to be deleted")
	}
	if bound := sessions.sessionBindings[stickyKey]; bound != 2 {
		t.Fatalf("expected sticky session to bind to account 2")
	}
	if release := picked.ReleaseFunc; release != nil {
		release()
	}
}

// TestOpenAISelectAccountForModelWithExclusions_NoModelSupport requests
// "gpt-4" when the only account's model_mapping lists "gpt-3.5-turbo", and
// expects a nil account plus an error mentioning "supporting model".
func TestOpenAISelectAccountForModelWithExclusions_NoModelSupport(t *testing.T) {
	store := stubOpenAIAccountRepo{
		accounts: []Account{
			{
				ID:          1,
				Platform:    PlatformOpenAI,
				Status:      StatusActive,
				Schedulable: true,
				Credentials: map[string]any{"model_mapping": map[string]any{"gpt-3.5-turbo": "gpt-3.5-turbo"}},
			},
		},
	}
	gateway := &OpenAIGatewayService{
		accountRepo: store,
		cache:       &stubGatewayCache{},
	}

	picked, err := gateway.SelectAccountForModelWithExclusions(context.Background(), nil, "", "gpt-4", nil)
	switch {
	case err == nil:
		t.Fatalf("expected error for unsupported model")
	case picked != nil:
		t.Fatalf("expected nil account for unsupported model")
	case !strings.Contains(err.Error(), "supporting model"):
		t.Fatalf("unexpected error: %v", err)
	}
}

// TestOpenAISelectAccountWithLoadAwareness_LoadBatchErrorFallback makes the
// batch load query fail and expects selection to still succeed, choosing the
// account with the lower priority value and binding the session to it.
func TestOpenAISelectAccountWithLoadAwareness_LoadBatchErrorFallback(t *testing.T) {
	groupID := int64(1)
	store := stubOpenAIAccountRepo{
		accounts: []Account{
			{ID: 1, Platform: PlatformOpenAI, Status: StatusActive, Schedulable: true, Concurrency: 1, Priority: 2},
			{ID: 2, Platform: PlatformOpenAI, Status: StatusActive, Schedulable: true, Concurrency: 1, Priority: 1},
		},
	}
	sessions := &stubGatewayCache{}
	slots := stubConcurrencyCache{loadBatchErr: errors.New("load batch failed")}

	gateway := &OpenAIGatewayService{
		accountRepo:        store,
		cache:              sessions,
		concurrencyService: NewConcurrencyService(slots),
	}

	picked, err := gateway.SelectAccountWithLoadAwareness(context.Background(), &groupID, "fallback", "gpt-4", nil)
	switch {
	case err != nil:
		t.Fatalf("SelectAccountWithLoadAwareness error: %v", err)
	case picked == nil || picked.Account == nil:
		t.Fatalf("expected selection")
	case picked.Account.ID != 2:
		t.Fatalf("expected account 2, got %d", picked.Account.ID)
	case sessions.sessionBindings["openai:fallback"] != 2:
		t.Fatalf("expected sticky session updated")
	}
	if release := picked.ReleaseFunc; release != nil {
		release()
	}
}

// TestOpenAISelectAccountWithLoadAwareness_NoSlotFallbackWait scripts slot
// acquisition to fail for the only account and expects a wait plan for that
// account instead of an error.
func TestOpenAISelectAccountWithLoadAwareness_NoSlotFallbackWait(t *testing.T) {
	groupID := int64(1)
	store := stubOpenAIAccountRepo{
		accounts: []Account{
			{ID: 1, Platform: PlatformOpenAI, Status: StatusActive, Schedulable: true, Concurrency: 1, Priority: 1},
		},
	}
	slots := stubConcurrencyCache{
		acquireResults: map[int64]bool{1: false},
		loadMap: map[int64]*AccountLoadInfo{
			1: {AccountID: 1, LoadRate: 10},
		},
	}

	gateway := &OpenAIGatewayService{
		accountRepo:        store,
		cache:              &stubGatewayCache{},
		concurrencyService: NewConcurrencyService(slots),
	}

	picked, err := gateway.SelectAccountWithLoadAwareness(context.Background(), &groupID, "", "gpt-4", nil)
	switch {
	case err != nil:
		t.Fatalf("SelectAccountWithLoadAwareness error: %v", err)
	case picked == nil || picked.WaitPlan == nil:
		t.Fatalf("expected wait plan fallback")
	case picked.Account == nil || picked.Account.ID != 1:
		t.Fatalf("expected account 1")
	}
}

// TestOpenAISelectAccountForModelWithExclusions_SetsStickyBinding checks that
// a successful selection with a session hash stores a sticky binding under
// the "openai:"-prefixed key.
func TestOpenAISelectAccountForModelWithExclusions_SetsStickyBinding(t *testing.T) {
	const sessionHash = "bind"

	store := stubOpenAIAccountRepo{
		accounts: []Account{
			{ID: 1, Platform: PlatformOpenAI, Status: StatusActive, Schedulable: true, Concurrency: 1, Priority: 1},
		},
	}
	sessions := &stubGatewayCache{}
	gateway := &OpenAIGatewayService{
		accountRepo: store,
		cache:       sessions,
	}

	picked, err := gateway.SelectAccountForModelWithExclusions(context.Background(), nil, sessionHash, "gpt-4", nil)
	switch {
	case err != nil:
		t.Fatalf("SelectAccountForModelWithExclusions error: %v", err)
	case picked == nil || picked.ID != 1:
		t.Fatalf("expected account 1")
	case sessions.sessionBindings["openai:"+sessionHash] != 1:
		t.Fatalf("expected sticky session binding")
	}
}

// TestOpenAISelectAccountWithLoadAwareness_StickyWaitPlan binds the session
// to an account whose slot cannot be acquired and expects a wait plan for
// that same account.
func TestOpenAISelectAccountWithLoadAwareness_StickyWaitPlan(t *testing.T) {
	const sessionHash = "sticky-wait"
	groupID := int64(1)

	store := stubOpenAIAccountRepo{
		accounts: []Account{
			{ID: 1, Platform: PlatformOpenAI, Status: StatusActive, Schedulable: true, Concurrency: 1, Priority: 1},
		},
	}
	sessions := &stubGatewayCache{
		sessionBindings: map[string]int64{"openai:" + sessionHash: 1},
	}
	slots := stubConcurrencyCache{
		acquireResults: map[int64]bool{1: false},
		waitCounts:     map[int64]int{1: 0},
	}

	gateway := &OpenAIGatewayService{
		accountRepo:        store,
		cache:              sessions,
		concurrencyService: NewConcurrencyService(slots),
	}

	picked, err := gateway.SelectAccountWithLoadAwareness(context.Background(), &groupID, sessionHash, "gpt-4", nil)
	switch {
	case err != nil:
		t.Fatalf("SelectAccountWithLoadAwareness error: %v", err)
	case picked == nil || picked.WaitPlan == nil:
		t.Fatalf("expected sticky wait plan")
	case picked.Account == nil || picked.Account.ID != 1:
		t.Fatalf("expected account 1")
	}
}

// TestOpenAISelectAccountWithLoadAwareness_PrefersLowerLoad gives two
// equal-priority accounts different load rates (80 vs 10) and expects the
// less loaded account to be selected and bound to the session.
func TestOpenAISelectAccountWithLoadAwareness_PrefersLowerLoad(t *testing.T) {
	groupID := int64(1)
	repo := stubOpenAIAccountRepo{
		accounts: []Account{
			{ID: 1, Platform: PlatformOpenAI, Status: StatusActive, Schedulable: true, Concurrency: 1, Priority: 1},
			{ID: 2, Platform: PlatformOpenAI, Status: StatusActive, Schedulable: true, Concurrency: 1, Priority: 1},
		},
	}
	cache := &stubGatewayCache{}
	concurrencyCache := stubConcurrencyCache{
		loadMap: map[int64]*AccountLoadInfo{
			1: {AccountID: 1, LoadRate: 80},
			2: {AccountID: 2, LoadRate: 10},
		},
	}

	svc := &OpenAIGatewayService{
		accountRepo:        repo,
		cache:              cache,
		concurrencyService: NewConcurrencyService(concurrencyCache),
	}

	selection, err := svc.SelectAccountWithLoadAwareness(context.Background(), &groupID, "load", "gpt-4", nil)
	if err != nil {
		t.Fatalf("SelectAccountWithLoadAwareness error: %v", err)
	}
	if selection == nil || selection.Account == nil || selection.Account.ID != 2 {
		t.Fatalf("expected account 2")
	}
	if cache.sessionBindings["openai:load"] != 2 {
		t.Fatalf("expected sticky session updated")
	}
	// Release the selection, matching the other load-awareness tests in this
	// file that select an account, so nothing is left held after the test.
	if selection.ReleaseFunc != nil {
		selection.ReleaseFunc()
	}
}

// TestOpenAISelectAccountForModelWithExclusions_StickyExcludedFallback binds
// the session to account 1, excludes account 1, and expects account 2.
func TestOpenAISelectAccountForModelWithExclusions_StickyExcludedFallback(t *testing.T) {
	const sessionHash = "excluded"

	store := stubOpenAIAccountRepo{
		accounts: []Account{
			{ID: 1, Platform: PlatformOpenAI, Status: StatusActive, Schedulable: true, Concurrency: 1, Priority: 1},
			{ID: 2, Platform: PlatformOpenAI, Status: StatusActive, Schedulable: true, Concurrency: 1, Priority: 2},
		},
	}
	sessions := &stubGatewayCache{
		sessionBindings: map[string]int64{"openai:" + sessionHash: 1},
	}
	gateway := &OpenAIGatewayService{
		accountRepo: store,
		cache:       sessions,
	}

	skipped := map[int64]struct{}{1: {}}
	picked, err := gateway.SelectAccountForModelWithExclusions(context.Background(), nil, sessionHash, "gpt-4", skipped)
	switch {
	case err != nil:
		t.Fatalf("SelectAccountForModelWithExclusions error: %v", err)
	case picked == nil || picked.ID != 2:
		t.Fatalf("expected account 2")
	}
}

// TestOpenAISelectAccountForModelWithExclusions_StickyNonOpenAI binds the
// session to an Anthropic-platform account and expects the OpenAI account to
// be selected instead.
func TestOpenAISelectAccountForModelWithExclusions_StickyNonOpenAI(t *testing.T) {
	const sessionHash = "non-openai"

	store := stubOpenAIAccountRepo{
		accounts: []Account{
			{ID: 1, Platform: PlatformAnthropic, Status: StatusActive, Schedulable: true, Concurrency: 1, Priority: 1},
			{ID: 2, Platform: PlatformOpenAI, Status: StatusActive, Schedulable: true, Concurrency: 1, Priority: 2},
		},
	}
	sessions := &stubGatewayCache{
		sessionBindings: map[string]int64{"openai:" + sessionHash: 1},
	}
	gateway := &OpenAIGatewayService{
		accountRepo: store,
		cache:       sessions,
	}

	picked, err := gateway.SelectAccountForModelWithExclusions(context.Background(), nil, sessionHash, "gpt-4", nil)
	switch {
	case err != nil:
		t.Fatalf("SelectAccountForModelWithExclusions error: %v", err)
	case picked == nil || picked.ID != 2:
		t.Fatalf("expected account 2")
	}
}

func TestOpenAISelectAccountForModelWithExclusions_NoAccounts(t *testing.T) {
	repo := stubOpenAIAccountRepo{accounts: []Account{}}
	cache := &stubGatewayCache{}

	svc := &OpenAIGatewayService{
		accountRepo: repo,
		cache:       cache,
	}

	acc, err := svc.SelectAccountForModelWithExclusions(context.Background(), nil, "", "", nil)
	if err == nil {
		t.Fatalf("expected error for no accounts")
	}
	if acc != nil {
		t.Fatalf("expected nil account")
	}
	if !strings.Contains(err.Error(), "no available OpenAI accounts") {
		t.Fatalf("unexpected error: %v", err)
	}
}

// TestOpenAISelectAccountWithLoadAwareness_NoCandidates makes the only
// account rate limited for another hour and expects an error with a nil
// selection.
func TestOpenAISelectAccountWithLoadAwareness_NoCandidates(t *testing.T) {
	groupID := int64(1)
	rateLimitedUntil := time.Now().Add(1 * time.Hour)

	store := stubOpenAIAccountRepo{
		accounts: []Account{
			{ID: 1, Platform: PlatformOpenAI, Status: StatusActive, Schedulable: true, Concurrency: 1, Priority: 1, RateLimitResetAt: &rateLimitedUntil},
		},
	}
	gateway := &OpenAIGatewayService{
		accountRepo:        store,
		cache:              &stubGatewayCache{},
		concurrencyService: NewConcurrencyService(stubConcurrencyCache{}),
	}

	picked, err := gateway.SelectAccountWithLoadAwareness(context.Background(), &groupID, "", "gpt-4", nil)
	switch {
	case err == nil:
		t.Fatalf("expected error for no candidates")
	case picked != nil:
		t.Fatalf("expected nil selection")
	}
}

// TestOpenAISelectAccountWithLoadAwareness_AllFullWaitPlan reports a load
// rate of 100 for the only account and expects a wait plan to be returned.
func TestOpenAISelectAccountWithLoadAwareness_AllFullWaitPlan(t *testing.T) {
	groupID := int64(1)
	store := stubOpenAIAccountRepo{
		accounts: []Account{
			{ID: 1, Platform: PlatformOpenAI, Status: StatusActive, Schedulable: true, Concurrency: 1, Priority: 1},
		},
	}
	slots := stubConcurrencyCache{
		loadMap: map[int64]*AccountLoadInfo{
			1: {AccountID: 1, LoadRate: 100},
		},
	}

	gateway := &OpenAIGatewayService{
		accountRepo:        store,
		cache:              &stubGatewayCache{},
		concurrencyService: NewConcurrencyService(slots),
	}

	picked, err := gateway.SelectAccountWithLoadAwareness(context.Background(), &groupID, "", "gpt-4", nil)
	switch {
	case err != nil:
		t.Fatalf("SelectAccountWithLoadAwareness error: %v", err)
	case picked == nil || picked.WaitPlan == nil:
		t.Fatalf("expected wait plan")
	}
}

// TestOpenAISelectAccountWithLoadAwareness_LoadBatchErrorNoAcquire combines a
// failing batch load query with a failing slot acquisition and expects a wait
// plan rather than an error.
func TestOpenAISelectAccountWithLoadAwareness_LoadBatchErrorNoAcquire(t *testing.T) {
	groupID := int64(1)
	store := stubOpenAIAccountRepo{
		accounts: []Account{
			{ID: 1, Platform: PlatformOpenAI, Status: StatusActive, Schedulable: true, Concurrency: 1, Priority: 1},
		},
	}
	slots := stubConcurrencyCache{
		loadBatchErr:   errors.New("load batch failed"),
		acquireResults: map[int64]bool{1: false},
	}

	gateway := &OpenAIGatewayService{
		accountRepo:        store,
		cache:              &stubGatewayCache{},
		concurrencyService: NewConcurrencyService(slots),
	}

	picked, err := gateway.SelectAccountWithLoadAwareness(context.Background(), &groupID, "", "gpt-4", nil)
	switch {
	case err != nil:
		t.Fatalf("SelectAccountWithLoadAwareness error: %v", err)
	case picked == nil || picked.WaitPlan == nil:
		t.Fatalf("expected wait plan")
	}
}

// TestOpenAISelectAccountWithLoadAwareness_MissingLoadInfo returns load info
// for account 1 only (skipDefaultLoad suppresses the stub's default entry for
// account 2) and expects account 2, the one without load info, to be chosen.
func TestOpenAISelectAccountWithLoadAwareness_MissingLoadInfo(t *testing.T) {
	groupID := int64(1)
	repo := stubOpenAIAccountRepo{
		accounts: []Account{
			{ID: 1, Platform: PlatformOpenAI, Status: StatusActive, Schedulable: true, Concurrency: 1, Priority: 1},
			{ID: 2, Platform: PlatformOpenAI, Status: StatusActive, Schedulable: true, Concurrency: 1, Priority: 1},
		},
	}
	cache := &stubGatewayCache{}
	concurrencyCache := stubConcurrencyCache{
		loadMap: map[int64]*AccountLoadInfo{
			1: {AccountID: 1, LoadRate: 50},
		},
		skipDefaultLoad: true,
	}

	svc := &OpenAIGatewayService{
		accountRepo:        repo,
		cache:              cache,
		concurrencyService: NewConcurrencyService(concurrencyCache),
	}

	selection, err := svc.SelectAccountWithLoadAwareness(context.Background(), &groupID, "", "gpt-4", nil)
	if err != nil {
		t.Fatalf("SelectAccountWithLoadAwareness error: %v", err)
	}
	if selection == nil || selection.Account == nil || selection.Account.ID != 2 {
		t.Fatalf("expected account 2")
	}
	// Release the selection, matching the other load-awareness tests in this
	// file that select an account, so nothing is left held after the test.
	if selection.ReleaseFunc != nil {
		selection.ReleaseFunc()
	}
}

// TestOpenAISelectAccountForModelWithExclusions_LeastRecentlyUsed gives two
// equal-priority accounts different LastUsedAt times and expects the one
// used longer ago to be selected.
func TestOpenAISelectAccountForModelWithExclusions_LeastRecentlyUsed(t *testing.T) {
	usedTwoHoursAgo := time.Now().Add(-2 * time.Hour)
	usedOneHourAgo := time.Now().Add(-1 * time.Hour)

	store := stubOpenAIAccountRepo{
		accounts: []Account{
			{ID: 1, Platform: PlatformOpenAI, Status: StatusActive, Schedulable: true, Priority: 1, LastUsedAt: &usedOneHourAgo},
			{ID: 2, Platform: PlatformOpenAI, Status: StatusActive, Schedulable: true, Priority: 1, LastUsedAt: &usedTwoHoursAgo},
		},
	}
	gateway := &OpenAIGatewayService{
		accountRepo: store,
		cache:       &stubGatewayCache{},
	}

	picked, err := gateway.SelectAccountForModelWithExclusions(context.Background(), nil, "", "gpt-4", nil)
	switch {
	case err != nil:
		t.Fatalf("SelectAccountForModelWithExclusions error: %v", err)
	case picked == nil || picked.ID != 2:
		t.Fatalf("expected account 2")
	}
}

// TestOpenAISelectAccountWithLoadAwareness_PreferNeverUsed gives two accounts
// the same priority and load rate; only account 1 has a LastUsedAt value. The
// never-used account 2 is expected to be selected.
func TestOpenAISelectAccountWithLoadAwareness_PreferNeverUsed(t *testing.T) {
	groupID := int64(1)
	lastUsed := time.Now().Add(-1 * time.Hour)
	repo := stubOpenAIAccountRepo{
		accounts: []Account{
			{ID: 1, Platform: PlatformOpenAI, Status: StatusActive, Schedulable: true, Concurrency: 1, Priority: 1, LastUsedAt: &lastUsed},
			{ID: 2, Platform: PlatformOpenAI, Status: StatusActive, Schedulable: true, Concurrency: 1, Priority: 1},
		},
	}
	cache := &stubGatewayCache{}
	concurrencyCache := stubConcurrencyCache{
		loadMap: map[int64]*AccountLoadInfo{
			1: {AccountID: 1, LoadRate: 10},
			2: {AccountID: 2, LoadRate: 10},
		},
	}

	svc := &OpenAIGatewayService{
		accountRepo:        repo,
		cache:              cache,
		concurrencyService: NewConcurrencyService(concurrencyCache),
	}

	selection, err := svc.SelectAccountWithLoadAwareness(context.Background(), &groupID, "", "gpt-4", nil)
	if err != nil {
		t.Fatalf("SelectAccountWithLoadAwareness error: %v", err)
	}
	if selection == nil || selection.Account == nil || selection.Account.ID != 2 {
		t.Fatalf("expected account 2")
	}
	// Release the selection, matching the other load-awareness tests in this
	// file that select an account, so nothing is left held after the test.
	if selection.ReleaseFunc != nil {
		selection.ReleaseFunc()
	}
}

// TestOpenAIStreamingTimeout checks that handleStreamingResponse returns a
// "stream data interval timeout" error and writes an error SSE event tagged
// stream_timeout when the upstream body never delivers any data.
//
// NOTE(review): StreamDataIntervalTimeout is set to 1; the unit is presumably
// seconds — confirm against config.GatewayConfig.
func TestOpenAIStreamingTimeout(t *testing.T) {
	gin.SetMode(gin.TestMode)
	cfg := &config.Config{
		Gateway: config.GatewayConfig{
			StreamDataIntervalTimeout: 1,
			StreamKeepaliveInterval:   0,
			MaxLineSize:               defaultMaxLineSize,
		},
	}
	svc := &OpenAIGatewayService{cfg: cfg}

	rec := httptest.NewRecorder()
	c, _ := gin.CreateTestContext(rec)
	c.Request = httptest.NewRequest(http.MethodPost, "/", nil)

	// Nothing is written to pw before the handler returns, so reads on the
	// response body block for the whole call.
	pr, pw := io.Pipe()
	resp := &http.Response{
		StatusCode: http.StatusOK,
		Body:       pr,
		Header:     http.Header{},
	}

	start := time.Now()
	_, err := svc.handleStreamingResponse(c.Request.Context(), resp, c, &Account{ID: 1}, start, "model", "model")
	// Close both pipe ends only after the handler has returned.
	_ = pw.Close()
	_ = pr.Close()

	if err == nil || !strings.Contains(err.Error(), "stream data interval timeout") {
		t.Fatalf("expected stream timeout error, got %v", err)
	}
	if !strings.Contains(rec.Body.String(), "\"type\":\"error\"") || !strings.Contains(rec.Body.String(), "stream_timeout") {
		t.Fatalf("expected OpenAI-compatible error SSE event, got %q", rec.Body.String())
	}
}

// TestOpenAIStreamingContextCanceledDoesNotInjectErrorEvent runs the
// streaming handler with an already-canceled request context and a body
// whose reads fail with context.Canceled. It expects a nil error and no
// error SSE event in the recorded output.
func TestOpenAIStreamingContextCanceledDoesNotInjectErrorEvent(t *testing.T) {
	gin.SetMode(gin.TestMode)
	settings := &config.Config{
		Gateway: config.GatewayConfig{
			StreamDataIntervalTimeout: 0,
			StreamKeepaliveInterval:   0,
			MaxLineSize:               defaultMaxLineSize,
		},
	}
	gateway := &OpenAIGatewayService{cfg: settings}

	canceledCtx, cancel := context.WithCancel(context.Background())
	cancel()

	recorder := httptest.NewRecorder()
	ginCtx, _ := gin.CreateTestContext(recorder)
	ginCtx.Request = httptest.NewRequest(http.MethodPost, "/", nil).WithContext(canceledCtx)

	upstream := &http.Response{
		StatusCode: http.StatusOK,
		Body:       cancelReadCloser{},
		Header:     http.Header{},
	}

	if _, err := gateway.handleStreamingResponse(ginCtx.Request.Context(), upstream, ginCtx, &Account{ID: 1}, time.Now(), "model", "model"); err != nil {
		t.Fatalf("expected nil error, got %v", err)
	}

	// Neither marker of an injected error event may appear in the output.
	written := recorder.Body.String()
	for _, marker := range []string{"event: error", "stream_read_error"} {
		if strings.Contains(written, marker) {
			t.Fatalf("expected no injected SSE error event, got %q", written)
		}
	}
}

// TestOpenAIStreamingClientDisconnectDrainsUpstreamUsage checks that usage
// figures from the upstream response.completed event are still collected
// when every write to the client fails, and that no error SSE event is
// written to the recorder.
func TestOpenAIStreamingClientDisconnectDrainsUpstreamUsage(t *testing.T) {
	gin.SetMode(gin.TestMode)
	cfg := &config.Config{
		Gateway: config.GatewayConfig{
			StreamDataIntervalTimeout: 0,
			StreamKeepaliveInterval:   0,
			MaxLineSize:               defaultMaxLineSize,
		},
	}
	svc := &OpenAIGatewayService{cfg: cfg}

	rec := httptest.NewRecorder()
	c, _ := gin.CreateTestContext(rec)
	c.Request = httptest.NewRequest(http.MethodPost, "/", nil)
	// failAfter: 0 makes the very first Write fail.
	c.Writer = &failingGinWriter{ResponseWriter: c.Writer, failAfter: 0}

	pr, pw := io.Pipe()
	resp := &http.Response{
		StatusCode: http.StatusOK,
		Body:       pr,
		Header:     http.Header{},
	}

	// Feed two SSE events from a separate goroutine; the second one carries
	// the usage numbers asserted below. Closing pw ends the stream.
	go func() {
		defer func() { _ = pw.Close() }()
		_, _ = pw.Write([]byte("data: {\"type\":\"response.in_progress\",\"response\":{}}\n\n"))
		_, _ = pw.Write([]byte("data: {\"type\":\"response.completed\",\"response\":{\"usage\":{\"input_tokens\":3,\"output_tokens\":5,\"input_tokens_details\":{\"cached_tokens\":1}}}}\n\n"))
	}()

	result, err := svc.handleStreamingResponse(c.Request.Context(), resp, c, &Account{ID: 1}, time.Now(), "model", "model")
	_ = pr.Close()
	if err != nil {
		t.Fatalf("expected nil error, got %v", err)
	}
	if result == nil || result.usage == nil {
		t.Fatalf("expected usage result")
	}
	if result.usage.InputTokens != 3 || result.usage.OutputTokens != 5 || result.usage.CacheReadInputTokens != 1 {
		t.Fatalf("unexpected usage: %+v", *result.usage)
	}
	if strings.Contains(rec.Body.String(), "event: error") || strings.Contains(rec.Body.String(), "write_failed") {
		t.Fatalf("expected no injected SSE error event, got %q", rec.Body.String())
	}
}

// TestOpenAIStreamingTooLong sends a single 128 KiB line through a handler
// configured with a 64 KiB MaxLineSize and expects bufio.ErrTooLong plus an
// error SSE event tagged response_too_large.
func TestOpenAIStreamingTooLong(t *testing.T) {
	gin.SetMode(gin.TestMode)
	cfg := &config.Config{
		Gateway: config.GatewayConfig{
			StreamDataIntervalTimeout: 0,
			StreamKeepaliveInterval:   0,
			MaxLineSize:               64 * 1024,
		},
	}
	svc := &OpenAIGatewayService{cfg: cfg}

	rec := httptest.NewRecorder()
	c, _ := gin.CreateTestContext(rec)
	c.Request = httptest.NewRequest(http.MethodPost, "/", nil)

	pr, pw := io.Pipe()
	resp := &http.Response{
		StatusCode: http.StatusOK,
		Body:       pr,
		Header:     http.Header{},
	}

	go func() {
		defer func() { _ = pw.Close() }()
		// Write a single line larger than MaxLineSize to trigger ErrTooLong.
		payload := "data: " + strings.Repeat("a", 128*1024) + "\n"
		_, _ = pw.Write([]byte(payload))
	}()

	_, err := svc.handleStreamingResponse(c.Request.Context(), resp, c, &Account{ID: 2}, time.Now(), "model", "model")
	// Closing the read end unblocks the writer goroutine if it is still
	// blocked in Write.
	_ = pr.Close()

	if !errors.Is(err, bufio.ErrTooLong) {
		t.Fatalf("expected ErrTooLong, got %v", err)
	}
	if !strings.Contains(rec.Body.String(), "\"type\":\"error\"") || !strings.Contains(rec.Body.String(), "response_too_large") {
		t.Fatalf("expected OpenAI-compatible error SSE event, got %q", rec.Body.String())
	}
}

// TestOpenAINonStreamingContentTypePassThrough checks that, with the
// ResponseHeaders switch disabled, handleNonStreamingResponse writes the
// upstream Content-Type value into the client response.
func TestOpenAINonStreamingContentTypePassThrough(t *testing.T) {
	gin.SetMode(gin.TestMode)

	svc := &OpenAIGatewayService{cfg: &config.Config{
		Security: config.SecurityConfig{
			ResponseHeaders: config.ResponseHeaderConfig{Enabled: false},
		},
	}}

	recorder := httptest.NewRecorder()
	ginCtx, _ := gin.CreateTestContext(recorder)
	ginCtx.Request = httptest.NewRequest(http.MethodPost, "/", nil)

	payload := []byte(`{"usage":{"input_tokens":1,"output_tokens":2,"input_tokens_details":{"cached_tokens":0}}}`)
	upstream := &http.Response{
		StatusCode: http.StatusOK,
		Body:       io.NopCloser(bytes.NewReader(payload)),
		Header:     http.Header{"Content-Type": []string{"application/vnd.test+json"}},
	}

	if _, err := svc.handleNonStreamingResponse(ginCtx.Request.Context(), upstream, ginCtx, &Account{}, "model", "model"); err != nil {
		t.Fatalf("handleNonStreamingResponse error: %v", err)
	}

	if got := recorder.Header().Get("Content-Type"); !strings.Contains(got, "application/vnd.test+json") {
		t.Fatalf("expected Content-Type passthrough, got %q", got)
	}
}

// TestOpenAINonStreamingContentTypeDefault checks that when the upstream
// response carries no Content-Type header, handleNonStreamingResponse answers
// with a Content-Type containing "application/json".
func TestOpenAINonStreamingContentTypeDefault(t *testing.T) {
	gin.SetMode(gin.TestMode)

	svc := &OpenAIGatewayService{cfg: &config.Config{
		Security: config.SecurityConfig{
			ResponseHeaders: config.ResponseHeaderConfig{Enabled: false},
		},
	}}

	recorder := httptest.NewRecorder()
	ginCtx, _ := gin.CreateTestContext(recorder)
	ginCtx.Request = httptest.NewRequest(http.MethodPost, "/", nil)

	payload := []byte(`{"usage":{"input_tokens":1,"output_tokens":2,"input_tokens_details":{"cached_tokens":0}}}`)
	upstream := &http.Response{
		StatusCode: http.StatusOK,
		Body:       io.NopCloser(bytes.NewReader(payload)),
		Header:     http.Header{},
	}

	if _, err := svc.handleNonStreamingResponse(ginCtx.Request.Context(), upstream, ginCtx, &Account{}, "model", "model"); err != nil {
		t.Fatalf("handleNonStreamingResponse error: %v", err)
	}

	if got := recorder.Header().Get("Content-Type"); !strings.Contains(got, "application/json") {
		t.Fatalf("expected default Content-Type, got %q", got)
	}
}

// TestOpenAIStreamingHeadersOverride checks the headers written by
// handleStreamingResponse: Cache-Control must become "no-cache", Content-Type
// must become "text/event-stream", and the upstream X-Request-Id must be kept.
func TestOpenAIStreamingHeadersOverride(t *testing.T) {
	gin.SetMode(gin.TestMode)

	svc := &OpenAIGatewayService{cfg: &config.Config{
		Security: config.SecurityConfig{
			ResponseHeaders: config.ResponseHeaderConfig{Enabled: false},
		},
		Gateway: config.GatewayConfig{
			StreamDataIntervalTimeout: 0,
			StreamKeepaliveInterval:   0,
			MaxLineSize:               defaultMaxLineSize,
		},
	}}

	recorder := httptest.NewRecorder()
	ginCtx, _ := gin.CreateTestContext(recorder)
	ginCtx.Request = httptest.NewRequest(http.MethodPost, "/", nil)

	reader, writer := io.Pipe()
	upstream := &http.Response{
		StatusCode: http.StatusOK,
		Body:       reader,
		Header: http.Header{
			"Cache-Control": []string{"upstream"},
			"X-Request-Id":  []string{"req-123"},
			"Content-Type":  []string{"application/custom"},
		},
	}

	go func() {
		defer func() { _ = writer.Close() }()
		_, _ = writer.Write([]byte("data: {}\n\n"))
	}()

	_, err := svc.handleStreamingResponse(ginCtx.Request.Context(), upstream, ginCtx, &Account{ID: 1}, time.Now(), "model", "model")
	_ = reader.Close()
	if err != nil {
		t.Fatalf("handleStreamingResponse error: %v", err)
	}

	sent := recorder.Header()
	if got := sent.Get("Cache-Control"); got != "no-cache" {
		t.Fatalf("expected Cache-Control override, got %q", got)
	}
	if got := sent.Get("Content-Type"); got != "text/event-stream" {
		t.Fatalf("expected Content-Type override, got %q", got)
	}
	if got := sent.Get("X-Request-Id"); got != "req-123" {
		t.Fatalf("expected X-Request-Id passthrough, got %q", got)
	}
}

// TestOpenAIStreamingReuseScannerBufferAndStillWorks streams one
// response.completed event through handleStreamingResponse and asserts that the
// usage counters carried by that event are returned in the result.
func TestOpenAIStreamingReuseScannerBufferAndStillWorks(t *testing.T) {
	gin.SetMode(gin.TestMode)

	svc := &OpenAIGatewayService{cfg: &config.Config{
		Gateway: config.GatewayConfig{
			StreamDataIntervalTimeout: 0,
			StreamKeepaliveInterval:   0,
			MaxLineSize:               defaultMaxLineSize,
		},
	}}

	recorder := httptest.NewRecorder()
	ginCtx, _ := gin.CreateTestContext(recorder)
	ginCtx.Request = httptest.NewRequest(http.MethodPost, "/", nil)

	reader, writer := io.Pipe()
	upstream := &http.Response{StatusCode: http.StatusOK, Body: reader, Header: http.Header{}}

	const completedEvent = "data: {\"type\":\"response.completed\",\"response\":{\"usage\":{\"input_tokens\":1,\"output_tokens\":2,\"input_tokens_details\":{\"cached_tokens\":3}}}}\n\n"
	go func() {
		defer func() { _ = writer.Close() }()
		_, _ = writer.Write([]byte(completedEvent))
	}()

	result, err := svc.handleStreamingResponse(ginCtx.Request.Context(), upstream, ginCtx, &Account{ID: 1}, time.Now(), "model", "model")
	_ = reader.Close()

	require.NoError(t, err)
	require.NotNil(t, result)
	require.NotNil(t, result.usage)

	usage := result.usage
	require.Equal(t, 1, usage.InputTokens)
	require.Equal(t, 2, usage.OutputTokens)
	require.Equal(t, 3, usage.CacheReadInputTokens)
}

// TestOpenAIInvalidBaseURLWhenAllowlistDisabled asserts that
// buildUpstreamRequest returns an error for an API-key account whose base_url
// is "://invalid-url", even though the URL allowlist is disabled.
func TestOpenAIInvalidBaseURLWhenAllowlistDisabled(t *testing.T) {
	gin.SetMode(gin.TestMode)

	svc := &OpenAIGatewayService{cfg: &config.Config{
		Security: config.SecurityConfig{
			URLAllowlist: config.URLAllowlistConfig{Enabled: false},
		},
	}}

	recorder := httptest.NewRecorder()
	ginCtx, _ := gin.CreateTestContext(recorder)
	ginCtx.Request = httptest.NewRequest(http.MethodPost, "/", nil)

	badAccount := &Account{
		Platform:    PlatformOpenAI,
		Type:        AccountTypeAPIKey,
		Credentials: map[string]any{"base_url": "://invalid-url"},
	}

	if _, err := svc.buildUpstreamRequest(ginCtx.Request.Context(), ginCtx, badAccount, []byte("{}"), "token", false, "", false); err == nil {
		t.Fatalf("expected error for invalid base_url when allowlist disabled")
	}
}

func TestOpenAIValidateUpstreamBaseURLDisabledRequiresHTTPS(t *testing.T) {
	cfg := &config.Config{
		Security: config.SecurityConfig{
			URLAllowlist: config.URLAllowlistConfig{Enabled: false},
		},
	}
	svc := &OpenAIGatewayService{cfg: cfg}

	if _, err := svc.validateUpstreamBaseURL("http://not-https.example.com"); err == nil {
		t.Fatalf("expected http to be rejected when allow_insecure_http is false")
	}
	normalized, err := svc.validateUpstreamBaseURL("https://example.com")
	if err != nil {
		t.Fatalf("expected https to be allowed when allowlist disabled, got %v", err)
	}
	if normalized != "https://example.com" {
		t.Fatalf("expected raw url passthrough, got %q", normalized)
	}
}

// TestOpenAIValidateUpstreamBaseURLDisabledAllowsHTTP covers the disabled
// allowlist with AllowInsecureHTTP set: an http URL must be accepted and
// returned unchanged.
func TestOpenAIValidateUpstreamBaseURLDisabledAllowsHTTP(t *testing.T) {
	allowlist := config.URLAllowlistConfig{
		Enabled:           false,
		AllowInsecureHTTP: true,
	}
	svc := &OpenAIGatewayService{cfg: &config.Config{
		Security: config.SecurityConfig{URLAllowlist: allowlist},
	}}

	got, err := svc.validateUpstreamBaseURL("http://not-https.example.com")
	if err != nil {
		t.Fatalf("expected http allowed when allow_insecure_http is true, got %v", err)
	}
	if got != "http://not-https.example.com" {
		t.Fatalf("expected raw url passthrough, got %q", got)
	}
}

// TestOpenAIValidateUpstreamBaseURLEnabledEnforcesAllowlist enables the
// allowlist with a single upstream host and asserts that a URL on that host
// validates while a URL on another host is rejected.
func TestOpenAIValidateUpstreamBaseURLEnabledEnforcesAllowlist(t *testing.T) {
	allowlist := config.URLAllowlistConfig{
		Enabled:       true,
		UpstreamHosts: []string{"example.com"},
	}
	svc := &OpenAIGatewayService{cfg: &config.Config{
		Security: config.SecurityConfig{URLAllowlist: allowlist},
	}}

	_, allowedErr := svc.validateUpstreamBaseURL("https://example.com")
	if allowedErr != nil {
		t.Fatalf("expected allowlisted host to pass, got %v", allowedErr)
	}

	_, blockedErr := svc.validateUpstreamBaseURL("https://evil.com")
	if blockedErr == nil {
		t.Fatalf("expected non-allowlisted host to fail")
	}
}

// TestOpenAIUpdateCodexUsageSnapshotFromHeaders passes a set of x-codex-*
// headers to UpdateCodexUsageSnapshotFromHeaders and waits up to two seconds
// for the repository stub to receive an UpdateExtra call, then checks the
// 5h/7d usage percentages and reset-after values in the recorded update map.
func TestOpenAIUpdateCodexUsageSnapshotFromHeaders(t *testing.T) {
	repo := &snapshotUpdateAccountRepo{updateExtraCalls: make(chan map[string]any, 1)}
	svc := &OpenAIGatewayService{accountRepo: repo}

	headers := http.Header{}
	for _, kv := range [][2]string{
		{"x-codex-primary-used-percent", "12"},
		{"x-codex-secondary-used-percent", "34"},
		{"x-codex-primary-window-minutes", "300"},
		{"x-codex-secondary-window-minutes", "10080"},
		{"x-codex-primary-reset-after-seconds", "600"},
		{"x-codex-secondary-reset-after-seconds", "86400"},
	} {
		headers.Set(kv[0], kv[1])
	}

	svc.UpdateCodexUsageSnapshotFromHeaders(context.Background(), 123, headers)

	var updates map[string]any
	select {
	case updates = <-repo.updateExtraCalls:
	case <-time.After(2 * time.Second):
		t.Fatal("expected UpdateExtra to be called")
	}

	require.Equal(t, 12.0, updates["codex_5h_used_percent"])
	require.Equal(t, 34.0, updates["codex_7d_used_percent"])
	require.Equal(t, 600, updates["codex_5h_reset_after_seconds"])
	require.Equal(t, 86400, updates["codex_7d_reset_after_seconds"])
}

// TestOpenAIResponsesRequestPathSuffix is a table-driven check of
// openAIResponsesRequestPathSuffix: for each request path it asserts the suffix
// the helper reports (empty for an exact or unrelated path).
func TestOpenAIResponsesRequestPathSuffix(t *testing.T) {
	gin.SetMode(gin.TestMode)
	recorder := httptest.NewRecorder()
	ginCtx, _ := gin.CreateTestContext(recorder)

	cases := []struct {
		name       string
		path       string
		wantSuffix string
	}{
		{
			name:       "exact v1 responses",
			path:       "/v1/responses",
			wantSuffix: "",
		},
		{
			name:       "compact v1 responses",
			path:       "/v1/responses/compact",
			wantSuffix: "/compact",
		},
		{
			name:       "compact alias responses",
			path:       "/responses/compact/",
			wantSuffix: "/compact",
		},
		{
			name:       "nested suffix",
			path:       "/openai/v1/responses/compact/detail",
			wantSuffix: "/compact/detail",
		},
		{
			name:       "unrelated path",
			path:       "/v1/chat/completions",
			wantSuffix: "",
		},
	}

	for _, tc := range cases {
		t.Run(tc.name, func(t *testing.T) {
			// The gin context is shared; only its request is swapped per case.
			ginCtx.Request = httptest.NewRequest(http.MethodPost, tc.path, nil)
			got := openAIResponsesRequestPathSuffix(ginCtx)
			require.Equal(t, tc.wantSuffix, got)
		})
	}
}

// TestOpenAIBuildUpstreamRequestOpenAIPassthroughPreservesCompactPath builds a
// passthrough upstream request for an OAuth account from a
// /v1/responses/compact call and asserts the "/compact" suffix on the target
// URL plus the Accept, Version and Session_Id headers.
func TestOpenAIBuildUpstreamRequestOpenAIPassthroughPreservesCompactPath(t *testing.T) {
	gin.SetMode(gin.TestMode)

	payload := []byte(`{"model":"gpt-5"}`)
	recorder := httptest.NewRecorder()
	ginCtx, _ := gin.CreateTestContext(recorder)
	ginCtx.Request = httptest.NewRequest(http.MethodPost, "/v1/responses/compact", bytes.NewReader([]byte(`{"model":"gpt-5"}`)))

	svc := &OpenAIGatewayService{}
	oauthAccount := &Account{Type: AccountTypeOAuth}

	upstreamReq, err := svc.buildUpstreamRequestOpenAIPassthrough(ginCtx.Request.Context(), ginCtx, oauthAccount, payload, "token")
	require.NoError(t, err)

	require.Equal(t, chatgptCodexURL+"/compact", upstreamReq.URL.String())
	sent := upstreamReq.Header
	require.Equal(t, "application/json", sent.Get("Accept"))
	require.Equal(t, codexCLIVersion, sent.Get("Version"))
	require.NotEmpty(t, sent.Get("Session_Id"))
}

// TestOpenAIBuildUpstreamRequestCompactForcesJSONAcceptForOAuth builds an
// upstream request for an OAuth account from a /v1/responses/compact call and
// asserts the "/compact" target URL, an "application/json" Accept header, the
// Codex CLI Version header and a non-empty Session_Id.
func TestOpenAIBuildUpstreamRequestCompactForcesJSONAcceptForOAuth(t *testing.T) {
	gin.SetMode(gin.TestMode)

	payload := []byte(`{"model":"gpt-5"}`)
	recorder := httptest.NewRecorder()
	ginCtx, _ := gin.CreateTestContext(recorder)
	ginCtx.Request = httptest.NewRequest(http.MethodPost, "/v1/responses/compact", bytes.NewReader([]byte(`{"model":"gpt-5"}`)))

	svc := &OpenAIGatewayService{}
	oauthAccount := &Account{
		Type:        AccountTypeOAuth,
		Credentials: map[string]any{"chatgpt_account_id": "chatgpt-acc"},
	}

	upstreamReq, err := svc.buildUpstreamRequest(ginCtx.Request.Context(), ginCtx, oauthAccount, payload, "token", false, "", true)
	require.NoError(t, err)

	require.Equal(t, chatgptCodexURL+"/compact", upstreamReq.URL.String())
	sent := upstreamReq.Header
	require.Equal(t, "application/json", sent.Get("Accept"))
	require.Equal(t, codexCLIVersion, sent.Get("Version"))
	require.NotEmpty(t, sent.Get("Session_Id"))
}

// TestOpenAIBuildUpstreamRequestPreservesCompactPathForAPIKeyBaseURL builds an
// upstream request for an API-key account with a custom base_url from a
// /responses/compact call and asserts the resulting URL is
// "<base_url>/responses/compact".
func TestOpenAIBuildUpstreamRequestPreservesCompactPathForAPIKeyBaseURL(t *testing.T) {
	gin.SetMode(gin.TestMode)

	payload := []byte(`{"model":"gpt-5"}`)
	recorder := httptest.NewRecorder()
	ginCtx, _ := gin.CreateTestContext(recorder)
	ginCtx.Request = httptest.NewRequest(http.MethodPost, "/responses/compact", bytes.NewReader([]byte(`{"model":"gpt-5"}`)))

	cfg := &config.Config{
		Security: config.SecurityConfig{
			URLAllowlist: config.URLAllowlistConfig{Enabled: false},
		},
	}
	svc := &OpenAIGatewayService{cfg: cfg}
	apiKeyAccount := &Account{
		Type:        AccountTypeAPIKey,
		Platform:    PlatformOpenAI,
		Credentials: map[string]any{"base_url": "https://example.com/v1"},
	}

	upstreamReq, err := svc.buildUpstreamRequest(ginCtx.Request.Context(), ginCtx, apiKeyAccount, payload, "token", false, "", false)
	require.NoError(t, err)
	require.Equal(t, "https://example.com/v1/responses/compact", upstreamReq.URL.String())
}

// TestOpenAIBuildUpstreamRequestOAuthOfficialClientOriginatorCompatibility is a
// table-driven check of the "originator" header on upstream requests built for
// an OAuth account. Each case sets an optional User-Agent and/or originator on
// the inbound request and asserts the originator sent upstream.
func TestOpenAIBuildUpstreamRequestOAuthOfficialClientOriginatorCompatibility(t *testing.T) {
	gin.SetMode(gin.TestMode)

	cases := []struct {
		name           string
		userAgent      string
		originator     string
		wantOriginator string
	}{
		{
			name:           "desktop originator preserved",
			originator:     "Codex Desktop",
			wantOriginator: "Codex Desktop",
		},
		{
			name:           "vscode originator preserved",
			originator:     "codex_vscode",
			wantOriginator: "codex_vscode",
		},
		{
			name:           "official ua fallback to codex_cli_rs",
			userAgent:      "Codex Desktop/1.2.3",
			wantOriginator: "codex_cli_rs",
		},
	}

	for _, tc := range cases {
		t.Run(tc.name, func(t *testing.T) {
			payload := []byte(`{"model":"gpt-5"}`)
			recorder := httptest.NewRecorder()
			ginCtx, _ := gin.CreateTestContext(recorder)
			ginCtx.Request = httptest.NewRequest(http.MethodPost, "/v1/responses", bytes.NewReader([]byte(`{"model":"gpt-5"}`)))

			// Only set the inbound headers a case actually specifies.
			if tc.userAgent != "" {
				ginCtx.Request.Header.Set("User-Agent", tc.userAgent)
			}
			if tc.originator != "" {
				ginCtx.Request.Header.Set("originator", tc.originator)
			}

			svc := &OpenAIGatewayService{}
			oauthAccount := &Account{
				Type:        AccountTypeOAuth,
				Credentials: map[string]any{"chatgpt_account_id": "chatgpt-acc"},
			}

			official := openai.IsCodexOfficialClientByHeaders(ginCtx.GetHeader("User-Agent"), ginCtx.GetHeader("originator"))
			upstreamReq, err := svc.buildUpstreamRequest(ginCtx.Request.Context(), ginCtx, oauthAccount, payload, "token", false, "", official)
			require.NoError(t, err)
			require.Equal(t, tc.wantOriginator, upstreamReq.Header.Get("originator"))
		})
	}
}

// ==================== P1-08 fix: model replacement performance optimization tests ====================

// TestReplaceModelInSSELine is a table-driven check of replaceModelInSSELine.
// Each case supplies one SSE line plus a from/to model pair and the exact line
// expected back, covering top-level and nested model fields, non-matching or
// missing models, non-data lines, invalid JSON and the "data:" no-space form.
func TestReplaceModelInSSELine(t *testing.T) {
	svc := &OpenAIGatewayService{}

	cases := []struct {
		name, line, from, to, want string
	}{
		{
			name: "顶层 model 字段替换", from: "gpt-4o", to: "my-custom-model",
			line: `data: {"id":"chatcmpl-123","model":"gpt-4o","choices":[]}`,
			want: `data: {"id":"chatcmpl-123","model":"my-custom-model","choices":[]}`,
		},
		{
			name: "嵌套 response.model 替换", from: "gpt-4o", to: "my-model",
			line: `data: {"type":"response","response":{"id":"resp-1","model":"gpt-4o","output":[]}}`,
			want: `data: {"type":"response","response":{"id":"resp-1","model":"my-model","output":[]}}`,
		},
		{
			name: "model 不匹配时不替换", from: "gpt-4o", to: "my-model",
			line: `data: {"id":"chatcmpl-123","model":"gpt-3.5-turbo","choices":[]}`,
			want: `data: {"id":"chatcmpl-123","model":"gpt-3.5-turbo","choices":[]}`,
		},
		{
			name: "无 model 字段时不替换", from: "gpt-4o", to: "my-model",
			line: `data: {"id":"chatcmpl-123","choices":[]}`,
			want: `data: {"id":"chatcmpl-123","choices":[]}`,
		},
		{
			name: "空 data 行", from: "gpt-4o", to: "my-model",
			line: `data: `,
			want: `data: `,
		},
		{
			name: "[DONE] 行", from: "gpt-4o", to: "my-model",
			line: `data: [DONE]`,
			want: `data: [DONE]`,
		},
		{
			name: "非 data: 前缀行", from: "gpt-4o", to: "my-model",
			line: `event: message`,
			want: `event: message`,
		},
		{
			name: "非法 JSON 不替换", from: "gpt-4o", to: "my-model",
			line: `data: {invalid json}`,
			want: `data: {invalid json}`,
		},
		{
			name: "无空格 data: 格式", from: "gpt-4o", to: "my-model",
			line: `data:{"id":"x","model":"gpt-4o"}`,
			want: `data: {"id":"x","model":"my-model"}`,
		},
		{
			name: "model 名含特殊字符", from: "org/model-v2.1-beta", to: "custom/alias",
			line: `data: {"model":"org/model-v2.1-beta"}`,
			want: `data: {"model":"custom/alias"}`,
		},
		{
			name: "空行", from: "gpt-4o", to: "my-model",
			line: "",
			want: "",
		},
		{
			name: "保持其他字段不变", from: "gpt-4o", to: "alias",
			line: `data: {"id":"abc","object":"chat.completion.chunk","model":"gpt-4o","created":1234567890,"choices":[{"index":0,"delta":{"content":"hi"}}]}`,
			want: `data: {"id":"abc","object":"chat.completion.chunk","model":"alias","created":1234567890,"choices":[{"index":0,"delta":{"content":"hi"}}]}`,
		},
		{
			name: "顶层优先于嵌套：同时存在两个 model", from: "gpt-4o", to: "replaced",
			line: `data: {"model":"gpt-4o","response":{"model":"gpt-4o"}}`,
			want: `data: {"model":"replaced","response":{"model":"gpt-4o"}}`,
		},
	}

	for _, tc := range cases {
		t.Run(tc.name, func(t *testing.T) {
			require.Equal(t, tc.want, svc.replaceModelInSSELine(tc.line, tc.from, tc.to))
		})
	}
}

// TestReplaceModelInSSEBody is a table-driven check of replaceModelInSSEBody.
// Each case supplies a whole SSE body plus a from/to model pair and the exact
// body expected back, including bodies that need no change and an empty body.
func TestReplaceModelInSSEBody(t *testing.T) {
	svc := &OpenAIGatewayService{}

	cases := []struct {
		name, body, from, to, want string
	}{
		{
			name: "多行 SSE body 替换", from: "gpt-4o", to: "alias",
			body: "data: {\"model\":\"gpt-4o\",\"choices\":[]}\n\ndata: {\"model\":\"gpt-4o\",\"choices\":[{\"delta\":{\"content\":\"hi\"}}]}\n\ndata: [DONE]\n",
			want: "data: {\"model\":\"alias\",\"choices\":[]}\n\ndata: {\"model\":\"alias\",\"choices\":[{\"delta\":{\"content\":\"hi\"}}]}\n\ndata: [DONE]\n",
		},
		{
			name: "无需替换的 body", from: "gpt-4o", to: "alias",
			body: "data: {\"model\":\"gpt-3.5-turbo\"}\n\ndata: [DONE]\n",
			want: "data: {\"model\":\"gpt-3.5-turbo\"}\n\ndata: [DONE]\n",
		},
		{
			name: "混合 event 和 data 行", from: "gpt-4o", to: "alias",
			body: "event: message\ndata: {\"model\":\"gpt-4o\"}\n\n",
			want: "event: message\ndata: {\"model\":\"alias\"}\n\n",
		},
		{
			name: "空 body", from: "gpt-4o", to: "alias",
			body: "",
			want: "",
		},
	}

	for _, tc := range cases {
		t.Run(tc.name, func(t *testing.T) {
			require.Equal(t, tc.want, svc.replaceModelInSSEBody(tc.body, tc.from, tc.to))
		})
	}
}

// TestReplaceModelInResponseBody is a table-driven check of
// replaceModelInResponseBody. Each case supplies a JSON (or non-JSON) body plus
// a from/to model pair and the exact bytes expected back.
func TestReplaceModelInResponseBody(t *testing.T) {
	svc := &OpenAIGatewayService{}

	cases := []struct {
		name, body, from, to, want string
	}{
		{
			name: "替换顶层 model", from: "gpt-4o", to: "alias",
			body: `{"id":"chatcmpl-123","model":"gpt-4o","choices":[]}`,
			want: `{"id":"chatcmpl-123","model":"alias","choices":[]}`,
		},
		{
			name: "model 不匹配不替换", from: "gpt-4o", to: "alias",
			body: `{"id":"chatcmpl-123","model":"gpt-3.5-turbo","choices":[]}`,
			want: `{"id":"chatcmpl-123","model":"gpt-3.5-turbo","choices":[]}`,
		},
		{
			name: "无 model 字段不替换", from: "gpt-4o", to: "alias",
			body: `{"id":"chatcmpl-123","choices":[]}`,
			want: `{"id":"chatcmpl-123","choices":[]}`,
		},
		{
			name: "非法 JSON 返回原值", from: "gpt-4o", to: "alias",
			body: `not json`,
			want: `not json`,
		},
		{
			name: "空 body 返回原值", from: "gpt-4o", to: "alias",
			body: ``,
			want: ``,
		},
		{
			name: "保持嵌套结构不变", from: "gpt-4o", to: "alias",
			body: `{"model":"gpt-4o","usage":{"prompt_tokens":10,"completion_tokens":20},"choices":[{"message":{"role":"assistant","content":"hello"}}]}`,
			want: `{"model":"alias","usage":{"prompt_tokens":10,"completion_tokens":20},"choices":[{"message":{"role":"assistant","content":"hello"}}]}`,
		},
	}

	for _, tc := range cases {
		t.Run(tc.name, func(t *testing.T) {
			replaced := svc.replaceModelInResponseBody([]byte(tc.body), tc.from, tc.to)
			require.Equal(t, tc.want, string(replaced))
		})
	}
}

// TestExtractOpenAISSEDataLine is a table-driven check of
// extractOpenAISSEDataLine. Each case supplies one line and asserts both the
// ok flag and the payload string returned for it.
func TestExtractOpenAISSEDataLine(t *testing.T) {
	cases := []struct {
		name        string
		line        string
		wantPayload string
		wantOK      bool
	}{
		{
			name:        "标准格式",
			line:        `data: {"type":"x"}`,
			wantPayload: `{"type":"x"}`,
			wantOK:      true,
		},
		{
			name:        "无空格格式",
			line:        `data:{"type":"x"}`,
			wantPayload: `{"type":"x"}`,
			wantOK:      true,
		},
		{
			name:        "纯空数据",
			line:        `data:   `,
			wantPayload: ``,
			wantOK:      true,
		},
		{
			name:        "非 data 行",
			line:        `event: message`,
			wantPayload: ``,
			wantOK:      false,
		},
	}

	for _, tc := range cases {
		t.Run(tc.name, func(t *testing.T) {
			payload, ok := extractOpenAISSEDataLine(tc.line)
			require.Equal(t, tc.wantOK, ok)
			require.Equal(t, tc.wantPayload, payload)
		})
	}
}

// TestParseSSEUsage_SelectiveParsing asserts that parseSSEUsage leaves an
// existing usage value untouched for a response.in_progress event and
// overwrites it with the event's counters for a response.completed event.
func TestParseSSEUsage_SelectiveParsing(t *testing.T) {
	const (
		inProgressEvent = `{"type":"response.in_progress","response":{"usage":{"input_tokens":1,"output_tokens":2}}}`
		completedEvent  = `{"type":"response.completed","response":{"usage":{"input_tokens":3,"output_tokens":5,"input_tokens_details":{"cached_tokens":2}}}}`
	)

	svc := &OpenAIGatewayService{}
	usage := &OpenAIUsage{
		InputTokens:          9,
		OutputTokens:         8,
		CacheReadInputTokens: 7,
	}

	// A non-completed event must not overwrite the existing usage.
	svc.parseSSEUsage(inProgressEvent, usage)
	require.Equal(t, 9, usage.InputTokens)
	require.Equal(t, 8, usage.OutputTokens)
	require.Equal(t, 7, usage.CacheReadInputTokens)

	// A completed event must have its usage extracted.
	svc.parseSSEUsage(completedEvent, usage)
	require.Equal(t, 3, usage.InputTokens)
	require.Equal(t, 5, usage.OutputTokens)
	require.Equal(t, 2, usage.CacheReadInputTokens)
}

// TestExtractCodexFinalResponse_SampleReplay replays a small SSE transcript
// through extractCodexFinalResponse and asserts that a final response is found
// and that it contains the completed event's id and input token count.
func TestExtractCodexFinalResponse_SampleReplay(t *testing.T) {
	transcript := []string{
		`event: message`,
		`data: {"type":"response.in_progress","response":{"id":"resp_1"}}`,
		`data: {"type":"response.completed","response":{"id":"resp_1","model":"gpt-4o","usage":{"input_tokens":11,"output_tokens":22,"input_tokens_details":{"cached_tokens":3}}}}`,
		`data: [DONE]`,
	}

	final, found := extractCodexFinalResponse(strings.Join(transcript, "\n"))
	require.True(t, found)

	rendered := string(final)
	require.Contains(t, rendered, `"id":"resp_1"`)
	require.Contains(t, rendered, `"input_tokens":11`)
}

// TestHandleOAuthSSEToJSON_CompletedEventReturnsJSON passes an SSE body that
// contains a response.completed event to handleOAuthSSEToJSON and asserts the
// returned usage counters and that the written body holds the response JSON
// without any "event:" or "data:" SSE framing.
func TestHandleOAuthSSEToJSON_CompletedEventReturnsJSON(t *testing.T) {
	gin.SetMode(gin.TestMode)
	recorder := httptest.NewRecorder()
	ginCtx, _ := gin.CreateTestContext(recorder)
	ginCtx.Request = httptest.NewRequest(http.MethodPost, "/", nil)

	svc := &OpenAIGatewayService{cfg: &config.Config{}}
	upstream := &http.Response{
		StatusCode: http.StatusOK,
		Header:     http.Header{"Content-Type": []string{"text/event-stream"}},
	}
	transcript := []string{
		`data: {"type":"response.in_progress","response":{"id":"resp_2"}}`,
		`data: {"type":"response.completed","response":{"id":"resp_2","model":"gpt-4o","usage":{"input_tokens":7,"output_tokens":9,"input_tokens_details":{"cached_tokens":1}}}}`,
		`data: [DONE]`,
	}
	sseBody := []byte(strings.Join(transcript, "\n"))

	usage, err := svc.handleOAuthSSEToJSON(upstream, ginCtx, sseBody, "gpt-4o", "gpt-4o")
	require.NoError(t, err)
	require.NotNil(t, usage)
	require.Equal(t, 7, usage.InputTokens)
	require.Equal(t, 9, usage.OutputTokens)
	require.Equal(t, 1, usage.CacheReadInputTokens)

	// The header may be passed through from the upstream Content-Type; what
	// matters is that the body has been converted into the final JSON response.
	written := recorder.Body.String()
	require.NotContains(t, written, "event:")
	require.Contains(t, written, `"id":"resp_2"`)
	require.NotContains(t, written, "data:")
}

// TestHandleOAuthSSEToJSON_NoFinalResponseKeepsSSEBody passes an SSE body with
// no response.completed event to handleOAuthSSEToJSON and asserts that usage
// is non-nil with zero input tokens, the Content-Type stays
// "text/event-stream", and the original SSE data line is still in the body.
func TestHandleOAuthSSEToJSON_NoFinalResponseKeepsSSEBody(t *testing.T) {
	gin.SetMode(gin.TestMode)
	recorder := httptest.NewRecorder()
	ginCtx, _ := gin.CreateTestContext(recorder)
	ginCtx.Request = httptest.NewRequest(http.MethodPost, "/", nil)

	svc := &OpenAIGatewayService{cfg: &config.Config{}}
	upstream := &http.Response{
		StatusCode: http.StatusOK,
		Header:     http.Header{"Content-Type": []string{"text/event-stream"}},
	}
	transcript := []string{
		`data: {"type":"response.in_progress","response":{"id":"resp_3"}}`,
		`data: [DONE]`,
	}
	sseBody := []byte(strings.Join(transcript, "\n"))

	usage, err := svc.handleOAuthSSEToJSON(upstream, ginCtx, sseBody, "gpt-4o", "gpt-4o")
	require.NoError(t, err)
	require.NotNil(t, usage)
	require.Equal(t, 0, usage.InputTokens)

	require.Contains(t, recorder.Header().Get("Content-Type"), "text/event-stream")
	require.Contains(t, recorder.Body.String(), `data: {"type":"response.in_progress"`)
}

// TestHandleOAuthSSEToJSON_ResponseFailedReturnsProtocolError passes an SSE
// body containing a response.failed event to handleOAuthSSEToJSON and asserts
// a nil usage, a non-nil error, a 502 status, a JSON Content-Type and the
// upstream error message in the written body.
func TestHandleOAuthSSEToJSON_ResponseFailedReturnsProtocolError(t *testing.T) {
	gin.SetMode(gin.TestMode)
	recorder := httptest.NewRecorder()
	ginCtx, _ := gin.CreateTestContext(recorder)
	ginCtx.Request = httptest.NewRequest(http.MethodPost, "/", nil)

	svc := &OpenAIGatewayService{cfg: &config.Config{}}
	upstream := &http.Response{
		StatusCode: http.StatusOK,
		Header:     http.Header{"Content-Type": []string{"text/event-stream"}},
	}
	transcript := []string{
		`data: {"type":"response.failed","error":{"message":"upstream rejected request"}}`,
		`data: [DONE]`,
	}
	sseBody := []byte(strings.Join(transcript, "\n"))

	usage, err := svc.handleOAuthSSEToJSON(upstream, ginCtx, sseBody, "gpt-4o", "gpt-4o")
	require.Nil(t, usage)
	require.Error(t, err)

	require.Equal(t, http.StatusBadGateway, recorder.Code)
	require.Contains(t, recorder.Body.String(), "upstream rejected request")
	require.Contains(t, recorder.Header().Get("Content-Type"), "application/json")
}
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
+								package service
 								import (
 									"bufio"
-												feat(安全): 添加安全开关并完善测试流程

实现安全开关默认关闭与响应头透传逻辑
- URL 校验与响应头过滤支持开关并覆盖流式路径
- 非流式 Content-Type 透传/默认值按配置生效
- 接入 go test、golangci-lint 与前端 lint/typecheck
- 补充相关测试与配置/文档说明

											
										
										
											2026-01-05 13:54:43 +08:00
+									"bytes"
-												fix(网关): 修复账号选择中的调度器快照延迟问题

## 问题描述
调度器快照更新存在0.5-1秒的延迟（Outbox轮询间隔），导致在账号被限流或过载后的短时间窗口内，
可能仍会被选中，造成请求失败。

## 根本原因
账号选择逻辑依赖调度器快照（listSchedulableAccounts），但快照更新有延迟：
- Outbox轮询: 每1秒检查一次变更事件
- 全量重建: 每300秒重建一次
- 时间窗口: 账号状态变更后0.5-1秒内，快照可能未更新

## 解决方案
在账号选择循环中添加IsSchedulable()实时检查，作为第二道防线：
1. 第一道防线: 调度器快照过滤（可能有延迟）
2. 第二道防线: IsSchedulable()实时检查（本次修复）

IsSchedulable()会检查：
- RateLimitResetAt: 限流重置时间
- OverloadUntil: 过载持续时间
- TempUnschedulableUntil: 临时不可调度时间
- Status: 账号状态
- Schedulable: 可调度标志

## 修改范围
### OpenAI Gateway Service
- SelectAccountForModelWithExclusions: 添加IsSchedulable()检查
- SelectAccountWithLoadAwareness: 添加IsSchedulable()检查

### Gateway Service (Claude/Gemini/Antigravity)
- 负载感知选择候选账号筛选: 添加IsSchedulable()检查
- selectAccountForModelWithPlatform: 添加IsSchedulable()检查
- selectAccountWithMixedScheduling: 添加IsSchedulable()检查

### 测试用例
- OpenAI: 添加2个测试用例验证限流账号过滤
- Gateway: 添加2个测试用例验证限流和过载账号过滤

### 其他修复
- ops_repo_preagg.go: 修复platform为NULL时的聚合问题

## 测试结果
所有单元测试通过 ✅

											
										
										
											2026-01-13 22:49:26 -08:00
+									"context"
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
+									"errors"
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+									"fmt"
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
+									"io"
 									"net/http"
 									"net/http/httptest"
 									"strings"
 									"testing"
 									"time"
 									"github.com/Wei-Shaw/sub2api/internal/config"
-												fix(openai): detect official codex client by headers

											
										
										
											2026-03-07 14:12:38 +08:00
+									"github.com/Wei-Shaw/sub2api/internal/pkg/openai"
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+									"github.com/cespare/xxhash/v2"
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
+									"github.com/gin-gonic/gin"
-												perf(service): SSE Scanner buffer 改用 sync.Pool 复用，减少高并发 GC 压力

将流式响应中 bufio.Scanner 的 64KB buffer 从每次 make 分配改为
sync.Pool 复用，统一切片表达式为 [:0]、变量命名为 scanBuf，
并补充对应的单元测试。

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-06 22:55:12 +08:00
+									"github.com/stretchr/testify/require"
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
+								)
-												test: 完善自动化测试体系（7个模块，73个任务）

系统性地修复、补充和强化项目的自动化测试能力：

1. 测试基础设施修复
   - 修复 stubConcurrencyCache 缺失方法和构造函数参数不匹配
   - 创建 testutil 共享包（stubs.go, fixtures.go, httptest.go）
   - 为所有 Stub 添加编译期接口断言

2. 中间件测试补充
   - 新增 JWT 认证中间件测试（有效/过期/篡改/缺失 Token）
   - 补充 rate_limiter 和 recovery 中间件测试场景

3. 网关核心路径测试
   - 新增账户选择、等待队列、流式响应、并发控制、计费、Claude Code 检测测试
   - 覆盖负载均衡、粘性会话、SSE 转发、槽位管理等关键逻辑

4. 前端测试体系（11个新测试文件，163个测试用例）
   - Pinia stores: auth, app, subscriptions
   - API client: 请求拦截器、响应拦截器、401 刷新
   - Router guards: 认证重定向、管理员权限、简易模式限制
   - Composables: useForm, useTableLoader, useClipboard
   - Components: LoginForm, ApiKeyCreate, Dashboard

5. CI/CD 流水线重构
   - 重构 backend-ci.yml 为统一的 ci.yml
   - 前后端 4 个并行 Job + Postgres/Redis services
   - Race 检测、覆盖率收集与门禁、Docker 构建验证

6. E2E 自动化测试
   - e2e-test.sh 自动化脚本（Docker 启动→健康检查→测试→清理）
   - 用户注册→登录→API Key→网关调用完整链路测试
   - Mock 模式和 API Key 脱敏支持

7. 修复预存问题
   - tlsfingerprint dialer_test.go 缺失 build tag 导致集成测试编译冲突

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-08 12:05:39 +08:00
+								// 编译期接口断言
 								var _ AccountRepository = (*stubOpenAIAccountRepo)(nil)
 								var _ GatewayCache = (*stubGatewayCache)(nil)
-												fix(网关): 修复账号选择中的调度器快照延迟问题

## 问题描述
调度器快照更新存在0.5-1秒的延迟（Outbox轮询间隔），导致在账号被限流或过载后的短时间窗口内，
可能仍会被选中，造成请求失败。

## 根本原因
账号选择逻辑依赖调度器快照（listSchedulableAccounts），但快照更新有延迟：
- Outbox轮询: 每1秒检查一次变更事件
- 全量重建: 每300秒重建一次
- 时间窗口: 账号状态变更后0.5-1秒内，快照可能未更新

## 解决方案
在账号选择循环中添加IsSchedulable()实时检查，作为第二道防线：
1. 第一道防线: 调度器快照过滤（可能有延迟）
2. 第二道防线: IsSchedulable()实时检查（本次修复）

IsSchedulable()会检查：
- RateLimitResetAt: 限流重置时间
- OverloadUntil: 过载持续时间
- TempUnschedulableUntil: 临时不可调度时间
- Status: 账号状态
- Schedulable: 可调度标志

## 修改范围
### OpenAI Gateway Service
- SelectAccountForModelWithExclusions: 添加IsSchedulable()检查
- SelectAccountWithLoadAwareness: 添加IsSchedulable()检查

### Gateway Service (Claude/Gemini/Antigravity)
- 负载感知选择候选账号筛选: 添加IsSchedulable()检查
- selectAccountForModelWithPlatform: 添加IsSchedulable()检查
- selectAccountWithMixedScheduling: 添加IsSchedulable()检查

### 测试用例
- OpenAI: 添加2个测试用例验证限流账号过滤
- Gateway: 添加2个测试用例验证限流和过载账号过滤

### 其他修复
- ops_repo_preagg.go: 修复platform为NULL时的聚合问题

## 测试结果
所有单元测试通过 ✅

											
										
										
											2026-01-13 22:49:26 -08:00
+								type stubOpenAIAccountRepo struct {
 									AccountRepository
 									accounts []Account
 								}
-												fix(openai): restore ws usage window display

											
										
										
											2026-03-06 20:46:10 +08:00
+								type snapshotUpdateAccountRepo struct {
 									stubOpenAIAccountRepo
 									updateExtraCalls chan map[string]any
 								}
 								func (r *snapshotUpdateAccountRepo) UpdateExtra(ctx context.Context, id int64, updates map[string]any) error {
 									if r.updateExtraCalls != nil {
 										copied := make(map[string]any, len(updates))
 										for k, v := range updates {
 											copied[k] = v
 										}
 										r.updateExtraCalls <- copied
 									}
 									return nil
 								}
-												fix(调度): 完善粘性会话清理与账号调度刷新

- Update/BulkUpdate 按不可调度字段触发缓存刷新
- GatewayCache 支持多前缀会话键清理
- 模型路由与混合调度优化粘性会话处理
- 补充调度与缓存相关测试覆盖

											
										
										
											2026-01-20 11:19:32 +08:00
+								func (r stubOpenAIAccountRepo) GetByID(ctx context.Context, id int64) (*Account, error) {
 									for i := range r.accounts {
 										if r.accounts[i].ID == id {
 											return &r.accounts[i], nil
 										}
 									}
 									return nil, errors.New("account not found")
 								}
-												fix(网关): 修复账号选择中的调度器快照延迟问题

## 问题描述
调度器快照更新存在0.5-1秒的延迟（Outbox轮询间隔），导致在账号被限流或过载后的短时间窗口内，
可能仍会被选中，造成请求失败。

## 根本原因
账号选择逻辑依赖调度器快照（listSchedulableAccounts），但快照更新有延迟：
- Outbox轮询: 每1秒检查一次变更事件
- 全量重建: 每300秒重建一次
- 时间窗口: 账号状态变更后0.5-1秒内，快照可能未更新

## 解决方案
在账号选择循环中添加IsSchedulable()实时检查，作为第二道防线：
1. 第一道防线: 调度器快照过滤（可能有延迟）
2. 第二道防线: IsSchedulable()实时检查（本次修复）

IsSchedulable()会检查：
- RateLimitResetAt: 限流重置时间
- OverloadUntil: 过载持续时间
- TempUnschedulableUntil: 临时不可调度时间
- Status: 账号状态
- Schedulable: 可调度标志

## 修改范围
### OpenAI Gateway Service
- SelectAccountForModelWithExclusions: 添加IsSchedulable()检查
- SelectAccountWithLoadAwareness: 添加IsSchedulable()检查

### Gateway Service (Claude/Gemini/Antigravity)
- 负载感知选择候选账号筛选: 添加IsSchedulable()检查
- selectAccountForModelWithPlatform: 添加IsSchedulable()检查
- selectAccountWithMixedScheduling: 添加IsSchedulable()检查

### 测试用例
- OpenAI: 添加2个测试用例验证限流账号过滤
- Gateway: 添加2个测试用例验证限流和过载账号过滤

### 其他修复
- ops_repo_preagg.go: 修复platform为NULL时的聚合问题

## 测试结果
所有单元测试通过 ✅

											
										
										
											2026-01-13 22:49:26 -08:00
+								func (r stubOpenAIAccountRepo) ListSchedulableByGroupIDAndPlatform(ctx context.Context, groupID int64, platform string) ([]Account, error) {
-												fix(调度): 完善粘性会话清理与账号调度刷新

- Update/BulkUpdate 按不可调度字段触发缓存刷新
- GatewayCache 支持多前缀会话键清理
- 模型路由与混合调度优化粘性会话处理
- 补充调度与缓存相关测试覆盖

											
										
										
											2026-01-20 11:19:32 +08:00
+									var result []Account
 									for _, acc := range r.accounts {
 										if acc.Platform == platform {
 											result = append(result, acc)
 										}
 									}
 									return result, nil
-												fix(网关): 修复账号选择中的调度器快照延迟问题

## 问题描述
调度器快照更新存在0.5-1秒的延迟（Outbox轮询间隔），导致在账号被限流或过载后的短时间窗口内，
可能仍会被选中，造成请求失败。

## 根本原因
账号选择逻辑依赖调度器快照（listSchedulableAccounts），但快照更新有延迟：
- Outbox轮询: 每1秒检查一次变更事件
- 全量重建: 每300秒重建一次
- 时间窗口: 账号状态变更后0.5-1秒内，快照可能未更新

## 解决方案
在账号选择循环中添加IsSchedulable()实时检查，作为第二道防线：
1. 第一道防线: 调度器快照过滤（可能有延迟）
2. 第二道防线: IsSchedulable()实时检查（本次修复）

IsSchedulable()会检查：
- RateLimitResetAt: 限流重置时间
- OverloadUntil: 过载持续时间
- TempUnschedulableUntil: 临时不可调度时间
- Status: 账号状态
- Schedulable: 可调度标志

## 修改范围
### OpenAI Gateway Service
- SelectAccountForModelWithExclusions: 添加IsSchedulable()检查
- SelectAccountWithLoadAwareness: 添加IsSchedulable()检查

### Gateway Service (Claude/Gemini/Antigravity)
- 负载感知选择候选账号筛选: 添加IsSchedulable()检查
- selectAccountForModelWithPlatform: 添加IsSchedulable()检查
- selectAccountWithMixedScheduling: 添加IsSchedulable()检查

### 测试用例
- OpenAI: 添加2个测试用例验证限流账号过滤
- Gateway: 添加2个测试用例验证限流和过载账号过滤

### 其他修复
- ops_repo_preagg.go: 修复platform为NULL时的聚合问题

## 测试结果
所有单元测试通过 ✅

											
										
										
											2026-01-13 22:49:26 -08:00
+								}
 								func (r stubOpenAIAccountRepo) ListSchedulableByPlatform(ctx context.Context, platform string) ([]Account, error) {
-												fix(调度): 完善粘性会话清理与账号调度刷新

- Update/BulkUpdate 按不可调度字段触发缓存刷新
- GatewayCache 支持多前缀会话键清理
- 模型路由与混合调度优化粘性会话处理
- 补充调度与缓存相关测试覆盖

											
										
										
											2026-01-20 11:19:32 +08:00
+									var result []Account
 									for _, acc := range r.accounts {
 										if acc.Platform == platform {
 											result = append(result, acc)
 										}
 									}
 									return result, nil
-												fix(网关): 修复账号选择中的调度器快照延迟问题

## 问题描述
调度器快照更新存在0.5-1秒的延迟（Outbox轮询间隔），导致在账号被限流或过载后的短时间窗口内，
可能仍会被选中，造成请求失败。

## 根本原因
账号选择逻辑依赖调度器快照（listSchedulableAccounts），但快照更新有延迟：
- Outbox轮询: 每1秒检查一次变更事件
- 全量重建: 每300秒重建一次
- 时间窗口: 账号状态变更后0.5-1秒内，快照可能未更新

## 解决方案
在账号选择循环中添加IsSchedulable()实时检查，作为第二道防线：
1. 第一道防线: 调度器快照过滤（可能有延迟）
2. 第二道防线: IsSchedulable()实时检查（本次修复）

IsSchedulable()会检查：
- RateLimitResetAt: 限流重置时间
- OverloadUntil: 过载持续时间
- TempUnschedulableUntil: 临时不可调度时间
- Status: 账号状态
- Schedulable: 可调度标志

## 修改范围
### OpenAI Gateway Service
- SelectAccountForModelWithExclusions: 添加IsSchedulable()检查
- SelectAccountWithLoadAwareness: 添加IsSchedulable()检查

### Gateway Service (Claude/Gemini/Antigravity)
- 负载感知选择候选账号筛选: 添加IsSchedulable()检查
- selectAccountForModelWithPlatform: 添加IsSchedulable()检查
- selectAccountWithMixedScheduling: 添加IsSchedulable()检查

### 测试用例
- OpenAI: 添加2个测试用例验证限流账号过滤
- Gateway: 添加2个测试用例验证限流和过载账号过滤

### 其他修复
- ops_repo_preagg.go: 修复platform为NULL时的聚合问题

## 测试结果
所有单元测试通过 ✅

											
										
										
											2026-01-13 22:49:26 -08:00
+								}
-												fix(gateway): 分组隔离 — 禁止未分组账号被跨组调度

当 API Key 无分组时，调度仅从未分组账号池中选取。
修复 isAccountInGroup 在 groupID==nil 时的逻辑，
同时补全 scheduler_snapshot_service 和 gemini_compat_service
中的 SimpleMode 保护，确保分组隔离在所有调度路径生效。

新增 ListSchedulableUngroupedByPlatform/s 方法，
使用 Ent 的 Not(HasAccountGroups()) 谓词实现未分组账号隔离。
新增 17 个单元和端到端隔离测试，覆盖所有分支和边界条件。

											
										
										
											2026-03-03 13:10:26 +08:00
+								func (r stubOpenAIAccountRepo) ListSchedulableUngroupedByPlatform(ctx context.Context, platform string) ([]Account, error) {
 									// The stub keeps no separate ungrouped pool; it simply forwards to the
 									// platform-wide listing.
 									matched, err := r.ListSchedulableByPlatform(ctx, platform)
 									return matched, err
 								}
-												fix(网关): 修复账号选择中的调度器快照延迟问题

## 问题描述
调度器快照更新存在0.5-1秒的延迟（Outbox轮询间隔），导致在账号被限流或过载后的短时间窗口内，
可能仍会被选中，造成请求失败。

## 根本原因
账号选择逻辑依赖调度器快照（listSchedulableAccounts），但快照更新有延迟：
- Outbox轮询: 每1秒检查一次变更事件
- 全量重建: 每300秒重建一次
- 时间窗口: 账号状态变更后0.5-1秒内，快照可能未更新

## 解决方案
在账号选择循环中添加IsSchedulable()实时检查，作为第二道防线：
1. 第一道防线: 调度器快照过滤（可能有延迟）
2. 第二道防线: IsSchedulable()实时检查（本次修复）

IsSchedulable()会检查：
- RateLimitResetAt: 限流重置时间
- OverloadUntil: 过载持续时间
- TempUnschedulableUntil: 临时不可调度时间
- Status: 账号状态
- Schedulable: 可调度标志

## 修改范围
### OpenAI Gateway Service
- SelectAccountForModelWithExclusions: 添加IsSchedulable()检查
- SelectAccountWithLoadAwareness: 添加IsSchedulable()检查

### Gateway Service (Claude/Gemini/Antigravity)
- 负载感知选择候选账号筛选: 添加IsSchedulable()检查
- selectAccountForModelWithPlatform: 添加IsSchedulable()检查
- selectAccountWithMixedScheduling: 添加IsSchedulable()检查

### 测试用例
- OpenAI: 添加2个测试用例验证限流账号过滤
- Gateway: 添加2个测试用例验证限流和过载账号过滤

### 其他修复
- ops_repo_preagg.go: 修复platform为NULL时的聚合问题

## 测试结果
所有单元测试通过 ✅

											
										
										
											2026-01-13 22:49:26 -08:00
+								type stubConcurrencyCache struct {
 									ConcurrencyCache
-												fix(调度): 完善粘性会话清理与账号调度刷新

- Update/BulkUpdate 按不可调度字段触发缓存刷新
- GatewayCache 支持多前缀会话键清理
- 模型路由与混合调度优化粘性会话处理
- 补充调度与缓存相关测试覆盖

											
										
										
											2026-01-20 11:19:32 +08:00
+									loadBatchErr    error
 									loadMap         map[int64]*AccountLoadInfo
 									acquireResults  map[int64]bool
 									waitCounts      map[int64]int
 									skipDefaultLoad bool
-												fix(网关): 修复账号选择中的调度器快照延迟问题

## 问题描述
调度器快照更新存在0.5-1秒的延迟（Outbox轮询间隔），导致在账号被限流或过载后的短时间窗口内，
可能仍会被选中，造成请求失败。

## 根本原因
账号选择逻辑依赖调度器快照（listSchedulableAccounts），但快照更新有延迟：
- Outbox轮询: 每1秒检查一次变更事件
- 全量重建: 每300秒重建一次
- 时间窗口: 账号状态变更后0.5-1秒内，快照可能未更新

## 解决方案
在账号选择循环中添加IsSchedulable()实时检查，作为第二道防线：
1. 第一道防线: 调度器快照过滤（可能有延迟）
2. 第二道防线: IsSchedulable()实时检查（本次修复）

IsSchedulable()会检查：
- RateLimitResetAt: 限流重置时间
- OverloadUntil: 过载持续时间
- TempUnschedulableUntil: 临时不可调度时间
- Status: 账号状态
- Schedulable: 可调度标志

## 修改范围
### OpenAI Gateway Service
- SelectAccountForModelWithExclusions: 添加IsSchedulable()检查
- SelectAccountWithLoadAwareness: 添加IsSchedulable()检查

### Gateway Service (Claude/Gemini/Antigravity)
- 负载感知选择候选账号筛选: 添加IsSchedulable()检查
- selectAccountForModelWithPlatform: 添加IsSchedulable()检查
- selectAccountWithMixedScheduling: 添加IsSchedulable()检查

### 测试用例
- OpenAI: 添加2个测试用例验证限流账号过滤
- Gateway: 添加2个测试用例验证限流和过载账号过滤

### 其他修复
- ops_repo_preagg.go: 修复platform为NULL时的聚合问题

## 测试结果
所有单元测试通过 ✅

											
										
										
											2026-01-13 22:49:26 -08:00
+								}
-												fix(gateway): avoid injecting invalid SSE on client cancel

											
										
										
											2026-01-15 21:42:13 +08:00
+								type cancelReadCloser struct{} // stateless stub providing Read and Close; its Read always fails with context.Canceled
 								// Read never produces data: it reports zero bytes read together with
 								// context.Canceled.
 								func (c cancelReadCloser) Read(p []byte) (int, error) {
 									return 0, context.Canceled
 								}
 								// Close does nothing and reports success.
 								func (c cancelReadCloser) Close() error {
 									return nil
 								}
-												fix(gateway): drain upstream after client disconnect

											
										
										
											2026-01-15 21:51:14 +08:00
+								type failingGinWriter struct {
 									// Wrapped writer that receives every Write call that is allowed through.
 									gin.ResponseWriter
 									// failAfter is how many Write calls are forwarded before Write starts failing.
 									failAfter int
 									// writes counts the Write calls forwarded so far.
 									writes    int
 								}
 								// Write forwards p to the wrapped writer for the first failAfter calls and
 								// counts each forwarded call; once that budget is spent every call returns
 								// (0, "write failed") without touching the wrapped writer.
 								func (w *failingGinWriter) Write(p []byte) (int, error) {
 									if w.writes < w.failAfter {
 										w.writes++
 										return w.ResponseWriter.Write(p)
 									}
 									return 0, errors.New("write failed")
 								}
-												fix(网关): 修复账号选择中的调度器快照延迟问题

## 问题描述
调度器快照更新存在0.5-1秒的延迟（Outbox轮询间隔），导致在账号被限流或过载后的短时间窗口内，
可能仍会被选中，造成请求失败。

## 根本原因
账号选择逻辑依赖调度器快照（listSchedulableAccounts），但快照更新有延迟：
- Outbox轮询: 每1秒检查一次变更事件
- 全量重建: 每300秒重建一次
- 时间窗口: 账号状态变更后0.5-1秒内，快照可能未更新

## 解决方案
在账号选择循环中添加IsSchedulable()实时检查，作为第二道防线：
1. 第一道防线: 调度器快照过滤（可能有延迟）
2. 第二道防线: IsSchedulable()实时检查（本次修复）

IsSchedulable()会检查：
- RateLimitResetAt: 限流重置时间
- OverloadUntil: 过载持续时间
- TempUnschedulableUntil: 临时不可调度时间
- Status: 账号状态
- Schedulable: 可调度标志

## 修改范围
### OpenAI Gateway Service
- SelectAccountForModelWithExclusions: 添加IsSchedulable()检查
- SelectAccountWithLoadAwareness: 添加IsSchedulable()检查

### Gateway Service (Claude/Gemini/Antigravity)
- 负载感知选择候选账号筛选: 添加IsSchedulable()检查
- selectAccountForModelWithPlatform: 添加IsSchedulable()检查
- selectAccountWithMixedScheduling: 添加IsSchedulable()检查

### 测试用例
- OpenAI: 添加2个测试用例验证限流账号过滤
- Gateway: 添加2个测试用例验证限流和过载账号过滤

### 其他修复
- ops_repo_preagg.go: 修复platform为NULL时的聚合问题

## 测试结果
所有单元测试通过 ✅

											
										
										
											2026-01-13 22:49:26 -08:00
+								func (c stubConcurrencyCache) AcquireAccountSlot(ctx context.Context, accountID int64, maxConcurrency int, requestID string) (bool, error) {
-												fix(调度): 完善粘性会话清理与账号调度刷新

- Update/BulkUpdate 按不可调度字段触发缓存刷新
- GatewayCache 支持多前缀会话键清理
- 模型路由与混合调度优化粘性会话处理
- 补充调度与缓存相关测试覆盖

											
										
										
											2026-01-20 11:19:32 +08:00
+									if c.acquireResults != nil {
 										if result, ok := c.acquireResults[accountID]; ok {
 											return result, nil
 										}
 									}
-												fix(网关): 修复账号选择中的调度器快照延迟问题

## 问题描述
调度器快照更新存在0.5-1秒的延迟（Outbox轮询间隔），导致在账号被限流或过载后的短时间窗口内，
可能仍会被选中，造成请求失败。

## 根本原因
账号选择逻辑依赖调度器快照（listSchedulableAccounts），但快照更新有延迟：
- Outbox轮询: 每1秒检查一次变更事件
- 全量重建: 每300秒重建一次
- 时间窗口: 账号状态变更后0.5-1秒内，快照可能未更新

## 解决方案
在账号选择循环中添加IsSchedulable()实时检查，作为第二道防线：
1. 第一道防线: 调度器快照过滤（可能有延迟）
2. 第二道防线: IsSchedulable()实时检查（本次修复）

IsSchedulable()会检查：
- RateLimitResetAt: 限流重置时间
- OverloadUntil: 过载持续时间
- TempUnschedulableUntil: 临时不可调度时间
- Status: 账号状态
- Schedulable: 可调度标志

## 修改范围
### OpenAI Gateway Service
- SelectAccountForModelWithExclusions: 添加IsSchedulable()检查
- SelectAccountWithLoadAwareness: 添加IsSchedulable()检查

### Gateway Service (Claude/Gemini/Antigravity)
- 负载感知选择候选账号筛选: 添加IsSchedulable()检查
- selectAccountForModelWithPlatform: 添加IsSchedulable()检查
- selectAccountWithMixedScheduling: 添加IsSchedulable()检查

### 测试用例
- OpenAI: 添加2个测试用例验证限流账号过滤
- Gateway: 添加2个测试用例验证限流和过载账号过滤

### 其他修复
- ops_repo_preagg.go: 修复platform为NULL时的聚合问题

## 测试结果
所有单元测试通过 ✅

											
										
										
											2026-01-13 22:49:26 -08:00
+									return true, nil
 								}
 								// ReleaseAccountSlot is a no-op in this stub: it ignores its arguments and
 								// always returns nil.
 								func (c stubConcurrencyCache) ReleaseAccountSlot(ctx context.Context, accountID int64, requestID string) error {
 									return nil
 								}
 								func (c stubConcurrencyCache) GetAccountsLoadBatch(ctx context.Context, accounts []AccountWithConcurrency) (map[int64]*AccountLoadInfo, error) {
-												fix(调度): 完善粘性会话清理与账号调度刷新

- Update/BulkUpdate 按不可调度字段触发缓存刷新
- GatewayCache 支持多前缀会话键清理
- 模型路由与混合调度优化粘性会话处理
- 补充调度与缓存相关测试覆盖

											
										
										
											2026-01-20 11:19:32 +08:00
+									if c.loadBatchErr != nil {
 										return nil, c.loadBatchErr
 									}
-												fix(网关): 修复账号选择中的调度器快照延迟问题

## 问题描述
调度器快照更新存在0.5-1秒的延迟（Outbox轮询间隔），导致在账号被限流或过载后的短时间窗口内，
可能仍会被选中，造成请求失败。

## 根本原因
账号选择逻辑依赖调度器快照（listSchedulableAccounts），但快照更新有延迟：
- Outbox轮询: 每1秒检查一次变更事件
- 全量重建: 每300秒重建一次
- 时间窗口: 账号状态变更后0.5-1秒内，快照可能未更新

## 解决方案
在账号选择循环中添加IsSchedulable()实时检查，作为第二道防线：
1. 第一道防线: 调度器快照过滤（可能有延迟）
2. 第二道防线: IsSchedulable()实时检查（本次修复）

IsSchedulable()会检查：
- RateLimitResetAt: 限流重置时间
- OverloadUntil: 过载持续时间
- TempUnschedulableUntil: 临时不可调度时间
- Status: 账号状态
- Schedulable: 可调度标志

## 修改范围
### OpenAI Gateway Service
- SelectAccountForModelWithExclusions: 添加IsSchedulable()检查
- SelectAccountWithLoadAwareness: 添加IsSchedulable()检查

### Gateway Service (Claude/Gemini/Antigravity)
- 负载感知选择候选账号筛选: 添加IsSchedulable()检查
- selectAccountForModelWithPlatform: 添加IsSchedulable()检查
- selectAccountWithMixedScheduling: 添加IsSchedulable()检查

### 测试用例
- OpenAI: 添加2个测试用例验证限流账号过滤
- Gateway: 添加2个测试用例验证限流和过载账号过滤

### 其他修复
- ops_repo_preagg.go: 修复platform为NULL时的聚合问题

## 测试结果
所有单元测试通过 ✅

											
										
										
											2026-01-13 22:49:26 -08:00
+									out := make(map[int64]*AccountLoadInfo, len(accounts))
-												fix(调度): 完善粘性会话清理与账号调度刷新

- Update/BulkUpdate 按不可调度字段触发缓存刷新
- GatewayCache 支持多前缀会话键清理
- 模型路由与混合调度优化粘性会话处理
- 补充调度与缓存相关测试覆盖

											
										
										
											2026-01-20 11:19:32 +08:00
+									if c.skipDefaultLoad && c.loadMap != nil {
 										for _, acc := range accounts {
 											if load, ok := c.loadMap[acc.ID]; ok {
 												out[acc.ID] = load
 											}
 										}
 										return out, nil
 									}
-												fix(网关): 修复账号选择中的调度器快照延迟问题

## 问题描述
调度器快照更新存在0.5-1秒的延迟（Outbox轮询间隔），导致在账号被限流或过载后的短时间窗口内，
可能仍会被选中，造成请求失败。

## 根本原因
账号选择逻辑依赖调度器快照（listSchedulableAccounts），但快照更新有延迟：
- Outbox轮询: 每1秒检查一次变更事件
- 全量重建: 每300秒重建一次
- 时间窗口: 账号状态变更后0.5-1秒内，快照可能未更新

## 解决方案
在账号选择循环中添加IsSchedulable()实时检查，作为第二道防线：
1. 第一道防线: 调度器快照过滤（可能有延迟）
2. 第二道防线: IsSchedulable()实时检查（本次修复）

IsSchedulable()会检查：
- RateLimitResetAt: 限流重置时间
- OverloadUntil: 过载持续时间
- TempUnschedulableUntil: 临时不可调度时间
- Status: 账号状态
- Schedulable: 可调度标志

## 修改范围
### OpenAI Gateway Service
- SelectAccountForModelWithExclusions: 添加IsSchedulable()检查
- SelectAccountWithLoadAwareness: 添加IsSchedulable()检查

### Gateway Service (Claude/Gemini/Antigravity)
- 负载感知选择候选账号筛选: 添加IsSchedulable()检查
- selectAccountForModelWithPlatform: 添加IsSchedulable()检查
- selectAccountWithMixedScheduling: 添加IsSchedulable()检查

### 测试用例
- OpenAI: 添加2个测试用例验证限流账号过滤
- Gateway: 添加2个测试用例验证限流和过载账号过滤

### 其他修复
- ops_repo_preagg.go: 修复platform为NULL时的聚合问题

## 测试结果
所有单元测试通过 ✅

											
										
										
											2026-01-13 22:49:26 -08:00
+									for _, acc := range accounts {
-												fix(调度): 完善粘性会话清理与账号调度刷新

- Update/BulkUpdate 按不可调度字段触发缓存刷新
- GatewayCache 支持多前缀会话键清理
- 模型路由与混合调度优化粘性会话处理
- 补充调度与缓存相关测试覆盖

											
										
										
											2026-01-20 11:19:32 +08:00
+										if c.loadMap != nil {
 											if load, ok := c.loadMap[acc.ID]; ok {
 												out[acc.ID] = load
 												continue
 											}
 										}
-												fix(网关): 修复账号选择中的调度器快照延迟问题

## 问题描述
调度器快照更新存在0.5-1秒的延迟（Outbox轮询间隔），导致在账号被限流或过载后的短时间窗口内，
可能仍会被选中，造成请求失败。

## 根本原因
账号选择逻辑依赖调度器快照（listSchedulableAccounts），但快照更新有延迟：
- Outbox轮询: 每1秒检查一次变更事件
- 全量重建: 每300秒重建一次
- 时间窗口: 账号状态变更后0.5-1秒内，快照可能未更新

## 解决方案
在账号选择循环中添加IsSchedulable()实时检查，作为第二道防线：
1. 第一道防线: 调度器快照过滤（可能有延迟）
2. 第二道防线: IsSchedulable()实时检查（本次修复）

IsSchedulable()会检查：
- RateLimitResetAt: 限流重置时间
- OverloadUntil: 过载持续时间
- TempUnschedulableUntil: 临时不可调度时间
- Status: 账号状态
- Schedulable: 可调度标志

## 修改范围
### OpenAI Gateway Service
- SelectAccountForModelWithExclusions: 添加IsSchedulable()检查
- SelectAccountWithLoadAwareness: 添加IsSchedulable()检查

### Gateway Service (Claude/Gemini/Antigravity)
- 负载感知选择候选账号筛选: 添加IsSchedulable()检查
- selectAccountForModelWithPlatform: 添加IsSchedulable()检查
- selectAccountWithMixedScheduling: 添加IsSchedulable()检查

### 测试用例
- OpenAI: 添加2个测试用例验证限流账号过滤
- Gateway: 添加2个测试用例验证限流和过载账号过滤

### 其他修复
- ops_repo_preagg.go: 修复platform为NULL时的聚合问题

## 测试结果
所有单元测试通过 ✅

											
										
										
											2026-01-13 22:49:26 -08:00
+										out[acc.ID] = &AccountLoadInfo{AccountID: acc.ID, LoadRate: 0}
 									}
 									return out, nil
 								}
-												fix(openai): 使用 prompt_cache_key 兜底粘性会话

opencode 请求不带 session_id/conversation_id，导致粘性会话失效。现在按 header 优先、prompt_cache_key 兜底生成 session hash，并补充单测验证优先级。

											
										
										
											2026-01-17 02:31:16 +08:00
+								func TestOpenAIGatewayService_GenerateSessionHash_Priority(t *testing.T) {
 									gin.SetMode(gin.TestMode)
 									rec := httptest.NewRecorder()
 									c, _ := gin.CreateTestContext(rec)
 									c.Request = httptest.NewRequest(http.MethodPost, "/openai/v1/responses", nil)
 									svc := &OpenAIGatewayService{}
-												perf(backend): 使用 gjson/sjson 优化热路径 JSON 处理

将 API 网关热路径中的 json.Unmarshal+json.Marshal 替换为 gjson 零拷贝查询和 sjson 精准写入：
- unwrapV1InternalResponse 性能提升 22x（4009ns→182ns），内存分配减少 28.5x
- unwrapGeminiResponse、extractGeminiUsage、estimateGeminiCountTokens、ParseGeminiRateLimitResetTime 改为接收 []byte 使用 gjson 提取
- ParseGatewayRequest 的 model/stream/metadata/thinking/max_tokens 改用 gjson 类型安全提取
- Handler 层（sora/openai）改用 gjson 提取字段、sjson 注入/修改字段，移除 map[string]any 中间变量
- Sora Client 响应解析改用 gjson ForEach 遍历，减少内存分配
- 新增约 100 个单元测试用例，所有改动函数覆盖率 >85%

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-10 08:59:30 +08:00
+									bodyWithKey := []byte(`{"prompt_cache_key":"ses_aaa"}`)
-												fix(openai): 使用 prompt_cache_key 兜底粘性会话

opencode 请求不带 session_id/conversation_id，导致粘性会话失效。现在按 header 优先、prompt_cache_key 兜底生成 session hash，并补充单测验证优先级。

											
										
										
											2026-01-17 02:31:16 +08:00
+									// 1) session_id header wins
 									c.Request.Header.Set("session_id", "sess-123")
 									c.Request.Header.Set("conversation_id", "conv-456")
-												perf(backend): 使用 gjson/sjson 优化热路径 JSON 处理

将 API 网关热路径中的 json.Unmarshal+json.Marshal 替换为 gjson 零拷贝查询和 sjson 精准写入：
- unwrapV1InternalResponse 性能提升 22x（4009ns→182ns），内存分配减少 28.5x
- unwrapGeminiResponse、extractGeminiUsage、estimateGeminiCountTokens、ParseGeminiRateLimitResetTime 改为接收 []byte 使用 gjson 提取
- ParseGatewayRequest 的 model/stream/metadata/thinking/max_tokens 改用 gjson 类型安全提取
- Handler 层（sora/openai）改用 gjson 提取字段、sjson 注入/修改字段，移除 map[string]any 中间变量
- Sora Client 响应解析改用 gjson ForEach 遍历，减少内存分配
- 新增约 100 个单元测试用例，所有改动函数覆盖率 >85%

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-10 08:59:30 +08:00
+									h1 := svc.GenerateSessionHash(c, bodyWithKey)
-												fix(openai): 使用 prompt_cache_key 兜底粘性会话

opencode 请求不带 session_id/conversation_id，导致粘性会话失效。现在按 header 优先、prompt_cache_key 兜底生成 session hash，并补充单测验证优先级。

											
										
										
											2026-01-17 02:31:16 +08:00
+									if h1 == "" {
 										t.Fatalf("expected non-empty hash")
 									}
 									// 2) conversation_id used when session_id absent
 									c.Request.Header.Del("session_id")
-												perf(backend): 使用 gjson/sjson 优化热路径 JSON 处理

将 API 网关热路径中的 json.Unmarshal+json.Marshal 替换为 gjson 零拷贝查询和 sjson 精准写入：
- unwrapV1InternalResponse 性能提升 22x（4009ns→182ns），内存分配减少 28.5x
- unwrapGeminiResponse、extractGeminiUsage、estimateGeminiCountTokens、ParseGeminiRateLimitResetTime 改为接收 []byte 使用 gjson 提取
- ParseGatewayRequest 的 model/stream/metadata/thinking/max_tokens 改用 gjson 类型安全提取
- Handler 层（sora/openai）改用 gjson 提取字段、sjson 注入/修改字段，移除 map[string]any 中间变量
- Sora Client 响应解析改用 gjson ForEach 遍历，减少内存分配
- 新增约 100 个单元测试用例，所有改动函数覆盖率 >85%

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-10 08:59:30 +08:00
+									h2 := svc.GenerateSessionHash(c, bodyWithKey)
-												fix(openai): 使用 prompt_cache_key 兜底粘性会话

opencode 请求不带 session_id/conversation_id，导致粘性会话失效。现在按 header 优先、prompt_cache_key 兜底生成 session hash，并补充单测验证优先级。

											
										
										
											2026-01-17 02:31:16 +08:00
+									if h2 == "" {
 										t.Fatalf("expected non-empty hash")
 									}
 									if h1 == h2 {
 										t.Fatalf("expected different hashes for different keys")
 									}
 									// 3) prompt_cache_key used when both headers absent
 									c.Request.Header.Del("conversation_id")
-												perf(backend): 使用 gjson/sjson 优化热路径 JSON 处理

将 API 网关热路径中的 json.Unmarshal+json.Marshal 替换为 gjson 零拷贝查询和 sjson 精准写入：
- unwrapV1InternalResponse 性能提升 22x（4009ns→182ns），内存分配减少 28.5x
- unwrapGeminiResponse、extractGeminiUsage、estimateGeminiCountTokens、ParseGeminiRateLimitResetTime 改为接收 []byte 使用 gjson 提取
- ParseGatewayRequest 的 model/stream/metadata/thinking/max_tokens 改用 gjson 类型安全提取
- Handler 层（sora/openai）改用 gjson 提取字段、sjson 注入/修改字段，移除 map[string]any 中间变量
- Sora Client 响应解析改用 gjson ForEach 遍历，减少内存分配
- 新增约 100 个单元测试用例，所有改动函数覆盖率 >85%

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-10 08:59:30 +08:00
+									h3 := svc.GenerateSessionHash(c, bodyWithKey)
-												fix(openai): 使用 prompt_cache_key 兜底粘性会话

opencode 请求不带 session_id/conversation_id，导致粘性会话失效。现在按 header 优先、prompt_cache_key 兜底生成 session hash，并补充单测验证优先级。

											
										
										
											2026-01-17 02:31:16 +08:00
+									if h3 == "" {
 										t.Fatalf("expected non-empty hash")
 									}
 									if h2 == h3 {
 										t.Fatalf("expected different hashes for different keys")
 									}
 									// 4) empty when no signals
-												perf(backend): 使用 gjson/sjson 优化热路径 JSON 处理

将 API 网关热路径中的 json.Unmarshal+json.Marshal 替换为 gjson 零拷贝查询和 sjson 精准写入：
- unwrapV1InternalResponse 性能提升 22x（4009ns→182ns），内存分配减少 28.5x
- unwrapGeminiResponse、extractGeminiUsage、estimateGeminiCountTokens、ParseGeminiRateLimitResetTime 改为接收 []byte 使用 gjson 提取
- ParseGatewayRequest 的 model/stream/metadata/thinking/max_tokens 改用 gjson 类型安全提取
- Handler 层（sora/openai）改用 gjson 提取字段、sjson 注入/修改字段，移除 map[string]any 中间变量
- Sora Client 响应解析改用 gjson ForEach 遍历，减少内存分配
- 新增约 100 个单元测试用例，所有改动函数覆盖率 >85%

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-10 08:59:30 +08:00
+									h4 := svc.GenerateSessionHash(c, []byte(`{}`))
-												fix(openai): 使用 prompt_cache_key 兜底粘性会话

opencode 请求不带 session_id/conversation_id，导致粘性会话失效。现在按 header 优先、prompt_cache_key 兜底生成 session hash，并补充单测验证优先级。

											
										
										
											2026-01-17 02:31:16 +08:00
+									if h4 != "" {
 										t.Fatalf("expected empty hash when no signals")
 									}
 								}
-												feat(sync): full code sync from release

											
										
										
											2026-02-28 15:01:20 +08:00
+								func TestOpenAIGatewayService_GenerateSessionHash_UsesXXHash64(t *testing.T) {
 									// With only a session_id header present, the hash must equal the 16-digit,
 									// zero-padded hex xxhash64 of that header value.
 									gin.SetMode(gin.TestMode)
 									ginCtx, _ := gin.CreateTestContext(httptest.NewRecorder())
 									req := httptest.NewRequest(http.MethodPost, "/openai/v1/responses", nil)
 									req.Header.Set("session_id", "sess-fixed-value")
 									ginCtx.Request = req
 									service := &OpenAIGatewayService{}
 									actual := service.GenerateSessionHash(ginCtx, nil)
 									expected := fmt.Sprintf("%016x", xxhash.Sum64String("sess-fixed-value"))
 									require.Equal(t, expected, actual)
 								}
 								// TestOpenAIGatewayService_GenerateSessionHash_AttachesLegacyHashToContext
 								// checks that, after hashing a request carrying a session_id header, a
 								// non-empty legacy hash can be read back from the request context.
 								func TestOpenAIGatewayService_GenerateSessionHash_AttachesLegacyHashToContext(t *testing.T) {
 									gin.SetMode(gin.TestMode)
 									ginCtx, _ := gin.CreateTestContext(httptest.NewRecorder())
 									req := httptest.NewRequest(http.MethodPost, "/openai/v1/responses", nil)
 									req.Header.Set("session_id", "sess-legacy-check")
 									ginCtx.Request = req
 									service := &OpenAIGatewayService{}
 									require.NotEmpty(t, service.GenerateSessionHash(ginCtx, nil))
 									// Assert the request and its context are still present before reading the
 									// legacy hash from that context.
 									require.NotNil(t, ginCtx.Request)
 									require.NotNil(t, ginCtx.Request.Context())
 									legacyHash := openAILegacySessionHashFromContext(ginCtx.Request.Context())
 									require.NotEmpty(t, legacyHash)
 								}
 								// TestOpenAIGatewayService_GenerateSessionHashWithFallback covers a request
 								// with no session headers and an empty JSON body: a real fallback seed must
 								// hash to its xxhash64 hex form, and a whitespace-only seed must yield "".
 								func TestOpenAIGatewayService_GenerateSessionHashWithFallback(t *testing.T) {
 									gin.SetMode(gin.TestMode)
 									ginCtx, _ := gin.CreateTestContext(httptest.NewRecorder())
 									ginCtx.Request = httptest.NewRequest(http.MethodPost, "/openai/v1/responses", nil)
 									service := &OpenAIGatewayService{}
 									emptyBody := []byte(`{}`)
 									fallbackSeed := "openai_ws_ingress:9:100:200"
 									actual := service.GenerateSessionHashWithFallback(ginCtx, emptyBody, fallbackSeed)
 									expected := fmt.Sprintf("%016x", xxhash.Sum64String(fallbackSeed))
 									require.Equal(t, expected, actual)
 									require.NotEmpty(t, openAILegacySessionHashFromContext(ginCtx.Request.Context()))
 									// A seed made only of spaces must not produce a hash.
 									blankSeedHash := service.GenerateSessionHashWithFallback(ginCtx, []byte(`{}`), "   ")
 									require.Equal(t, "", blankSeedHash)
 								}
-												fix(调度): 完善粘性会话清理与账号调度刷新

- Update/BulkUpdate 按不可调度字段触发缓存刷新
- GatewayCache 支持多前缀会话键清理
- 模型路由与混合调度优化粘性会话处理
- 补充调度与缓存相关测试覆盖

											
										
										
											2026-01-20 11:19:32 +08:00
+								func (c stubConcurrencyCache) GetAccountWaitingCount(ctx context.Context, accountID int64) (int, error) {
 									// Indexing a nil map or a missing key yields the zero value, so accounts
 									// without a configured wait count report 0. The error is always nil.
 									waiting := c.waitCounts[accountID]
 									return waiting, nil
 								}
 								// stubGatewayCache is an in-memory session cache used by the tests in this
 								// file. Its methods ignore the groupID and ttl arguments.
 								type stubGatewayCache struct {
 									// sessionBindings maps a session hash key to the bound account ID.
 									sessionBindings map[string]int64
 									// deletedSessions counts DeleteSessionAccountID calls per session hash key.
 									deletedSessions map[string]int
 								}
 								// GetSessionAccountID returns the account bound to sessionHash, or
 								// (0, "not found") when no binding exists. groupID is ignored.
 								func (c *stubGatewayCache) GetSessionAccountID(ctx context.Context, groupID int64, sessionHash string) (int64, error) {
 									accountID, bound := c.sessionBindings[sessionHash]
 									if !bound {
 										return 0, errors.New("not found")
 									}
 									return accountID, nil
 								}
 								// SetSessionAccountID binds sessionHash to accountID, creating the binding
 								// map on first use. groupID and ttl are ignored; the result is always nil.
 								func (c *stubGatewayCache) SetSessionAccountID(ctx context.Context, groupID int64, sessionHash string, accountID int64, ttl time.Duration) error {
 									bindings := c.sessionBindings
 									if bindings == nil {
 										// Writing to a nil map would panic, so allocate lazily.
 										bindings = make(map[string]int64)
 										c.sessionBindings = bindings
 									}
 									bindings[sessionHash] = accountID
 									return nil
 								}
 								// RefreshSessionTTL is a no-op in this stub: it ignores its arguments and
 								// always returns nil.
 								func (c *stubGatewayCache) RefreshSessionTTL(ctx context.Context, groupID int64, sessionHash string, ttl time.Duration) error {
 									return nil
 								}
 								// DeleteSessionAccountID removes the binding for sessionHash and bumps its
 								// deletion counter. When the binding map was never created the call is not
 								// counted. groupID is ignored; the result is always nil.
 								func (c *stubGatewayCache) DeleteSessionAccountID(ctx context.Context, groupID int64, sessionHash string) error {
 									if c.sessionBindings != nil {
 										if c.deletedSessions == nil {
 											c.deletedSessions = make(map[string]int)
 										}
 										delete(c.sessionBindings, sessionHash)
 										c.deletedSessions[sessionHash] += 1
 									}
 									return nil
 								}
-												fix(网关): 修复账号选择中的调度器快照延迟问题

## 问题描述
调度器快照更新存在0.5-1秒的延迟（Outbox轮询间隔），导致在账号被限流或过载后的短时间窗口内，
可能仍会被选中，造成请求失败。

## 根本原因
账号选择逻辑依赖调度器快照（listSchedulableAccounts），但快照更新有延迟：
- Outbox轮询: 每1秒检查一次变更事件
- 全量重建: 每300秒重建一次
- 时间窗口: 账号状态变更后0.5-1秒内，快照可能未更新

## 解决方案
在账号选择循环中添加IsSchedulable()实时检查，作为第二道防线：
1. 第一道防线: 调度器快照过滤（可能有延迟）
2. 第二道防线: IsSchedulable()实时检查（本次修复）

IsSchedulable()会检查：
- RateLimitResetAt: 限流重置时间
- OverloadUntil: 过载持续时间
- TempUnschedulableUntil: 临时不可调度时间
- Status: 账号状态
- Schedulable: 可调度标志

## 修改范围
### OpenAI Gateway Service
- SelectAccountForModelWithExclusions: 添加IsSchedulable()检查
- SelectAccountWithLoadAwareness: 添加IsSchedulable()检查

### Gateway Service (Claude/Gemini/Antigravity)
- 负载感知选择候选账号筛选: 添加IsSchedulable()检查
- selectAccountForModelWithPlatform: 添加IsSchedulable()检查
- selectAccountWithMixedScheduling: 添加IsSchedulable()检查

### 测试用例
- OpenAI: 添加2个测试用例验证限流账号过滤
- Gateway: 添加2个测试用例验证限流和过载账号过滤

### 其他修复
- ops_repo_preagg.go: 修复platform为NULL时的聚合问题

## 测试结果
所有单元测试通过 ✅

											
										
										
											2026-01-13 22:49:26 -08:00
+								func TestOpenAISelectAccountWithLoadAwareness_FiltersUnschedulable(t *testing.T) {
 									now := time.Now()
 									resetAt := now.Add(10 * time.Minute)
 									groupID := int64(1)
 									rateLimited := Account{
 										ID:               1,
 										Platform:         PlatformOpenAI,
 										Type:             AccountTypeAPIKey,
 										Status:           StatusActive,
 										Schedulable:      true,
 										Concurrency:      1,
 										Priority:         0,
 										RateLimitResetAt: &resetAt,
 									}
 									available := Account{
 										ID:          2,
 										Platform:    PlatformOpenAI,
 										Type:        AccountTypeAPIKey,
 										Status:      StatusActive,
 										Schedulable: true,
 										Concurrency: 1,
 										Priority:    1,
 									}
 									svc := &OpenAIGatewayService{
 										accountRepo:        stubOpenAIAccountRepo{accounts: []Account{rateLimited, available}},
 										concurrencyService: NewConcurrencyService(stubConcurrencyCache{}),
 									}
 									selection, err := svc.SelectAccountWithLoadAwareness(context.Background(), &groupID, "", "gpt-5.2", nil)
 									if err != nil {
 										t.Fatalf("SelectAccountWithLoadAwareness error: %v", err)
 									}
 									if selection == nil || selection.Account == nil {
 										t.Fatalf("expected selection with account")
 									}
 									if selection.Account.ID != available.ID {
 										t.Fatalf("expected account %d, got %d", available.ID, selection.Account.ID)
 									}
 									if selection.ReleaseFunc != nil {
 										selection.ReleaseFunc()
 									}
 								}
 								// TestOpenAISelectAccountWithLoadAwareness_FiltersUnschedulableWhenNoConcurrencyService
 								// repeats the rate-limited-account scenario with concurrencyService left nil,
 								// and still expects account 2 to be selected.
 								func TestOpenAISelectAccountWithLoadAwareness_FiltersUnschedulableWhenNoConcurrencyService(t *testing.T) {
 									rateLimitedUntil := time.Now().Add(10 * time.Minute)
 									var groupID int64 = 1
 									limited := Account{
 										ID:               1,
 										Platform:         PlatformOpenAI,
 										Type:             AccountTypeAPIKey,
 										Status:           StatusActive,
 										Schedulable:      true,
 										Concurrency:      1,
 										Priority:         0,
 										RateLimitResetAt: &rateLimitedUntil,
 									}
 									healthy := Account{
 										ID:          2,
 										Platform:    PlatformOpenAI,
 										Type:        AccountTypeAPIKey,
 										Status:      StatusActive,
 										Schedulable: true,
 										Concurrency: 1,
 										Priority:    1,
 									}
 									// concurrencyService stays nil, forcing the non-load-batch selection path.
 									svc := &OpenAIGatewayService{
 										accountRepo: stubOpenAIAccountRepo{accounts: []Account{limited, healthy}},
 									}
 									selection, err := svc.SelectAccountWithLoadAwareness(context.Background(), &groupID, "", "gpt-5.2", nil)
 									// Each Fatalf aborts the test, so the cases are checked in sequence.
 									switch {
 									case err != nil:
 										t.Fatalf("SelectAccountWithLoadAwareness error: %v", err)
 									case selection == nil || selection.Account == nil:
 										t.Fatalf("expected selection with account")
 									case selection.Account.ID != healthy.ID:
 										t.Fatalf("expected account %d, got %d", healthy.ID, selection.Account.ID)
 									}
 									if release := selection.ReleaseFunc; release != nil {
 										release()
 									}
 								}
-												fix(调度): 完善粘性会话清理与账号调度刷新

- Update/BulkUpdate 按不可调度字段触发缓存刷新
- GatewayCache 支持多前缀会话键清理
- 模型路由与混合调度优化粘性会话处理
- 补充调度与缓存相关测试覆盖

											
										
										
											2026-01-20 11:19:32 +08:00
+								func TestOpenAISelectAccountForModelWithExclusions_StickyUnschedulableClearsSession(t *testing.T) {
 									// The session starts out bound to disabled account 1. The test expects the
 									// binding to be deleted once and then re-created against active account 2.
 									sessionHash := "session-1"
 									stickyKey := "openai:" + sessionHash
 									cache := &stubGatewayCache{
 										sessionBindings: map[string]int64{stickyKey: 1},
 									}
 									svc := &OpenAIGatewayService{
 										accountRepo: stubOpenAIAccountRepo{
 											accounts: []Account{
 												{ID: 1, Platform: PlatformOpenAI, Status: StatusDisabled, Schedulable: true, Concurrency: 1},
 												{ID: 2, Platform: PlatformOpenAI, Status: StatusActive, Schedulable: true, Concurrency: 1},
 											},
 										},
 										cache: cache,
 									}
 									acc, err := svc.SelectAccountForModelWithExclusions(context.Background(), nil, sessionHash, "gpt-4", nil)
 									// Each Fatalf aborts the test, so the cases are checked in sequence.
 									switch {
 									case err != nil:
 										t.Fatalf("SelectAccountForModelWithExclusions error: %v", err)
 									case acc == nil || acc.ID != 2:
 										t.Fatalf("expected account 2, got %+v", acc)
 									case cache.deletedSessions[stickyKey] != 1:
 										t.Fatalf("expected sticky session to be deleted")
 									case cache.sessionBindings[stickyKey] != 2:
 										t.Fatalf("expected sticky session to bind to account 2")
 									}
 								}
 								// TestOpenAISelectAccountWithLoadAwareness_StickyUnschedulableClearsSession runs the
 								// load-aware selector with a session bound to a StatusDisabled account and
 								// expects account 2 to be chosen, the old binding to be deleted, and the
 								// session key to be rebound to account 2.
 								func TestOpenAISelectAccountWithLoadAwareness_StickyUnschedulableClearsSession(t *testing.T) {
 									var groupID int64 = 1
 									sessionHash := "session-2"
 									stickyKey := "openai:" + sessionHash

 									accounts := stubOpenAIAccountRepo{
 										accounts: []Account{
 											{ID: 1, Platform: PlatformOpenAI, Status: StatusDisabled, Schedulable: true, Concurrency: 1},
 											{ID: 2, Platform: PlatformOpenAI, Status: StatusActive, Schedulable: true, Concurrency: 1},
 										},
 									}
 									gatewayCache := &stubGatewayCache{
 										sessionBindings: map[string]int64{stickyKey: 1},
 									}
 									gateway := &OpenAIGatewayService{
 										accountRepo:        accounts,
 										cache:              gatewayCache,
 										concurrencyService: NewConcurrencyService(stubConcurrencyCache{}),
 									}

 									picked, err := gateway.SelectAccountWithLoadAwareness(context.Background(), &groupID, sessionHash, "gpt-4", nil)
 									if err != nil {
 										t.Fatalf("SelectAccountWithLoadAwareness error: %v", err)
 									}
 									if picked == nil || picked.Account == nil || picked.Account.ID != 2 {
 										t.Fatalf("expected account 2, got %+v", picked)
 									}
 									if gatewayCache.deletedSessions[stickyKey] != 1 {
 										t.Fatal("expected sticky session to be deleted")
 									}
 									if gatewayCache.sessionBindings[stickyKey] != 2 {
 										t.Fatal("expected sticky session to bind to account 2")
 									}
 									// Hand the slot back if the selector acquired one.
 									if release := picked.ReleaseFunc; release != nil {
 										release()
 									}
 								}
 								func TestOpenAISelectAccountForModelWithExclusions_NoModelSupport(t *testing.T) {
 									repo := stubOpenAIAccountRepo{
 										accounts: []Account{
 											{
 												ID:          1,
 												Platform:    PlatformOpenAI,
 												Status:      StatusActive,
 												Schedulable: true,
 												Credentials: map[string]any{"model_mapping": map[string]any{"gpt-3.5-turbo": "gpt-3.5-turbo"}},
 											},
 										},
 									}
 									cache := &stubGatewayCache{}
 									svc := &OpenAIGatewayService{
 										accountRepo: repo,
 										cache:       cache,
 									}
 									acc, err := svc.SelectAccountForModelWithExclusions(context.Background(), nil, "", "gpt-4", nil)
 									if err == nil {
 										t.Fatalf("expected error for unsupported model")
 									}
 									if acc != nil {
 										t.Fatalf("expected nil account for unsupported model")
 									}
 									if !strings.Contains(err.Error(), "supporting model") {
 										t.Fatalf("unexpected error: %v", err)
 									}
 								}
 								// TestOpenAISelectAccountWithLoadAwareness_LoadBatchErrorFallback makes the stub
 								// concurrency cache return loadBatchErr and expects the selector to still
 								// succeed, pick account 2 (Priority 1 versus account 1's Priority 2), and bind
 								// the "fallback" session to it.
 								func TestOpenAISelectAccountWithLoadAwareness_LoadBatchErrorFallback(t *testing.T) {
 									var groupID int64 = 1
 									accounts := stubOpenAIAccountRepo{
 										accounts: []Account{
 											{ID: 1, Platform: PlatformOpenAI, Status: StatusActive, Schedulable: true, Concurrency: 1, Priority: 2},
 											{ID: 2, Platform: PlatformOpenAI, Status: StatusActive, Schedulable: true, Concurrency: 1, Priority: 1},
 										},
 									}
 									gatewayCache := &stubGatewayCache{}
 									failingLoad := stubConcurrencyCache{
 										loadBatchErr: errors.New("load batch failed"),
 									}
 									gateway := &OpenAIGatewayService{
 										accountRepo:        accounts,
 										cache:              gatewayCache,
 										concurrencyService: NewConcurrencyService(failingLoad),
 									}

 									picked, err := gateway.SelectAccountWithLoadAwareness(context.Background(), &groupID, "fallback", "gpt-4", nil)
 									if err != nil {
 										t.Fatalf("SelectAccountWithLoadAwareness error: %v", err)
 									}
 									if picked == nil || picked.Account == nil {
 										t.Fatal("expected selection")
 									}
 									if got := picked.Account.ID; got != 2 {
 										t.Fatalf("expected account 2, got %d", got)
 									}
 									if gatewayCache.sessionBindings["openai:fallback"] != 2 {
 										t.Fatal("expected sticky session updated")
 									}
 									if release := picked.ReleaseFunc; release != nil {
 										release()
 									}
 								}
 								func TestOpenAISelectAccountWithLoadAwareness_NoSlotFallbackWait(t *testing.T) {
 									groupID := int64(1)
 									repo := stubOpenAIAccountRepo{
 										accounts: []Account{
 											{ID: 1, Platform: PlatformOpenAI, Status: StatusActive, Schedulable: true, Concurrency: 1, Priority: 1},
 										},
 									}
 									cache := &stubGatewayCache{}
 									concurrencyCache := stubConcurrencyCache{
 										acquireResults: map[int64]bool{1: false},
 										loadMap: map[int64]*AccountLoadInfo{
 : {AccountID: 1, LoadRate: 10},
 										},
 									}
 									svc := &OpenAIGatewayService{
 										accountRepo:        repo,
 										cache:              cache,
 										concurrencyService: NewConcurrencyService(concurrencyCache),
 									}
 									selection, err := svc.SelectAccountWithLoadAwareness(context.Background(), &groupID, "", "gpt-4", nil)
 									if err != nil {
 										t.Fatalf("SelectAccountWithLoadAwareness error: %v", err)
 									}
 									if selection == nil || selection.WaitPlan == nil {
 										t.Fatalf("expected wait plan fallback")
 									}
 									if selection.Account == nil || selection.Account.ID != 1 {
 										t.Fatalf("expected account 1")
 									}
 								}
 								func TestOpenAISelectAccountForModelWithExclusions_SetsStickyBinding(t *testing.T) {
 									sessionHash := "bind"
 									repo := stubOpenAIAccountRepo{
 										accounts: []Account{
 											{ID: 1, Platform: PlatformOpenAI, Status: StatusActive, Schedulable: true, Concurrency: 1, Priority: 1},
 										},
 									}
 									cache := &stubGatewayCache{}
 									svc := &OpenAIGatewayService{
 										accountRepo: repo,
 										cache:       cache,
 									}
 									acc, err := svc.SelectAccountForModelWithExclusions(context.Background(), nil, sessionHash, "gpt-4", nil)
 									if err != nil {
 										t.Fatalf("SelectAccountForModelWithExclusions error: %v", err)
 									}
 									if acc == nil || acc.ID != 1 {
 										t.Fatalf("expected account 1")
 									}
 									if cache.sessionBindings["openai:"+sessionHash] != 1 {
 										t.Fatalf("expected sticky session binding")
 									}
 								}
 								// TestOpenAISelectAccountWithLoadAwareness_StickyWaitPlan binds the session to
 								// account 1, makes slot acquisition on that account report false, and expects
 								// the selector to return a WaitPlan that still targets account 1.
 								func TestOpenAISelectAccountWithLoadAwareness_StickyWaitPlan(t *testing.T) {
 									var groupID int64 = 1
 									sessionHash := "sticky-wait"

 									accounts := stubOpenAIAccountRepo{
 										accounts: []Account{
 											{ID: 1, Platform: PlatformOpenAI, Status: StatusActive, Schedulable: true, Concurrency: 1, Priority: 1},
 										},
 									}
 									gatewayCache := &stubGatewayCache{
 										sessionBindings: map[string]int64{"openai:" + sessionHash: 1},
 									}
 									noSlot := stubConcurrencyCache{
 										acquireResults: map[int64]bool{1: false},
 										waitCounts:     map[int64]int{1: 0},
 									}
 									gateway := &OpenAIGatewayService{
 										accountRepo:        accounts,
 										cache:              gatewayCache,
 										concurrencyService: NewConcurrencyService(noSlot),
 									}

 									picked, err := gateway.SelectAccountWithLoadAwareness(context.Background(), &groupID, sessionHash, "gpt-4", nil)
 									if err != nil {
 										t.Fatalf("SelectAccountWithLoadAwareness error: %v", err)
 									}
 									if picked == nil || picked.WaitPlan == nil {
 										t.Fatal("expected sticky wait plan")
 									}
 									if picked.Account == nil || picked.Account.ID != 1 {
 										t.Fatal("expected account 1")
 									}
 								}
 								func TestOpenAISelectAccountWithLoadAwareness_PrefersLowerLoad(t *testing.T) {
 									groupID := int64(1)
 									repo := stubOpenAIAccountRepo{
 										accounts: []Account{
 											{ID: 1, Platform: PlatformOpenAI, Status: StatusActive, Schedulable: true, Concurrency: 1, Priority: 1},
 											{ID: 2, Platform: PlatformOpenAI, Status: StatusActive, Schedulable: true, Concurrency: 1, Priority: 1},
 										},
 									}
 									cache := &stubGatewayCache{}
 									concurrencyCache := stubConcurrencyCache{
 										loadMap: map[int64]*AccountLoadInfo{
 : {AccountID: 1, LoadRate: 80},
 : {AccountID: 2, LoadRate: 10},
 										},
 									}
 									svc := &OpenAIGatewayService{
 										accountRepo:        repo,
 										cache:              cache,
 										concurrencyService: NewConcurrencyService(concurrencyCache),
 									}
 									selection, err := svc.SelectAccountWithLoadAwareness(context.Background(), &groupID, "load", "gpt-4", nil)
 									if err != nil {
 										t.Fatalf("SelectAccountWithLoadAwareness error: %v", err)
 									}
 									if selection == nil || selection.Account == nil || selection.Account.ID != 2 {
 										t.Fatalf("expected account 2")
 									}
 									if cache.sessionBindings["openai:load"] != 2 {
 										t.Fatalf("expected sticky session updated")
 									}
 								}
 								// TestOpenAISelectAccountForModelWithExclusions_StickyExcludedFallback binds the
 								// session to account 1, passes account 1 in the exclusion set, and expects the
 								// selector to return account 2 instead.
 								func TestOpenAISelectAccountForModelWithExclusions_StickyExcludedFallback(t *testing.T) {
 									sessionHash := "excluded"
 									skip := map[int64]struct{}{1: {}}

 									accounts := stubOpenAIAccountRepo{
 										accounts: []Account{
 											{ID: 1, Platform: PlatformOpenAI, Status: StatusActive, Schedulable: true, Concurrency: 1, Priority: 1},
 											{ID: 2, Platform: PlatformOpenAI, Status: StatusActive, Schedulable: true, Concurrency: 1, Priority: 2},
 										},
 									}
 									gatewayCache := &stubGatewayCache{
 										sessionBindings: map[string]int64{"openai:" + sessionHash: 1},
 									}
 									gateway := &OpenAIGatewayService{
 										accountRepo: accounts,
 										cache:       gatewayCache,
 									}

 									picked, err := gateway.SelectAccountForModelWithExclusions(context.Background(), nil, sessionHash, "gpt-4", skip)
 									if err != nil {
 										t.Fatalf("SelectAccountForModelWithExclusions error: %v", err)
 									}
 									if picked == nil || picked.ID != 2 {
 										t.Fatal("expected account 2")
 									}
 								}
 								// TestOpenAISelectAccountForModelWithExclusions_StickyNonOpenAI binds the session
 								// to account 1, whose Platform is PlatformAnthropic, and expects the selector
 								// to return the OpenAI account 2 instead.
 								func TestOpenAISelectAccountForModelWithExclusions_StickyNonOpenAI(t *testing.T) {
 									sessionHash := "non-openai"

 									accounts := stubOpenAIAccountRepo{
 										accounts: []Account{
 											{ID: 1, Platform: PlatformAnthropic, Status: StatusActive, Schedulable: true, Concurrency: 1, Priority: 1},
 											{ID: 2, Platform: PlatformOpenAI, Status: StatusActive, Schedulable: true, Concurrency: 1, Priority: 2},
 										},
 									}
 									gatewayCache := &stubGatewayCache{
 										sessionBindings: map[string]int64{"openai:" + sessionHash: 1},
 									}
 									gateway := &OpenAIGatewayService{
 										accountRepo: accounts,
 										cache:       gatewayCache,
 									}

 									picked, err := gateway.SelectAccountForModelWithExclusions(context.Background(), nil, sessionHash, "gpt-4", nil)
 									if err != nil {
 										t.Fatalf("SelectAccountForModelWithExclusions error: %v", err)
 									}
 									if picked == nil || picked.ID != 2 {
 										t.Fatal("expected account 2")
 									}
 								}
 								func TestOpenAISelectAccountForModelWithExclusions_NoAccounts(t *testing.T) {
 									repo := stubOpenAIAccountRepo{accounts: []Account{}}
 									cache := &stubGatewayCache{}
 									svc := &OpenAIGatewayService{
 										accountRepo: repo,
 										cache:       cache,
 									}
 									acc, err := svc.SelectAccountForModelWithExclusions(context.Background(), nil, "", "", nil)
 									if err == nil {
 										t.Fatalf("expected error for no accounts")
 									}
 									if acc != nil {
 										t.Fatalf("expected nil account")
 									}
 									if !strings.Contains(err.Error(), "no available OpenAI accounts") {
 										t.Fatalf("unexpected error: %v", err)
 									}
 								}
 								// TestOpenAISelectAccountWithLoadAwareness_NoCandidates gives the only account a
 								// RateLimitResetAt one hour in the future and expects the load-aware selector
 								// to return an error and a nil selection.
 								func TestOpenAISelectAccountWithLoadAwareness_NoCandidates(t *testing.T) {
 									var groupID int64 = 1
 									rateLimitedUntil := time.Now().Add(time.Hour)

 									accounts := stubOpenAIAccountRepo{
 										accounts: []Account{
 											{ID: 1, Platform: PlatformOpenAI, Status: StatusActive, Schedulable: true, Concurrency: 1, Priority: 1, RateLimitResetAt: &rateLimitedUntil},
 										},
 									}
 									gateway := &OpenAIGatewayService{
 										accountRepo:        accounts,
 										cache:              &stubGatewayCache{},
 										concurrencyService: NewConcurrencyService(stubConcurrencyCache{}),
 									}

 									picked, err := gateway.SelectAccountWithLoadAwareness(context.Background(), &groupID, "", "gpt-4", nil)
 									if err == nil {
 										t.Fatal("expected error for no candidates")
 									}
 									if picked != nil {
 										t.Fatal("expected nil selection")
 									}
 								}
 								func TestOpenAISelectAccountWithLoadAwareness_AllFullWaitPlan(t *testing.T) {
 									groupID := int64(1)
 									repo := stubOpenAIAccountRepo{
 										accounts: []Account{
 											{ID: 1, Platform: PlatformOpenAI, Status: StatusActive, Schedulable: true, Concurrency: 1, Priority: 1},
 										},
 									}
 									cache := &stubGatewayCache{}
 									concurrencyCache := stubConcurrencyCache{
 										loadMap: map[int64]*AccountLoadInfo{
 : {AccountID: 1, LoadRate: 100},
 										},
 									}
 									svc := &OpenAIGatewayService{
 										accountRepo:        repo,
 										cache:              cache,
 										concurrencyService: NewConcurrencyService(concurrencyCache),
 									}
 									selection, err := svc.SelectAccountWithLoadAwareness(context.Background(), &groupID, "", "gpt-4", nil)
 									if err != nil {
 										t.Fatalf("SelectAccountWithLoadAwareness error: %v", err)
 									}
 									if selection == nil || selection.WaitPlan == nil {
 										t.Fatalf("expected wait plan")
 									}
 								}
 								// TestOpenAISelectAccountWithLoadAwareness_LoadBatchErrorNoAcquire combines a
 								// failing batch load lookup with a slot acquisition that reports false, and
 								// expects the selector to return a WaitPlan without an error.
 								func TestOpenAISelectAccountWithLoadAwareness_LoadBatchErrorNoAcquire(t *testing.T) {
 									var groupID int64 = 1
 									accounts := stubOpenAIAccountRepo{
 										accounts: []Account{
 											{ID: 1, Platform: PlatformOpenAI, Status: StatusActive, Schedulable: true, Concurrency: 1, Priority: 1},
 										},
 									}
 									brokenCache := stubConcurrencyCache{
 										loadBatchErr:   errors.New("load batch failed"),
 										acquireResults: map[int64]bool{1: false},
 									}
 									gateway := &OpenAIGatewayService{
 										accountRepo:        accounts,
 										cache:              &stubGatewayCache{},
 										concurrencyService: NewConcurrencyService(brokenCache),
 									}

 									picked, err := gateway.SelectAccountWithLoadAwareness(context.Background(), &groupID, "", "gpt-4", nil)
 									if err != nil {
 										t.Fatalf("SelectAccountWithLoadAwareness error: %v", err)
 									}
 									if picked == nil || picked.WaitPlan == nil {
 										t.Fatal("expected wait plan")
 									}
 								}
 								func TestOpenAISelectAccountWithLoadAwareness_MissingLoadInfo(t *testing.T) {
 									groupID := int64(1)
 									repo := stubOpenAIAccountRepo{
 										accounts: []Account{
 											{ID: 1, Platform: PlatformOpenAI, Status: StatusActive, Schedulable: true, Concurrency: 1, Priority: 1},
 											{ID: 2, Platform: PlatformOpenAI, Status: StatusActive, Schedulable: true, Concurrency: 1, Priority: 1},
 										},
 									}
 									cache := &stubGatewayCache{}
 									concurrencyCache := stubConcurrencyCache{
 										loadMap: map[int64]*AccountLoadInfo{
 : {AccountID: 1, LoadRate: 50},
 										},
 										skipDefaultLoad: true,
 									}
 									svc := &OpenAIGatewayService{
 										accountRepo:        repo,
 										cache:              cache,
 										concurrencyService: NewConcurrencyService(concurrencyCache),
 									}
 									selection, err := svc.SelectAccountWithLoadAwareness(context.Background(), &groupID, "", "gpt-4", nil)
 									if err != nil {
 										t.Fatalf("SelectAccountWithLoadAwareness error: %v", err)
 									}
 									if selection == nil || selection.Account == nil || selection.Account.ID != 2 {
 										t.Fatalf("expected account 2")
 									}
 								}
 								// TestOpenAISelectAccountForModelWithExclusions_LeastRecentlyUsed sets up two
 								// accounts of equal priority with LastUsedAt one and two hours ago, and expects
 								// the selector to return account 2, the one used longer ago.
 								func TestOpenAISelectAccountForModelWithExclusions_LeastRecentlyUsed(t *testing.T) {
 									twoHoursAgo := time.Now().Add(-2 * time.Hour)
 									oneHourAgo := time.Now().Add(-1 * time.Hour)

 									accounts := stubOpenAIAccountRepo{
 										accounts: []Account{
 											{ID: 1, Platform: PlatformOpenAI, Status: StatusActive, Schedulable: true, Priority: 1, LastUsedAt: &oneHourAgo},
 											{ID: 2, Platform: PlatformOpenAI, Status: StatusActive, Schedulable: true, Priority: 1, LastUsedAt: &twoHoursAgo},
 										},
 									}
 									gateway := &OpenAIGatewayService{
 										accountRepo: accounts,
 										cache:       &stubGatewayCache{},
 									}

 									picked, err := gateway.SelectAccountForModelWithExclusions(context.Background(), nil, "", "gpt-4", nil)
 									if err != nil {
 										t.Fatalf("SelectAccountForModelWithExclusions error: %v", err)
 									}
 									if picked == nil || picked.ID != 2 {
 										t.Fatal("expected account 2")
 									}
 								}
 								func TestOpenAISelectAccountWithLoadAwareness_PreferNeverUsed(t *testing.T) {
 									groupID := int64(1)
 									lastUsed := time.Now().Add(-1 * time.Hour)
 									repo := stubOpenAIAccountRepo{
 										accounts: []Account{
 											{ID: 1, Platform: PlatformOpenAI, Status: StatusActive, Schedulable: true, Concurrency: 1, Priority: 1, LastUsedAt: &lastUsed},
 											{ID: 2, Platform: PlatformOpenAI, Status: StatusActive, Schedulable: true, Concurrency: 1, Priority: 1},
 										},
 									}
 									cache := &stubGatewayCache{}
 									concurrencyCache := stubConcurrencyCache{
 										loadMap: map[int64]*AccountLoadInfo{
 : {AccountID: 1, LoadRate: 10},
 : {AccountID: 2, LoadRate: 10},
 										},
 									}
 									svc := &OpenAIGatewayService{
 										accountRepo:        repo,
 										cache:              cache,
 										concurrencyService: NewConcurrencyService(concurrencyCache),
 									}
 									selection, err := svc.SelectAccountWithLoadAwareness(context.Background(), &groupID, "", "gpt-4", nil)
 									if err != nil {
 										t.Fatalf("SelectAccountWithLoadAwareness error: %v", err)
 									}
 									if selection == nil || selection.Account == nil || selection.Account.ID != 2 {
 										t.Fatalf("expected account 2")
 									}
 								}
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
+								func TestOpenAIStreamingTimeout(t *testing.T) {
 									gin.SetMode(gin.TestMode)
 									cfg := &config.Config{
 										Gateway: config.GatewayConfig{
 											StreamDataIntervalTimeout: 1,
 											StreamKeepaliveInterval:   0,
 											MaxLineSize:               defaultMaxLineSize,
 										},
 									}
 									svc := &OpenAIGatewayService{cfg: cfg}
 									rec := httptest.NewRecorder()
 									c, _ := gin.CreateTestContext(rec)
 									c.Request = httptest.NewRequest(http.MethodPost, "/", nil)
 									pr, pw := io.Pipe()
 									resp := &http.Response{
 										StatusCode: http.StatusOK,
 										Body:       pr,
 										Header:     http.Header{},
 									}
 									start := time.Now()
 									_, err := svc.handleStreamingResponse(c.Request.Context(), resp, c, &Account{ID: 1}, start, "model", "model")
 									_ = pw.Close()
 									_ = pr.Close()
 									if err == nil || !strings.Contains(err.Error(), "stream data interval timeout") {
 										t.Fatalf("expected stream timeout error, got %v", err)
 									}
-												fix(openai): emit OpenAI-compatible SSE error events

											
										
										
											2026-01-19 13:53:39 +08:00
+									if !strings.Contains(rec.Body.String(), "\"type\":\"error\"") || !strings.Contains(rec.Body.String(), "stream_timeout") {
 										t.Fatalf("expected OpenAI-compatible error SSE event, got %q", rec.Body.String())
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
+									}
 								}
-												fix(gateway): avoid injecting invalid SSE on client cancel

											
										
										
											2026-01-15 21:42:13 +08:00
+								func TestOpenAIStreamingContextCanceledDoesNotInjectErrorEvent(t *testing.T) {
 									gin.SetMode(gin.TestMode)
 									cfg := &config.Config{
 										Gateway: config.GatewayConfig{
 											StreamDataIntervalTimeout: 0,
 											StreamKeepaliveInterval:   0,
 											MaxLineSize:               defaultMaxLineSize,
 										},
 									}
 									svc := &OpenAIGatewayService{cfg: cfg}
 									rec := httptest.NewRecorder()
 									c, _ := gin.CreateTestContext(rec)
 									ctx, cancel := context.WithCancel(context.Background())
 									cancel()
 									c.Request = httptest.NewRequest(http.MethodPost, "/", nil).WithContext(ctx)
 									resp := &http.Response{
 										StatusCode: http.StatusOK,
 										Body:       cancelReadCloser{},
 										Header:     http.Header{},
 									}
 									_, err := svc.handleStreamingResponse(c.Request.Context(), resp, c, &Account{ID: 1}, time.Now(), "model", "model")
 									if err != nil {
 										t.Fatalf("expected nil error, got %v", err)
 									}
 									if strings.Contains(rec.Body.String(), "event: error") || strings.Contains(rec.Body.String(), "stream_read_error") {
 										t.Fatalf("expected no injected SSE error event, got %q", rec.Body.String())
 									}
 								}
-												fix(gateway): drain upstream after client disconnect

											
										
										
											2026-01-15 21:51:14 +08:00
+								func TestOpenAIStreamingClientDisconnectDrainsUpstreamUsage(t *testing.T) {
 									gin.SetMode(gin.TestMode)
 									cfg := &config.Config{
 										Gateway: config.GatewayConfig{
 											StreamDataIntervalTimeout: 0,
 											StreamKeepaliveInterval:   0,
 											MaxLineSize:               defaultMaxLineSize,
 										},
 									}
 									svc := &OpenAIGatewayService{cfg: cfg}
 									rec := httptest.NewRecorder()
 									c, _ := gin.CreateTestContext(rec)
 									c.Request = httptest.NewRequest(http.MethodPost, "/", nil)
 									c.Writer = &failingGinWriter{ResponseWriter: c.Writer, failAfter: 0}
 									pr, pw := io.Pipe()
 									resp := &http.Response{
 										StatusCode: http.StatusOK,
 										Body:       pr,
 										Header:     http.Header{},
 									}
 									go func() {
 										defer func() { _ = pw.Close() }()
 										_, _ = pw.Write([]byte("data: {\"type\":\"response.in_progress\",\"response\":{}}\n\n"))
 										_, _ = pw.Write([]byte("data: {\"type\":\"response.completed\",\"response\":{\"usage\":{\"input_tokens\":3,\"output_tokens\":5,\"input_tokens_details\":{\"cached_tokens\":1}}}}\n\n"))
 									}()
 									result, err := svc.handleStreamingResponse(c.Request.Context(), resp, c, &Account{ID: 1}, time.Now(), "model", "model")
 									_ = pr.Close()
 									if err != nil {
 										t.Fatalf("expected nil error, got %v", err)
 									}
 									if result == nil || result.usage == nil {
 										t.Fatalf("expected usage result")
 									}
 									if result.usage.InputTokens != 3 || result.usage.OutputTokens != 5 || result.usage.CacheReadInputTokens != 1 {
 										t.Fatalf("unexpected usage: %+v", *result.usage)
 									}
 									if strings.Contains(rec.Body.String(), "event: error") || strings.Contains(rec.Body.String(), "write_failed") {
 										t.Fatalf("expected no injected SSE error event, got %q", rec.Body.String())
 									}
 								}
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
+								func TestOpenAIStreamingTooLong(t *testing.T) {
 									gin.SetMode(gin.TestMode)
 									cfg := &config.Config{
 										Gateway: config.GatewayConfig{
 											StreamDataIntervalTimeout: 0,
 											StreamKeepaliveInterval:   0,
 											MaxLineSize:               64 * 1024,
 										},
 									}
 									svc := &OpenAIGatewayService{cfg: cfg}
 									rec := httptest.NewRecorder()
 									c, _ := gin.CreateTestContext(rec)
 									c.Request = httptest.NewRequest(http.MethodPost, "/", nil)
 									pr, pw := io.Pipe()
 									resp := &http.Response{
 										StatusCode: http.StatusOK,
 										Body:       pr,
 										Header:     http.Header{},
 									}
 									go func() {
-												fix(后端): 修复 lint 失败并清理无用代码

修正测试中的 APIKey 名称引用
移除不可达返回与未使用函数
统一 gofmt 格式并处理 Close 错误

											
										
										
											2026-01-04 22:10:32 +08:00
+										defer func() { _ = pw.Close() }()
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
+										// 写入超过 MaxLineSize 的单行数据，触发 ErrTooLong
 										payload := "data: " + strings.Repeat("a", 128*1024) + "\n"
 										_, _ = pw.Write([]byte(payload))
 									}()
 									_, err := svc.handleStreamingResponse(c.Request.Context(), resp, c, &Account{ID: 2}, time.Now(), "model", "model")
 									_ = pr.Close()
 									if !errors.Is(err, bufio.ErrTooLong) {
 										t.Fatalf("expected ErrTooLong, got %v", err)
 									}
-												fix(openai): emit OpenAI-compatible SSE error events

											
										
										
											2026-01-19 13:53:39 +08:00
+									if !strings.Contains(rec.Body.String(), "\"type\":\"error\"") || !strings.Contains(rec.Body.String(), "response_too_large") {
 										t.Fatalf("expected OpenAI-compatible error SSE event, got %q", rec.Body.String())
-												fix(流式): 提升SSE稳定性并统一超时配置

- 扩展SSE行长与间隔超时处理，补充keepalive

- 写入失败与超长行时发送错误事件，修复并发释放

- 同步默认配置与示例配置，更新Caddy超时/压缩规则

- 新增OpenAI流式超时与超长行测试

测试: go test ./...

											
										
										
											2026-01-04 19:49:59 +08:00
+									}
 								}
-												feat(安全): 添加安全开关并完善测试流程

实现安全开关默认关闭与响应头透传逻辑
- URL 校验与响应头过滤支持开关并覆盖流式路径
- 非流式 Content-Type 透传/默认值按配置生效
- 接入 go test、golangci-lint 与前端 lint/typecheck
- 补充相关测试与配置/文档说明

											
										
										
											2026-01-05 13:54:43 +08:00
 								// TestOpenAINonStreamingContentTypePassThrough sends an upstream response whose
 								// Content-Type is "application/vnd.test+json", with response-header filtering
 								// disabled in the config, and expects that value to appear in the recorded
 								// Content-Type header.
 								func TestOpenAINonStreamingContentTypePassThrough(t *testing.T) {
 									gin.SetMode(gin.TestMode)

 									gateway := &OpenAIGatewayService{cfg: &config.Config{
 										Security: config.SecurityConfig{
 											ResponseHeaders: config.ResponseHeaderConfig{Enabled: false},
 										},
 									}}
 									recorder := httptest.NewRecorder()
 									ginCtx, _ := gin.CreateTestContext(recorder)
 									ginCtx.Request = httptest.NewRequest(http.MethodPost, "/", nil)

 									payload := []byte(`{"usage":{"input_tokens":1,"output_tokens":2,"input_tokens_details":{"cached_tokens":0}}}`)
 									upstream := &http.Response{
 										StatusCode: http.StatusOK,
 										Body:       io.NopCloser(bytes.NewReader(payload)),
 										Header:     http.Header{"Content-Type": []string{"application/vnd.test+json"}},
 									}

 									if _, err := gateway.handleNonStreamingResponse(ginCtx.Request.Context(), upstream, ginCtx, &Account{}, "model", "model"); err != nil {
 										t.Fatalf("handleNonStreamingResponse error: %v", err)
 									}
 									if contentType := recorder.Header().Get("Content-Type"); !strings.Contains(contentType, "application/vnd.test+json") {
 										t.Fatalf("expected Content-Type passthrough, got %q", contentType)
 									}
 								}
 								// TestOpenAINonStreamingContentTypeDefault sends an upstream response with no
 								// headers at all and expects the recorded Content-Type header to contain
 								// "application/json".
 								func TestOpenAINonStreamingContentTypeDefault(t *testing.T) {
 									gin.SetMode(gin.TestMode)

 									gateway := &OpenAIGatewayService{cfg: &config.Config{
 										Security: config.SecurityConfig{
 											ResponseHeaders: config.ResponseHeaderConfig{Enabled: false},
 										},
 									}}
 									recorder := httptest.NewRecorder()
 									ginCtx, _ := gin.CreateTestContext(recorder)
 									ginCtx.Request = httptest.NewRequest(http.MethodPost, "/", nil)

 									payload := []byte(`{"usage":{"input_tokens":1,"output_tokens":2,"input_tokens_details":{"cached_tokens":0}}}`)
 									upstream := &http.Response{
 										StatusCode: http.StatusOK,
 										Body:       io.NopCloser(bytes.NewReader(payload)),
 										Header:     http.Header{},
 									}

 									if _, err := gateway.handleNonStreamingResponse(ginCtx.Request.Context(), upstream, ginCtx, &Account{}, "model", "model"); err != nil {
 										t.Fatalf("handleNonStreamingResponse error: %v", err)
 									}
 									if contentType := recorder.Header().Get("Content-Type"); !strings.Contains(contentType, "application/json") {
 										t.Fatalf("expected default Content-Type, got %q", contentType)
 									}
 								}
 								func TestOpenAIStreamingHeadersOverride(t *testing.T) {
 									gin.SetMode(gin.TestMode)
 									cfg := &config.Config{
 										Security: config.SecurityConfig{
 											ResponseHeaders: config.ResponseHeaderConfig{Enabled: false},
 										},
 										Gateway: config.GatewayConfig{
 											StreamDataIntervalTimeout: 0,
 											StreamKeepaliveInterval:   0,
 											MaxLineSize:               defaultMaxLineSize,
 										},
 									}
 									svc := &OpenAIGatewayService{cfg: cfg}
 									rec := httptest.NewRecorder()
 									c, _ := gin.CreateTestContext(rec)
 									c.Request = httptest.NewRequest(http.MethodPost, "/", nil)
 									pr, pw := io.Pipe()
 									resp := &http.Response{
 										StatusCode: http.StatusOK,
 										Body:       pr,
 										Header: http.Header{
 											"Cache-Control": []string{"upstream"},
-												fix(安全): 关闭白名单时保留最小校验与默认白名单

实现 allow_insecure_http 并在关闭校验时执行最小格式验证
- 关闭 allowlist 时要求 URL 可解析且 scheme 合规
- 响应头过滤关闭时使用默认白名单策略
- 更新相关文档、示例与测试覆盖

											
										
										
											2026-01-05 14:41:08 +08:00
+											"X-Request-Id":  []string{"req-123"},
-												feat(安全): 添加安全开关并完善测试流程

实现安全开关默认关闭与响应头透传逻辑
- URL 校验与响应头过滤支持开关并覆盖流式路径
- 非流式 Content-Type 透传/默认值按配置生效
- 接入 go test、golangci-lint 与前端 lint/typecheck
- 补充相关测试与配置/文档说明

											
										
										
											2026-01-05 13:54:43 +08:00
+											"Content-Type":  []string{"application/custom"},
 										},
 									}
 									go func() {
 										defer func() { _ = pw.Close() }()
 										_, _ = pw.Write([]byte("data: {}\n\n"))
 									}()
 									_, err := svc.handleStreamingResponse(c.Request.Context(), resp, c, &Account{ID: 1}, time.Now(), "model", "model")
 									_ = pr.Close()
 									if err != nil {
 										t.Fatalf("handleStreamingResponse error: %v", err)
 									}
 									if rec.Header().Get("Cache-Control") != "no-cache" {
 										t.Fatalf("expected Cache-Control override, got %q", rec.Header().Get("Cache-Control"))
 									}
 									if rec.Header().Get("Content-Type") != "text/event-stream" {
 										t.Fatalf("expected Content-Type override, got %q", rec.Header().Get("Content-Type"))
 									}
-												fix(安全): 关闭白名单时保留最小校验与默认白名单

实现 allow_insecure_http 并在关闭校验时执行最小格式验证
- 关闭 allowlist 时要求 URL 可解析且 scheme 合规
- 响应头过滤关闭时使用默认白名单策略
- 更新相关文档、示例与测试覆盖

											
										
										
											2026-01-05 14:41:08 +08:00
+									if rec.Header().Get("X-Request-Id") != "req-123" {
 										t.Fatalf("expected X-Request-Id passthrough, got %q", rec.Header().Get("X-Request-Id"))
-												feat(安全): 添加安全开关并完善测试流程

实现安全开关默认关闭与响应头透传逻辑
- URL 校验与响应头过滤支持开关并覆盖流式路径
- 非流式 Content-Type 透传/默认值按配置生效
- 接入 go test、golangci-lint 与前端 lint/typecheck
- 补充相关测试与配置/文档说明

											
										
										
											2026-01-05 13:54:43 +08:00
+									}
 								}
-												perf(service): SSE Scanner buffer 改用 sync.Pool 复用，减少高并发 GC 压力

将流式响应中 bufio.Scanner 的 64KB buffer 从每次 make 分配改为
sync.Pool 复用，统一切片表达式为 [:0]、变量命名为 scanBuf，
并补充对应的单元测试。

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-06 22:55:12 +08:00
+								func TestOpenAIStreamingReuseScannerBufferAndStillWorks(t *testing.T) {
 									// Pipes a single response.completed SSE event through
 									// handleStreamingResponse and checks that the usage counters carried by
 									// that event are reported on the returned result.
 									gin.SetMode(gin.TestMode)
 									svc := &OpenAIGatewayService{cfg: &config.Config{
 										Gateway: config.GatewayConfig{
 											StreamDataIntervalTimeout: 0,
 											StreamKeepaliveInterval:   0,
 											MaxLineSize:               defaultMaxLineSize,
 										},
 									}}
 									recorder := httptest.NewRecorder()
 									ginCtx, _ := gin.CreateTestContext(recorder)
 									ginCtx.Request = httptest.NewRequest(http.MethodPost, "/", nil)
 									bodyReader, bodyWriter := io.Pipe()
 									upstream := &http.Response{
 										StatusCode: http.StatusOK,
 										Body:       bodyReader,
 										Header:     http.Header{},
 									}
 									// The writer side runs concurrently because io.Pipe writes block until read.
 									go func() {
 										defer func() { _ = bodyWriter.Close() }()
 										event := []byte("data: {\"type\":\"response.completed\",\"response\":{\"usage\":{\"input_tokens\":1,\"output_tokens\":2,\"input_tokens_details\":{\"cached_tokens\":3}}}}\n\n")
 										_, _ = bodyWriter.Write(event)
 									}()
 									streamResult, streamErr := svc.handleStreamingResponse(ginCtx.Request.Context(), upstream, ginCtx, &Account{ID: 1}, time.Now(), "model", "model")
 									_ = bodyReader.Close()
 									require.NoError(t, streamErr)
 									require.NotNil(t, streamResult)
 									require.NotNil(t, streamResult.usage)
 									require.Equal(t, 1, streamResult.usage.InputTokens)
 									require.Equal(t, 2, streamResult.usage.OutputTokens)
 									require.Equal(t, 3, streamResult.usage.CacheReadInputTokens)
 								}
-												feat(安全): 添加安全开关并完善测试流程

实现安全开关默认关闭与响应头透传逻辑
- URL 校验与响应头过滤支持开关并覆盖流式路径
- 非流式 Content-Type 透传/默认值按配置生效
- 接入 go test、golangci-lint 与前端 lint/typecheck
- 补充相关测试与配置/文档说明

											
										
										
											2026-01-05 13:54:43 +08:00
+								func TestOpenAIInvalidBaseURLWhenAllowlistDisabled(t *testing.T) {
 									gin.SetMode(gin.TestMode)
 									cfg := &config.Config{
 										Security: config.SecurityConfig{
 											URLAllowlist: config.URLAllowlistConfig{Enabled: false},
 										},
 									}
 									svc := &OpenAIGatewayService{cfg: cfg}
 									rec := httptest.NewRecorder()
 									c, _ := gin.CreateTestContext(rec)
 									c.Request = httptest.NewRequest(http.MethodPost, "/", nil)
 									account := &Account{
 										Platform:    PlatformOpenAI,
 										Type:        AccountTypeAPIKey,
 										Credentials: map[string]any{"base_url": "://invalid-url"},
 									}
-												Align OAuth transform with OpenCode instructions

											
										
										
											2026-01-10 20:53:16 +08:00
+									_, err := svc.buildUpstreamRequest(c.Request.Context(), c, account, []byte("{}"), "token", false, "", false)
-												feat(安全): 添加安全开关并完善测试流程

实现安全开关默认关闭与响应头透传逻辑
- URL 校验与响应头过滤支持开关并覆盖流式路径
- 非流式 Content-Type 透传/默认值按配置生效
- 接入 go test、golangci-lint 与前端 lint/typecheck
- 补充相关测试与配置/文档说明

											
										
										
											2026-01-05 13:54:43 +08:00
+									if err == nil {
 										t.Fatalf("expected error for invalid base_url when allowlist disabled")
 									}
 								}
-												fix(安全): 关闭白名单时保留最小校验与默认白名单

实现 allow_insecure_http 并在关闭校验时执行最小格式验证
- 关闭 allowlist 时要求 URL 可解析且 scheme 合规
- 响应头过滤关闭时使用默认白名单策略
- 更新相关文档、示例与测试覆盖

											
										
										
											2026-01-05 14:41:08 +08:00
+								func TestOpenAIValidateUpstreamBaseURLDisabledRequiresHTTPS(t *testing.T) {
-												feat(安全): 添加安全开关并完善测试流程

实现安全开关默认关闭与响应头透传逻辑
- URL 校验与响应头过滤支持开关并覆盖流式路径
- 非流式 Content-Type 透传/默认值按配置生效
- 接入 go test、golangci-lint 与前端 lint/typecheck
- 补充相关测试与配置/文档说明

											
										
										
											2026-01-05 13:54:43 +08:00
+									cfg := &config.Config{
 										Security: config.SecurityConfig{
 											URLAllowlist: config.URLAllowlistConfig{Enabled: false},
 										},
 									}
 									svc := &OpenAIGatewayService{cfg: cfg}
-												fix(安全): 关闭白名单时保留最小校验与默认白名单

实现 allow_insecure_http 并在关闭校验时执行最小格式验证
- 关闭 allowlist 时要求 URL 可解析且 scheme 合规
- 响应头过滤关闭时使用默认白名单策略
- 更新相关文档、示例与测试覆盖

											
										
										
											2026-01-05 14:41:08 +08:00
+									if _, err := svc.validateUpstreamBaseURL("http://not-https.example.com"); err == nil {
 										t.Fatalf("expected http to be rejected when allow_insecure_http is false")
 									}
 									normalized, err := svc.validateUpstreamBaseURL("https://example.com")
 									if err != nil {
 										t.Fatalf("expected https to be allowed when allowlist disabled, got %v", err)
 									}
 									if normalized != "https://example.com" {
 										t.Fatalf("expected raw url passthrough, got %q", normalized)
 									}
 								}
 								func TestOpenAIValidateUpstreamBaseURLDisabledAllowsHTTP(t *testing.T) {
 									cfg := &config.Config{
 										Security: config.SecurityConfig{
 											URLAllowlist: config.URLAllowlistConfig{
 												Enabled:           false,
 												AllowInsecureHTTP: true,
 											},
 										},
 									}
 									svc := &OpenAIGatewayService{cfg: cfg}
-												feat(安全): 添加安全开关并完善测试流程

实现安全开关默认关闭与响应头透传逻辑
- URL 校验与响应头过滤支持开关并覆盖流式路径
- 非流式 Content-Type 透传/默认值按配置生效
- 接入 go test、golangci-lint 与前端 lint/typecheck
- 补充相关测试与配置/文档说明

											
										
										
											2026-01-05 13:54:43 +08:00
+									normalized, err := svc.validateUpstreamBaseURL("http://not-https.example.com")
 									if err != nil {
-												fix(安全): 关闭白名单时保留最小校验与默认白名单

实现 allow_insecure_http 并在关闭校验时执行最小格式验证
- 关闭 allowlist 时要求 URL 可解析且 scheme 合规
- 响应头过滤关闭时使用默认白名单策略
- 更新相关文档、示例与测试覆盖

											
										
										
											2026-01-05 14:41:08 +08:00
+										t.Fatalf("expected http allowed when allow_insecure_http is true, got %v", err)
-												feat(安全): 添加安全开关并完善测试流程

实现安全开关默认关闭与响应头透传逻辑
- URL 校验与响应头过滤支持开关并覆盖流式路径
- 非流式 Content-Type 透传/默认值按配置生效
- 接入 go test、golangci-lint 与前端 lint/typecheck
- 补充相关测试与配置/文档说明

											
										
										
											2026-01-05 13:54:43 +08:00
+									}
 									if normalized != "http://not-https.example.com" {
 										t.Fatalf("expected raw url passthrough, got %q", normalized)
 									}
 								}
 								// TestOpenAIValidateUpstreamBaseURLEnabledEnforcesAllowlist checks that,
 								// with the allowlist enabled for example.com only, that host validates and
 								// a different host is rejected.
 								func TestOpenAIValidateUpstreamBaseURLEnabledEnforcesAllowlist(t *testing.T) {
 									allowlist := config.URLAllowlistConfig{
 										Enabled:       true,
 										UpstreamHosts: []string{"example.com"},
 									}
 									svc := &OpenAIGatewayService{cfg: &config.Config{
 										Security: config.SecurityConfig{URLAllowlist: allowlist},
 									}}
 									_, allowedErr := svc.validateUpstreamBaseURL("https://example.com")
 									if allowedErr != nil {
 										t.Fatalf("expected allowlisted host to pass, got %v", allowedErr)
 									}
 									_, blockedErr := svc.validateUpstreamBaseURL("https://evil.com")
 									if blockedErr == nil {
 										t.Fatalf("expected non-allowlisted host to fail")
 									}
 								}
-												perf(service): 优化 model 替换函数，用 gjson/sjson 替代全量 JSON 序列化

SSE 热路径中 replaceModelInSSELine 和 replaceModelInResponseBody 原来
使用 json.Unmarshal/Marshal 对每个事件做全量反序列化再序列化，现改为
gjson.Get/sjson.Set 精确字段操作，消除 O(n) 中间 map 分配，保持 JSON
字段顺序不变。涉及 OpenAIGatewayService 和 GatewayService 两个服务。

新增 23 个单元测试覆盖：顶层/嵌套 model 替换、不匹配跳过、空行/[DONE]/
非法 JSON 等边界情况。

Fixes: P1-08

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-07 17:09:55 +08:00
-												fix(openai): restore ws usage window display

											
										
										
											2026-03-06 20:46:10 +08:00
+								func TestOpenAIUpdateCodexUsageSnapshotFromHeaders(t *testing.T) {
 									// Feeds x-codex-* usage headers to UpdateCodexUsageSnapshotFromHeaders and
 									// inspects the map handed to the repository's UpdateExtra, which the stub
 									// forwards on a buffered channel.
 									repo := &snapshotUpdateAccountRepo{updateExtraCalls: make(chan map[string]any, 1)}
 									svc := &OpenAIGatewayService{accountRepo: repo}
 									codexHeaders := make(http.Header)
 									for _, kv := range [][2]string{
 										{"x-codex-primary-used-percent", "12"},
 										{"x-codex-secondary-used-percent", "34"},
 										{"x-codex-primary-window-minutes", "300"},
 										{"x-codex-secondary-window-minutes", "10080"},
 										{"x-codex-primary-reset-after-seconds", "600"},
 										{"x-codex-secondary-reset-after-seconds", "86400"},
 									} {
 										codexHeaders.Set(kv[0], kv[1])
 									}
 									svc.UpdateCodexUsageSnapshotFromHeaders(context.Background(), 123, codexHeaders)
 									// Wait with a timeout so a missing UpdateExtra call fails the test
 									// instead of blocking forever.
 									select {
 									case <-time.After(2 * time.Second):
 										t.Fatal("expected UpdateExtra to be called")
 									case extra := <-repo.updateExtraCalls:
 										require.Equal(t, 12.0, extra["codex_5h_used_percent"])
 										require.Equal(t, 34.0, extra["codex_7d_used_percent"])
 										require.Equal(t, 600, extra["codex_5h_reset_after_seconds"])
 										require.Equal(t, 86400, extra["codex_7d_reset_after_seconds"])
 									}
 								}
-												fix(openai): support remote compact task

											
										
										
											2026-03-06 18:50:28 +08:00
+								func TestOpenAIResponsesRequestPathSuffix(t *testing.T) {
 									// Table-driven check of openAIResponsesRequestPathSuffix: each case sets
 									// the request path on a shared gin context and compares the returned
 									// suffix with the expected one.
 									gin.SetMode(gin.TestMode)
 									ginCtx, _ := gin.CreateTestContext(httptest.NewRecorder())
 									cases := []struct {
 										name string
 										path string
 										want string
 									}{
 										{name: "exact v1 responses", path: "/v1/responses", want: ""},
 										{name: "compact v1 responses", path: "/v1/responses/compact", want: "/compact"},
 										{name: "compact alias responses", path: "/responses/compact/", want: "/compact"},
 										{name: "nested suffix", path: "/openai/v1/responses/compact/detail", want: "/compact/detail"},
 										{name: "unrelated path", path: "/v1/chat/completions", want: ""},
 									}
 									for _, tc := range cases {
 										t.Run(tc.name, func(t *testing.T) {
 											ginCtx.Request = httptest.NewRequest(http.MethodPost, tc.path, nil)
 											suffix := openAIResponsesRequestPathSuffix(ginCtx)
 											require.Equal(t, tc.want, suffix)
 										})
 									}
 								}
 								// TestOpenAIBuildUpstreamRequestOpenAIPassthroughPreservesCompactPath checks
 								// that, for an OAuth account hitting /v1/responses/compact, the passthrough
 								// builder targets chatgptCodexURL+"/compact" and sets the Accept, Version
 								// and Session_Id headers.
 								func TestOpenAIBuildUpstreamRequestOpenAIPassthroughPreservesCompactPath(t *testing.T) {
 									gin.SetMode(gin.TestMode)
 									const payload = `{"model":"gpt-5"}`
 									ginCtx, _ := gin.CreateTestContext(httptest.NewRecorder())
 									ginCtx.Request = httptest.NewRequest(http.MethodPost, "/v1/responses/compact", bytes.NewReader([]byte(payload)))
 									svc := &OpenAIGatewayService{}
 									oauthAccount := &Account{Type: AccountTypeOAuth}
 									upstreamReq, err := svc.buildUpstreamRequestOpenAIPassthrough(ginCtx.Request.Context(), ginCtx, oauthAccount, []byte(payload), "token")
 									require.NoError(t, err)
 									require.Equal(t, chatgptCodexURL+"/compact", upstreamReq.URL.String())
 									sent := upstreamReq.Header
 									require.Equal(t, "application/json", sent.Get("Accept"))
 									require.Equal(t, codexCLIVersion, sent.Get("Version"))
 									require.NotEmpty(t, sent.Get("Session_Id"))
 								}
 								// TestOpenAIBuildUpstreamRequestCompactForcesJSONAcceptForOAuth checks that
 								// buildUpstreamRequest, for an OAuth account on /v1/responses/compact,
 								// targets chatgptCodexURL+"/compact" with a JSON Accept header plus the
 								// Version and Session_Id headers.
 								func TestOpenAIBuildUpstreamRequestCompactForcesJSONAcceptForOAuth(t *testing.T) {
 									gin.SetMode(gin.TestMode)
 									const payload = `{"model":"gpt-5"}`
 									ginCtx, _ := gin.CreateTestContext(httptest.NewRecorder())
 									ginCtx.Request = httptest.NewRequest(http.MethodPost, "/v1/responses/compact", bytes.NewReader([]byte(payload)))
 									svc := &OpenAIGatewayService{}
 									oauthAccount := &Account{
 										Type:        AccountTypeOAuth,
 										Credentials: map[string]any{"chatgpt_account_id": "chatgpt-acc"},
 									}
 									upstreamReq, err := svc.buildUpstreamRequest(ginCtx.Request.Context(), ginCtx, oauthAccount, []byte(payload), "token", false, "", true)
 									require.NoError(t, err)
 									require.Equal(t, chatgptCodexURL+"/compact", upstreamReq.URL.String())
 									sent := upstreamReq.Header
 									require.Equal(t, "application/json", sent.Get("Accept"))
 									require.Equal(t, codexCLIVersion, sent.Get("Version"))
 									require.NotEmpty(t, sent.Get("Session_Id"))
 								}
 								// TestOpenAIBuildUpstreamRequestPreservesCompactPathForAPIKeyBaseURL checks
 								// that an API-key account with base_url https://example.com/v1, called on
 								// /responses/compact, produces the upstream URL
 								// https://example.com/v1/responses/compact.
 								func TestOpenAIBuildUpstreamRequestPreservesCompactPathForAPIKeyBaseURL(t *testing.T) {
 									gin.SetMode(gin.TestMode)
 									const payload = `{"model":"gpt-5"}`
 									ginCtx, _ := gin.CreateTestContext(httptest.NewRecorder())
 									ginCtx.Request = httptest.NewRequest(http.MethodPost, "/responses/compact", bytes.NewReader([]byte(payload)))
 									cfg := &config.Config{
 										Security: config.SecurityConfig{
 											URLAllowlist: config.URLAllowlistConfig{Enabled: false},
 										},
 									}
 									svc := &OpenAIGatewayService{cfg: cfg}
 									apiKeyAccount := &Account{
 										Type:        AccountTypeAPIKey,
 										Platform:    PlatformOpenAI,
 										Credentials: map[string]any{"base_url": "https://example.com/v1"},
 									}
 									upstreamReq, err := svc.buildUpstreamRequest(ginCtx.Request.Context(), ginCtx, apiKeyAccount, []byte(payload), "token", false, "", false)
 									require.NoError(t, err)
 									require.Equal(t, "https://example.com/v1/responses/compact", upstreamReq.URL.String())
 								}
-												fix(openai): detect official codex client by headers

											
										
										
											2026-03-07 14:12:38 +08:00
+								func TestOpenAIBuildUpstreamRequestOAuthOfficialClientOriginatorCompatibility(t *testing.T) {
 									gin.SetMode(gin.TestMode)
 									tests := []struct {
 										name           string
 										userAgent      string
 										originator     string
 										wantOriginator string
 									}{
 										{name: "desktop originator preserved", originator: "Codex Desktop", wantOriginator: "Codex Desktop"},
 										{name: "vscode originator preserved", originator: "codex_vscode", wantOriginator: "codex_vscode"},
 										{name: "official ua fallback to codex_cli_rs", userAgent: "Codex Desktop/1.2.3", wantOriginator: "codex_cli_rs"},
 									}
 									for _, tt := range tests {
 										t.Run(tt.name, func(t *testing.T) {
 											rec := httptest.NewRecorder()
 											c, _ := gin.CreateTestContext(rec)
 											c.Request = httptest.NewRequest(http.MethodPost, "/v1/responses", bytes.NewReader([]byte(`{"model":"gpt-5"}`)))
 											if tt.userAgent != "" {
 												c.Request.Header.Set("User-Agent", tt.userAgent)
 											}
 											if tt.originator != "" {
 												c.Request.Header.Set("originator", tt.originator)
 											}
 											svc := &OpenAIGatewayService{}
 											account := &Account{
 												Type:        AccountTypeOAuth,
 												Credentials: map[string]any{"chatgpt_account_id": "chatgpt-acc"},
 											}
 											isCodexCLI := openai.IsCodexOfficialClientByHeaders(c.GetHeader("User-Agent"), c.GetHeader("originator"))
 											req, err := svc.buildUpstreamRequest(c.Request.Context(), c, account, []byte(`{"model":"gpt-5"}`), "token", false, "", isCodexCLI)
 											require.NoError(t, err)
 											require.Equal(t, tt.wantOriginator, req.Header.Get("originator"))
 										})
 									}
 								}
-												perf(service): 优化 model 替换函数，用 gjson/sjson 替代全量 JSON 序列化

SSE 热路径中 replaceModelInSSELine 和 replaceModelInResponseBody 原来
使用 json.Unmarshal/Marshal 对每个事件做全量反序列化再序列化，现改为
gjson.Get/sjson.Set 精确字段操作，消除 O(n) 中间 map 分配，保持 JSON
字段顺序不变。涉及 OpenAIGatewayService 和 GatewayService 两个服务。

新增 23 个单元测试覆盖：顶层/嵌套 model 替换、不匹配跳过、空行/[DONE]/
非法 JSON 等边界情况。

Fixes: P1-08

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-07 17:09:55 +08:00
+								// ==================== P1-08 修复：model 替换性能优化测试 ====================
-												fix(openai): restore ws usage window display

											
										
										
											2026-03-06 20:46:10 +08:00
+								// ==================== P1-08 修复：model 替换性能优化测试 =============
-												perf(service): 优化 model 替换函数，用 gjson/sjson 替代全量 JSON 序列化

SSE 热路径中 replaceModelInSSELine 和 replaceModelInResponseBody 原来
使用 json.Unmarshal/Marshal 对每个事件做全量反序列化再序列化，现改为
gjson.Get/sjson.Set 精确字段操作，消除 O(n) 中间 map 分配，保持 JSON
字段顺序不变。涉及 OpenAIGatewayService 和 GatewayService 两个服务。

新增 23 个单元测试覆盖：顶层/嵌套 model 替换、不匹配跳过、空行/[DONE]/
非法 JSON 等边界情况。

Fixes: P1-08

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-02-07 17:09:55 +08:00
+								func TestReplaceModelInSSELine(t *testing.T) {
 									// Table-driven check of replaceModelInSSELine: every case supplies one SSE
 									// line plus a from/to model pair and the exact line expected back.
 									svc := &OpenAIGatewayService{}
 									cases := []struct {
 										name     string
 										line     string
 										from     string
 										to       string
 										expected string
 									}{
 										{
 											name:     "顶层 model 字段替换",
 											line:     `data: {"id":"chatcmpl-123","model":"gpt-4o","choices":[]}`,
 											from:     "gpt-4o",
 											to:       "my-custom-model",
 											expected: `data: {"id":"chatcmpl-123","model":"my-custom-model","choices":[]}`,
 										},
 										{
 											name:     "嵌套 response.model 替换",
 											line:     `data: {"type":"response","response":{"id":"resp-1","model":"gpt-4o","output":[]}}`,
 											from:     "gpt-4o",
 											to:       "my-model",
 											expected: `data: {"type":"response","response":{"id":"resp-1","model":"my-model","output":[]}}`,
 										},
 										{
 											name:     "model 不匹配时不替换",
 											line:     `data: {"id":"chatcmpl-123","model":"gpt-3.5-turbo","choices":[]}`,
 											from:     "gpt-4o",
 											to:       "my-model",
 											expected: `data: {"id":"chatcmpl-123","model":"gpt-3.5-turbo","choices":[]}`,
 										},
 										{
 											name:     "无 model 字段时不替换",
 											line:     `data: {"id":"chatcmpl-123","choices":[]}`,
 											from:     "gpt-4o",
 											to:       "my-model",
 											expected: `data: {"id":"chatcmpl-123","choices":[]}`,
 										},
 										{
 											name:     "空 data 行",
 											line:     `data: `,
 											from:     "gpt-4o",
 											to:       "my-model",
 											expected: `data: `,
 										},
 										{
 											name:     "[DONE] 行",
 											line:     `data: [DONE]`,
 											from:     "gpt-4o",
 											to:       "my-model",
 											expected: `data: [DONE]`,
 										},
 										{
 											name:     "非 data: 前缀行",
 											line:     `event: message`,
 											from:     "gpt-4o",
 											to:       "my-model",
 											expected: `event: message`,
 										},
 										{
 											name:     "非法 JSON 不替换",
 											line:     `data: {invalid json}`,
 											from:     "gpt-4o",
 											to:       "my-model",
 											expected: `data: {invalid json}`,
 										},
 										{
 											// The expected output carries a space after "data:" even though
 											// the input does not.
 											name:     "无空格 data: 格式",
 											line:     `data:{"id":"x","model":"gpt-4o"}`,
 											from:     "gpt-4o",
 											to:       "my-model",
 											expected: `data: {"id":"x","model":"my-model"}`,
 										},
 										{
 											name:     "model 名含特殊字符",
 											line:     `data: {"model":"org/model-v2.1-beta"}`,
 											from:     "org/model-v2.1-beta",
 											to:       "custom/alias",
 											expected: `data: {"model":"custom/alias"}`,
 										},
 										{
 											name:     "空行",
 											line:     "",
 											from:     "gpt-4o",
 											to:       "my-model",
 											expected: "",
 										},
 										{
 											name:     "保持其他字段不变",
 											line:     `data: {"id":"abc","object":"chat.completion.chunk","model":"gpt-4o","created":1234567890,"choices":[{"index":0,"delta":{"content":"hi"}}]}`,
 											from:     "gpt-4o",
 											to:       "alias",
 											expected: `data: {"id":"abc","object":"chat.completion.chunk","model":"alias","created":1234567890,"choices":[{"index":0,"delta":{"content":"hi"}}]}`,
 										},
 										{
 											// Only the top-level model is expected to change when both exist.
 											name:     "顶层优先于嵌套：同时存在两个 model",
 											line:     `data: {"model":"gpt-4o","response":{"model":"gpt-4o"}}`,
 											from:     "gpt-4o",
 											to:       "replaced",
 											expected: `data: {"model":"replaced","response":{"model":"gpt-4o"}}`,
 										},
 									}
 									for _, tc := range cases {
 										t.Run(tc.name, func(t *testing.T) {
 											rewritten := svc.replaceModelInSSELine(tc.line, tc.from, tc.to)
 											require.Equal(t, tc.expected, rewritten)
 										})
 									}
 								}
 								// TestReplaceModelInSSEBody runs replaceModelInSSEBody over whole SSE
 								// bodies and compares each result with the exact expected text.
 								func TestReplaceModelInSSEBody(t *testing.T) {
 									svc := &OpenAIGatewayService{}
 									cases := []struct {
 										name     string
 										body     string
 										from     string
 										to       string
 										expected string
 									}{
 										{
 											name:     "多行 SSE body 替换",
 											body:     "data: {\"model\":\"gpt-4o\",\"choices\":[]}\n\ndata: {\"model\":\"gpt-4o\",\"choices\":[{\"delta\":{\"content\":\"hi\"}}]}\n\ndata: [DONE]\n",
 											from:     "gpt-4o",
 											to:       "alias",
 											expected: "data: {\"model\":\"alias\",\"choices\":[]}\n\ndata: {\"model\":\"alias\",\"choices\":[{\"delta\":{\"content\":\"hi\"}}]}\n\ndata: [DONE]\n",
 										},
 										{
 											name:     "无需替换的 body",
 											body:     "data: {\"model\":\"gpt-3.5-turbo\"}\n\ndata: [DONE]\n",
 											from:     "gpt-4o",
 											to:       "alias",
 											expected: "data: {\"model\":\"gpt-3.5-turbo\"}\n\ndata: [DONE]\n",
 										},
 										{
 											name:     "混合 event 和 data 行",
 											body:     "event: message\ndata: {\"model\":\"gpt-4o\"}\n\n",
 											from:     "gpt-4o",
 											to:       "alias",
 											expected: "event: message\ndata: {\"model\":\"alias\"}\n\n",
 										},
 										{
 											name:     "空 body",
 											body:     "",
 											from:     "gpt-4o",
 											to:       "alias",
 											expected: "",
 										},
 									}
 									for _, tc := range cases {
 										t.Run(tc.name, func(t *testing.T) {
 											rewritten := svc.replaceModelInSSEBody(tc.body, tc.from, tc.to)
 											require.Equal(t, tc.expected, rewritten)
 										})
 									}
 								}
 								// TestReplaceModelInResponseBody runs replaceModelInResponseBody over JSON
 								// and non-JSON bodies and compares the returned bytes, as a string, with
 								// the exact expected text.
 								func TestReplaceModelInResponseBody(t *testing.T) {
 									svc := &OpenAIGatewayService{}
 									cases := []struct {
 										name     string
 										body     string
 										from     string
 										to       string
 										expected string
 									}{
 										{
 											name:     "替换顶层 model",
 											body:     `{"id":"chatcmpl-123","model":"gpt-4o","choices":[]}`,
 											from:     "gpt-4o",
 											to:       "alias",
 											expected: `{"id":"chatcmpl-123","model":"alias","choices":[]}`,
 										},
 										{
 											name:     "model 不匹配不替换",
 											body:     `{"id":"chatcmpl-123","model":"gpt-3.5-turbo","choices":[]}`,
 											from:     "gpt-4o",
 											to:       "alias",
 											expected: `{"id":"chatcmpl-123","model":"gpt-3.5-turbo","choices":[]}`,
 										},
 										{
 											name:     "无 model 字段不替换",
 											body:     `{"id":"chatcmpl-123","choices":[]}`,
 											from:     "gpt-4o",
 											to:       "alias",
 											expected: `{"id":"chatcmpl-123","choices":[]}`,
 										},
 										{
 											name:     "非法 JSON 返回原值",
 											body:     `not json`,
 											from:     "gpt-4o",
 											to:       "alias",
 											expected: `not json`,
 										},
 										{
 											name:     "空 body 返回原值",
 											body:     ``,
 											from:     "gpt-4o",
 											to:       "alias",
 											expected: ``,
 										},
 										{
 											name:     "保持嵌套结构不变",
 											body:     `{"model":"gpt-4o","usage":{"prompt_tokens":10,"completion_tokens":20},"choices":[{"message":{"role":"assistant","content":"hello"}}]}`,
 											from:     "gpt-4o",
 											to:       "alias",
 											expected: `{"model":"alias","usage":{"prompt_tokens":10,"completion_tokens":20},"choices":[{"message":{"role":"assistant","content":"hello"}}]}`,
 										},
 									}
 									for _, tc := range cases {
 										t.Run(tc.name, func(t *testing.T) {
 											rewritten := svc.replaceModelInResponseBody([]byte(tc.body), tc.from, tc.to)
 											require.Equal(t, tc.expected, string(rewritten))
 										})
 									}
 								}
-												feat(openai): 极致优化 OAuth 链路并补齐性能守护

- 优化 /v1/responses 热路径，减少重复解析与不必要拷贝\n- 优化并发与 token 竞争路径并补齐运行指标\n- 补充 OpenAI/Ops 相关单元测试与回归用例\n- 新增灰度阈值守护与压测脚本，支撑发布验收

											
										
										
											2026-02-12 09:41:37 +08:00
 								// TestExtractOpenAISSEDataLine checks the (data, ok) pair returned by
 								// extractOpenAISSEDataLine for "data:" lines with and without a space, a
 								// whitespace-only payload, and a non-data line.
 								func TestExtractOpenAISSEDataLine(t *testing.T) {
 									cases := []struct {
 										name     string
 										line     string
 										wantData string
 										wantOK   bool
 									}{
 										{name: "标准格式", line: `data: {"type":"x"}`, wantData: `{"type":"x"}`, wantOK: true},
 										{name: "无空格格式", line: `data:{"type":"x"}`, wantData: `{"type":"x"}`, wantOK: true},
 										{name: "纯空数据", line: `data:   `, wantData: ``, wantOK: true},
 										{name: "非 data 行", line: `event: message`, wantData: ``, wantOK: false},
 									}
 									for _, tc := range cases {
 										t.Run(tc.name, func(t *testing.T) {
 											payload, matched := extractOpenAISSEDataLine(tc.line)
 											require.Equal(t, tc.wantOK, matched)
 											require.Equal(t, tc.wantData, payload)
 										})
 									}
 								}
 								// TestParseSSEUsage_SelectiveParsing checks that parseSSEUsage leaves a
 								// pre-filled usage struct untouched for a response.in_progress event and
 								// overwrites it from a response.completed event.
 								func TestParseSSEUsage_SelectiveParsing(t *testing.T) {
 									svc := &OpenAIGatewayService{}
 									usage := &OpenAIUsage{InputTokens: 9, OutputTokens: 8, CacheReadInputTokens: 7}
 									requireUsage := func(input, output, cached int) {
 										require.Equal(t, input, usage.InputTokens)
 										require.Equal(t, output, usage.OutputTokens)
 										require.Equal(t, cached, usage.CacheReadInputTokens)
 									}
 									// A non-completed event must not overwrite usage.
 									svc.parseSSEUsage(`{"type":"response.in_progress","response":{"usage":{"input_tokens":1,"output_tokens":2}}}`, usage)
 									requireUsage(9, 8, 7)
 									// A completed event should have its usage extracted.
 									svc.parseSSEUsage(`{"type":"response.completed","response":{"usage":{"input_tokens":3,"output_tokens":5,"input_tokens_details":{"cached_tokens":2}}}}`, usage)
 									requireUsage(3, 5, 2)
 								}
 								// TestExtractCodexFinalResponse_SampleReplay replays a small SSE transcript
 								// and checks that extractCodexFinalResponse returns a payload containing
 								// the response id and the input token count from the completed event.
 								func TestExtractCodexFinalResponse_SampleReplay(t *testing.T) {
 									sseLines := []string{
 										`event: message`,
 										`data: {"type":"response.in_progress","response":{"id":"resp_1"}}`,
 										`data: {"type":"response.completed","response":{"id":"resp_1","model":"gpt-4o","usage":{"input_tokens":11,"output_tokens":22,"input_tokens_details":{"cached_tokens":3}}}}`,
 										`data: [DONE]`,
 									}
 									transcript := strings.Join(sseLines, "\n")
 									finalResp, found := extractCodexFinalResponse(transcript)
 									require.True(t, found)
 									finalText := string(finalResp)
 									require.Contains(t, finalText, `"id":"resp_1"`)
 									require.Contains(t, finalText, `"input_tokens":11`)
 								}
 								// TestHandleOAuthSSEToJSON_CompletedEventReturnsJSON passes an SSE body
 								// that contains a response.completed event to handleOAuthSSEToJSON and
 								// checks the returned usage counters and that the written body holds the
 								// response JSON without SSE framing.
 								func TestHandleOAuthSSEToJSON_CompletedEventReturnsJSON(t *testing.T) {
 									gin.SetMode(gin.TestMode)
 									recorder := httptest.NewRecorder()
 									ginCtx, _ := gin.CreateTestContext(recorder)
 									ginCtx.Request = httptest.NewRequest(http.MethodPost, "/", nil)
 									svc := &OpenAIGatewayService{cfg: &config.Config{}}
 									upstream := &http.Response{
 										StatusCode: http.StatusOK,
 										Header:     http.Header{"Content-Type": []string{"text/event-stream"}},
 									}
 									sseLines := []string{
 										`data: {"type":"response.in_progress","response":{"id":"resp_2"}}`,
 										`data: {"type":"response.completed","response":{"id":"resp_2","model":"gpt-4o","usage":{"input_tokens":7,"output_tokens":9,"input_tokens_details":{"cached_tokens":1}}}}`,
 										`data: [DONE]`,
 									}
 									sseBody := []byte(strings.Join(sseLines, "\n"))
 									usage, err := svc.handleOAuthSSEToJSON(upstream, ginCtx, sseBody, "gpt-4o", "gpt-4o")
 									require.NoError(t, err)
 									require.NotNil(t, usage)
 									require.Equal(t, 7, usage.InputTokens)
 									require.Equal(t, 9, usage.OutputTokens)
 									require.Equal(t, 1, usage.CacheReadInputTokens)
 									// The header may be passed through from the upstream Content-Type; what
 									// matters is that the body was converted into the final JSON response.
 									require.NotContains(t, recorder.Body.String(), "event:")
 									require.Contains(t, recorder.Body.String(), `"id":"resp_2"`)
 									require.NotContains(t, recorder.Body.String(), "data:")
 								}
 								// TestHandleOAuthSSEToJSON_NoFinalResponseKeepsSSEBody passes an SSE body
 								// with no response.completed event and checks that usage is zero and the
 								// response is still served as text/event-stream with the original data line.
 								func TestHandleOAuthSSEToJSON_NoFinalResponseKeepsSSEBody(t *testing.T) {
 									gin.SetMode(gin.TestMode)
 									recorder := httptest.NewRecorder()
 									ginCtx, _ := gin.CreateTestContext(recorder)
 									ginCtx.Request = httptest.NewRequest(http.MethodPost, "/", nil)
 									svc := &OpenAIGatewayService{cfg: &config.Config{}}
 									upstream := &http.Response{
 										StatusCode: http.StatusOK,
 										Header:     http.Header{"Content-Type": []string{"text/event-stream"}},
 									}
 									sseLines := []string{
 										`data: {"type":"response.in_progress","response":{"id":"resp_3"}}`,
 										`data: [DONE]`,
 									}
 									sseBody := []byte(strings.Join(sseLines, "\n"))
 									usage, err := svc.handleOAuthSSEToJSON(upstream, ginCtx, sseBody, "gpt-4o", "gpt-4o")
 									require.NoError(t, err)
 									require.NotNil(t, usage)
 									require.Equal(t, 0, usage.InputTokens)
 									require.Contains(t, recorder.Header().Get("Content-Type"), "text/event-stream")
 									require.Contains(t, recorder.Body.String(), `data: {"type":"response.in_progress"`)
 								}
-												fix(openai): 统一专属倍率计费链路并补齐回归测试

抽取共享的用户分组专属倍率解析器，统一缓存、singleflight 与回退逻辑。\n\n让 OpenAI 独立计费链路复用专属倍率解析，修复 usage 记录与实际扣费未命中用户专属倍率的问题。\n\n补齐 OpenAI 计费与解析器单元测试，并修复全量回归中暴露的 lint 阻塞项。\n\nCo-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

											
										
										
											2026-03-06 14:54:52 +08:00
 								// TestHandleOAuthSSEToJSON_ResponseFailedReturnsProtocolError passes an SSE
 								// body containing a response.failed event and checks that the call returns
 								// an error with nil usage, and that a 502 JSON response carrying the
 								// upstream error message is written.
 								func TestHandleOAuthSSEToJSON_ResponseFailedReturnsProtocolError(t *testing.T) {
 									gin.SetMode(gin.TestMode)
 									recorder := httptest.NewRecorder()
 									ginCtx, _ := gin.CreateTestContext(recorder)
 									ginCtx.Request = httptest.NewRequest(http.MethodPost, "/", nil)
 									svc := &OpenAIGatewayService{cfg: &config.Config{}}
 									upstream := &http.Response{
 										StatusCode: http.StatusOK,
 										Header:     http.Header{"Content-Type": []string{"text/event-stream"}},
 									}
 									sseLines := []string{
 										`data: {"type":"response.failed","error":{"message":"upstream rejected request"}}`,
 										`data: [DONE]`,
 									}
 									sseBody := []byte(strings.Join(sseLines, "\n"))
 									usage, err := svc.handleOAuthSSEToJSON(upstream, ginCtx, sseBody, "gpt-4o", "gpt-4o")
 									require.Nil(t, usage)
 									require.Error(t, err)
 									require.Equal(t, http.StatusBadGateway, recorder.Code)
 									require.Contains(t, recorder.Body.String(), "upstream rejected request")
 									require.Contains(t, recorder.Header().Get("Content-Type"), "application/json")
 								}