优化上下文

This commit is contained in:
2026-06-10 18:00:58 +08:00
parent d9ba14e28b
commit 74268a8a07
6 changed files with 180 additions and 66 deletions
+86 -6
View File
@@ -180,12 +180,13 @@ func handleOpenAIProfiles(ctx *gin.Context) {
active = profile.Name
}
profiles = append(profiles, map[string]interface{}{
"name": profile.Name,
"active": profile.Active,
"baseUrl": profile.BaseUrl,
"model": profile.Model,
"timeout": profile.Timeout,
"maxTokens": profile.MaxTokens,
"name": profile.Name,
"active": profile.Active,
"baseUrl": profile.BaseUrl,
"model": profile.Model,
"timeout": profile.Timeout,
"maxTokens": profile.MaxTokens,
"contextWindowTokens": profile.ContextWindowTokens,
})
}
ReturnJson(ctx, "apiOK", gin.H{
@@ -317,6 +318,17 @@ func handleChat(ctx *gin.Context) {
apiReq.Messages = append([]openaiMessage{{Role: "system", Content: profile.SystemPrompt}}, apiReq.Messages...)
}
trimmedMessages, trimStats := trimOpenAIMessagesToContextWindow(apiReq.Messages, profile.ContextWindowTokens)
apiReq.Messages = trimmedMessages
if trimStats.RemovedMessages > 0 {
emitTrace("model", "context_window", "success", "上下文窗口已裁剪旧消息", map[string]interface{}{
"limit": trimStats.Limit,
"before_tokens": trimStats.BeforeTokens,
"after_tokens": trimStats.AfterTokens,
"removed_messages": trimStats.RemovedMessages,
})
}
modelPromptTokens := estimateOpenAIMessagesTokens(apiReq.Messages)
completionTokens := 0
modelUsageReceived := false
@@ -603,6 +615,74 @@ func normalizeImageDataURI(raw string) (string, error) {
return "data:" + mimeType + ";base64," + payload, nil
}
// contextWindowTrimStats summarizes the outcome of one context-window
// trimming pass over a chat prompt.
type contextWindowTrimStats struct {
	// Enabled reports whether a positive token limit was supplied.
	Enabled bool
	// Limit is the token limit the pass was asked to honor.
	Limit int
	// BeforeTokens is the estimated prompt size before any message was removed.
	BeforeTokens int
	// AfterTokens is the estimated prompt size once the pass finished.
	AfterTokens int
	// RemovedMessages counts the messages removed by the pass.
	RemovedMessages int
}
// trimOpenAIMessagesToContextWindow removes messages from the front of the
// conversation until the estimated prompt size fits within maxTokens.
//
// Parameters:
//   - messages: the prompt to trim; lower indexes are removed first, so the
//     slice is assumed to be ordered oldest to newest.
//   - maxTokens: the token budget; zero or a negative value disables trimming.
//
// It returns the (possibly shortened) prompt together with statistics about
// the pass. When trimming is disabled or messages is empty the input slice is
// returned as-is; otherwise the work happens on a copy and the caller's slice
// is left untouched.
//
// Trimming rules:
//   - "system" messages and the most recent "user" message are never removed.
//   - A removed "user" message takes the "assistant" reply directly after it
//     along, so a question/answer pair leaves together.
//   - "tool" messages directly following the removed span are removed as
//     well. Everything ahead of the span is either a "system" message or the
//     latest "user" message, so such tool results would no longer follow the
//     assistant message that requested them, and OpenAI-compatible APIs
//     reject a prompt shaped like that.
//   - If nothing removable is left, the prompt is returned even though it is
//     still over budget (AfterTokens > Limit in the returned stats).
func trimOpenAIMessagesToContextWindow(messages []openaiMessage, maxTokens int) ([]openaiMessage, contextWindowTrimStats) {
	stats := contextWindowTrimStats{Enabled: maxTokens > 0, Limit: maxTokens}
	if maxTokens <= 0 || len(messages) == 0 {
		stats.BeforeTokens = estimateOpenAIMessagesTokens(messages)
		stats.AfterTokens = stats.BeforeTokens
		return messages, stats
	}

	// Work on a private copy: the in-place deletions below must not disturb
	// the caller's backing array.
	result := append([]openaiMessage(nil), messages...)
	stats.BeforeTokens = estimateOpenAIMessagesTokens(result)
	stats.AfterTokens = stats.BeforeTokens

	for stats.AfterTokens > maxTokens {
		latestUserIndex := latestUserMessageIndex(result)

		// Pick the first message that is neither a system prompt nor the
		// latest user message.
		removeIndex := -1
		for i := range result {
			if i == latestUserIndex || result[i].Role == "system" {
				continue
			}
			removeIndex = i
			break
		}
		if removeIndex == -1 {
			// Only protected messages remain; nothing more can be dropped.
			break
		}

		// end is the exclusive upper bound of the span being removed.
		end := removeIndex + 1
		// An "assistant" message can never be the latest user message, so no
		// extra index check is needed before pairing it with its question.
		if result[removeIndex].Role == "user" && end < len(result) && result[end].Role == "assistant" {
			end++
		}
		// Do not leave tool results behind without the assistant message
		// that issued the matching tool calls.
		for end < len(result) && result[end].Role == "tool" {
			end++
		}

		result = append(result[:removeIndex], result[end:]...)
		stats.RemovedMessages += end - removeIndex
		stats.AfterTokens = estimateOpenAIMessagesTokens(result)
	}
	return result, stats
}
// latestUserMessageIndex scans messages from the end and returns the index of
// the last entry whose Role is "user", or -1 when there is none.
func latestUserMessageIndex(messages []openaiMessage) int {
	pos := len(messages)
	for pos > 0 {
		pos--
		if messages[pos].Role == "user" {
			return pos
		}
	}
	return -1
}
type tokenUsageTracker struct {
promptTokens int
completionTokens int
+66 -52
View File
@@ -18,18 +18,19 @@ type TabAIChatSetting struct {
}
// TabAIChatOpenAIProfile is the GORM model for one stored OpenAI-compatible
// endpoint profile used by the AI chat feature.
type TabAIChatOpenAIProfile struct {
	// ID is the auto-incremented primary key.
	ID uint `gorm:"primaryKey;autoIncrement"`
	// Name identifies the profile; it is required and unique.
	Name string `gorm:"size:100;not null;uniqueIndex"`
	// Active marks the profile that is currently selected.
	Active bool `gorm:"default:false;index"`
	// ApiKey is the credential sent to the endpoint.
	ApiKey string `gorm:"type:text"`
	// BaseUrl is the endpoint's base URL.
	BaseUrl string `gorm:"size:500"`
	// Model is the model identifier requested from the endpoint.
	Model string `gorm:"size:200"`
	// Timeout is the request timeout (column default 120; presumably seconds — confirm).
	Timeout int `gorm:"default:120"`
	// MaxTokens is the completion token cap (column default 4096).
	MaxTokens int `gorm:"default:4096"`
	// ContextWindowTokens is the prompt token budget used when trimming chat
	// history; 0 (the column default) leaves the history untrimmed.
	ContextWindowTokens int `gorm:"default:0"`
	// SystemPrompt is the system message configured for the profile.
	SystemPrompt string `gorm:"type:text"`
	// SortOrder is the profile's position in the configured list.
	SortOrder int `gorm:"default:0;index"`
	// CreatedAt is filled in by GORM when the row is created.
	CreatedAt *time.Time `gorm:"type:datetime;autoCreateTime"`
	// UpdatedAt is refreshed by GORM whenever the row is updated.
	UpdatedAt *time.Time `gorm:"type:datetime;autoUpdateTime"`
}
type TabAIChatToolRouter struct {
@@ -120,12 +121,13 @@ func seedAIChatConfigFromYAMLIfEmpty() error {
profiles := cfg.OpenAI
if len(profiles) == 0 {
profiles = []models.ConfigsAIChatOpenAI_{{
Name: "default",
Active: true,
BaseUrl: "https://ark.cn-beijing.volces.com/api/v3",
Timeout: 120,
MaxTokens: 4096,
SystemPrompt: "你是一个有帮助的 AI 助手。",
Name: "default",
Active: true,
BaseUrl: "https://ark.cn-beijing.volces.com/api/v3",
Timeout: 120,
MaxTokens: 4096,
ContextWindowTokens: 0,
SystemPrompt: "你是一个有帮助的 AI 助手。",
}}
}
for i, profile := range profiles {
@@ -139,15 +141,16 @@ func seedAIChatConfigFromYAMLIfEmpty() error {
profile.MaxTokens = 4096
}
if err := tx.Create(&TabAIChatOpenAIProfile{
Name: profile.Name,
Active: profile.Active,
ApiKey: profile.ApiKey,
BaseUrl: profile.BaseUrl,
Model: profile.Model,
Timeout: profile.Timeout,
MaxTokens: profile.MaxTokens,
SystemPrompt: profile.SystemPrompt,
SortOrder: i,
Name: profile.Name,
Active: profile.Active,
ApiKey: profile.ApiKey,
BaseUrl: profile.BaseUrl,
Model: profile.Model,
Timeout: profile.Timeout,
MaxTokens: profile.MaxTokens,
ContextWindowTokens: nonNegativeInt(profile.ContextWindowTokens),
SystemPrompt: profile.SystemPrompt,
SortOrder: i,
}).Error; err != nil {
return err
}
@@ -232,14 +235,15 @@ func RefreshAIChatConfigCache() error {
for _, profile := range profiles {
cfg.OpenAI = append(cfg.OpenAI, models.ConfigsAIChatOpenAI_{
Name: profile.Name,
Active: profile.Active,
ApiKey: profile.ApiKey,
BaseUrl: profile.BaseUrl,
Model: profile.Model,
Timeout: defaultInt(profile.Timeout, 120),
MaxTokens: defaultInt(profile.MaxTokens, 4096),
SystemPrompt: profile.SystemPrompt,
Name: profile.Name,
Active: profile.Active,
ApiKey: profile.ApiKey,
BaseUrl: profile.BaseUrl,
Model: profile.Model,
Timeout: defaultInt(profile.Timeout, 120),
MaxTokens: defaultInt(profile.MaxTokens, 4096),
ContextWindowTokens: nonNegativeInt(profile.ContextWindowTokens),
SystemPrompt: profile.SystemPrompt,
})
}
for _, tool := range tools {
@@ -269,6 +273,13 @@ func defaultInt(value int, fallback int) int {
return value
}
// nonNegativeInt clamps value to the range [0, +inf): negative inputs become
// 0 and every other input is returned unchanged.
func nonNegativeInt(value int) int {
	if value >= 0 {
		return value
	}
	return 0
}
func handleAIChatAdminGetConfig(ctx *gin.Context) {
if ok, _ := requireSysAdmin(ctx); !ok {
return
@@ -357,6 +368,7 @@ func saveAIChatConfig(req models.ConfigsAIChat_) error {
if profile.MaxTokens <= 0 {
profile.MaxTokens = 4096
}
profile.ContextWindowTokens = nonNegativeInt(profile.ContextWindowTokens)
if profile.Active {
if activeSet {
profile.Active = false
@@ -366,15 +378,16 @@ func saveAIChatConfig(req models.ConfigsAIChat_) error {
}
tab := TabAIChatOpenAIProfile{
Name: profile.Name,
Active: profile.Active,
ApiKey: profile.ApiKey,
BaseUrl: profile.BaseUrl,
Model: profile.Model,
Timeout: profile.Timeout,
MaxTokens: profile.MaxTokens,
SystemPrompt: profile.SystemPrompt,
SortOrder: i,
Name: profile.Name,
Active: profile.Active,
ApiKey: profile.ApiKey,
BaseUrl: profile.BaseUrl,
Model: profile.Model,
Timeout: profile.Timeout,
MaxTokens: profile.MaxTokens,
ContextWindowTokens: profile.ContextWindowTokens,
SystemPrompt: profile.SystemPrompt,
SortOrder: i,
}
if old, ok := existingByName[profile.Name]; ok {
tab.ID = old.ID
@@ -447,14 +460,15 @@ func maskAIChatProfiles(profiles []models.ConfigsAIChatOpenAI_) []gin.H {
items := make([]gin.H, 0, len(profiles))
for _, profile := range profiles {
items = append(items, gin.H{
"name": profile.Name,
"active": profile.Active,
"apiKeySet": profile.ApiKey != "",
"baseUrl": profile.BaseUrl,
"model": profile.Model,
"timeout": profile.Timeout,
"maxTokens": profile.MaxTokens,
"systemPrompt": profile.SystemPrompt,
"name": profile.Name,
"active": profile.Active,
"apiKeySet": profile.ApiKey != "",
"baseUrl": profile.BaseUrl,
"model": profile.Model,
"timeout": profile.Timeout,
"maxTokens": profile.MaxTokens,
"contextWindowTokens": profile.ContextWindowTokens,
"systemPrompt": profile.SystemPrompt,
})
}
return items