refactor: remove max_context_load_time and max_context_tokens from bot settings

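These two fields controlled the time-based history context window and token-based history trimming, respectively. They are no longer needed — the resolver now always uses the hardcoded 24-hour default and skips token-based history trimming. The per-request `max_context_load_time` override on ChatRequest is removed as well, so a negative value can no longer be used to skip history loading.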
2026-04-27 07:16:19 +09:00 · 2026-03-29 00:00:10 +08:00
parent 90ac222bc9
commit 0730ff2945
25 changed files with 176 additions and 388 deletions
@@ -153,8 +153,6 @@ func (r *Resolver) resolve(ctx context.Context, req conversation.ChatRequest) (r
 		return resolvedContext{}, errors.New("chat id is required")
 	}

-	skipHistory := req.MaxContextLoadTime < 0
-
 	botSettings, err := r.loadBotSettings(ctx, req.BotID)
 	if err != nil {
 		return resolvedContext{}, err
@@ -176,55 +174,23 @@ func (r *Resolver) resolve(ctx context.Context, req conversation.ChatRequest) (r
 	}
 	clientType := provider.ClientType

-	maxCtx := coalescePositiveInt(req.MaxContextLoadTime, botSettings.MaxContextLoadTime, defaultMaxContextMinutes)
-	maxTokens := botSettings.MaxContextTokens
-
 	memoryMsg := r.loadMemoryContextMessage(ctx, req)
 	reqMessages := pruneMessagesForGateway(nonNilModelMessages(req.Messages))
 	if memoryMsg != nil {
 		pruned, _ := pruneMessageForGateway(*memoryMsg)
 		memoryMsg = &pruned
 	}
-	var overhead int
-	if memoryMsg != nil {
-		overhead += estimateMessageTokens(*memoryMsg)
-	}
-	for _, m := range reqMessages {
-		overhead += estimateMessageTokens(m)
-	}
-	const systemPromptReserve = 4096
-	overhead += systemPromptReserve
-
-	historyBudget := maxTokens - overhead
-	if maxTokens > 0 && historyBudget <= 0 {
-		historyBudget = 1
-	} else if historyBudget < 0 {
-		historyBudget = 0
-	}
-
-	r.logger.Debug("context token budget",
-		slog.Int("max_tokens", maxTokens),
-		slog.Int("overhead", overhead),
-		slog.Int("system_prompt_reserve", systemPromptReserve),
-		slog.Int("history_budget", historyBudget),
-	)

 	var messages []conversation.ModelMessage
-	if !skipHistory && r.conversationSvc != nil {
-		loaded, loadErr := r.loadMessages(ctx, req.ChatID, req.SessionID, maxCtx)
+	if r.conversationSvc != nil {
+		loaded, loadErr := r.loadMessages(ctx, req.ChatID, req.SessionID, defaultMaxContextMinutes)
 		if loadErr != nil {
 			return resolvedContext{}, loadErr
 		}
 		loaded = pruneHistoryForGateway(loaded)
 		loaded = dedupePersistedCurrentUserMessage(loaded, req)
 		loaded = r.replaceCompactedMessages(ctx, loaded)
-		messages = trimMessagesByTokens(r.logger, loaded, historyBudget)
-		r.logger.Debug("context trim result",
-			slog.Int("loaded_messages", len(loaded)),
-			slog.Int("kept_messages", len(messages)),
-			slog.Int("trimmed_messages", len(loaded)-len(messages)),
-			slog.Int("history_budget", historyBudget),
-		)
+		messages = trimMessagesByTokens(r.logger, loaded, 0)
 	}
 	if memoryMsg != nil {
 		messages = append(messages, *memoryMsg)
@@ -153,15 +153,6 @@ func decodeIndexedByteObject(raw json.RawMessage) ([]byte, bool) {
 	return out, true
 }

-func coalescePositiveInt(values ...int) int {
-	for _, v := range values {
-		if v > 0 {
-			return v
-		}
-	}
-	return defaultMaxContextMinutes
-}
-
 func nonNilModelMessages(m []conversation.ModelMessage) []conversation.ModelMessage {
 	if m == nil {
 		return []conversation.ModelMessage{}
@@ -241,14 +241,13 @@ type ChatRequest struct {
 	// Set by the inbound channel processor; called by the resolver at persist time.
 	OutboundAssetCollector func() []OutboundAssetRef `json:"-"`

-	Query              string           `json:"query"`
-	Model              string           `json:"model,omitempty"`
-	Provider           string           `json:"provider,omitempty"`
-	MaxContextLoadTime int              `json:"max_context_load_time,omitempty"`
-	Channels           []string         `json:"channels,omitempty"`
-	CurrentChannel     string           `json:"current_channel,omitempty"`
-	Messages           []ModelMessage   `json:"messages,omitempty"`
-	Attachments        []ChatAttachment `json:"attachments,omitempty"`
+	Query          string           `json:"query"`
+	Model          string           `json:"model,omitempty"`
+	Provider       string           `json:"provider,omitempty"`
+	Channels       []string         `json:"channels,omitempty"`
+	CurrentChannel string           `json:"current_channel,omitempty"`
+	Messages       []ModelMessage   `json:"messages,omitempty"`
+	Attachments    []ChatAttachment `json:"attachments,omitempty"`
 }

 // ChatResponse is the output of a non-streaming chat call.