mirror of
https://github.com/sipeed/picoclaw.git
synced 2026-06-12 18:08:54 +00:00
e414b82ac3
* fix(cron): publish agent response to outbound bus for cron-triggered jobs
When a cron job triggers agent execution via ProcessDirectWithChannel,
the agent response was silently discarded — the code assumed AgentLoop
would auto-publish it, but SendResponse is false on this path.
Delegate to PublishResponseIfNeeded (exported from AgentLoop) so the
response reaches the originating channel (e.g. Telegram) only when the
message tool did not already deliver content in the same round.
Also adds a "directive" message type to CronPayload, allowing cron jobs
to instruct the agent to execute a task rather than echo static text.
* fix(cron): add type validation and directive test coverage
Address reviewer blocking feedback:
1. Server-side whitelist for `type` parameter — the `enum` in
Parameters() is only an LLM schema hint; any string was persisted.
Now `addJob` rejects values other than "message" and "directive".
2. Comprehensive test coverage for the directive code path:
- directive adds prompt prefix to ProcessDirectWithChannel
- deliver=true + directive routes through agent (not direct publish)
- directive prompt content, sessionKey, channel, chatID are correct
- invalid type is rejected; valid types ("", "message", "directive") pass
- deliver=true message type goes directly to bus (regression)
- agent error path does not trigger publish (regression)
Also merge the two UpdateJob calls in addJob into one to avoid
redundant disk I/O (non-blocking suggestion from review).
* fix(cron): remove omitempty from CronPayload.Type for consistent JSON
Empty string and "message" are semantically equivalent defaults;
always serializing the field avoids asymmetric JSON output.
* test(cron): remove redundant test, strengthen error path coverage
- Remove ExecuteJobDirectivePassesCorrectContent: its assertions on
sessionKey/channel/chatID duplicate ExecuteJobPublishesAgentResponse;
its prompt check duplicates DirectiveAddsPromptPrefix.
- Strengthen DirectiveAddsPromptPrefix with exact prompt match and
publish response assertion.
- Fix ReturnsErrorWithoutPublish: set non-empty stub response so the
test verifies the error branch early-return, not the response==""
guard.
* fix(ci): satisfy golines and gosmopolitan in cron code
3586 lines
106 KiB
Go
3586 lines
106 KiB
Go
// PicoClaw - Ultra-lightweight personal AI agent
|
|
// Inspired by and based on nanobot: https://github.com/HKUDS/nanobot
|
|
// License: MIT
|
|
//
|
|
// Copyright (c) 2026 PicoClaw contributors
|
|
|
|
package agent
|
|
|
|
import (
|
|
"context"
|
|
"encoding/json"
|
|
"errors"
|
|
"fmt"
|
|
"path/filepath"
|
|
"regexp"
|
|
"strings"
|
|
"sync"
|
|
"sync/atomic"
|
|
"time"
|
|
|
|
"github.com/sipeed/picoclaw/pkg/bus"
|
|
"github.com/sipeed/picoclaw/pkg/channels"
|
|
"github.com/sipeed/picoclaw/pkg/commands"
|
|
"github.com/sipeed/picoclaw/pkg/config"
|
|
"github.com/sipeed/picoclaw/pkg/constants"
|
|
"github.com/sipeed/picoclaw/pkg/logger"
|
|
"github.com/sipeed/picoclaw/pkg/media"
|
|
"github.com/sipeed/picoclaw/pkg/providers"
|
|
"github.com/sipeed/picoclaw/pkg/routing"
|
|
"github.com/sipeed/picoclaw/pkg/skills"
|
|
"github.com/sipeed/picoclaw/pkg/state"
|
|
"github.com/sipeed/picoclaw/pkg/tools"
|
|
"github.com/sipeed/picoclaw/pkg/utils"
|
|
"github.com/sipeed/picoclaw/pkg/voice"
|
|
)
|
|
|
|
type AgentLoop struct {
|
|
// Core dependencies
|
|
bus *bus.MessageBus
|
|
cfg *config.Config
|
|
registry *AgentRegistry
|
|
state *state.Manager
|
|
|
|
// Event system (from Incoming)
|
|
eventBus *EventBus
|
|
hooks *HookManager
|
|
|
|
// Runtime state
|
|
running atomic.Bool
|
|
summarizing sync.Map
|
|
fallback *providers.FallbackChain
|
|
channelManager *channels.Manager
|
|
mediaStore media.MediaStore
|
|
transcriber voice.Transcriber
|
|
cmdRegistry *commands.Registry
|
|
mcp mcpRuntime
|
|
hookRuntime hookRuntime
|
|
steering *steeringQueue
|
|
pendingSkills sync.Map
|
|
mu sync.RWMutex
|
|
|
|
// Concurrent turn management (from HEAD)
|
|
activeTurnStates sync.Map // key: sessionKey (string), value: *turnState
|
|
subTurnCounter atomic.Int64 // Counter for generating unique SubTurn IDs
|
|
|
|
// Turn tracking (from Incoming)
|
|
turnSeq atomic.Uint64
|
|
activeRequests sync.WaitGroup
|
|
|
|
reloadFunc func() error
|
|
}
|
|
|
|
// processOptions configures how a message is processed
|
|
type processOptions struct {
|
|
SessionKey string // Session identifier for history/context
|
|
Channel string // Target channel for tool execution
|
|
ChatID string // Target chat ID for tool execution
|
|
SenderID string // Current sender ID for dynamic context
|
|
SenderDisplayName string // Current sender display name for dynamic context
|
|
UserMessage string // User message content (may include prefix)
|
|
ForcedSkills []string // Skills explicitly requested for this message
|
|
SystemPromptOverride string // Override the default system prompt (Used by SubTurns)
|
|
Media []string // media:// refs from inbound message
|
|
InitialSteeringMessages []providers.Message // Steering messages from refactor/agent
|
|
DefaultResponse string // Response when LLM returns empty
|
|
EnableSummary bool // Whether to trigger summarization
|
|
SendResponse bool // Whether to send response via bus
|
|
SuppressToolFeedback bool // Whether to suppress inline tool feedback messages
|
|
NoHistory bool // If true, don't load session history (for heartbeat)
|
|
SkipInitialSteeringPoll bool // If true, skip the steering poll at loop start (used by Continue)
|
|
}
|
|
|
|
type continuationTarget struct {
|
|
SessionKey string
|
|
Channel string
|
|
ChatID string
|
|
}
|
|
|
|
const (
|
|
defaultResponse = "The model returned an empty response. This may indicate a provider error or token limit."
|
|
toolLimitResponse = "I've reached `max_tool_iterations` without a final response. Increase `max_tool_iterations` in config.json if this task needs more tool steps."
|
|
handledToolResponseSummary = "Requested output delivered via tool attachment."
|
|
sessionKeyAgentPrefix = "agent:"
|
|
metadataKeyAccountID = "account_id"
|
|
metadataKeyGuildID = "guild_id"
|
|
metadataKeyTeamID = "team_id"
|
|
metadataKeyParentPeerKind = "parent_peer_kind"
|
|
metadataKeyParentPeerID = "parent_peer_id"
|
|
)
|
|
|
|
func NewAgentLoop(
|
|
cfg *config.Config,
|
|
msgBus *bus.MessageBus,
|
|
provider providers.LLMProvider,
|
|
) *AgentLoop {
|
|
registry := NewAgentRegistry(cfg, provider)
|
|
|
|
// Set up shared fallback chain
|
|
cooldown := providers.NewCooldownTracker()
|
|
fallbackChain := providers.NewFallbackChain(cooldown)
|
|
|
|
// Create state manager using default agent's workspace for channel recording
|
|
defaultAgent := registry.GetDefaultAgent()
|
|
var stateManager *state.Manager
|
|
if defaultAgent != nil {
|
|
stateManager = state.NewManager(defaultAgent.Workspace)
|
|
}
|
|
|
|
eventBus := NewEventBus()
|
|
al := &AgentLoop{
|
|
bus: msgBus,
|
|
cfg: cfg,
|
|
registry: registry,
|
|
state: stateManager,
|
|
eventBus: eventBus,
|
|
summarizing: sync.Map{},
|
|
fallback: fallbackChain,
|
|
cmdRegistry: commands.NewRegistry(commands.BuiltinDefinitions()),
|
|
steering: newSteeringQueue(parseSteeringMode(cfg.Agents.Defaults.SteeringMode)),
|
|
}
|
|
al.hooks = NewHookManager(eventBus)
|
|
configureHookManagerFromConfig(al.hooks, cfg)
|
|
|
|
// Register shared tools to all agents (now that al is created)
|
|
registerSharedTools(al, cfg, msgBus, registry, provider)
|
|
|
|
return al
|
|
}
|
|
|
|
// registerSharedTools registers tools that are shared across all agents (web, message, spawn).
|
|
func registerSharedTools(
|
|
al *AgentLoop,
|
|
cfg *config.Config,
|
|
msgBus *bus.MessageBus,
|
|
registry *AgentRegistry,
|
|
provider providers.LLMProvider,
|
|
) {
|
|
allowReadPaths := buildAllowReadPatterns(cfg)
|
|
|
|
for _, agentID := range registry.ListAgentIDs() {
|
|
agent, ok := registry.GetAgent(agentID)
|
|
if !ok {
|
|
continue
|
|
}
|
|
|
|
if cfg.Tools.IsToolEnabled("web") {
|
|
searchTool, err := tools.NewWebSearchTool(tools.WebSearchToolOptions{
|
|
BraveAPIKeys: cfg.Tools.Web.Brave.APIKeys.Values(),
|
|
BraveMaxResults: cfg.Tools.Web.Brave.MaxResults,
|
|
BraveEnabled: cfg.Tools.Web.Brave.Enabled,
|
|
TavilyAPIKeys: cfg.Tools.Web.Tavily.APIKeys.Values(),
|
|
TavilyBaseURL: cfg.Tools.Web.Tavily.BaseURL,
|
|
TavilyMaxResults: cfg.Tools.Web.Tavily.MaxResults,
|
|
TavilyEnabled: cfg.Tools.Web.Tavily.Enabled,
|
|
DuckDuckGoMaxResults: cfg.Tools.Web.DuckDuckGo.MaxResults,
|
|
DuckDuckGoEnabled: cfg.Tools.Web.DuckDuckGo.Enabled,
|
|
PerplexityAPIKeys: cfg.Tools.Web.Perplexity.APIKeys.Values(),
|
|
PerplexityMaxResults: cfg.Tools.Web.Perplexity.MaxResults,
|
|
PerplexityEnabled: cfg.Tools.Web.Perplexity.Enabled,
|
|
SearXNGBaseURL: cfg.Tools.Web.SearXNG.BaseURL,
|
|
SearXNGMaxResults: cfg.Tools.Web.SearXNG.MaxResults,
|
|
SearXNGEnabled: cfg.Tools.Web.SearXNG.Enabled,
|
|
GLMSearchAPIKey: cfg.Tools.Web.GLMSearch.APIKey.String(),
|
|
GLMSearchBaseURL: cfg.Tools.Web.GLMSearch.BaseURL,
|
|
GLMSearchEngine: cfg.Tools.Web.GLMSearch.SearchEngine,
|
|
GLMSearchMaxResults: cfg.Tools.Web.GLMSearch.MaxResults,
|
|
GLMSearchEnabled: cfg.Tools.Web.GLMSearch.Enabled,
|
|
BaiduSearchAPIKey: cfg.Tools.Web.BaiduSearch.APIKey.String(),
|
|
BaiduSearchBaseURL: cfg.Tools.Web.BaiduSearch.BaseURL,
|
|
BaiduSearchMaxResults: cfg.Tools.Web.BaiduSearch.MaxResults,
|
|
BaiduSearchEnabled: cfg.Tools.Web.BaiduSearch.Enabled,
|
|
Proxy: cfg.Tools.Web.Proxy,
|
|
})
|
|
if err != nil {
|
|
logger.ErrorCF("agent", "Failed to create web search tool", map[string]any{"error": err.Error()})
|
|
} else if searchTool != nil {
|
|
agent.Tools.Register(searchTool)
|
|
}
|
|
}
|
|
if cfg.Tools.IsToolEnabled("web_fetch") {
|
|
fetchTool, err := tools.NewWebFetchToolWithProxy(
|
|
50000,
|
|
cfg.Tools.Web.Proxy,
|
|
cfg.Tools.Web.Format,
|
|
cfg.Tools.Web.FetchLimitBytes,
|
|
cfg.Tools.Web.PrivateHostWhitelist)
|
|
if err != nil {
|
|
logger.ErrorCF("agent", "Failed to create web fetch tool", map[string]any{"error": err.Error()})
|
|
} else {
|
|
agent.Tools.Register(fetchTool)
|
|
}
|
|
}
|
|
|
|
// Hardware tools (I2C, SPI) - Linux only, returns error on other platforms
|
|
if cfg.Tools.IsToolEnabled("i2c") {
|
|
agent.Tools.Register(tools.NewI2CTool())
|
|
}
|
|
if cfg.Tools.IsToolEnabled("spi") {
|
|
agent.Tools.Register(tools.NewSPITool())
|
|
}
|
|
|
|
// Message tool
|
|
if cfg.Tools.IsToolEnabled("message") {
|
|
messageTool := tools.NewMessageTool()
|
|
messageTool.SetSendCallback(func(channel, chatID, content string) error {
|
|
pubCtx, pubCancel := context.WithTimeout(context.Background(), 5*time.Second)
|
|
defer pubCancel()
|
|
return msgBus.PublishOutbound(pubCtx, bus.OutboundMessage{
|
|
Channel: channel,
|
|
ChatID: chatID,
|
|
Content: content,
|
|
})
|
|
})
|
|
agent.Tools.Register(messageTool)
|
|
}
|
|
|
|
// Send file tool (outbound media via MediaStore — store injected later by SetMediaStore)
|
|
if cfg.Tools.IsToolEnabled("send_file") {
|
|
sendFileTool := tools.NewSendFileTool(
|
|
agent.Workspace,
|
|
cfg.Agents.Defaults.RestrictToWorkspace,
|
|
cfg.Agents.Defaults.GetMaxMediaSize(),
|
|
nil,
|
|
allowReadPaths,
|
|
)
|
|
agent.Tools.Register(sendFileTool)
|
|
}
|
|
|
|
// Skill discovery and installation tools
|
|
skills_enabled := cfg.Tools.IsToolEnabled("skills")
|
|
find_skills_enable := cfg.Tools.IsToolEnabled("find_skills")
|
|
install_skills_enable := cfg.Tools.IsToolEnabled("install_skill")
|
|
if skills_enabled && (find_skills_enable || install_skills_enable) {
|
|
clawHubConfig := cfg.Tools.Skills.Registries.ClawHub
|
|
registryMgr := skills.NewRegistryManagerFromConfig(skills.RegistryConfig{
|
|
MaxConcurrentSearches: cfg.Tools.Skills.MaxConcurrentSearches,
|
|
ClawHub: skills.ClawHubConfig{
|
|
Enabled: clawHubConfig.Enabled,
|
|
BaseURL: clawHubConfig.BaseURL,
|
|
AuthToken: clawHubConfig.AuthToken.String(),
|
|
SearchPath: clawHubConfig.SearchPath,
|
|
SkillsPath: clawHubConfig.SkillsPath,
|
|
DownloadPath: clawHubConfig.DownloadPath,
|
|
Timeout: clawHubConfig.Timeout,
|
|
MaxZipSize: clawHubConfig.MaxZipSize,
|
|
MaxResponseSize: clawHubConfig.MaxResponseSize,
|
|
},
|
|
})
|
|
|
|
if find_skills_enable {
|
|
searchCache := skills.NewSearchCache(
|
|
cfg.Tools.Skills.SearchCache.MaxSize,
|
|
time.Duration(cfg.Tools.Skills.SearchCache.TTLSeconds)*time.Second,
|
|
)
|
|
agent.Tools.Register(tools.NewFindSkillsTool(registryMgr, searchCache))
|
|
}
|
|
|
|
if install_skills_enable {
|
|
agent.Tools.Register(tools.NewInstallSkillTool(registryMgr, agent.Workspace))
|
|
}
|
|
}
|
|
|
|
// Spawn and spawn_status tools share a SubagentManager.
|
|
// Construct it when either tool is enabled (both require subagent).
|
|
spawnEnabled := cfg.Tools.IsToolEnabled("spawn")
|
|
spawnStatusEnabled := cfg.Tools.IsToolEnabled("spawn_status")
|
|
if (spawnEnabled || spawnStatusEnabled) && cfg.Tools.IsToolEnabled("subagent") {
|
|
subagentManager := tools.NewSubagentManager(provider, agent.Model, agent.Workspace)
|
|
subagentManager.SetLLMOptions(agent.MaxTokens, agent.Temperature)
|
|
|
|
// Set the spawner that links into AgentLoop's turnState
|
|
subagentManager.SetSpawner(func(
|
|
ctx context.Context,
|
|
task, label, targetAgentID string,
|
|
tls *tools.ToolRegistry,
|
|
maxTokens int,
|
|
temperature float64,
|
|
hasMaxTokens, hasTemperature bool,
|
|
) (*tools.ToolResult, error) {
|
|
// 1. Recover parent Turn State from Context
|
|
parentTS := turnStateFromContext(ctx)
|
|
if parentTS == nil {
|
|
// Fallback: If no turnState exists in context, create an isolated ad-hoc root turn state
|
|
// so that the tool can still function outside of an agent loop (e.g. tests, raw invocations).
|
|
parentTS = &turnState{
|
|
ctx: ctx,
|
|
turnID: "adhoc-root",
|
|
depth: 0,
|
|
session: nil, // Ephemeral session not needed for adhoc spawn
|
|
pendingResults: make(chan *tools.ToolResult, 16),
|
|
concurrencySem: make(chan struct{}, 5),
|
|
}
|
|
}
|
|
|
|
// 2. Build Tools slice from registry
|
|
var tlSlice []tools.Tool
|
|
for _, name := range tls.List() {
|
|
if t, ok := tls.Get(name); ok {
|
|
tlSlice = append(tlSlice, t)
|
|
}
|
|
}
|
|
|
|
// 3. System Prompt
|
|
systemPrompt := "You are a subagent. Complete the given task independently and report the result.\n" +
|
|
"You have access to tools - use them as needed to complete your task.\n" +
|
|
"After completing the task, provide a clear summary of what was done.\n\n" +
|
|
"Task: " + task
|
|
|
|
// 4. Resolve Model
|
|
modelToUse := agent.Model
|
|
if targetAgentID != "" {
|
|
if targetAgent, ok := al.GetRegistry().GetAgent(targetAgentID); ok {
|
|
modelToUse = targetAgent.Model
|
|
}
|
|
}
|
|
|
|
// 5. Build SubTurnConfig
|
|
cfg := SubTurnConfig{
|
|
Model: modelToUse,
|
|
Tools: tlSlice,
|
|
SystemPrompt: systemPrompt,
|
|
}
|
|
if hasMaxTokens {
|
|
cfg.MaxTokens = maxTokens
|
|
}
|
|
|
|
// 6. Spawn SubTurn
|
|
return spawnSubTurn(ctx, al, parentTS, cfg)
|
|
})
|
|
|
|
// Clone the parent's tool registry so subagents can use all
|
|
// tools registered so far (file, web, etc.) but NOT spawn/
|
|
// spawn_status which are added below — preventing recursive
|
|
// subagent spawning.
|
|
subagentManager.SetTools(agent.Tools.Clone())
|
|
if spawnEnabled {
|
|
spawnTool := tools.NewSpawnTool(subagentManager)
|
|
spawnTool.SetSpawner(NewSubTurnSpawner(al))
|
|
currentAgentID := agentID
|
|
spawnTool.SetAllowlistChecker(func(targetAgentID string) bool {
|
|
return registry.CanSpawnSubagent(currentAgentID, targetAgentID)
|
|
})
|
|
|
|
agent.Tools.Register(spawnTool)
|
|
|
|
// Also register the synchronous subagent tool
|
|
subagentTool := tools.NewSubagentTool(subagentManager)
|
|
subagentTool.SetSpawner(NewSubTurnSpawner(al))
|
|
agent.Tools.Register(subagentTool)
|
|
}
|
|
if spawnStatusEnabled {
|
|
agent.Tools.Register(tools.NewSpawnStatusTool(subagentManager))
|
|
}
|
|
} else if (spawnEnabled || spawnStatusEnabled) && !cfg.Tools.IsToolEnabled("subagent") {
|
|
logger.WarnCF("agent", "spawn/spawn_status tools require subagent to be enabled", nil)
|
|
}
|
|
}
|
|
}
|
|
|
|
func (al *AgentLoop) Run(ctx context.Context) error {
|
|
al.running.Store(true)
|
|
|
|
if err := al.ensureHooksInitialized(ctx); err != nil {
|
|
return err
|
|
}
|
|
if err := al.ensureMCPInitialized(ctx); err != nil {
|
|
return err
|
|
}
|
|
|
|
idleTicker := time.NewTicker(100 * time.Millisecond)
|
|
defer idleTicker.Stop()
|
|
|
|
for {
|
|
select {
|
|
case <-ctx.Done():
|
|
return nil
|
|
case <-idleTicker.C:
|
|
if !al.running.Load() {
|
|
return nil
|
|
}
|
|
case msg, ok := <-al.bus.InboundChan():
|
|
if !ok {
|
|
return nil
|
|
}
|
|
|
|
// Start a goroutine that drains the bus while processMessage is
|
|
// running. Only messages that resolve to the active turn scope are
|
|
// redirected into steering; other inbound messages are requeued.
|
|
drainCancel := func() {}
|
|
if activeScope, activeAgentID, ok := al.resolveSteeringTarget(msg); ok {
|
|
drainCtx, cancel := context.WithCancel(ctx)
|
|
drainCancel = cancel
|
|
go al.drainBusToSteering(drainCtx, activeScope, activeAgentID)
|
|
}
|
|
|
|
// Process message
|
|
func() {
|
|
defer func() {
|
|
if al.channelManager != nil {
|
|
al.channelManager.InvokeTypingStop(msg.Channel, msg.ChatID)
|
|
}
|
|
}()
|
|
// TODO: Re-enable media cleanup after inbound media is properly consumed by the agent.
|
|
// Currently disabled because files are deleted before the LLM can access their content.
|
|
// defer func() {
|
|
// if al.mediaStore != nil && msg.MediaScope != "" {
|
|
// if releaseErr := al.mediaStore.ReleaseAll(msg.MediaScope); releaseErr != nil {
|
|
// logger.WarnCF("agent", "Failed to release media", map[string]any{
|
|
// "scope": msg.MediaScope,
|
|
// "error": releaseErr.Error(),
|
|
// })
|
|
// }
|
|
// }
|
|
// }()
|
|
|
|
drainCanceled := false
|
|
cancelDrain := func() {
|
|
if drainCanceled {
|
|
return
|
|
}
|
|
drainCancel()
|
|
drainCanceled = true
|
|
}
|
|
defer cancelDrain()
|
|
|
|
response, err := al.processMessage(ctx, msg)
|
|
if err != nil {
|
|
response = fmt.Sprintf("Error processing message: %v", err)
|
|
}
|
|
finalResponse := response
|
|
|
|
target, targetErr := al.buildContinuationTarget(msg)
|
|
if targetErr != nil {
|
|
logger.WarnCF("agent", "Failed to build steering continuation target",
|
|
map[string]any{
|
|
"channel": msg.Channel,
|
|
"error": targetErr.Error(),
|
|
})
|
|
return
|
|
}
|
|
if target == nil {
|
|
cancelDrain()
|
|
if finalResponse != "" {
|
|
al.PublishResponseIfNeeded(ctx, msg.Channel, msg.ChatID, finalResponse)
|
|
}
|
|
return
|
|
}
|
|
|
|
for al.pendingSteeringCountForScope(target.SessionKey) > 0 {
|
|
logger.InfoCF("agent", "Continuing queued steering after turn end",
|
|
map[string]any{
|
|
"channel": target.Channel,
|
|
"chat_id": target.ChatID,
|
|
"session_key": target.SessionKey,
|
|
"queue_depth": al.pendingSteeringCountForScope(target.SessionKey),
|
|
})
|
|
|
|
continued, continueErr := al.Continue(ctx, target.SessionKey, target.Channel, target.ChatID)
|
|
if continueErr != nil {
|
|
logger.WarnCF("agent", "Failed to continue queued steering",
|
|
map[string]any{
|
|
"channel": target.Channel,
|
|
"chat_id": target.ChatID,
|
|
"error": continueErr.Error(),
|
|
})
|
|
return
|
|
}
|
|
if continued == "" {
|
|
return
|
|
}
|
|
|
|
finalResponse = continued
|
|
}
|
|
|
|
cancelDrain()
|
|
|
|
for al.pendingSteeringCountForScope(target.SessionKey) > 0 {
|
|
logger.InfoCF("agent", "Draining steering queued during turn shutdown",
|
|
map[string]any{
|
|
"channel": target.Channel,
|
|
"chat_id": target.ChatID,
|
|
"session_key": target.SessionKey,
|
|
"queue_depth": al.pendingSteeringCountForScope(target.SessionKey),
|
|
})
|
|
|
|
continued, continueErr := al.Continue(ctx, target.SessionKey, target.Channel, target.ChatID)
|
|
if continueErr != nil {
|
|
logger.WarnCF("agent", "Failed to continue queued steering after shutdown drain",
|
|
map[string]any{
|
|
"channel": target.Channel,
|
|
"chat_id": target.ChatID,
|
|
"error": continueErr.Error(),
|
|
})
|
|
return
|
|
}
|
|
if continued == "" {
|
|
break
|
|
}
|
|
|
|
finalResponse = continued
|
|
}
|
|
|
|
if finalResponse != "" {
|
|
al.PublishResponseIfNeeded(ctx, target.Channel, target.ChatID, finalResponse)
|
|
}
|
|
}()
|
|
}
|
|
}
|
|
}
|
|
|
|
// drainBusToSteering consumes inbound messages and redirects messages from the
|
|
// active scope into the steering queue. Messages from other scopes are requeued
|
|
// so they can be processed normally after the active turn. It drains all
|
|
// immediately available messages, blocking for the first one until ctx is done.
|
|
func (al *AgentLoop) drainBusToSteering(ctx context.Context, activeScope, activeAgentID string) {
|
|
blocking := true
|
|
for {
|
|
var msg bus.InboundMessage
|
|
|
|
if blocking {
|
|
// Block waiting for the first available message or ctx cancellation.
|
|
select {
|
|
case <-ctx.Done():
|
|
return
|
|
case m, ok := <-al.bus.InboundChan():
|
|
if !ok {
|
|
return
|
|
}
|
|
msg = m
|
|
}
|
|
} else {
|
|
// Non-blocking: drain any remaining queued messages, return when empty.
|
|
select {
|
|
case m, ok := <-al.bus.InboundChan():
|
|
if !ok {
|
|
return
|
|
}
|
|
msg = m
|
|
default:
|
|
return
|
|
}
|
|
}
|
|
blocking = false
|
|
|
|
msgScope, _, scopeOK := al.resolveSteeringTarget(msg)
|
|
if !scopeOK || msgScope != activeScope {
|
|
if err := al.requeueInboundMessage(msg); err != nil {
|
|
logger.WarnCF("agent", "Failed to requeue non-steering inbound message", map[string]any{
|
|
"error": err.Error(),
|
|
"channel": msg.Channel,
|
|
"sender_id": msg.SenderID,
|
|
})
|
|
}
|
|
continue
|
|
}
|
|
|
|
// Transcribe audio if needed before steering, so the agent sees text.
|
|
msg, _ = al.transcribeAudioInMessage(ctx, msg)
|
|
|
|
logger.InfoCF("agent", "Redirecting inbound message to steering queue",
|
|
map[string]any{
|
|
"channel": msg.Channel,
|
|
"sender_id": msg.SenderID,
|
|
"content_len": len(msg.Content),
|
|
"scope": activeScope,
|
|
})
|
|
|
|
if err := al.enqueueSteeringMessage(activeScope, activeAgentID, providers.Message{
|
|
Role: "user",
|
|
Content: msg.Content,
|
|
Media: append([]string(nil), msg.Media...),
|
|
}); err != nil {
|
|
logger.WarnCF("agent", "Failed to steer message, will be lost",
|
|
map[string]any{
|
|
"error": err.Error(),
|
|
"channel": msg.Channel,
|
|
})
|
|
}
|
|
}
|
|
}
|
|
|
|
func (al *AgentLoop) Stop() {
|
|
al.running.Store(false)
|
|
}
|
|
|
|
func (al *AgentLoop) PublishResponseIfNeeded(ctx context.Context, channel, chatID, response string) {
|
|
if response == "" {
|
|
return
|
|
}
|
|
|
|
alreadySent := false
|
|
defaultAgent := al.GetRegistry().GetDefaultAgent()
|
|
if defaultAgent != nil {
|
|
if tool, ok := defaultAgent.Tools.Get("message"); ok {
|
|
if mt, ok := tool.(*tools.MessageTool); ok {
|
|
alreadySent = mt.HasSentInRound()
|
|
}
|
|
}
|
|
}
|
|
|
|
if alreadySent {
|
|
logger.DebugCF(
|
|
"agent",
|
|
"Skipped outbound (message tool already sent)",
|
|
map[string]any{"channel": channel},
|
|
)
|
|
return
|
|
}
|
|
|
|
al.bus.PublishOutbound(ctx, bus.OutboundMessage{
|
|
Channel: channel,
|
|
ChatID: chatID,
|
|
Content: response,
|
|
})
|
|
logger.InfoCF("agent", "Published outbound response",
|
|
map[string]any{
|
|
"channel": channel,
|
|
"chat_id": chatID,
|
|
"content_len": len(response),
|
|
})
|
|
}
|
|
|
|
func (al *AgentLoop) buildContinuationTarget(msg bus.InboundMessage) (*continuationTarget, error) {
|
|
if msg.Channel == "system" {
|
|
return nil, nil
|
|
}
|
|
|
|
route, _, err := al.resolveMessageRoute(msg)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
return &continuationTarget{
|
|
SessionKey: resolveScopeKey(route, msg.SessionKey),
|
|
Channel: msg.Channel,
|
|
ChatID: msg.ChatID,
|
|
}, nil
|
|
}
|
|
|
|
// Close releases resources held by agent session stores. Call after Stop.
|
|
func (al *AgentLoop) Close() {
|
|
mcpManager := al.mcp.takeManager()
|
|
|
|
if mcpManager != nil {
|
|
if err := mcpManager.Close(); err != nil {
|
|
logger.ErrorCF("agent", "Failed to close MCP manager",
|
|
map[string]any{
|
|
"error": err.Error(),
|
|
})
|
|
}
|
|
}
|
|
|
|
al.GetRegistry().Close()
|
|
if al.hooks != nil {
|
|
al.hooks.Close()
|
|
}
|
|
if al.eventBus != nil {
|
|
al.eventBus.Close()
|
|
}
|
|
}
|
|
|
|
// MountHook registers an in-process hook on the agent loop.
|
|
func (al *AgentLoop) MountHook(reg HookRegistration) error {
|
|
if al == nil || al.hooks == nil {
|
|
return fmt.Errorf("hook manager is not initialized")
|
|
}
|
|
return al.hooks.Mount(reg)
|
|
}
|
|
|
|
// UnmountHook removes a previously registered in-process hook.
|
|
func (al *AgentLoop) UnmountHook(name string) {
|
|
if al == nil || al.hooks == nil {
|
|
return
|
|
}
|
|
al.hooks.Unmount(name)
|
|
}
|
|
|
|
// SubscribeEvents registers a subscriber for agent-loop events.
|
|
func (al *AgentLoop) SubscribeEvents(buffer int) EventSubscription {
|
|
if al == nil || al.eventBus == nil {
|
|
ch := make(chan Event)
|
|
close(ch)
|
|
return EventSubscription{C: ch}
|
|
}
|
|
return al.eventBus.Subscribe(buffer)
|
|
}
|
|
|
|
// UnsubscribeEvents removes a previously registered event subscriber.
|
|
func (al *AgentLoop) UnsubscribeEvents(id uint64) {
|
|
if al == nil || al.eventBus == nil {
|
|
return
|
|
}
|
|
al.eventBus.Unsubscribe(id)
|
|
}
|
|
|
|
// EventDrops returns the number of dropped events for the given kind.
|
|
func (al *AgentLoop) EventDrops(kind EventKind) int64 {
|
|
if al == nil || al.eventBus == nil {
|
|
return 0
|
|
}
|
|
return al.eventBus.Dropped(kind)
|
|
}
|
|
|
|
type turnEventScope struct {
|
|
agentID string
|
|
sessionKey string
|
|
turnID string
|
|
}
|
|
|
|
func (al *AgentLoop) newTurnEventScope(agentID, sessionKey string) turnEventScope {
|
|
seq := al.turnSeq.Add(1)
|
|
return turnEventScope{
|
|
agentID: agentID,
|
|
sessionKey: sessionKey,
|
|
turnID: fmt.Sprintf("%s-turn-%d", agentID, seq),
|
|
}
|
|
}
|
|
|
|
func (ts turnEventScope) meta(iteration int, source, tracePath string) EventMeta {
|
|
return EventMeta{
|
|
AgentID: ts.agentID,
|
|
TurnID: ts.turnID,
|
|
SessionKey: ts.sessionKey,
|
|
Iteration: iteration,
|
|
Source: source,
|
|
TracePath: tracePath,
|
|
}
|
|
}
|
|
|
|
func (al *AgentLoop) emitEvent(kind EventKind, meta EventMeta, payload any) {
|
|
evt := Event{
|
|
Kind: kind,
|
|
Meta: meta,
|
|
Payload: payload,
|
|
}
|
|
|
|
if al == nil || al.eventBus == nil {
|
|
return
|
|
}
|
|
|
|
al.logEvent(evt)
|
|
|
|
al.eventBus.Emit(evt)
|
|
}
|
|
|
|
func cloneEventArguments(args map[string]any) map[string]any {
|
|
if len(args) == 0 {
|
|
return nil
|
|
}
|
|
|
|
cloned := make(map[string]any, len(args))
|
|
for k, v := range args {
|
|
cloned[k] = v
|
|
}
|
|
return cloned
|
|
}
|
|
|
|
func (al *AgentLoop) hookAbortError(ts *turnState, stage string, decision HookDecision) error {
|
|
reason := decision.Reason
|
|
if reason == "" {
|
|
reason = "hook requested turn abort"
|
|
}
|
|
|
|
err := fmt.Errorf("hook aborted turn during %s: %s", stage, reason)
|
|
al.emitEvent(
|
|
EventKindError,
|
|
ts.eventMeta("hooks", "turn.error"),
|
|
ErrorPayload{
|
|
Stage: "hook." + stage,
|
|
Message: err.Error(),
|
|
},
|
|
)
|
|
return err
|
|
}
|
|
|
|
func hookDeniedToolContent(prefix, reason string) string {
|
|
if reason == "" {
|
|
return prefix
|
|
}
|
|
return prefix + ": " + reason
|
|
}
|
|
|
|
func (al *AgentLoop) logEvent(evt Event) {
|
|
fields := map[string]any{
|
|
"event_kind": evt.Kind.String(),
|
|
"agent_id": evt.Meta.AgentID,
|
|
"turn_id": evt.Meta.TurnID,
|
|
"session_key": evt.Meta.SessionKey,
|
|
"iteration": evt.Meta.Iteration,
|
|
}
|
|
|
|
if evt.Meta.TracePath != "" {
|
|
fields["trace"] = evt.Meta.TracePath
|
|
}
|
|
if evt.Meta.Source != "" {
|
|
fields["source"] = evt.Meta.Source
|
|
}
|
|
|
|
switch payload := evt.Payload.(type) {
|
|
case TurnStartPayload:
|
|
fields["channel"] = payload.Channel
|
|
fields["chat_id"] = payload.ChatID
|
|
fields["user_len"] = len(payload.UserMessage)
|
|
fields["media_count"] = payload.MediaCount
|
|
case TurnEndPayload:
|
|
fields["status"] = payload.Status
|
|
fields["iterations_total"] = payload.Iterations
|
|
fields["duration_ms"] = payload.Duration.Milliseconds()
|
|
fields["final_len"] = payload.FinalContentLen
|
|
case LLMRequestPayload:
|
|
fields["model"] = payload.Model
|
|
fields["messages"] = payload.MessagesCount
|
|
fields["tools"] = payload.ToolsCount
|
|
fields["max_tokens"] = payload.MaxTokens
|
|
case LLMDeltaPayload:
|
|
fields["content_delta_len"] = payload.ContentDeltaLen
|
|
fields["reasoning_delta_len"] = payload.ReasoningDeltaLen
|
|
case LLMResponsePayload:
|
|
fields["content_len"] = payload.ContentLen
|
|
fields["tool_calls"] = payload.ToolCalls
|
|
fields["has_reasoning"] = payload.HasReasoning
|
|
case LLMRetryPayload:
|
|
fields["attempt"] = payload.Attempt
|
|
fields["max_retries"] = payload.MaxRetries
|
|
fields["reason"] = payload.Reason
|
|
fields["error"] = payload.Error
|
|
fields["backoff_ms"] = payload.Backoff.Milliseconds()
|
|
case ContextCompressPayload:
|
|
fields["reason"] = payload.Reason
|
|
fields["dropped_messages"] = payload.DroppedMessages
|
|
fields["remaining_messages"] = payload.RemainingMessages
|
|
case SessionSummarizePayload:
|
|
fields["summarized_messages"] = payload.SummarizedMessages
|
|
fields["kept_messages"] = payload.KeptMessages
|
|
fields["summary_len"] = payload.SummaryLen
|
|
fields["omitted_oversized"] = payload.OmittedOversized
|
|
case ToolExecStartPayload:
|
|
fields["tool"] = payload.Tool
|
|
fields["args_count"] = len(payload.Arguments)
|
|
case ToolExecEndPayload:
|
|
fields["tool"] = payload.Tool
|
|
fields["duration_ms"] = payload.Duration.Milliseconds()
|
|
fields["for_llm_len"] = payload.ForLLMLen
|
|
fields["for_user_len"] = payload.ForUserLen
|
|
fields["is_error"] = payload.IsError
|
|
fields["async"] = payload.Async
|
|
case ToolExecSkippedPayload:
|
|
fields["tool"] = payload.Tool
|
|
fields["reason"] = payload.Reason
|
|
case SteeringInjectedPayload:
|
|
fields["count"] = payload.Count
|
|
fields["total_content_len"] = payload.TotalContentLen
|
|
case FollowUpQueuedPayload:
|
|
fields["source_tool"] = payload.SourceTool
|
|
fields["channel"] = payload.Channel
|
|
fields["chat_id"] = payload.ChatID
|
|
fields["content_len"] = payload.ContentLen
|
|
case InterruptReceivedPayload:
|
|
fields["interrupt_kind"] = payload.Kind
|
|
fields["role"] = payload.Role
|
|
fields["content_len"] = payload.ContentLen
|
|
fields["queue_depth"] = payload.QueueDepth
|
|
fields["hint_len"] = payload.HintLen
|
|
case SubTurnSpawnPayload:
|
|
fields["child_agent_id"] = payload.AgentID
|
|
fields["label"] = payload.Label
|
|
case SubTurnEndPayload:
|
|
fields["child_agent_id"] = payload.AgentID
|
|
fields["status"] = payload.Status
|
|
case SubTurnResultDeliveredPayload:
|
|
fields["target_channel"] = payload.TargetChannel
|
|
fields["target_chat_id"] = payload.TargetChatID
|
|
fields["content_len"] = payload.ContentLen
|
|
case ErrorPayload:
|
|
fields["stage"] = payload.Stage
|
|
fields["error"] = payload.Message
|
|
}
|
|
|
|
logger.InfoCF("eventbus", fmt.Sprintf("Agent event: %s", evt.Kind.String()), fields)
|
|
}
|
|
|
|
func (al *AgentLoop) RegisterTool(tool tools.Tool) {
|
|
registry := al.GetRegistry()
|
|
for _, agentID := range registry.ListAgentIDs() {
|
|
if agent, ok := registry.GetAgent(agentID); ok {
|
|
agent.Tools.Register(tool)
|
|
}
|
|
}
|
|
}
|
|
|
|
func (al *AgentLoop) SetChannelManager(cm *channels.Manager) {
|
|
al.channelManager = cm
|
|
}
|
|
|
|
// ReloadProviderAndConfig atomically swaps the provider and config with proper synchronization.
|
|
// It uses a context to allow timeout control from the caller.
|
|
// Returns an error if the reload fails or context is canceled.
|
|
func (al *AgentLoop) ReloadProviderAndConfig(
|
|
ctx context.Context,
|
|
provider providers.LLMProvider,
|
|
cfg *config.Config,
|
|
) error {
|
|
// Validate inputs
|
|
if provider == nil {
|
|
return fmt.Errorf("provider cannot be nil")
|
|
}
|
|
if cfg == nil {
|
|
return fmt.Errorf("config cannot be nil")
|
|
}
|
|
|
|
// Create new registry with updated config and provider
|
|
// Wrap in defer/recover to handle any panics gracefully
|
|
var registry *AgentRegistry
|
|
var panicErr error
|
|
done := make(chan struct{}, 1)
|
|
|
|
go func() {
|
|
defer func() {
|
|
if r := recover(); r != nil {
|
|
panicErr = fmt.Errorf("panic during registry creation: %v", r)
|
|
logger.ErrorCF("agent", "Panic during registry creation",
|
|
map[string]any{"panic": r})
|
|
}
|
|
close(done)
|
|
}()
|
|
|
|
registry = NewAgentRegistry(cfg, provider)
|
|
}()
|
|
|
|
// Wait for completion or context cancellation
|
|
select {
|
|
case <-done:
|
|
if registry == nil {
|
|
if panicErr != nil {
|
|
return fmt.Errorf("registry creation failed: %w", panicErr)
|
|
}
|
|
return fmt.Errorf("registry creation failed (nil result)")
|
|
}
|
|
case <-ctx.Done():
|
|
return fmt.Errorf("context canceled during registry creation: %w", ctx.Err())
|
|
}
|
|
|
|
// Check context again before proceeding
|
|
if err := ctx.Err(); err != nil {
|
|
return fmt.Errorf("context canceled after registry creation: %w", err)
|
|
}
|
|
|
|
// Ensure shared tools are re-registered on the new registry
|
|
registerSharedTools(al, cfg, al.bus, registry, provider)
|
|
|
|
// Atomically swap the config and registry under write lock
|
|
// This ensures readers see a consistent pair
|
|
al.mu.Lock()
|
|
oldRegistry := al.registry
|
|
|
|
// Store new values
|
|
al.cfg = cfg
|
|
al.registry = registry
|
|
|
|
// Also update fallback chain with new config
|
|
al.fallback = providers.NewFallbackChain(providers.NewCooldownTracker())
|
|
|
|
al.mu.Unlock()
|
|
|
|
al.hookRuntime.reset(al)
|
|
configureHookManagerFromConfig(al.hooks, cfg)
|
|
|
|
// Close old provider after releasing the lock
|
|
// This prevents blocking readers while closing
|
|
if oldProvider, ok := extractProvider(oldRegistry); ok {
|
|
if stateful, ok := oldProvider.(providers.StatefulProvider); ok {
|
|
// Give in-flight requests a moment to complete
|
|
// Use a reasonable timeout that balances cleanup vs resource usage
|
|
select {
|
|
case <-time.After(100 * time.Millisecond):
|
|
stateful.Close()
|
|
case <-ctx.Done():
|
|
// Context canceled, close immediately but log warning
|
|
logger.WarnCF("agent", "Context canceled during provider cleanup, forcing close",
|
|
map[string]any{"error": ctx.Err()})
|
|
stateful.Close()
|
|
}
|
|
}
|
|
}
|
|
|
|
logger.InfoCF("agent", "Provider and config reloaded successfully",
|
|
map[string]any{
|
|
"model": cfg.Agents.Defaults.GetModelName(),
|
|
})
|
|
|
|
return nil
|
|
}
|
|
|
|
// GetRegistry returns the current registry (thread-safe)
|
|
func (al *AgentLoop) GetRegistry() *AgentRegistry {
|
|
al.mu.RLock()
|
|
defer al.mu.RUnlock()
|
|
return al.registry
|
|
}
|
|
|
|
// GetConfig returns the current config (thread-safe)
|
|
func (al *AgentLoop) GetConfig() *config.Config {
|
|
al.mu.RLock()
|
|
defer al.mu.RUnlock()
|
|
return al.cfg
|
|
}
|
|
|
|
// SetMediaStore injects a MediaStore for media lifecycle management.
|
|
func (al *AgentLoop) SetMediaStore(s media.MediaStore) {
|
|
al.mediaStore = s
|
|
|
|
// Propagate store to all registered tools that can emit media.
|
|
registry := al.GetRegistry()
|
|
for _, agentID := range registry.ListAgentIDs() {
|
|
if agent, ok := registry.GetAgent(agentID); ok {
|
|
agent.Tools.SetMediaStore(s)
|
|
}
|
|
}
|
|
}
|
|
|
|
// SetTranscriber injects a voice transcriber for agent-level audio transcription.
|
|
func (al *AgentLoop) SetTranscriber(t voice.Transcriber) {
|
|
al.transcriber = t
|
|
}
|
|
|
|
// SetReloadFunc sets the callback function for triggering config reload.
|
|
func (al *AgentLoop) SetReloadFunc(fn func() error) {
|
|
al.reloadFunc = fn
|
|
}
|
|
|
|
var audioAnnotationRe = regexp.MustCompile(`\[(voice|audio)(?::[^\]]*)?\]`)
|
|
|
|
// transcribeAudioInMessage resolves audio media refs, transcribes them, and
|
|
// replaces audio annotations in msg.Content with the transcribed text.
|
|
// Returns the (possibly modified) message and true if audio was transcribed.
|
|
func (al *AgentLoop) transcribeAudioInMessage(ctx context.Context, msg bus.InboundMessage) (bus.InboundMessage, bool) {
|
|
if al.transcriber == nil || al.mediaStore == nil || len(msg.Media) == 0 {
|
|
return msg, false
|
|
}
|
|
|
|
// Transcribe each audio media ref in order.
|
|
var transcriptions []string
|
|
for _, ref := range msg.Media {
|
|
path, meta, err := al.mediaStore.ResolveWithMeta(ref)
|
|
if err != nil {
|
|
logger.WarnCF("voice", "Failed to resolve media ref", map[string]any{"ref": ref, "error": err})
|
|
continue
|
|
}
|
|
if !utils.IsAudioFile(meta.Filename, meta.ContentType) {
|
|
continue
|
|
}
|
|
result, err := al.transcriber.Transcribe(ctx, path)
|
|
if err != nil {
|
|
logger.WarnCF("voice", "Transcription failed", map[string]any{"ref": ref, "error": err})
|
|
transcriptions = append(transcriptions, "")
|
|
continue
|
|
}
|
|
transcriptions = append(transcriptions, result.Text)
|
|
}
|
|
|
|
if len(transcriptions) == 0 {
|
|
return msg, false
|
|
}
|
|
|
|
al.sendTranscriptionFeedback(ctx, msg.Channel, msg.ChatID, msg.MessageID, transcriptions)
|
|
|
|
// Replace audio annotations sequentially with transcriptions.
|
|
idx := 0
|
|
newContent := audioAnnotationRe.ReplaceAllStringFunc(msg.Content, func(match string) string {
|
|
if idx >= len(transcriptions) {
|
|
return match
|
|
}
|
|
text := transcriptions[idx]
|
|
idx++
|
|
return "[voice: " + text + "]"
|
|
})
|
|
|
|
// Append any remaining transcriptions not matched by an annotation.
|
|
for ; idx < len(transcriptions); idx++ {
|
|
newContent += "\n[voice: " + transcriptions[idx] + "]"
|
|
}
|
|
|
|
msg.Content = newContent
|
|
return msg, true
|
|
}
|
|
|
|
// sendTranscriptionFeedback sends feedback to the user with the result of
|
|
// audio transcription if the option is enabled. It uses Manager.SendMessage
|
|
// which executes synchronously (rate limiting, splitting, retry) so that
|
|
// ordering with the subsequent placeholder is guaranteed.
|
|
func (al *AgentLoop) sendTranscriptionFeedback(
|
|
ctx context.Context,
|
|
channel, chatID, messageID string,
|
|
validTexts []string,
|
|
) {
|
|
if !al.cfg.Voice.EchoTranscription {
|
|
return
|
|
}
|
|
if al.channelManager == nil {
|
|
return
|
|
}
|
|
|
|
var nonEmpty []string
|
|
for _, t := range validTexts {
|
|
if t != "" {
|
|
nonEmpty = append(nonEmpty, t)
|
|
}
|
|
}
|
|
|
|
var feedbackMsg string
|
|
if len(nonEmpty) > 0 {
|
|
feedbackMsg = "Transcript: " + strings.Join(nonEmpty, "\n")
|
|
} else {
|
|
feedbackMsg = "No voice detected in the audio"
|
|
}
|
|
|
|
err := al.channelManager.SendMessage(ctx, bus.OutboundMessage{
|
|
Channel: channel,
|
|
ChatID: chatID,
|
|
Content: feedbackMsg,
|
|
ReplyToMessageID: messageID,
|
|
})
|
|
if err != nil {
|
|
logger.WarnCF("voice", "Failed to send transcription feedback", map[string]any{"error": err.Error()})
|
|
}
|
|
}
|
|
|
|
// inferMediaType determines the media type ("image", "audio", "video", "file")
|
|
// from a filename and MIME content type.
|
|
func inferMediaType(filename, contentType string) string {
|
|
ct := strings.ToLower(contentType)
|
|
fn := strings.ToLower(filename)
|
|
|
|
if strings.HasPrefix(ct, "image/") {
|
|
return "image"
|
|
}
|
|
if strings.HasPrefix(ct, "audio/") || ct == "application/ogg" {
|
|
return "audio"
|
|
}
|
|
if strings.HasPrefix(ct, "video/") {
|
|
return "video"
|
|
}
|
|
|
|
// Fallback: infer from extension
|
|
ext := filepath.Ext(fn)
|
|
switch ext {
|
|
case ".jpg", ".jpeg", ".png", ".gif", ".webp", ".bmp", ".svg":
|
|
return "image"
|
|
case ".mp3", ".wav", ".ogg", ".m4a", ".flac", ".aac", ".wma", ".opus":
|
|
return "audio"
|
|
case ".mp4", ".avi", ".mov", ".webm", ".mkv":
|
|
return "video"
|
|
}
|
|
|
|
return "file"
|
|
}
|
|
|
|
// RecordLastChannel records the last active channel for this workspace.
|
|
// This uses the atomic state save mechanism to prevent data loss on crash.
|
|
func (al *AgentLoop) RecordLastChannel(channel string) error {
|
|
if al.state == nil {
|
|
return nil
|
|
}
|
|
return al.state.SetLastChannel(channel)
|
|
}
|
|
|
|
// RecordLastChatID records the last active chat ID for this workspace.
|
|
// This uses the atomic state save mechanism to prevent data loss on crash.
|
|
func (al *AgentLoop) RecordLastChatID(chatID string) error {
|
|
if al.state == nil {
|
|
return nil
|
|
}
|
|
return al.state.SetLastChatID(chatID)
|
|
}
|
|
|
|
func (al *AgentLoop) ProcessDirect(
|
|
ctx context.Context,
|
|
content, sessionKey string,
|
|
) (string, error) {
|
|
return al.ProcessDirectWithChannel(ctx, content, sessionKey, "cli", "direct")
|
|
}
|
|
|
|
func (al *AgentLoop) ProcessDirectWithChannel(
|
|
ctx context.Context,
|
|
content, sessionKey, channel, chatID string,
|
|
) (string, error) {
|
|
if err := al.ensureHooksInitialized(ctx); err != nil {
|
|
return "", err
|
|
}
|
|
if err := al.ensureMCPInitialized(ctx); err != nil {
|
|
return "", err
|
|
}
|
|
|
|
msg := bus.InboundMessage{
|
|
Channel: channel,
|
|
SenderID: "cron",
|
|
ChatID: chatID,
|
|
Content: content,
|
|
SessionKey: sessionKey,
|
|
}
|
|
|
|
return al.processMessage(ctx, msg)
|
|
}
|
|
|
|
// ProcessHeartbeat processes a heartbeat request without session history.
|
|
// Each heartbeat is independent and doesn't accumulate context.
|
|
func (al *AgentLoop) ProcessHeartbeat(
|
|
ctx context.Context,
|
|
content, channel, chatID string,
|
|
) (string, error) {
|
|
if err := al.ensureHooksInitialized(ctx); err != nil {
|
|
return "", err
|
|
}
|
|
if err := al.ensureMCPInitialized(ctx); err != nil {
|
|
return "", err
|
|
}
|
|
|
|
agent := al.GetRegistry().GetDefaultAgent()
|
|
if agent == nil {
|
|
return "", fmt.Errorf("no default agent for heartbeat")
|
|
}
|
|
return al.runAgentLoop(ctx, agent, processOptions{
|
|
SessionKey: "heartbeat",
|
|
Channel: channel,
|
|
ChatID: chatID,
|
|
UserMessage: content,
|
|
DefaultResponse: defaultResponse,
|
|
EnableSummary: false,
|
|
SendResponse: false,
|
|
SuppressToolFeedback: true,
|
|
NoHistory: true, // Don't load session history for heartbeat
|
|
})
|
|
}
|
|
|
|
func (al *AgentLoop) processMessage(ctx context.Context, msg bus.InboundMessage) (string, error) {
|
|
// Add message preview to log (show full content for error messages)
|
|
var logContent string
|
|
if strings.Contains(msg.Content, "Error:") || strings.Contains(msg.Content, "error") {
|
|
logContent = msg.Content // Full content for errors
|
|
} else {
|
|
logContent = utils.Truncate(msg.Content, 80)
|
|
}
|
|
logger.InfoCF(
|
|
"agent",
|
|
fmt.Sprintf("Processing message from %s:%s: %s", msg.Channel, msg.SenderID, logContent),
|
|
map[string]any{
|
|
"channel": msg.Channel,
|
|
"chat_id": msg.ChatID,
|
|
"sender_id": msg.SenderID,
|
|
"session_key": msg.SessionKey,
|
|
},
|
|
)
|
|
|
|
var hadAudio bool
|
|
msg, hadAudio = al.transcribeAudioInMessage(ctx, msg)
|
|
|
|
// For audio messages the placeholder was deferred by the channel.
|
|
// Now that transcription (and optional feedback) is done, send it.
|
|
if hadAudio && al.channelManager != nil {
|
|
al.channelManager.SendPlaceholder(ctx, msg.Channel, msg.ChatID)
|
|
}
|
|
|
|
// Route system messages to processSystemMessage
|
|
if msg.Channel == "system" {
|
|
return al.processSystemMessage(ctx, msg)
|
|
}
|
|
|
|
route, agent, routeErr := al.resolveMessageRoute(msg)
|
|
if routeErr != nil {
|
|
return "", routeErr
|
|
}
|
|
|
|
// Reset message-tool state for this round so we don't skip publishing due to a previous round.
|
|
if tool, ok := agent.Tools.Get("message"); ok {
|
|
if resetter, ok := tool.(interface{ ResetSentInRound() }); ok {
|
|
resetter.ResetSentInRound()
|
|
}
|
|
}
|
|
|
|
// Resolve session key from route, while preserving explicit agent-scoped keys.
|
|
scopeKey := resolveScopeKey(route, msg.SessionKey)
|
|
sessionKey := scopeKey
|
|
|
|
logger.InfoCF("agent", "Routed message",
|
|
map[string]any{
|
|
"agent_id": agent.ID,
|
|
"scope_key": scopeKey,
|
|
"session_key": sessionKey,
|
|
"matched_by": route.MatchedBy,
|
|
"route_agent": route.AgentID,
|
|
"route_channel": route.Channel,
|
|
})
|
|
|
|
opts := processOptions{
|
|
SessionKey: sessionKey,
|
|
Channel: msg.Channel,
|
|
ChatID: msg.ChatID,
|
|
SenderID: msg.SenderID,
|
|
SenderDisplayName: msg.Sender.DisplayName,
|
|
UserMessage: msg.Content,
|
|
Media: msg.Media,
|
|
DefaultResponse: defaultResponse,
|
|
EnableSummary: true,
|
|
SendResponse: false,
|
|
}
|
|
|
|
// context-dependent commands check their own Runtime fields and report
|
|
// "unavailable" when the required capability is nil.
|
|
if response, handled := al.handleCommand(ctx, msg, agent, &opts); handled {
|
|
return response, nil
|
|
}
|
|
|
|
if pending := al.takePendingSkills(opts.SessionKey); len(pending) > 0 {
|
|
opts.ForcedSkills = append(opts.ForcedSkills, pending...)
|
|
logger.InfoCF("agent", "Applying pending skill override",
|
|
map[string]any{
|
|
"session_key": opts.SessionKey,
|
|
"skills": strings.Join(pending, ","),
|
|
})
|
|
}
|
|
|
|
return al.runAgentLoop(ctx, agent, opts)
|
|
}
|
|
|
|
func (al *AgentLoop) resolveMessageRoute(msg bus.InboundMessage) (routing.ResolvedRoute, *AgentInstance, error) {
|
|
registry := al.GetRegistry()
|
|
route := registry.ResolveRoute(routing.RouteInput{
|
|
Channel: msg.Channel,
|
|
AccountID: inboundMetadata(msg, metadataKeyAccountID),
|
|
Peer: extractPeer(msg),
|
|
ParentPeer: extractParentPeer(msg),
|
|
GuildID: inboundMetadata(msg, metadataKeyGuildID),
|
|
TeamID: inboundMetadata(msg, metadataKeyTeamID),
|
|
})
|
|
|
|
agent, ok := registry.GetAgent(route.AgentID)
|
|
if !ok {
|
|
agent = registry.GetDefaultAgent()
|
|
}
|
|
if agent == nil {
|
|
return routing.ResolvedRoute{}, nil, fmt.Errorf("no agent available for route (agent_id=%s)", route.AgentID)
|
|
}
|
|
|
|
return route, agent, nil
|
|
}
|
|
|
|
func resolveScopeKey(route routing.ResolvedRoute, msgSessionKey string) string {
|
|
if msgSessionKey != "" && strings.HasPrefix(msgSessionKey, sessionKeyAgentPrefix) {
|
|
return msgSessionKey
|
|
}
|
|
return route.SessionKey
|
|
}
|
|
|
|
func (al *AgentLoop) resolveSteeringTarget(msg bus.InboundMessage) (string, string, bool) {
|
|
if msg.Channel == "system" {
|
|
return "", "", false
|
|
}
|
|
|
|
route, agent, err := al.resolveMessageRoute(msg)
|
|
if err != nil || agent == nil {
|
|
return "", "", false
|
|
}
|
|
|
|
return resolveScopeKey(route, msg.SessionKey), agent.ID, true
|
|
}
|
|
|
|
func (al *AgentLoop) requeueInboundMessage(msg bus.InboundMessage) error {
|
|
if al.bus == nil {
|
|
return nil
|
|
}
|
|
pubCtx, cancel := context.WithTimeout(context.Background(), time.Second)
|
|
defer cancel()
|
|
return al.bus.PublishOutbound(pubCtx, bus.OutboundMessage{
|
|
Channel: msg.Channel,
|
|
ChatID: msg.ChatID,
|
|
Content: msg.Content,
|
|
})
|
|
}
|
|
|
|
func (al *AgentLoop) processSystemMessage(
|
|
ctx context.Context,
|
|
msg bus.InboundMessage,
|
|
) (string, error) {
|
|
if msg.Channel != "system" {
|
|
return "", fmt.Errorf(
|
|
"processSystemMessage called with non-system message channel: %s",
|
|
msg.Channel,
|
|
)
|
|
}
|
|
|
|
logger.InfoCF("agent", "Processing system message",
|
|
map[string]any{
|
|
"sender_id": msg.SenderID,
|
|
"chat_id": msg.ChatID,
|
|
})
|
|
|
|
// Parse origin channel from chat_id (format: "channel:chat_id")
|
|
var originChannel, originChatID string
|
|
if idx := strings.Index(msg.ChatID, ":"); idx > 0 {
|
|
originChannel = msg.ChatID[:idx]
|
|
originChatID = msg.ChatID[idx+1:]
|
|
} else {
|
|
originChannel = "cli"
|
|
originChatID = msg.ChatID
|
|
}
|
|
|
|
// Extract subagent result from message content
|
|
// Format: "Task 'label' completed.\n\nResult:\n<actual content>"
|
|
content := msg.Content
|
|
if idx := strings.Index(content, "Result:\n"); idx >= 0 {
|
|
content = content[idx+8:] // Extract just the result part
|
|
}
|
|
|
|
// Skip internal channels - only log, don't send to user
|
|
if constants.IsInternalChannel(originChannel) {
|
|
logger.InfoCF("agent", "Subagent completed (internal channel)",
|
|
map[string]any{
|
|
"sender_id": msg.SenderID,
|
|
"content_len": len(content),
|
|
"channel": originChannel,
|
|
})
|
|
return "", nil
|
|
}
|
|
|
|
// Use default agent for system messages
|
|
agent := al.GetRegistry().GetDefaultAgent()
|
|
if agent == nil {
|
|
return "", fmt.Errorf("no default agent for system message")
|
|
}
|
|
|
|
// Use the origin session for context
|
|
sessionKey := routing.BuildAgentMainSessionKey(agent.ID)
|
|
|
|
return al.runAgentLoop(ctx, agent, processOptions{
|
|
SessionKey: sessionKey,
|
|
Channel: originChannel,
|
|
ChatID: originChatID,
|
|
UserMessage: fmt.Sprintf("[System: %s] %s", msg.SenderID, msg.Content),
|
|
DefaultResponse: "Background task completed.",
|
|
EnableSummary: false,
|
|
SendResponse: true,
|
|
})
|
|
}
|
|
|
|
// runAgentLoop remains the top-level shell that starts a turn and publishes
|
|
// any post-turn work. runTurn owns the full turn lifecycle.
|
|
func (al *AgentLoop) runAgentLoop(
|
|
ctx context.Context,
|
|
agent *AgentInstance,
|
|
opts processOptions,
|
|
) (string, error) {
|
|
// Record last channel for heartbeat notifications (skip internal channels and cli)
|
|
if opts.Channel != "" && opts.ChatID != "" && !constants.IsInternalChannel(opts.Channel) {
|
|
channelKey := fmt.Sprintf("%s:%s", opts.Channel, opts.ChatID)
|
|
if err := al.RecordLastChannel(channelKey); err != nil {
|
|
logger.WarnCF(
|
|
"agent",
|
|
"Failed to record last channel",
|
|
map[string]any{"error": err.Error()},
|
|
)
|
|
}
|
|
}
|
|
|
|
ts := newTurnState(agent, opts, al.newTurnEventScope(agent.ID, opts.SessionKey))
|
|
result, err := al.runTurn(ctx, ts)
|
|
if err != nil {
|
|
return "", err
|
|
}
|
|
if result.status == TurnEndStatusAborted {
|
|
return "", nil
|
|
}
|
|
|
|
for _, followUp := range result.followUps {
|
|
if pubErr := al.bus.PublishInbound(ctx, followUp); pubErr != nil {
|
|
logger.WarnCF("agent", "Failed to publish follow-up after turn",
|
|
map[string]any{
|
|
"turn_id": ts.turnID,
|
|
"error": pubErr.Error(),
|
|
})
|
|
}
|
|
}
|
|
|
|
if opts.SendResponse && result.finalContent != "" {
|
|
al.bus.PublishOutbound(ctx, bus.OutboundMessage{
|
|
Channel: opts.Channel,
|
|
ChatID: opts.ChatID,
|
|
Content: result.finalContent,
|
|
})
|
|
}
|
|
|
|
if result.finalContent != "" {
|
|
responsePreview := utils.Truncate(result.finalContent, 120)
|
|
logger.InfoCF("agent", fmt.Sprintf("Response: %s", responsePreview),
|
|
map[string]any{
|
|
"agent_id": agent.ID,
|
|
"session_key": opts.SessionKey,
|
|
"iterations": ts.currentIteration(),
|
|
"final_length": len(result.finalContent),
|
|
})
|
|
}
|
|
|
|
return result.finalContent, nil
|
|
}
|
|
|
|
func (al *AgentLoop) targetReasoningChannelID(channelName string) (chatID string) {
|
|
if al.channelManager == nil {
|
|
return ""
|
|
}
|
|
if ch, ok := al.channelManager.GetChannel(channelName); ok {
|
|
return ch.ReasoningChannelID()
|
|
}
|
|
return ""
|
|
}
|
|
|
|
func (al *AgentLoop) handleReasoning(
|
|
ctx context.Context,
|
|
reasoningContent, channelName, channelID string,
|
|
) {
|
|
if reasoningContent == "" || channelName == "" || channelID == "" {
|
|
return
|
|
}
|
|
|
|
// Check context cancellation before attempting to publish,
|
|
// since PublishOutbound's select may race between send and ctx.Done().
|
|
if ctx.Err() != nil {
|
|
return
|
|
}
|
|
|
|
// Use a short timeout so the goroutine does not block indefinitely when
|
|
// the outbound bus is full. Reasoning output is best-effort; dropping it
|
|
// is acceptable to avoid goroutine accumulation.
|
|
pubCtx, pubCancel := context.WithTimeout(ctx, 5*time.Second)
|
|
defer pubCancel()
|
|
|
|
if err := al.bus.PublishOutbound(pubCtx, bus.OutboundMessage{
|
|
Channel: channelName,
|
|
ChatID: channelID,
|
|
Content: reasoningContent,
|
|
}); err != nil {
|
|
// Treat context.DeadlineExceeded / context.Canceled as expected
|
|
// (bus full under load, or parent canceled). Check the error
|
|
// itself rather than ctx.Err(), because pubCtx may time out
|
|
// (5 s) while the parent ctx is still active.
|
|
// Also treat ErrBusClosed as expected — it occurs during normal
|
|
// shutdown when the bus is closed before all goroutines finish.
|
|
if errors.Is(err, context.DeadlineExceeded) || errors.Is(err, context.Canceled) ||
|
|
errors.Is(err, bus.ErrBusClosed) {
|
|
logger.DebugCF("agent", "Reasoning publish skipped (timeout/cancel)", map[string]any{
|
|
"channel": channelName,
|
|
"error": err.Error(),
|
|
})
|
|
} else {
|
|
logger.WarnCF("agent", "Failed to publish reasoning (best-effort)", map[string]any{
|
|
"channel": channelName,
|
|
"error": err.Error(),
|
|
})
|
|
}
|
|
}
|
|
}
|
|
|
|
func (al *AgentLoop) runTurn(ctx context.Context, ts *turnState) (turnResult, error) {
|
|
turnCtx, turnCancel := context.WithCancel(ctx)
|
|
defer turnCancel()
|
|
ts.setTurnCancel(turnCancel)
|
|
|
|
// Inject turnState and AgentLoop into context so tools (e.g. spawn) can retrieve them.
|
|
turnCtx = withTurnState(turnCtx, ts)
|
|
turnCtx = WithAgentLoop(turnCtx, al)
|
|
|
|
al.registerActiveTurn(ts)
|
|
defer al.clearActiveTurn(ts)
|
|
|
|
turnStatus := TurnEndStatusCompleted
|
|
defer func() {
|
|
al.emitEvent(
|
|
EventKindTurnEnd,
|
|
ts.eventMeta("runTurn", "turn.end"),
|
|
TurnEndPayload{
|
|
Status: turnStatus,
|
|
Iterations: ts.currentIteration(),
|
|
Duration: time.Since(ts.startedAt),
|
|
FinalContentLen: ts.finalContentLen(),
|
|
},
|
|
)
|
|
}()
|
|
|
|
al.emitEvent(
|
|
EventKindTurnStart,
|
|
ts.eventMeta("runTurn", "turn.start"),
|
|
TurnStartPayload{
|
|
Channel: ts.channel,
|
|
ChatID: ts.chatID,
|
|
UserMessage: ts.userMessage,
|
|
MediaCount: len(ts.media),
|
|
},
|
|
)
|
|
|
|
var history []providers.Message
|
|
var summary string
|
|
if !ts.opts.NoHistory {
|
|
history = ts.agent.Sessions.GetHistory(ts.sessionKey)
|
|
summary = ts.agent.Sessions.GetSummary(ts.sessionKey)
|
|
}
|
|
ts.captureRestorePoint(history, summary)
|
|
|
|
messages := ts.agent.ContextBuilder.BuildMessages(
|
|
history,
|
|
summary,
|
|
ts.userMessage,
|
|
ts.media,
|
|
ts.channel,
|
|
ts.chatID,
|
|
ts.opts.SenderID,
|
|
ts.opts.SenderDisplayName,
|
|
activeSkillNames(ts.agent, ts.opts)...,
|
|
)
|
|
|
|
cfg := al.GetConfig()
|
|
maxMediaSize := cfg.Agents.Defaults.GetMaxMediaSize()
|
|
messages = resolveMediaRefs(messages, al.mediaStore, maxMediaSize)
|
|
|
|
if !ts.opts.NoHistory {
|
|
toolDefs := ts.agent.Tools.ToProviderDefs()
|
|
if isOverContextBudget(ts.agent.ContextWindow, messages, toolDefs, ts.agent.MaxTokens) {
|
|
logger.WarnCF("agent", "Proactive compression: context budget exceeded before LLM call",
|
|
map[string]any{"session_key": ts.sessionKey})
|
|
if compression, ok := al.forceCompression(ts.agent, ts.sessionKey); ok {
|
|
al.emitEvent(
|
|
EventKindContextCompress,
|
|
ts.eventMeta("runTurn", "turn.context.compress"),
|
|
ContextCompressPayload{
|
|
Reason: ContextCompressReasonProactive,
|
|
DroppedMessages: compression.DroppedMessages,
|
|
RemainingMessages: compression.RemainingMessages,
|
|
},
|
|
)
|
|
ts.refreshRestorePointFromSession(ts.agent)
|
|
}
|
|
newHistory := ts.agent.Sessions.GetHistory(ts.sessionKey)
|
|
newSummary := ts.agent.Sessions.GetSummary(ts.sessionKey)
|
|
messages = ts.agent.ContextBuilder.BuildMessages(
|
|
newHistory, newSummary, ts.userMessage,
|
|
ts.media, ts.channel, ts.chatID,
|
|
ts.opts.SenderID, ts.opts.SenderDisplayName,
|
|
activeSkillNames(ts.agent, ts.opts)...,
|
|
)
|
|
messages = resolveMediaRefs(messages, al.mediaStore, maxMediaSize)
|
|
}
|
|
}
|
|
|
|
// Save user message to session (from Incoming)
|
|
if !ts.opts.NoHistory && (strings.TrimSpace(ts.userMessage) != "" || len(ts.media) > 0) {
|
|
rootMsg := providers.Message{
|
|
Role: "user",
|
|
Content: ts.userMessage,
|
|
Media: append([]string(nil), ts.media...),
|
|
}
|
|
if len(rootMsg.Media) > 0 {
|
|
ts.agent.Sessions.AddFullMessage(ts.sessionKey, rootMsg)
|
|
} else {
|
|
ts.agent.Sessions.AddMessage(ts.sessionKey, rootMsg.Role, rootMsg.Content)
|
|
}
|
|
ts.recordPersistedMessage(rootMsg)
|
|
}
|
|
|
|
activeCandidates, activeModel, usedLight := al.selectCandidates(ts.agent, ts.userMessage, messages)
|
|
activeProvider := ts.agent.Provider
|
|
if usedLight && ts.agent.LightProvider != nil {
|
|
activeProvider = ts.agent.LightProvider
|
|
}
|
|
pendingMessages := append([]providers.Message(nil), ts.opts.InitialSteeringMessages...)
|
|
var finalContent string
|
|
|
|
turnLoop:
|
|
for ts.currentIteration() < ts.agent.MaxIterations || len(pendingMessages) > 0 || func() bool {
|
|
graceful, _ := ts.gracefulInterruptRequested()
|
|
return graceful
|
|
}() {
|
|
if ts.hardAbortRequested() {
|
|
turnStatus = TurnEndStatusAborted
|
|
return al.abortTurn(ts)
|
|
}
|
|
|
|
iteration := ts.currentIteration() + 1
|
|
ts.setIteration(iteration)
|
|
ts.setPhase(TurnPhaseRunning)
|
|
|
|
if iteration > 1 {
|
|
if steerMsgs := al.dequeueSteeringMessagesForScope(ts.sessionKey); len(steerMsgs) > 0 {
|
|
pendingMessages = append(pendingMessages, steerMsgs...)
|
|
}
|
|
} else if !ts.opts.SkipInitialSteeringPoll {
|
|
if steerMsgs := al.dequeueSteeringMessagesForScopeWithFallback(ts.sessionKey); len(steerMsgs) > 0 {
|
|
pendingMessages = append(pendingMessages, steerMsgs...)
|
|
}
|
|
}
|
|
|
|
// Check if parent turn has ended (SubTurn support from HEAD)
|
|
if ts.parentTurnState != nil && ts.IsParentEnded() {
|
|
if !ts.critical {
|
|
logger.InfoCF("agent", "Parent turn ended, non-critical SubTurn exiting gracefully", map[string]any{
|
|
"agent_id": ts.agentID,
|
|
"iteration": iteration,
|
|
"turn_id": ts.turnID,
|
|
})
|
|
break
|
|
}
|
|
logger.InfoCF("agent", "Parent turn ended, critical SubTurn continues running", map[string]any{
|
|
"agent_id": ts.agentID,
|
|
"iteration": iteration,
|
|
"turn_id": ts.turnID,
|
|
})
|
|
}
|
|
|
|
// Poll for pending SubTurn results (from HEAD)
|
|
if ts.pendingResults != nil {
|
|
select {
|
|
case result, ok := <-ts.pendingResults:
|
|
if ok && result != nil && result.ForLLM != "" {
|
|
content := al.cfg.FilterSensitiveData(result.ForLLM)
|
|
msg := providers.Message{Role: "user", Content: fmt.Sprintf("[SubTurn Result] %s", content)}
|
|
pendingMessages = append(pendingMessages, msg)
|
|
}
|
|
default:
|
|
// No results available
|
|
}
|
|
}
|
|
|
|
// Inject pending steering messages
|
|
if len(pendingMessages) > 0 {
|
|
resolvedPending := resolveMediaRefs(pendingMessages, al.mediaStore, maxMediaSize)
|
|
totalContentLen := 0
|
|
for i, pm := range pendingMessages {
|
|
messages = append(messages, resolvedPending[i])
|
|
totalContentLen += len(pm.Content)
|
|
if !ts.opts.NoHistory {
|
|
ts.agent.Sessions.AddFullMessage(ts.sessionKey, pm)
|
|
ts.recordPersistedMessage(pm)
|
|
}
|
|
logger.InfoCF("agent", "Injected steering message into context",
|
|
map[string]any{
|
|
"agent_id": ts.agent.ID,
|
|
"iteration": iteration,
|
|
"content_len": len(pm.Content),
|
|
"media_count": len(pm.Media),
|
|
})
|
|
}
|
|
al.emitEvent(
|
|
EventKindSteeringInjected,
|
|
ts.eventMeta("runTurn", "turn.steering.injected"),
|
|
SteeringInjectedPayload{
|
|
Count: len(pendingMessages),
|
|
TotalContentLen: totalContentLen,
|
|
},
|
|
)
|
|
pendingMessages = nil
|
|
}
|
|
|
|
logger.DebugCF("agent", "LLM iteration",
|
|
map[string]any{
|
|
"agent_id": ts.agent.ID,
|
|
"iteration": iteration,
|
|
"max": ts.agent.MaxIterations,
|
|
})
|
|
|
|
gracefulTerminal, _ := ts.gracefulInterruptRequested()
|
|
providerToolDefs := ts.agent.Tools.ToProviderDefs()
|
|
|
|
// Native web search support (from HEAD)
|
|
_, hasWebSearch := ts.agent.Tools.Get("web_search")
|
|
useNativeSearch := al.cfg.Tools.Web.PreferNative &&
|
|
hasWebSearch &&
|
|
func() bool {
|
|
// Check if provider supports native search
|
|
if ns, ok := ts.agent.Provider.(interface{ SupportsNativeSearch() bool }); ok {
|
|
return ns.SupportsNativeSearch()
|
|
}
|
|
return false
|
|
}()
|
|
|
|
if useNativeSearch {
|
|
// Filter out client-side web_search tool
|
|
filtered := make([]providers.ToolDefinition, 0, len(providerToolDefs))
|
|
for _, td := range providerToolDefs {
|
|
if td.Function.Name != "web_search" {
|
|
filtered = append(filtered, td)
|
|
}
|
|
}
|
|
providerToolDefs = filtered
|
|
}
|
|
|
|
callMessages := messages
|
|
if gracefulTerminal {
|
|
callMessages = append(append([]providers.Message(nil), messages...), ts.interruptHintMessage())
|
|
providerToolDefs = nil
|
|
ts.markGracefulTerminalUsed()
|
|
}
|
|
|
|
llmOpts := map[string]any{
|
|
"max_tokens": ts.agent.MaxTokens,
|
|
"temperature": ts.agent.Temperature,
|
|
"prompt_cache_key": ts.agent.ID,
|
|
}
|
|
if useNativeSearch {
|
|
llmOpts["native_search"] = true
|
|
}
|
|
if ts.agent.ThinkingLevel != ThinkingOff {
|
|
if tc, ok := ts.agent.Provider.(providers.ThinkingCapable); ok && tc.SupportsThinking() {
|
|
llmOpts["thinking_level"] = string(ts.agent.ThinkingLevel)
|
|
} else {
|
|
logger.WarnCF("agent", "thinking_level is set but current provider does not support it, ignoring",
|
|
map[string]any{"agent_id": ts.agent.ID, "thinking_level": string(ts.agent.ThinkingLevel)})
|
|
}
|
|
}
|
|
|
|
llmModel := activeModel
|
|
if al.hooks != nil {
|
|
llmReq, decision := al.hooks.BeforeLLM(turnCtx, &LLMHookRequest{
|
|
Meta: ts.eventMeta("runTurn", "turn.llm.request"),
|
|
Model: llmModel,
|
|
Messages: callMessages,
|
|
Tools: providerToolDefs,
|
|
Options: llmOpts,
|
|
Channel: ts.channel,
|
|
ChatID: ts.chatID,
|
|
GracefulTerminal: gracefulTerminal,
|
|
})
|
|
switch decision.normalizedAction() {
|
|
case HookActionContinue, HookActionModify:
|
|
if llmReq != nil {
|
|
llmModel = llmReq.Model
|
|
callMessages = llmReq.Messages
|
|
providerToolDefs = llmReq.Tools
|
|
llmOpts = llmReq.Options
|
|
}
|
|
case HookActionAbortTurn:
|
|
turnStatus = TurnEndStatusError
|
|
return turnResult{}, al.hookAbortError(ts, "before_llm", decision)
|
|
case HookActionHardAbort:
|
|
_ = ts.requestHardAbort()
|
|
turnStatus = TurnEndStatusAborted
|
|
return al.abortTurn(ts)
|
|
}
|
|
}
|
|
|
|
al.emitEvent(
|
|
EventKindLLMRequest,
|
|
ts.eventMeta("runTurn", "turn.llm.request"),
|
|
LLMRequestPayload{
|
|
Model: llmModel,
|
|
MessagesCount: len(callMessages),
|
|
ToolsCount: len(providerToolDefs),
|
|
MaxTokens: ts.agent.MaxTokens,
|
|
Temperature: ts.agent.Temperature,
|
|
},
|
|
)
|
|
|
|
logger.DebugCF("agent", "LLM request",
|
|
map[string]any{
|
|
"agent_id": ts.agent.ID,
|
|
"iteration": iteration,
|
|
"model": llmModel,
|
|
"messages_count": len(callMessages),
|
|
"tools_count": len(providerToolDefs),
|
|
"max_tokens": ts.agent.MaxTokens,
|
|
"temperature": ts.agent.Temperature,
|
|
"system_prompt_len": len(callMessages[0].Content),
|
|
})
|
|
logger.DebugCF("agent", "Full LLM request",
|
|
map[string]any{
|
|
"iteration": iteration,
|
|
"messages_json": formatMessagesForLog(callMessages),
|
|
"tools_json": formatToolsForLog(providerToolDefs),
|
|
})
|
|
|
|
callLLM := func(messagesForCall []providers.Message, toolDefsForCall []providers.ToolDefinition) (*providers.LLMResponse, error) {
|
|
providerCtx, providerCancel := context.WithCancel(turnCtx)
|
|
ts.setProviderCancel(providerCancel)
|
|
defer func() {
|
|
providerCancel()
|
|
ts.clearProviderCancel(providerCancel)
|
|
}()
|
|
|
|
al.activeRequests.Add(1)
|
|
defer al.activeRequests.Done()
|
|
|
|
if len(activeCandidates) > 1 && al.fallback != nil {
|
|
fbResult, fbErr := al.fallback.Execute(
|
|
providerCtx,
|
|
activeCandidates,
|
|
func(ctx context.Context, provider, model string) (*providers.LLMResponse, error) {
|
|
return activeProvider.Chat(ctx, messagesForCall, toolDefsForCall, model, llmOpts)
|
|
},
|
|
)
|
|
if fbErr != nil {
|
|
return nil, fbErr
|
|
}
|
|
if fbResult.Provider != "" && len(fbResult.Attempts) > 0 {
|
|
logger.InfoCF(
|
|
"agent",
|
|
fmt.Sprintf("Fallback: succeeded with %s/%s after %d attempts",
|
|
fbResult.Provider, fbResult.Model, len(fbResult.Attempts)+1),
|
|
map[string]any{"agent_id": ts.agent.ID, "iteration": iteration},
|
|
)
|
|
}
|
|
return fbResult.Response, nil
|
|
}
|
|
return activeProvider.Chat(providerCtx, messagesForCall, toolDefsForCall, llmModel, llmOpts)
|
|
}
|
|
|
|
var response *providers.LLMResponse
|
|
var err error
|
|
maxRetries := 2
|
|
for retry := 0; retry <= maxRetries; retry++ {
|
|
response, err = callLLM(callMessages, providerToolDefs)
|
|
if err == nil {
|
|
break
|
|
}
|
|
if ts.hardAbortRequested() && errors.Is(err, context.Canceled) {
|
|
turnStatus = TurnEndStatusAborted
|
|
return al.abortTurn(ts)
|
|
}
|
|
|
|
errMsg := strings.ToLower(err.Error())
|
|
isTimeoutError := errors.Is(err, context.DeadlineExceeded) ||
|
|
strings.Contains(errMsg, "deadline exceeded") ||
|
|
strings.Contains(errMsg, "client.timeout") ||
|
|
strings.Contains(errMsg, "timed out") ||
|
|
strings.Contains(errMsg, "timeout exceeded")
|
|
|
|
isContextError := !isTimeoutError && (strings.Contains(errMsg, "context_length_exceeded") ||
|
|
strings.Contains(errMsg, "context window") ||
|
|
strings.Contains(errMsg, "context_window") ||
|
|
strings.Contains(errMsg, "maximum context length") ||
|
|
strings.Contains(errMsg, "token limit") ||
|
|
strings.Contains(errMsg, "too many tokens") ||
|
|
strings.Contains(errMsg, "max_tokens") ||
|
|
strings.Contains(errMsg, "invalidparameter") ||
|
|
strings.Contains(errMsg, "prompt is too long") ||
|
|
strings.Contains(errMsg, "request too large"))
|
|
|
|
if isTimeoutError && retry < maxRetries {
|
|
backoff := time.Duration(retry+1) * 5 * time.Second
|
|
al.emitEvent(
|
|
EventKindLLMRetry,
|
|
ts.eventMeta("runTurn", "turn.llm.retry"),
|
|
LLMRetryPayload{
|
|
Attempt: retry + 1,
|
|
MaxRetries: maxRetries,
|
|
Reason: "timeout",
|
|
Error: err.Error(),
|
|
Backoff: backoff,
|
|
},
|
|
)
|
|
logger.WarnCF("agent", "Timeout error, retrying after backoff", map[string]any{
|
|
"error": err.Error(),
|
|
"retry": retry,
|
|
"backoff": backoff.String(),
|
|
})
|
|
if sleepErr := sleepWithContext(turnCtx, backoff); sleepErr != nil {
|
|
if ts.hardAbortRequested() {
|
|
turnStatus = TurnEndStatusAborted
|
|
return al.abortTurn(ts)
|
|
}
|
|
err = sleepErr
|
|
break
|
|
}
|
|
continue
|
|
}
|
|
|
|
if isContextError && retry < maxRetries && !ts.opts.NoHistory {
|
|
al.emitEvent(
|
|
EventKindLLMRetry,
|
|
ts.eventMeta("runTurn", "turn.llm.retry"),
|
|
LLMRetryPayload{
|
|
Attempt: retry + 1,
|
|
MaxRetries: maxRetries,
|
|
Reason: "context_limit",
|
|
Error: err.Error(),
|
|
},
|
|
)
|
|
logger.WarnCF(
|
|
"agent",
|
|
"Context window error detected, attempting compression",
|
|
map[string]any{
|
|
"error": err.Error(),
|
|
"retry": retry,
|
|
},
|
|
)
|
|
|
|
if retry == 0 && !constants.IsInternalChannel(ts.channel) {
|
|
al.bus.PublishOutbound(ctx, bus.OutboundMessage{
|
|
Channel: ts.channel,
|
|
ChatID: ts.chatID,
|
|
Content: "Context window exceeded. Compressing history and retrying...",
|
|
})
|
|
}
|
|
|
|
if compression, ok := al.forceCompression(ts.agent, ts.sessionKey); ok {
|
|
al.emitEvent(
|
|
EventKindContextCompress,
|
|
ts.eventMeta("runTurn", "turn.context.compress"),
|
|
ContextCompressPayload{
|
|
Reason: ContextCompressReasonRetry,
|
|
DroppedMessages: compression.DroppedMessages,
|
|
RemainingMessages: compression.RemainingMessages,
|
|
},
|
|
)
|
|
ts.refreshRestorePointFromSession(ts.agent)
|
|
}
|
|
|
|
newHistory := ts.agent.Sessions.GetHistory(ts.sessionKey)
|
|
newSummary := ts.agent.Sessions.GetSummary(ts.sessionKey)
|
|
messages = ts.agent.ContextBuilder.BuildMessages(
|
|
newHistory, newSummary, "",
|
|
nil, ts.channel, ts.chatID, ts.opts.SenderID, ts.opts.SenderDisplayName,
|
|
activeSkillNames(ts.agent, ts.opts)...,
|
|
)
|
|
callMessages = messages
|
|
if gracefulTerminal {
|
|
callMessages = append(append([]providers.Message(nil), messages...), ts.interruptHintMessage())
|
|
}
|
|
continue
|
|
}
|
|
break
|
|
}
|
|
|
|
if err != nil {
|
|
turnStatus = TurnEndStatusError
|
|
al.emitEvent(
|
|
EventKindError,
|
|
ts.eventMeta("runTurn", "turn.error"),
|
|
ErrorPayload{
|
|
Stage: "llm",
|
|
Message: err.Error(),
|
|
},
|
|
)
|
|
logger.ErrorCF("agent", "LLM call failed",
|
|
map[string]any{
|
|
"agent_id": ts.agent.ID,
|
|
"iteration": iteration,
|
|
"model": llmModel,
|
|
"error": err.Error(),
|
|
})
|
|
return turnResult{}, fmt.Errorf("LLM call failed after retries: %w", err)
|
|
}
|
|
|
|
if al.hooks != nil {
|
|
llmResp, decision := al.hooks.AfterLLM(turnCtx, &LLMHookResponse{
|
|
Meta: ts.eventMeta("runTurn", "turn.llm.response"),
|
|
Model: llmModel,
|
|
Response: response,
|
|
Channel: ts.channel,
|
|
ChatID: ts.chatID,
|
|
})
|
|
switch decision.normalizedAction() {
|
|
case HookActionContinue, HookActionModify:
|
|
if llmResp != nil && llmResp.Response != nil {
|
|
response = llmResp.Response
|
|
}
|
|
case HookActionAbortTurn:
|
|
turnStatus = TurnEndStatusError
|
|
return turnResult{}, al.hookAbortError(ts, "after_llm", decision)
|
|
case HookActionHardAbort:
|
|
_ = ts.requestHardAbort()
|
|
turnStatus = TurnEndStatusAborted
|
|
return al.abortTurn(ts)
|
|
}
|
|
}
|
|
|
|
// Save finishReason to turnState for SubTurn truncation detection
|
|
if innerTS := turnStateFromContext(ctx); innerTS != nil {
|
|
innerTS.SetLastFinishReason(response.FinishReason)
|
|
// Save usage for token budget tracking
|
|
if response.Usage != nil {
|
|
innerTS.SetLastUsage(response.Usage)
|
|
}
|
|
}
|
|
|
|
reasoningContent := response.Reasoning
|
|
if reasoningContent == "" {
|
|
reasoningContent = response.ReasoningContent
|
|
}
|
|
go al.handleReasoning(
|
|
turnCtx,
|
|
reasoningContent,
|
|
ts.channel,
|
|
al.targetReasoningChannelID(ts.channel),
|
|
)
|
|
al.emitEvent(
|
|
EventKindLLMResponse,
|
|
ts.eventMeta("runTurn", "turn.llm.response"),
|
|
LLMResponsePayload{
|
|
ContentLen: len(response.Content),
|
|
ToolCalls: len(response.ToolCalls),
|
|
HasReasoning: response.Reasoning != "" || response.ReasoningContent != "",
|
|
},
|
|
)
|
|
|
|
llmResponseFields := map[string]any{
|
|
"agent_id": ts.agent.ID,
|
|
"iteration": iteration,
|
|
"content_chars": len(response.Content),
|
|
"tool_calls": len(response.ToolCalls),
|
|
"reasoning": response.Reasoning,
|
|
"target_channel": al.targetReasoningChannelID(ts.channel),
|
|
"channel": ts.channel,
|
|
}
|
|
if response.Usage != nil {
|
|
llmResponseFields["prompt_tokens"] = response.Usage.PromptTokens
|
|
llmResponseFields["completion_tokens"] = response.Usage.CompletionTokens
|
|
llmResponseFields["total_tokens"] = response.Usage.TotalTokens
|
|
}
|
|
logger.DebugCF("agent", "LLM response", llmResponseFields)
|
|
|
|
if len(response.ToolCalls) == 0 || gracefulTerminal {
|
|
responseContent := response.Content
|
|
if responseContent == "" && response.ReasoningContent != "" {
|
|
responseContent = response.ReasoningContent
|
|
}
|
|
if steerMsgs := al.dequeueSteeringMessagesForScope(ts.sessionKey); len(steerMsgs) > 0 {
|
|
logger.InfoCF("agent", "Steering arrived after direct LLM response; continuing turn",
|
|
map[string]any{
|
|
"agent_id": ts.agent.ID,
|
|
"iteration": iteration,
|
|
"steering_count": len(steerMsgs),
|
|
})
|
|
pendingMessages = append(pendingMessages, steerMsgs...)
|
|
continue
|
|
}
|
|
finalContent = responseContent
|
|
logger.InfoCF("agent", "LLM response without tool calls (direct answer)",
|
|
map[string]any{
|
|
"agent_id": ts.agent.ID,
|
|
"iteration": iteration,
|
|
"content_chars": len(finalContent),
|
|
})
|
|
break
|
|
}
|
|
|
|
normalizedToolCalls := make([]providers.ToolCall, 0, len(response.ToolCalls))
|
|
for _, tc := range response.ToolCalls {
|
|
normalizedToolCalls = append(normalizedToolCalls, providers.NormalizeToolCall(tc))
|
|
}
|
|
|
|
toolNames := make([]string, 0, len(normalizedToolCalls))
|
|
for _, tc := range normalizedToolCalls {
|
|
toolNames = append(toolNames, tc.Name)
|
|
}
|
|
logger.InfoCF("agent", "LLM requested tool calls",
|
|
map[string]any{
|
|
"agent_id": ts.agent.ID,
|
|
"tools": toolNames,
|
|
"count": len(normalizedToolCalls),
|
|
"iteration": iteration,
|
|
})
|
|
|
|
allResponsesHandled := len(normalizedToolCalls) > 0
|
|
assistantMsg := providers.Message{
|
|
Role: "assistant",
|
|
Content: response.Content,
|
|
ReasoningContent: response.ReasoningContent,
|
|
}
|
|
for _, tc := range normalizedToolCalls {
|
|
argumentsJSON, _ := json.Marshal(tc.Arguments)
|
|
extraContent := tc.ExtraContent
|
|
thoughtSignature := ""
|
|
if tc.Function != nil {
|
|
thoughtSignature = tc.Function.ThoughtSignature
|
|
}
|
|
assistantMsg.ToolCalls = append(assistantMsg.ToolCalls, providers.ToolCall{
|
|
ID: tc.ID,
|
|
Type: "function",
|
|
Name: tc.Name,
|
|
Function: &providers.FunctionCall{
|
|
Name: tc.Name,
|
|
Arguments: string(argumentsJSON),
|
|
ThoughtSignature: thoughtSignature,
|
|
},
|
|
ExtraContent: extraContent,
|
|
ThoughtSignature: thoughtSignature,
|
|
})
|
|
}
|
|
messages = append(messages, assistantMsg)
|
|
if !ts.opts.NoHistory {
|
|
ts.agent.Sessions.AddFullMessage(ts.sessionKey, assistantMsg)
|
|
ts.recordPersistedMessage(assistantMsg)
|
|
}
|
|
|
|
ts.setPhase(TurnPhaseTools)
|
|
for i, tc := range normalizedToolCalls {
|
|
if ts.hardAbortRequested() {
|
|
turnStatus = TurnEndStatusAborted
|
|
return al.abortTurn(ts)
|
|
}
|
|
|
|
toolName := tc.Name
|
|
toolArgs := cloneStringAnyMap(tc.Arguments)
|
|
|
|
if al.hooks != nil {
|
|
toolReq, decision := al.hooks.BeforeTool(turnCtx, &ToolCallHookRequest{
|
|
Meta: ts.eventMeta("runTurn", "turn.tool.before"),
|
|
Tool: toolName,
|
|
Arguments: toolArgs,
|
|
Channel: ts.channel,
|
|
ChatID: ts.chatID,
|
|
})
|
|
switch decision.normalizedAction() {
|
|
case HookActionContinue, HookActionModify:
|
|
if toolReq != nil {
|
|
toolName = toolReq.Tool
|
|
toolArgs = toolReq.Arguments
|
|
}
|
|
case HookActionDenyTool:
|
|
allResponsesHandled = false
|
|
denyContent := hookDeniedToolContent("Tool execution denied by hook", decision.Reason)
|
|
al.emitEvent(
|
|
EventKindToolExecSkipped,
|
|
ts.eventMeta("runTurn", "turn.tool.skipped"),
|
|
ToolExecSkippedPayload{
|
|
Tool: toolName,
|
|
Reason: denyContent,
|
|
},
|
|
)
|
|
deniedMsg := providers.Message{
|
|
Role: "tool",
|
|
Content: denyContent,
|
|
ToolCallID: tc.ID,
|
|
}
|
|
messages = append(messages, deniedMsg)
|
|
if !ts.opts.NoHistory {
|
|
ts.agent.Sessions.AddFullMessage(ts.sessionKey, deniedMsg)
|
|
ts.recordPersistedMessage(deniedMsg)
|
|
}
|
|
continue
|
|
case HookActionAbortTurn:
|
|
turnStatus = TurnEndStatusError
|
|
return turnResult{}, al.hookAbortError(ts, "before_tool", decision)
|
|
case HookActionHardAbort:
|
|
_ = ts.requestHardAbort()
|
|
turnStatus = TurnEndStatusAborted
|
|
return al.abortTurn(ts)
|
|
}
|
|
}
|
|
|
|
if al.hooks != nil {
|
|
approval := al.hooks.ApproveTool(turnCtx, &ToolApprovalRequest{
|
|
Meta: ts.eventMeta("runTurn", "turn.tool.approve"),
|
|
Tool: toolName,
|
|
Arguments: toolArgs,
|
|
Channel: ts.channel,
|
|
ChatID: ts.chatID,
|
|
})
|
|
if !approval.Approved {
|
|
allResponsesHandled = false
|
|
denyContent := hookDeniedToolContent("Tool execution denied by approval hook", approval.Reason)
|
|
al.emitEvent(
|
|
EventKindToolExecSkipped,
|
|
ts.eventMeta("runTurn", "turn.tool.skipped"),
|
|
ToolExecSkippedPayload{
|
|
Tool: toolName,
|
|
Reason: denyContent,
|
|
},
|
|
)
|
|
deniedMsg := providers.Message{
|
|
Role: "tool",
|
|
Content: denyContent,
|
|
ToolCallID: tc.ID,
|
|
}
|
|
messages = append(messages, deniedMsg)
|
|
if !ts.opts.NoHistory {
|
|
ts.agent.Sessions.AddFullMessage(ts.sessionKey, deniedMsg)
|
|
ts.recordPersistedMessage(deniedMsg)
|
|
}
|
|
continue
|
|
}
|
|
}
|
|
|
|
argsJSON, _ := json.Marshal(toolArgs)
|
|
argsPreview := utils.Truncate(string(argsJSON), 200)
|
|
logger.InfoCF("agent", fmt.Sprintf("Tool call: %s(%s)", toolName, argsPreview),
|
|
map[string]any{
|
|
"agent_id": ts.agent.ID,
|
|
"tool": toolName,
|
|
"iteration": iteration,
|
|
})
|
|
al.emitEvent(
|
|
EventKindToolExecStart,
|
|
ts.eventMeta("runTurn", "turn.tool.start"),
|
|
ToolExecStartPayload{
|
|
Tool: toolName,
|
|
Arguments: cloneEventArguments(toolArgs),
|
|
},
|
|
)
|
|
|
|
// Send tool feedback to chat channel if enabled (from HEAD)
|
|
if al.cfg.Agents.Defaults.IsToolFeedbackEnabled() &&
|
|
ts.channel != "" &&
|
|
!ts.opts.SuppressToolFeedback {
|
|
feedbackPreview := utils.Truncate(
|
|
string(argsJSON),
|
|
al.cfg.Agents.Defaults.GetToolFeedbackMaxArgsLength(),
|
|
)
|
|
feedbackMsg := fmt.Sprintf("\U0001f527 `%s`\n```\n%s\n```", tc.Name, feedbackPreview)
|
|
fbCtx, fbCancel := context.WithTimeout(turnCtx, 3*time.Second)
|
|
_ = al.bus.PublishOutbound(fbCtx, bus.OutboundMessage{
|
|
Channel: ts.channel,
|
|
ChatID: ts.chatID,
|
|
Content: feedbackMsg,
|
|
})
|
|
fbCancel()
|
|
}
|
|
|
|
toolCallID := tc.ID
|
|
toolIteration := iteration
|
|
asyncToolName := toolName
|
|
asyncCallback := func(_ context.Context, result *tools.ToolResult) {
|
|
// Send ForUser content directly to the user (immediate feedback),
|
|
// mirroring the synchronous tool execution path.
|
|
if !result.Silent && result.ForUser != "" {
|
|
outCtx, outCancel := context.WithTimeout(context.Background(), 5*time.Second)
|
|
defer outCancel()
|
|
_ = al.bus.PublishOutbound(outCtx, bus.OutboundMessage{
|
|
Channel: ts.channel,
|
|
ChatID: ts.chatID,
|
|
Content: result.ForUser,
|
|
})
|
|
}
|
|
|
|
// Determine content for the agent loop (ForLLM or error).
|
|
content := result.ContentForLLM()
|
|
if content == "" {
|
|
return
|
|
}
|
|
|
|
// Filter sensitive data before publishing
|
|
content = al.cfg.FilterSensitiveData(content)
|
|
|
|
logger.InfoCF("agent", "Async tool completed, publishing result",
|
|
map[string]any{
|
|
"tool": asyncToolName,
|
|
"content_len": len(content),
|
|
"channel": ts.channel,
|
|
})
|
|
al.emitEvent(
|
|
EventKindFollowUpQueued,
|
|
ts.scope.meta(toolIteration, "runTurn", "turn.follow_up.queued"),
|
|
FollowUpQueuedPayload{
|
|
SourceTool: asyncToolName,
|
|
Channel: ts.channel,
|
|
ChatID: ts.chatID,
|
|
ContentLen: len(content),
|
|
},
|
|
)
|
|
|
|
pubCtx, pubCancel := context.WithTimeout(context.Background(), 5*time.Second)
|
|
defer pubCancel()
|
|
_ = al.bus.PublishInbound(pubCtx, bus.InboundMessage{
|
|
Channel: "system",
|
|
SenderID: fmt.Sprintf("async:%s", asyncToolName),
|
|
ChatID: fmt.Sprintf("%s:%s", ts.channel, ts.chatID),
|
|
Content: content,
|
|
})
|
|
}
|
|
|
|
toolStart := time.Now()
|
|
toolResult := ts.agent.Tools.ExecuteWithContext(
|
|
turnCtx,
|
|
toolName,
|
|
toolArgs,
|
|
ts.channel,
|
|
ts.chatID,
|
|
asyncCallback,
|
|
)
|
|
toolDuration := time.Since(toolStart)
|
|
|
|
if ts.hardAbortRequested() {
|
|
turnStatus = TurnEndStatusAborted
|
|
return al.abortTurn(ts)
|
|
}
|
|
|
|
if al.hooks != nil {
|
|
toolResp, decision := al.hooks.AfterTool(turnCtx, &ToolResultHookResponse{
|
|
Meta: ts.eventMeta("runTurn", "turn.tool.after"),
|
|
Tool: toolName,
|
|
Arguments: toolArgs,
|
|
Result: toolResult,
|
|
Duration: toolDuration,
|
|
Channel: ts.channel,
|
|
ChatID: ts.chatID,
|
|
})
|
|
switch decision.normalizedAction() {
|
|
case HookActionContinue, HookActionModify:
|
|
if toolResp != nil {
|
|
if toolResp.Tool != "" {
|
|
toolName = toolResp.Tool
|
|
}
|
|
if toolResp.Result != nil {
|
|
toolResult = toolResp.Result
|
|
}
|
|
}
|
|
case HookActionAbortTurn:
|
|
turnStatus = TurnEndStatusError
|
|
return turnResult{}, al.hookAbortError(ts, "after_tool", decision)
|
|
case HookActionHardAbort:
|
|
_ = ts.requestHardAbort()
|
|
turnStatus = TurnEndStatusAborted
|
|
return al.abortTurn(ts)
|
|
}
|
|
}
|
|
|
|
if toolResult == nil {
|
|
toolResult = tools.ErrorResult("hook returned nil tool result")
|
|
}
|
|
if len(toolResult.Media) > 0 && toolResult.ResponseHandled {
|
|
parts := make([]bus.MediaPart, 0, len(toolResult.Media))
|
|
for _, ref := range toolResult.Media {
|
|
part := bus.MediaPart{Ref: ref}
|
|
if al.mediaStore != nil {
|
|
if _, meta, err := al.mediaStore.ResolveWithMeta(ref); err == nil {
|
|
part.Filename = meta.Filename
|
|
part.ContentType = meta.ContentType
|
|
part.Type = inferMediaType(meta.Filename, meta.ContentType)
|
|
}
|
|
}
|
|
parts = append(parts, part)
|
|
}
|
|
outboundMedia := bus.OutboundMediaMessage{
|
|
Channel: ts.channel,
|
|
ChatID: ts.chatID,
|
|
Parts: parts,
|
|
}
|
|
if al.channelManager != nil && ts.channel != "" && !constants.IsInternalChannel(ts.channel) {
|
|
if err := al.channelManager.SendMedia(ctx, outboundMedia); err != nil {
|
|
logger.WarnCF("agent", "Failed to deliver handled tool media",
|
|
map[string]any{
|
|
"agent_id": ts.agent.ID,
|
|
"tool": toolName,
|
|
"channel": ts.channel,
|
|
"chat_id": ts.chatID,
|
|
"error": err.Error(),
|
|
})
|
|
toolResult = tools.ErrorResult(fmt.Sprintf("failed to deliver attachment: %v", err)).WithError(err)
|
|
}
|
|
} else if al.bus != nil {
|
|
al.bus.PublishOutboundMedia(ctx, outboundMedia)
|
|
// Queuing media is only best-effort; it has not been delivered yet.
|
|
toolResult.ResponseHandled = false
|
|
}
|
|
}
|
|
|
|
if len(toolResult.Media) > 0 && !toolResult.ResponseHandled {
|
|
toolResult.ArtifactTags = buildArtifactTags(al.mediaStore, toolResult.Media)
|
|
}
|
|
|
|
if !toolResult.ResponseHandled {
|
|
allResponsesHandled = false
|
|
}
|
|
|
|
if !toolResult.Silent && toolResult.ForUser != "" && ts.opts.SendResponse {
|
|
al.bus.PublishOutbound(ctx, bus.OutboundMessage{
|
|
Channel: ts.channel,
|
|
ChatID: ts.chatID,
|
|
Content: toolResult.ForUser,
|
|
})
|
|
logger.DebugCF("agent", "Sent tool result to user",
|
|
map[string]any{
|
|
"tool": toolName,
|
|
"content_len": len(toolResult.ForUser),
|
|
})
|
|
}
|
|
|
|
contentForLLM := toolResult.ContentForLLM()
|
|
|
|
// Filter sensitive data (API keys, tokens, secrets) before sending to LLM
|
|
if al.cfg.Tools.IsFilterSensitiveDataEnabled() {
|
|
contentForLLM = al.cfg.FilterSensitiveData(contentForLLM)
|
|
}
|
|
|
|
toolResultMsg := providers.Message{
|
|
Role: "tool",
|
|
Content: contentForLLM,
|
|
ToolCallID: toolCallID,
|
|
}
|
|
al.emitEvent(
|
|
EventKindToolExecEnd,
|
|
ts.eventMeta("runTurn", "turn.tool.end"),
|
|
ToolExecEndPayload{
|
|
Tool: toolName,
|
|
Duration: toolDuration,
|
|
ForLLMLen: len(contentForLLM),
|
|
ForUserLen: len(toolResult.ForUser),
|
|
IsError: toolResult.IsError,
|
|
Async: toolResult.Async,
|
|
},
|
|
)
|
|
messages = append(messages, toolResultMsg)
|
|
if !ts.opts.NoHistory {
|
|
ts.agent.Sessions.AddFullMessage(ts.sessionKey, toolResultMsg)
|
|
ts.recordPersistedMessage(toolResultMsg)
|
|
}
|
|
|
|
if steerMsgs := al.dequeueSteeringMessagesForScope(ts.sessionKey); len(steerMsgs) > 0 {
|
|
pendingMessages = append(pendingMessages, steerMsgs...)
|
|
}
|
|
|
|
skipReason := ""
|
|
skipMessage := ""
|
|
if len(pendingMessages) > 0 {
|
|
skipReason = "queued user steering message"
|
|
skipMessage = "Skipped due to queued user message."
|
|
} else if gracefulPending, _ := ts.gracefulInterruptRequested(); gracefulPending {
|
|
skipReason = "graceful interrupt requested"
|
|
skipMessage = "Skipped due to graceful interrupt."
|
|
}
|
|
|
|
if skipReason != "" {
|
|
remaining := len(normalizedToolCalls) - i - 1
|
|
if remaining > 0 {
|
|
logger.InfoCF("agent", "Turn checkpoint: skipping remaining tools",
|
|
map[string]any{
|
|
"agent_id": ts.agent.ID,
|
|
"completed": i + 1,
|
|
"skipped": remaining,
|
|
"reason": skipReason,
|
|
})
|
|
for j := i + 1; j < len(normalizedToolCalls); j++ {
|
|
skippedTC := normalizedToolCalls[j]
|
|
al.emitEvent(
|
|
EventKindToolExecSkipped,
|
|
ts.eventMeta("runTurn", "turn.tool.skipped"),
|
|
ToolExecSkippedPayload{
|
|
Tool: skippedTC.Name,
|
|
Reason: skipReason,
|
|
},
|
|
)
|
|
skippedMsg := providers.Message{
|
|
Role: "tool",
|
|
Content: skipMessage,
|
|
ToolCallID: skippedTC.ID,
|
|
}
|
|
messages = append(messages, skippedMsg)
|
|
if !ts.opts.NoHistory {
|
|
ts.agent.Sessions.AddFullMessage(ts.sessionKey, skippedMsg)
|
|
ts.recordPersistedMessage(skippedMsg)
|
|
}
|
|
}
|
|
}
|
|
break
|
|
}
|
|
|
|
// Also poll for any SubTurn results that arrived during tool execution.
|
|
if ts.pendingResults != nil {
|
|
select {
|
|
case result, ok := <-ts.pendingResults:
|
|
if ok && result != nil && result.ForLLM != "" {
|
|
content := al.cfg.FilterSensitiveData(result.ForLLM)
|
|
msg := providers.Message{Role: "user", Content: fmt.Sprintf("[SubTurn Result] %s", content)}
|
|
messages = append(messages, msg)
|
|
ts.agent.Sessions.AddFullMessage(ts.sessionKey, msg)
|
|
}
|
|
default:
|
|
// No results available
|
|
}
|
|
}
|
|
}
|
|
|
|
if allResponsesHandled {
|
|
if len(pendingMessages) > 0 {
|
|
logger.InfoCF("agent", "Pending steering exists after handled tool delivery; continuing turn before finalizing",
|
|
map[string]any{
|
|
"agent_id": ts.agent.ID,
|
|
"steering_count": len(pendingMessages),
|
|
"session_key": ts.sessionKey,
|
|
})
|
|
finalContent = ""
|
|
goto turnLoop
|
|
}
|
|
|
|
if steerMsgs := al.dequeueSteeringMessagesForScope(ts.sessionKey); len(steerMsgs) > 0 {
|
|
logger.InfoCF("agent", "Steering arrived after handled tool delivery; continuing turn before finalizing",
|
|
map[string]any{
|
|
"agent_id": ts.agent.ID,
|
|
"steering_count": len(steerMsgs),
|
|
"session_key": ts.sessionKey,
|
|
})
|
|
pendingMessages = append(pendingMessages, steerMsgs...)
|
|
finalContent = ""
|
|
goto turnLoop
|
|
}
|
|
|
|
summaryMsg := providers.Message{
|
|
Role: "assistant",
|
|
Content: handledToolResponseSummary,
|
|
}
|
|
|
|
if !ts.opts.NoHistory {
|
|
ts.agent.Sessions.AddMessage(ts.sessionKey, summaryMsg.Role, summaryMsg.Content)
|
|
ts.recordPersistedMessage(summaryMsg)
|
|
if err := ts.agent.Sessions.Save(ts.sessionKey); err != nil {
|
|
turnStatus = TurnEndStatusError
|
|
al.emitEvent(
|
|
EventKindError,
|
|
ts.eventMeta("runTurn", "turn.error"),
|
|
ErrorPayload{
|
|
Stage: "session_save",
|
|
Message: err.Error(),
|
|
},
|
|
)
|
|
return turnResult{}, err
|
|
}
|
|
}
|
|
if ts.opts.EnableSummary {
|
|
al.maybeSummarize(ts.agent, ts.sessionKey, ts.scope)
|
|
}
|
|
|
|
ts.setPhase(TurnPhaseCompleted)
|
|
ts.setFinalContent("")
|
|
logger.InfoCF("agent", "Tool output satisfied delivery; ending turn without follow-up LLM",
|
|
map[string]any{
|
|
"agent_id": ts.agent.ID,
|
|
"iteration": iteration,
|
|
"tool_count": len(normalizedToolCalls),
|
|
})
|
|
return turnResult{
|
|
finalContent: "",
|
|
status: turnStatus,
|
|
followUps: append([]bus.InboundMessage(nil), ts.followUps...),
|
|
}, nil
|
|
}
|
|
|
|
ts.agent.Tools.TickTTL()
|
|
logger.DebugCF("agent", "TTL tick after tool execution", map[string]any{
|
|
"agent_id": ts.agent.ID, "iteration": iteration,
|
|
})
|
|
}
|
|
|
|
if steerMsgs := al.dequeueSteeringMessagesForScope(ts.sessionKey); len(steerMsgs) > 0 {
|
|
logger.InfoCF("agent", "Steering arrived after turn completion; continuing turn before finalizing",
|
|
map[string]any{
|
|
"agent_id": ts.agent.ID,
|
|
"steering_count": len(steerMsgs),
|
|
"session_key": ts.sessionKey,
|
|
})
|
|
pendingMessages = append(pendingMessages, steerMsgs...)
|
|
finalContent = ""
|
|
goto turnLoop
|
|
}
|
|
|
|
if ts.hardAbortRequested() {
|
|
turnStatus = TurnEndStatusAborted
|
|
return al.abortTurn(ts)
|
|
}
|
|
|
|
if finalContent == "" {
|
|
if ts.currentIteration() >= ts.agent.MaxIterations && ts.agent.MaxIterations > 0 {
|
|
finalContent = toolLimitResponse
|
|
} else {
|
|
finalContent = ts.opts.DefaultResponse
|
|
}
|
|
}
|
|
|
|
ts.setPhase(TurnPhaseFinalizing)
|
|
ts.setFinalContent(finalContent)
|
|
if !ts.opts.NoHistory {
|
|
finalMsg := providers.Message{Role: "assistant", Content: finalContent}
|
|
ts.agent.Sessions.AddMessage(ts.sessionKey, finalMsg.Role, finalMsg.Content)
|
|
ts.recordPersistedMessage(finalMsg)
|
|
if err := ts.agent.Sessions.Save(ts.sessionKey); err != nil {
|
|
turnStatus = TurnEndStatusError
|
|
al.emitEvent(
|
|
EventKindError,
|
|
ts.eventMeta("runTurn", "turn.error"),
|
|
ErrorPayload{
|
|
Stage: "session_save",
|
|
Message: err.Error(),
|
|
},
|
|
)
|
|
return turnResult{}, err
|
|
}
|
|
}
|
|
|
|
if ts.opts.EnableSummary {
|
|
al.maybeSummarize(ts.agent, ts.sessionKey, ts.scope)
|
|
}
|
|
|
|
ts.setPhase(TurnPhaseCompleted)
|
|
return turnResult{
|
|
finalContent: finalContent,
|
|
status: turnStatus,
|
|
followUps: append([]bus.InboundMessage(nil), ts.followUps...),
|
|
}, nil
|
|
}
|
|
|
|
func (al *AgentLoop) abortTurn(ts *turnState) (turnResult, error) {
|
|
ts.setPhase(TurnPhaseAborted)
|
|
if !ts.opts.NoHistory {
|
|
if err := ts.restoreSession(ts.agent); err != nil {
|
|
al.emitEvent(
|
|
EventKindError,
|
|
ts.eventMeta("abortTurn", "turn.error"),
|
|
ErrorPayload{
|
|
Stage: "session_restore",
|
|
Message: err.Error(),
|
|
},
|
|
)
|
|
return turnResult{}, err
|
|
}
|
|
}
|
|
return turnResult{status: TurnEndStatusAborted}, nil
|
|
}
|
|
|
|
func sleepWithContext(ctx context.Context, d time.Duration) error {
|
|
timer := time.NewTimer(d)
|
|
defer timer.Stop()
|
|
|
|
select {
|
|
case <-ctx.Done():
|
|
return ctx.Err()
|
|
case <-timer.C:
|
|
return nil
|
|
}
|
|
}
|
|
|
|
// selectCandidates returns the model candidates and resolved model name to use
|
|
// for a conversation turn. When model routing is configured and the incoming
|
|
// message scores below the complexity threshold, it returns the light model
|
|
// candidates instead of the primary ones.
|
|
//
|
|
// The returned (candidates, model) pair is used for all LLM calls within one
|
|
// turn — tool follow-up iterations use the same tier as the initial call so
|
|
// that a multi-step tool chain doesn't switch models mid-way.
|
|
func (al *AgentLoop) selectCandidates(
|
|
agent *AgentInstance,
|
|
userMsg string,
|
|
history []providers.Message,
|
|
) (candidates []providers.FallbackCandidate, model string, usedLight bool) {
|
|
if agent.Router == nil || len(agent.LightCandidates) == 0 {
|
|
return agent.Candidates, resolvedCandidateModel(agent.Candidates, agent.Model), false
|
|
}
|
|
|
|
_, usedLight, score := agent.Router.SelectModel(userMsg, history, agent.Model)
|
|
if !usedLight {
|
|
logger.DebugCF("agent", "Model routing: primary model selected",
|
|
map[string]any{
|
|
"agent_id": agent.ID,
|
|
"score": score,
|
|
"threshold": agent.Router.Threshold(),
|
|
})
|
|
return agent.Candidates, resolvedCandidateModel(agent.Candidates, agent.Model), false
|
|
}
|
|
|
|
logger.InfoCF("agent", "Model routing: light model selected",
|
|
map[string]any{
|
|
"agent_id": agent.ID,
|
|
"light_model": agent.Router.LightModel(),
|
|
"score": score,
|
|
"threshold": agent.Router.Threshold(),
|
|
})
|
|
return agent.LightCandidates, resolvedCandidateModel(agent.LightCandidates, agent.Router.LightModel()), true
|
|
}
|
|
|
|
// maybeSummarize triggers summarization if the session history exceeds thresholds.
|
|
func (al *AgentLoop) maybeSummarize(agent *AgentInstance, sessionKey string, turnScope turnEventScope) {
|
|
newHistory := agent.Sessions.GetHistory(sessionKey)
|
|
tokenEstimate := al.estimateTokens(newHistory)
|
|
threshold := agent.ContextWindow * agent.SummarizeTokenPercent / 100
|
|
|
|
if len(newHistory) > agent.SummarizeMessageThreshold || tokenEstimate > threshold {
|
|
summarizeKey := agent.ID + ":" + sessionKey
|
|
if _, loading := al.summarizing.LoadOrStore(summarizeKey, true); !loading {
|
|
go func() {
|
|
defer al.summarizing.Delete(summarizeKey)
|
|
logger.Debug("Memory threshold reached. Optimizing conversation history...")
|
|
al.summarizeSession(agent, sessionKey, turnScope)
|
|
}()
|
|
}
|
|
}
|
|
}
|
|
|
|
type compressionResult struct {
|
|
DroppedMessages int
|
|
RemainingMessages int
|
|
}
|
|
|
|
// forceCompression aggressively reduces context when the limit is hit.
|
|
// It drops the oldest ~50% of Turns (a Turn is a complete user→LLM→response
|
|
// cycle, as defined in #1316), so tool-call sequences are never split.
|
|
//
|
|
// If the history is a single Turn with no safe split point, the function
|
|
// falls back to keeping only the most recent user message. This breaks
|
|
// Turn atomicity as a last resort to avoid a context-exceeded loop.
|
|
//
|
|
// Session history contains only user/assistant/tool messages — the system
|
|
// prompt is built dynamically by BuildMessages and is NOT stored here.
|
|
// The compression note is recorded in the session summary so that
|
|
// BuildMessages can include it in the next system prompt.
|
|
func (al *AgentLoop) forceCompression(agent *AgentInstance, sessionKey string) (compressionResult, bool) {
|
|
history := agent.Sessions.GetHistory(sessionKey)
|
|
if len(history) <= 2 {
|
|
return compressionResult{}, false
|
|
}
|
|
|
|
// Split at a Turn boundary so no tool-call sequence is torn apart.
|
|
// parseTurnBoundaries gives us the start of each Turn; we drop the
|
|
// oldest half of Turns and keep the most recent ones.
|
|
turns := parseTurnBoundaries(history)
|
|
var mid int
|
|
if len(turns) >= 2 {
|
|
mid = turns[len(turns)/2]
|
|
} else {
|
|
// Fewer than 2 Turns — fall back to message-level midpoint
|
|
// aligned to the nearest Turn boundary.
|
|
mid = findSafeBoundary(history, len(history)/2)
|
|
}
|
|
var keptHistory []providers.Message
|
|
if mid <= 0 {
|
|
// No safe Turn boundary — the entire history is a single Turn
|
|
// (e.g. one user message followed by a massive tool response).
|
|
// Keeping everything would leave the agent stuck in a context-
|
|
// exceeded loop, so fall back to keeping only the most recent
|
|
// user message. This breaks Turn atomicity as a last resort.
|
|
for i := len(history) - 1; i >= 0; i-- {
|
|
if history[i].Role == "user" {
|
|
keptHistory = []providers.Message{history[i]}
|
|
break
|
|
}
|
|
}
|
|
} else {
|
|
keptHistory = history[mid:]
|
|
}
|
|
|
|
droppedCount := len(history) - len(keptHistory)
|
|
|
|
// Record compression in the session summary so BuildMessages includes it
|
|
// in the system prompt. We do not modify history messages themselves.
|
|
existingSummary := agent.Sessions.GetSummary(sessionKey)
|
|
compressionNote := fmt.Sprintf(
|
|
"[Emergency compression dropped %d oldest messages due to context limit]",
|
|
droppedCount,
|
|
)
|
|
if existingSummary != "" {
|
|
compressionNote = existingSummary + "\n\n" + compressionNote
|
|
}
|
|
agent.Sessions.SetSummary(sessionKey, compressionNote)
|
|
|
|
agent.Sessions.SetHistory(sessionKey, keptHistory)
|
|
agent.Sessions.Save(sessionKey)
|
|
|
|
logger.WarnCF("agent", "Forced compression executed", map[string]any{
|
|
"session_key": sessionKey,
|
|
"dropped_msgs": droppedCount,
|
|
"new_count": len(keptHistory),
|
|
})
|
|
|
|
return compressionResult{
|
|
DroppedMessages: droppedCount,
|
|
RemainingMessages: len(keptHistory),
|
|
}, true
|
|
}
|
|
|
|
// GetStartupInfo returns information about loaded tools and skills for logging.
|
|
func (al *AgentLoop) GetStartupInfo() map[string]any {
|
|
info := make(map[string]any)
|
|
|
|
registry := al.GetRegistry()
|
|
agent := registry.GetDefaultAgent()
|
|
if agent == nil {
|
|
return info
|
|
}
|
|
|
|
// Tools info
|
|
toolsList := agent.Tools.List()
|
|
info["tools"] = map[string]any{
|
|
"count": len(toolsList),
|
|
"names": toolsList,
|
|
}
|
|
|
|
// Skills info
|
|
info["skills"] = agent.ContextBuilder.GetSkillsInfo()
|
|
|
|
// Agents info
|
|
info["agents"] = map[string]any{
|
|
"count": len(registry.ListAgentIDs()),
|
|
"ids": registry.ListAgentIDs(),
|
|
}
|
|
|
|
return info
|
|
}
|
|
|
|
// formatMessagesForLog formats messages for logging
|
|
func formatMessagesForLog(messages []providers.Message) string {
|
|
if len(messages) == 0 {
|
|
return "[]"
|
|
}
|
|
|
|
var sb strings.Builder
|
|
sb.WriteString("[\n")
|
|
for i, msg := range messages {
|
|
fmt.Fprintf(&sb, " [%d] Role: %s\n", i, msg.Role)
|
|
if len(msg.ToolCalls) > 0 {
|
|
sb.WriteString(" ToolCalls:\n")
|
|
for _, tc := range msg.ToolCalls {
|
|
fmt.Fprintf(&sb, " - ID: %s, Type: %s, Name: %s\n", tc.ID, tc.Type, tc.Name)
|
|
if tc.Function != nil {
|
|
fmt.Fprintf(
|
|
&sb,
|
|
" Arguments: %s\n",
|
|
utils.Truncate(tc.Function.Arguments, 200),
|
|
)
|
|
}
|
|
}
|
|
}
|
|
if msg.Content != "" {
|
|
content := utils.Truncate(msg.Content, 200)
|
|
fmt.Fprintf(&sb, " Content: %s\n", content)
|
|
}
|
|
if msg.ToolCallID != "" {
|
|
fmt.Fprintf(&sb, " ToolCallID: %s\n", msg.ToolCallID)
|
|
}
|
|
sb.WriteString("\n")
|
|
}
|
|
sb.WriteString("]")
|
|
return sb.String()
|
|
}
|
|
|
|
// formatToolsForLog formats tool definitions for logging
|
|
func formatToolsForLog(toolDefs []providers.ToolDefinition) string {
|
|
if len(toolDefs) == 0 {
|
|
return "[]"
|
|
}
|
|
|
|
var sb strings.Builder
|
|
sb.WriteString("[\n")
|
|
for i, tool := range toolDefs {
|
|
fmt.Fprintf(&sb, " [%d] Type: %s, Name: %s\n", i, tool.Type, tool.Function.Name)
|
|
fmt.Fprintf(&sb, " Description: %s\n", tool.Function.Description)
|
|
if len(tool.Function.Parameters) > 0 {
|
|
fmt.Fprintf(
|
|
&sb,
|
|
" Parameters: %s\n",
|
|
utils.Truncate(fmt.Sprintf("%v", tool.Function.Parameters), 200),
|
|
)
|
|
}
|
|
}
|
|
sb.WriteString("]")
|
|
return sb.String()
|
|
}
|
|
|
|
// summarizeSession summarizes the conversation history for a session.
|
|
func (al *AgentLoop) summarizeSession(agent *AgentInstance, sessionKey string, turnScope turnEventScope) {
|
|
ctx, cancel := context.WithTimeout(context.Background(), 120*time.Second)
|
|
defer cancel()
|
|
|
|
history := agent.Sessions.GetHistory(sessionKey)
|
|
summary := agent.Sessions.GetSummary(sessionKey)
|
|
|
|
// Keep the most recent Turns for continuity, aligned to a Turn boundary
|
|
// so that no tool-call sequence is split.
|
|
if len(history) <= 4 {
|
|
return
|
|
}
|
|
|
|
safeCut := findSafeBoundary(history, len(history)-4)
|
|
if safeCut <= 0 {
|
|
return
|
|
}
|
|
keepCount := len(history) - safeCut
|
|
toSummarize := history[:safeCut]
|
|
|
|
// Oversized Message Guard
|
|
maxMessageTokens := agent.ContextWindow / 2
|
|
validMessages := make([]providers.Message, 0)
|
|
omitted := false
|
|
|
|
for _, m := range toSummarize {
|
|
if m.Role != "user" && m.Role != "assistant" {
|
|
continue
|
|
}
|
|
msgTokens := len(m.Content) / 2
|
|
if msgTokens > maxMessageTokens {
|
|
omitted = true
|
|
continue
|
|
}
|
|
validMessages = append(validMessages, m)
|
|
}
|
|
|
|
if len(validMessages) == 0 {
|
|
return
|
|
}
|
|
|
|
const (
|
|
maxSummarizationMessages = 10
|
|
llmMaxRetries = 3
|
|
llmTemperature = 0.3
|
|
fallbackMaxContentLength = 200
|
|
)
|
|
|
|
// Multi-Part Summarization
|
|
var finalSummary string
|
|
if len(validMessages) > maxSummarizationMessages {
|
|
mid := len(validMessages) / 2
|
|
|
|
mid = al.findNearestUserMessage(validMessages, mid)
|
|
|
|
part1 := validMessages[:mid]
|
|
part2 := validMessages[mid:]
|
|
|
|
s1, _ := al.summarizeBatch(ctx, agent, part1, "")
|
|
s2, _ := al.summarizeBatch(ctx, agent, part2, "")
|
|
|
|
mergePrompt := fmt.Sprintf(
|
|
"Merge these two conversation summaries into one cohesive summary:\n\n1: %s\n\n2: %s",
|
|
s1,
|
|
s2,
|
|
)
|
|
|
|
resp, err := al.retryLLMCall(ctx, agent, mergePrompt, llmMaxRetries)
|
|
if err == nil && resp.Content != "" {
|
|
finalSummary = resp.Content
|
|
} else {
|
|
finalSummary = s1 + " " + s2
|
|
}
|
|
} else {
|
|
finalSummary, _ = al.summarizeBatch(ctx, agent, validMessages, summary)
|
|
}
|
|
|
|
if omitted && finalSummary != "" {
|
|
finalSummary += "\n[Note: Some oversized messages were omitted from this summary for efficiency.]"
|
|
}
|
|
|
|
if finalSummary != "" {
|
|
agent.Sessions.SetSummary(sessionKey, finalSummary)
|
|
agent.Sessions.TruncateHistory(sessionKey, keepCount)
|
|
agent.Sessions.Save(sessionKey)
|
|
al.emitEvent(
|
|
EventKindSessionSummarize,
|
|
turnScope.meta(0, "summarizeSession", "turn.session.summarize"),
|
|
SessionSummarizePayload{
|
|
SummarizedMessages: len(validMessages),
|
|
KeptMessages: keepCount,
|
|
SummaryLen: len(finalSummary),
|
|
OmittedOversized: omitted,
|
|
},
|
|
)
|
|
}
|
|
}
|
|
|
|
// findNearestUserMessage finds the nearest user message to the given index.
|
|
// It searches backward first, then forward if no user message is found.
|
|
func (al *AgentLoop) findNearestUserMessage(messages []providers.Message, mid int) int {
|
|
originalMid := mid
|
|
|
|
for mid > 0 && messages[mid].Role != "user" {
|
|
mid--
|
|
}
|
|
|
|
if messages[mid].Role == "user" {
|
|
return mid
|
|
}
|
|
|
|
mid = originalMid
|
|
for mid < len(messages) && messages[mid].Role != "user" {
|
|
mid++
|
|
}
|
|
|
|
if mid < len(messages) {
|
|
return mid
|
|
}
|
|
|
|
return originalMid
|
|
}
|
|
|
|
// retryLLMCall calls the LLM with retry logic.
|
|
func (al *AgentLoop) retryLLMCall(
|
|
ctx context.Context,
|
|
agent *AgentInstance,
|
|
prompt string,
|
|
maxRetries int,
|
|
) (*providers.LLMResponse, error) {
|
|
const (
|
|
llmTemperature = 0.3
|
|
)
|
|
|
|
var resp *providers.LLMResponse
|
|
var err error
|
|
|
|
for attempt := 0; attempt < maxRetries; attempt++ {
|
|
al.activeRequests.Add(1)
|
|
resp, err = func() (*providers.LLMResponse, error) {
|
|
defer al.activeRequests.Done()
|
|
return agent.Provider.Chat(
|
|
ctx,
|
|
[]providers.Message{{Role: "user", Content: prompt}},
|
|
nil,
|
|
agent.Model,
|
|
map[string]any{
|
|
"max_tokens": agent.MaxTokens,
|
|
"temperature": llmTemperature,
|
|
"prompt_cache_key": agent.ID,
|
|
},
|
|
)
|
|
}()
|
|
|
|
if err == nil && resp != nil && resp.Content != "" {
|
|
return resp, nil
|
|
}
|
|
if attempt < maxRetries-1 {
|
|
time.Sleep(time.Duration(attempt+1) * 100 * time.Millisecond)
|
|
}
|
|
}
|
|
|
|
return resp, err
|
|
}
|
|
|
|
// summarizeBatch summarizes a batch of messages.
|
|
func (al *AgentLoop) summarizeBatch(
|
|
ctx context.Context,
|
|
agent *AgentInstance,
|
|
batch []providers.Message,
|
|
existingSummary string,
|
|
) (string, error) {
|
|
const (
|
|
llmMaxRetries = 3
|
|
llmTemperature = 0.3
|
|
fallbackMinContentLength = 200
|
|
fallbackMaxContentPercent = 10
|
|
)
|
|
|
|
var sb strings.Builder
|
|
sb.WriteString(
|
|
"Provide a concise summary of this conversation segment, preserving core context and key points.\n",
|
|
)
|
|
if existingSummary != "" {
|
|
sb.WriteString("Existing context: ")
|
|
sb.WriteString(existingSummary)
|
|
sb.WriteString("\n")
|
|
}
|
|
sb.WriteString("\nCONVERSATION:\n")
|
|
for _, m := range batch {
|
|
fmt.Fprintf(&sb, "%s: %s\n", m.Role, m.Content)
|
|
}
|
|
prompt := sb.String()
|
|
|
|
response, err := al.retryLLMCall(ctx, agent, prompt, llmMaxRetries)
|
|
if err == nil && response.Content != "" {
|
|
return strings.TrimSpace(response.Content), nil
|
|
}
|
|
|
|
var fallback strings.Builder
|
|
fallback.WriteString("Conversation summary: ")
|
|
for i, m := range batch {
|
|
if i > 0 {
|
|
fallback.WriteString(" | ")
|
|
}
|
|
content := strings.TrimSpace(m.Content)
|
|
runes := []rune(content)
|
|
if len(runes) == 0 {
|
|
fallback.WriteString(fmt.Sprintf("%s: ", m.Role))
|
|
continue
|
|
}
|
|
|
|
keepLength := len(runes) * fallbackMaxContentPercent / 100
|
|
if keepLength < fallbackMinContentLength {
|
|
keepLength = fallbackMinContentLength
|
|
}
|
|
|
|
if keepLength > len(runes) {
|
|
keepLength = len(runes)
|
|
}
|
|
|
|
content = string(runes[:keepLength])
|
|
if keepLength < len(runes) {
|
|
content += "..."
|
|
}
|
|
fallback.WriteString(fmt.Sprintf("%s: %s", m.Role, content))
|
|
}
|
|
return fallback.String(), nil
|
|
}
|
|
|
|
// estimateTokens estimates the number of tokens in a message list.
|
|
// Counts Content, ToolCalls arguments, and ToolCallID metadata so that
|
|
// tool-heavy conversations are not systematically undercounted.
|
|
func (al *AgentLoop) estimateTokens(messages []providers.Message) int {
|
|
total := 0
|
|
for _, m := range messages {
|
|
total += estimateMessageTokens(m)
|
|
}
|
|
return total
|
|
}
|
|
|
|
func (al *AgentLoop) handleCommand(
|
|
ctx context.Context,
|
|
msg bus.InboundMessage,
|
|
agent *AgentInstance,
|
|
opts *processOptions,
|
|
) (string, bool) {
|
|
if !commands.HasCommandPrefix(msg.Content) {
|
|
return "", false
|
|
}
|
|
|
|
if matched, handled, reply := al.applyExplicitSkillCommand(msg.Content, agent, opts); matched {
|
|
return reply, handled
|
|
}
|
|
|
|
if al.cmdRegistry == nil {
|
|
return "", false
|
|
}
|
|
|
|
rt := al.buildCommandsRuntime(agent, opts)
|
|
executor := commands.NewExecutor(al.cmdRegistry, rt)
|
|
|
|
var commandReply string
|
|
result := executor.Execute(ctx, commands.Request{
|
|
Channel: msg.Channel,
|
|
ChatID: msg.ChatID,
|
|
SenderID: msg.SenderID,
|
|
Text: msg.Content,
|
|
Reply: func(text string) error {
|
|
commandReply = text
|
|
return nil
|
|
},
|
|
})
|
|
|
|
switch result.Outcome {
|
|
case commands.OutcomeHandled:
|
|
if result.Err != nil {
|
|
return mapCommandError(result), true
|
|
}
|
|
if commandReply != "" {
|
|
return commandReply, true
|
|
}
|
|
return "", true
|
|
default: // OutcomePassthrough — let the message fall through to LLM
|
|
return "", false
|
|
}
|
|
}
|
|
|
|
func activeSkillNames(agent *AgentInstance, opts processOptions) []string {
|
|
if agent == nil {
|
|
return nil
|
|
}
|
|
|
|
combined := make([]string, 0, len(agent.SkillsFilter)+len(opts.ForcedSkills))
|
|
combined = append(combined, agent.SkillsFilter...)
|
|
combined = append(combined, opts.ForcedSkills...)
|
|
if len(combined) == 0 {
|
|
return nil
|
|
}
|
|
|
|
var resolved []string
|
|
seen := make(map[string]struct{}, len(combined))
|
|
for _, name := range combined {
|
|
name = strings.TrimSpace(name)
|
|
if name == "" {
|
|
continue
|
|
}
|
|
if agent.ContextBuilder != nil {
|
|
if canonical, ok := agent.ContextBuilder.ResolveSkillName(name); ok {
|
|
name = canonical
|
|
}
|
|
}
|
|
key := strings.ToLower(name)
|
|
if _, ok := seen[key]; ok {
|
|
continue
|
|
}
|
|
seen[key] = struct{}{}
|
|
resolved = append(resolved, name)
|
|
}
|
|
|
|
return resolved
|
|
}
|
|
|
|
func (al *AgentLoop) applyExplicitSkillCommand(
|
|
raw string,
|
|
agent *AgentInstance,
|
|
opts *processOptions,
|
|
) (matched bool, handled bool, reply string) {
|
|
cmdName, ok := commands.CommandName(raw)
|
|
if !ok || cmdName != "use" {
|
|
return false, false, ""
|
|
}
|
|
|
|
if agent == nil || agent.ContextBuilder == nil {
|
|
return true, true, commandsUnavailableSkillMessage()
|
|
}
|
|
|
|
parts := strings.Fields(strings.TrimSpace(raw))
|
|
if len(parts) < 2 {
|
|
return true, true, buildUseCommandHelp(agent)
|
|
}
|
|
|
|
arg := strings.TrimSpace(parts[1])
|
|
if strings.EqualFold(arg, "clear") || strings.EqualFold(arg, "off") {
|
|
if opts != nil {
|
|
al.clearPendingSkills(opts.SessionKey)
|
|
}
|
|
return true, true, "Cleared pending skill override."
|
|
}
|
|
|
|
skillName, ok := agent.ContextBuilder.ResolveSkillName(arg)
|
|
if !ok {
|
|
return true, true, fmt.Sprintf("Unknown skill: %s\nUse /list skills to see installed skills.", arg)
|
|
}
|
|
|
|
if len(parts) < 3 {
|
|
if opts == nil || strings.TrimSpace(opts.SessionKey) == "" {
|
|
return true, true, commandsUnavailableSkillMessage()
|
|
}
|
|
al.setPendingSkills(opts.SessionKey, []string{skillName})
|
|
return true, true, fmt.Sprintf(
|
|
"Skill %q is armed for your next message. Send your next prompt normally, or use /use clear to cancel.",
|
|
skillName,
|
|
)
|
|
}
|
|
|
|
message := strings.TrimSpace(strings.Join(parts[2:], " "))
|
|
if message == "" {
|
|
return true, true, buildUseCommandHelp(agent)
|
|
}
|
|
|
|
if opts != nil {
|
|
opts.ForcedSkills = append(opts.ForcedSkills, skillName)
|
|
opts.UserMessage = message
|
|
}
|
|
|
|
return true, false, ""
|
|
}
|
|
|
|
func (al *AgentLoop) buildCommandsRuntime(agent *AgentInstance, opts *processOptions) *commands.Runtime {
|
|
registry := al.GetRegistry()
|
|
cfg := al.GetConfig()
|
|
rt := &commands.Runtime{
|
|
Config: cfg,
|
|
ListAgentIDs: registry.ListAgentIDs,
|
|
ListDefinitions: al.cmdRegistry.Definitions,
|
|
GetEnabledChannels: func() []string {
|
|
if al.channelManager == nil {
|
|
return nil
|
|
}
|
|
return al.channelManager.GetEnabledChannels()
|
|
},
|
|
GetActiveTurn: func() any {
|
|
info := al.GetActiveTurn()
|
|
if info == nil {
|
|
return nil
|
|
}
|
|
return info
|
|
},
|
|
SwitchChannel: func(value string) error {
|
|
if al.channelManager == nil {
|
|
return fmt.Errorf("channel manager not initialized")
|
|
}
|
|
if _, exists := al.channelManager.GetChannel(value); !exists && value != "cli" {
|
|
return fmt.Errorf("channel '%s' not found or not enabled", value)
|
|
}
|
|
return nil
|
|
},
|
|
}
|
|
if agent != nil && agent.ContextBuilder != nil {
|
|
rt.ListSkillNames = agent.ContextBuilder.ListSkillNames
|
|
}
|
|
rt.ReloadConfig = func() error {
|
|
if al.reloadFunc == nil {
|
|
return fmt.Errorf("reload not configured")
|
|
}
|
|
return al.reloadFunc()
|
|
}
|
|
if agent != nil {
|
|
if agent.ContextBuilder != nil {
|
|
rt.ListSkillNames = agent.ContextBuilder.ListSkillNames
|
|
}
|
|
rt.GetModelInfo = func() (string, string) {
|
|
return agent.Model, resolvedCandidateProvider(agent.Candidates, cfg.Agents.Defaults.Provider)
|
|
}
|
|
rt.SwitchModel = func(value string) (string, error) {
|
|
value = strings.TrimSpace(value)
|
|
modelCfg, err := resolvedModelConfig(cfg, value, agent.Workspace)
|
|
if err != nil {
|
|
return "", err
|
|
}
|
|
|
|
nextProvider, _, err := providers.CreateProviderFromConfig(modelCfg)
|
|
if err != nil {
|
|
return "", fmt.Errorf("failed to initialize model %q: %w", value, err)
|
|
}
|
|
|
|
nextCandidates := resolveModelCandidates(cfg, cfg.Agents.Defaults.Provider, modelCfg.Model, agent.Fallbacks)
|
|
if len(nextCandidates) == 0 {
|
|
return "", fmt.Errorf("model %q did not resolve to any provider candidates", value)
|
|
}
|
|
|
|
oldModel := agent.Model
|
|
oldProvider := agent.Provider
|
|
agent.Model = value
|
|
agent.Provider = nextProvider
|
|
agent.Candidates = nextCandidates
|
|
agent.ThinkingLevel = parseThinkingLevel(modelCfg.ThinkingLevel)
|
|
|
|
if oldProvider != nil && oldProvider != nextProvider {
|
|
if stateful, ok := oldProvider.(providers.StatefulProvider); ok {
|
|
stateful.Close()
|
|
}
|
|
}
|
|
return oldModel, nil
|
|
}
|
|
|
|
rt.ClearHistory = func() error {
|
|
if opts == nil {
|
|
return fmt.Errorf("process options not available")
|
|
}
|
|
if agent.Sessions == nil {
|
|
return fmt.Errorf("sessions not initialized for agent")
|
|
}
|
|
|
|
agent.Sessions.SetHistory(opts.SessionKey, make([]providers.Message, 0))
|
|
agent.Sessions.SetSummary(opts.SessionKey, "")
|
|
agent.Sessions.Save(opts.SessionKey)
|
|
return nil
|
|
}
|
|
}
|
|
return rt
|
|
}
|
|
|
|
func commandsUnavailableSkillMessage() string {
|
|
return "Skill selection is unavailable in the current context."
|
|
}
|
|
|
|
func buildUseCommandHelp(agent *AgentInstance) string {
|
|
if agent == nil || agent.ContextBuilder == nil {
|
|
return "Usage: /use <skill> [message]"
|
|
}
|
|
|
|
names := agent.ContextBuilder.ListSkillNames()
|
|
if len(names) == 0 {
|
|
return "Usage: /use <skill> [message]\nNo installed skills found."
|
|
}
|
|
|
|
return fmt.Sprintf(
|
|
"Usage: /use <skill> [message]\n\nInstalled Skills:\n- %s\n\nUse /use <skill> to apply a skill to your next message, or /use <skill> <message> to force it immediately.",
|
|
strings.Join(names, "\n- "),
|
|
)
|
|
}
|
|
|
|
func (al *AgentLoop) setPendingSkills(sessionKey string, skillNames []string) {
|
|
sessionKey = strings.TrimSpace(sessionKey)
|
|
if sessionKey == "" || len(skillNames) == 0 {
|
|
return
|
|
}
|
|
|
|
filtered := make([]string, 0, len(skillNames))
|
|
for _, name := range skillNames {
|
|
name = strings.TrimSpace(name)
|
|
if name != "" {
|
|
filtered = append(filtered, name)
|
|
}
|
|
}
|
|
if len(filtered) == 0 {
|
|
return
|
|
}
|
|
|
|
al.pendingSkills.Store(sessionKey, filtered)
|
|
}
|
|
|
|
func (al *AgentLoop) takePendingSkills(sessionKey string) []string {
|
|
sessionKey = strings.TrimSpace(sessionKey)
|
|
if sessionKey == "" {
|
|
return nil
|
|
}
|
|
|
|
value, ok := al.pendingSkills.LoadAndDelete(sessionKey)
|
|
if !ok {
|
|
return nil
|
|
}
|
|
|
|
skills, ok := value.([]string)
|
|
if !ok {
|
|
return nil
|
|
}
|
|
|
|
return append([]string(nil), skills...)
|
|
}
|
|
|
|
func (al *AgentLoop) clearPendingSkills(sessionKey string) {
|
|
sessionKey = strings.TrimSpace(sessionKey)
|
|
if sessionKey == "" {
|
|
return
|
|
}
|
|
al.pendingSkills.Delete(sessionKey)
|
|
}
|
|
|
|
func mapCommandError(result commands.ExecuteResult) string {
|
|
if result.Command == "" {
|
|
return fmt.Sprintf("Failed to execute command: %v", result.Err)
|
|
}
|
|
return fmt.Sprintf("Failed to execute /%s: %v", result.Command, result.Err)
|
|
}
|
|
|
|
// extractPeer extracts the routing peer from the inbound message's structured Peer field.
|
|
func extractPeer(msg bus.InboundMessage) *routing.RoutePeer {
|
|
if msg.Peer.Kind == "" {
|
|
return nil
|
|
}
|
|
peerID := msg.Peer.ID
|
|
if peerID == "" {
|
|
if msg.Peer.Kind == "direct" {
|
|
peerID = msg.SenderID
|
|
} else {
|
|
peerID = msg.ChatID
|
|
}
|
|
}
|
|
return &routing.RoutePeer{Kind: msg.Peer.Kind, ID: peerID}
|
|
}
|
|
|
|
func inboundMetadata(msg bus.InboundMessage, key string) string {
|
|
if msg.Metadata == nil {
|
|
return ""
|
|
}
|
|
return msg.Metadata[key]
|
|
}
|
|
|
|
// extractParentPeer extracts the parent peer (reply-to) from inbound message metadata.
|
|
func extractParentPeer(msg bus.InboundMessage) *routing.RoutePeer {
|
|
parentKind := inboundMetadata(msg, metadataKeyParentPeerKind)
|
|
parentID := inboundMetadata(msg, metadataKeyParentPeerID)
|
|
if parentKind == "" || parentID == "" {
|
|
return nil
|
|
}
|
|
return &routing.RoutePeer{Kind: parentKind, ID: parentID}
|
|
}
|
|
|
|
// isNativeSearchProvider reports whether the given LLM provider implements
|
|
// NativeSearchCapable and returns true for SupportsNativeSearch.
|
|
func isNativeSearchProvider(p providers.LLMProvider) bool {
|
|
if ns, ok := p.(providers.NativeSearchCapable); ok {
|
|
return ns.SupportsNativeSearch()
|
|
}
|
|
return false
|
|
}
|
|
|
|
// filterClientWebSearch returns a copy of tools with the client-side
|
|
// web_search tool removed. Used when native provider search is preferred.
|
|
func filterClientWebSearch(tools []providers.ToolDefinition) []providers.ToolDefinition {
|
|
result := make([]providers.ToolDefinition, 0, len(tools))
|
|
for _, t := range tools {
|
|
if strings.EqualFold(t.Function.Name, "web_search") {
|
|
continue
|
|
}
|
|
result = append(result, t)
|
|
}
|
|
return result
|
|
}
|
|
|
|
// Helper to extract provider from registry for cleanup
|
|
func extractProvider(registry *AgentRegistry) (providers.LLMProvider, bool) {
|
|
if registry == nil {
|
|
return nil, false
|
|
}
|
|
// Get any agent to access the provider
|
|
defaultAgent := registry.GetDefaultAgent()
|
|
if defaultAgent == nil {
|
|
return nil, false
|
|
}
|
|
return defaultAgent.Provider, true
|
|
}
|