// Source: pkg/agent/loop.go (picoclaw; commit c1dcaaa,
// "Move picoclaw_space to root for Hugging Face Spaces deployment")
// PicoClaw - Ultra-lightweight personal AI agent
// Inspired by and based on nanobot: https://github.com/HKUDS/nanobot
// License: MIT
//
// Copyright (c) 2026 PicoClaw contributors
package agent
import (
"context"
"encoding/json"
"fmt"
"os"
"os/exec"
"path/filepath"
"regexp"
"strings"
"sync"
"sync/atomic"
"time"
"unicode/utf8"
"github.com/sipeed/picoclaw/pkg/bus"
"github.com/sipeed/picoclaw/pkg/channels"
"github.com/sipeed/picoclaw/pkg/config"
"github.com/sipeed/picoclaw/pkg/constants"
"github.com/sipeed/picoclaw/pkg/logger"
"github.com/sipeed/picoclaw/pkg/metrics"
"github.com/sipeed/picoclaw/pkg/providers"
"github.com/sipeed/picoclaw/pkg/session"
"github.com/sipeed/picoclaw/pkg/state"
"github.com/sipeed/picoclaw/pkg/tools"
"github.com/sipeed/picoclaw/pkg/utils"
)
// ToolCacheEntry holds a cached tool result together with its expiry time.
// Entries are stored in AgentLoop.cache and are considered stale once
// ExpiresAt has passed.
type ToolCacheEntry struct {
	Result    *tools.ToolResult // cached result returned to the LLM on a hit
	ExpiresAt time.Time         // absolute expiry; checked with time.Now().Before
}
// AgentLoop is the core message-processing engine: it consumes inbound
// messages from the bus, drives the LLM/tool iteration loop, persists
// session history, and publishes responses back to the originating channel.
type AgentLoop struct {
	bus            *bus.MessageBus       // inbound/outbound message transport
	provider       providers.LLMProvider // LLM backend used for chat completions
	workspace      string                // root directory for files, sessions, skills
	model          string                // primary model identifier
	fallbackModels []string              // models tried in order when the primary fails
	contextWindow  int                   // Maximum context window size in tokens
	maxIterations  int                   // default cap on tool iterations per request
	sessions       *session.SessionManager
	state          *state.Manager // atomic persistence for last channel/chat ID
	contextBuilder *ContextBuilder
	tools          *tools.ToolRegistry
	running        atomic.Bool // set by Run, cleared by Stop
	summarizing    sync.Map    // Tracks which sessions are currently being summarized
	channelManager *channels.Manager
	config         *config.Config
	cache          map[string]ToolCacheEntry // tool-result cache keyed by name+args JSON
	cacheMutex     sync.RWMutex              // guards cache
}
// processOptions configures how a message is processed by runAgentLoop.
// The zero value of each optional field selects the default behavior.
type processOptions struct {
	SessionKey      string   // Session identifier for history/context
	Channel         string   // Target channel for tool execution
	ChatID          string   // Target chat ID for tool execution
	UserMessage     string   // User message content (may include prefix)
	DefaultResponse string   // Response when LLM returns empty
	EnableSummary   bool     // Whether to trigger summarization
	SendResponse    bool     // Whether to send response via bus
	NoHistory       bool     // If true, don't load session history (for heartbeat)
	Media           []string // Attached media file paths
	MaxIterations   int      // Maximum iterations for this specific request (0 = adaptive)
}
// createToolRegistry builds a registry pre-populated with the tool set that
// both the main agent and its subagents share: file-system access, shell
// execution, web search/fetch, hardware buses, and direct user messaging.
func createToolRegistry(workspace string, restrict bool, cfg *config.Config, msgBus *bus.MessageBus) *tools.ToolRegistry {
	reg := tools.NewToolRegistry()

	// File-system access, optionally confined to the workspace directory.
	reg.Register(tools.NewReadFileTool(workspace, restrict))
	reg.Register(tools.NewWriteFileTool(workspace, restrict))
	reg.Register(tools.NewListDirTool(workspace, restrict))
	reg.Register(tools.NewEditFileTool(workspace, restrict))
	reg.Register(tools.NewAppendFileTool(workspace, restrict))

	// Shell execution with the configured resource limits.
	reg.Register(tools.NewExecTool(workspace, restrict, cfg.Tools.ResourceLimits))

	// Web search is optional: the constructor yields nil when no backend is enabled.
	searchOpts := tools.WebSearchToolOptions{
		BraveAPIKey:          cfg.Tools.Web.Brave.APIKey,
		BraveMaxResults:      cfg.Tools.Web.Brave.MaxResults,
		BraveEnabled:         cfg.Tools.Web.Brave.Enabled,
		DuckDuckGoMaxResults: cfg.Tools.Web.DuckDuckGo.MaxResults,
		DuckDuckGoEnabled:    cfg.Tools.Web.DuckDuckGo.Enabled,
	}
	if search := tools.NewWebSearchTool(searchOpts); search != nil {
		reg.Register(search)
	}
	reg.Register(tools.NewWebFetchTool(50000))

	// Hardware buses (I2C, SPI) — Linux only, error on other platforms.
	reg.Register(tools.NewI2CTool())
	reg.Register(tools.NewSPITool())

	// Message tool: lets the agent (and subagents) talk to the user directly.
	// Outgoing text gets TTS audio attached unless prefixed with [NO_VOICE].
	msgTool := tools.NewMessageTool()
	msgTool.SetSendCallback(func(channel, chatID, content string) error {
		var audioPath string
		trimmed := strings.TrimSpace(content)
		if strings.HasPrefix(trimmed, "[NO_VOICE]") {
			// Explicit opt-out: strip the marker and skip audio generation.
			content = strings.TrimSpace(strings.TrimPrefix(trimmed, "[NO_VOICE]"))
		} else if path, err := generateTTS(workspace, content); err == nil {
			audioPath = path
		} else {
			logger.DebugCF("agent", "TTS generation skipped/failed (message tool)", map[string]interface{}{
				"error": err.Error(),
			})
		}
		msgBus.PublishOutbound(bus.OutboundMessage{
			Channel:   channel,
			ChatID:    chatID,
			Content:   content,
			AudioPath: audioPath,
		})
		return nil
	})
	reg.Register(msgTool)

	return reg
}
// NewAgentLoop wires up a fully configured agent: tool registries for the
// main agent and its subagents, session/state managers, and the context
// builder. The returned loop is ready for Run.
func NewAgentLoop(cfg *config.Config, msgBus *bus.MessageBus, provider providers.LLMProvider) *AgentLoop {
	workspace := cfg.WorkspacePath()
	// Best-effort: downstream components surface their own errors if the
	// workspace is genuinely unusable, so a failure here is deliberately ignored.
	_ = os.MkdirAll(workspace, 0755)
	restrict := cfg.Agents.Defaults.RestrictToWorkspace

	// Create tool registry for main agent
	toolsRegistry := createToolRegistry(workspace, restrict, cfg, msgBus)

	// Create subagent manager with its own tool registry.
	// Subagents don't get spawn/subagent tools, which avoids recursion.
	subagentManager := tools.NewSubagentManager(provider, cfg.Agents.Defaults.Model, workspace, msgBus)
	subagentTools := createToolRegistry(workspace, restrict, cfg, msgBus)
	subagentManager.SetTools(subagentTools)

	// Register spawn tool (async) and subagent tool (synchronous execution)
	// for the main agent only.
	spawnTool := tools.NewSpawnTool(subagentManager)
	toolsRegistry.Register(spawnTool)
	subagentTool := tools.NewSubagentTool(subagentManager)
	toolsRegistry.Register(subagentTool)

	sessionsManager := session.NewSessionManager(filepath.Join(workspace, "sessions"))
	// Create state manager for atomic state persistence
	stateManager := state.NewManager(workspace)
	// Create context builder and set tools registry
	contextBuilder := NewContextBuilder(workspace)
	contextBuilder.SetToolsRegistry(toolsRegistry)

	// Note: summarizing (sync.Map) and running (atomic.Bool) are usable at
	// their zero values and need no explicit initialization here.
	return &AgentLoop{
		config:         cfg,
		bus:            msgBus,
		provider:       provider,
		workspace:      workspace,
		model:          cfg.Agents.Defaults.Model,
		fallbackModels: cfg.Agents.Defaults.FallbackModels,
		contextWindow:  cfg.Agents.Defaults.MaxTokens, // Restore context window for summarization
		maxIterations:  cfg.Agents.Defaults.MaxToolIterations,
		sessions:       sessionsManager,
		state:          stateManager,
		contextBuilder: contextBuilder,
		tools:          toolsRegistry,
		cache:          make(map[string]ToolCacheEntry),
	}
}
// Markdown-cleanup patterns for TTS input, compiled once at package init
// instead of on every call (regexp.MustCompile is idiomatic at package scope).
var (
	ttsCodeBlockRe  = regexp.MustCompile("```[\\s\\S]*?```")
	ttsInlineCodeRe = regexp.MustCompile("`[^`]*`")
	ttsLinkRe       = regexp.MustCompile(`\[([^\]]+)\]\([^\)]+\)`)
	ttsSymbolRe     = regexp.MustCompile(`[\*\_#]`)
)

// generateTTS converts text to speech by invoking the voice-tts skill's
// speak.py script. Markdown markup is stripped/replaced first so the audio
// reads naturally. It returns the path of the generated audio file, or an
// error if the skill is not installed or the script fails.
func generateTTS(workspace, text string) (string, error) {
	// Clean text for TTS (remove markdown symbols):
	// code blocks -> "code block", inline code -> "code",
	// [text](url) -> text, and bold/italic/header markers removed.
	cleanText := ttsCodeBlockRe.ReplaceAllString(text, "code block")
	cleanText = ttsInlineCodeRe.ReplaceAllString(cleanText, "code")
	cleanText = ttsLinkRe.ReplaceAllString(cleanText, "$1")
	cleanText = ttsSymbolRe.ReplaceAllString(cleanText, "")

	// Search for the skill in the workspace, then system-wide locations.
	skillPaths := []string{
		filepath.Join(workspace, "skills", "voice-tts"),
		"/picoclaw/skills/voice-tts",
		"workspace/skills/voice-tts",
	}
	var scriptPath string
	for _, p := range skillPaths {
		sp := filepath.Join(p, "scripts", "speak.py")
		if _, err := os.Stat(sp); err == nil {
			scriptPath = sp
			break
		}
	}
	if scriptPath == "" {
		return "", fmt.Errorf("voice-tts skill not found")
	}

	// Unique temp output file per invocation.
	outFile := filepath.Join(os.TempDir(), fmt.Sprintf("tts_%d.mp3", time.Now().UnixNano()))

	// python3 script.py "text" --file outFile --no-play
	// (arguments are passed directly to exec, no shell interpolation).
	cmd := exec.Command("python3", scriptPath, cleanText, "--file", outFile, "--no-play")
	if out, err := cmd.CombinedOutput(); err != nil {
		return "", fmt.Errorf("tts execution failed: %v, output: %s", err, out)
	}
	return outFile, nil
}
// Run drives the agent's main receive/process/respond loop until the
// context is cancelled or Stop is called. Responses are published with an
// optional TTS audio attachment, unless the message tool already replied
// during this round.
func (al *AgentLoop) Run(ctx context.Context) error {
	al.running.Store(true)
	for al.running.Load() {
		select {
		case <-ctx.Done():
			return nil
		default:
		}

		msg, ok := al.bus.ConsumeInbound(ctx)
		if !ok {
			continue
		}

		reply, err := al.processMessage(ctx, msg)
		if err != nil {
			reply = fmt.Sprintf("Error processing message: %v", err)
		}
		if reply == "" {
			continue
		}

		// If the message tool already sent something during this round,
		// skip publishing to avoid duplicate messages to the user.
		alreadySent := false
		if tool, found := al.tools.Get("message"); found {
			if mt, isMsg := tool.(*tools.MessageTool); isMsg {
				alreadySent = mt.HasSentInRound()
			}
		}
		if alreadySent {
			continue
		}

		// Best-effort TTS; a failure (e.g. skill not installed) only logs.
		var audioPath string
		if path, ttsErr := generateTTS(al.workspace, reply); ttsErr == nil {
			audioPath = path
		} else {
			logger.DebugCF("agent", "TTS generation skipped/failed", map[string]interface{}{
				"error": ttsErr.Error(),
			})
		}

		al.bus.PublishOutbound(bus.OutboundMessage{
			Channel:   msg.Channel,
			ChatID:    msg.ChatID,
			Content:   reply,
			AudioPath: audioPath,
		})
	}
	return nil
}
// Stop signals Run to exit after the current loop iteration.
func (al *AgentLoop) Stop() {
	al.running.Store(false)
}
// RegisterTool adds an additional tool to the main agent's registry.
func (al *AgentLoop) RegisterTool(tool tools.Tool) {
	al.tools.Register(tool)
}
// SetChannelManager attaches the channel manager used for channel-aware
// features.
func (al *AgentLoop) SetChannelManager(cm *channels.Manager) {
	al.channelManager = cm
}
// RecordLastChannel records the last active channel for this workspace.
// This uses the atomic state save mechanism to prevent data loss on crash.
func (al *AgentLoop) RecordLastChannel(channel string) error {
	return al.state.SetLastChannel(channel)
}
// RecordLastChatID records the last active chat ID for this workspace.
// This uses the atomic state save mechanism to prevent data loss on crash.
func (al *AgentLoop) RecordLastChatID(chatID string) error {
	return al.state.SetLastChatID(chatID)
}
// ProcessDirect processes content as if it arrived on the internal "cli"
// channel with chat ID "direct". Used for programmatic invocations.
func (al *AgentLoop) ProcessDirect(ctx context.Context, content, sessionKey string) (string, error) {
	return al.ProcessDirectWithChannel(ctx, content, sessionKey, "cli", "direct")
}
// ProcessDirectWithChannel processes content on behalf of the given channel
// and chat ID, bypassing the message bus, and returns the agent's response.
// NOTE(review): SenderID is hardcoded to "cron" even for non-cron callers
// (e.g. ProcessDirect) — presumably only used for logging; confirm before
// relying on it.
func (al *AgentLoop) ProcessDirectWithChannel(ctx context.Context, content, sessionKey, channel, chatID string) (string, error) {
	msg := bus.InboundMessage{
		Channel:    channel,
		SenderID:   "cron",
		ChatID:     chatID,
		Content:    content,
		SessionKey: sessionKey,
	}
	return al.processMessage(ctx, msg)
}
// ProcessHeartbeat processes a heartbeat request without session history.
// Each heartbeat is independent and doesn't accumulate context: history is
// skipped (NoHistory), no summarization is triggered, and the response is
// returned rather than published on the bus.
func (al *AgentLoop) ProcessHeartbeat(ctx context.Context, content, channel, chatID string) (string, error) {
	return al.runAgentLoop(ctx, processOptions{
		SessionKey:      "heartbeat",
		Channel:         channel,
		ChatID:          chatID,
		UserMessage:     content,
		DefaultResponse: "Saya telah selesai memproses pesan, namun tidak ada respons tambahan.",
		EnableSummary:   false,
		SendResponse:    false,
		NoHistory:       true, // Don't load session history for heartbeat
	})
}
// processMessage is the per-message entry point: it logs the message,
// routes system-channel traffic to processSystemMessage, lets command
// handlers short-circuit, and otherwise runs the full agent loop.
func (al *AgentLoop) processMessage(ctx context.Context, msg bus.InboundMessage) (string, error) {
	// Error-looking messages are logged in full; everything else is truncated.
	logContent := utils.Truncate(msg.Content, 80)
	if strings.Contains(msg.Content, "Error:") || strings.Contains(msg.Content, "error") {
		logContent = msg.Content
	}
	logger.InfoCF("agent", fmt.Sprintf("Processing message from %s:%s: %s", msg.Channel, msg.SenderID, logContent),
		map[string]interface{}{
			"channel":     msg.Channel,
			"chat_id":     msg.ChatID,
			"sender_id":   msg.SenderID,
			"session_key": msg.SessionKey,
		})

	// System messages (subagent completions etc.) take a separate path.
	if msg.Channel == "system" {
		return al.processSystemMessage(ctx, msg)
	}

	// Commands are handled without invoking the LLM.
	if response, handled := al.handleCommand(ctx, msg); handled {
		return response, nil
	}

	// Regular user message: run the full LLM/tool loop.
	return al.runAgentLoop(ctx, processOptions{
		SessionKey:      msg.SessionKey,
		Channel:         msg.Channel,
		ChatID:          msg.ChatID,
		UserMessage:     msg.Content,
		DefaultResponse: "Saya telah selesai memproses pesan, namun tidak ada respons tambahan.",
		EnableSummary:   true,
		SendResponse:    false,
		Media:           msg.Media,
	})
}
// processSystemMessage handles internal "system" channel traffic, which
// carries subagent completion notices. The agent acts as a dispatcher only:
// it logs the completion and never responds to the user here — the subagent
// talks to the user directly via the message tool.
func (al *AgentLoop) processSystemMessage(ctx context.Context, msg bus.InboundMessage) (string, error) {
	if msg.Channel != "system" {
		return "", fmt.Errorf("processSystemMessage called with non-system message channel: %s", msg.Channel)
	}
	logger.InfoCF("agent", "Processing system message",
		map[string]interface{}{
			"sender_id": msg.SenderID,
			"chat_id":   msg.ChatID,
		})

	// ChatID is encoded as "channel:chat_id"; recover the origin channel,
	// defaulting to "cli" when no (non-empty) prefix is present.
	originChannel := "cli"
	if prefix, _, found := strings.Cut(msg.ChatID, ":"); found && prefix != "" {
		originChannel = prefix
	}

	// Content format: "Task 'label' completed.\n\nResult:\n<actual content>" —
	// keep only the part after the marker when present.
	content := msg.Content
	if idx := strings.Index(content, "Result:\n"); idx >= 0 {
		content = content[idx+len("Result:\n"):]
	}

	if constants.IsInternalChannel(originChannel) {
		// Internal origin: log only, never notify a user.
		logger.InfoCF("agent", "Subagent completed (internal channel)",
			map[string]interface{}{
				"sender_id":   msg.SenderID,
				"content_len": len(content),
				"channel":     originChannel,
			})
		return "", nil
	}

	logger.InfoCF("agent", "Subagent completed",
		map[string]interface{}{
			"sender_id":   msg.SenderID,
			"channel":     originChannel,
			"content_len": len(content),
		})
	return "", nil
}
// runAgentLoop is the core message processing logic.
// It handles last-channel recording, adaptive iteration limits, context
// building, the LLM/tool iteration loop, empty-response recovery,
// session persistence, optional summarization, and optional response
// publishing. Returns the final assistant content.
func (al *AgentLoop) runAgentLoop(ctx context.Context, opts processOptions) (string, error) {
	// 0. Record last channel for heartbeat notifications (skip internal channels)
	if opts.Channel != "" && opts.ChatID != "" {
		// Don't record internal channels (cli, system, subagent)
		if !constants.IsInternalChannel(opts.Channel) {
			channelKey := fmt.Sprintf("%s:%s", opts.Channel, opts.ChatID)
			if err := al.RecordLastChannel(channelKey); err != nil {
				// Fix: the message previously ended in a literal "%v" that was
				// never substituted (the logger takes a plain message plus a
				// field map); the error already travels in the field map.
				logger.WarnCF("agent", "Failed to record last channel", map[string]interface{}{"error": err.Error()})
			}
		}
	}

	// 1. Update tool contexts
	al.updateToolContexts(opts.Channel, opts.ChatID)

	// Determine adaptive iteration limit when the caller did not set one.
	if opts.MaxIterations == 0 {
		// Heuristic:
		// - Short messages (< 50 chars): likely simple queries -> 10 iterations
		// - Medium messages (< 200 chars): standard tasks -> 25 iterations
		// - Long messages or complex keywords: complex tasks -> al.maxIterations (usually 50)
		msgLen := len(opts.UserMessage)
		opts.MaxIterations = 25 // Default medium
		if msgLen < 50 {
			opts.MaxIterations = 10
		} else if msgLen >= 200 {
			opts.MaxIterations = al.maxIterations
		}
		// Complexity keywords bump the limit above the configured default.
		keywords := []string{"plan", "analyze", "research", "scan", "crawl", "recursive", "complex"}
		lowerMsg := strings.ToLower(opts.UserMessage)
		for _, kw := range keywords {
			if strings.Contains(lowerMsg, kw) {
				opts.MaxIterations = al.maxIterations + 10 // Boost for complex tasks
				break
			}
		}
		// Ensure we don't exceed a hard safety limit (e.g., 100) unless configured
		if opts.MaxIterations > 100 {
			opts.MaxIterations = 100
		}
	}
	logger.InfoCF("agent", "Adaptive iteration limit set", map[string]interface{}{
		"limit":   opts.MaxIterations,
		"msg_len": len(opts.UserMessage),
	})

	// 2. Build messages (skip history for heartbeat)
	var history []providers.Message
	var summary string
	if !opts.NoHistory {
		history = al.sessions.GetHistory(opts.SessionKey)
		summary = al.sessions.GetSummary(opts.SessionKey)
	}
	messages := al.contextBuilder.BuildMessages(
		history,
		summary,
		opts.UserMessage,
		opts.Media,
		opts.Channel,
		opts.ChatID,
	)

	// 3. Save user message to session
	al.sessions.AddMessage(opts.SessionKey, "user", opts.UserMessage)

	// 4. Run LLM iteration loop
	finalContent, iteration, err := al.runLLMIteration(ctx, messages, opts)
	if err != nil {
		return "", err
	}

	// 5. Handle empty response: try to synthesize something meaningful from
	// the last tool result before falling back to the configured default.
	if finalContent == "" {
		history := al.sessions.GetHistory(opts.SessionKey)
		if len(history) > 0 {
			lastMsg := history[len(history)-1]
			if lastMsg.Role == "tool" {
				// Find the tool name by matching the tool-call ID against the
				// preceding assistant message's tool calls.
				var toolName string
				if len(history) > 1 {
					prevMsg := history[len(history)-2]
					if prevMsg.Role == "assistant" {
						for _, tc := range prevMsg.ToolCalls {
							if tc.ID == lastMsg.ToolCallID {
								toolName = tc.Name
								break
							}
						}
					}
				}
				contentPreview := utils.Truncate(lastMsg.Content, 200)
				if toolName != "" {
					finalContent = fmt.Sprintf("Saya telah selesai menjalankan **%s**.\n\nHasil:\n%s", toolName, contentPreview)
				} else {
					finalContent = fmt.Sprintf("Proses selesai.\n\nHasil:\n%s", contentPreview)
				}
			}
		}
		// Fallback to default if still empty
		if finalContent == "" {
			finalContent = opts.DefaultResponse
		}
	}

	// 6. Save final assistant message to session
	al.sessions.AddMessage(opts.SessionKey, "assistant", finalContent)
	al.sessions.Save(opts.SessionKey)

	// 7. Optional: summarization
	if opts.EnableSummary {
		al.maybeSummarize(opts.SessionKey, opts.Channel, opts.ChatID)
	}

	// 8. Optional: send response via bus
	if opts.SendResponse {
		al.bus.PublishOutbound(bus.OutboundMessage{
			Channel: opts.Channel,
			ChatID:  opts.ChatID,
			Content: finalContent,
		})
	}

	// 9. Log response
	responsePreview := utils.Truncate(finalContent, 120)
	logger.InfoCF("agent", fmt.Sprintf("Response: %s", responsePreview),
		map[string]interface{}{
			"session_key":  opts.SessionKey,
			"iterations":   iteration,
			"final_length": len(finalContent),
		})
	return finalContent, nil
}
// runLLMIteration executes the LLM call loop with tool handling.
// Returns the final content, iteration count, and any error.
//
// Per iteration it calls the provider (trying fallback models, with
// retry/backoff for transient and context-window errors), then either
// finishes (no tool calls) or executes the requested tools — read-only
// tools in parallel batches, side-effecting tools sequentially — appends
// the results, and loops. The iteration limit is auto-extended up to a
// hard cap while tools are still being used.
func (al *AgentLoop) runLLMIteration(ctx context.Context, messages []providers.Message, opts processOptions) (string, int, error) {
	iteration := 0
	var finalContent string
	// Use config for dynamic values if not overridden
	maxIterations := opts.MaxIterations
	if maxIterations <= 0 {
		if al.config != nil {
			maxIterations = al.config.GetAgentDefaults().MaxToolIterations
		}
		if maxIterations <= 0 {
			maxIterations = al.maxIterations
		}
	}
	for iteration < maxIterations {
		iteration++
		metrics.AgentIterations.Inc()
		// Adaptive iteration limit:
		// If we are nearing the limit but the agent is still using tools effectively (not looping),
		// we might want to extend the limit slightly.
		// For now, let's implement a simple check: if we hit the limit, but the last action was a successful tool call
		// that produced new information (not an error), we could allow 1-2 more iterations.
		// However, to keep it simple and safe, we'll just log a warning if we hit the limit.
		if iteration == maxIterations {
			logger.WarnCF("agent", "Max iterations reached", map[string]interface{}{
				"limit": maxIterations,
			})
		}
		logger.DebugCF("agent", "LLM iteration",
			map[string]interface{}{
				"iteration": iteration,
				"max":       maxIterations,
			})
		// Build tool definitions
		providerToolDefs := al.tools.ToProviderDefs()
		// Log LLM request details.
		// NOTE(review): messages[0] is assumed to be the system prompt built by
		// ContextBuilder; this indexes without a length check — confirm
		// BuildMessages can never return an empty slice.
		logger.DebugCF("agent", "LLM request",
			map[string]interface{}{
				"iteration":         iteration,
				"model":             al.model,
				"messages_count":    len(messages),
				"tools_count":       len(providerToolDefs),
				"max_tokens":        8192,
				"temperature":       0.7,
				"system_prompt_len": len(messages[0].Content),
			})
		// Log full messages (detailed)
		logger.DebugCF("agent", "Full LLM request",
			map[string]interface{}{
				"iteration":     iteration,
				"messages_json": formatMessagesForLog(messages),
				"tools_json":    formatToolsForLog(providerToolDefs),
			})
		var response *providers.LLMResponse
		var err error
		// Create list of models to try: [current_model, fallback_1, fallback_2, ...]
		modelsToTry := []string{al.model}
		if len(al.fallbackModels) > 0 {
			modelsToTry = append(modelsToTry, al.fallbackModels...)
		} else {
			// Legacy/Fallback hardcoded if config is empty
			backupModels := []string{
				"arcee-ai/trinity-large-preview:free",
			}
			modelsToTry = append(modelsToTry, backupModels...)
		}
		modelSuccess := false
		for modelIdx, modelToUse := range modelsToTry {
			// Retry loop for context/token errors
			maxRetries := 2
			for retry := 0; retry <= maxRetries; retry++ {
				response, err = al.provider.Chat(ctx, messages, providerToolDefs, modelToUse, map[string]interface{}{
					"max_tokens":  8192,
					"temperature": 0.7,
				})
				if err == nil {
					modelSuccess = true
					metrics.LLMRequests.WithLabelValues(modelToUse, "success").Inc()
					break // Success
				}
				metrics.LLMRequests.WithLabelValues(modelToUse, "error").Inc()
				errMsg := strings.ToLower(err.Error())
				// Check for context window errors (provider specific, but usually contain "token" or "invalid")
				isContextError := strings.Contains(errMsg, "token") ||
					strings.Contains(errMsg, "context") ||
					strings.Contains(errMsg, "invalidparameter") ||
					strings.Contains(errMsg, "length")
				// Check for transient errors (network, server error)
				isTransientError := strings.Contains(errMsg, "timeout") ||
					strings.Contains(errMsg, "connection") ||
					strings.Contains(errMsg, "500") ||
					strings.Contains(errMsg, "502") ||
					strings.Contains(errMsg, "503") ||
					strings.Contains(errMsg, "504") ||
					strings.Contains(errMsg, "rate limit") ||
					strings.Contains(errMsg, "429")
				if (isContextError || isTransientError) && retry < maxRetries {
					logger.WarnCF("agent", "Recoverable error detected, retrying with backoff", map[string]interface{}{
						"error":        err.Error(),
						"retry":        retry,
						"model":        modelToUse,
						"is_context":   isContextError,
						"is_transient": isTransientError,
					})
					// Exponential backoff: 1s, 2s, 4s
					backoff := time.Duration(1<<retry) * time.Second
					time.Sleep(backoff)
					if isContextError {
						if retry == 0 && !constants.IsInternalChannel(opts.Channel) && opts.SendResponse {
							al.bus.PublishOutbound(bus.OutboundMessage{
								Channel: opts.Channel,
								ChatID:  opts.ChatID,
								Content: "⚠️ Context window exceeded. Compressing history and retrying...",
							})
						}
						// Apply compression logic if needed (currently simple retry)
						// Ideally call al.forceCompression(opts.SessionKey) here if we had access to modify history in-place
						// But history is passed as argument 'messages'.
						// To fix context error, we MUST reduce 'messages'.
						// Simple truncation for retry
						if len(messages) > 2 {
							// Drop a few oldest messages from the middle (preserve system prompt and last few)
							// messages[0] is system.
							// Remove messages[1] and messages[2] if available
							if len(messages) > 4 {
								// Remove 2 messages (user+assistant pair usually).
								// NOTE(review): if messages[1]/[2] are an assistant
								// tool-call and its tool result, dropping them can
								// orphan the pairing some providers require — verify
								// against the provider's message validation.
								newMessages := make([]providers.Message, 0, len(messages)-2)
								newMessages = append(newMessages, messages[0])
								newMessages = append(newMessages, messages[3:]...)
								messages = newMessages
								logger.WarnCF("agent", "Dropped 2 oldest messages for retry", nil)
							}
						}
					}
				} else {
					// Non-recoverable or max retries reached
					break
				}
			}
			if modelSuccess {
				if modelToUse != al.model {
					logger.WarnCF("agent", "Switched to fallback model", map[string]interface{}{
						"original": al.model,
						"current":  modelToUse,
					})
				}
				break
			}
			logger.WarnCF("agent", "Model failed, checking fallbacks", map[string]interface{}{
				"model":    modelToUse,
				"error":    err.Error(),
				"has_more": modelIdx < len(modelsToTry)-1,
			})
		}
		if !modelSuccess {
			logger.ErrorCF("agent", "LLM call failed after all models tried", map[string]interface{}{
				"error": err.Error(),
			})
			return "", iteration, fmt.Errorf("LLM call failed after all models tried: %w", err)
		}
		// Check if no tool calls - we're done
		if len(response.ToolCalls) == 0 {
			finalContent = response.Content
			logger.InfoCF("agent", "LLM response without tool calls (direct answer)",
				map[string]interface{}{
					"iteration":     iteration,
					"content_chars": len(finalContent),
				})
			break
		}
		// Log tool calls
		toolNames := make([]string, 0, len(response.ToolCalls))
		for _, tc := range response.ToolCalls {
			toolNames = append(toolNames, tc.Name)
		}
		logger.InfoCF("agent", "LLM requested tool calls",
			map[string]interface{}{
				"tools":     toolNames,
				"count":     len(response.ToolCalls),
				"iteration": iteration,
			})
		// Build assistant message with tool calls
		assistantMsg := providers.Message{
			Role:    "assistant",
			Content: response.Content,
		}
		for _, tc := range response.ToolCalls {
			argumentsJSON, _ := json.Marshal(tc.Arguments)
			assistantMsg.ToolCalls = append(assistantMsg.ToolCalls, providers.ToolCall{
				ID:   tc.ID,
				Type: "function",
				Function: &providers.FunctionCall{
					Name:      tc.Name,
					Arguments: string(argumentsJSON),
				},
			})
		}
		messages = append(messages, assistantMsg)
		// Save assistant message with tool calls to session
		al.sessions.AddFullMessage(opts.SessionKey, assistantMsg)
		// Execute tool calls
		// We execute read-only tools in parallel, and side-effect tools sequentially to preserve causality.
		// Results must be appended to messages in the original order.
		results := make([]providers.Message, len(response.ToolCalls))
		executed := make([]bool, len(response.ToolCalls))
		// Helper to check if tool is safe for parallel execution (read-only,
		// no ordering dependency on other tools).
		isSafe := func(name string) bool {
			switch name {
			case "read_file", "list_dir", "web_fetch", "web_search", "weather":
				return true
			default:
				return false
			}
		}
		// Helper to check if tool result is cacheable (deterministic over the
		// cache TTL window).
		isCacheable := func(name string) bool {
			switch name {
			case "read_file", "list_dir":
				return true
			default:
				return false
			}
		}
		i := 0
		for i < len(response.ToolCalls) {
			// Identify a batch of safe tools
			start := i
			end := i
			if isSafe(response.ToolCalls[i].Name) {
				// Extend batch while tools are safe
				for end < len(response.ToolCalls) && isSafe(response.ToolCalls[end].Name) {
					end++
				}
			} else {
				// Single unsafe tool
				end = i + 1
			}
			// Execute batch. Each goroutine writes only to its own slot in
			// results/executed, so no locking is needed on those slices.
			var wg sync.WaitGroup
			for j := start; j < end; j++ {
				wg.Add(1)
				go func(idx int, tc providers.ToolCall) {
					defer wg.Done()
					// Log tool call with arguments preview
					argsJSON, _ := json.Marshal(tc.Arguments)
					argsPreview := utils.Truncate(string(argsJSON), 200)
					logger.InfoCF("agent", fmt.Sprintf("Tool call: %s(%s)", tc.Name, argsPreview),
						map[string]interface{}{
							"tool":      tc.Name,
							"iteration": iteration,
						})
					var toolResult *tools.ToolResult
					var cacheKey string
					// Check cache for deterministic tools
					if isCacheable(tc.Name) {
						cacheKey = tc.Name + ":" + string(argsJSON)
						al.cacheMutex.RLock()
						if entry, ok := al.cache[cacheKey]; ok && time.Now().Before(entry.ExpiresAt) {
							toolResult = entry.Result
							logger.DebugCF("agent", "Cache hit for tool", map[string]interface{}{"tool": tc.Name})
							metrics.ToolCacheHits.WithLabelValues(tc.Name).Inc()
						} else {
							metrics.ToolCacheMisses.WithLabelValues(tc.Name).Inc()
						}
						al.cacheMutex.RUnlock()
					}
					if toolResult == nil {
						// Create async callback
						asyncCallback := func(callbackCtx context.Context, result *tools.ToolResult) {
							if !result.Silent && result.ForUser != "" {
								logger.InfoCF("agent", "Async tool completed, agent will handle notification",
									map[string]interface{}{
										"tool":        tc.Name,
										"content_len": len(result.ForUser),
									})
							}
						}
						// Retry logic for tool execution (transient errors only,
						// with 1s/2s exponential backoff).
						maxRetries := 2
						for retry := 0; retry <= maxRetries; retry++ {
							toolResult = al.tools.ExecuteWithContext(ctx, tc.Name, tc.Arguments, opts.Channel, opts.ChatID, asyncCallback)
							if toolResult.Err == nil {
								break
							}
							// Check for transient errors
							errMsg := strings.ToLower(toolResult.Err.Error())
							isTransient := strings.Contains(errMsg, "timeout") ||
								strings.Contains(errMsg, "connection") ||
								strings.Contains(errMsg, "rate limit") ||
								strings.Contains(errMsg, "429") ||
								strings.Contains(errMsg, "500") ||
								strings.Contains(errMsg, "502") ||
								strings.Contains(errMsg, "503") ||
								strings.Contains(errMsg, "504") ||
								strings.Contains(errMsg, "temporary")
							if !isTransient {
								break
							}
							if retry < maxRetries {
								logger.WarnCF("agent", "Tool execution failed, retrying", map[string]interface{}{
									"tool":  tc.Name,
									"error": toolResult.Err.Error(),
									"retry": retry,
								})
								time.Sleep(time.Duration(1<<retry) * time.Second)
							}
						}
						// Update cache if successful
						if isCacheable(tc.Name) && toolResult.Err == nil {
							al.cacheMutex.Lock()
							al.cache[cacheKey] = ToolCacheEntry{
								Result:    toolResult,
								ExpiresAt: time.Now().Add(60 * time.Second), // 60s TTL
							}
							al.cacheMutex.Unlock()
						}
					}
					// Send ForUser content to user immediately if not Silent
					if !toolResult.Silent && toolResult.ForUser != "" && opts.SendResponse {
						al.bus.PublishOutbound(bus.OutboundMessage{
							Channel: opts.Channel,
							ChatID:  opts.ChatID,
							Content: toolResult.ForUser,
						})
						logger.DebugCF("agent", "Sent tool result to user",
							map[string]interface{}{
								"tool":        tc.Name,
								"content_len": len(toolResult.ForUser),
							})
					}
					// Determine content for LLM based on tool result
					contentForLLM := toolResult.ForLLM
					if contentForLLM == "" && toolResult.Err != nil {
						contentForLLM = toolResult.Err.Error()
					}
					results[idx] = providers.Message{
						Role:       "tool",
						Content:    contentForLLM,
						ToolCallID: tc.ID,
					}
					executed[idx] = true
				}(j, response.ToolCalls[j])
			}
			wg.Wait()
			i = end
		}
		// Append results to messages and session in order
		for idx, res := range results {
			if !executed[idx] {
				// Should not happen if logic is correct
				logger.ErrorCF("agent", "Tool result missing for index", map[string]interface{}{"index": idx})
				continue
			}
			messages = append(messages, res)
			al.sessions.AddFullMessage(opts.SessionKey, res)
		}
		// Automatic iteration extension
		// If we reached the limit but just finished executing tools, the task is likely not done.
		// We extend the limit to allow the agent to finish, up to a hard safety limit.
		if iteration >= maxIterations {
			hardLimit := 100 // Default safety hard limit
			// If config has a higher limit, respect that + buffer
			if al.config != nil {
				configLimit := al.config.GetAgentDefaults().MaxToolIterations
				if configLimit > hardLimit {
					hardLimit = configLimit + 20
				}
			}
			if maxIterations < hardLimit {
				extension := 10
				newLimit := maxIterations + extension
				if newLimit > hardLimit {
					newLimit = hardLimit
				}
				if newLimit > maxIterations {
					logger.WarnCF("agent", "Auto-extending iteration limit", map[string]interface{}{
						"old_limit": maxIterations,
						"new_limit": newLimit,
						"reason":    "task ongoing",
					})
					maxIterations = newLimit
					// Notify user slightly if it's a significant extension
					if maxIterations > 30 && !constants.IsInternalChannel(opts.Channel) && opts.SendResponse {
						// Only send a subtle notification once or if really long
						if maxIterations == 40 || maxIterations == 70 {
							al.bus.PublishOutbound(bus.OutboundMessage{
								Channel: opts.Channel,
								ChatID:  opts.ChatID,
								Content: fmt.Sprintf("🔄 Memperpanjang waktu proses (%d langkah)...", maxIterations),
							})
						}
					}
				}
			}
		}
	}
	return finalContent, iteration, nil
}
// updateToolContexts propagates the active channel/chat ID to every tool
// that needs delivery context. The previous implementation repeated the
// same lookup/assert/set sequence for each tool name; a single loop over
// the names is equivalent and easier to extend.
func (al *AgentLoop) updateToolContexts(channel, chatID string) {
	// Use ContextualTool interface instead of concrete type assertions.
	for _, name := range []string{"message", "spawn", "subagent"} {
		if tool, ok := al.tools.Get(name); ok {
			if ct, ok := tool.(tools.ContextualTool); ok {
				ct.SetContext(channel, chatID)
			}
		}
	}
}
// maybeSummarize kicks off background summarization when the session
// history grows past either a message-count or token-estimate threshold.
// At most one summarization per session runs at a time (tracked via
// al.summarizing); users on external channels get a heads-up notification.
func (al *AgentLoop) maybeSummarize(sessionKey, channel, chatID string) {
	history := al.sessions.GetHistory(sessionKey)
	estimate := al.estimateTokens(history)
	threshold := al.contextWindow * 75 / 100
	if len(history) <= 20 && estimate <= threshold {
		return
	}
	// LoadOrStore wins the race: only the first caller per session proceeds.
	if _, busy := al.summarizing.LoadOrStore(sessionKey, true); busy {
		return
	}
	go func() {
		defer al.summarizing.Delete(sessionKey)
		if !constants.IsInternalChannel(channel) {
			al.bus.PublishOutbound(bus.OutboundMessage{
				Channel: channel,
				ChatID:  chatID,
				Content: "🧹 Sedang merapikan ingatan percakapan untuk menjaga performa...",
			})
		}
		al.summarizeSession(sessionKey)
	}()
}
// forceCompression aggressively reduces context when the limit is hit.
// It keeps the system prompt and the most recent message, drops the oldest
// half of the conversation in between, and inserts a system note marking
// the gap. The separately-stored session summary is unaffected.
func (al *AgentLoop) forceCompression(sessionKey string) {
	history := al.sessions.GetHistory(sessionKey)
	if len(history) <= 4 {
		return
	}

	// Conversation = everything between the system prompt ([0]) and the
	// very last message (the user's trigger).
	conversation := history[1 : len(history)-1]
	if len(conversation) == 0 {
		return
	}
	dropped := len(conversation) / 2
	retained := conversation[dropped:]

	// Rebuild: system prompt, compression note, newer half, last message.
	note := fmt.Sprintf("[System: Emergency compression dropped %d oldest messages due to context limit]", dropped)
	compacted := make([]providers.Message, 0, len(retained)+3)
	compacted = append(compacted, history[0])
	compacted = append(compacted, providers.Message{
		Role:    "system",
		Content: note,
	})
	compacted = append(compacted, retained...)
	compacted = append(compacted, history[len(history)-1])

	al.sessions.SetHistory(sessionKey, compacted)
	al.sessions.Save(sessionKey)
	logger.WarnCF("agent", "Forced compression executed", map[string]interface{}{
		"session_key":  sessionKey,
		"dropped_msgs": dropped,
		"new_count":    len(compacted),
	})
}
// GetStartupInfo returns information about loaded tools and skills for logging.
//
// The result maps "tools" to a count plus the list of registered tool names,
// and "skills" to whatever the context builder reports.
func (al *AgentLoop) GetStartupInfo() map[string]interface{} {
	info := make(map[string]interface{})

	// Tools info. Named toolNames so the local does not shadow the
	// imported "tools" package.
	toolNames := al.tools.List()
	info["tools"] = map[string]interface{}{
		"count": len(toolNames),
		"names": toolNames,
	}

	// Skills info
	info["skills"] = al.contextBuilder.GetSkillsInfo()
	return info
}
// formatMessagesForLog formats messages for logging.
//
// Produces a bracketed, multi-line dump of each message's role, tool calls
// (with arguments truncated to 200 characters), content, and tool-call ID.
func formatMessagesForLog(messages []providers.Message) string {
	if len(messages) == 0 {
		return "[]"
	}

	// Use a pooled buffer to avoid per-call allocations.
	buf := utils.GetBuffer()
	defer utils.PutBuffer(buf)

	buf.WriteString("[\n")
	for idx, m := range messages {
		fmt.Fprintf(buf, " [%d] Role: %s\n", idx, m.Role)
		if len(m.ToolCalls) > 0 {
			buf.WriteString(" ToolCalls:\n")
			for _, call := range m.ToolCalls {
				fmt.Fprintf(buf, " - ID: %s, Type: %s, Name: %s\n", call.ID, call.Type, call.Name)
				if call.Function != nil {
					fmt.Fprintf(buf, " Arguments: %s\n", utils.Truncate(call.Function.Arguments, 200))
				}
			}
		}
		if m.Content != "" {
			fmt.Fprintf(buf, " Content: %s\n", utils.Truncate(m.Content, 200))
		}
		if m.ToolCallID != "" {
			fmt.Fprintf(buf, " ToolCallID: %s\n", m.ToolCallID)
		}
		buf.WriteString("\n")
	}
	buf.WriteString("]")
	return buf.String()
}
// formatToolsForLog formats tool definitions for logging.
//
// Produces a bracketed, multi-line dump of each definition's type, name,
// description, and (truncated) parameter schema. The parameter is named
// defs so it does not shadow the imported "tools" package.
func formatToolsForLog(defs []providers.ToolDefinition) string {
	if len(defs) == 0 {
		return "[]"
	}

	// Use a pooled buffer to avoid per-call allocations.
	buf := utils.GetBuffer()
	defer utils.PutBuffer(buf)

	buf.WriteString("[\n")
	for i, def := range defs {
		fmt.Fprintf(buf, " [%d] Type: %s, Name: %s\n", i, def.Type, def.Function.Name)
		fmt.Fprintf(buf, " Description: %s\n", def.Function.Description)
		if len(def.Function.Parameters) > 0 {
			fmt.Fprintf(buf, " Parameters: %s\n", utils.Truncate(fmt.Sprintf("%v", def.Function.Parameters), 200))
		}
	}
	buf.WriteString("]")
	return buf.String()
}
// summarizeSession summarizes the conversation history for a session.
//
// It keeps the last 4 messages for continuity, filters out non-user/assistant
// and oversized messages, summarizes (in two halves for long histories), and
// on success stores the summary and truncates the history.
//
// Bug fix: batch errors were previously discarded; if both halves failed the
// fallback concatenation produced the non-empty string " ", which passed the
// emptiness check and truncated the history with a useless summary. Failed or
// empty halves are now handled explicitly so history is never destroyed
// without a real summary.
func (al *AgentLoop) summarizeSession(sessionKey string) {
	ctx, cancel := context.WithTimeout(context.Background(), 120*time.Second)
	defer cancel()

	history := al.sessions.GetHistory(sessionKey)
	summary := al.sessions.GetSummary(sessionKey)

	// Keep last 4 messages for continuity.
	if len(history) <= 4 {
		return
	}
	toSummarize := history[:len(history)-4]

	// Oversized Message Guard:
	// skip messages larger than 50% of the context window to prevent
	// summarizer overflow. Only user/assistant messages are summarized.
	maxMessageTokens := al.contextWindow / 2
	validMessages := make([]providers.Message, 0, len(toSummarize))
	omitted := false
	for _, m := range toSummarize {
		if m.Role != "user" && m.Role != "assistant" {
			continue
		}
		// Conservative estimate: ~2 chars per token (integer division).
		if len(m.Content)/2 > maxMessageTokens {
			omitted = true
			continue
		}
		validMessages = append(validMessages, m)
	}
	if len(validMessages) == 0 {
		return
	}

	// Multi-Part Summarization: split into two halves when the history is
	// significant, then merge the partial summaries.
	var finalSummary string
	if len(validMessages) > 10 {
		mid := len(validMessages) / 2
		s1, err1 := al.summarizeBatch(ctx, validMessages[:mid], "")
		s2, err2 := al.summarizeBatch(ctx, validMessages[mid:], "")
		if err1 != nil {
			s1 = ""
		}
		if err2 != nil {
			s2 = ""
		}
		switch {
		case s1 == "" && s2 == "":
			// Both halves failed: keep history intact and retry later.
			logger.WarnCF("agent", "Summarization failed for both halves", map[string]interface{}{
				"session_key": sessionKey,
			})
			return
		case s1 == "":
			finalSummary = s2
		case s2 == "":
			finalSummary = s1
		default:
			// Merge the two partial summaries into one.
			mergePrompt := fmt.Sprintf("Merge these two conversation summaries into one cohesive summary:\n\n1: %s\n\n2: %s", s1, s2)
			resp, err := al.provider.Chat(ctx, []providers.Message{{Role: "user", Content: mergePrompt}}, nil, al.model, map[string]interface{}{
				"max_tokens":  1024,
				"temperature": 0.3,
			})
			if err == nil {
				finalSummary = resp.Content
			} else {
				// Merge failed: fall back to simple concatenation.
				finalSummary = s1 + " " + s2
			}
		}
	} else {
		finalSummary, _ = al.summarizeBatch(ctx, validMessages, summary)
	}

	if omitted && finalSummary != "" {
		finalSummary += "\n[Note: Some oversized messages were omitted from this summary for efficiency.]"
	}

	// Only truncate history once a non-empty summary has been produced.
	if finalSummary != "" {
		al.sessions.SetSummary(sessionKey, finalSummary)
		al.sessions.TruncateHistory(sessionKey, 4)
		al.sessions.Save(sessionKey)
	}
}
// summarizeBatch summarizes a batch of messages.
//
// The prompt optionally embeds an existing summary for continuity, followed
// by the batch transcript. Returns the LLM's summary text, or an error if
// the provider call fails. Uses strings.Builder instead of repeated string
// concatenation, which is quadratic for long batches.
func (al *AgentLoop) summarizeBatch(ctx context.Context, batch []providers.Message, existingSummary string) (string, error) {
	var prompt strings.Builder
	prompt.WriteString("Provide a concise summary of this conversation segment, preserving core context and key points.\n")
	if existingSummary != "" {
		prompt.WriteString("Existing context: ")
		prompt.WriteString(existingSummary)
		prompt.WriteString("\n")
	}
	prompt.WriteString("\nCONVERSATION:\n")
	for _, m := range batch {
		fmt.Fprintf(&prompt, "%s: %s\n", m.Role, m.Content)
	}

	response, err := al.provider.Chat(ctx, []providers.Message{{Role: "user", Content: prompt.String()}}, nil, al.model, map[string]interface{}{
		"max_tokens":  1024,
		"temperature": 0.3,
	})
	if err != nil {
		return "", err
	}
	return response.Content, nil
}
// estimateTokens estimates the number of tokens in a message list.
// Uses a safe heuristic of 2.5 characters per token to account for CJK and
// other overheads better than the previous 3 chars/token.
func (al *AgentLoop) estimateTokens(messages []providers.Message) int {
	runes := 0
	for i := range messages {
		runes += utf8.RuneCountInString(messages[i].Content)
	}
	// 2.5 chars per token ⇒ tokens = runes * 2 / 5 (integer arithmetic).
	return runes * 2 / 5
}
// handleCommand intercepts slash-commands (/show, /list, /switch) before the
// message reaches the LLM. It returns the response text and true when the
// message was a recognized command; ("", false) means the message should be
// processed normally. ctx is currently unused here — presumably kept for
// signature symmetry with other handlers; TODO confirm.
func (al *AgentLoop) handleCommand(ctx context.Context, msg bus.InboundMessage) (string, bool) {
	content := strings.TrimSpace(msg.Content)
	// Only messages starting with "/" are candidate commands.
	if !strings.HasPrefix(content, "/") {
		return "", false
	}
	parts := strings.Fields(content)
	if len(parts) == 0 {
		return "", false
	}
	cmd := parts[0]
	args := parts[1:]
	switch cmd {
	case "/show":
		// /show [model|channel] — display the current model or source channel.
		if len(args) < 1 {
			return "Usage: /show [model|channel]", true
		}
		switch args[0] {
		case "model":
			return fmt.Sprintf("Current model: %s", al.model), true
		case "channel":
			return fmt.Sprintf("Current channel: %s", msg.Channel), true
		default:
			return fmt.Sprintf("Unknown show target: %s", args[0]), true
		}
	case "/list":
		// /list [models|channels] — enumerate available models or enabled channels.
		if len(args) < 1 {
			return "Usage: /list [models|channels]", true
		}
		switch args[0] {
		case "models":
			// TODO: Fetch available models dynamically if possible
			return "Available models: glm-4.7, claude-3-5-sonnet, gpt-4o (configured in config.json/env)", true
		case "channels":
			if al.channelManager == nil {
				return "Channel manager not initialized", true
			}
			channels := al.channelManager.GetEnabledChannels()
			if len(channels) == 0 {
				return "No channels enabled", true
			}
			return fmt.Sprintf("Enabled channels: %s", strings.Join(channels, ", ")), true
		default:
			return fmt.Sprintf("Unknown list target: %s", args[0]), true
		}
	case "/switch":
		// /switch [model|channel] to <name> — requires the literal word "to".
		if len(args) < 3 || args[1] != "to" {
			return "Usage: /switch [model|channel] to <name>", true
		}
		target := args[0]
		value := args[2]
		switch target {
		case "model":
			// NOTE(review): al.model is mutated here without synchronization;
			// concurrent readers elsewhere may race — confirm access pattern.
			oldModel := al.model
			al.model = value
			return fmt.Sprintf("Switched model from %s to %s", oldModel, value), true
		case "channel":
			// This changes the 'default' channel for some operations, or effectively redirects output?
			// For now, let's just validate if the channel exists.
			if al.channelManager == nil {
				return "Channel manager not initialized", true
			}
			// "cli" is accepted even when not registered with the manager.
			if _, exists := al.channelManager.GetChannel(value); !exists && value != "cli" {
				return fmt.Sprintf("Channel '%s' not found or not enabled", value), true
			}
			// If message came from CLI, maybe we want to redirect CLI output to this channel?
			// That would require state persistence about "redirected channel".
			// For now, just acknowledged.
			return fmt.Sprintf("Switched target channel to %s (Note: this currently only validates existence)", value), true
		default:
			return fmt.Sprintf("Unknown switch target: %s", target), true
		}
	}
	// Unrecognized slash-command: fall through to normal processing.
	return "", false
}