Initial commit: Orca Agent Framework

Core features: microkernel architecture with Actor model; session management with JSONL persistence; tool system (5 built-in tools); skill system with SKILL.md parsing; sandboxed execution; Ollama integration with gemma4:e4b; prompt-based tool calling (compatible with native function calling); REPL interface. 11 packages, all tests passing.
2026-05-08 00:55:48 +08:00 · 2026-05-08 00:55:48 +08:00 · 6b94476347
commit 6b94476347
42 changed files with 8993 additions and 0 deletions
--- a/cmd/orca/main.go
+++ b/cmd/orca/main.go
@ -0,0 +1,205 @@
 // Orca is a Go-based Agent framework with a microkernel architecture.
 //
 // It supports multi-agent collaboration, persistent session memory,
 // skill-based automation, sandboxed execution, custom tool registration,
 // and local LLM integration via Ollama.
 package main
 import (
 	"bufio"
 	"fmt"
 	"log"
 	"os"
 	"os/signal"
 	"strings"
 	"syscall"
 	"time"
 	"github.com/orca/orca/internal/config"
 	"github.com/orca/orca/pkg/kernel"
 )
 func main() {
 	// Start from the defaults plus any ORCA_*-prefixed environment overrides.
 	cfg := config.LoadConfigFromEnv()
 	// The shorter, un-prefixed OLLAMA_* variables are applied afterwards, so
 	// they win over the ORCA_* values when both are set.
 	if baseURL := os.Getenv("OLLAMA_BASE_URL"); baseURL != "" {
 		cfg.Ollama.BaseURL = baseURL
 	}
 	if model := os.Getenv("OLLAMA_MODEL"); model != "" {
 		cfg.Ollama.Model = model
 	}
 	if raw := os.Getenv("OLLAMA_TIMEOUT"); raw != "" {
 		// An unparseable duration is ignored and the current timeout kept.
 		timeout, err := time.ParseDuration(raw)
 		if err == nil {
 			cfg.Ollama.Timeout = timeout
 		}
 	}
 	// Bring the kernel up before printing the banner.
 	k := kernel.NewWithConfig(cfg)
 	if err := k.Start(); err != nil {
 		log.Fatalf("Failed to start kernel: %v", err)
 	}
 	fmt.Println("Orca Agent Framework")
 	fmt.Println("Kernel started successfully")
 	fmt.Printf("  LLM Model: %s\n", cfg.Ollama.Model)
 	fmt.Printf("  Ollama URL: %s\n", cfg.Ollama.BaseURL)
 	fmt.Println("Type your message or /help for commands.")
 	fmt.Println()
 	// signal.Notify never blocks when delivering, so the channel is buffered
 	// to avoid dropping a signal that arrives before the select below.
 	interrupts := make(chan os.Signal, 1)
 	signal.Notify(interrupts, syscall.SIGINT, syscall.SIGTERM)
 	// The REPL runs in its own goroutine so the main goroutine stays free to
 	// react to signals; replDone is closed once reading from stdin ends.
 	replDone := make(chan struct{})
 	go func() {
 		stdin := bufio.NewScanner(os.Stdin)
 		// prompt prints the prompt and reports whether another line was read.
 		prompt := func() bool {
 			fmt.Print("> ")
 			return stdin.Scan()
 		}
 		for prompt() {
 			line := strings.TrimSpace(stdin.Text())
 			switch {
 			case line == "":
 				// Nothing typed; prompt again.
 			case strings.HasPrefix(line, "/"):
 				// Slash-prefixed input is a REPL command, not a message.
 				handleCommand(line, k)
 			default:
 				// Everything else goes to the LLM agent through the kernel.
 				reply, err := k.SendMessage("user", "llm", line)
 				if err != nil {
 					fmt.Printf("Error: %v\n", err)
 					break
 				}
 				fmt.Println(reply)
 				fmt.Println()
 			}
 		}
 		if err := stdin.Err(); err != nil {
 			fmt.Fprintf(os.Stderr, "Error reading input: %v\n", err)
 		}
 		close(replDone)
 	}()
 	// Block until a termination signal arrives or the REPL finishes.
 	select {
 	case <-interrupts:
 		fmt.Println("\nShutting down Orca kernel...")
 	case <-replDone:
 		fmt.Println("\nInput closed. Shutting down Orca kernel...")
 	}
 	if err := k.Stop(); err != nil {
 		log.Fatalf("Failed to stop kernel: %v", err)
 	}
 	fmt.Println("Orca kernel shut down gracefully.")
 }
 // handleCommand executes a single REPL command.
 //
 // cmd is the trimmed input line including its leading slash and is matched
 // exactly against the known commands; anything else prints an
 // "Unknown command" hint. k is the running kernel that the informational
 // commands query.
 //
 // "/exit" and "/quit" do not return: they stop the kernel and terminate the
 // process, with status 0 on a clean stop and status 1 if the stop fails.
 func handleCommand(cmd string, k *kernel.Kernel) {
 	switch cmd {
 	case "/help":
 		fmt.Println("Available commands:")
 		fmt.Println("  /help       - Show this help message")
 		fmt.Println("  /exit       - Exit the program")
 		fmt.Println("  /quit       - Exit the program")
 		fmt.Println("  /plugins    - List registered plugins")
 		fmt.Println("  /agents     - List active agents")
 		fmt.Println("  /tools      - List registered tools")
 		fmt.Println("  /skills     - List loaded skills")
 		fmt.Println("  /status     - Show kernel status")
 		fmt.Println()
 		fmt.Println("Any other input is sent to the LLM agent for processing.")
 	case "/exit", "/quit":
 		fmt.Println("Goodbye!")
 		// os.Exit skips main's shutdown path, so stop the kernel here; otherwise
 		// this would be the only exit route that leaves the kernel running.
 		if err := k.Stop(); err != nil {
 			fmt.Fprintf(os.Stderr, "Failed to stop kernel: %v\n", err)
 			os.Exit(1)
 		}
 		os.Exit(0)
 	case "/plugins":
 		plugins := k.ListPlugins()
 		if len(plugins) == 0 {
 			fmt.Println("No plugins registered.")
 			return
 		}
 		fmt.Println("Registered plugins:")
 		for _, p := range plugins {
 			fmt.Printf("  - %s (%s)\n", p.Name(), p.Version())
 		}
 	case "/agents":
 		as := k.ActorSystem()
 		if as == nil {
 			fmt.Println("Actor system not initialized.")
 			return
 		}
 		infos := as.AgentInfos()
 		if len(infos) == 0 {
 			fmt.Println("No agents running.")
 			return
 		}
 		fmt.Println("Active agents:")
 		for _, info := range infos {
 			fmt.Printf("  - %s [%s] (status: %s)\n", info.ID, info.Role, info.Status)
 		}
 	case "/tools":
 		tm := k.ToolManager()
 		if tm == nil {
 			fmt.Println("Tool manager not initialized.")
 			return
 		}
 		tools := tm.List()
 		if len(tools) == 0 {
 			fmt.Println("No tools registered.")
 			return
 		}
 		fmt.Println("Registered tools:")
 		for _, t := range tools {
 			fmt.Printf("  - %s: %s\n", t.Name(), t.Description())
 		}
 	case "/skills":
 		sm := k.SkillManager()
 		if sm == nil {
 			fmt.Println("Skill manager not initialized.")
 			return
 		}
 		skills := sm.ListSkills()
 		if len(skills) == 0 {
 			fmt.Println("No skills loaded.")
 			return
 		}
 		fmt.Println("Loaded skills:")
 		for _, s := range skills {
 			fmt.Printf("  - %s: %s\n", s.Name, s.Description)
 		}
 	case "/status":
 		// Each subsystem line is printed only when that subsystem exists.
 		fmt.Printf("Kernel running: %v\n", k.IsRunning())
 		if tm := k.ToolManager(); tm != nil {
 			fmt.Printf("Tools registered: %d\n", tm.Count())
 		}
 		if as := k.ActorSystem(); as != nil {
 			fmt.Printf("Agents active: %d\n", as.AgentCount())
 		}
 		if sm := k.SkillManager(); sm != nil {
 			fmt.Printf("Skills loaded: %d\n", len(sm.ListSkills()))
 		}
 	default:
 		fmt.Printf("Unknown command: %s\n", cmd)
 		fmt.Println("Type /help for available commands.")
 	}
 }
--- a/go.mod
+++ b/go.mod
@ -0,0 +1,3 @@
 module github.com/orca/orca
 go 1.26.1
--- a/internal/config/config.go
+++ b/internal/config/config.go
@ -0,0 +1,147 @@
 // Package config provides the configuration types for the Orca framework.
 //
 // Configuration is organized into logical groups: LLM (Ollama), sandbox,
 // and session management. Default values are provided for all settings.
 package config
 import (
 	"os"
 	"strconv"
 	"time"
 )
 // Config is the top-level configuration for the Orca framework.
 //
 // It groups the settings into three sections. DefaultConfig returns a fully
 // populated value, LoadConfigFromEnv layers environment overrides on top of
 // it, and IsValid checks the result.
 type Config struct {
 	// Ollama configures the LLM backend (endpoint, model, timeout).
 	Ollama  OllamaConfig  `json:"ollama"`
 	// Sandbox configures sandboxed command execution.
 	Sandbox SandboxConfig `json:"sandbox"`
 	// Session configures session storage and history retention.
 	Session SessionConfig `json:"session"`
 }
 // OllamaConfig holds configuration for the Ollama LLM backend.
 //
 // DefaultConfig supplies a value for every field, LoadConfigFromEnv can
 // override each one from the ORCA_OLLAMA_* environment variables, and
 // Config.IsValid rejects an empty BaseURL or Model and a non-positive Timeout.
 type OllamaConfig struct {
 	// BaseURL is the Ollama API endpoint (e.g., "http://localhost:11434").
 	BaseURL string `json:"base_url"`
 	// Model is the Ollama model name to use (e.g., "gemma4:e4b", "codellama").
 	Model string `json:"model"`
 	// Timeout is the maximum duration to wait for an Ollama response.
 	// time.Duration has no JSON marshaler of its own, so encoding/json
 	// represents this field as an integer count of nanoseconds.
 	Timeout time.Duration `json:"timeout"`
 }
 // SandboxConfig holds configuration for the command execution sandbox.
 //
 // LoadConfigFromEnv can override each field from the ORCA_SANDBOX_*
 // environment variables. Config.IsValid requires Timeout and MaxMemory to be
 // positive; it does not inspect WorkingDir.
 type SandboxConfig struct {
 	// Timeout is the maximum duration for a sandboxed command.
 	// encoding/json represents it as an integer count of nanoseconds.
 	Timeout time.Duration `json:"timeout"`
 	// MaxMemory is the maximum memory allocation for the sandbox (in bytes).
 	MaxMemory int64 `json:"max_memory"`
 	// WorkingDir is the default working directory for sandboxed commands.
 	WorkingDir string `json:"working_dir"`
 }
 // SessionConfig holds configuration for session management.
 //
 // LoadConfigFromEnv can override each field from the ORCA_SESSION_*
 // environment variables. Config.IsValid requires MaxHistory to be positive;
 // it does not inspect StorageDir.
 type SessionConfig struct {
 	// StorageDir is the directory for session JSONL files.
 	// DefaultConfig sets it to ".orca/sessions" under the user's home directory.
 	StorageDir string `json:"storage_dir"`
 	// MaxHistory is the maximum number of messages to retain per session.
 	MaxHistory int `json:"max_history"`
 }
 // DefaultConfig builds a new Config populated with the framework defaults:
 // a local Ollama endpoint with the gemma4:e4b model and a 120s timeout, a
 // sandbox limited to 30s and 512 MB under /tmp/orca/sandbox, and sessions
 // stored under the user's home directory with up to 100 messages each.
 //
 // Every call returns a freshly allocated value, so callers may modify it.
 func DefaultConfig() *Config {
 	// The lookup error is discarded: if the home directory cannot be
 	// determined, home is "" and the storage dir becomes "/.orca/sessions".
 	home, _ := os.UserHomeDir()
 	cfg := new(Config)
 	cfg.Ollama = OllamaConfig{
 		BaseURL: "http://localhost:11434",
 		Model:   "gemma4:e4b",
 		Timeout: 120 * time.Second,
 	}
 	cfg.Sandbox = SandboxConfig{
 		Timeout:    30 * time.Second,
 		MaxMemory:  512 * 1024 * 1024, // 512 MB
 		WorkingDir: "/tmp/orca/sandbox",
 	}
 	cfg.Session = SessionConfig{
 		StorageDir: home + "/.orca/sessions",
 		MaxHistory: 100,
 	}
 	return cfg
 }
 // LoadConfigFromEnv returns DefaultConfig with each setting replaced by its
 // ORCA_* environment variable when that variable is set to a non-empty value.
 //
 // Numeric and duration variables that fail to parse are ignored, leaving the
 // default in place. No validation is performed here; use Config.IsValid.
 func LoadConfigFromEnv() *Config {
 	cfg := DefaultConfig()
 	// overrideString copies a non-empty environment value into dst.
 	overrideString := func(key string, dst *string) {
 		if value := os.Getenv(key); value != "" {
 			*dst = value
 		}
 	}
 	// overrideDuration stores the variable in dst only when it is set and
 	// parses as a Go duration (e.g. "60s").
 	overrideDuration := func(key string, dst *time.Duration) {
 		value := os.Getenv(key)
 		if value == "" {
 			return
 		}
 		if parsed, err := time.ParseDuration(value); err == nil {
 			*dst = parsed
 		}
 	}
 	overrideString("ORCA_OLLAMA_BASE_URL", &cfg.Ollama.BaseURL)
 	overrideString("ORCA_OLLAMA_MODEL", &cfg.Ollama.Model)
 	overrideDuration("ORCA_OLLAMA_TIMEOUT", &cfg.Ollama.Timeout)
 	overrideDuration("ORCA_SANDBOX_TIMEOUT", &cfg.Sandbox.Timeout)
 	// MaxMemory is a base-10 byte count.
 	if value := os.Getenv("ORCA_SANDBOX_MAX_MEMORY"); value != "" {
 		if bytes, err := strconv.ParseInt(value, 10, 64); err == nil {
 			cfg.Sandbox.MaxMemory = bytes
 		}
 	}
 	overrideString("ORCA_SANDBOX_WORKING_DIR", &cfg.Sandbox.WorkingDir)
 	overrideString("ORCA_SESSION_STORAGE_DIR", &cfg.Session.StorageDir)
 	if value := os.Getenv("ORCA_SESSION_MAX_HISTORY"); value != "" {
 		if count, err := strconv.Atoi(value); err == nil {
 			cfg.Session.MaxHistory = count
 		}
 	}
 	return cfg
 }
 // IsValid reports the first problem found in the configuration, or nil when
 // every checked setting is acceptable.
 //
 // The checks run in a fixed order: Ollama base URL, model and timeout, then
 // sandbox timeout and memory limit, then session history size. A failure is
 // returned as a *ConfigError naming the offending setting.
 func (c *Config) IsValid() error {
 	switch {
 	case c.Ollama.BaseURL == "":
 		return errConfig("ollama.base_url must not be empty")
 	case c.Ollama.Model == "":
 		return errConfig("ollama.model must not be empty")
 	case c.Ollama.Timeout <= 0:
 		return errConfig("ollama.timeout must be positive")
 	case c.Sandbox.Timeout <= 0:
 		return errConfig("sandbox.timeout must be positive")
 	case c.Sandbox.MaxMemory <= 0:
 		return errConfig("sandbox.max_memory must be positive")
 	case c.Session.MaxHistory <= 0:
 		return errConfig("session.max_history must be positive")
 	}
 	return nil
 }
 // ConfigError describes why a configuration failed validation.
 type ConfigError struct {
 	// Message is the human-readable reason, without the "config: " prefix.
 	Message string
 }
 // Error implements the error interface, prefixing Message with "config: ".
 func (e *ConfigError) Error() string {
 	const prefix = "config: "
 	return prefix + e.Message
 }
 // errConfig wraps msg in a *ConfigError and returns it as an error.
 func errConfig(msg string) error {
 	failure := new(ConfigError)
 	failure.Message = msg
 	return failure
 }
--- a/internal/config/config_test.go
+++ b/internal/config/config_test.go
@ -0,0 +1,221 @@
 package config
 import (
 	"os"
 	"testing"
 	"time"
 )
 // TestDefaultConfig pins every default value returned by DefaultConfig.
 func TestDefaultConfig(t *testing.T) {
 	cfg := DefaultConfig()
 	if cfg == nil {
 		t.Fatal("DefaultConfig() returned nil")
 	}
 	// Ollama section.
 	ollama := cfg.Ollama
 	if got := ollama.BaseURL; got != "http://localhost:11434" {
 		t.Errorf("expected default Ollama BaseURL 'http://localhost:11434', got %q", got)
 	}
 	if got := ollama.Model; got != "gemma4:e4b" {
 		t.Errorf("expected default Ollama Model 'gemma4:e4b', got %q", got)
 	}
 	if got := ollama.Timeout; got != 120*time.Second {
 		t.Errorf("expected default Ollama Timeout 120s, got %v", got)
 	}
 	// Sandbox section.
 	sandbox := cfg.Sandbox
 	if got := sandbox.Timeout; got != 30*time.Second {
 		t.Errorf("expected default Sandbox Timeout 30s, got %v", got)
 	}
 	if got := sandbox.MaxMemory; got != 512*1024*1024 {
 		t.Errorf("expected default Sandbox MaxMemory 512MB, got %d", got)
 	}
 	if got := sandbox.WorkingDir; got != "/tmp/orca/sandbox" {
 		t.Errorf("expected default Sandbox WorkingDir '/tmp/orca/sandbox', got %q", got)
 	}
 	// Session section; the exact StorageDir is covered by its own test.
 	session := cfg.Session
 	if got := session.MaxHistory; got != 100 {
 		t.Errorf("expected default Session MaxHistory 100, got %d", got)
 	}
 	if session.StorageDir == "" {
 		t.Error("expected non-empty Session StorageDir")
 	}
 }
 // TestDefaultConfigStorageDir checks that the default session directory is
 // ".orca/sessions" appended to the user's home directory.
 func TestDefaultConfigStorageDir(t *testing.T) {
 	// Mirror DefaultConfig: the lookup error is ignored on both sides.
 	home, _ := os.UserHomeDir()
 	want := home + "/.orca/sessions"
 	got := DefaultConfig().Session.StorageDir
 	if got != want {
 		t.Errorf("expected StorageDir %q, got %q", want, got)
 	}
 }
 func TestLoadConfigFromEnv(t *testing.T) {
 	// Set environment variables
 	os.Setenv("ORCA_OLLAMA_BASE_URL", "http://custom:11434")
 	os.Setenv("ORCA_OLLAMA_MODEL", "codellama")
 	os.Setenv("ORCA_OLLAMA_TIMEOUT", "60s")
 	os.Setenv("ORCA_SANDBOX_TIMEOUT", "120s")
 	os.Setenv("ORCA_SANDBOX_MAX_MEMORY", "1073741824")
 	os.Setenv("ORCA_SANDBOX_WORKING_DIR", "/custom/sandbox")
 	os.Setenv("ORCA_SESSION_STORAGE_DIR", "/custom/sessions")
 	os.Setenv("ORCA_SESSION_MAX_HISTORY", "200")
 	defer func() {
 		os.Unsetenv("ORCA_OLLAMA_BASE_URL")
 		os.Unsetenv("ORCA_OLLAMA_MODEL")
 		os.Unsetenv("ORCA_OLLAMA_TIMEOUT")
 		os.Unsetenv("ORCA_SANDBOX_TIMEOUT")
 		os.Unsetenv("ORCA_SANDBOX_MAX_MEMORY")
 		os.Unsetenv("ORCA_SANDBOX_WORKING_DIR")
 		os.Unsetenv("ORCA_SESSION_STORAGE_DIR")
 		os.Unsetenv("ORCA_SESSION_MAX_HISTORY")
 	}()
 	cfg := LoadConfigFromEnv()
 	if cfg.Ollama.BaseURL != "http://custom:11434" {
 		t.Errorf("expected Ollama BaseURL 'http://custom:11434', got %q", cfg.Ollama.BaseURL)
 	}
 	if cfg.Ollama.Model != "codellama" {
 		t.Errorf("expected Ollama Model 'codellama', got %q", cfg.Ollama.Model)
 	}
 	if cfg.Ollama.Timeout != 60*time.Second {
 		t.Errorf("expected Ollama Timeout 60s, got %v", cfg.Ollama.Timeout)
 	}
 	if cfg.Sandbox.Timeout != 120*time.Second {
 		t.Errorf("expected Sandbox Timeout 120s, got %v", cfg.Sandbox.Timeout)
 	}
 	if cfg.Sandbox.MaxMemory != 1073741824 {
 		t.Errorf("expected Sandbox MaxMemory 1073741824, got %d", cfg.Sandbox.MaxMemory)
 	}
 	if cfg.Sandbox.WorkingDir != "/custom/sandbox" {
 		t.Errorf("expected Sandbox WorkingDir '/custom/sandbox', got %q", cfg.Sandbox.WorkingDir)
 	}
 	if cfg.Session.StorageDir != "/custom/sessions" {
 		t.Errorf("expected Session StorageDir '/custom/sessions', got %q", cfg.Session.StorageDir)
 	}
 	if cfg.Session.MaxHistory != 200 {
 		t.Errorf("expected Session MaxHistory 200, got %d", cfg.Session.MaxHistory)
 	}
 }
 func TestLoadConfigFromEnvPartial(t *testing.T) {
 	os.Setenv("ORCA_OLLAMA_MODEL", "mistral")
 	defer os.Unsetenv("ORCA_OLLAMA_MODEL")
 	cfg := LoadConfigFromEnv()
 	// Should use env override
 	if cfg.Ollama.Model != "mistral" {
 		t.Errorf("expected Model 'mistral', got %q", cfg.Ollama.Model)
 	}
 	// Should keep defaults for unset values
 	if cfg.Ollama.BaseURL != "http://localhost:11434" {
 		t.Errorf("expected default BaseURL, got %q", cfg.Ollama.BaseURL)
 	}
 }
 // TestConfigIsValid checks that the defaults pass validation.
 func TestConfigIsValid(t *testing.T) {
 	err := DefaultConfig().IsValid()
 	if err != nil {
 		t.Errorf("default config should be valid: %v", err)
 	}
 }
 // TestConfigInvalidBaseURL checks that an empty Ollama base URL is rejected.
 func TestConfigInvalidBaseURL(t *testing.T) {
 	broken := DefaultConfig()
 	broken.Ollama.BaseURL = ""
 	if broken.IsValid() == nil {
 		t.Error("expected error for empty BaseURL")
 	}
 }
 // TestConfigInvalidModel checks that an empty Ollama model name is rejected.
 func TestConfigInvalidModel(t *testing.T) {
 	broken := DefaultConfig()
 	broken.Ollama.Model = ""
 	if broken.IsValid() == nil {
 		t.Error("expected error for empty Model")
 	}
 }
 // TestConfigInvalidOllamaTimeout checks that a zero Ollama timeout is rejected.
 func TestConfigInvalidOllamaTimeout(t *testing.T) {
 	broken := DefaultConfig()
 	broken.Ollama.Timeout = 0
 	if broken.IsValid() == nil {
 		t.Error("expected error for zero Ollama Timeout")
 	}
 }
 // TestConfigInvalidSandboxTimeout checks that a negative sandbox timeout is
 // rejected.
 func TestConfigInvalidSandboxTimeout(t *testing.T) {
 	broken := DefaultConfig()
 	broken.Sandbox.Timeout = -1
 	if broken.IsValid() == nil {
 		t.Error("expected error for negative Sandbox Timeout")
 	}
 }
 // TestConfigInvalidMaxMemory checks that a zero sandbox memory limit is
 // rejected.
 func TestConfigInvalidMaxMemory(t *testing.T) {
 	broken := DefaultConfig()
 	broken.Sandbox.MaxMemory = 0
 	if broken.IsValid() == nil {
 		t.Error("expected error for zero MaxMemory")
 	}
 }
 // TestConfigInvalidMaxHistory checks that a zero session history size is
 // rejected.
 func TestConfigInvalidMaxHistory(t *testing.T) {
 	broken := DefaultConfig()
 	broken.Session.MaxHistory = 0
 	if broken.IsValid() == nil {
 		t.Error("expected error for zero MaxHistory")
 	}
 }
 // TestConfigError checks the message format and concrete type produced by
 // errConfig.
 func TestConfigError(t *testing.T) {
 	err := errConfig("test error")
 	if msg := err.Error(); msg != "config: test error" {
 		t.Errorf("unexpected error message: %s", msg)
 	}
 	typed, isConfigError := err.(*ConfigError)
 	if !isConfigError {
 		t.Fatal("expected ConfigError type")
 	}
 	if got := typed.Message; got != "test error" {
 		t.Errorf("expected Message 'test error', got %q", got)
 	}
 }
 func TestLoadConfigFromEnvInvalidTimeout(t *testing.T) {
 	os.Setenv("ORCA_OLLAMA_TIMEOUT", "not-a-duration")
 	defer os.Unsetenv("ORCA_OLLAMA_TIMEOUT")
 	cfg := LoadConfigFromEnv()
 	// Should keep default when env var is unparseable
 	if cfg.Ollama.Timeout != 120*time.Second {
 		t.Errorf("expected default 120s when env is invalid, got %v", cfg.Ollama.Timeout)
 	}
 }
 func TestLoadConfigFromEnvInvalidMaxMemory(t *testing.T) {
 	os.Setenv("ORCA_SANDBOX_MAX_MEMORY", "not-a-number")
 	defer os.Unsetenv("ORCA_SANDBOX_MAX_MEMORY")
 	cfg := LoadConfigFromEnv()
 	// Should keep default when env var is unparseable
 	if cfg.Sandbox.MaxMemory != 512*1024*1024 {
 		t.Errorf("expected default MaxMemory when env is invalid, got %d", cfg.Sandbox.MaxMemory)
 	}
 }
 func TestLoadConfigFromEnvInvalidMaxHistory(t *testing.T) {
 	os.Setenv("ORCA_SESSION_MAX_HISTORY", "not-a-number")
 	defer os.Unsetenv("ORCA_SESSION_MAX_HISTORY")
 	cfg := LoadConfigFromEnv()
 	if cfg.Session.MaxHistory != 100 {
 		t.Errorf("expected default MaxHistory when env is invalid, got %d", cfg.Session.MaxHistory)
 	}
 }
--- a/pkg/actor/actor.go
+++ b/pkg/actor/actor.go
@ -0,0 +1,220 @@
 // Package actor implements the Actor model for the Orca framework.
 //
 // An Agent is an independent goroutine that communicates via channels.
 // Each agent has a state machine: Idle -> Processing -> [ToolCall] ->
 // WaitingForTool -> Processing -> Completed.
 package actor
 import (
 	"context"
 	"fmt"
 	"sync"
 	"sync/atomic"
 	"github.com/orca/orca/pkg/bus"
 )
 // ActorStatus enumerates the states of an agent's state machine.
 type ActorStatus int
 // Agent states, numbered from zero in declaration order.
 const (
 	// StatusIdle means the agent is ready to accept messages.
 	StatusIdle ActorStatus = iota
 	// StatusProcessing means the agent is actively handling a message.
 	StatusProcessing
 	// StatusWaitingForTool means the agent has called a tool and is awaiting its result.
 	StatusWaitingForTool
 	// StatusCompleted means the agent has finished processing the last message.
 	StatusCompleted
 	// StatusStopped means the agent has been shut down.
 	StatusStopped
 )
 // String returns the lower-case name of the status, or "unknown" for a value
 // outside the declared range.
 func (s ActorStatus) String() string {
 	labels := [...]string{
 		StatusIdle:           "idle",
 		StatusProcessing:     "processing",
 		StatusWaitingForTool: "waiting_for_tool",
 		StatusCompleted:      "completed",
 		StatusStopped:        "stopped",
 	}
 	if s < StatusIdle || s > StatusStopped {
 		return "unknown"
 	}
 	return labels[s]
 }
 // Agent is the interface that all actors in the Orca framework must implement.
 //
 // Each Agent runs as an independent goroutine processing messages
 // through an internal channel. The Process method provides a synchronous
 // API to submit messages and await responses.
 //
 // BaseAgent in this package provides all four methods, so concrete agents
 // that embed it satisfy the interface.
 type Agent interface {
 	// ID returns the unique identifier for this agent.
 	ID() string
 	// Role returns the role/type of this agent (e.g., "orchestrator", "worker").
 	Role() string
 	// Process sends a message to this agent and waits for a response.
 	// This is a synchronous call; the agent's goroutine handles the message.
 	// ctx bounds how long the caller is willing to wait.
 	Process(ctx context.Context, msg bus.Message) (bus.Message, error)
 	// Stop gracefully shuts down this agent, waiting for in-flight processing to complete.
 	Stop() error
 }
 // agentRequest wraps a message and provides a response channel.
 //
 // Process builds one per call and queues it on BaseAgent.msgCh; the loop
 // goroutine hands ctx and msg to the handler and replies on resp.
 type agentRequest struct {
 	// ctx is the caller's context, passed through to the handler.
 	ctx  context.Context
 	// msg is the message to process.
 	msg  bus.Message
 	// resp receives exactly one agentResponse. Process creates it with a
 	// buffer of one, so the loop's send does not block if the caller has
 	// already given up.
 	resp chan agentResponse
 }
 // agentResponse wraps the result of processing a message.
 //
 // It carries the handler's two return values back to Process unchanged.
 type agentResponse struct {
 	// msg is the message returned by the handler.
 	msg bus.Message
 	// err is the error returned by the handler, or nil.
 	err error
 }
 // BaseAgent provides shared infrastructure for all agent implementations.
 //
 // It manages the message channel, goroutine lifecycle, and status tracking.
 // Concrete agents should embed BaseAgent and set a handler via SetHandler.
 //
 // A BaseAgent contains a mutex and a WaitGroup and must not be copied; use
 // the pointer returned by NewBaseAgent.
 type BaseAgent struct {
 	// id and role are fixed at construction and returned by ID and Role.
 	id      string
 	role    string
 	// msgCh queues requests from Process for the loop goroutine.
 	msgCh   chan agentRequest
 	// stopCh is closed by Stop to tell the loop goroutine to exit.
 	stopCh  chan struct{}
 	// status holds the current ActorStatus; see Status and setStatus.
 	status  atomic.Value
 	// wg tracks the loop goroutine so Stop can wait for it to finish.
 	wg      sync.WaitGroup
 	// mu guards started, and handler while it is being set or checked.
 	mu      sync.Mutex
 	// started reports whether Start has succeeded and Stop has not yet run.
 	started bool
 	// handler processes each message; Start refuses to run without one.
 	handler func(context.Context, bus.Message) (bus.Message, error)
 }
 // NewBaseAgent returns an idle, not-yet-started BaseAgent with the given id
 // and role. Call SetHandler and then Start before sending it messages.
 func NewBaseAgent(id, role string) *BaseAgent {
 	// mailboxSize is how many requests can queue before Process blocks.
 	const mailboxSize = 64
 	agent := new(BaseAgent)
 	agent.id, agent.role = id, role
 	agent.msgCh = make(chan agentRequest, mailboxSize)
 	agent.stopCh = make(chan struct{})
 	agent.status.Store(StatusIdle)
 	return agent
 }
 // ID returns the agent's unique identifier, as passed to NewBaseAgent.
 // The value never changes, so no locking is involved.
 func (a *BaseAgent) ID() string { return a.id }
 // Role returns the agent's role, as passed to NewBaseAgent.
 // The value never changes, so no locking is involved.
 func (a *BaseAgent) Role() string { return a.role }
 // Status reports the agent's current ActorStatus. If no status has been
 // stored yet it reports StatusIdle, the zero value.
 func (a *BaseAgent) Status() ActorStatus {
 	if current, ok := a.status.Load().(ActorStatus); ok {
 		return current
 	}
 	return StatusIdle
 }
 // setStatus atomically updates the agent's status.
 // The value is later read back by Status.
 func (a *BaseAgent) setStatus(s ActorStatus) {
 	a.status.Store(s)
 }
 // SetHandler installs the function that processes each incoming message.
 // It must be called before Start, which refuses to run without a handler.
 func (a *BaseAgent) SetHandler(handler func(context.Context, bus.Message) (bus.Message, error)) {
 	a.mu.Lock()
 	a.handler = handler
 	a.mu.Unlock()
 }
 // Start launches the agent's message processing goroutine.
 //
 // The handler must be set via SetHandler before calling Start. Start returns
 // an error when the agent is already started, when it has been stopped
 // before, or when no handler is set.
 //
 // A stopped agent cannot be restarted: Stop closes stopCh for good, so a new
 // loop would exit immediately while IsStarted still reported true, and the
 // following Stop would close stopCh a second time and panic.
 func (a *BaseAgent) Start() error {
 	a.mu.Lock()
 	defer a.mu.Unlock()
 	if a.started {
 		return fmt.Errorf("agent %s is already started", a.id)
 	}
 	// Non-blocking probe: receiving succeeds only once stopCh has been closed.
 	select {
 	case <-a.stopCh:
 		return fmt.Errorf("agent %s has been stopped and cannot be restarted", a.id)
 	default:
 	}
 	if a.handler == nil {
 		return fmt.Errorf("agent %s has no handler set", a.id)
 	}
 	a.started = true
 	a.setStatus(StatusIdle)
 	// Register the loop goroutine before launching it so Stop can wait on it.
 	a.wg.Add(1)
 	go a.loop()
 	return nil
 }
 // loop is the agent's goroutine body. It handles one queued request at a
 // time until stopCh is closed, then marks the agent stopped and returns.
 //
 // While a request is being handled the status is StatusProcessing;
 // afterwards it is StatusCompleted on success or StatusIdle on error. The
 // status is updated before the response is sent back to the caller.
 func (a *BaseAgent) loop() {
 	defer a.wg.Done()
 	for {
 		select {
 		case <-a.stopCh:
 			a.setStatus(StatusStopped)
 			return
 		case req := <-a.msgCh:
 			a.setStatus(StatusProcessing)
 			reply, err := a.handler(req.ctx, req.msg)
 			outcome := StatusCompleted
 			if err != nil {
 				outcome = StatusIdle
 			}
 			a.setStatus(outcome)
 			req.resp <- agentResponse{msg: reply, err: err}
 		}
 	}
 }
 // Process sends a message to the agent's processing loop and waits for the
 // handler's response.
 //
 // It returns the handler's message and error. It returns ctx.Err() if ctx is
 // done first, and an "agent ... is stopped" error if the agent was stopped
 // before the request could be handled. A request already being handled when
 // Stop is called still delivers its response.
 func (a *BaseAgent) Process(ctx context.Context, msg bus.Message) (bus.Message, error) {
 	// Reject up front when already stopped. Without this the select below has
 	// two ready cases on a stopped agent (the buffered msgCh still accepts
 	// sends) and picks one at random, so the request could be queued for a
 	// loop that no longer exists.
 	select {
 	case <-a.stopCh:
 		return bus.Message{}, fmt.Errorf("agent %s is stopped", a.id)
 	default:
 	}
 	respCh := make(chan agentResponse, 1)
 	select {
 	case a.msgCh <- agentRequest{ctx: ctx, msg: msg, resp: respCh}:
 	case <-ctx.Done():
 		return bus.Message{}, ctx.Err()
 	case <-a.stopCh:
 		return bus.Message{}, fmt.Errorf("agent %s is stopped", a.id)
 	}
 	select {
 	case r := <-respCh:
 		return r.msg, r.err
 	case <-ctx.Done():
 		return bus.Message{}, ctx.Err()
 	case <-a.stopCh:
 		// Shutdown began while waiting; fall through to find out whether the
 		// loop still answers this request.
 	}
 	// The loop may be in the middle of a handler (possibly ours), so wait for
 	// it to exit while still honoring ctx. stopCh is only closed after a
 	// successful Start, so the WaitGroup is guaranteed to reach zero once the
 	// in-flight handler returns; the helper goroutine ends at that point.
 	loopExited := make(chan struct{})
 	go func() {
 		a.wg.Wait()
 		close(loopExited)
 	}()
 	select {
 	case r := <-respCh:
 		return r.msg, r.err
 	case <-ctx.Done():
 		return bus.Message{}, ctx.Err()
 	case <-loopExited:
 	}
 	// The loop is gone: a response is either already buffered or never coming.
 	select {
 	case r := <-respCh:
 		return r.msg, r.err
 	default:
 		return bus.Message{}, fmt.Errorf("agent %s is stopped", a.id)
 	}
 }
 // Stop shuts the agent down: it signals the processing loop to exit and
 // blocks until the loop goroutine has returned. Calling Stop on an agent
 // that is not started does nothing. It always returns nil.
 func (a *BaseAgent) Stop() error {
 	// Flip the flag under the lock so that only one caller sees it set.
 	a.mu.Lock()
 	wasRunning := a.started
 	a.started = false
 	a.mu.Unlock()
 	if wasRunning {
 		close(a.stopCh)
 		a.wg.Wait()
 	}
 	return nil
 }
 // IsStarted reports whether Start has succeeded and Stop has not been
 // called since.
 func (a *BaseAgent) IsStarted() bool {
 	a.mu.Lock()
 	running := a.started
 	a.mu.Unlock()
 	return running
 }
--- a/pkg/actor/actor_test.go
+++ b/pkg/actor/actor_test.go
@ -0,0 +1,697 @@
 package actor
 import (
 	"context"
 	"errors"
 	"sync/atomic"
 	"testing"
 	"time"
 	"github.com/orca/orca/pkg/bus"
 )
 // ============================================================
 // BaseAgent Tests
 // ============================================================
 // TestNewBaseAgent checks the identity and initial status of a new agent.
 func TestNewBaseAgent(t *testing.T) {
 	agent := NewBaseAgent("test-1", "worker")
 	if agent == nil {
 		t.Fatal("NewBaseAgent() returned nil")
 	}
 	if id := agent.ID(); id != "test-1" {
 		t.Errorf("expected id 'test-1', got %q", id)
 	}
 	if role := agent.Role(); role != "worker" {
 		t.Errorf("expected role 'worker', got %q", role)
 	}
 	status := agent.Status()
 	if status != StatusIdle {
 		t.Errorf("expected initial StatusIdle, got %s", status)
 	}
 }
 // TestBaseAgentStartAndStop checks that IsStarted follows Start and Stop.
 func TestBaseAgentStartAndStop(t *testing.T) {
 	agent := NewBaseAgent("test-2", "worker")
 	reply := func(ctx context.Context, msg bus.Message) (bus.Message, error) {
 		return bus.Message{ID: "response"}, nil
 	}
 	agent.SetHandler(reply)
 	err := agent.Start()
 	if err != nil {
 		t.Fatalf("Start failed: %v", err)
 	}
 	if started := agent.IsStarted(); !started {
 		t.Error("expected agent to be started")
 	}
 	err = agent.Stop()
 	if err != nil {
 		t.Fatalf("Stop failed: %v", err)
 	}
 	if started := agent.IsStarted(); started {
 		t.Error("expected agent to be stopped after Stop()")
 	}
 }
 // TestBaseAgentDoubleStart checks that a second Start on a running agent
 // fails.
 func TestBaseAgentDoubleStart(t *testing.T) {
 	agent := NewBaseAgent("test-3", "worker")
 	reply := func(ctx context.Context, msg bus.Message) (bus.Message, error) {
 		return bus.Message{ID: "response"}, nil
 	}
 	agent.SetHandler(reply)
 	first := agent.Start()
 	if first != nil {
 		t.Fatalf("first Start failed: %v", first)
 	}
 	if second := agent.Start(); second == nil {
 		t.Error("expected error on double start")
 	}
 	agent.Stop()
 }
 // TestBaseAgentStartWithoutHandler checks that Start refuses to run an
 // agent that has no handler.
 func TestBaseAgentStartWithoutHandler(t *testing.T) {
 	agent := NewBaseAgent("test-4", "worker")
 	if agent.Start() == nil {
 		t.Error("expected error starting agent without handler")
 	}
 }
 // TestBaseAgentProcessAndResponse checks that Process returns exactly the
 // message built by the handler.
 func TestBaseAgentProcessAndResponse(t *testing.T) {
 	a := NewBaseAgent("test-5", "worker")
 	// The handler derives its reply from the request so the test can tell
 	// that the request really reached it.
 	a.SetHandler(func(ctx context.Context, in bus.Message) (bus.Message, error) {
 		out := bus.Message{
 			ID:      in.ID + "-resp",
 			Type:    bus.MsgTypeTaskResponse,
 			From:    a.ID(),
 			To:      in.From,
 			Content: "processed: " + in.ID,
 		}
 		return out, nil
 	})
 	a.Start()
 	defer a.Stop()
 	request := bus.Message{
 		ID:   "task-1",
 		Type: bus.MsgTypeTaskRequest,
 		From: "caller",
 	}
 	reply, err := a.Process(context.Background(), request)
 	if err != nil {
 		t.Fatalf("Process failed: %v", err)
 	}
 	if reply.ID != "task-1-resp" {
 		t.Errorf("expected response ID 'task-1-resp', got %q", reply.ID)
 	}
 	if reply.Content != "processed: task-1" {
 		t.Errorf("expected content 'processed: task-1', got %v", reply.Content)
 	}
 	if reply.From != "test-5" {
 		t.Errorf("expected From 'test-5', got %q", reply.From)
 	}
 }
 // TestBaseAgentProcessReturnsError checks that a handler error is passed
 // back to the Process caller.
 func TestBaseAgentProcessReturnsError(t *testing.T) {
 	wantErr := errors.New("processing failed")
 	agent := NewBaseAgent("test-6", "worker")
 	failing := func(ctx context.Context, msg bus.Message) (bus.Message, error) {
 		return bus.Message{}, wantErr
 	}
 	agent.SetHandler(failing)
 	agent.Start()
 	defer agent.Stop()
 	_, gotErr := agent.Process(context.Background(), bus.Message{ID: "task-1"})
 	if gotErr == nil {
 		t.Fatal("expected error from Process")
 	}
 	if !errors.Is(gotErr, wantErr) {
 		t.Errorf("expected error %v, got %v", wantErr, gotErr)
 	}
 }
 // TestBaseAgentProcessOnStoppedAgent checks that Process on an agent that
 // has already been stopped fails promptly instead of waiting for a response
 // that can never arrive.
 func TestBaseAgentProcessOnStoppedAgent(t *testing.T) {
 	a := NewBaseAgent("test-7", "worker")
 	a.SetHandler(func(ctx context.Context, msg bus.Message) (bus.Message, error) {
 		return bus.Message{ID: "response"}, nil
 	})
 	if err := a.Start(); err != nil {
 		t.Fatalf("Start failed: %v", err)
 	}
 	if err := a.Stop(); err != nil {
 		t.Fatalf("Stop failed: %v", err)
 	}
 	// Bound the call: with context.Background() a Process that wrongly queued
 	// the request would block forever and hang the whole test binary.
 	ctx, cancel := context.WithTimeout(context.Background(), 2*time.Second)
 	defer cancel()
 	_, err := a.Process(ctx, bus.Message{ID: "task-1"})
 	if err == nil {
 		t.Fatal("expected error processing on stopped agent")
 	}
 	// A deadline error means Process blocked rather than noticing the stop.
 	if errors.Is(err, context.DeadlineExceeded) {
 		t.Errorf("Process blocked on a stopped agent until the deadline: %v", err)
 	}
 }
 // TestBaseAgentContextCancellation checks that Process returns an error
 // when the caller's context expires before the handler finishes.
 func TestBaseAgentContextCancellation(t *testing.T) {
 	agent := NewBaseAgent("test-8", "worker")
 	// slow waits for five seconds unless the context ends first.
 	slow := func(ctx context.Context, msg bus.Message) (bus.Message, error) {
 		select {
 		case <-ctx.Done():
 			return bus.Message{}, ctx.Err()
 		case <-time.After(5 * time.Second):
 			return bus.Message{ID: "response"}, nil
 		}
 	}
 	agent.SetHandler(slow)
 	agent.Start()
 	defer agent.Stop()
 	shortCtx, cancel := context.WithTimeout(context.Background(), 10*time.Millisecond)
 	defer cancel()
 	if _, err := agent.Process(shortCtx, bus.Message{ID: "task-1"}); err == nil {
 		t.Error("expected error from context cancellation")
 	}
 }
 // TestBaseAgentStatusTransitions follows the status through one successful
 // request: idle before, processing inside the handler, completed after.
 func TestBaseAgentStatusTransitions(t *testing.T) {
 	agent := NewBaseAgent("test-9", "worker")
 	agent.SetHandler(func(ctx context.Context, msg bus.Message) (bus.Message, error) {
 		// t.Errorf (unlike t.Fatal) may be called from another goroutine.
 		if agent.Status() != StatusProcessing {
 			t.Errorf("expected StatusProcessing inside handler, got %s", agent.Status())
 		}
 		return bus.Message{ID: "response"}, nil
 	})
 	agent.Start()
 	defer agent.Stop()
 	// Nothing has been submitted yet.
 	if before := agent.Status(); before != StatusIdle {
 		t.Errorf("expected StatusIdle before Process, got %s", before)
 	}
 	if _, err := agent.Process(context.Background(), bus.Message{ID: "task-1"}); err != nil {
 		t.Fatalf("Process failed: %v", err)
 	}
 	// Give the agent goroutine a moment before sampling the final status.
 	time.Sleep(5 * time.Millisecond)
 	if after := agent.Status(); after != StatusCompleted {
 		t.Errorf("expected StatusCompleted after Process, got %s", after)
 	}
 }
 // TestBaseAgentConcurrentProcess submits requests from several goroutines
 // at once and checks that each one is handled exactly once.
 func TestBaseAgentConcurrentProcess(t *testing.T) {
 	const callers = 10
 	a := NewBaseAgent("test-10", "worker")
 	var counter int32
 	a.SetHandler(func(ctx context.Context, msg bus.Message) (bus.Message, error) {
 		atomic.AddInt32(&counter, 1)
 		return bus.Message{ID: "response"}, nil
 	})
 	if err := a.Start(); err != nil {
 		t.Fatalf("Start failed: %v", err)
 	}
 	defer a.Stop()
 	// Each caller reports its result on this channel, so the test waits for
 	// the calls themselves instead of sleeping for a fixed time and hoping
 	// they have finished. The buffer lets callers return even after a timeout.
 	results := make(chan error, callers)
 	for i := 0; i < callers; i++ {
 		go func() {
 			_, err := a.Process(context.Background(), bus.Message{ID: "task"})
 			results <- err
 		}()
 	}
 	deadline := time.After(5 * time.Second)
 	completed := 0
 	for i := 0; i < callers; i++ {
 		select {
 		case err := <-results:
 			if err == nil {
 				completed++
 			}
 		case <-deadline:
 			t.Fatalf("timed out waiting for Process calls: %d of %d returned", i, callers)
 		}
 	}
 	if completed != callers {
 		t.Errorf("expected 10 completed tasks, got %d", completed)
 	}
 	if n := atomic.LoadInt32(&counter); n != callers {
 		t.Errorf("expected 10 handler calls, got %d", n)
 	}
 }
 // TestBaseAgentStopIdempotent checks that calling Stop twice is harmless.
 func TestBaseAgentStopIdempotent(t *testing.T) {
 	agent := NewBaseAgent("test-11", "worker")
 	reply := func(ctx context.Context, msg bus.Message) (bus.Message, error) {
 		return bus.Message{ID: "response"}, nil
 	}
 	agent.SetHandler(reply)
 	agent.Start()
 	first := agent.Stop()
 	if first != nil {
 		t.Fatalf("first Stop failed: %v", first)
 	}
 	second := agent.Stop()
 	if second != nil {
 		t.Fatalf("second Stop should be idempotent: %v", second)
 	}
 }
 // TestActorStatusString checks the name of every declared status and the
 // fallback for an undeclared value.
 func TestActorStatusString(t *testing.T) {
 	type statusCase struct {
 		in   ActorStatus
 		name string
 	}
 	cases := []statusCase{
 		{in: StatusIdle, name: "idle"},
 		{in: StatusProcessing, name: "processing"},
 		{in: StatusWaitingForTool, name: "waiting_for_tool"},
 		{in: StatusCompleted, name: "completed"},
 		{in: StatusStopped, name: "stopped"},
 		{in: ActorStatus(99), name: "unknown"},
 	}
 	for i := range cases {
 		c := cases[i]
 		got := c.in.String()
 		if got != c.name {
 			t.Errorf("ActorStatus(%d).String() = %q, want %q", c.in, got, c.name)
 		}
 	}
 }
 // ============================================================
 // Worker Tests
 // ============================================================
 // TestNewWorker checks the identity of a new worker and that it comes back
 // from NewWorker already started.
 func TestNewWorker(t *testing.T) {
 	worker := NewWorker("worker-1")
 	if worker == nil {
 		t.Fatal("NewWorker() returned nil")
 	}
 	if id := worker.ID(); id != "worker-1" {
 		t.Errorf("expected id 'worker-1', got %q", id)
 	}
 	if role := worker.Role(); role != "worker" {
 		t.Errorf("expected role 'worker', got %q", role)
 	}
 	if running := worker.IsStarted(); !running {
 		t.Error("expected worker to be started automatically")
 	}
 	worker.Stop()
 }
 // TestWorkerProcessTask sends a task request to a worker and checks the
 // type, sender and metadata of the reply.
 func TestWorkerProcessTask(t *testing.T) {
 	worker := NewWorker("worker-2")
 	defer worker.Stop()
 	task := bus.Message{
 		ID:      "task-1",
 		Type:    bus.MsgTypeTaskRequest,
 		From:    "caller",
 		Content: "do something",
 	}
 	reply, err := worker.Process(context.Background(), task)
 	if err != nil {
 		t.Fatalf("Process failed: %v", err)
 	}
 	if reply.Type != bus.MsgTypeTaskResponse {
 		t.Errorf("expected MsgTypeTaskResponse, got %s", reply.Type)
 	}
 	if reply.From != "worker-2" {
 		t.Errorf("expected From 'worker-2', got %q", reply.From)
 	}
 	if reply.Metadata["processed_by"] != "worker-2" {
 		t.Errorf("expected processed_by 'worker-2', got %q", reply.Metadata["processed_by"])
 	}
 }
 // TestWorkerProcessToolCall sends a tool call to a worker and checks that
 // the reply is a tool result.
 func TestWorkerProcessToolCall(t *testing.T) {
 	worker := NewWorker("worker-3")
 	defer worker.Stop()
 	call := bus.Message{
 		ID:      "tool-1",
 		Type:    bus.MsgTypeToolCall,
 		From:    "caller",
 		Content: "execute command",
 	}
 	reply, err := worker.Process(context.Background(), call)
 	if err != nil {
 		t.Fatalf("Process failed: %v", err)
 	}
 	if got := reply.Type; got != bus.MsgTypeToolResult {
 		t.Errorf("expected MsgTypeToolResult, got %s", got)
 	}
 }
 // TestWorkerStatusDuringToolCall checks that a worker is not left in the
 // waiting-for-tool (or stopped) state once a tool call has returned.
 func TestWorkerStatusDuringToolCall(t *testing.T) {
 	w := NewWorker("worker-4")
 	// Deferred so the worker goroutine is also shut down when t.Fatalf
 	// aborts the test below.
 	defer w.Stop()
 	// Perform a tool call
 	_, err := w.Process(context.Background(), bus.Message{
 		ID:   "tool-1",
 		Type: bus.MsgTypeToolCall,
 		From: "caller",
 	})
 	if err != nil {
 		t.Fatalf("Process failed: %v", err)
 	}
 	// Give the worker goroutine a moment before sampling the status.
 	time.Sleep(5 * time.Millisecond)
 	// Which of these states is observed depends on timing; the point is only
 	// that the worker is no longer waiting for a tool.
 	s := w.Status()
 	if s != StatusProcessing && s != StatusIdle && s != StatusCompleted {
 		t.Errorf("expected Processing/Idle/Completed after tool call, got %s", s)
 	}
 }
 // TestWorkerUnsupportedMessage checks that a worker rejects message types
 // it has no handler for.
 func TestWorkerUnsupportedMessage(t *testing.T) {
 	worker := NewWorker("worker-5")
 	defer worker.Stop()
 	observation := bus.Message{
 		ID:   "unknown-1",
 		Type: bus.MsgTypeObservation,
 		From: "caller",
 	}
 	if _, err := worker.Process(context.Background(), observation); err == nil {
 		t.Error("expected error for unsupported message type")
 	}
 }
 // ============================================================
 // Orchestrator Tests
 // ============================================================
 // TestNewOrchestrator verifies that NewOrchestrator returns a started
 // orchestrator carrying the requested ID and the "orchestrator" role.
 func TestNewOrchestrator(t *testing.T) {
 	const wantID = "orch-1"
 	orch := NewOrchestrator(wantID, nil)
 	if orch == nil {
 		t.Fatal("NewOrchestrator() returned nil")
 	}
 	if id := orch.ID(); id != wantID {
 		t.Errorf("expected id 'orch-1', got %q", id)
 	}
 	if role := orch.Role(); role != "orchestrator" {
 		t.Errorf("expected role 'orchestrator', got %q", role)
 	}
 	if started := orch.IsStarted(); !started {
 		t.Error("expected orchestrator to be started automatically")
 	}
 	orch.Stop()
 }
 // TestOrchestratorAddWorker checks that a registered worker is counted and
 // can be looked up by its ID.
 func TestOrchestratorAddWorker(t *testing.T) {
 	const workerID = "worker-10"
 	orch := NewOrchestrator("orch-2", nil)
 	defer orch.Stop()
 	worker := NewWorker(workerID)
 	defer worker.Stop()
 	orch.AddWorker(worker)
 	if count := orch.WorkerCount(); count != 1 {
 		t.Errorf("expected 1 worker, got %d", count)
 	}
 	found, ok := orch.GetWorker(workerID)
 	if !ok {
 		t.Fatal("expected to find worker-10")
 	}
 	if id := found.ID(); id != workerID {
 		t.Errorf("expected worker ID 'worker-10', got %q", id)
 	}
 }
 // TestOrchestratorRemoveWorker checks that removing a registered worker
 // leaves the orchestrator with an empty pool.
 func TestOrchestratorRemoveWorker(t *testing.T) {
 	const workerID = "worker-11"
 	orch := NewOrchestrator("orch-3", nil)
 	defer orch.Stop()
 	worker := NewWorker(workerID)
 	defer worker.Stop()
 	orch.AddWorker(worker)
 	orch.RemoveWorker(workerID)
 	if remaining := orch.WorkerCount(); remaining != 0 {
 		t.Errorf("expected 0 workers after removal, got %d", remaining)
 	}
 }
 // TestOrchestratorListWorkers checks that ListWorkers returns every
 // registered worker, regardless of order.
 func TestOrchestratorListWorkers(t *testing.T) {
 	orch := NewOrchestrator("orch-4", nil)
 	defer orch.Stop()
 	wantIDs := []string{"w-1", "w-2", "w-3"}
 	for _, id := range wantIDs {
 		worker := NewWorker(id)
 		defer worker.Stop()
 		orch.AddWorker(worker)
 	}
 	listed := orch.ListWorkers()
 	if got, want := len(listed), len(wantIDs); got != want {
 		t.Errorf("expected %d workers, got %d", want, got)
 	}
 	// Collect the listed IDs into a set so the comparison ignores order.
 	seen := make(map[string]bool, len(listed))
 	for _, agent := range listed {
 		seen[agent.ID()] = true
 	}
 	for _, id := range wantIDs {
 		if _, found := seen[id]; !found {
 			t.Errorf("missing worker %q in list", id)
 		}
 	}
 }
 // TestOrchestratorDelegatesToWorker checks that a task sent to the
 // orchestrator is answered by its single registered worker.
 func TestOrchestratorDelegatesToWorker(t *testing.T) {
 	const workerID = "worker-20"
 	orch := NewOrchestrator("orch-5", nil)
 	defer orch.Stop()
 	worker := NewWorker(workerID)
 	defer worker.Stop()
 	orch.AddWorker(worker)
 	task := bus.Message{
 		ID:      "task-1",
 		Type:    bus.MsgTypeTaskRequest,
 		From:    "caller",
 		Content: "do work",
 	}
 	reply, err := orch.Process(context.Background(), task)
 	if err != nil {
 		t.Fatalf("Process failed: %v", err)
 	}
 	if reply.From != workerID {
 		t.Errorf("expected response from 'worker-20', got %q", reply.From)
 	}
 	if processedBy := reply.Metadata["processed_by"]; processedBy != workerID {
 		t.Errorf("expected processed_by 'worker-20', got %q", processedBy)
 	}
 }
 // TestOrchestratorNoWorkers checks that a task request fails when the
 // orchestrator has no workers to delegate to.
 func TestOrchestratorNoWorkers(t *testing.T) {
 	orch := NewOrchestrator("orch-6", nil)
 	defer orch.Stop()
 	task := bus.Message{
 		ID:   "task-1",
 		Type: bus.MsgTypeTaskRequest,
 		From: "caller",
 	}
 	if _, err := orch.Process(context.Background(), task); err == nil {
 		t.Error("expected error when no workers available")
 	}
 }
 // TestOrchestratorSystemMessage checks that system messages are
 // acknowledged by the orchestrator.
 func TestOrchestratorSystemMessage(t *testing.T) {
 	orch := NewOrchestrator("orch-7", nil)
 	defer orch.Stop()
 	ping := bus.Message{
 		ID:   "sys-1",
 		Type: bus.MsgTypeSystem,
 		From: "caller",
 	}
 	reply, err := orch.Process(context.Background(), ping)
 	if err != nil {
 		t.Fatalf("Process failed: %v", err)
 	}
 	if body := reply.Content; body != "orchestrator acknowledged" {
 		t.Errorf("expected acknowledged message, got %v", body)
 	}
 }
 // ============================================================
 // System Tests
 // ============================================================
 // TestNewSystem verifies that a freshly created System manages no agents.
 func TestNewSystem(t *testing.T) {
 	sys := NewSystem()
 	if sys == nil {
 		t.Fatal("NewSystem() returned nil")
 	}
 	count := sys.AgentCount()
 	if count != 0 {
 		t.Errorf("expected 0 agents, got %d", count)
 	}
 }
 // TestSystemCreateWorker checks that CreateWorker returns a worker and
 // registers it with the system.
 func TestSystemCreateWorker(t *testing.T) {
 	sys := NewSystem()
 	worker, err := sys.CreateWorker()
 	switch {
 	case err != nil:
 		t.Fatalf("CreateWorker failed: %v", err)
 	case worker == nil:
 		t.Fatal("CreateWorker returned nil")
 	}
 	if role := worker.Role(); role != "worker" {
 		t.Errorf("expected role 'worker', got %q", role)
 	}
 	if count := sys.AgentCount(); count != 1 {
 		t.Errorf("expected 1 agent, got %d", count)
 	}
 	sys.StopAll()
 }
 // TestSystemStopAgent checks that StopAgent stops a managed agent and
 // removes it from the system's registry.
 func TestSystemStopAgent(t *testing.T) {
 	s := NewSystem()
 	// Fail fast on a creation error instead of dereferencing a nil worker.
 	w, err := s.CreateWorker()
 	if err != nil {
 		t.Fatalf("CreateWorker failed: %v", err)
 	}
 	if err := s.StopAgent(w.ID()); err != nil {
 		t.Fatalf("StopAgent failed: %v", err)
 	}
 	if n := s.AgentCount(); n != 0 {
 		t.Errorf("expected 0 agents, got %d", n)
 	}
 	if _, ok := s.GetAgent(w.ID()); ok {
 		t.Error("expected agent to be removed after StopAgent")
 	}
 }
 // TestSystemStopAgentNotFound checks that stopping an unknown agent ID
 // reports an error.
 func TestSystemStopAgentNotFound(t *testing.T) {
 	sys := NewSystem()
 	if err := sys.StopAgent("nonexistent"); err == nil {
 		t.Error("expected error stopping nonexistent agent")
 	}
 }
 // TestSystemListAgents checks that ListAgents returns one entry per
 // created agent.
 func TestSystemListAgents(t *testing.T) {
 	sys := NewSystem()
 	for i := 0; i < 2; i++ {
 		sys.CreateWorker()
 	}
 	if listed := sys.ListAgents(); len(listed) != 2 {
 		t.Errorf("expected 2 agents, got %d", len(listed))
 	}
 	sys.StopAll()
 }
 // TestSystemAgentInfos checks that AgentInfos reports the ID, role and
 // status of a newly created worker.
 func TestSystemAgentInfos(t *testing.T) {
 	s := NewSystem()
 	// Fail fast on a creation error instead of dereferencing a nil worker.
 	w, err := s.CreateWorker()
 	if err != nil {
 		t.Fatalf("CreateWorker failed: %v", err)
 	}
 	infos := s.AgentInfos()
 	if len(infos) != 1 {
 		t.Fatalf("expected 1 agent info, got %d", len(infos))
 	}
 	if infos[0].ID != w.ID() {
 		t.Errorf("expected ID %q, got %q", w.ID(), infos[0].ID)
 	}
 	if infos[0].Role != "worker" {
 		t.Errorf("expected Role 'worker', got %q", infos[0].Role)
 	}
 	if infos[0].Status != StatusIdle {
 		t.Errorf("expected Status StatusIdle, got %s", infos[0].Status)
 	}
 	s.StopAll()
 }
 // TestSystemStopAll checks that StopAll succeeds and leaves the system
 // without registered agents.
 func TestSystemStopAll(t *testing.T) {
 	sys := NewSystem()
 	for i := 0; i < 3; i++ {
 		sys.CreateWorker()
 	}
 	err := sys.StopAll()
 	if err != nil {
 		t.Fatalf("StopAll failed: %v", err)
 	}
 	if remaining := sys.AgentCount(); remaining != 0 {
 		t.Errorf("expected 0 agents after StopAll, got %d", remaining)
 	}
 }
 // ============================================================
 // ToolWorker Tests
 // ============================================================
 // TestNewToolWorker verifies that NewToolWorker returns a started tool
 // worker carrying the requested ID and the "tool_worker" role.
 func TestNewToolWorker(t *testing.T) {
 	const wantID = "tool-1"
 	worker := NewToolWorker(wantID, nil)
 	if worker == nil {
 		t.Fatal("NewToolWorker() returned nil")
 	}
 	if id := worker.ID(); id != wantID {
 		t.Errorf("expected id 'tool-1', got %q", id)
 	}
 	if role := worker.Role(); role != "tool_worker" {
 		t.Errorf("expected role 'tool_worker', got %q", role)
 	}
 	if started := worker.IsStarted(); !started {
 		t.Error("expected tool worker to be started automatically")
 	}
 	worker.Stop()
 }
 // TestToolWorkerProcessSystemMessage checks that system messages are
 // acknowledged by the tool worker.
 func TestToolWorkerProcessSystemMessage(t *testing.T) {
 	worker := NewToolWorker("tool-2", nil)
 	defer worker.Stop()
 	ping := bus.Message{
 		ID:   "sys-1",
 		Type: bus.MsgTypeSystem,
 		From: "caller",
 	}
 	reply, err := worker.Process(context.Background(), ping)
 	if err != nil {
 		t.Fatalf("Process failed: %v", err)
 	}
 	if body := reply.Content; body != "tool_worker acknowledged" {
 		t.Errorf("expected 'tool_worker acknowledged', got %v", body)
 	}
 }
 // TestToolWorkerUnsupportedMessage checks that a tool worker rejects
 // message types it has no handler for.
 func TestToolWorkerUnsupportedMessage(t *testing.T) {
 	worker := NewToolWorker("tool-3", nil)
 	defer worker.Stop()
 	observation := bus.Message{
 		ID:   "obs-1",
 		Type: bus.MsgTypeObservation,
 		From: "caller",
 	}
 	if _, err := worker.Process(context.Background(), observation); err == nil {
 		t.Error("expected error for unsupported message type")
 	}
 }
 // TestParseToolCallContentMap checks that a map-shaped tool call yields
 // its name and arguments.
 func TestParseToolCallContentMap(t *testing.T) {
 	input := map[string]interface{}{
 		"name":      "exec",
 		"arguments": map[string]interface{}{"command": "ls"},
 	}
 	toolName, toolArgs, err := parseToolCallContent(input)
 	if err != nil {
 		t.Fatalf("parseToolCallContent failed: %v", err)
 	}
 	if toolName != "exec" {
 		t.Errorf("expected name 'exec', got %q", toolName)
 	}
 	if command := toolArgs["command"]; command != "ls" {
 		t.Errorf("expected args['command'] = 'ls', got %v", command)
 	}
 }
 // TestParseToolCallContentMissingName checks that a map without a "name"
 // entry is rejected.
 func TestParseToolCallContentMissingName(t *testing.T) {
 	nameless := map[string]interface{}{"foo": "bar"}
 	if _, _, err := parseToolCallContent(nameless); err == nil {
 		t.Error("expected error for missing name")
 	}
 }
 // ============================================================
 // System ToolWorker Tests
 // ============================================================
 // TestSystemCreateToolWorker checks that CreateToolWorker returns a tool
 // worker and registers it with the system.
 func TestSystemCreateToolWorker(t *testing.T) {
 	sys := NewSystem()
 	worker, err := sys.CreateToolWorker(nil)
 	switch {
 	case err != nil:
 		t.Fatalf("CreateToolWorker failed: %v", err)
 	case worker == nil:
 		t.Fatal("CreateToolWorker returned nil")
 	}
 	if role := worker.Role(); role != "tool_worker" {
 		t.Errorf("expected role 'tool_worker', got %q", role)
 	}
 	if count := sys.AgentCount(); count != 1 {
 		t.Errorf("expected 1 agent, got %d", count)
 	}
 	sys.StopAll()
 }
--- a/pkg/actor/agent.go
+++ b/pkg/actor/agent.go
@ -0,0 +1,18 @@
 // Package actor implements the Actor model for the Orca framework.
 //
 // This file is documentation-only: it declares no types itself and serves
 // as an index of the agent types defined across the package. See actor.go
 // for the base Agent interface and BaseAgent implementation.
 package actor
 // This file exists alongside actor.go as an overview of the package. The
 // LLMAgent and ToolWorker types integrate the actor system with the LLM
 // and Tool subsystems; each is defined in its own file, as listed below.
 //
 // The key types in this package are:
 //   - Agent (interface, in actor.go)
 //   - BaseAgent (struct, in actor.go)
 //   - Orchestrator (in orchestrator.go)
 //   - Worker (in worker.go)
 //   - LLMAgent (in llm_agent.go)
 //   - ToolWorker (in tool_worker.go)
--- a/pkg/actor/llm_agent.go
+++ b/pkg/actor/llm_agent.go
@ -0,0 +1,338 @@
 package actor
 import (
 	"context"
 	"encoding/json"
 	"fmt"
 	"strings"
 	"github.com/orca/orca/pkg/bus"
 	"github.com/orca/orca/pkg/llm"
 	"github.com/orca/orca/pkg/session"
 	"github.com/orca/orca/pkg/tool"
 )
 // LLMAgent is an Agent that answers task requests by talking to an LLM
 // backend.
 //
 // For each user message it optionally records the message in a session,
 // builds the conversation to send, calls the LLM, executes any tool calls
 // the LLM asks for, and feeds the tool results back until the LLM produces
 // a final answer.
 type LLMAgent struct {
 	*BaseAgent
 	// llm is the chat backend used to generate responses.
 	llm llm.LLM
 	// sessionMgr stores conversation history; nil disables persistence.
 	sessionMgr *session.Manager
 	// sessionID names the session used with sessionMgr; empty disables
 	// persistence.
 	sessionID string
 	// toolManager lists the available tools for the system prompt and is
 	// the fallback executor when toolWorker is nil.
 	toolManager *tool.Manager
 	// toolWorker, when set, is preferred for executing tool calls.
 	toolWorker *ToolWorker
 	// windowSize is passed to the session manager when fetching context.
 	windowSize int
 }
 // LLMAgentOption is a functional option for configuring the LLMAgent.
 // Options are applied by NewLLMAgent, in the order given, before the
 // agent is started.
 type LLMAgentOption func(*LLMAgent)
 // WithSessionManager returns an option that installs mgr as the store for
 // the agent's conversation history.
 func WithSessionManager(mgr *session.Manager) LLMAgentOption {
 	apply := func(agent *LLMAgent) {
 		agent.sessionMgr = mgr
 	}
 	return apply
 }
 // WithSessionID returns an option that selects the session under which
 // the agent's conversation is persisted.
 func WithSessionID(id string) LLMAgentOption {
 	apply := func(agent *LLMAgent) {
 		agent.sessionID = id
 	}
 	return apply
 }
 // WithToolManager returns an option that gives the agent a tool manager,
 // used to describe tools to the LLM and to execute them directly.
 func WithToolManager(mgr *tool.Manager) LLMAgentOption {
 	apply := func(agent *LLMAgent) {
 		agent.toolManager = mgr
 	}
 	return apply
 }
 // WithToolWorker returns an option that routes the agent's tool execution
 // through the given ToolWorker.
 func WithToolWorker(w *ToolWorker) LLMAgentOption {
 	apply := func(agent *LLMAgent) {
 		agent.toolWorker = w
 	}
 	return apply
 }
 // WithWindowSize returns an option that overrides the context window size
 // used when fetching session history.
 func WithWindowSize(size int) LLMAgentOption {
 	apply := func(agent *LLMAgent) {
 		agent.windowSize = size
 	}
 	return apply
 }
 // NewLLMAgent builds an LLMAgent around the given backend, applies opts in
 // order, and starts the agent before returning it.
 //
 // It panics if the agent fails to start.
 func NewLLMAgent(id string, backend llm.LLM, opts ...LLMAgentOption) *LLMAgent {
 	agent := &LLMAgent{BaseAgent: NewBaseAgent(id, "llm_agent")}
 	agent.llm = backend
 	agent.windowSize = 20 // default context window; WithWindowSize overrides it
 	for i := range opts {
 		opts[i](agent)
 	}
 	agent.SetHandler(agent.handleMessage)
 	err := agent.Start()
 	if err != nil {
 		panic(fmt.Sprintf("llm_agent: failed to start: %v", err))
 	}
 	return agent
 }
 // handleMessage dispatches a message by type: task requests go to
 // handleUserMessage, system messages to handleSystem, and anything else is
 // rejected with an error.
 func (a *LLMAgent) handleMessage(ctx context.Context, msg bus.Message) (bus.Message, error) {
 	if msg.Type == bus.MsgTypeTaskRequest {
 		return a.handleUserMessage(ctx, msg)
 	}
 	if msg.Type == bus.MsgTypeSystem {
 		return a.handleSystem(ctx, msg)
 	}
 	return bus.Message{}, fmt.Errorf("llm_agent %s: unsupported message type %s", a.ID(), msg.Type)
 }
 // handleUserMessage processes a user message through the LLM.
 //
 // Flow:
 //  1. Persist the user message to session history (when a session manager
 //     and session ID are configured)
 //  2. Build the LLM conversation from the tool prompt and session context
 //  3. When no session is configured, append the user message directly so
 //     the LLM still receives it
 //  4. Run the chat / tool-call loop
 //  5. Persist the assistant response
 //  6. Return the final response addressed to the original sender
 //
 // It returns an error when msg.Content is not a string or when the LLM
 // exchange fails.
 func (a *LLMAgent) handleUserMessage(ctx context.Context, msg bus.Message) (bus.Message, error) {
 	content, ok := msg.Content.(string)
 	if !ok {
 		return bus.Message{}, fmt.Errorf("llm_agent: expected string content, got %T", msg.Content)
 	}
 	// Persistence is only active when both a manager and a session ID are set.
 	persist := a.sessionMgr != nil && a.sessionID != ""
 	if persist {
 		// Lazily create the session the first time it is needed.
 		if _, err := a.sessionMgr.GetSession(a.sessionID); err != nil {
 			a.sessionMgr.CreateSession(a.sessionID, map[string]string{
 				"source": "llm_agent",
 			})
 		}
 		// NOTE(review): the results of CreateSession/AddMessage are not
 		// inspected here; persistence is treated as best-effort.
 		a.sessionMgr.AddMessage(a.sessionID, session.RoleUser, content, nil)
 	}
 	// Build LLM messages from the tool prompt and session context.
 	llmMessages := a.buildLLMMessages()
 	if !persist {
 		// buildLLMMessages only replays session history, so without a
 		// session the current user message must be added explicitly;
 		// otherwise the LLM would be called without the user's input.
 		llmMessages = append(llmMessages, llm.Message{
 			Role:    "user",
 			Content: content,
 		})
 	}
 	// Call LLM (potentially multiple rounds for tool calls).
 	finalResponse, err := a.chatWithToolLoop(ctx, llmMessages)
 	if err != nil {
 		return bus.Message{}, fmt.Errorf("llm_agent: LLM chat failed: %w", err)
 	}
 	// Persist assistant response.
 	if persist {
 		a.sessionMgr.AddMessage(a.sessionID, session.RoleAssistant, finalResponse, nil)
 	}
 	return bus.Message{
 		ID:      msg.ID + "-response",
 		Type:    bus.MsgTypeTaskResponse,
 		From:    a.ID(),
 		To:      msg.From,
 		Content: finalResponse,
 	}, nil
 }
 // buildLLMMessages assembles the conversation sent to the LLM: a system
 // prompt describing the tools (when a tool manager is set) followed by the
 // session context (when a session is configured). If the session context
 // cannot be fetched, only the messages built so far are returned.
 func (a *LLMAgent) buildLLMMessages() []llm.Message {
 	out := []llm.Message{}
 	if a.toolManager != nil {
 		out = append(out, llm.Message{Role: "system", Content: a.buildToolSystemPrompt()})
 	}
 	hasSession := a.sessionMgr != nil && a.sessionID != ""
 	if !hasSession {
 		return out
 	}
 	history, err := a.sessionMgr.GetContext(a.sessionID, a.windowSize)
 	if err != nil {
 		return out
 	}
 	for _, entry := range history {
 		converted := llm.Message{Role: string(entry.Role), Content: entry.Content}
 		// Tool messages carry the originating call ID in their metadata.
 		if entry.Metadata != nil && entry.Role == session.RoleTool {
 			converted.ToolCallID = entry.Metadata["tool_call_id"]
 		}
 		out = append(out, converted)
 	}
 	return out
 }
 // buildToolSystemPrompt renders the system prompt that lists every tool
 // known to the tool manager (name, description and JSON parameters) and
 // the rules for requesting a tool call as JSON. This enables prompt-based
 // tool calling for models without native function calling support.
 // It returns "" when no tool manager is configured.
 func (a *LLMAgent) buildToolSystemPrompt() string {
 	if a.toolManager == nil {
 		return ""
 	}
 	var prompt strings.Builder
 	prompt.WriteString("你是一个 AI 助手，可以使用以下工具来完成用户的请求。\n\n")
 	prompt.WriteString("可用工具列表：\n")
 	tools := a.toolManager.List()
 	for _, entry := range tools {
 		// A marshal failure leaves the parameter text empty, matching the
 		// best-effort nature of this prompt.
 		params, _ := json.Marshal(entry.Parameters())
 		fmt.Fprintf(&prompt, "\n工具名: %s\n", entry.Name())
 		fmt.Fprintf(&prompt, "描述: %s\n", entry.Description())
 		fmt.Fprintf(&prompt, "参数: %s\n", string(params))
 	}
 	prompt.WriteString("\n规则：\n")
 	prompt.WriteString("1. 当你需要调用工具时，请在回复中**只输出**以下 JSON 格式（不要添加其他文字）：\n")
 	prompt.WriteString(`   {"tool": "工具名", "arguments": {"参数名": "参数值"}}` + "\n")
 	prompt.WriteString("2. 如果你已经看到了工具返回的结果，请直接根据结果回答用户，不要再次调用工具。\n")
 	prompt.WriteString("3. 如果你不需要调用工具，请直接回复用户。\n")
 	return prompt.String()
 }
 // chatWithToolLoop calls the LLM repeatedly until it produces a reply that
 // contains no tool call, and returns that reply's content.
 //
 // Tool calls are taken from the response's ToolCalls field or, failing
 // that, parsed from the response content. Each round appends the
 // assistant reply and one user message per tool result to the
 // conversation. An error is returned when a chat call fails or when the
 // round limit is exceeded.
 func (a *LLMAgent) chatWithToolLoop(ctx context.Context, messages []llm.Message) (string, error) {
 	const maxRounds = 10
 	for round := 0; round != maxRounds; round++ {
 		reply, err := a.llm.Chat(ctx, messages)
 		if err != nil {
 			return "", fmt.Errorf("chat round %d failed: %w", round, err)
 		}
 		calls := reply.ToolCalls
 		if len(calls) == 0 {
 			// Fall back to prompt-based tool calls embedded in the text.
 			calls = a.parseToolCallsFromContent(reply.Content)
 			if len(calls) == 0 {
 				return reply.Content, nil
 			}
 		}
 		messages = append(messages, llm.Message{Role: "assistant", Content: reply.Content})
 		for _, call := range calls {
 			output := a.executeToolCall(ctx, call)
 			feedback := fmt.Sprintf("工具 %s 的执行结果：%s", call.Function.Name, output)
 			messages = append(messages, llm.Message{Role: "user", Content: feedback})
 		}
 	}
 	return "", fmt.Errorf("llm_agent: exceeded maximum tool call rounds (%d)", maxRounds)
 }
 // parseToolCallsFromContent extracts a prompt-based tool call from the
 // LLM's text reply.
 //
 // The reply must consist solely of a JSON object of the form
 // {"tool": "<name>", "arguments": {...}}. Surrounding whitespace and a
 // Markdown code fence (``` or ```json) around the object are tolerated,
 // since models frequently wrap JSON output that way. It returns nil when
 // the content is not such an object or names no tool; otherwise it returns
 // a single tool call with ID "call_0" whose arguments are re-encoded as a
 // JSON object string.
 func (a *LLMAgent) parseToolCallsFromContent(content string) []llm.ToolCall {
 	payload := strings.TrimSpace(content)
 	if strings.HasPrefix(payload, "```") {
 		// Strip the opening fence, an optional "json" language tag, and
 		// the closing fence.
 		payload = strings.TrimPrefix(payload, "```")
 		payload = strings.TrimPrefix(payload, "json")
 		payload = strings.TrimSuffix(strings.TrimSpace(payload), "```")
 	}
 	var parsed struct {
 		Tool      string                 `json:"tool"`
 		Arguments map[string]interface{} `json:"arguments"`
 	}
 	if err := json.Unmarshal([]byte(payload), &parsed); err != nil || parsed.Tool == "" {
 		return nil
 	}
 	// Encode missing arguments as {} rather than null so downstream code
 	// always receives a JSON object.
 	if parsed.Arguments == nil {
 		parsed.Arguments = map[string]interface{}{}
 	}
 	argsJSON, err := json.Marshal(parsed.Arguments)
 	if err != nil {
 		return nil
 	}
 	return []llm.ToolCall{{
 		ID:   "call_0",
 		Type: "function",
 		Function: llm.FunctionCall{
 			Name:      parsed.Tool,
 			Arguments: string(argsJSON),
 		},
 	}}
 }
 // executeToolCall runs a single tool call and returns the result as a JSON
 // string.
 //
 // The call's arguments are decoded from JSON; if they cannot be decoded
 // the raw text is passed to the tool under the "_raw" key. Execution goes
 // through the ToolWorker when one is configured, otherwise directly
 // through the tool manager. Failures are never returned as Go errors:
 // they are reported as a JSON object with a single "error" field so the
 // LLM can read them.
 func (a *LLMAgent) executeToolCall(ctx context.Context, tc llm.ToolCall) string {
 	toolName := tc.Function.Name
 	// Parse arguments.
 	var args map[string]interface{}
 	if err := json.Unmarshal([]byte(tc.Function.Arguments), &args); err != nil {
 		args = map[string]interface{}{
 			"_raw": tc.Function.Arguments,
 		}
 	}
 	// A JSON "null" decodes to a nil map; hand tools an empty map instead.
 	if args == nil {
 		args = map[string]interface{}{}
 	}
 	// Execute via ToolWorker (preferred) or directly via tool.Manager.
 	if a.toolWorker != nil {
 		toolCallMsg := bus.Message{
 			ID:      tc.ID,
 			Type:    bus.MsgTypeToolCall,
 			From:    a.ID(),
 			To:      a.toolWorker.ID(),
 			Content: map[string]interface{}{"name": toolName, "arguments": args},
 		}
 		resultMsg, err := a.toolWorker.Process(ctx, toolCallMsg)
 		if err != nil {
 			return toolErrorJSON(fmt.Sprintf("tool execution failed: %v", err))
 		}
 		resultJSON, err := json.Marshal(resultMsg.Content)
 		if err != nil {
 			return toolErrorJSON(fmt.Sprintf("failed to marshal result: %v", err))
 		}
 		return string(resultJSON)
 	}
 	// Fallback: execute directly via tool.Manager.
 	if a.toolManager != nil {
 		result, err := a.toolManager.Execute(toolName, ctx, args)
 		if err != nil {
 			return toolErrorJSON(fmt.Sprintf("tool execution failed: %v", err))
 		}
 		resultJSON, err := json.Marshal(result)
 		if err != nil {
 			return toolErrorJSON(fmt.Sprintf("failed to marshal result: %v", err))
 		}
 		return string(resultJSON)
 	}
 	return toolErrorJSON(fmt.Sprintf("no tool worker or tool manager available for %q", toolName))
 }
 // toolErrorJSON encodes msg as a JSON object with a single "error" field.
 // Going through json.Marshal keeps the output valid JSON even when msg
 // contains quotes, backslashes or newlines.
 func toolErrorJSON(msg string) string {
 	payload, err := json.Marshal(map[string]string{"error": msg})
 	if err != nil {
 		// Not expected for a map of strings; fall back to a fixed object.
 		return `{"error":"internal error"}`
 	}
 	return string(payload)
 }
 // handleSystem answers a system message with an acknowledgement addressed
 // back to the sender. It never fails.
 func (a *LLMAgent) handleSystem(ctx context.Context, msg bus.Message) (bus.Message, error) {
 	var ack bus.Message
 	ack.ID = msg.ID + "-ack"
 	ack.Type = bus.MsgTypeSystem
 	ack.From = a.ID()
 	ack.To = msg.From
 	ack.Content = "llm_agent acknowledged"
 	return ack, nil
 }
 // Compile-time assertions that the concrete agent types satisfy Agent.
 var (
 	_ Agent = (*LLMAgent)(nil)
 	_ Agent = (*ToolWorker)(nil)
 )
--- a/pkg/actor/orchestrator.go
+++ b/pkg/actor/orchestrator.go
@ -0,0 +1,123 @@
 package actor
 import (
 	"context"
 	"fmt"
 	"sync"
 	"github.com/orca/orca/pkg/bus"
 )
 // Orchestrator is an agent that coordinates task execution across a pool of workers.
 //
 // It receives task requests and delegates each one to a registered worker,
 // returning that worker's response. The orchestrator maintains a registry
 // of worker agents and can dynamically add or remove them.
 type Orchestrator struct {
 	*BaseAgent
 	// workers maps a worker's ID to the registered agent; guarded by mu.
 	workers map[string]Agent
 	// bus is the message bus passed to NewOrchestrator, exposed via Bus.
 	bus     bus.MessageBus
 	// mu guards workers.
 	mu      sync.RWMutex
 }
 // NewOrchestrator builds an Orchestrator with an empty worker registry and
 // the given message bus, and starts it before returning.
 //
 // It panics if the agent fails to start.
 func NewOrchestrator(id string, mb bus.MessageBus) *Orchestrator {
 	orch := &Orchestrator{BaseAgent: NewBaseAgent(id, "orchestrator")}
 	orch.workers = map[string]Agent{}
 	orch.bus = mb
 	orch.SetHandler(orch.handleMessage)
 	// The handler is installed above, so a start failure is unexpected.
 	err := orch.Start()
 	if err != nil {
 		panic(fmt.Sprintf("orchestrator: failed to start: %v", err))
 	}
 	return orch
 }
 // handleMessage dispatches a message by type: task requests go to
 // handleTask, system messages to handleSystem, and anything else is
 // rejected with an error.
 func (o *Orchestrator) handleMessage(ctx context.Context, msg bus.Message) (bus.Message, error) {
 	if msg.Type == bus.MsgTypeTaskRequest {
 		return o.handleTask(ctx, msg)
 	}
 	if msg.Type == bus.MsgTypeSystem {
 		return o.handleSystem(ctx, msg)
 	}
 	return bus.Message{}, fmt.Errorf("orchestrator %s: unsupported message type %s", o.ID(), msg.Type)
 }
 // handleTask processes a task request by delegating it to one of the
 // registered workers and returning that worker's response.
 //
 // The worker is chosen while holding the registry lock, but the lock is
 // released before the worker processes the message, so a slow task does
 // not block AddWorker/RemoveWorker. It returns an error when no workers
 // are registered.
 func (o *Orchestrator) handleTask(ctx context.Context, msg bus.Message) (bus.Message, error) {
 	worker, ok := o.pickWorker()
 	if !ok {
 		return bus.Message{}, fmt.Errorf("orchestrator %s: no workers available", o.ID())
 	}
 	return worker.Process(ctx, msg)
 }
 // pickWorker returns an arbitrary registered worker, or false when the
 // registry is empty. Selection follows map iteration order, so it is not
 // a round-robin and may differ between calls.
 func (o *Orchestrator) pickWorker() (Agent, bool) {
 	o.mu.RLock()
 	defer o.mu.RUnlock()
 	for _, w := range o.workers {
 		return w, true
 	}
 	return nil, false
 }
 // handleSystem answers a system message with an acknowledgement addressed
 // back to the sender. It never fails.
 func (o *Orchestrator) handleSystem(ctx context.Context, msg bus.Message) (bus.Message, error) {
 	var ack bus.Message
 	ack.ID = msg.ID + "-ack"
 	ack.Type = bus.MsgTypeSystem
 	ack.From = o.ID()
 	ack.To = msg.From
 	ack.Content = "orchestrator acknowledged"
 	return ack, nil
 }
 // AddWorker registers w under its ID, replacing any worker previously
 // registered with the same ID.
 func (o *Orchestrator) AddWorker(w Agent) {
 	key := w.ID()
 	o.mu.Lock()
 	o.workers[key] = w
 	o.mu.Unlock()
 }
 // RemoveWorker drops the worker registered under id, if any. The worker
 // itself is not stopped.
 func (o *Orchestrator) RemoveWorker(id string) {
 	o.mu.Lock()
 	delete(o.workers, id)
 	o.mu.Unlock()
 }
 // WorkerCount reports how many workers are currently registered.
 func (o *Orchestrator) WorkerCount() int {
 	o.mu.RLock()
 	count := len(o.workers)
 	o.mu.RUnlock()
 	return count
 }
 // GetWorker looks up the worker registered under id. The boolean reports
 // whether such a worker exists.
 func (o *Orchestrator) GetWorker(id string) (Agent, bool) {
 	o.mu.RLock()
 	defer o.mu.RUnlock()
 	if worker, found := o.workers[id]; found {
 		return worker, true
 	}
 	return nil, false
 }
 // ListWorkers returns a snapshot of all registered workers in unspecified
 // order. The returned slice is owned by the caller.
 func (o *Orchestrator) ListWorkers() []Agent {
 	o.mu.RLock()
 	defer o.mu.RUnlock()
 	snapshot := make([]Agent, len(o.workers))
 	next := 0
 	for id := range o.workers {
 		snapshot[next] = o.workers[id]
 		next++
 	}
 	return snapshot
 }
 // Bus returns the message bus this orchestrator was constructed with,
 // which may be nil.
 func (o *Orchestrator) Bus() bus.MessageBus {
 	mb := o.bus
 	return mb
 }
--- a/pkg/actor/system.go
+++ b/pkg/actor/system.go
@ -0,0 +1,180 @@
 package actor
 import (
 	"fmt"
 	"sync"
 	"sync/atomic"
 	"github.com/orca/orca/pkg/tool"
 )
 // System manages the lifecycle of all agents in the Orca actor framework.
 //
 // It provides centralized agent creation, lookup, and shutdown
 // capabilities. Agents are identified by unique IDs whose prefix reflects
 // the kind of agent created.
 type System struct {
 	// mu guards agents.
 	mu     sync.RWMutex
 	// agents maps an agent's ID to the registered agent.
 	agents map[string]Agent
 	// nextID is the counter behind generated agent IDs; it is only
 	// modified through sync/atomic.
 	nextID int64
 }
 // NewSystem returns a System with an empty agent registry.
 func NewSystem() *System {
 	sys := new(System)
 	sys.agents = map[string]Agent{}
 	return sys
 }
 // AgentInfo holds summary information about a managed agent, as returned
 // by System.AgentInfos. It serializes to JSON with the keys "id", "role"
 // and "status".
 type AgentInfo struct {
 	ID     string      `json:"id"`
 	Role   string      `json:"role"`
 	Status ActorStatus `json:"status"`
 }
 // CreateOrchestrator creates an Orchestrator with a generated "orch-<n>"
 // ID and registers it with the system.
 func (s *System) CreateOrchestrator(bus interface{}) (*Orchestrator, error) {
 	return s.addOrchestrator(s.nextAgentID("orch"), bus)
 }
 // CreateWorker creates a Worker with a generated "worker-<n>" ID and
 // registers it with the system.
 func (s *System) CreateWorker() (*Worker, error) {
 	return s.addWorker(s.nextAgentID("worker"))
 }
 // CreateToolWorker creates a ToolWorker backed by manager, gives it a
 // generated "tool-<n>" ID, and registers it with the system.
 func (s *System) CreateToolWorker(manager *tool.Manager) (*ToolWorker, error) {
 	return s.addToolWorker(s.nextAgentID("tool"), manager)
 }
 // nextAgentID returns an ID of the form "<prefix>-<n>", where n comes from
 // a counter that is incremented atomically and shared by all prefixes.
 func (s *System) nextAgentID(prefix string) string {
 	return fmt.Sprintf("%s-%d", prefix, atomic.AddInt64(&s.nextID, 1))
 }
 // addOrchestrator creates an orchestrator with the given id and registers
 // it with the system. The returned error is always nil.
 //
 // NOTE(review): busInterface is accepted for API compatibility but is not
 // wired into the orchestrator, which is always created with a nil bus.
 // The previous implementation type-asserted the value and then discarded
 // the result, so behavior is unchanged. TODO: pass the bus through once
 // the parameter has a concrete type.
 func (s *System) addOrchestrator(id string, busInterface interface{}) (*Orchestrator, error) {
 	orch := NewOrchestrator(id, nil)
 	s.mu.Lock()
 	s.agents[id] = orch
 	s.mu.Unlock()
 	return orch, nil
 }
 // addWorker creates a worker with the given id and registers it with the
 // system. The returned error is always nil.
 func (s *System) addWorker(id string) (*Worker, error) {
 	worker := NewWorker(id)
 	s.mu.Lock()
 	defer s.mu.Unlock()
 	s.agents[id] = worker
 	return worker, nil
 }
 // addToolWorker creates a tool worker with the given id and tool manager
 // and registers it with the system. The returned error is always nil.
 func (s *System) addToolWorker(id string, manager *tool.Manager) (*ToolWorker, error) {
 	worker := NewToolWorker(id, manager)
 	s.mu.Lock()
 	defer s.mu.Unlock()
 	s.agents[id] = worker
 	return worker, nil
 }
 // StopAgent removes the agent registered under id and then stops it,
 // returning the result of the agent's Stop. The agent is stopped after
 // the registry lock has been released. It returns an error when no agent
 // with that ID is registered.
 func (s *System) StopAgent(id string) error {
 	s.mu.Lock()
 	target, found := s.agents[id]
 	if found {
 		delete(s.agents, id)
 	}
 	s.mu.Unlock()
 	if !found {
 		return fmt.Errorf("agent %s not found", id)
 	}
 	return target.Stop()
 }
 // GetAgent looks up the agent registered under id. The boolean reports
 // whether such an agent exists.
 func (s *System) GetAgent(id string) (Agent, bool) {
 	s.mu.RLock()
 	defer s.mu.RUnlock()
 	if found, ok := s.agents[id]; ok {
 		return found, true
 	}
 	return nil, false
 }
 // ListAgents returns a snapshot of all registered agents in unspecified
 // order. The returned slice is owned by the caller.
 func (s *System) ListAgents() []Agent {
 	s.mu.RLock()
 	defer s.mu.RUnlock()
 	snapshot := make([]Agent, len(s.agents))
 	next := 0
 	for id := range s.agents {
 		snapshot[next] = s.agents[id]
 		next++
 	}
 	return snapshot
 }
 // AgentInfos returns summary information (ID, role and status) for all
 // registered agents, in unspecified order.
 //
 // The status is read from any agent that exposes a Status() ActorStatus
 // method, which covers every type embedding *BaseAgent. Agents without
 // such a method are reported as StatusIdle.
 func (s *System) AgentInfos() []AgentInfo {
 	s.mu.RLock()
 	defer s.mu.RUnlock()
 	infos := make([]AgentInfo, 0, len(s.agents))
 	for _, a := range s.agents {
 		status := StatusIdle
 		// Assert on behavior rather than on a fixed list of concrete
 		// types, so new agent types are picked up automatically.
 		if reporter, ok := a.(interface{ Status() ActorStatus }); ok {
 			status = reporter.Status()
 		}
 		infos = append(infos, AgentInfo{
 			ID:     a.ID(),
 			Role:   a.Role(),
 			Status: status,
 		})
 	}
 	return infos
 }
 // StopAll stops every registered agent and empties the registry.
 //
 // The registry is detached under the lock and the agents are stopped
 // after the lock has been released, matching StopAgent; this keeps a slow
 // or re-entrant Stop from blocking other System calls. All agents are
 // stopped even if some fail; the last error encountered is returned, or
 // nil when every agent stopped cleanly.
 func (s *System) StopAll() error {
 	s.mu.Lock()
 	agents := s.agents
 	s.agents = make(map[string]Agent)
 	s.mu.Unlock()
 	var lastErr error
 	for _, agent := range agents {
 		if err := agent.Stop(); err != nil {
 			lastErr = err
 		}
 	}
 	return lastErr
 }
 // AgentCount reports how many agents are currently registered.
 func (s *System) AgentCount() int {
 	s.mu.RLock()
 	count := len(s.agents)
 	s.mu.RUnlock()
 	return count
 }
--- a/pkg/actor/tool_worker.go
+++ b/pkg/actor/tool_worker.go
@ -0,0 +1,153 @@
 package actor
 import (
 	"context"
 	"encoding/json"
 	"fmt"
 	"github.com/orca/orca/pkg/bus"
 	"github.com/orca/orca/pkg/tool"
 )
 // ToolWorker is an agent that processes tool call messages by executing
 // tools through the tool.Manager.
 //
 // It implements the Agent interface and handles MsgTypeToolCall messages.
 // When a tool call is received, it extracts the tool name and arguments
 // from the message content, executes the tool via the Manager, and
 // returns a MsgTypeToolResult with the execution result. Task requests
 // and system messages are also answered.
 type ToolWorker struct {
 	*BaseAgent
 	// manager executes the named tools; it is whatever was passed to
 	// NewToolWorker.
 	manager *tool.Manager
 }
 // NewToolWorker builds a ToolWorker that executes tools through manager
 // and starts it before returning.
 //
 // It panics if the agent fails to start.
 func NewToolWorker(id string, manager *tool.Manager) *ToolWorker {
 	worker := &ToolWorker{BaseAgent: NewBaseAgent(id, "tool_worker")}
 	worker.manager = manager
 	worker.SetHandler(worker.handleMessage)
 	err := worker.Start()
 	if err != nil {
 		panic(fmt.Sprintf("tool_worker: failed to start: %v", err))
 	}
 	return worker
 }
 // handleMessage dispatches a message by type: tool calls, task requests
 // and system messages each have a handler; any other type is rejected
 // with an error.
 func (w *ToolWorker) handleMessage(ctx context.Context, msg bus.Message) (bus.Message, error) {
 	var handle func(context.Context, bus.Message) (bus.Message, error)
 	switch msg.Type {
 	case bus.MsgTypeToolCall:
 		handle = w.handleToolCall
 	case bus.MsgTypeTaskRequest:
 		handle = w.handleTask
 	case bus.MsgTypeSystem:
 		handle = w.handleSystem
 	default:
 		return bus.Message{}, fmt.Errorf("tool_worker %s: unsupported message type %s", w.ID(), msg.Type)
 	}
 	return handle(ctx, msg)
 }
 // handleToolCall processes a tool call by executing the named tool
 // with the provided arguments.
 //
 // msg.Content must be either a map or a JSON-encoded string containing:
 //   - "name": the tool name (string)
 //   - "arguments": the tool arguments (object, optional)
 //
 // The worker's status is WaitingForTool for the duration of the call and
 // is set to Processing on return. The returned error is always nil:
 // malformed content, a missing tool manager and tool failures are all
 // reported as a MsgTypeToolResult whose Content is {"error": "<message>"}.
 func (w *ToolWorker) handleToolCall(ctx context.Context, msg bus.Message) (bus.Message, error) {
 	w.setStatus(StatusWaitingForTool)
 	defer w.setStatus(StatusProcessing)
 	// reply wraps content in the result envelope addressed to the caller.
 	reply := func(content interface{}) (bus.Message, error) {
 		return bus.Message{
 			ID:      msg.ID + "-result",
 			Type:    bus.MsgTypeToolResult,
 			From:    w.ID(),
 			To:      msg.From,
 			Content: content,
 		}, nil
 	}
 	toolName, args, err := parseToolCallContent(msg.Content)
 	if err != nil {
 		return reply(map[string]interface{}{"error": err.Error()})
 	}
 	// A ToolWorker may be constructed without a manager; report that as a
 	// tool error instead of dereferencing a nil manager.
 	if w.manager == nil {
 		return reply(map[string]interface{}{
 			"error": fmt.Sprintf("tool_worker %s: no tool manager configured", w.ID()),
 		})
 	}
 	// Execute the tool.
 	result, err := w.manager.Execute(toolName, ctx, args)
 	if err != nil {
 		return reply(map[string]interface{}{"error": err.Error()})
 	}
 	return reply(result)
 }
 // parseToolCallContent extracts the tool name and arguments from a tool
 // call payload.
 //
 // Two payload shapes are accepted: a map of the form
 // {"name": "<tool>", "arguments": {...}}, or a string holding the same
 // object encoded as JSON. A missing or non-object "arguments" entry yields
 // an empty, non-nil argument map. An error is returned when the name is
 // missing or empty, when a string payload cannot be interpreted, or when
 // the payload has any other type.
 func parseToolCallContent(content interface{}) (string, map[string]interface{}, error) {
 	// extract reads the name and arguments out of a decoded object; the
 	// boolean is false when no usable name is present.
 	extract := func(obj map[string]interface{}) (string, map[string]interface{}, bool) {
 		name, isString := obj["name"].(string)
 		if !isString || name == "" {
 			return "", nil, false
 		}
 		args, _ := obj["arguments"].(map[string]interface{})
 		if args == nil {
 			args = map[string]interface{}{}
 		}
 		return name, args, true
 	}
 	if obj, isMap := content.(map[string]interface{}); isMap {
 		name, args, found := extract(obj)
 		if !found {
 			return "", nil, fmt.Errorf("tool call content missing 'name' field")
 		}
 		return name, args, nil
 	}
 	if raw, isText := content.(string); isText {
 		var decoded map[string]interface{}
 		if json.Unmarshal([]byte(raw), &decoded) == nil {
 			if name, args, found := extract(decoded); found {
 				return name, args, nil
 			}
 		}
 		return "", nil, fmt.Errorf("cannot parse tool call from string content: %s", raw)
 	}
 	return "", nil, fmt.Errorf("unsupported tool call content type: %T", content)
 }
 // handleTask answers a task request with a task response that echoes the
 // request's content back to the sender. It never fails.
 func (w *ToolWorker) handleTask(ctx context.Context, msg bus.Message) (bus.Message, error) {
 	var reply bus.Message
 	reply.ID = msg.ID + "-response"
 	reply.Type = bus.MsgTypeTaskResponse
 	reply.From = w.ID()
 	reply.To = msg.From
 	reply.Content = msg.Content
 	return reply, nil
 }
 // handleSystem answers a system message with an acknowledgement addressed
 // back to the sender. It never fails.
 func (w *ToolWorker) handleSystem(ctx context.Context, msg bus.Message) (bus.Message, error) {
 	var ack bus.Message
 	ack.ID = msg.ID + "-ack"
 	ack.Type = bus.MsgTypeSystem
 	ack.From = w.ID()
 	ack.To = msg.From
 	ack.Content = "tool_worker acknowledged"
 	return ack, nil
 }
--- a/pkg/actor/worker.go
+++ b/pkg/actor/worker.go
@ -0,0 +1,88 @@
 package actor
 import (
 	"context"
 	"fmt"
 	"github.com/orca/orca/pkg/bus"
 )
 // Worker is an agent that processes tasks and makes tool calls.
 //
 // Workers are the execution units in the actor system. They receive
 // task requests from the orchestrator, process them (potentially making
 // tool calls), and return results.
 //
 // In this file the task and tool-call handlers are placeholders that echo
 // the incoming content back to the sender.
 type Worker struct {
 	// BaseAgent is embedded; NewWorker installs the message handler on it
 	// and starts it.
 	*BaseAgent
 }
 // NewWorker builds a Worker around a fresh base agent of kind "worker",
 // installs the worker's message router as its handler and starts it.
 //
 // It panics if the agent cannot be started.
 func NewWorker(id string) *Worker {
 	worker := &Worker{BaseAgent: NewBaseAgent(id, "worker")}
 	worker.SetHandler(worker.handleMessage)
 	startErr := worker.Start()
 	if startErr != nil {
 		panic(fmt.Sprintf("worker: failed to start: %v", startErr))
 	}
 	return worker
 }
 // handleMessage dispatches an incoming message by type: task requests,
 // tool calls and system messages each go to their own handler, and any
 // other type is rejected with an error.
 func (w *Worker) handleMessage(ctx context.Context, msg bus.Message) (bus.Message, error) {
 	kind := msg.Type
 	if kind == bus.MsgTypeTaskRequest {
 		return w.handleTask(ctx, msg)
 	}
 	if kind == bus.MsgTypeToolCall {
 		return w.handleToolCall(ctx, msg)
 	}
 	if kind == bus.MsgTypeSystem {
 		return w.handleSystem(ctx, msg)
 	}
 	return bus.Message{}, fmt.Errorf("worker %s: unsupported message type %s", w.ID(), msg.Type)
 }
 // handleTask answers a task request with a task response.
 //
 // This is a placeholder: the request content is echoed back unchanged and
 // the response metadata records which worker handled it. A real
 // implementation would involve the LLM, tool calls, etc.
 func (w *Worker) handleTask(ctx context.Context, msg bus.Message) (bus.Message, error) {
 	var reply bus.Message
 	reply.ID = msg.ID + "-response"
 	reply.Type = bus.MsgTypeTaskResponse
 	reply.From = w.ID()
 	reply.To = msg.From
 	reply.Content = msg.Content
 	reply.Metadata = map[string]string{"processed_by": w.ID()}
 	return reply, nil
 }
 // handleToolCall answers a tool call with a tool result.
 //
 // The worker is marked as waiting for a tool for the duration of the call
 // and switched back to processing when the function returns. No tool is
 // actually invoked yet: the call content is echoed back as the result.
 func (w *Worker) handleToolCall(ctx context.Context, msg bus.Message) (bus.Message, error) {
 	w.setStatus(StatusWaitingForTool)
 	defer w.setStatus(StatusProcessing)
 	var result bus.Message
 	result.ID = msg.ID + "-result"
 	result.Type = bus.MsgTypeToolResult
 	result.From = w.ID()
 	result.To = msg.From
 	result.Content = msg.Content
 	return result, nil
 }
 // handleSystem acknowledges an internal system message. The reply is
 // addressed to the original sender and carries a fixed acknowledgement text.
 func (w *Worker) handleSystem(ctx context.Context, msg bus.Message) (bus.Message, error) {
 	var ack bus.Message
 	ack.ID = msg.ID + "-ack"
 	ack.Type = bus.MsgTypeSystem
 	ack.From = w.ID()
 	ack.To = msg.From
 	ack.Content = "worker acknowledged"
 	return ack, nil
 }
--- a/pkg/bus/bus.go
+++ b/pkg/bus/bus.go
@ -0,0 +1,164 @@
 package bus
 import (
 	"errors"
 	"fmt"
 	"sync"
 	"sync/atomic"
 )
 // Handler is a callback function that processes a delivered message.
 //
 // Each subscription invokes its handler from a dedicated delivery goroutine,
 // one message at a time, in the order messages were queued for it.
 type Handler func(Message)
 // Subscription represents an active subscription to a message bus topic.
 type Subscription interface {
 	// ID returns the identifier assigned to the subscription by the bus.
 	ID() string
 	// Topic returns the topic the subscription was registered for.
 	Topic() string
 	// Unsubscribe removes the subscription from the bus so that it stops
 	// receiving messages.
 	Unsubscribe()
 }
 // MessageBus is the central communication hub of the Orca framework.
 //
 // It uses a publish/subscribe pattern built on Go channels. Components
 // publish messages to named topics, and all subscribers to that topic
 // receive the message asynchronously.
 type MessageBus interface {
 	// Publish sends a message to all active subscribers of the given topic.
 	// Publishing to a topic without subscribers is not an error; publishing
 	// on a closed bus is.
 	Publish(topic string, msg Message) error
 	// Subscribe registers a handler for the given topic. It fails once the
 	// bus has been closed.
 	Subscribe(topic string, handler Handler) (Subscription, error)
 	// Close gracefully shuts down the bus, cleaning up all subscriptions.
 	// Calling Close more than once is allowed.
 	Close() error
 }
 // subscription implements the Subscription interface.
 type subscription struct {
 	// id is the bus-assigned identifier ("sub-<n>").
 	id     string
 	// topic is the topic this subscription listens on.
 	topic  string
 	// ch queues messages between Publish and the delivery goroutine.
 	ch     chan Message
 	// bus is the owning bus, used to remove the subscription on Unsubscribe.
 	bus    *messageBus
 	// active is cleared when the subscription is removed or the bus closes;
 	// Publish and deliver both skip inactive subscriptions.
 	active *atomic.Bool
 }
 // ID returns the identifier the bus assigned to this subscription.
 func (s *subscription) ID() string   { return s.id }
 // Topic returns the topic this subscription was registered for.
 func (s *subscription) Topic() string { return s.topic }
 // Unsubscribe asks the owning bus to remove this subscription.
 func (s *subscription) Unsubscribe()  { s.bus.unsubscribe(s) }
 // messageBus is the channel-based implementation of MessageBus.
 type messageBus struct {
 	// mu guards topics and closed. Publish takes the read lock; Subscribe,
 	// unsubscribe and Close take the write lock.
 	mu     sync.RWMutex
 	// topics maps a topic name to its current subscriptions.
 	topics map[string][]*subscription
 	// nextID is the counter used to build subscription identifiers.
 	nextID int64
 	// closed is set by Close; afterwards Publish and Subscribe return errors.
 	closed bool
 }
 // New returns an empty, open message bus with no topics or subscribers.
 func New() MessageBus {
 	mb := new(messageBus)
 	mb.topics = map[string][]*subscription{}
 	return mb
 }
 // Publish queues msg for every active subscriber of topic.
 //
 // Sends never block: when a subscriber's buffer is full the message is
 // silently dropped for that subscriber. A topic with no subscribers is not
 // an error. Publishing on a closed bus returns an error.
 func (mb *messageBus) Publish(topic string, msg Message) error {
 	mb.mu.RLock()
 	defer mb.mu.RUnlock()
 	if mb.closed {
 		return errors.New("message bus is closed")
 	}
 	// Ranging over a missing topic yields nothing, so no lookup check is needed.
 	for _, target := range mb.topics[topic] {
 		if !target.active.Load() {
 			continue
 		}
 		select {
 		case target.ch <- msg:
 		default:
 			// Buffer full: drop the message for this subscriber.
 		}
 	}
 	return nil
 }
 // Subscribe registers handler for topic and starts a goroutine that feeds it
 // the messages published to that topic.
 //
 // Each subscription gets a unique "sub-<n>" identifier and a buffer of 64
 // pending messages. An error is returned when handler is nil (it would
 // otherwise panic inside the delivery goroutine on the first message) or
 // when the bus has already been closed.
 func (mb *messageBus) Subscribe(topic string, handler Handler) (Subscription, error) {
 	if handler == nil {
 		return nil, errors.New("message bus: handler must not be nil")
 	}
 	mb.mu.Lock()
 	defer mb.mu.Unlock()
 	if mb.closed {
 		return nil, errors.New("message bus is closed")
 	}
 	id := fmt.Sprintf("sub-%d", atomic.AddInt64(&mb.nextID, 1))
 	sub := &subscription{
 		id:     id,
 		topic:  topic,
 		ch:     make(chan Message, 64),
 		bus:    mb,
 		active: &atomic.Bool{},
 	}
 	sub.active.Store(true)
 	mb.topics[topic] = append(mb.topics[topic], sub)
 	// The delivery goroutine ends when the channel is closed by unsubscribe
 	// or Close.
 	go sub.deliver(handler)
 	return sub, nil
 }
 // deliver is the subscription's delivery loop: it hands each queued message
 // to handler and stops when the channel is closed or the subscription has
 // been deactivated.
 func (s *subscription) deliver(handler Handler) {
 	for {
 		msg, open := <-s.ch
 		if !open || !s.active.Load() {
 			return
 		}
 		handler(msg)
 	}
 }
 // unsubscribe deactivates sub, removes it from its topic and closes its
 // channel so the delivery goroutine exits.
 //
 // The vacated slice slot is cleared so the removed subscription is not kept
 // alive by the backing array, and a topic left without subscribers is
 // deleted from the map. Calling it for a subscription that is no longer
 // registered (already removed, or the bus was closed) only marks it inactive.
 func (mb *messageBus) unsubscribe(sub *subscription) {
 	mb.mu.Lock()
 	defer mb.mu.Unlock()
 	sub.active.Store(false)
 	topic := sub.Topic()
 	subs := mb.topics[topic]
 	for i, s := range subs {
 		if s.ID() != sub.ID() {
 			continue
 		}
 		// Shift the tail down and nil out the last slot before shrinking.
 		last := len(subs) - 1
 		copy(subs[i:], subs[i+1:])
 		subs[last] = nil
 		subs = subs[:last]
 		if len(subs) == 0 {
 			delete(mb.topics, topic)
 		} else {
 			mb.topics[topic] = subs
 		}
 		close(s.ch)
 		return
 	}
 }
 // Close marks the bus as closed, deactivates every subscription, closes
 // their channels and forgets all topics. Further calls do nothing and
 // return nil.
 func (mb *messageBus) Close() error {
 	mb.mu.Lock()
 	defer mb.mu.Unlock()
 	if !mb.closed {
 		mb.closed = true
 		for name, group := range mb.topics {
 			for i := range group {
 				group[i].active.Store(false)
 				close(group[i].ch)
 			}
 			delete(mb.topics, name)
 		}
 	}
 	return nil
 }
--- a/pkg/bus/bus_test.go
+++ b/pkg/bus/bus_test.go
@ -0,0 +1,252 @@
 package bus
 import (
 	"sync"
 	"sync/atomic"
 	"testing"
 	"time"
 )
 // TestNewBus checks that the constructor returns a usable (non-nil) bus.
 func TestNewBus(t *testing.T) {
 	if created := New(); created == nil {
 		t.Fatal("New() returned nil")
 	}
 }
 // TestPublishSubscribe checks that a single published message reaches a
 // single subscriber exactly once.
 func TestPublishSubscribe(t *testing.T) {
 	b := New()
 	defer b.Close()
 	var received int32
 	var wg sync.WaitGroup
 	wg.Add(1)
 	sub, err := b.Subscribe("test", func(msg Message) {
 		atomic.AddInt32(&received, 1)
 		wg.Done()
 	})
 	if err != nil {
 		t.Fatalf("Subscribe failed: %v", err)
 	}
 	defer sub.Unsubscribe()
 	err = b.Publish("test", Message{
 		ID:   "msg-1",
 		Type: MsgTypeSystem,
 		From: "test",
 	})
 	if err != nil {
 		t.Fatalf("Publish failed: %v", err)
 	}
 	wg.Wait()
 	// Report the atomically loaded value rather than reading the counter
 	// directly, so every access to it goes through sync/atomic.
 	if n := atomic.LoadInt32(&received); n != 1 {
 		t.Errorf("expected 1 message, got %d", n)
 	}
 }
 // TestPublishNoSubscribers checks that publishing to a topic nobody
 // subscribed to succeeds.
 func TestPublishNoSubscribers(t *testing.T) {
 	b := New()
 	defer b.Close()
 	if err := b.Publish("nonexistent", Message{ID: "msg-1"}); err != nil {
 		t.Fatalf("Publish to nonexistent topic should not error: %v", err)
 	}
 }
 // TestMultipleSubscribers checks that one published message is delivered to
 // every subscriber of the topic.
 func TestMultipleSubscribers(t *testing.T) {
 	b := New()
 	defer b.Close()
 	const subscribers = 3
 	var (
 		delivered int32
 		pending   sync.WaitGroup
 	)
 	pending.Add(subscribers)
 	onMessage := func(Message) {
 		atomic.AddInt32(&delivered, 1)
 		pending.Done()
 	}
 	for idx := 0; idx < subscribers; idx++ {
 		sub, err := b.Subscribe("multi", onMessage)
 		if err != nil {
 			t.Fatalf("Subscribe %d failed: %v", idx, err)
 		}
 		defer sub.Unsubscribe()
 	}
 	if err := b.Publish("multi", Message{ID: "msg-1"}); err != nil {
 		t.Fatalf("Publish failed: %v", err)
 	}
 	pending.Wait()
 	if got := atomic.LoadInt32(&delivered); got != subscribers {
 		t.Errorf("expected 3 messages, got %d", got)
 	}
 }
 // TestUnsubscribe checks that a handler receives messages published before
 // Unsubscribe but none published afterwards.
 func TestUnsubscribe(t *testing.T) {
 	b := New()
 	defer b.Close()
 	var delivered int32
 	count := func(Message) {
 		atomic.AddInt32(&delivered, 1)
 	}
 	sub, err := b.Subscribe("test", count)
 	if err != nil {
 		t.Fatalf("Subscribe failed: %v", err)
 	}
 	// settle gives the asynchronous delivery goroutine time to run.
 	const settle = 50 * time.Millisecond
 	// First message: subscription still active.
 	b.Publish("test", Message{ID: "msg-1"})
 	time.Sleep(settle)
 	sub.Unsubscribe()
 	// Second message: must not be delivered.
 	b.Publish("test", Message{ID: "msg-2"})
 	time.Sleep(settle)
 	if got := atomic.LoadInt32(&delivered); got != 1 {
 		t.Errorf("expected 1 message after unsubscribe, got %d", got)
 	}
 }
 // TestSubscribeAfterClose checks that a closed bus refuses new subscriptions.
 func TestSubscribeAfterClose(t *testing.T) {
 	b := New()
 	b.Close()
 	noop := func(Message) {}
 	if _, err := b.Subscribe("test", noop); err == nil {
 		t.Error("expected error subscribing to closed bus")
 	}
 }
 // TestPublishAfterClose checks that a closed bus refuses to publish.
 func TestPublishAfterClose(t *testing.T) {
 	b := New()
 	b.Close()
 	if err := b.Publish("test", Message{ID: "msg-1"}); err == nil {
 		t.Error("expected error publishing to closed bus")
 	}
 }
 // TestSubscriptionID checks that two subscriptions get distinct IDs and
 // report the topics they were created for.
 func TestSubscriptionID(t *testing.T) {
 	b := New()
 	defer b.Close()
 	noop := func(Message) {}
 	first, _ := b.Subscribe("a", noop)
 	defer first.Unsubscribe()
 	second, _ := b.Subscribe("b", noop)
 	defer second.Unsubscribe()
 	if first.ID() == second.ID() {
 		t.Error("subscription IDs should be unique")
 	}
 	topicsMatch := first.Topic() == "a" && second.Topic() == "b"
 	if !topicsMatch {
 		t.Error("topic mismatch")
 	}
 }
 // TestConcurrentPublish publishes 100 messages from concurrent goroutines
 // and expects the subscriber to see all of them.
 //
 // Publish never blocks and drops a message when the subscriber's buffer is
 // full, so a dropped message would leave the WaitGroup waiting forever. The
 // wait is therefore bounded by a timeout, turning a potential hang into a
 // failure that reports how many messages actually arrived.
 func TestConcurrentPublish(t *testing.T) {
 	b := New()
 	defer b.Close()
 	const total = 100
 	var received int32
 	var wg sync.WaitGroup
 	wg.Add(total)
 	sub, err := b.Subscribe("concurrent", func(msg Message) {
 		atomic.AddInt32(&received, 1)
 		wg.Done()
 	})
 	if err != nil {
 		t.Fatalf("Subscribe failed: %v", err)
 	}
 	defer sub.Unsubscribe()
 	for i := 0; i < total; i++ {
 		go func() {
 			b.Publish("concurrent", Message{
 				ID:   time.Now().String(),
 				Type: MsgTypeSystem,
 			})
 		}()
 	}
 	// Wait for all deliveries, but never longer than the timeout.
 	done := make(chan struct{})
 	go func() {
 		wg.Wait()
 		close(done)
 	}()
 	select {
 	case <-done:
 	case <-time.After(5 * time.Second):
 		t.Fatalf("timed out waiting for messages: received %d of %d", atomic.LoadInt32(&received), total)
 	}
 	if n := atomic.LoadInt32(&received); n != total {
 		t.Errorf("expected 100 messages, got %d", n)
 	}
 }
 // TestDifferentTopics checks that a message published to one topic is only
 // delivered to that topic's subscribers.
 func TestDifferentTopics(t *testing.T) {
 	b := New()
 	defer b.Close()
 	var topics []string
 	var mu sync.Mutex
 	sub1, _ := b.Subscribe("topic-a", func(msg Message) {
 		mu.Lock()
 		topics = append(topics, "a")
 		mu.Unlock()
 	})
 	defer sub1.Unsubscribe()
 	sub2, _ := b.Subscribe("topic-b", func(msg Message) {
 		mu.Lock()
 		topics = append(topics, "b")
 		mu.Unlock()
 	})
 	defer sub2.Unsubscribe()
 	b.Publish("topic-a", Message{ID: "msg-1"})
 	time.Sleep(50 * time.Millisecond)
 	// The handlers append from delivery goroutines under mu, so the slice
 	// must also be read under mu; snapshot it to avoid a data race.
 	mu.Lock()
 	got := append([]string(nil), topics...)
 	mu.Unlock()
 	if len(got) != 1 || got[0] != "a" {
 		t.Errorf("expected only topic-a to receive message, got %v", got)
 	}
 }
 // TestCloseIdempotent checks that closing the bus twice succeeds both times.
 func TestCloseIdempotent(t *testing.T) {
 	b := New()
 	first := b.Close()
 	second := b.Close()
 	if first != nil {
 		t.Fatalf("first Close failed: %v", first)
 	}
 	if second != nil {
 		t.Fatalf("second Close should be idempotent: %v", second)
 	}
 }
 // TestMessageTypeString checks the textual name of every message type,
 // including the fallback for an out-of-range value.
 func TestMessageTypeString(t *testing.T) {
 	type expectation struct {
 		kind MessageType
 		text string
 	}
 	table := []expectation{
 		{kind: MsgTypeSystem, text: "system"},
 		{kind: MsgTypeTaskRequest, text: "task_request"},
 		{kind: MsgTypeTaskResponse, text: "task_response"},
 		{kind: MsgTypeToolCall, text: "tool_call"},
 		{kind: MsgTypeToolResult, text: "tool_result"},
 		{kind: MsgTypeObservation, text: "observation"},
 		{kind: MsgTypeError, text: "error"},
 		{kind: MsgTypeLog, text: "log"},
 		{kind: MessageType(99), text: "unknown"},
 	}
 	for i := range table {
 		entry := table[i]
 		got := entry.kind.String()
 		if got == entry.text {
 			continue
 		}
 		t.Errorf("MessageType(%d).String() = %q, want %q", entry.kind, got, entry.text)
 	}
 }
--- a/pkg/bus/types.go
+++ b/pkg/bus/types.go
@ -0,0 +1,67 @@
 // Package bus provides the message bus system for inter-component communication.
 //
 // The message bus is the central nervous system of the Orca framework.
 // All components (kernel, plugins, agents) communicate through it
 // via a publish/subscribe pattern over Go channels.
 package bus
 import "time"
 // MessageType identifies the category of a message travelling over the bus.
 type MessageType int
 // The message categories, numbered consecutively from zero.
 const (
 	// MsgTypeSystem marks internal kernel messages.
 	MsgTypeSystem MessageType = iota
 	// MsgTypeTaskRequest marks a request to perform a task.
 	MsgTypeTaskRequest
 	// MsgTypeTaskResponse marks the result of a task.
 	MsgTypeTaskResponse
 	// MsgTypeToolCall marks a request to invoke a tool.
 	MsgTypeToolCall
 	// MsgTypeToolResult marks the result of a tool execution.
 	MsgTypeToolResult
 	// MsgTypeObservation marks an observation from tool/command execution.
 	MsgTypeObservation
 	// MsgTypeError marks an error message.
 	MsgTypeError
 	// MsgTypeLog marks a log message for observability.
 	MsgTypeLog
 )
 // String returns the lowercase, human-readable name of the message type,
 // or "unknown" for a value outside the declared constants.
 func (mt MessageType) String() string {
 	// names is indexed by the constant's numeric value.
 	names := [...]string{
 		MsgTypeSystem:       "system",
 		MsgTypeTaskRequest:  "task_request",
 		MsgTypeTaskResponse: "task_response",
 		MsgTypeToolCall:     "tool_call",
 		MsgTypeToolResult:   "tool_result",
 		MsgTypeObservation:  "observation",
 		MsgTypeError:        "error",
 		MsgTypeLog:          "log",
 	}
 	if mt < 0 || int(mt) >= len(names) {
 		return "unknown"
 	}
 	return names[mt]
 }
 // Message is the universal data unit in the message bus system.
 //
 // Every component communicates by publishing and subscribing to Messages.
 // The struct tags define the field names used when a Message is encoded
 // as JSON.
 type Message struct {
 	// ID identifies the message; replies built elsewhere in this code base
 	// derive their ID from the request ID plus a suffix.
 	ID        string            `json:"id"`
 	// Type is the message category.
 	Type      MessageType       `json:"type"`
 	// From names the sender.
 	From      string            `json:"from"`
 	// To names the intended recipient.
 	To        string            `json:"to"`
 	// Content is the payload; its concrete type depends on the message.
 	Content   interface{}       `json:"content"`
 	// Metadata holds optional string annotations and is omitted from JSON
 	// when empty.
 	Metadata  map[string]string `json:"metadata,omitempty"`
 	// Timestamp is the time associated with the message.
 	Timestamp time.Time         `json:"timestamp"`
 }
--- a/pkg/kernel/kernel.go
+++ b/pkg/kernel/kernel.go
@ -0,0 +1,392 @@
 // Package kernel implements the microkernel core of the Orca framework.
 //
 // The kernel is the minimal runtime that manages plugin lifecycle,
 // message routing, and inter-component communication.
 package kernel
 import (
 	"context"
 	"fmt"
 	"log"
 	"os"
 	"sync"
 	"time"
 	"github.com/orca/orca/internal/config"
 	"github.com/orca/orca/pkg/actor"
 	"github.com/orca/orca/pkg/bus"
 	"github.com/orca/orca/pkg/llm"
 	"github.com/orca/orca/pkg/plugin"
 	"github.com/orca/orca/pkg/session"
 	"github.com/orca/orca/pkg/skill"
 	"github.com/orca/orca/pkg/tool"
 )
 // Kernel is the microkernel core of the Orca framework.
 //
 // It orchestrates plugin lifecycle, message routing, and inter-component
 // communication. The kernel initializes and manages:
 //   - Message bus for inter-component communication
 //   - Plugin registry for extensibility
 //   - Session manager for conversation persistence
 //   - Tool manager with built-in tools
 //   - Skill manager for skill-based automation
 //   - Actor system with orchestrator, workers, and LLM agent
 type Kernel struct {
 	// mu is held by Start, Stop, RegisterPlugin, UnregisterPlugin and
 	// IsRunning.
 	mu       sync.RWMutex
 	// mb is the message bus; it is closed by Stop.
 	mb       bus.MessageBus
 	// registry holds every registered plugin and its lifecycle state.
 	registry *plugin.Registry
 	// plugins lists the plugins whose Init succeeded during Start, in
 	// initialization order; Stop shuts them down in reverse.
 	plugins  []plugin.Plugin
 	// started is true between a successful Start and the next Stop.
 	started  bool
 	// Integration components
 	config      *config.Config
 	// sessionMgr stays nil when the session store could not be created.
 	sessionMgr  *session.Manager
 	toolMgr     *tool.Manager
 	skillMgr    *skill.Manager
 	actorSystem *actor.System
 	// orch, llmAgent and toolWorker are set by initializeActorSystem and may
 	// be nil if that setup failed part-way.
 	orch        *actor.Orchestrator
 	llmAgent    *actor.LLMAgent
 	toolWorker  *actor.ToolWorker
 }
 // New builds a Kernel from the default configuration. It is shorthand for
 // NewWithConfig(config.DefaultConfig()).
 func New() *Kernel {
 	defaults := config.DefaultConfig()
 	return NewWithConfig(defaults)
 }
 // NewWithConfig builds a Kernel from cfg, falling back to the default
 // configuration when cfg is nil.
 //
 // Construction wires up, in order: the message bus, plugin registry and
 // actor system; the session manager (skipped with a logged warning when the
 // session store cannot be created); the tool manager with the built-in
 // tools; the skill manager; and finally the agents of the actor system.
 // The kernel is returned unstarted.
 func NewWithConfig(cfg *config.Config) *Kernel {
 	if cfg == nil {
 		cfg = config.DefaultConfig()
 	}
 	k := new(Kernel)
 	k.mb = bus.New()
 	k.registry = plugin.NewRegistry()
 	k.config = cfg
 	k.actorSystem = actor.NewSystem()
 	// Session persistence is optional: without a store the kernel runs
 	// with a nil session manager.
 	if store, err := session.NewJSONLStore(cfg.Session.StorageDir); err == nil {
 		k.sessionMgr = session.NewManager(store, k.mb)
 	} else {
 		log.Printf("kernel: warning: failed to create session store: %v", err)
 	}
 	// Tools must exist before the actor system, which hands the tool
 	// manager to its agents.
 	k.toolMgr = tool.NewManager()
 	k.registerBuiltinTools()
 	// Skills live in a "skills" directory below the session storage directory.
 	skillDir := cfg.Session.StorageDir + "/skills"
 	k.skillMgr = skill.NewManager(skillDir)
 	k.initializeActorSystem()
 	return k
 }
 // registerBuiltinTools adds the five built-in tools (exec, read_file,
 // write_file, list_dir, search_files) to the tool manager. A tool that
 // fails to register is logged and skipped; the others are still registered.
 func (k *Kernel) registerBuiltinTools() {
 	builtins := [...]tool.Tool{
 		tool.NewExecTool(nil),     // exec - shell commands
 		tool.NewReadFileTool(),    // read_file
 		tool.NewWriteFileTool(),   // write_file
 		tool.NewListDirTool(),     // list_dir
 		tool.NewSearchFilesTool(), // search_files
 	}
 	for i := range builtins {
 		candidate := builtins[i]
 		err := k.toolMgr.Register(candidate)
 		if err == nil {
 			continue
 		}
 		log.Printf("kernel: warning: failed to register tool %q: %v", candidate.Name(), err)
 	}
 }
 // initializeActorSystem sets up the orchestrator, tool worker, and LLM agent.
 //
 // Failures to create the orchestrator or the tool worker are logged and end
 // the setup early, leaving the remaining agent fields nil. On success the
 // LLM agent and then the tool worker are added to the orchestrator as
 // workers.
 func (k *Kernel) initializeActorSystem() {
 	// Create orchestrator
 	orch, err := k.actorSystem.CreateOrchestrator(k)
 	if err != nil {
 		log.Printf("kernel: warning: failed to create orchestrator: %v", err)
 		return
 	}
 	k.orch = orch
 	// Create tool worker
 	tw, err := k.actorSystem.CreateToolWorker(k.toolMgr)
 	if err != nil {
 		log.Printf("kernel: warning: failed to create tool worker: %v", err)
 		return
 	}
 	k.toolWorker = tw
 	// Create LLM backend
 	ollama := k.createLLMBackend()
 	// Create LLM agent
 	// The agent ID is derived from the number of agents currently listed by
 	// the actor system.
 	llmAgentID := fmt.Sprintf("llm-%d", len(k.actorSystem.ListAgents())+1)
 	llmOpts := []actor.LLMAgentOption{
 		actor.WithToolManager(k.toolMgr),
 		actor.WithToolWorker(k.toolWorker),
 		actor.WithWindowSize(k.config.Session.MaxHistory),
 	}
 	// Session support is attached only when a session manager exists.
 	if k.sessionMgr != nil {
 		sessionID := "default"
 		// Create the "default" session when looking it up fails.
 		// NOTE(review): whatever CreateSession returns is discarded here, so
 		// a failure to create the session goes unnoticed — confirm intended.
 		if _, err := k.sessionMgr.GetSession(sessionID); err != nil {
 			k.sessionMgr.CreateSession(sessionID, map[string]string{
 				"source": "kernel",
 			})
 		}
 		llmOpts = append(llmOpts,
 			actor.WithSessionManager(k.sessionMgr),
 			actor.WithSessionID(sessionID),
 		)
 	}
 	llmAgent := actor.NewLLMAgent(llmAgentID, ollama, llmOpts...)
 	k.llmAgent = llmAgent
 	// Register LLM agent as orchestrator's worker
 	k.orch.AddWorker(llmAgent)
 	// Also register tool worker as a fallback worker
 	k.orch.AddWorker(tw)
 }
 // createLLMBackend builds the Ollama client used as the LLM backend.
 //
 // Base URL, model and timeout come from the kernel configuration. Each can
 // be overridden by the OLLAMA_BASE_URL, OLLAMA_MODEL and OLLAMA_TIMEOUT
 // environment variables; an OLLAMA_TIMEOUT value that does not parse as a
 // duration is ignored.
 func (k *Kernel) createLLMBackend() llm.LLM {
 	settings := k.config.Ollama
 	baseURL, model, timeout := settings.BaseURL, settings.Model, settings.Timeout
 	if override := os.Getenv("OLLAMA_BASE_URL"); override != "" {
 		baseURL = override
 	}
 	if override := os.Getenv("OLLAMA_MODEL"); override != "" {
 		model = override
 	}
 	if raw := os.Getenv("OLLAMA_TIMEOUT"); raw != "" {
 		parsed, parseErr := time.ParseDuration(raw)
 		if parseErr == nil {
 			timeout = parsed
 		}
 	}
 	options := []llm.OllamaOption{
 		llm.WithBaseURL(baseURL),
 		llm.WithModel(model),
 		llm.WithTimeout(timeout),
 	}
 	client := llm.NewOllamaClient(options...)
 	log.Printf("kernel: created Ollama client (model=%s, url=%s)", model, baseURL)
 	return client
 }
 // Bus returns the kernel's message bus, created when the kernel was
 // constructed.
 func (k *Kernel) Bus() bus.MessageBus {
 	return k.mb
 }
 // Registry returns the plugin registry that backs RegisterPlugin,
 // GetPlugin and ListPlugins.
 func (k *Kernel) Registry() *plugin.Registry {
 	return k.registry
 }
 // SessionManager returns the session manager. The result is nil when the
 // session store could not be created during construction.
 func (k *Kernel) SessionManager() *session.Manager {
 	return k.sessionMgr
 }
 // ToolManager returns the tool manager holding the built-in tools.
 func (k *Kernel) ToolManager() *tool.Manager {
 	return k.toolMgr
 }
 // SkillManager returns the skill manager used by InitPlugins to load skills.
 func (k *Kernel) SkillManager() *skill.Manager {
 	return k.skillMgr
 }
 // ActorSystem returns the actor system that owns the kernel's agents.
 func (k *Kernel) ActorSystem() *actor.System {
 	return k.actorSystem
 }
 // Orchestrator returns the orchestrator agent. The result is nil when the
 // orchestrator could not be created during construction.
 func (k *Kernel) Orchestrator() *actor.Orchestrator {
 	return k.orch
 }
 // LLMAgent returns the LLM agent. The result is nil when actor system setup
 // stopped before the agent was created.
 func (k *Kernel) LLMAgent() *actor.LLMAgent {
 	return k.llmAgent
 }
 // SendMessage submits content as a task request and returns the reply text.
 //
 // This is the primary public API for interacting with the Orca system. The
 // request is handed to the orchestrator, which processes it and produces
 // the response.
 //
 // Parameters:
 //   - from: the sender identifier (e.g., "user", "cli")
 //   - to: the recipient (use "llm" for the LLM agent)
 //   - content: the message content (plain text)
 //
 // A string response is returned as-is; any other response content is
 // rendered with the default %v formatting. An error is returned when the
 // kernel is not running, the orchestrator is missing, or processing fails.
 func (k *Kernel) SendMessage(from, to, content string) (string, error) {
 	switch {
 	case !k.IsRunning():
 		return "", fmt.Errorf("kernel: kernel is not running")
 	case k.orch == nil:
 		return "", fmt.Errorf("kernel: orchestrator not initialized")
 	}
 	request := bus.Message{
 		Type:    bus.MsgTypeTaskRequest,
 		From:    from,
 		To:      to,
 		Content: content,
 	}
 	reply, err := k.orch.Process(context.Background(), request)
 	if err != nil {
 		return "", fmt.Errorf("kernel: orchestrator processing failed: %w", err)
 	}
 	if text, isString := reply.Content.(string); isString {
 		return text, nil
 	}
 	return fmt.Sprintf("%v", reply.Content), nil
 }
 // InitPlugins asks the skill manager to load every skill from its
 // directory. Loading is best-effort: errors are only logged, and the method
 // always returns nil. Without a skill manager it does nothing.
 func (k *Kernel) InitPlugins() error {
 	manager := k.skillMgr
 	if manager == nil {
 		return nil
 	}
 	loaded, loadErr := manager.LoadAll()
 	if loadErr != nil {
 		log.Printf("kernel: warning: skill loading had errors: %v", loadErr)
 	}
 	if loaded > 0 {
 		log.Printf("kernel: loaded %d skills", loaded)
 	}
 	return nil
 }
 // GetPlugin returns a registered plugin by name. The boolean reports
 // whether the registry knows a plugin with that name.
 func (k *Kernel) GetPlugin(name string) (plugin.Plugin, bool) {
 	return k.registry.Get(name)
 }
 // ListPlugins returns all currently registered plugins, as reported by the
 // registry.
 func (k *Kernel) ListPlugins() []plugin.Plugin {
 	return k.registry.List()
 }
 // RegisterPlugin adds p to the registry without initializing it; plugins
 // are initialized later by Start. Registration is refused with an error
 // once the kernel has been started.
 func (k *Kernel) RegisterPlugin(p plugin.Plugin) error {
 	k.mu.Lock()
 	defer k.mu.Unlock()
 	if !k.started {
 		return k.registry.Register(p)
 	}
 	return fmt.Errorf("kernel: cannot register plugin %q: kernel already started", p.Name())
 }
 // UnregisterPlugin removes a plugin from the registry.
 //
 // Unlike RegisterPlugin it does not check whether the kernel is running,
 // and it does not call the plugin's Shutdown.
 func (k *Kernel) UnregisterPlugin(name string) error {
 	k.mu.Lock()
 	defer k.mu.Unlock()
 	return k.registry.Unregister(name)
 }
 // Start initializes all registered plugins and marks the kernel as running.
 //
 // A plugin whose Init fails is logged, put in the error state and skipped;
 // it does not prevent Start from succeeding. Start returns an error only
 // when the kernel is already started.
 //
 // NOTE(review): k.mu is held for writing while each plugin's Init runs, so
 // an Init that calls back into a kernel method taking k.mu (IsRunning,
 // RegisterPlugin, ...) would block — confirm no plugin does this.
 func (k *Kernel) Start() error {
 	k.mu.Lock()
 	defer k.mu.Unlock()
 	if k.started {
 		return fmt.Errorf("kernel: already started")
 	}
 	// Marked as running before plugins are initialized.
 	k.started = true
 	// Initialize plugins
 	plugins := k.registry.List()
 	k.plugins = make([]plugin.Plugin, 0, len(plugins))
 	for _, p := range plugins {
 		k.registry.SetState(p.Name(), plugin.StateInitialized)
 		if err := p.Init(k); err != nil {
 			log.Printf("kernel: warning: failed to init plugin %q: %v", p.Name(), err)
 			k.registry.SetState(p.Name(), plugin.StateError)
 			continue
 		}
 		k.registry.SetState(p.Name(), plugin.StateRunning)
 		// Only successfully initialized plugins are tracked for shutdown.
 		k.plugins = append(k.plugins, p)
 		log.Printf("kernel: plugin %q (%s) initialized", p.Name(), p.Version())
 	}
 	log.Printf("kernel: started (tools=%d)", k.toolMgr.Count())
 	return nil
 }
 // Stop gracefully shuts down the kernel.
 //
 // It stops the actor system, shuts down the initialized plugins in reverse
 // initialization order, and closes the message bus. Errors from the actor
 // system or from individual plugins are logged and do not abort the
 // shutdown; the returned error is the result of closing the bus. Stopping a
 // kernel that is not running is a no-op.
 //
 // NOTE(review): Start does not create a new bus, so after Stop the bus
 // stays closed — confirm whether restarting a stopped kernel is supported.
 func (k *Kernel) Stop() error {
 	k.mu.Lock()
 	defer k.mu.Unlock()
 	if !k.started {
 		return nil
 	}
 	// Stop actor system first
 	if k.actorSystem != nil {
 		if err := k.actorSystem.StopAll(); err != nil {
 			log.Printf("kernel: warning: error stopping actor system: %v", err)
 		}
 	}
 	// Stop plugins
 	for i := len(k.plugins) - 1; i >= 0; i-- {
 		p := k.plugins[i]
 		// The state is set to stopped before Shutdown is attempted and is
 		// left that way even if Shutdown fails.
 		k.registry.SetState(p.Name(), plugin.StateStopped)
 		if err := p.Shutdown(); err != nil {
 			log.Printf("kernel: warning: error shutting down plugin %q: %v", p.Name(), err)
 			continue
 		}
 		log.Printf("kernel: plugin %q shut down", p.Name())
 	}
 	k.plugins = nil
 	k.started = false
 	return k.mb.Close()
 }
 // IsRunning reports whether the kernel is currently started, i.e. Start
 // has succeeded and Stop has not been called since.
 func (k *Kernel) IsRunning() bool {
 	k.mu.RLock()
 	running := k.started
 	k.mu.RUnlock()
 	return running
 }
--- a/pkg/kernel/kernel_test.go
+++ b/pkg/kernel/kernel_test.go
@ -0,0 +1,343 @@
 package kernel
 import (
 	"errors"
 	"sync/atomic"
 	"testing"
 	"time"
 	"github.com/orca/orca/pkg/bus"
 	"github.com/orca/orca/pkg/plugin"
 )
 // testPlugin implements Plugin for kernel testing.
 //
 // Its behavior is injected through optional callbacks: when a callback is
 // nil the corresponding lifecycle method succeeds without doing anything.
 type testPlugin struct {
 	// name and version are returned verbatim by Name and Version.
 	name    string
 	version string
 	// initFn, when set, is invoked by Init with the host it receives.
 	initFn  func(host plugin.PluginHost) error
 	// closeFn, when set, is invoked by Shutdown.
 	closeFn func() error
 }
 // Name returns the configured plugin name.
 func (p *testPlugin) Name() string                       { return p.name }
 // Version returns the configured plugin version.
 func (p *testPlugin) Version() string                     { return p.version }
 // Init forwards to the injected init callback, or succeeds when none is set.
 func (p *testPlugin) Init(host plugin.PluginHost) error {
 	if p.initFn == nil {
 		return nil
 	}
 	return p.initFn(host)
 }
 // Shutdown forwards to the injected close callback, or succeeds when none
 // is set.
 func (p *testPlugin) Shutdown() error {
 	if p.closeFn == nil {
 		return nil
 	}
 	return p.closeFn()
 }
 // TestNewKernel checks that a default kernel exposes a bus and a registry.
 func TestNewKernel(t *testing.T) {
 	kern := New()
 	if kern == nil {
 		t.Fatal("New() returned nil")
 	}
 	if mb := kern.Bus(); mb == nil {
 		t.Error("Bus() returned nil")
 	}
 	if reg := kern.Registry(); reg == nil {
 		t.Error("Registry() returned nil")
 	}
 }
 // TestKernelStartStop checks that IsRunning tracks Start and Stop.
 func TestKernelStartStop(t *testing.T) {
 	kern := New()
 	startErr := kern.Start()
 	if startErr != nil {
 		t.Fatalf("Start failed: %v", startErr)
 	}
 	if running := kern.IsRunning(); !running {
 		t.Error("expected kernel running after Start")
 	}
 	stopErr := kern.Stop()
 	if stopErr != nil {
 		t.Fatalf("Stop failed: %v", stopErr)
 	}
 	if running := kern.IsRunning(); running {
 		t.Error("expected kernel stopped after Stop")
 	}
 }
 // TestKernelDoubleStart checks that starting a running kernel is an error.
 func TestKernelDoubleStart(t *testing.T) {
 	kern := New()
 	kern.Start()
 	if second := kern.Start(); second == nil {
 		t.Error("expected error on double start")
 	}
 	kern.Stop()
 }
 // TestKernelRegisterPlugin checks that a registered plugin can be looked up
 // by name.
 func TestKernelRegisterPlugin(t *testing.T) {
 	kern := New()
 	candidate := &testPlugin{name: "test", version: "1.0.0"}
 	if err := kern.RegisterPlugin(candidate); err != nil {
 		t.Fatalf("RegisterPlugin failed: %v", err)
 	}
 	found, present := kern.GetPlugin("test")
 	if !present {
 		t.Fatal("GetPlugin returned not found")
 	}
 	if found.Name() != "test" {
 		t.Errorf("expected name 'test', got %q", found.Name())
 	}
 }
 // TestKernelRegisterPluginAfterStart checks that plugins cannot be
 // registered once the kernel is running.
 func TestKernelRegisterPluginAfterStart(t *testing.T) {
 	kern := New()
 	kern.Start()
 	defer kern.Stop()
 	late := &testPlugin{name: "test", version: "1.0.0"}
 	if err := kern.RegisterPlugin(late); err == nil {
 		t.Error("expected error registering plugin after start")
 	}
 }
 // TestKernelPluginLifecycle checks that Start initializes a plugin exactly
 // once and Stop shuts it down exactly once.
 func TestKernelPluginLifecycle(t *testing.T) {
 	kern := New()
 	var inits, shutdowns int32
 	tracked := &testPlugin{name: "lifecycle", version: "1.0.0"}
 	tracked.initFn = func(plugin.PluginHost) error {
 		atomic.AddInt32(&inits, 1)
 		return nil
 	}
 	tracked.closeFn = func() error {
 		atomic.AddInt32(&shutdowns, 1)
 		return nil
 	}
 	kern.RegisterPlugin(tracked)
 	kern.Start()
 	if got := atomic.LoadInt32(&inits); got != 1 {
 		t.Errorf("expected init called once, got %d", got)
 	}
 	kern.Stop()
 	if got := atomic.LoadInt32(&shutdowns); got != 1 {
 		t.Errorf("expected shutdown called once, got %d", got)
 	}
 }
 // TestKernelPluginInitFailure checks that a plugin failing to initialize
 // does not make Start fail (graceful degradation).
 func TestKernelPluginInitFailure(t *testing.T) {
 	kern := New()
 	broken := &testPlugin{name: "failing", version: "1.0.0"}
 	broken.initFn = func(plugin.PluginHost) error {
 		return errors.New("init failed")
 	}
 	kern.RegisterPlugin(broken)
 	if err := kern.Start(); err != nil {
 		t.Fatalf("Start should succeed even with failing plugin: %v", err)
 	}
 	kern.Stop()
 }
 // TestKernelPluginShutdownFailure checks that a plugin failing to shut down
 // does not make Stop fail.
 func TestKernelPluginShutdownFailure(t *testing.T) {
 	kern := New()
 	broken := &testPlugin{name: "failing-shutdown", version: "1.0.0"}
 	broken.initFn = func(plugin.PluginHost) error {
 		return nil
 	}
 	broken.closeFn = func() error {
 		return errors.New("shutdown failed")
 	}
 	kern.RegisterPlugin(broken)
 	kern.Start()
 	if err := kern.Stop(); err != nil {
 		t.Fatalf("Stop should succeed even with failing plugin shutdown: %v", err)
 	}
 }
 // TestKernelMultiplePlugins checks that every registered plugin is listed
 // after the kernel starts.
 func TestKernelMultiplePlugins(t *testing.T) {
 	kern := New()
 	names := []string{"alpha", "beta", "gamma"}
 	for i := range names {
 		kern.RegisterPlugin(&testPlugin{name: names[i], version: "1.0.0"})
 	}
 	kern.Start()
 	if listed := kern.ListPlugins(); len(listed) != len(names) {
 		t.Errorf("expected %d plugins, got %d", len(names), len(listed))
 	}
 	kern.Stop()
 }
 // TestKernelUnregisterPlugin checks that an unregistered plugin can no
 // longer be found.
 func TestKernelUnregisterPlugin(t *testing.T) {
 	kern := New()
 	kern.RegisterPlugin(&testPlugin{name: "remove-me", version: "1.0.0"})
 	if err := kern.UnregisterPlugin("remove-me"); err != nil {
 		t.Fatalf("UnregisterPlugin failed: %v", err)
 	}
 	if _, stillThere := kern.GetPlugin("remove-me"); stillThere {
 		t.Error("plugin should not exist after unregister")
 	}
 }
 // TestKernelStopWithoutStart checks that stopping a never-started kernel
 // succeeds without doing anything.
 func TestKernelStopWithoutStart(t *testing.T) {
 	kern := New()
 	if err := kern.Stop(); err != nil {
 		t.Fatalf("Stop without Start should be a no-op: %v", err)
 	}
 }
 // TestKernelPluginReceivesHost checks that Init is handed a usable
 // PluginHost: it must expose the bus and be able to look up the plugin
 // itself.
 func TestKernelPluginReceivesHost(t *testing.T) {
 	k := New()
 	var gotHost plugin.PluginHost
 	p := &testPlugin{
 		name:    "host-check",
 		version: "1.0.0",
 		initFn: func(host plugin.PluginHost) error {
 			gotHost = host
 			return nil
 		},
 	}
 	k.RegisterPlugin(p)
 	k.Start()
 	// Stop via defer so the kernel is shut down even when an assertion
 	// below aborts the test.
 	defer k.Stop()
 	if gotHost == nil {
 		t.Fatal("plugin did not receive PluginHost")
 	}
 	// Verify the host can access bus
 	if gotHost.Bus() == nil {
 		t.Error("PluginHost.Bus() returned nil")
 	}
 	// Verify plugin discovery through host
 	p2, ok := gotHost.GetPlugin("host-check")
 	if !ok {
 		// Fatal, not Error: p2 is not usable when the lookup failed, and
 		// calling a method on it below would panic.
 		t.Fatal("PluginHost.GetPlugin should find itself")
 	}
 	if p2.Name() != "host-check" {
 		t.Errorf("expected name 'host-check', got %q", p2.Name())
 	}
 }
 // TestKernelAllPluginsInitialized checks that Start calls Init on every
 // registered plugin.
 func TestKernelAllPluginsInitialized(t *testing.T) {
 	kern := New()
 	names := []string{"a", "b", "c"}
 	seen := map[string]bool{}
 	// register adds a plugin that records its own name when initialized.
 	register := func(name string) {
 		kern.RegisterPlugin(&testPlugin{
 			name: name,
 			initFn: func(plugin.PluginHost) error {
 				seen[name] = true
 				return nil
 			},
 		})
 	}
 	for i := range names {
 		register(names[i])
 	}
 	kern.Start()
 	for _, name := range names {
 		if seen[name] {
 			continue
 		}
 		t.Errorf("plugin %q was not initialized", name)
 	}
 	kern.Stop()
 }
 // TestKernelShutdownAllPlugins checks that Stop calls Shutdown on every
 // plugin that was initialized.
 func TestKernelShutdownAllPlugins(t *testing.T) {
 	kern := New()
 	names := []string{"x", "y", "z"}
 	closed := map[string]bool{}
 	// register adds a plugin that records its own name when shut down.
 	register := func(name string) {
 		kern.RegisterPlugin(&testPlugin{
 			name: name,
 			initFn: func(plugin.PluginHost) error {
 				return nil
 			},
 			closeFn: func() error {
 				closed[name] = true
 				return nil
 			},
 		})
 	}
 	for i := range names {
 		register(names[i])
 	}
 	kern.Start()
 	kern.Stop()
 	for _, name := range names {
 		if closed[name] {
 			continue
 		}
 		t.Errorf("plugin %q was not shut down", name)
 	}
 }
 // TestKernelMessageBusIntegration checks that the bus exposed by a running
 // kernel delivers a published message to a subscriber.
 func TestKernelMessageBusIntegration(t *testing.T) {
 	kern := New()
 	kern.Start()
 	defer kern.Stop()
 	var delivered int32
 	count := func(bus.Message) {
 		atomic.AddInt32(&delivered, 1)
 	}
 	kernelBus := kern.Bus()
 	sub, err := kernelBus.Subscribe("kernel-test", count)
 	if err != nil {
 		t.Fatalf("Subscribe failed: %v", err)
 	}
 	defer sub.Unsubscribe()
 	kernelBus.Publish("kernel-test", bus.Message{ID: "test-msg"})
 	// Delivery is asynchronous; give the handler time to run.
 	time.Sleep(50 * time.Millisecond)
 	if got := atomic.LoadInt32(&delivered); got != 1 {
 		t.Errorf("expected 1 message via kernel bus, got %d", got)
 	}
 }
--- a/pkg/llm/llm.go
+++ b/pkg/llm/llm.go
@ -0,0 +1,24 @@
 // Package llm provides the LLM integration layer for the Orca framework.
 //
 // It defines the LLM interface for interacting with language models,
 // the Ollama client implementation, and the shared types for chat
 // messages, tool calls, and streaming responses.
 package llm
 import "context"
 // LLM is the interface for interacting with language models.
 //
 // Implementations provide Chat (for complete responses) and Stream
 // (for streaming token-by-token responses) methods. Both methods
 // accept a list of messages and return the model's response.
 //
 // The Message, Response and StreamHandler types are declared elsewhere in
 // this package.
 type LLM interface {
 	// Chat sends a list of messages to the LLM and returns a complete response.
 	// If the model decides to call tools, the response contains ToolCalls.
 	// The context is passed as the first argument.
 	Chat(ctx context.Context, messages []Message) (*Response, error)
 	// Stream sends messages and streams the response token-by-token.
 	// The handler is called for each chunk. The final response is not
 	// collected; use Chat for complete responses.
 	Stream(ctx context.Context, messages []Message, handler StreamHandler) error
 }
--- a/pkg/llm/ollama.go
+++ b/pkg/llm/ollama.go
@ -0,0 +1,301 @@
 package llm
 import (
 	"bufio"
 	"bytes"
 	"context"
 	"encoding/json"
 	"fmt"
 	"io"
 	"net/http"
 	"strings"
 	"time"
 )
 // OllamaClient implements the LLM interface for Ollama's API.
 //
 // It communicates with a running Ollama server via its REST API.
 // Supports chat, streaming, tool calling (function calling), and
 // embedding generation.
 //
 // Tool calls are parsed out of chat responses; Chat and Stream do not
 // populate the request's Tools field themselves.
 type OllamaClient struct {
 	// baseURL is the server address that endpoint paths such as
 	// "/api/chat" and "/api/embed" are appended to.
 	baseURL    string
 	// model is the model name sent with every request.
 	model      string
 	// httpClient performs all HTTP requests issued by the client.
 	httpClient *http.Client
 }
 // OllamaOption is a functional option for configuring the OllamaClient.
 //
 // NewOllamaClient applies options in the order they are passed, after the
 // defaults have been set, so a later option overrides an earlier one.
 type OllamaOption func(*OllamaClient)
 // WithBaseURL returns an option that points the client at the given Ollama
 // server. All trailing "/" characters are removed so that endpoint paths can
 // be appended to the stored value directly.
 func WithBaseURL(url string) OllamaOption {
 	return func(client *OllamaClient) {
 		normalized := url
 		for strings.HasSuffix(normalized, "/") {
 			normalized = strings.TrimSuffix(normalized, "/")
 		}
 		client.baseURL = normalized
 	}
 }
 // WithModel returns an option that replaces the model name the client sends
 // with its requests.
 func WithModel(model string) OllamaOption {
 	apply := func(client *OllamaClient) {
 		client.model = model
 	}
 	return apply
 }
 // WithTimeout sets the HTTP client timeout.
 //
 // The timeout is applied to a private copy of the client's current
 // *http.Client, so a client supplied through WithHTTPClient (for example
 // http.DefaultClient) is never modified behind the caller's back. The copy
 // shares the original's Transport, CheckRedirect and Jar. If no HTTP client
 // is set at the time the option runs, a new one is created instead of
 // dereferencing nil.
 func WithTimeout(timeout time.Duration) OllamaOption {
 	return func(c *OllamaClient) {
 		if c.httpClient == nil {
 			c.httpClient = &http.Client{Timeout: timeout}
 			return
 		}
 		clone := *c.httpClient
 		clone.Timeout = timeout
 		c.httpClient = &clone
 	}
 }
 // WithHTTPClient returns an option that makes the client issue its requests
 // through the supplied *http.Client instead of the default one.
 func WithHTTPClient(client *http.Client) OllamaOption {
 	install := func(target *OllamaClient) {
 		target.httpClient = client
 	}
 	return install
 }
 // NewOllamaClient builds an OllamaClient, starting from the defaults below
 // and then applying opts in the order given.
 //
 // Defaults:
 //   - BaseURL: http://localhost:11434
 //   - Model: gemma4:e4b
 //   - Timeout: 30s
 func NewOllamaClient(opts ...OllamaOption) *OllamaClient {
 	client := new(OllamaClient)
 	client.baseURL = "http://localhost:11434"
 	client.model = "gemma4:e4b"
 	client.httpClient = &http.Client{Timeout: 30 * time.Second}
 	for i := range opts {
 		opts[i](client)
 	}
 	return client
 }
 // Chat posts the conversation to Ollama's /api/chat endpoint with streaming
 // disabled and returns the parsed reply. Any status other than 200 is
 // reported as an error that carries the status code and the response body.
 // Tool calls found in the reply are included in the returned Response.
 func (c *OllamaClient) Chat(ctx context.Context, messages []Message) (*Response, error) {
 	// Tool definitions are not attached to the request here; they are
 	// built externally (see BuildToolDefsFromMap).
 	payload, err := json.Marshal(OllamaChatRequest{
 		Model:    c.model,
 		Messages: messages,
 		Stream:   false,
 	})
 	if err != nil {
 		return nil, fmt.Errorf("ollama: failed to marshal request: %w", err)
 	}
 	endpoint := c.baseURL + "/api/chat"
 	httpReq, err := http.NewRequestWithContext(ctx, http.MethodPost, endpoint, bytes.NewReader(payload))
 	if err != nil {
 		return nil, fmt.Errorf("ollama: failed to create request: %w", err)
 	}
 	httpReq.Header.Set("Content-Type", "application/json")
 	httpResp, err := c.httpClient.Do(httpReq)
 	if err != nil {
 		return nil, fmt.Errorf("ollama: request failed: %w", err)
 	}
 	defer httpResp.Body.Close()
 	if status := httpResp.StatusCode; status != http.StatusOK {
 		// Best effort: the body is only used to enrich the error text.
 		errBody, _ := io.ReadAll(httpResp.Body)
 		return nil, fmt.Errorf("ollama: API error (status %d): %s",
 			status, string(errBody))
 	}
 	// Keep the reply as raw JSON so parseOllamaResponse can interpret it.
 	var raw json.RawMessage
 	if decodeErr := json.NewDecoder(httpResp.Body).Decode(&raw); decodeErr != nil {
 		return nil, fmt.Errorf("ollama: failed to decode response: %w", decodeErr)
 	}
 	return parseOllamaResponse(raw)
 }
 // parseOllamaResponse converts a raw /api/chat reply into a Response,
 // handling both plain text replies and replies that carry tool calls.
 //
 // A tool call's "arguments" value is accepted in two encodings: a JSON
 // string that itself contains JSON (the form FunctionCall.Arguments stores),
 // or an inline JSON value such as an object. In the second case the raw JSON
 // text is stored in FunctionCall.Arguments. Previously an inline object made
 // the tool-call decode fail, and the failure was swallowed so the tool calls
 // were silently dropped.
 //
 // It returns an error when raw is not valid JSON or a known field has an
 // unexpected type.
 func parseOllamaResponse(raw json.RawMessage) (*Response, error) {
 	// Local wire shape: identical to the tool-call response except that
 	// arguments stay undecoded until their encoding is known.
 	var wire struct {
 		Message struct {
 			Content   string `json:"content"`
 			ToolCalls []struct {
 				ID       string `json:"id"`
 				Type     string `json:"type"`
 				Function struct {
 					Name      string          `json:"name"`
 					Arguments json.RawMessage `json:"arguments"`
 				} `json:"function"`
 			} `json:"tool_calls"`
 		} `json:"message"`
 	}
 	if err := json.Unmarshal(raw, &wire); err != nil {
 		return nil, fmt.Errorf("ollama: failed to parse response: %w", err)
 	}
 	resp := &Response{Content: wire.Message.Content}
 	for _, tc := range wire.Message.ToolCalls {
 		// Default to the raw JSON text (inline object/array/number...).
 		args := string(tc.Function.Arguments)
 		// A JSON string (or null) decodes cleanly; use the decoded text.
 		var encoded string
 		if err := json.Unmarshal(tc.Function.Arguments, &encoded); err == nil {
 			args = encoded
 		}
 		resp.ToolCalls = append(resp.ToolCalls, ToolCall{
 			ID:   tc.ID,
 			Type: tc.Type,
 			Function: FunctionCall{
 				Name:      tc.Function.Name,
 				Arguments: args,
 			},
 		})
 	}
 	return resp, nil
 }
 // Stream sends a chat request to Ollama with streaming enabled.
 //
 // The response body is read as newline-delimited JSON. For every line whose
 // message content is non-empty, handler is called with that content; an
 // error returned by handler stops the stream and is returned unchanged.
 // Empty lines and lines that are not valid JSON are skipped. Reading stops
 // at the first object with "done": true.
 //
 // NOTE(review): http.Client.Timeout also bounds reading the response body,
 // so a stream that runs longer than the configured timeout is cut off —
 // confirm that this is intended for long generations.
 func (c *OllamaClient) Stream(ctx context.Context, messages []Message, handler StreamHandler) error {
 	req := OllamaChatRequest{
 		Model:    c.model,
 		Messages: messages,
 		Stream:   true,
 	}
 	body, err := json.Marshal(req)
 	if err != nil {
 		return fmt.Errorf("ollama: failed to marshal request: %w", err)
 	}
 	httpReq, err := http.NewRequestWithContext(ctx, http.MethodPost,
 		c.baseURL+"/api/chat", bytes.NewReader(body))
 	if err != nil {
 		return fmt.Errorf("ollama: failed to create request: %w", err)
 	}
 	httpReq.Header.Set("Content-Type", "application/json")
 	resp, err := c.httpClient.Do(httpReq)
 	if err != nil {
 		return fmt.Errorf("ollama: stream request failed: %w", err)
 	}
 	defer resp.Body.Close()
 	if resp.StatusCode != http.StatusOK {
 		respBody, _ := io.ReadAll(resp.Body)
 		return fmt.Errorf("ollama: stream API error (status %d): %s",
 			resp.StatusCode, string(respBody))
 	}
 	scanner := bufio.NewScanner(resp.Body)
 	// The default Scanner limit is 64 KiB per line; a longer line would end
 	// the stream with bufio.ErrTooLong. Allow lines of up to 4 MiB while
 	// still starting from a small buffer.
 	scanner.Buffer(make([]byte, 0, 64*1024), 4*1024*1024)
 	for scanner.Scan() {
 		// Bytes avoids copying every line into a string; the slice is only
 		// used before the next call to Scan.
 		line := scanner.Bytes()
 		if len(line) == 0 {
 			continue
 		}
 		// Each line is a JSON object: {"model":"...","created_at":"...","message":{"role":"assistant","content":"..."},"done":false}
 		var streamResp OllamaChatResponse
 		if err := json.Unmarshal(line, &streamResp); err != nil {
 			continue // Skip malformed lines
 		}
 		if streamResp.Message.Content != "" {
 			if err := handler(streamResp.Message.Content); err != nil {
 				return err
 			}
 		}
 		if streamResp.Done {
 			break
 		}
 	}
 	return scanner.Err()
 }
 // Embed generates an embedding vector for the given input text.
 //
 // The request is posted to /api/embed using the client's model. The reply
 // may carry the result either under "embeddings" (a list of vectors, one per
 // input; the first is used) or under the single-vector "embedding" key; both
 // are accepted. Previously only "embedding" was read, so a reply that used
 // "embeddings" produced an empty vector without any error.
 //
 // It returns an error when the request fails, the server answers with a
 // status other than 200, the body cannot be decoded, or the reply contains
 // no embedding values.
 func (c *OllamaClient) Embed(ctx context.Context, input string) (*EmbeddingResponse, error) {
 	req := OllamaEmbedRequest{
 		Model: c.model,
 		Input: input,
 	}
 	body, err := json.Marshal(req)
 	if err != nil {
 		return nil, fmt.Errorf("ollama: failed to marshal embed request: %w", err)
 	}
 	httpReq, err := http.NewRequestWithContext(ctx, http.MethodPost,
 		c.baseURL+"/api/embed", bytes.NewReader(body))
 	if err != nil {
 		return nil, fmt.Errorf("ollama: failed to create embed request: %w", err)
 	}
 	httpReq.Header.Set("Content-Type", "application/json")
 	resp, err := c.httpClient.Do(httpReq)
 	if err != nil {
 		return nil, fmt.Errorf("ollama: embed request failed: %w", err)
 	}
 	defer resp.Body.Close()
 	if resp.StatusCode != http.StatusOK {
 		respBody, _ := io.ReadAll(resp.Body)
 		return nil, fmt.Errorf("ollama: embed API error (status %d): %s",
 			resp.StatusCode, string(respBody))
 	}
 	// Decode both reply shapes; whichever key is present wins, with the
 	// batch form taking precedence.
 	var apiResp struct {
 		Embeddings [][]float64 `json:"embeddings"`
 		Embedding  []float64   `json:"embedding"`
 	}
 	if err := json.NewDecoder(resp.Body).Decode(&apiResp); err != nil {
 		return nil, fmt.Errorf("ollama: failed to decode embed response: %w", err)
 	}
 	vector := apiResp.Embedding
 	if len(apiResp.Embeddings) > 0 {
 		vector = apiResp.Embeddings[0]
 	}
 	if len(vector) == 0 {
 		return nil, fmt.Errorf("ollama: embed response contained no embedding")
 	}
 	return &EmbeddingResponse{
 		Embedding: vector,
 	}, nil
 }
 // BuildToolDefsFromMap turns generic tool descriptions into ToolDefs.
 //
 // Each input map may provide "name" and "description" strings and a
 // "parameters" map whose "properties" entry maps a parameter name to a map
 // with "type", "description" and an optional boolean "required". Values of
 // an unexpected type are treated as absent. Every resulting ToolDef has type
 // "function" and an "object" parameter schema with a non-nil Properties map.
 // The result is nil when tools is empty.
 func BuildToolDefsFromMap(tools []map[string]interface{}) []ToolDef {
 	var defs []ToolDef
 	for _, spec := range tools {
 		toolName, _ := spec["name"].(string)
 		toolDesc, _ := spec["description"].(string)
 		schema := ToolFunctionParameters{
 			Type:       "object",
 			Properties: make(map[string]ToolProperty),
 		}
 		// Failed assertions leave nil maps; indexing and ranging over a
 		// nil map is safe and simply yields nothing.
 		params, _ := spec["parameters"].(map[string]interface{})
 		props, _ := params["properties"].(map[string]interface{})
 		for propName, rawProp := range props {
 			fields, isMap := rawProp.(map[string]interface{})
 			if !isMap {
 				continue
 			}
 			schema.Properties[propName] = ToolProperty{
 				Type:        toString(fields["type"]),
 				Description: toString(fields["description"]),
 			}
 			if isRequired(fields) {
 				schema.Required = append(schema.Required, propName)
 			}
 		}
 		defs = append(defs, ToolDef{
 			Type: "function",
 			Function: ToolFunction{
 				Name:        toolName,
 				Description: toolDesc,
 				Parameters:  schema,
 			},
 		})
 	}
 	return defs
 }
 // toString returns v when it holds a string and "" for nil or any other
 // dynamic type.
 func toString(v interface{}) string {
 	switch text := v.(type) {
 	case string:
 		return text
 	default:
 		return ""
 	}
 }
 // isRequired reports whether the property map p has a boolean "required"
 // entry set to true. A missing entry or a non-boolean value counts as false.
 func isRequired(p map[string]interface{}) bool {
 	if flag, isBool := p["required"].(bool); isBool {
 		return flag
 	}
 	return false
 }
--- a/pkg/llm/ollama_test.go
+++ b/pkg/llm/ollama_test.go
@ -0,0 +1,385 @@
 package llm
 import (
 	"context"
 	"encoding/json"
 	"net/http"
 	"net/http/httptest"
 	"strings"
 	"testing"
 	"time"
 )
 // ============================================================
 // Helper: create a mock Ollama server
 // ============================================================
 // mockOllamaHandler starts an httptest.Server that simulates the Ollama API.
 //
 // Only /api/chat and /api/embed are accepted. The JSON request body is
 // decoded into a map and passed to responseFunc, whose returned status code
 // and value (JSON-encoded) form the reply. The caller must Close the
 // returned server.
 //
 // The handler runs on the server's goroutine, not the test goroutine, so it
 // reports problems with t.Errorf and returns; t.Fatalf (FailNow) must only
 // be called from the goroutine running the test.
 func mockOllamaHandler(t *testing.T, responseFunc func(reqBody map[string]interface{}) (int, interface{})) *httptest.Server {
 	t.Helper()
 	return httptest.NewServer(http.HandlerFunc(func(w http.ResponseWriter, r *http.Request) {
 		// Verify request path
 		if r.URL.Path != "/api/chat" && r.URL.Path != "/api/embed" {
 			t.Errorf("unexpected path: %s", r.URL.Path)
 			w.WriteHeader(http.StatusNotFound)
 			return
 		}
 		// Decode request body
 		var reqBody map[string]interface{}
 		if err := json.NewDecoder(r.Body).Decode(&reqBody); err != nil {
 			t.Errorf("failed to decode request body: %v", err)
 			w.WriteHeader(http.StatusBadRequest)
 			return
 		}
 		status, resp := responseFunc(reqBody)
 		w.Header().Set("Content-Type", "application/json")
 		w.WriteHeader(status)
 		if err := json.NewEncoder(w).Encode(resp); err != nil {
 			t.Errorf("failed to encode response: %v", err)
 		}
 	}))
 }
 // ============================================================
 // NewOllamaClient Tests
 // ============================================================
 // TestNewOllamaClientDefaults checks the base URL and model that a client
 // built without options starts with.
 func TestNewOllamaClientDefaults(t *testing.T) {
 	client := NewOllamaClient()
 	if client == nil {
 		t.Fatal("NewOllamaClient() returned nil")
 	}
 	if got, want := client.baseURL, "http://localhost:11434"; got != want {
 		t.Errorf("expected default base URL 'http://localhost:11434', got %q", got)
 	}
 	if got, want := client.model, "gemma4:e4b"; got != want {
 		t.Errorf("expected default model 'gemma4:e4b', got %q", got)
 	}
 }
 // TestNewOllamaClientWithOptions checks that the base URL, model and timeout
 // options override the client's defaults.
 func TestNewOllamaClientWithOptions(t *testing.T) {
 	c := NewOllamaClient(
 		WithBaseURL("http://custom:11434"),
 		WithModel("codellama"),
 		// WithTimeout takes a time.Duration; a bare 60 would mean 60ns.
 		WithTimeout(60*time.Second),
 	)
 	if c.baseURL != "http://custom:11434" {
 		t.Errorf("expected base URL 'http://custom:11434', got %q", c.baseURL)
 	}
 	if c.model != "codellama" {
 		t.Errorf("expected model 'codellama', got %q", c.model)
 	}
 	if c.httpClient.Timeout != 60*time.Second {
 		t.Errorf("expected timeout 60s, got %v", c.httpClient.Timeout)
 	}
 }
 // ============================================================
 // Chat Tests
 // ============================================================
 func TestChat(t *testing.T) {
 	srv := mockOllamaHandler(t, func(reqBody map[string]interface{}) (int, interface{}) {
 		// Verify the request has the expected shape
 		if model, ok := reqBody["model"]; !ok || model != "gemma4:e4b" {
 			t.Errorf("expected model 'gemma4:e4b', got %v", model)
 		}
 		if stream, ok := reqBody["stream"]; !ok || stream != false {
 			t.Errorf("expected stream false, got %v", stream)
 		}
 		return http.StatusOK, OllamaChatResponse{
 			Model: "gemma4:e4b",
 			Message: Message{
 				Role:    "assistant",
 				Content: "Hello! How can I help you?",
 			},
 			Done: true,
 		}
 	})
 	defer srv.Close()
 	client := NewOllamaClient(WithBaseURL(srv.URL))
 	resp, err := client.Chat(context.Background(), []Message{
 		{Role: "user", Content: "Hello"},
 	})
 	if err != nil {
 		t.Fatalf("Chat failed: %v", err)
 	}
 	if resp.Content != "Hello! How can I help you?" {
 		t.Errorf("expected content 'Hello! How can I help you?', got %q", resp.Content)
 	}
 	if len(resp.ToolCalls) != 0 {
 		t.Errorf("expected no tool calls, got %d", len(resp.ToolCalls))
 	}
 }
 func TestChatWithToolCalls(t *testing.T) {
 	srv := mockOllamaHandler(t, func(reqBody map[string]interface{}) (int, interface{}) {
 		return http.StatusOK, OllamaToolCallResponse{
 			Model: "gemma4:e4b",
 			Message: OllamaToolMsg{
 				Role:    "assistant",
 				Content: "",
 				ToolCalls: []ToolCall{
 					{
 						ID:   "call-1",
 						Type: "function",
 						Function: FunctionCall{
 							Name:      "exec",
 							Arguments: `{"command":"ls -la"}`,
 						},
 					},
 				},
 			},
 			Done: true,
 		}
 	})
 	defer srv.Close()
 	client := NewOllamaClient(WithBaseURL(srv.URL))
 	resp, err := client.Chat(context.Background(), []Message{
 		{Role: "user", Content: "List files"},
 	})
 	if err != nil {
 		t.Fatalf("Chat failed: %v", err)
 	}
 	if len(resp.ToolCalls) != 1 {
 		t.Fatalf("expected 1 tool call, got %d", len(resp.ToolCalls))
 	}
 	if resp.ToolCalls[0].Function.Name != "exec" {
 		t.Errorf("expected tool name 'exec', got %q", resp.ToolCalls[0].Function.Name)
 	}
 	if resp.ToolCalls[0].Function.Arguments != `{"command":"ls -la"}` {
 		t.Errorf("unexpected arguments: %q", resp.ToolCalls[0].Function.Arguments)
 	}
 }
 // TestChatAPIError checks that a 500 reply makes Chat fail with an error
 // that mentions the status code.
 func TestChatAPIError(t *testing.T) {
 	failing := func(reqBody map[string]interface{}) (int, interface{}) {
 		payload := map[string]string{"error": "internal error"}
 		return http.StatusInternalServerError, payload
 	}
 	srv := mockOllamaHandler(t, failing)
 	defer srv.Close()
 	prompt := []Message{{Role: "user", Content: "Hello"}}
 	_, err := NewOllamaClient(WithBaseURL(srv.URL)).Chat(context.Background(), prompt)
 	if err == nil {
 		t.Fatal("expected error for API error response")
 	}
 	if msg := err.Error(); !strings.Contains(msg, "500") {
 		t.Errorf("expected error to contain status code, got: %v", err)
 	}
 }
 func TestChatContextCancellation(t *testing.T) {
 	ctx, cancel := context.WithCancel(context.Background())
 	cancel() // Cancel immediately
 	client := NewOllamaClient(WithBaseURL("http://localhost:11434"))
 	_, err := client.Chat(ctx, []Message{{Role: "user", Content: "Hello"}})
 	if err == nil {
 		t.Error("expected error for cancelled context")
 	}
 }
 // ============================================================
 // Stream Tests
 // ============================================================
 // TestStream checks that Stream hands every non-empty content chunk to the
 // handler, in order, and stops cleanly at the "done" object.
 func TestStream(t *testing.T) {
 	chunks := []string{"Hello", "!", " How", " can", " I", " help?"}
 	srv := httptest.NewServer(http.HandlerFunc(func(w http.ResponseWriter, r *http.Request) {
 		// This handler runs on the server's goroutine, so failures are
 		// reported with t.Error/t.Errorf followed by return; t.Fatal must
 		// only be called from the test goroutine.
 		if r.URL.Path != "/api/chat" {
 			t.Errorf("unexpected path: %s", r.URL.Path)
 			w.WriteHeader(http.StatusNotFound)
 			return
 		}
 		flusher, ok := w.(http.Flusher)
 		if !ok {
 			t.Error("expected http.Flusher")
 			w.WriteHeader(http.StatusInternalServerError)
 			return
 		}
 		w.Header().Set("Content-Type", "application/x-ndjson")
 		w.WriteHeader(http.StatusOK)
 		for _, chunk := range chunks {
 			resp := OllamaChatResponse{
 				Model: "gemma4:e4b",
 				Message: Message{
 					Role:    "assistant",
 					Content: chunk,
 				},
 				Done: false,
 			}
 			data, _ := json.Marshal(resp)
 			w.Write(append(data, '\n'))
 			flusher.Flush()
 		}
 		// Send done signal
 		doneResp := OllamaChatResponse{
 			Model: "gemma4:e4b",
 			Message: Message{
 				Role:    "assistant",
 				Content: "",
 			},
 			Done: true,
 		}
 		data, _ := json.Marshal(doneResp)
 		w.Write(append(data, '\n'))
 		flusher.Flush()
 	}))
 	defer srv.Close()
 	client := NewOllamaClient(WithBaseURL(srv.URL))
 	var received []string
 	err := client.Stream(context.Background(), []Message{{Role: "user", Content: "Hi"}},
 		func(chunk string) error {
 			received = append(received, chunk)
 			return nil
 		})
 	if err != nil {
 		t.Fatalf("Stream failed: %v", err)
 	}
 	if len(received) != len(chunks) {
 		t.Fatalf("expected %d chunks, got %d", len(chunks), len(received))
 	}
 	// The count alone would not catch reordered or corrupted chunks.
 	for i, want := range chunks {
 		if received[i] != want {
 			t.Errorf("chunk %d: expected %q, got %q", i, want, received[i])
 		}
 	}
 }
 // TestStreamHandlerError checks that an error returned by the stream handler
 // is propagated by Stream.
 func TestStreamHandlerError(t *testing.T) {
 	serveOneChunk := func(w http.ResponseWriter, r *http.Request) {
 		w.Header().Set("Content-Type", "application/x-ndjson")
 		w.WriteHeader(http.StatusOK)
 		first := OllamaChatResponse{Model: "gemma4:e4b", Done: false}
 		first.Message = Message{Role: "assistant", Content: "chunk"}
 		line, _ := json.Marshal(first)
 		w.Write(append(line, '\n'))
 		if flusher, canFlush := w.(http.Flusher); canFlush {
 			flusher.Flush()
 		}
 	}
 	srv := httptest.NewServer(http.HandlerFunc(serveOneChunk))
 	defer srv.Close()
 	failingHandler := func(chunk string) error {
 		return &streamError{msg: "handler error"}
 	}
 	prompt := []Message{{Role: "user", Content: "Hi"}}
 	err := NewOllamaClient(WithBaseURL(srv.URL)).Stream(context.Background(), prompt, failingHandler)
 	if err == nil {
 		t.Fatal("expected error from handler")
 	}
 	if msg := err.Error(); !strings.Contains(msg, "handler error") {
 		t.Errorf("expected 'handler error', got: %v", err)
 	}
 }
 // streamError is a minimal error type used by the stream tests.
 type streamError struct {
 	msg string
 }
 // Error returns the stored message.
 func (e *streamError) Error() string {
 	return e.msg
 }
 // ============================================================
 // Embed Tests
 // ============================================================
 // TestEmbed checks that Embed posts to /api/embed and returns the vector
 // contained in the server's reply.
 func TestEmbed(t *testing.T) {
 	srv := httptest.NewServer(http.HandlerFunc(func(w http.ResponseWriter, r *http.Request) {
 		if r.URL.Path != "/api/embed" {
 			t.Errorf("unexpected path: %s", r.URL.Path)
 			w.WriteHeader(http.StatusNotFound)
 			return
 		}
 		w.Header().Set("Content-Type", "application/json")
 		w.WriteHeader(http.StatusOK)
 		err := json.NewEncoder(w).Encode(OllamaEmbedResponse{
 			Embedding: []float64{0.1, 0.2, 0.3, 0.4, 0.5},
 		})
 		if err != nil {
 			t.Errorf("failed to encode response: %v", err)
 		}
 	}))
 	defer srv.Close()
 	client := NewOllamaClient(WithBaseURL(srv.URL))
 	resp, err := client.Embed(context.Background(), "test input")
 	if err != nil {
 		t.Fatalf("Embed failed: %v", err)
 	}
 	// Fatal rather than Error: the index below would panic on a short result.
 	if len(resp.Embedding) != 5 {
 		t.Fatalf("expected 5 embedding values, got %d", len(resp.Embedding))
 	}
 	if resp.Embedding[0] != 0.1 {
 		t.Errorf("expected first value 0.1, got %f", resp.Embedding[0])
 	}
 }
 // ============================================================
 // Tool Def Builder Tests
 // ============================================================
 // TestBuildToolDefsFromMap checks that a tool description is converted into
 // one ToolDef and that only properties flagged "required": true end up in
 // the Required list.
 func TestBuildToolDefsFromMap(t *testing.T) {
 	tools := []map[string]interface{}{
 		{
 			"name":        "exec",
 			"description": "Execute a shell command",
 			"parameters": map[string]interface{}{
 				"properties": map[string]interface{}{
 					"command": map[string]interface{}{
 						"type":        "string",
 						"description": "Command to run",
 						"required":    true,
 					},
 					"timeout": map[string]interface{}{
 						"type":        "number",
 						"description": "Timeout in seconds",
 						"required":    false,
 					},
 				},
 			},
 		},
 	}
 	defs := BuildToolDefsFromMap(tools)
 	if len(defs) != 1 {
 		t.Fatalf("expected 1 tool def, got %d", len(defs))
 	}
 	if defs[0].Function.Name != "exec" {
 		t.Errorf("expected name 'exec', got %q", defs[0].Function.Name)
 	}
 	// Fatal rather than Error: the index below would panic on an empty list.
 	if len(defs[0].Function.Parameters.Required) != 1 {
 		t.Fatalf("expected 1 required parameter, got %d", len(defs[0].Function.Parameters.Required))
 	}
 	if defs[0].Function.Parameters.Required[0] != "command" {
 		t.Errorf("expected required 'command', got %q", defs[0].Function.Parameters.Required[0])
 	}
 }
 // ============================================================
 // Mock LLM (for use by other tests)
 // ============================================================
 // MockLLM is a configurable mock implementation of the LLM interface for testing.
 //
 // Each method delegates to the matching function field when it is set and
 // otherwise falls back to a fixed canned reply.
 type MockLLM struct {
 	// ChatFunc, when non-nil, handles calls to Chat.
 	ChatFunc    func(ctx context.Context, messages []Message) (*Response, error)
 	// StreamFunc, when non-nil, handles calls to Stream.
 	StreamFunc  func(ctx context.Context, messages []Message, handler StreamHandler) error
 }
 // Chat delegates to ChatFunc when it is set; otherwise it returns a Response
 // whose content is "mock response".
 func (m *MockLLM) Chat(ctx context.Context, messages []Message) (*Response, error) {
 	if m.ChatFunc == nil {
 		canned := &Response{Content: "mock response"}
 		return canned, nil
 	}
 	return m.ChatFunc(ctx, messages)
 }
 // Stream delegates to StreamFunc when it is set; otherwise it calls handler
 // once with "mock stream response" and returns the handler's result.
 func (m *MockLLM) Stream(ctx context.Context, messages []Message, handler StreamHandler) error {
 	if m.StreamFunc == nil {
 		return handler("mock stream response")
 	}
 	return m.StreamFunc(ctx, messages, handler)
 }
--- a/pkg/llm/types.go
+++ b/pkg/llm/types.go
@ -0,0 +1,128 @@
 // Package llm provides the LLM integration layer for the Orca framework.
 //
 // It defines the LLM interface for interacting with language models,
 // the Ollama client implementation, and the shared types for chat
 // messages, tool calls, and streaming responses.
 package llm
 // Message represents a single message in a chat conversation.
 //
 // The Role field identifies the sender: "user", "assistant", "system",
 // or "tool". For tool results, ToolCallID links the result back to the
 // tool call that produced it.
 type Message struct {
 	// Role names the sender of the message.
 	Role       string `json:"role"`
 	// Content is the message text.
 	Content    string `json:"content"`
 	// ToolCallID is left out of the JSON encoding when empty.
 	ToolCallID string `json:"tool_call_id,omitempty"`
 }
 // ToolCall represents a function calling request from the LLM.
 //
 // Ollama returns tool calls in the format expected by OpenAI-compatible
 // APIs: each call has a unique ID, a type ("function"), and a Function
 // object containing the tool name and JSON-encoded arguments.
 type ToolCall struct {
 	// ID identifies this call.
 	ID       string       `json:"id"`
 	// Type is the kind of call, e.g. "function".
 	Type     string       `json:"type"`
 	// Function carries the tool name and its arguments.
 	Function FunctionCall `json:"function"`
 }
 // FunctionCall holds the name and arguments for a tool invocation.
 //
 // Arguments is a raw JSON string that should be unmarshalled into
 // the tool's expected argument shape.
 //
 // NOTE(review): because Arguments is a Go string, decoding this type
 // directly with encoding/json only succeeds when the wire value is a JSON
 // string. Confirm against the Ollama API whether "arguments" can arrive as
 // a JSON object instead.
 type FunctionCall struct {
 	// Name is the name of the tool to invoke.
 	Name      string `json:"name"`
 	Arguments string `json:"arguments"` // JSON-encoded arguments
 }
 // Response represents a complete (non-streaming) response from an LLM.
 //
 // If the LLM decides to invoke tools, Content may be empty and ToolCalls
 // will contain one or more entries. The caller should execute each tool
 // call and feed the results back to the LLM.
 type Response struct {
 	// Content is the text of the model's reply.
 	Content   string     `json:"content"`
 	// ToolCalls lists the requested tool invocations; it is left out of the
 	// JSON encoding when empty.
 	ToolCalls []ToolCall `json:"tool_calls,omitempty"`
 }
 // StreamHandler is a callback function for processing streaming response chunks.
 //
 // Each chunk is a partial string of the ongoing response. The handler is
 // called sequentially for each chunk. Returning an error stops the stream;
 // OllamaClient.Stream returns that error to its caller unchanged.
 type StreamHandler func(chunk string) error
 // EmbeddingResponse holds the result of an embedding request.
 type EmbeddingResponse struct {
 	// Embedding is the vector computed for the input text.
 	Embedding []float64 `json:"embedding"`
 }
 // OllamaChatRequest is the request body sent to Ollama's /api/chat endpoint.
 type OllamaChatRequest struct {
 	// Model is the name of the model that should answer.
 	Model    string    `json:"model"`
 	// Messages is the conversation so far.
 	Messages []Message `json:"messages"`
 	// Stream selects a streamed reply (true) or a single reply (false).
 	Stream   bool      `json:"stream"`
 	// Tools lists the tools offered to the model; it is left out of the
 	// JSON encoding when empty.
 	Tools    []ToolDef `json:"tools,omitempty"`
 }
 // OllamaChatResponse is the response body from Ollama's /api/chat endpoint.
 //
 // OllamaClient.Stream decodes each line of a streamed reply into this type.
 type OllamaChatResponse struct {
 	// Model is the model name reported by the server.
 	Model     string    `json:"model"`
 	// CreatedAt is the creation timestamp, kept as the string sent by the server.
 	CreatedAt string    `json:"created_at"`
 	// Message is the assistant message, or one chunk of it when streaming.
 	Message   Message   `json:"message"`
 	// Done marks the final object of a reply; Stream stops reading once it is true.
 	Done      bool      `json:"done"`
 }
 // OllamaToolCallResponse is the wire format Ollama returns for tool calls.
 //
 // It has the same fields as OllamaChatResponse, except that Message is an
 // OllamaToolMsg and can therefore carry tool calls.
 type OllamaToolCallResponse struct {
 	// Model is the model name reported by the server.
 	Model     string          `json:"model"`
 	// CreatedAt is the creation timestamp, kept as the string sent by the server.
 	CreatedAt string          `json:"created_at"`
 	// Message is the assistant message including any tool calls.
 	Message   OllamaToolMsg   `json:"message"`
 	// Done marks the final object of a reply.
 	Done      bool            `json:"done"`
 }
 // OllamaToolMsg wraps the tool_calls field in Ollama's response.
 type OllamaToolMsg struct {
 	// Role names the sender of the message.
 	Role      string     `json:"role"`
 	// Content is the message text; it may be empty when tools are called.
 	Content   string     `json:"content"`
 	// ToolCalls lists the requested tool invocations; it is left out of the
 	// JSON encoding when empty.
 	ToolCalls []ToolCall `json:"tool_calls,omitempty"`
 }
 // ToolDef describes a tool that the LLM may call, in the format
 // expected by Ollama's function calling API.
 type ToolDef struct {
 	// Type is the kind of tool; BuildToolDefsFromMap always sets "function".
 	Type     string       `json:"type"`
 	// Function describes the callable function itself.
 	Function ToolFunction `json:"function"`
 }
 // ToolFunction describes a function available to the LLM.
 type ToolFunction struct {
 	// Name is the function name the model uses to call the tool.
 	Name        string                   `json:"name"`
 	// Description explains what the function does.
 	Description string                   `json:"description"`
 	// Parameters is the schema of the function's arguments.
 	Parameters  ToolFunctionParameters   `json:"parameters"`
 }
 // ToolFunctionParameters is the JSON Schema for a tool's parameters.
 type ToolFunctionParameters struct {
 	// Type is the schema type; BuildToolDefsFromMap always sets "object".
 	Type       string                  `json:"type"`
 	// Required names the mandatory parameters; it is left out of the JSON
 	// encoding when empty.
 	Required   []string                `json:"required,omitempty"`
 	// Properties maps each parameter name to its description.
 	Properties map[string]ToolProperty `json:"properties"`
 }
 // ToolProperty describes a single parameter of a tool function.
 type ToolProperty struct {
 	// Type is the parameter's type name, e.g. "string" or "number".
 	Type        string   `json:"type"`
 	// Description explains the parameter.
 	Description string   `json:"description"`
 	// Enum optionally lists allowed values; it is left out of the JSON
 	// encoding when empty. BuildToolDefsFromMap does not populate it.
 	Enum        []string `json:"enum,omitempty"`
 }
 // OllamaEmbedRequest is the request body for Ollama's /api/embed endpoint.
 type OllamaEmbedRequest struct {
 	// Model is the name of the model that computes the embedding.
 	Model string `json:"model"`
 	// Input is the text to embed.
 	Input string `json:"input"`
 }
 // OllamaEmbedResponse is the response body from Ollama's /api/embed endpoint.
 //
 // NOTE(review): only a single vector under the "embedding" key is modelled
 // here. Confirm against the Ollama API reference whether /api/embed returns
 // its result under "embeddings" (a list of vectors) instead.
 type OllamaEmbedResponse struct {
 	// Embedding is the vector returned by the server.
 	Embedding []float64 `json:"embedding"`
 }
--- a/pkg/plugin/plugin.go
+++ b/pkg/plugin/plugin.go
@ -0,0 +1,58 @@
 // Package plugin defines the plugin system for the Orca framework.
 //
 // All extensions to the framework (skills, tools, LLM drivers, etc.)
 // are implemented as plugins that implement the Plugin interface.
 // The kernel manages plugin lifecycle: load, init, start, stop, shutdown.
 package plugin
 import "github.com/orca/orca/pkg/bus"
 // PluginState represents the current lifecycle state of a plugin.
 //
 // The zero value is StateUnknown, which Registry.State also reports for
 // names that are not registered. Registry.Register assigns StateRegistered;
 // every other state is set by callers through Registry.SetState.
 type PluginState int
 // Lifecycle states, numbered from zero in declaration order.
 const (
 	StateUnknown     PluginState = iota
 	StateRegistered
 	StateInitialized
 	StateRunning
 	StateStopped
 	StateError
 )
 // String returns the lower-case name of the state. Values outside the
 // declared constants are reported as "unknown".
 func (ps PluginState) String() string {
 	labels := [...]string{
 		StateUnknown:     "unknown",
 		StateRegistered:  "registered",
 		StateInitialized: "initialized",
 		StateRunning:     "running",
 		StateStopped:     "stopped",
 		StateError:       "error",
 	}
 	if ps < 0 || int(ps) >= len(labels) {
 		return "unknown"
 	}
 	return labels[ps]
 }
 // PluginHost is the interface that the kernel provides to plugins.
 //
 // Plugins receive a PluginHost reference during Init() to interact
 // with the framework: publishing/subscribing to messages, discovering
 // other plugins, and accessing shared resources.
 type PluginHost interface {
 	// Bus returns the message bus used for publishing and subscribing.
 	Bus() bus.MessageBus
 	// GetPlugin looks up a plugin by name; the boolean reports whether it
 	// was found.
 	GetPlugin(name string) (Plugin, bool)
 	// ListPlugins returns the plugins known to the host.
 	ListPlugins() []Plugin
 }
 // Plugin defines the interface that all Orca plugins must implement.
 type Plugin interface {
 	// Name returns the plugin's name; Registry uses it as the unique
 	// registration key.
 	Name() string
 	// Version returns the plugin's version string.
 	Version() string
 	// Init prepares the plugin and hands it the host it can use to reach
 	// the rest of the framework.
 	Init(host PluginHost) error
 	// Shutdown releases the plugin's resources.
 	Shutdown() error
 }
--- a/pkg/plugin/registry.go
+++ b/pkg/plugin/registry.go
@ -0,0 +1,100 @@
 package plugin
 import (
 	"fmt"
 	"sync"
 )
 // Registry is a thread-safe map that manages plugin registration.
 //
 // Use NewRegistry to create one: the zero value has nil maps and Register
 // would panic when writing to them.
 type Registry struct {
 	// mu guards plugins and states.
 	mu      sync.RWMutex
 	// plugins maps a plugin name to the registered plugin.
 	plugins map[string]Plugin
 	// states maps a plugin name to its lifecycle state.
 	states  map[string]PluginState
 }
 // NewRegistry returns an empty registry with its internal maps initialised
 // and ready for use.
 func NewRegistry() *Registry {
 	reg := new(Registry)
 	reg.plugins = map[string]Plugin{}
 	reg.states = map[string]PluginState{}
 	return reg
 }
 // Register adds a plugin to the registry under the name reported by
 // p.Name() and marks it as StateRegistered.
 //
 // It returns an error, and leaves the registry unchanged, when p is nil or
 // when a plugin with the same name is already registered. A nil plugin
 // previously caused a panic on the p.Name() call.
 func (r *Registry) Register(p Plugin) error {
 	if p == nil {
 		return fmt.Errorf("cannot register a nil plugin")
 	}
 	r.mu.Lock()
 	defer r.mu.Unlock()
 	name := p.Name()
 	if _, exists := r.plugins[name]; exists {
 		return fmt.Errorf("plugin %q is already registered", name)
 	}
 	r.plugins[name] = p
 	r.states[name] = StateRegistered
 	return nil
 }
 // Unregister drops the named plugin together with its recorded state. It
 // returns an error when no plugin is registered under that name.
 func (r *Registry) Unregister(name string) error {
 	r.mu.Lock()
 	defer r.mu.Unlock()
 	if _, registered := r.plugins[name]; registered {
 		delete(r.plugins, name)
 		delete(r.states, name)
 		return nil
 	}
 	return fmt.Errorf("plugin %q is not registered", name)
 }
 // Get looks up the plugin registered under name. The boolean reports whether
 // such a plugin exists.
 func (r *Registry) Get(name string) (Plugin, bool) {
 	r.mu.RLock()
 	found, present := r.plugins[name]
 	r.mu.RUnlock()
 	return found, present
 }
 // List returns a new slice holding every registered plugin. The order
 // follows map iteration and is therefore unspecified.
 func (r *Registry) List() []Plugin {
 	r.mu.RLock()
 	defer r.mu.RUnlock()
 	snapshot := make([]Plugin, len(r.plugins))
 	next := 0
 	for _, registered := range r.plugins {
 		snapshot[next] = registered
 		next++
 	}
 	return snapshot
 }
 // State reports the lifecycle state recorded for the named plugin, or
 // StateUnknown when no state is recorded under that name.
 func (r *Registry) State(name string) PluginState {
 	r.mu.RLock()
 	defer r.mu.RUnlock()
 	current, known := r.states[name]
 	if !known {
 		return StateUnknown
 	}
 	return current
 }
 // SetState records a new lifecycle state for the named plugin. Names that
 // are not registered are ignored.
 func (r *Registry) SetState(name string, state PluginState) {
 	r.mu.Lock()
 	defer r.mu.Unlock()
 	_, registered := r.plugins[name]
 	if !registered {
 		return
 	}
 	r.states[name] = state
 }
 // Count reports how many plugins are currently registered.
 func (r *Registry) Count() int {
 	r.mu.RLock()
 	total := len(r.plugins)
 	r.mu.RUnlock()
 	return total
 }
--- a/pkg/plugin/registry_test.go
+++ b/pkg/plugin/registry_test.go
@ -0,0 +1,256 @@
 package plugin
 import (
 	"errors"
 	"testing"
 	"github.com/orca/orca/pkg/bus"
 )
 // mockPlugin is a Plugin implementation for tests. Init and Shutdown call
 // the optional hooks and succeed when no hook is set.
 type mockPlugin struct {
 	name    string
 	version string
 	initFn  func(host PluginHost) error
 	closeFn func() error
 }
 // Name returns the configured plugin name.
 func (m *mockPlugin) Name() string {
 	return m.name
 }
 // Version returns the configured version string.
 func (m *mockPlugin) Version() string {
 	return m.version
 }
 // Init forwards to initFn when one is set.
 func (m *mockPlugin) Init(host PluginHost) error {
 	if m.initFn == nil {
 		return nil
 	}
 	return m.initFn(host)
 }
 // Shutdown forwards to closeFn when one is set.
 func (m *mockPlugin) Shutdown() error {
 	if m.closeFn == nil {
 		return nil
 	}
 	return m.closeFn()
 }
 // TestRegistryNew checks that a fresh registry is non-nil and empty.
 func TestRegistryNew(t *testing.T) {
 	reg := NewRegistry()
 	if reg == nil {
 		t.Fatal("NewRegistry() returned nil")
 	}
 	count := reg.Count()
 	if count != 0 {
 		t.Errorf("expected empty registry, got %d plugins", count)
 	}
 }
 // TestRegistryRegister checks that registering a plugin succeeds and is
 // reflected in the plugin count.
 func TestRegistryRegister(t *testing.T) {
 	reg := NewRegistry()
 	if err := reg.Register(&mockPlugin{name: "test", version: "1.0.0"}); err != nil {
 		t.Fatalf("Register failed: %v", err)
 	}
 	count := reg.Count()
 	if count != 1 {
 		t.Errorf("expected 1 plugin, got %d", count)
 	}
 }
 // TestRegistryRegisterDuplicate checks that a second plugin with an already
 // registered name is rejected.
 func TestRegistryRegisterDuplicate(t *testing.T) {
 	reg := NewRegistry()
 	first := &mockPlugin{name: "test", version: "1.0.0"}
 	second := &mockPlugin{name: "test", version: "2.0.0"}
 	reg.Register(first)
 	if err := reg.Register(second); err == nil {
 		t.Error("expected error registering duplicate plugin")
 	}
 }
 // TestRegistryGet checks that a registered plugin can be looked up by name.
 func TestRegistryGet(t *testing.T) {
 	reg := NewRegistry()
 	reg.Register(&mockPlugin{name: "test", version: "1.0.0"})
 	found, present := reg.Get("test")
 	if !present {
 		t.Fatal("Get returned not found")
 	}
 	if name := found.Name(); name != "test" {
 		t.Errorf("expected name 'test', got %q", name)
 	}
 }
 // TestRegistryGetNotFound checks that looking up an unregistered name
 // reports "not found".
 func TestRegistryGetNotFound(t *testing.T) {
 	if _, present := NewRegistry().Get("nonexistent"); present {
 		t.Error("expected false for nonexistent plugin")
 	}
 }
 // TestRegistryUnregister checks that removing a registered plugin succeeds
 // and leaves the registry empty.
 func TestRegistryUnregister(t *testing.T) {
 	reg := NewRegistry()
 	reg.Register(&mockPlugin{name: "test", version: "1.0.0"})
 	if err := reg.Unregister("test"); err != nil {
 		t.Fatalf("Unregister failed: %v", err)
 	}
 	remaining := reg.Count()
 	if remaining != 0 {
 		t.Errorf("expected 0 plugins, got %d", remaining)
 	}
 }
 // TestRegistryUnregisterNotFound checks that removing an unknown name is
 // reported as an error.
 func TestRegistryUnregisterNotFound(t *testing.T) {
 	if err := NewRegistry().Unregister("nonexistent"); err == nil {
 		t.Error("expected error unregistering nonexistent plugin")
 	}
 }
 // TestRegistryList checks that List returns every registered plugin,
 // regardless of order.
 func TestRegistryList(t *testing.T) {
 	wanted := []string{"a", "b", "c"}
 	reg := NewRegistry()
 	for _, name := range wanted {
 		reg.Register(&mockPlugin{name: name, version: "1.0.0"})
 	}
 	listed := reg.List()
 	if len(listed) != 3 {
 		t.Errorf("expected 3 plugins, got %d", len(listed))
 	}
 	seen := make(map[string]bool)
 	for i := range listed {
 		seen[listed[i].Name()] = true
 	}
 	for _, name := range wanted {
 		if seen[name] {
 			continue
 		}
 		t.Errorf("missing plugin %q in list", name)
 	}
 }
 // TestRegistryState checks the initial state of a registered plugin and that
 // SetState changes it.
 func TestRegistryState(t *testing.T) {
 	reg := NewRegistry()
 	reg.Register(&mockPlugin{name: "test", version: "1.0.0"})
 	initial := reg.State("test")
 	if initial != StateRegistered {
 		t.Errorf("expected StateRegistered, got %s", initial)
 	}
 	reg.SetState("test", StateRunning)
 	updated := reg.State("test")
 	if updated != StateRunning {
 		t.Errorf("expected StateRunning, got %s", updated)
 	}
 }
 // TestRegistryStateUnknown checks that an unregistered name reports
 // StateUnknown.
 func TestRegistryStateUnknown(t *testing.T) {
 	state := NewRegistry().State("nonexistent")
 	if state != StateUnknown {
 		t.Errorf("expected StateUnknown for nonexistent, got %s", state)
 	}
 }
 // TestRegistrySetStateNoOp checks that SetState on an unregistered name does
 // not create a plugin entry.
 func TestRegistrySetStateNoOp(t *testing.T) {
 	reg := NewRegistry()
 	reg.SetState("nonexistent", StateRunning)
 	if reg.Count() != 0 {
 		t.Errorf("SetState should not add plugins")
 	}
 }
 // TestPluginStateString checks the text form of every declared state and of
 // an out-of-range value.
 func TestPluginStateString(t *testing.T) {
 	type stateCase struct {
 		state PluginState
 		want  string
 	}
 	cases := []stateCase{
 		{state: StateUnknown, want: "unknown"},
 		{state: StateRegistered, want: "registered"},
 		{state: StateInitialized, want: "initialized"},
 		{state: StateRunning, want: "running"},
 		{state: StateStopped, want: "stopped"},
 		{state: StateError, want: "error"},
 		{state: PluginState(99), want: "unknown"},
 	}
 	for i := range cases {
 		tc := cases[i]
 		got := tc.state.String()
 		if got == tc.want {
 			continue
 		}
 		t.Errorf("PluginState(%d).String() = %q, want %q", tc.state, got, tc.want)
 	}
 }
 // TestRegistryConcurrent exercises the registry from two goroutines at once;
 // it is mainly useful under the race detector.
 func TestRegistryConcurrent(t *testing.T) {
 	reg := NewRegistry()
 	finished := make(chan struct{}, 2)
 	// churn registers, inspects and unregisters one plugin name 100 times.
 	churn := func(name string, inspect func()) {
 		for round := 0; round < 100; round++ {
 			reg.Register(&mockPlugin{name: name, version: "1.0.0"})
 			inspect()
 			reg.Unregister(name)
 		}
 		finished <- struct{}{}
 	}
 	go churn("a", func() {
 		reg.Get("a")
 	})
 	go churn("b", func() {
 		reg.List()
 		reg.State("b")
 	})
 	for waiting := 2; waiting > 0; waiting-- {
 		<-finished
 	}
 }
 // mockPluginHost is a PluginHost stub for tests: it exposes no bus and no
 // plugins.
 type mockPluginHost struct{}
 // Bus returns nil; the stub has no message bus.
 func (m *mockPluginHost) Bus() bus.MessageBus {
 	return nil
 }
 // GetPlugin never finds a plugin.
 func (m *mockPluginHost) GetPlugin(name string) (Plugin, bool) {
 	return nil, false
 }
 // ListPlugins returns nil; the stub knows no plugins.
 func (m *mockPluginHost) ListPlugins() []Plugin {
 	return nil
 }
 func TestPluginInitAndShutdown(t *testing.T) {
 	var initCalled, shutdownCalled bool
 	p := &mockPlugin{
 		name:    "test",
 		version: "1.0.0",
 		initFn: func(host PluginHost) error {
 			initCalled = true
 			if host == nil {
 				return errors.New("host is nil")
 			}
 			return nil
 		},
 		closeFn: func() error {
 			shutdownCalled = true
 			return nil
 		},
 	}
 	host := &mockPluginHost{}
 	if err := p.Init(host); err != nil {
 		t.Fatalf("Init failed: %v", err)
 	}
 	if !initCalled {
 		t.Error("Init function was not called")
 	}
 	if err := p.Shutdown(); err != nil {
 		t.Fatalf("Shutdown failed: %v", err)
 	}
 	if !shutdownCalled {
 		t.Error("Shutdown function was not called")
 	}
 }
--- a/pkg/sandbox/process.go
+++ b/pkg/sandbox/process.go
@ -0,0 +1,246 @@
 package sandbox
 import (
 	"bytes"
 	"context"
 	"fmt"
 	"io"
 	"os"
 	"os/exec"
 	"path/filepath"
 	"sync"
 )
 const (
 	// DefaultOutputLimit is the maximum number of bytes captured from each of
 	// stdout and stderr (64 KB). It is also the fallback used when a sandbox's
 	// OutputLimit is zero or negative.
 	DefaultOutputLimit = 64 * 1024
 	// DefaultWorkingDir is the working directory NewProcessSandbox assigns to
 	// sandboxed commands.
 	DefaultWorkingDir = "/tmp/orca/sandbox"
 )
 // AllowedEnvVars is the default whitelist of environment variables accessible
 // inside the sandbox. It is used whenever ProcessSandbox.EnvWhitelist is nil;
 // only variables named here that are actually set in the parent process are
 // passed through to the child.
 var AllowedEnvVars = []string{
 	"HOME",
 	"USER",
 	"PATH",
 	"LANG",
 	"SHELL",
 	"TMPDIR",
 	"ORCA_HOME",
 }
 // ProcessSandbox is a Sandbox implementation that uses os/exec to run commands
 // as child processes with a fixed working directory, a filtered environment
 // and capped output capture.
 type ProcessSandbox struct {
 	// WorkingDir is the directory in which commands execute. Execute creates
 	// it (including parents) if it does not exist.
 	WorkingDir string
 	// OutputLimit is the maximum bytes to capture from stdout and from stderr
 	// (each stream has its own budget). Values <= 0 fall back to
 	// DefaultOutputLimit.
 	OutputLimit int
 	// EnvWhitelist controls which environment variables are passed to child processes.
 	// If nil, AllowedEnvVars is used. If empty, no env vars are passed.
 	EnvWhitelist []string
 }
 // NewProcessSandbox returns a ProcessSandbox configured with the package
 // defaults: DefaultWorkingDir, DefaultOutputLimit, and a nil EnvWhitelist
 // (which means AllowedEnvVars is applied).
 func NewProcessSandbox() *ProcessSandbox {
 	sb := new(ProcessSandbox)
 	sb.WorkingDir = DefaultWorkingDir
 	sb.OutputLimit = DefaultOutputLimit
 	sb.EnvWhitelist = nil // nil selects AllowedEnvVars
 	return sb
 }
 // Execute runs cmd with args as a child process inside the sandbox.
 //
 // The working directory is created if missing, the child's environment is
 // reduced to the configured whitelist, and stdout/stderr are each captured up
 // to the effective output limit. Output beyond the limit is read and thrown
 // away so that a chatty child never blocks on a full pipe.
 //
 // A non-zero exit status is not an error: it is reported through
 // Result.ExitCode. An error is returned when the working directory or pipes
 // cannot be set up, the command cannot be started, the context is done by the
 // time the command has been waited for, or reading the output fails.
 func (ps *ProcessSandbox) Execute(ctx context.Context, cmd string, args ...string) (*Result, error) {
 	// Ensure working directory exists
 	if err := os.MkdirAll(ps.WorkingDir, 0755); err != nil {
 		return nil, fmt.Errorf("sandbox: failed to create working directory %q: %w", ps.WorkingDir, err)
 	}
 	// Build the command with the restricted directory and environment.
 	c := exec.CommandContext(ctx, cmd, args...)
 	c.Dir = ps.WorkingDir
 	c.Env = ps.buildEnv()
 	// Capture stdout and stderr with size limits
 	stdoutBuf := newLimitedBuffer(ps.outputLimit())
 	stderrBuf := newLimitedBuffer(ps.outputLimit())
 	stdoutPipe, err := c.StdoutPipe()
 	if err != nil {
 		return nil, fmt.Errorf("sandbox: failed to create stdout pipe: %w", err)
 	}
 	stderrPipe, err := c.StderrPipe()
 	if err != nil {
 		return nil, fmt.Errorf("sandbox: failed to create stderr pipe: %w", err)
 	}
 	// Start the command
 	if err := c.Start(); err != nil {
 		return nil, fmt.Errorf("sandbox: failed to start command: %w", err)
 	}
 	// capture copies src into dst. If dst signals that its limit was reached
 	// (io.ErrShortWrite), the rest of src is drained into io.Discard; without
 	// this the child would block writing to a pipe nobody reads and Wait
 	// below would hang until the context expires.
 	capture := func(dst *limitedBuffer, src io.Reader, stream string) error {
 		_, copyErr := io.Copy(dst, src)
 		if copyErr == io.ErrShortWrite {
 			_, copyErr = io.Copy(io.Discard, src)
 		}
 		if copyErr != nil && copyErr != io.EOF {
 			return fmt.Errorf("sandbox: %s read error: %w", stream, copyErr)
 		}
 		return nil
 	}
 	// Read stdout and stderr concurrently; both reads must finish before Wait,
 	// which closes the pipes.
 	var readStdout, readStderr error
 	var wg syncWaitGroup
 	wg.Add(2)
 	go func() {
 		defer wg.Done()
 		readStdout = capture(stdoutBuf, stdoutPipe, "stdout")
 	}()
 	go func() {
 		defer wg.Done()
 		readStderr = capture(stderrBuf, stderrPipe, "stderr")
 	}()
 	wg.Wait()
 	// Wait for the command to finish
 	exitCode := 0
 	if waitErr := c.Wait(); waitErr != nil {
 		// Check if the process was killed due to context cancellation (timeout)
 		if ctx.Err() != nil {
 			return nil, fmt.Errorf("sandbox: command timed out: %w", ctx.Err())
 		}
 		// Anything other than a plain exit status is a genuine failure.
 		exitErr, ok := waitErr.(*exec.ExitError)
 		if !ok {
 			return nil, waitErr
 		}
 		exitCode = exitErr.ExitCode()
 	}
 	// Command errors were handled above; now surface read errors, stdout first.
 	if readStdout != nil {
 		return nil, readStdout
 	}
 	if readStderr != nil {
 		return nil, readStderr
 	}
 	return &Result{
 		Stdout:   stdoutBuf.String(),
 		Stderr:   stderrBuf.String(),
 		ExitCode: exitCode,
 	}, nil
 }
 // buildEnv returns the KEY=value list handed to the child process. It looks
 // up every name in the effective whitelist (EnvWhitelist, or AllowedEnvVars
 // when EnvWhitelist is nil) and keeps only those set in the parent process.
 // The result is never nil, so an empty whitelist yields an empty environment.
 func (ps *ProcessSandbox) buildEnv() []string {
 	keys := AllowedEnvVars
 	if ps.EnvWhitelist != nil {
 		keys = ps.EnvWhitelist
 	}
 	out := make([]string, 0, len(keys))
 	for i := range keys {
 		val, present := os.LookupEnv(keys[i])
 		if !present {
 			continue
 		}
 		out = append(out, keys[i]+"="+val)
 	}
 	return out
 }
 // outputLimit reports the capture budget actually in effect: the configured
 // OutputLimit when it is positive, DefaultOutputLimit otherwise.
 func (ps *ProcessSandbox) outputLimit() int {
 	if ps.OutputLimit > 0 {
 		return ps.OutputLimit
 	}
 	return DefaultOutputLimit
 }
 // WorkingDirPath resolves WorkingDir to an absolute path. If the path cannot
 // be made absolute, WorkingDir is returned unchanged.
 func (ps *ProcessSandbox) WorkingDirPath() string {
 	if resolved, err := filepath.Abs(ps.WorkingDir); err == nil {
 		return resolved
 	}
 	return ps.WorkingDir
 }
 // ---------------------------------------------------------------------------
 // limitedBuffer — a writer that keeps at most MaxSize bytes and silently
 // discards everything after that.
 // Uses a named field (not embedded) to avoid promoting bytes.Buffer.ReadFrom
 // which would bypass the size limit when used with io.Copy.
 // ---------------------------------------------------------------------------
 type limitedBuffer struct {
 	buf     bytes.Buffer // retained prefix of everything written
 	MaxSize int          // maximum number of bytes retained in buf
 }
 // newLimitedBuffer returns an empty limitedBuffer that retains up to maxSize bytes.
 func newLimitedBuffer(maxSize int) *limitedBuffer {
 	return &limitedBuffer{MaxSize: maxSize}
 }
 // Write stores as much of p as still fits under MaxSize and drops the rest.
 //
 // It always reports len(p) bytes written, including on the call that crosses
 // the limit. Reporting a short count there would make io.Copy abort with
 // io.ErrShortWrite and stop reading its source; when the source is a child
 // process pipe, the child would then block once the pipe fills up.
 func (lb *limitedBuffer) Write(p []byte) (int, error) {
 	total := len(p)
 	remaining := lb.MaxSize - lb.buf.Len()
 	if remaining <= 0 {
 		return total, nil // limit already reached: drop everything
 	}
 	if total > remaining {
 		p = p[:remaining] // keep only the part that fits
 	}
 	if _, err := lb.buf.Write(p); err != nil {
 		return 0, err
 	}
 	return total, nil
 }
 // String returns the retained bytes as a string.
 func (lb *limitedBuffer) String() string {
 	return lb.buf.String()
 }
 // Len returns the number of bytes currently retained.
 func (lb *limitedBuffer) Len() int {
 	return lb.buf.Len()
 }
 // ---------------------------------------------------------------------------
 // syncWaitGroup — a thin wrapper around sync.WaitGroup.
 //
 // The zero value is ready to use. Add may be called any number of times and
 // the counts accumulate; Wait blocks until Done has been called once for
 // every unit added.
 // ---------------------------------------------------------------------------
 type syncWaitGroup struct {
 	inner sync.WaitGroup
 }
 // Add registers n more pending Done calls.
 func (wg *syncWaitGroup) Add(n int) {
 	wg.inner.Add(n)
 }
 // Done marks one pending unit as finished.
 func (wg *syncWaitGroup) Done() {
 	wg.inner.Done()
 }
 // Wait blocks until every added unit has been marked Done. It returns
 // immediately when nothing was added.
 func (wg *syncWaitGroup) Wait() {
 	wg.inner.Wait()
 }
 // Compile-time check that *ProcessSandbox implements the Sandbox interface.
 var _ Sandbox = (*ProcessSandbox)(nil)
--- a/pkg/sandbox/process_test.go
+++ b/pkg/sandbox/process_test.go
@ -0,0 +1,212 @@
 package sandbox
 import (
 	"context"
 	"os"
 	"path/filepath"
 	"strings"
 	"testing"
 	"time"
 )
 // TestNewProcessSandbox verifies that the constructor applies the package defaults.
 func TestNewProcessSandbox(t *testing.T) {
 	sb := NewProcessSandbox()
 	if sb == nil {
 		t.Fatal("NewProcessSandbox() returned nil")
 	}
 	if got := sb.WorkingDir; got != DefaultWorkingDir {
 		t.Errorf("expected WorkingDir %q, got %q", DefaultWorkingDir, got)
 	}
 	if got := sb.OutputLimit; got != DefaultOutputLimit {
 		t.Errorf("expected OutputLimit %d, got %d", DefaultOutputLimit, got)
 	}
 }
 // TestExecuteEcho runs a plain echo and checks its exit code and stdout.
 func TestExecuteEcho(t *testing.T) {
 	sb := NewProcessSandbox()
 	res, err := sb.Execute(context.Background(), "echo", "hello", "world")
 	if err != nil {
 		t.Fatalf("Execute failed: %v", err)
 	}
 	if code := res.ExitCode; code != 0 {
 		t.Errorf("expected exit code 0, got %d", code)
 	}
 	if out := strings.TrimSpace(res.Stdout); out != "hello world" {
 		t.Errorf("expected stdout 'hello world', got %q", res.Stdout)
 	}
 }
 // TestExecuteWithArgs checks that arguments reach the child unmodified by
 // running a small shell script passed via "sh -c".
 func TestExecuteWithArgs(t *testing.T) {
 	sb := NewProcessSandbox()
 	res, err := sb.Execute(context.Background(), "sh", "-c", "echo 'arg1 arg2'")
 	if err != nil {
 		t.Fatalf("Execute failed: %v", err)
 	}
 	if code := res.ExitCode; code != 0 {
 		t.Errorf("expected exit code 0, got %d", code)
 	}
 	if out := strings.TrimSpace(res.Stdout); out != "arg1 arg2" {
 		t.Errorf("expected stdout 'arg1 arg2', got %q", res.Stdout)
 	}
 }
 // TestExecuteNonZeroExit checks that a non-zero exit status is reported via
 // Result.ExitCode rather than as an error.
 func TestExecuteNonZeroExit(t *testing.T) {
 	sb := NewProcessSandbox()
 	res, err := sb.Execute(context.Background(), "sh", "-c", "exit 42")
 	if err != nil {
 		t.Fatalf("Execute should not error on non-zero exit: %v", err)
 	}
 	if code := res.ExitCode; code != 42 {
 		t.Errorf("expected exit code 42, got %d", code)
 	}
 }
 // TestExecuteCommandNotFound checks that launching a missing binary fails.
 func TestExecuteCommandNotFound(t *testing.T) {
 	sb := NewProcessSandbox()
 	if _, err := sb.Execute(context.Background(), "nonexistent-command-12345"); err == nil {
 		t.Fatal("expected error for nonexistent command")
 	}
 }
 // TestExecuteTimeout runs a long sleep under a 50ms deadline and requires
 // that Execute reports an error.
 func TestExecuteTimeout(t *testing.T) {
 	sb := NewProcessSandbox()
 	deadline, stop := context.WithTimeout(context.Background(), 50*time.Millisecond)
 	defer stop()
 	_, err := sb.Execute(deadline, "sleep", "10")
 	if err != nil {
 		// On macOS the error may be "signal: killed" or "context deadline exceeded".
 		// Only the presence of an error is checked; the message varies by platform.
 		t.Logf("timeout produced error: %v", err)
 		return
 	}
 	t.Fatal("expected timeout error")
 }
 func TestExecuteWorkingDirectory(t *testing.T) {
 	// Use a temp directory for this test
 	tmpDir, err := os.MkdirTemp("", "sandbox-test-*")
 	if err != nil {
 		t.Fatalf("failed to create temp dir: %v", err)
 	}
 	defer os.RemoveAll(tmpDir)
 	ps := &ProcessSandbox{
 		WorkingDir:   tmpDir,
 		OutputLimit:  DefaultOutputLimit,
 		EnvWhitelist: AllowedEnvVars,
 	}
 	ctx := context.Background()
 	result, err := ps.Execute(ctx, "pwd")
 	if err != nil {
 		t.Fatalf("Execute failed: %v", err)
 	}
 	if result.ExitCode != 0 {
 		t.Errorf("expected exit code 0, got %d", result.ExitCode)
 	}
 	// pwd should return the temp directory
 	gotDir := strings.TrimSpace(result.Stdout)
 	absGot, _ := filepath.EvalSymlinks(gotDir)
 	absTmp, _ := filepath.EvalSymlinks(tmpDir)
 	if absGot != absTmp {
 		t.Errorf("expected working dir %q, got %q", absTmp, absGot)
 	}
 }
 // TestEnvironmentWhitelist checks that a whitelisted variable (HOME) is
 // visible to the child with the parent's value.
 func TestEnvironmentWhitelist(t *testing.T) {
 	sb := NewProcessSandbox()
 	sb.EnvWhitelist = []string{"HOME"}
 	res, err := sb.Execute(context.Background(), "sh", "-c", "echo $HOME")
 	if err != nil {
 		t.Fatalf("Execute failed: %v", err)
 	}
 	if code := res.ExitCode; code != 0 {
 		t.Errorf("expected exit code 0, got %d", code)
 	}
 	// Skip the comparison when the parent itself has no HOME.
 	want := os.Getenv("HOME")
 	got := strings.TrimSpace(res.Stdout)
 	if want != "" && got != want {
 		t.Errorf("expected HOME=%q, got %q", want, got)
 	}
 }
 // TestEnvironmentIsolation checks that an empty (non-nil) whitelist hides
 // HOME from the child process.
 func TestEnvironmentIsolation(t *testing.T) {
 	sb := NewProcessSandbox()
 	sb.EnvWhitelist = []string{} // empty, not nil: pass nothing through
 	res, err := sb.Execute(context.Background(), "sh", "-c", "echo $HOME")
 	if err != nil {
 		t.Fatalf("Execute failed: %v", err)
 	}
 	// The child should print an empty HOME.
 	if out := strings.TrimSpace(res.Stdout); out != "" {
 		t.Errorf("expected empty HOME in isolated env, got %q", res.Stdout)
 	}
 }
 // TestOutputLimit checks that captured stdout is truncated to exactly
 // OutputLimit bytes and that the retained bytes are the start of the output.
 func TestOutputLimit(t *testing.T) {
 	ps := NewProcessSandbox()
 	ps.OutputLimit = 10 // Only 10 bytes
 	ctx := context.Background()
 	// Generate a long output well beyond the 10-byte limit
 	result, err := ps.Execute(ctx, "sh", "-c", "echo 'AAAAAAAAAABBBBBBBBBBCCCCCCCCCCDDDDDDDDDDEEEEEEEEEEFFFFFFFFFF'")
 	if err != nil {
 		t.Fatalf("Execute failed: %v", err)
 	}
 	// The capture buffer keeps the first OutputLimit bytes and nothing more.
 	if len(result.Stdout) > ps.OutputLimit {
 		t.Errorf("expected truncated output (<=%d bytes), got %d bytes: %q", ps.OutputLimit, len(result.Stdout), result.Stdout)
 	}
 	if want := "AAAAAAAAAA"; result.Stdout != want {
 		t.Errorf("expected truncated stdout %q, got %q", want, result.Stdout)
 	}
 }
 // TestExecuteStderr checks that stdout and stderr are captured separately.
 func TestExecuteStderr(t *testing.T) {
 	sb := NewProcessSandbox()
 	const script = "echo 'error output' >&2; echo 'normal output'"
 	res, err := sb.Execute(context.Background(), "sh", "-c", script)
 	if err != nil {
 		t.Fatalf("Execute failed: %v", err)
 	}
 	if code := res.ExitCode; code != 0 {
 		t.Errorf("expected exit code 0, got %d", code)
 	}
 	if errOut := strings.TrimSpace(res.Stderr); errOut != "error output" {
 		t.Errorf("expected stderr 'error output', got %q", res.Stderr)
 	}
 	if stdOut := strings.TrimSpace(res.Stdout); stdOut != "normal output" {
 		t.Errorf("expected stdout 'normal output', got %q", res.Stdout)
 	}
 }
 // TestSandboxInterfaceSatisfied assigns a ProcessSandbox to a Sandbox
 // variable; the assignment itself is the compile-time check.
 func TestSandboxInterfaceSatisfied(t *testing.T) {
 	var sb Sandbox
 	sb = NewProcessSandbox()
 	if sb == nil {
 		t.Fatal("ProcessSandbox does not satisfy Sandbox interface")
 	}
 }
 // TestWorkingDirPath checks that WorkingDirPath yields an absolute path.
 func TestWorkingDirPath(t *testing.T) {
 	got := NewProcessSandbox().WorkingDirPath()
 	if filepath.IsAbs(got) {
 		return
 	}
 	t.Errorf("expected absolute path, got %q", got)
 }
--- a/pkg/sandbox/sandbox.go
+++ b/pkg/sandbox/sandbox.go
@ -0,0 +1,28 @@
 // Package sandbox provides a secure execution environment for running commands.
 //
 // The sandbox restricts resource usage (timeout, output size, working directory)
 // and environment variable access to prevent runaway or malicious commands.
 // This is the execution backend used by the Tool system's built-in exec tool.
 package sandbox
 import (
 	"context"
 )
 // Result holds the output and exit status of a sandboxed command execution.
 // Stdout and Stderr carry the two captured streams separately; ExitCode is
 // the exit status of the command.
 type Result struct {
 	Stdout   string `json:"stdout"`
 	Stderr   string `json:"stderr"`
 	ExitCode int    `json:"exit_code"`
 }
 // Sandbox defines the interface for command execution environments.
 //
 // Implementations may use OS processes (os/exec), containers, or other
 // isolation mechanisms. The context controls cancellation and timeouts.
 type Sandbox interface {
 	// Execute runs a command with the given arguments inside the sandbox.
 	// The context can be used to set timeouts or cancel the execution.
 	// Returns a Result holding standard output, standard error and the exit
 	// code, or an error if the command could not be run.
 	Execute(ctx context.Context, cmd string, args ...string) (*Result, error)
 }
--- a/pkg/session/jsonl.go
+++ b/pkg/session/jsonl.go
@ -0,0 +1,190 @@
 package session
 import (
 	"encoding/json"
 	"fmt"
 	"os"
 	"path/filepath"
 	"strings"
 	"sync"
 )
 // JSONLStore implements the Store interface using JSONL files.
 //
 // Each session is stored in a separate file named {session_id}.jsonl
 // under the configured storage directory. Every line in the file is a
 // JSON-encoded SessionMessage. New messages are appended in O(1) time.
 // Archived sessions live next to the active ones as {session_id}.jsonl.archived.
 type JSONLStore struct {
 	// storageDir is the directory holding all session files.
 	storageDir string
 	// mu serializes file operations: writers (Save, Archive, Delete) take the
 	// write lock, readers (Load, List, Exists) take the read lock.
 	mu         sync.RWMutex
 }
 // NewJSONLStore returns a JSONLStore rooted at storageDir, creating the
 // directory (and any missing parents) first. It fails if the directory
 // cannot be created.
 func NewJSONLStore(storageDir string) (*JSONLStore, error) {
 	err := os.MkdirAll(storageDir, 0755)
 	if err != nil {
 		return nil, fmt.Errorf("failed to create session storage directory %q: %w", storageDir, err)
 	}
 	store := &JSONLStore{storageDir: storageDir}
 	return store, nil
 }
 // path builds the location of the active JSONL file for sessionID inside the
 // storage directory.
 // NOTE(review): sessionID is joined as-is; confirm callers never pass IDs
 // containing path separators or "..".
 func (s *JSONLStore) path(sessionID string) string {
 	fileName := sessionID + ".jsonl"
 	return filepath.Join(s.storageDir, fileName)
 }
 // archivePath builds the location of the archived JSONL file for sessionID
 // inside the storage directory.
 func (s *JSONLStore) archivePath(sessionID string) string {
 	fileName := sessionID + ".jsonl.archived"
 	return filepath.Join(s.storageDir, fileName)
 }
 // Save appends msg as one JSON line to the session's JSONL file, creating the
 // file if it does not exist. This is an O(1) append operation.
 //
 // The message is encoded before the file is touched, so a message that
 // cannot be marshalled never leaves an empty session file behind. Errors
 // from opening, writing and closing the file are all reported.
 func (s *JSONLStore) Save(sessionID string, msg SessionMessage) error {
 	data, err := json.Marshal(msg)
 	if err != nil {
 		return fmt.Errorf("failed to marshal session message: %w", err)
 	}
 	s.mu.Lock()
 	defer s.mu.Unlock()
 	f, err := os.OpenFile(s.path(sessionID), os.O_APPEND|os.O_CREATE|os.O_WRONLY, 0644)
 	if err != nil {
 		return fmt.Errorf("failed to open session file for %q: %w", sessionID, err)
 	}
 	if _, err := f.Write(append(data, '\n')); err != nil {
 		f.Close() // best effort; the write error is the one worth reporting
 		return fmt.Errorf("failed to write session message: %w", err)
 	}
 	// A failed close can mean the data never reached the file.
 	if err := f.Close(); err != nil {
 		return fmt.Errorf("failed to close session file for %q: %w", sessionID, err)
 	}
 	return nil
 }
 // Load returns every message of a session in file order. The active file is
 // read first; if it does not exist the archived file is tried instead. An
 // error is returned when neither file can be read or a line fails to parse.
 func (s *JSONLStore) Load(sessionID string) ([]SessionMessage, error) {
 	s.mu.RLock()
 	defer s.mu.RUnlock()
 	raw, err := os.ReadFile(s.path(sessionID))
 	switch {
 	case err == nil:
 		// Active file found; parse it below.
 	case os.IsNotExist(err):
 		// No active file: fall back to the archive.
 		archived, archiveErr := os.ReadFile(s.archivePath(sessionID))
 		if archiveErr != nil {
 			return nil, fmt.Errorf("session %q not found", sessionID)
 		}
 		raw = archived
 	default:
 		return nil, fmt.Errorf("failed to read session file for %q: %w", sessionID, err)
 	}
 	return parseJSONL(raw)
 }
 // parseJSONL decodes JSONL content into SessionMessage values, one per
 // non-blank line, in order. Blank or whitespace-only lines are skipped; the
 // first line that fails to decode aborts parsing with an error. Input with no
 // messages yields a nil slice.
 func parseJSONL(data []byte) ([]SessionMessage, error) {
 	var parsed []SessionMessage
 	for _, raw := range strings.Split(string(data), "\n") {
 		entry := strings.TrimSpace(raw)
 		if entry == "" {
 			continue
 		}
 		var decoded SessionMessage
 		err := json.Unmarshal([]byte(entry), &decoded)
 		if err != nil {
 			return nil, fmt.Errorf("failed to unmarshal session message: %w", err)
 		}
 		parsed = append(parsed, decoded)
 	}
 	return parsed, nil
 }
 // List scans the storage directory and returns the IDs of all active
 // sessions, i.e. the names of entries ending in ".jsonl" with that suffix
 // removed. Archived files are not included.
 func (s *JSONLStore) List() ([]string, error) {
 	s.mu.RLock()
 	defer s.mu.RUnlock()
 	entries, err := os.ReadDir(s.storageDir)
 	if err != nil {
 		return nil, fmt.Errorf("failed to read storage directory %q: %w", s.storageDir, err)
 	}
 	var ids []string
 	for i := range entries {
 		fileName := entries[i].Name()
 		if !strings.HasSuffix(fileName, ".jsonl") || strings.HasSuffix(fileName, ".archived") {
 			continue
 		}
 		ids = append(ids, strings.TrimSuffix(fileName, ".jsonl"))
 	}
 	return ids, nil
 }
 // Exists reports whether a session has a file on disk, either active or
 // archived. A stat failure other than "not exist" is returned as an error.
 func (s *JSONLStore) Exists(sessionID string) (bool, error) {
 	s.mu.RLock()
 	defer s.mu.RUnlock()
 	// Active file first.
 	_, activeErr := os.Stat(s.path(sessionID))
 	switch {
 	case activeErr == nil:
 		return true, nil
 	case !os.IsNotExist(activeErr):
 		return false, fmt.Errorf("failed to check session %q: %w", sessionID, activeErr)
 	}
 	// Then the archive.
 	_, archiveErr := os.Stat(s.archivePath(sessionID))
 	switch {
 	case archiveErr == nil:
 		return true, nil
 	case !os.IsNotExist(archiveErr):
 		return false, fmt.Errorf("failed to check archived session %q: %w", sessionID, archiveErr)
 	}
 	return false, nil
 }
 // Archive renames a session's active file to its archived name. It returns a
 // "not found" error when the rename fails because the file does not exist.
 func (s *JSONLStore) Archive(sessionID string) error {
 	s.mu.Lock()
 	defer s.mu.Unlock()
 	err := os.Rename(s.path(sessionID), s.archivePath(sessionID))
 	switch {
 	case err == nil:
 		return nil
 	case os.IsNotExist(err):
 		return fmt.Errorf("session %q not found", sessionID)
 	default:
 		return fmt.Errorf("failed to archive session %q: %w", sessionID, err)
 	}
 }
 // Delete permanently removes a session's active file and its archive.
 //
 // A missing file is not an error, so deleting an unknown session succeeds.
 // Both removals are always attempted. If both fail, the returned error wraps
 // the active-file failure and includes the archive failure's text, so neither
 // is silently lost.
 func (s *JSONLStore) Delete(sessionID string) error {
 	s.mu.Lock()
 	defer s.mu.Unlock()
 	var activeErr, archiveErr error
 	// Remove active file
 	if err := os.Remove(s.path(sessionID)); err != nil && !os.IsNotExist(err) {
 		activeErr = fmt.Errorf("failed to delete session %q: %w", sessionID, err)
 	}
 	// Also remove archived file if it exists
 	if err := os.Remove(s.archivePath(sessionID)); err != nil && !os.IsNotExist(err) {
 		archiveErr = fmt.Errorf("failed to delete archived session %q: %w", sessionID, err)
 	}
 	switch {
 	case activeErr != nil && archiveErr != nil:
 		return fmt.Errorf("%w; %v", activeErr, archiveErr)
 	case activeErr != nil:
 		return activeErr
 	default:
 		return archiveErr
 	}
 }
 // StorageDir reports the directory this store keeps its session files in.
 func (s *JSONLStore) StorageDir() string {
 	dir := s.storageDir
 	return dir
 }
--- a/pkg/session/manager.go
+++ b/pkg/session/manager.go
@ -0,0 +1,198 @@
 package session
 import (
 	"fmt"
 	"sync"
 	"time"
 	"github.com/orca/orca/pkg/bus"
 )
 // Manager provides high-level session lifecycle operations.
 //
 // It layers an in-memory session cache, context-window retrieval and
 // message-bus event publishing on top of a Store.
 type Manager struct {
 	// store persists session messages.
 	store Store
 	// bus receives session lifecycle events; may be nil, in which case no
 	// events are published.
 	bus bus.MessageBus
 	// cache maps session ID to its in-memory Session.
 	cache map[string]*Session
 	// mu guards cache.
 	mu sync.RWMutex
 }
 // NewManager builds a Manager backed by store with an empty session cache.
 // mb is optional: when nil, no lifecycle events are published.
 func NewManager(store Store, mb bus.MessageBus) *Manager {
 	mgr := new(Manager)
 	mgr.store = store
 	mgr.bus = mb
 	mgr.cache = make(map[string]*Session)
 	return mgr
 }
 // CreateSession registers a new, empty, active session under id in the cache
 // and, when a bus is configured, publishes a "session.created" event.
 // It fails if a session with the same id is already cached. Only the cache is
 // consulted; nothing is written to the store here.
 func (m *Manager) CreateSession(id string, metadata map[string]string) (*Session, error) {
 	m.mu.Lock()
 	defer m.mu.Unlock()
 	_, taken := m.cache[id]
 	if taken {
 		return nil, fmt.Errorf("session %q already exists", id)
 	}
 	stamp := time.Now()
 	created := &Session{
 		ID:        id,
 		Status:    SessionActive,
 		Messages:  make([]SessionMessage, 0),
 		CreatedAt: stamp,
 		UpdatedAt: stamp,
 		Metadata:  metadata,
 	}
 	m.cache[id] = created
 	if m.bus == nil {
 		return created, nil
 	}
 	// Announce the new session on the bus.
 	event := bus.Message{
 		ID:      "session-" + id,
 		Type:    bus.MsgTypeSystem,
 		From:    "session.manager",
 		Content: map[string]interface{}{"session_id": id},
 	}
 	m.bus.Publish("session.created", event)
 	return created, nil
 }
 // GetSession retrieves a session by ID, checking the cache and then the store.
 //
 // On a cache miss the messages are loaded from the store and a Session is
 // built around them: CreatedAt/UpdatedAt come from the first/last message
 // timestamps when those are set, otherwise from the current time. The session
 // is then cached.
 //
 // The store is read without holding the manager lock, so the cache is checked
 // again before inserting. If another goroutine cached the session in the
 // meantime, that instance is returned and kept, instead of being overwritten
 // with a possibly older snapshot.
 func (m *Manager) GetSession(id string) (*Session, error) {
 	m.mu.RLock()
 	session, ok := m.cache[id]
 	m.mu.RUnlock()
 	if ok {
 		return session, nil
 	}
 	// Try to load from store
 	messages, err := m.store.Load(id)
 	if err != nil {
 		return nil, fmt.Errorf("failed to load session %q: %w", id, err)
 	}
 	// Derive created/updated timestamps from the messages where possible.
 	now := time.Now()
 	createdAt, updatedAt := now, now
 	if len(messages) > 0 {
 		if ts := messages[0].Timestamp; !ts.IsZero() {
 			createdAt = ts
 		}
 		if ts := messages[len(messages)-1].Timestamp; !ts.IsZero() {
 			updatedAt = ts
 		}
 	}
 	loaded := &Session{
 		ID:        id,
 		Status:    SessionActive,
 		Messages:  messages,
 		CreatedAt: createdAt,
 		UpdatedAt: updatedAt,
 	}
 	m.mu.Lock()
 	defer m.mu.Unlock()
 	// Someone else may have populated the cache while we were loading.
 	if cached, ok := m.cache[id]; ok {
 		return cached, nil
 	}
 	m.cache[id] = loaded
 	return loaded, nil
 }
 // AddMessage appends a message to a session and persists it.
 //
 // The message is timestamped with the current time, written to the store,
 // and then appended to the cached session. If the session is not cached yet,
 // its existing history is loaded from the store first, so that a session
 // which already has messages on disk is not cached with only the newest one.
 // A session unknown to the store is created implicitly.
 //
 // The manager lock is held for the whole operation so that the store and the
 // cache are updated together. If persisting fails, the cache is left
 // unchanged and an error is returned.
 func (m *Manager) AddMessage(sessionID string, role MessageRole, content string, metadata map[string]string) (*SessionMessage, error) {
 	msg := SessionMessage{
 		Role:      role,
 		Content:   content,
 		Timestamp: time.Now(),
 		Metadata:  metadata,
 	}
 	m.mu.Lock()
 	defer m.mu.Unlock()
 	session, cached := m.cache[sessionID]
 	if !cached {
 		// Best-effort hydration: a load failure is expected for a brand-new
 		// session, in which case we start from an empty history.
 		history, err := m.store.Load(sessionID)
 		if err != nil {
 			history = nil
 		}
 		createdAt := msg.Timestamp
 		if len(history) > 0 && !history[0].Timestamp.IsZero() {
 			createdAt = history[0].Timestamp
 		}
 		session = &Session{
 			ID:        sessionID,
 			Status:    SessionActive,
 			Messages:  history,
 			CreatedAt: createdAt,
 			UpdatedAt: createdAt,
 		}
 	}
 	if err := m.store.Save(sessionID, msg); err != nil {
 		return nil, fmt.Errorf("failed to save message to session %q: %w", sessionID, err)
 	}
 	// Persisted successfully: now reflect it in the cache.
 	session.Messages = append(session.Messages, msg)
 	session.UpdatedAt = msg.Timestamp
 	m.cache[sessionID] = session
 	return &msg, nil
 }
 // GetContext returns the most recent windowSize messages of a session, oldest
 // first. If windowSize <= 0 or >= the total number of messages, all messages
 // are returned.
 //
 // The result is a copy taken under the manager's read lock: callers may keep
 // or modify it freely without affecting the cached session, and the read does
 // not race with concurrent AddMessage calls.
 func (m *Manager) GetContext(sessionID string, windowSize int) ([]SessionMessage, error) {
 	session, err := m.GetSession(sessionID)
 	if err != nil {
 		return nil, err
 	}
 	m.mu.RLock()
 	defer m.mu.RUnlock()
 	window := session.Messages
 	if windowSize > 0 && windowSize < len(window) {
 		window = window[len(window)-windowSize:]
 	}
 	out := make([]SessionMessage, len(window))
 	copy(out, window)
 	return out, nil
 }
 // ArchiveSession archives a session in the store, marks the cached copy (if
 // any) as SessionArchived, and publishes a "session.archived" event when a
 // bus is configured.
 //
 // The cached status is only changed after the store has archived the session
 // successfully, so a failed archive leaves the cache consistent with disk.
 func (m *Manager) ArchiveSession(id string) error {
 	m.mu.Lock()
 	defer m.mu.Unlock()
 	if err := m.store.Archive(id); err != nil {
 		return err
 	}
 	if session, ok := m.cache[id]; ok {
 		session.Status = SessionArchived
 	}
 	// Publish event
 	if m.bus != nil {
 		m.bus.Publish("session.archived", bus.Message{
 			ID:      "session-" + id,
 			Type:    bus.MsgTypeSystem,
 			From:    "session.manager",
 			Content: map[string]interface{}{"session_id": id},
 		})
 	}
 	return nil
 }
 // DeleteSession drops the session from the cache and then removes it from
 // the store, returning the store's result.
 func (m *Manager) DeleteSession(id string) error {
 	func() {
 		m.mu.Lock()
 		defer m.mu.Unlock()
 		delete(m.cache, id)
 	}()
 	err := m.store.Delete(id)
 	return err
 }
 // ListSessions returns the session IDs reported by the underlying store.
 func (m *Manager) ListSessions() ([]string, error) {
 	ids, err := m.store.List()
 	return ids, err
 }
 // Store exposes the Store this manager persists to.
 func (m *Manager) Store() Store {
 	backing := m.store
 	return backing
 }
--- a/pkg/session/session_test.go
+++ b/pkg/session/session_test.go
@ -0,0 +1,550 @@
 package session
 import (
 	"os"
 	"path/filepath"
 	"testing"
 	"time"
 	"github.com/orca/orca/pkg/bus"
 )
 // ============================================================
 // JSONL Store Tests
 // ============================================================
 // setupTestStore creates a JSONLStore in a fresh temporary directory.
 //
 // The directory comes from t.TempDir, so the testing framework removes it
 // automatically when the test ends. The returned cleanup function is kept for
 // existing callers and does nothing.
 func setupTestStore(t *testing.T) (*JSONLStore, func()) {
 	t.Helper()
 	store, err := NewJSONLStore(t.TempDir())
 	if err != nil {
 		t.Fatalf("NewJSONLStore failed: %v", err)
 	}
 	return store, func() {}
 }
 // TestNewJSONLStore checks that a store is created with a storage directory set.
 func TestNewJSONLStore(t *testing.T) {
 	st, done := setupTestStore(t)
 	defer done()
 	if st == nil {
 		t.Fatal("NewJSONLStore returned nil")
 	}
 	if dir := st.StorageDir(); dir == "" {
 		t.Error("StorageDir should not be empty")
 	}
 }
 // TestJSONLStoreSaveAndLoad round-trips a single message through the store.
 func TestJSONLStoreSaveAndLoad(t *testing.T) {
 	st, done := setupTestStore(t)
 	defer done()
 	in := SessionMessage{Role: RoleUser, Content: "Hello, world!", Timestamp: time.Now()}
 	if err := st.Save("session-1", in); err != nil {
 		t.Fatalf("Save failed: %v", err)
 	}
 	loaded, err := st.Load("session-1")
 	if err != nil {
 		t.Fatalf("Load failed: %v", err)
 	}
 	if n := len(loaded); n != 1 {
 		t.Fatalf("expected 1 message, got %d", n)
 	}
 	out := loaded[0]
 	if out.Role != RoleUser {
 		t.Errorf("expected RoleUser, got %s", out.Role)
 	}
 	if out.Content != "Hello, world!" {
 		t.Errorf("expected content 'Hello, world!', got %q", out.Content)
 	}
 }
 // TestJSONLStoreAppendMultiple saves several messages to one session and
 // checks they load back in the same order.
 func TestJSONLStoreAppendMultiple(t *testing.T) {
 	st, done := setupTestStore(t)
 	defer done()
 	wantRoles := []MessageRole{RoleUser, RoleAssistant, RoleUser, RoleSystem}
 	for idx := range wantRoles {
 		entry := SessionMessage{
 			Role:      wantRoles[idx],
 			Content:   "message " + string(rune('0'+idx)),
 			Timestamp: time.Now(),
 		}
 		if err := st.Save("session-append", entry); err != nil {
 			t.Fatalf("Save %d failed: %v", idx, err)
 		}
 	}
 	loaded, err := st.Load("session-append")
 	if err != nil {
 		t.Fatalf("Load failed: %v", err)
 	}
 	if len(loaded) != len(wantRoles) {
 		t.Fatalf("expected %d messages, got %d", len(wantRoles), len(loaded))
 	}
 	for idx := range loaded {
 		if got := loaded[idx].Role; got != wantRoles[idx] {
 			t.Errorf("message %d: expected role %s, got %s", idx, wantRoles[idx], got)
 		}
 	}
 }
 // TestJSONLStoreLoadNonexistent checks that loading an unknown session fails.
 func TestJSONLStoreLoadNonexistent(t *testing.T) {
 	st, done := setupTestStore(t)
 	defer done()
 	if _, err := st.Load("nonexistent"); err == nil {
 		t.Error("expected error loading nonexistent session")
 	}
 }
 // TestJSONLStoreExists checks Exists for an unknown session and for one that
 // has just been saved.
 func TestJSONLStoreExists(t *testing.T) {
 	store, cleanup := setupTestStore(t)
 	defer cleanup()
 	exists, err := store.Exists("nonexistent")
 	if err != nil {
 		t.Fatalf("Exists failed: %v", err)
 	}
 	if exists {
 		t.Error("expected nonexistent session to return false")
 	}
 	// A failed setup write would make the assertion below meaningless.
 	if err := store.Save("session-exists", SessionMessage{Role: RoleUser, Content: "test"}); err != nil {
 		t.Fatalf("Save failed: %v", err)
 	}
 	exists, err = store.Exists("session-exists")
 	if err != nil {
 		t.Fatalf("Exists failed: %v", err)
 	}
 	if !exists {
 		t.Error("expected existing session to return true")
 	}
 }
 // TestJSONLStoreList saves three sessions and checks List reports exactly
 // those IDs (in any order).
 func TestJSONLStoreList(t *testing.T) {
 	store, cleanup := setupTestStore(t)
 	defer cleanup()
 	ids := []string{"sess-a", "sess-b", "sess-c"}
 	for _, id := range ids {
 		if err := store.Save(id, SessionMessage{Role: RoleUser, Content: "test"}); err != nil {
 			t.Fatalf("Save %q failed: %v", id, err)
 		}
 	}
 	list, err := store.List()
 	if err != nil {
 		t.Fatalf("List failed: %v", err)
 	}
 	if len(list) != len(ids) {
 		t.Fatalf("expected %d sessions, got %d", len(ids), len(list))
 	}
 	found := make(map[string]bool, len(list))
 	for _, id := range list {
 		found[id] = true
 	}
 	for _, id := range ids {
 		if !found[id] {
 			t.Errorf("missing session %q in list", id)
 		}
 	}
 }
 // TestJSONLStoreArchiveAndLoad checks that an archived session can still be
 // loaded but no longer appears in List.
 func TestJSONLStoreArchiveAndLoad(t *testing.T) {
 	store, cleanup := setupTestStore(t)
 	defer cleanup()
 	msg := SessionMessage{Role: RoleUser, Content: "archive test"}
 	if err := store.Save("sess-archive", msg); err != nil {
 		t.Fatalf("Save failed: %v", err)
 	}
 	if err := store.Archive("sess-archive"); err != nil {
 		t.Fatalf("Archive failed: %v", err)
 	}
 	// Should still be loadable (archived files are in .archived suffix)
 	messages, err := store.Load("sess-archive")
 	if err != nil {
 		t.Fatalf("Load after archive failed: %v", err)
 	}
 	if len(messages) != 1 {
 		t.Errorf("expected 1 message after archive, got %d", len(messages))
 	}
 	// Should not appear in List
 	list, err := store.List()
 	if err != nil {
 		t.Fatalf("List failed: %v", err)
 	}
 	for _, id := range list {
 		if id == "sess-archive" {
 			t.Error("archived session should not appear in List")
 		}
 	}
 }
 // TestJSONLStoreArchiveNonexistent checks that archiving an unknown session fails.
 func TestJSONLStoreArchiveNonexistent(t *testing.T) {
 	st, done := setupTestStore(t)
 	defer done()
 	if err := st.Archive("nonexistent"); err == nil {
 		t.Error("expected error archiving nonexistent session")
 	}
 }
 // TestJSONLStoreDelete checks that a saved session no longer exists after Delete.
 func TestJSONLStoreDelete(t *testing.T) {
 	store, cleanup := setupTestStore(t)
 	defer cleanup()
 	if err := store.Save("sess-delete", SessionMessage{Role: RoleUser, Content: "delete me"}); err != nil {
 		t.Fatalf("Save failed: %v", err)
 	}
 	if err := store.Delete("sess-delete"); err != nil {
 		t.Fatalf("Delete failed: %v", err)
 	}
 	exists, err := store.Exists("sess-delete")
 	if err != nil {
 		t.Fatalf("Exists failed: %v", err)
 	}
 	if exists {
 		t.Error("expected deleted session to not exist")
 	}
 }
 // TestJSONLStoreDeleteNonexistent checks that deleting an unknown session is
 // not an error.
 func TestJSONLStoreDeleteNonexistent(t *testing.T) {
 	st, done := setupTestStore(t)
 	defer done()
 	if err := st.Delete("nonexistent"); err != nil {
 		t.Fatalf("Delete nonexistent should succeed: %v", err)
 	}
 }
 // TestJSONLStoreConcurrentWrites has two goroutines append 50 messages each
 // to the same session and checks that all 100 lines load back.
 func TestJSONLStoreConcurrentWrites(t *testing.T) {
 	st, done := setupTestStore(t)
 	defer done()
 	finished := make(chan struct{}, 2)
 	// writer appends 50 copies of one message, then signals completion.
 	writer := func(role MessageRole, content string) {
 		for n := 0; n < 50; n++ {
 			st.Save("concurrent", SessionMessage{Role: role, Content: content})
 		}
 		finished <- struct{}{}
 	}
 	go writer(RoleUser, "from-a")
 	go writer(RoleAssistant, "from-b")
 	for pending := 2; pending > 0; pending-- {
 		<-finished
 	}
 	loaded, err := st.Load("concurrent")
 	if err != nil {
 		t.Fatalf("Load failed: %v", err)
 	}
 	if n := len(loaded); n != 100 {
 		t.Errorf("expected 100 messages, got %d", n)
 	}
 }
 // TestJSONLStoreEmptyFile checks that an existing but empty session file
 // loads as zero messages without error.
 func TestJSONLStoreEmptyFile(t *testing.T) {
 	store, cleanup := setupTestStore(t)
 	defer cleanup()
 	// Create an empty session file directly in the storage directory.
 	emptyPath := filepath.Join(store.StorageDir(), "empty.jsonl")
 	if err := os.WriteFile(emptyPath, nil, 0644); err != nil {
 		t.Fatalf("failed to create empty session file: %v", err)
 	}
 	messages, err := store.Load("empty")
 	if err != nil {
 		t.Fatalf("Load empty session failed: %v", err)
 	}
 	if len(messages) != 0 {
 		t.Errorf("expected 0 messages from empty file, got %d", len(messages))
 	}
 }
 // ============================================================
 // Session Manager Tests
 // ============================================================
 // setupTestManager builds a Manager over a temporary JSONL store and a fresh
 // message bus. The returned function closes the bus and then cleans up the store.
 func setupTestManager(t *testing.T) (*Manager, func()) {
 	t.Helper()
 	st, removeStore := setupTestStore(t)
 	msgBus := bus.New()
 	teardown := func() {
 		msgBus.Close()
 		removeStore()
 	}
 	return NewManager(st, msgBus), teardown
 }
 // TestNewManager checks that the test manager is constructed.
 func TestNewManager(t *testing.T) {
 	manager, teardown := setupTestManager(t)
 	defer teardown()
 	if manager != nil {
 		return
 	}
 	t.Fatal("NewManager returned nil")
 }
 // TestManagerCreateSession checks the fields of a freshly created session.
 func TestManagerCreateSession(t *testing.T) {
 	manager, teardown := setupTestManager(t)
 	defer teardown()
 	meta := map[string]string{"key": "value"}
 	created, err := manager.CreateSession("sess-1", meta)
 	if err != nil {
 		t.Fatalf("CreateSession failed: %v", err)
 	}
 	if created.ID != "sess-1" {
 		t.Errorf("expected ID 'sess-1', got %q", created.ID)
 	}
 	if created.Status != SessionActive {
 		t.Errorf("expected SessionActive, got %s", created.Status)
 	}
 	if got := created.Metadata["key"]; got != "value" {
 		t.Errorf("expected metadata key 'value', got %q", got)
 	}
 	if count := created.MessageCount(); count != 0 {
 		t.Errorf("expected 0 messages, got %d", count)
 	}
 	if created.CreatedAt.IsZero() {
 		t.Error("CreatedAt should not be zero")
 	}
 }
 // TestManagerCreateDuplicate verifies that creating a session with an ID
 // that already exists is rejected.
 func TestManagerCreateDuplicate(t *testing.T) {
 	mgr, cleanup := setupTestManager(t)
 	defer cleanup()
 	// The first creation must succeed; otherwise an error from the second
 	// call would not prove that duplicates are rejected.
 	if _, err := mgr.CreateSession("dup", nil); err != nil {
 		t.Fatalf("initial CreateSession failed: %v", err)
 	}
 	if _, err := mgr.CreateSession("dup", nil); err == nil {
 		t.Error("expected error creating duplicate session")
 	}
 }
 // TestManagerAddMessage verifies that AddMessage returns a message carrying
 // the supplied role, content and metadata plus a non-zero timestamp, and
 // that the message can be read back through GetContext.
 func TestManagerAddMessage(t *testing.T) {
 	mgr, cleanup := setupTestManager(t)
 	defer cleanup()
 	msg, err := mgr.AddMessage("sess-add", RoleUser, "Hello!", map[string]string{"source": "test"})
 	if err != nil {
 		t.Fatalf("AddMessage failed: %v", err)
 	}
 	if msg.Role != RoleUser {
 		t.Errorf("expected RoleUser, got %s", msg.Role)
 	}
 	if msg.Content != "Hello!" {
 		t.Errorf("expected 'Hello!', got %q", msg.Content)
 	}
 	if msg.Metadata["source"] != "test" {
 		t.Errorf("expected metadata source 'test', got %q", msg.Metadata["source"])
 	}
 	if msg.Timestamp.IsZero() {
 		t.Error("Timestamp should not be zero")
 	}
 	// Verify it was persisted. The error is checked so a retrieval failure is
 	// not misreported as a wrong message count.
 	messages, err := mgr.GetContext("sess-add", 10)
 	if err != nil {
 		t.Fatalf("GetContext failed: %v", err)
 	}
 	if len(messages) != 1 {
 		t.Fatalf("expected 1 message, got %d", len(messages))
 	}
 }
 // TestManagerAddMessageAutoCreatesSession verifies that adding a message to
 // an ID that was never explicitly created makes the session retrievable.
 func TestManagerAddMessageAutoCreatesSession(t *testing.T) {
 	mgr, cleanup := setupTestManager(t)
 	defer cleanup()
 	if _, err := mgr.AddMessage("auto-session", RoleUser, "auto create", nil); err != nil {
 		t.Fatalf("AddMessage failed: %v", err)
 	}
 	session, err := mgr.GetSession("auto-session")
 	if err != nil {
 		t.Fatalf("GetSession failed: %v", err)
 	}
 	if session.MessageCount() != 1 {
 		t.Errorf("expected 1 message, got %d", session.MessageCount())
 	}
 }
 // TestManagerGetContextWindow exercises GetContext's window argument: a
 // window smaller than the history, a window larger than the history, and a
 // window of zero (expected to return everything).
 func TestManagerGetContextWindow(t *testing.T) {
 	mgr, cleanup := setupTestManager(t)
 	defer cleanup()
 	// Add 10 messages
 	for i := 0; i < 10; i++ {
 		if _, err := mgr.AddMessage("window-test", RoleUser, "msg", nil); err != nil {
 			t.Fatalf("AddMessage %d failed: %v", i, err)
 		}
 	}
 	// Get last 3
 	messages, err := mgr.GetContext("window-test", 3)
 	if err != nil {
 		t.Fatalf("GetContext failed: %v", err)
 	}
 	if len(messages) != 3 {
 		t.Errorf("expected 3 messages, got %d", len(messages))
 	}
 	// Get all (window larger than total)
 	all, err := mgr.GetContext("window-test", 100)
 	if err != nil {
 		t.Fatalf("GetContext with window=100 failed: %v", err)
 	}
 	if len(all) != 10 {
 		t.Errorf("expected 10 messages, got %d", len(all))
 	}
 	// Get with window <= 0
 	all2, err := mgr.GetContext("window-test", 0)
 	if err != nil {
 		t.Fatalf("GetContext with window=0 failed: %v", err)
 	}
 	if len(all2) != 10 {
 		t.Errorf("expected 10 messages with window=0, got %d", len(all2))
 	}
 }
 // TestManagerGetContextNonexistent expects GetContext to fail for an unknown ID.
 func TestManagerGetContextNonexistent(t *testing.T) {
 	manager, teardown := setupTestManager(t)
 	defer teardown()
 	if _, err := manager.GetContext("nonexistent", 10); err == nil {
 		t.Error("expected error getting context for nonexistent session")
 	}
 }
 // TestManagerArchiveSession verifies that archiving a session flips its
 // status to SessionArchived and that IsArchived reports it.
 func TestManagerArchiveSession(t *testing.T) {
 	mgr, cleanup := setupTestManager(t)
 	defer cleanup()
 	if _, err := mgr.CreateSession("archivable", nil); err != nil {
 		t.Fatalf("CreateSession failed: %v", err)
 	}
 	if _, err := mgr.AddMessage("archivable", RoleUser, "test", nil); err != nil {
 		t.Fatalf("AddMessage failed: %v", err)
 	}
 	if err := mgr.ArchiveSession("archivable"); err != nil {
 		t.Fatalf("ArchiveSession failed: %v", err)
 	}
 	// Check the lookup error before touching the session so a failed lookup
 	// cannot turn into a nil-pointer panic.
 	session, err := mgr.GetSession("archivable")
 	if err != nil {
 		t.Fatalf("GetSession failed: %v", err)
 	}
 	if session.Status != SessionArchived {
 		t.Errorf("expected SessionArchived, got %s", session.Status)
 	}
 	if !session.IsArchived() {
 		t.Error("expected IsArchived to return true")
 	}
 }
 // TestManagerDeleteSession verifies that a deleted session can no longer be
 // retrieved through GetSession.
 func TestManagerDeleteSession(t *testing.T) {
 	mgr, cleanup := setupTestManager(t)
 	defer cleanup()
 	if _, err := mgr.CreateSession("deletable", nil); err != nil {
 		t.Fatalf("CreateSession failed: %v", err)
 	}
 	if err := mgr.DeleteSession("deletable"); err != nil {
 		t.Fatalf("DeleteSession failed: %v", err)
 	}
 	if _, err := mgr.GetSession("deletable"); err == nil {
 		t.Error("expected error getting deleted session")
 	}
 }
 // TestManagerListSessions verifies that every session that received a
 // message shows up in ListSessions.
 func TestManagerListSessions(t *testing.T) {
 	mgr, cleanup := setupTestManager(t)
 	defer cleanup()
 	for _, id := range []string{"list-a", "list-b"} {
 		if _, err := mgr.AddMessage(id, RoleUser, "seed", nil); err != nil {
 			t.Fatalf("AddMessage(%q) failed: %v", id, err)
 		}
 	}
 	sessions, err := mgr.ListSessions()
 	if err != nil {
 		t.Fatalf("ListSessions failed: %v", err)
 	}
 	if len(sessions) != 2 {
 		t.Errorf("expected 2 sessions, got %d", len(sessions))
 	}
 }
 // TestManagerMultipleMessagesOrder verifies that GetContext returns messages
 // in the order they were added. Every position is compared, not just the
 // first and last.
 func TestManagerMultipleMessagesOrder(t *testing.T) {
 	mgr, cleanup := setupTestManager(t)
 	defer cleanup()
 	contents := []string{"first", "second", "third"}
 	for _, c := range contents {
 		if _, err := mgr.AddMessage("order-test", RoleUser, c, nil); err != nil {
 			t.Fatalf("AddMessage(%q) failed: %v", c, err)
 		}
 	}
 	messages, err := mgr.GetContext("order-test", 10)
 	if err != nil {
 		t.Fatalf("GetContext failed: %v", err)
 	}
 	if len(messages) != len(contents) {
 		t.Fatalf("expected %d messages, got %d", len(contents), len(messages))
 	}
 	for i, want := range contents {
 		if got := messages[i].Content; got != want {
 			t.Errorf("message %d: expected content %q, got %q", i, want, got)
 		}
 	}
 }
 // TestManagerStoreAccess checks that the Manager exposes its backing store.
 func TestManagerStoreAccess(t *testing.T) {
 	manager, teardown := setupTestManager(t)
 	defer teardown()
 	if backing := manager.Store(); backing == nil {
 		t.Error("Store() should not return nil")
 	}
 }
 // ============================================================
 // Session Types Tests
 // ============================================================
 // TestSessionIsArchived checks IsArchived for both status values.
 func TestSessionIsArchived(t *testing.T) {
 	session := &Session{Status: SessionActive}
 	if archived := session.IsArchived(); archived {
 		t.Error("active session should not be archived")
 	}
 	session.Status = SessionArchived
 	if archived := session.IsArchived(); !archived {
 		t.Error("archived session should be archived")
 	}
 }
 // TestSessionMessageCount checks that MessageCount reflects the slice length.
 func TestSessionMessageCount(t *testing.T) {
 	session := &Session{Messages: make([]SessionMessage, 5)}
 	count := session.MessageCount()
 	if count != 5 {
 		t.Errorf("expected 5 messages, got %d", count)
 	}
 }
 func TestMessageRoleConstants(t *testing.T) {
 	if RoleUser != "user" {
 		t.Errorf("expected RoleUser 'user', got %q", RoleUser)
 	}
 	if RoleAssistant != "assistant" {
 		t.Errorf("expected RoleAssistant 'assistant', got %q", RoleAssistant)
 	}
 	if RoleSystem != "system" {
 		t.Errorf("expected RoleSystem 'system', got %q", RoleSystem)
 	}
 	if RoleTool != "tool" {
 		t.Errorf("expected RoleTool 'tool', got %q", RoleTool)
 	}
 }
 func TestSessionStatusConstants(t *testing.T) {
 	if SessionActive != "active" {
 		t.Errorf("expected SessionActive 'active', got %q", SessionActive)
 	}
 	if SessionArchived != "archived" {
 		t.Errorf("expected SessionArchived 'archived', got %q", SessionArchived)
 	}
 }
--- a/pkg/session/store.go
+++ b/pkg/session/store.go
@ -0,0 +1,28 @@
 package session
 // Store defines the persistence interface for session message storage.
 //
 // Implementations must be safe for concurrent use. The default implementation
 // uses JSONL files (one file per session) with O(1) append writes.
 // Every method identifies the target session by its string ID.
 type Store interface {
 	// Save appends a single message to a session's history.
 	// Creates the session file if it does not exist.
 	Save(sessionID string, msg SessionMessage) error
 	// Load retrieves all messages for a session in chronological order.
 	// Returns an error if the session does not exist.
 	Load(sessionID string) ([]SessionMessage, error)
 	// List returns the IDs of all sessions known to the store.
 	List() ([]string, error)
 	// Exists reports whether a session exists in the store. The error
 	// return covers failures to determine existence.
 	Exists(sessionID string) (bool, error)
 	// Archive marks a session as archived (read-only).
 	// This is a soft delete that preserves the data.
 	Archive(sessionID string) error
 	// Delete removes a session permanently from the store.
 	Delete(sessionID string) error
 }
--- a/pkg/session/types.go
+++ b/pkg/session/types.go
@ -0,0 +1,60 @@
 // Package session provides conversation session management for the Orca framework.
 //
 // Sessions persist conversation history and provide context-window-based
 // retrieval for LLM interactions. The default storage backend uses JSONL
 // files with O(1) append writes.
 package session
 import "time"
 // MessageRole represents the role of a message sender in a session.
 // It is a string type; the values below are what appear in the "role"
 // field of a serialized SessionMessage.
 type MessageRole string
 const (
 	// RoleUser represents a human user message ("user").
 	RoleUser MessageRole = "user"
 	// RoleAssistant represents an AI assistant message ("assistant").
 	RoleAssistant MessageRole = "assistant"
 	// RoleSystem represents a system-level message ("system").
 	RoleSystem MessageRole = "system"
 	// RoleTool represents a tool execution result ("tool").
 	RoleTool MessageRole = "tool"
 )
 // SessionMessage represents a single message entry in a session's history.
 // The struct tags define its JSON encoding; Metadata is omitted from the
 // output when empty.
 type SessionMessage struct {
 	// Role identifies who produced the message.
 	Role      MessageRole       `json:"role"`
 	// Content is the message text.
 	Content   string            `json:"content"`
 	// Timestamp records when the message was created.
 	Timestamp time.Time         `json:"timestamp"`
 	// Metadata holds optional string key/value annotations.
 	Metadata  map[string]string `json:"metadata,omitempty"`
 }
 // SessionStatus represents the lifecycle status of a session.
 // It is a string type with the two values declared below.
 type SessionStatus string
 const (
 	// SessionActive indicates an active, in-use session ("active").
 	SessionActive SessionStatus = "active"
 	// SessionArchived indicates an archived (read-only) session ("archived").
 	SessionArchived SessionStatus = "archived"
 )
 // Session represents a conversation session with full history.
 // The struct tags define its JSON encoding; Messages and Metadata are
 // omitted from the output when empty.
 type Session struct {
 	// ID is the session identifier.
 	ID        string            `json:"id"`
 	// Status is the lifecycle state (see SessionActive, SessionArchived).
 	Status    SessionStatus     `json:"status"`
 	// Messages is the conversation history held by this session value.
 	Messages  []SessionMessage  `json:"messages,omitempty"`
 	// CreatedAt is the creation time of the session.
 	CreatedAt time.Time         `json:"created_at"`
 	// UpdatedAt is the time of the last update to the session.
 	UpdatedAt time.Time         `json:"updated_at"`
 	// Metadata holds optional string key/value annotations.
 	Metadata  map[string]string `json:"metadata,omitempty"`
 }
 // IsArchived reports whether the session's Status equals SessionArchived.
 func (s *Session) IsArchived() bool {
 	archived := s.Status == SessionArchived
 	return archived
 }
 // MessageCount reports how many entries the session's Messages slice holds.
 func (s *Session) MessageCount() int {
 	count := len(s.Messages)
 	return count
 }
--- a/pkg/skill/manager.go
+++ b/pkg/skill/manager.go
@ -0,0 +1,197 @@
 package skill
 import (
 	"fmt"
 	"os"
 	"path/filepath"
 	"sort"
 	"strings"
 	"sync"
 )
 const (
 	// DefaultSkillsDir is the default directory for user-installed skills.
 	// The leading "~" is expanded to the user's home directory by NewManager.
 	DefaultSkillsDir = "~/.agents/skills"
 	// SkillManifestFile is the name of the skill manifest file that LoadAll
 	// looks for inside each subdirectory of the skills directory.
 	SkillManifestFile = "SKILL.md"
 )
 // Manager is a thread-safe registry for loading, storing, and querying Skills.
 //
 // Skills are loaded from a directory in which each immediate subdirectory
 // containing a SKILL.md file is treated as a skill. Discovery is not
 // automatic: NewManager only records the directory, and skills become
 // available after LoadAll (or Reload) has been called. Skills can then be
 // looked up by name or by trigger keywords.
 type Manager struct {
 	// mu guards skills.
 	mu        sync.RWMutex
 	// skillsDir is the directory scanned by LoadAll; it is set in NewManager.
 	skillsDir string
 	// skills holds the loaded skills keyed by Skill.Name.
 	skills    map[string]*Skill
 }
 // NewManager returns an empty Manager bound to skillsDir. An empty skillsDir
 // selects DefaultSkillsDir, and a leading "~" is expanded to the home
 // directory. No skills are loaded here; call LoadAll to scan the directory.
 func NewManager(skillsDir string) *Manager {
 	dir := skillsDir
 	if dir == "" {
 		dir = DefaultSkillsDir
 	}
 	manager := &Manager{skills: make(map[string]*Skill)}
 	// Resolve "~" so later filesystem calls receive a real path.
 	manager.skillsDir = expandHome(dir)
 	return manager
 }
 // LoadAll discards any previously loaded skills, scans the skills directory,
 // and loads every immediate subdirectory that contains a SKILL.md manifest.
 //
 // It returns the number of skills held by the manager afterwards. A missing
 // skills directory is not an error and yields (0, nil). Skills that fail to
 // parse, and skills whose name duplicates one that was already loaded in this
 // scan, are skipped; their problems are aggregated into the returned error
 // while the successfully loaded skills remain available. When two directories
 // declare the same name, the first one in directory order is kept, so the
 // returned count always matches the number of registered skills.
 func (m *Manager) LoadAll() (int, error) {
 	m.mu.Lock()
 	defer m.mu.Unlock()
 	// Clear existing skills
 	m.skills = make(map[string]*Skill)
 	// Check if skills directory exists
 	info, err := os.Stat(m.skillsDir)
 	if err != nil {
 		if os.IsNotExist(err) {
 			return 0, nil // No skills directory yet — not an error
 		}
 		return 0, fmt.Errorf("skill: cannot access skills directory %q: %w", m.skillsDir, err)
 	}
 	if !info.IsDir() {
 		return 0, fmt.Errorf("skill: %q is not a directory", m.skillsDir)
 	}
 	// Read all entries in the skills directory
 	entries, err := os.ReadDir(m.skillsDir)
 	if err != nil {
 		return 0, fmt.Errorf("skill: failed to read skills directory %q: %w", m.skillsDir, err)
 	}
 	var loadErrors []string
 	for _, entry := range entries {
 		if !entry.IsDir() {
 			continue
 		}
 		skillPath := filepath.Join(m.skillsDir, entry.Name(), SkillManifestFile)
 		if _, err := os.Stat(skillPath); os.IsNotExist(err) {
 			continue // No SKILL.md in this directory — skip
 		}
 		skill, err := ParseSkillFile(skillPath)
 		if err != nil {
 			loadErrors = append(loadErrors, fmt.Sprintf("%s: %v", entry.Name(), err))
 			continue
 		}
 		// Report name collisions instead of silently overwriting an
 		// earlier skill while still counting both as loaded.
 		if existing, dup := m.skills[skill.Name]; dup {
 			loadErrors = append(loadErrors, fmt.Sprintf("%s: duplicate skill name %q (already loaded from %q)",
 				entry.Name(), skill.Name, existing.Path))
 			continue
 		}
 		m.skills[skill.Name] = skill
 	}
 	loaded := len(m.skills)
 	if len(loadErrors) > 0 {
 		return loaded, fmt.Errorf("skill: loaded %d skills with %d errors: %s",
 			loaded, len(loadErrors), strings.Join(loadErrors, "; "))
 	}
 	return loaded, nil
 }
 // GetSkill looks up a loaded skill by name under the read lock. The boolean
 // is false when no skill with that name is registered.
 func (m *Manager) GetSkill(name string) (*Skill, bool) {
 	m.mu.RLock()
 	found, exists := m.skills[name]
 	m.mu.RUnlock()
 	return found, exists
 }
 // ListSkills returns a new slice holding every loaded skill, ordered by
 // ascending Name. The slice is never nil.
 func (m *Manager) ListSkills() []*Skill {
 	m.mu.RLock()
 	defer m.mu.RUnlock()
 	ordered := make([]*Skill, len(m.skills))
 	next := 0
 	for _, s := range m.skills {
 		ordered[next] = s
 		next++
 	}
 	byName := func(a, b int) bool { return ordered[a].Name < ordered[b].Name }
 	sort.Slice(ordered, byName)
 	return ordered
 }
 // FindSkill returns the skills for which MatchTrigger(query) is true.
 //
 // Results are ordered by relevance: skills with more triggers occurring in
 // the query come first. Skills with the same number of matching triggers are
 // ordered by name, so the result is deterministic regardless of map
 // iteration order. A nil slice is returned when nothing matches.
 func (m *Manager) FindSkill(query string) []*Skill {
 	m.mu.RLock()
 	defer m.mu.RUnlock()
 	var matches []*Skill
 	// Score each match once up front rather than on every sort comparison.
 	scores := make(map[*Skill]int)
 	for _, skill := range m.skills {
 		if skill.MatchTrigger(query) {
 			matches = append(matches, skill)
 			scores[skill] = countMatches(skill, query)
 		}
 	}
 	// Sort by number of matching triggers (descending), then by name.
 	sort.Slice(matches, func(i, j int) bool {
 		si, sj := scores[matches[i]], scores[matches[j]]
 		if si != sj {
 			return si > sj
 		}
 		return matches[i].Name < matches[j].Name
 	})
 	return matches
 }
 // SkillsDir reports the directory this manager scans, as resolved by NewManager.
 func (m *Manager) SkillsDir() string {
 	dir := m.skillsDir
 	return dir
 }
 // Reload rescans the skills directory. It simply delegates to LoadAll and
 // returns LoadAll's count and error unchanged.
 func (m *Manager) Reload() (int, error) {
 	count, err := m.LoadAll()
 	return count, err
 }
 // countMatches returns how many of the skill's triggers occur in query,
 // compared case-insensitively as substrings. Empty triggers are ignored:
 // an empty string is a substring of every query and would otherwise inflate
 // the relevance score of any skill that carries one.
 func countMatches(skill *Skill, query string) int {
 	count := 0
 	queryLower := strings.ToLower(query)
 	for _, trigger := range skill.Triggers {
 		if trigger == "" {
 			continue
 		}
 		if strings.Contains(queryLower, strings.ToLower(trigger)) {
 			count++
 		}
 	}
 	return count
 }
 // expandHome replaces a leading "~" path element with the current user's
 // home directory.
 //
 // Only "~" on its own or "~" followed by a path separator is expanded.
 // Anything else (including "~user/..." forms, which would name another
 // user's home) is returned unchanged, as is the input when the home
 // directory cannot be determined.
 func expandHome(path string) string {
 	isHomeRef := path == "~" ||
 		strings.HasPrefix(path, "~/") ||
 		strings.HasPrefix(path, "~"+string(filepath.Separator))
 	if !isHomeRef {
 		return path
 	}
 	home, err := os.UserHomeDir()
 	if err != nil {
 		return path
 	}
 	return filepath.Join(home, path[1:])
 }
 // joinStrings concatenates parts with sep placed between consecutive
 // elements. It returns "" for an empty or nil slice. It delegates to
 // strings.Join, which sizes the result once instead of reallocating on
 // every element.
 func joinStrings(parts []string, sep string) string {
 	return strings.Join(parts, sep)
 }
--- a/pkg/skill/manager_test.go
+++ b/pkg/skill/manager_test.go
@ -0,0 +1,309 @@
 package skill
 import (
 	"os"
 	"path/filepath"
 	"strings"
 	"testing"
 )
 // createTestSkill writes <dir>/<name>/SKILL.md with frontmatter built from
 // name, description and triggers, followed by body, and returns the path of
 // the written manifest. Any filesystem failure aborts the test.
 func createTestSkill(t *testing.T, dir, name, description string, triggers []string, body string) string {
 	t.Helper()
 	skillDir := filepath.Join(dir, name)
 	if err := os.MkdirAll(skillDir, 0755); err != nil {
 		t.Fatalf("failed to create skill dir: %v", err)
 	}
 	// Render triggers as an inline list of double-quoted items; no triggers
 	// yields "[]".
 	quoted := make([]string, 0, len(triggers))
 	for _, trigger := range triggers {
 		quoted = append(quoted, `"`+trigger+`"`)
 	}
 	var manifest strings.Builder
 	manifest.WriteString("---\n")
 	manifest.WriteString("name: " + name + "\n")
 	manifest.WriteString("description: " + description + "\n")
 	manifest.WriteString("triggers: [" + strings.Join(quoted, ", ") + "]\n")
 	manifest.WriteString("---\n\n")
 	manifest.WriteString(body)
 	manifestPath := filepath.Join(skillDir, "SKILL.md")
 	if err := os.WriteFile(manifestPath, []byte(manifest.String()), 0644); err != nil {
 		t.Fatalf("failed to write SKILL.md: %v", err)
 	}
 	return manifestPath
 }
 // TestNewManager checks that an empty directory argument still produces a
 // manager with a non-empty skills directory.
 func TestNewManager(t *testing.T) {
 	mgr := NewManager("")
 	if mgr == nil {
 		t.Fatal("NewManager() returned nil")
 	}
 	if dir := mgr.SkillsDir(); dir == "" {
 		t.Error("expected non-empty skills directory")
 	}
 }
 // TestNewManagerWithCustomDir checks that an explicit directory is kept as given.
 func TestNewManagerWithCustomDir(t *testing.T) {
 	want := t.TempDir()
 	got := NewManager(want).SkillsDir()
 	if got != want {
 		t.Errorf("expected skills dir %q, got %q", want, got)
 	}
 }
 // TestLoadAllNoDirectory checks that a missing skills directory is treated
 // as "no skills" rather than as an error.
 func TestLoadAllNoDirectory(t *testing.T) {
 	missing := filepath.Join(t.TempDir(), "nonexistent")
 	loaded, err := NewManager(missing).LoadAll()
 	if err != nil {
 		t.Fatalf("LoadAll on nonexistent dir should not error: %v", err)
 	}
 	if loaded != 0 {
 		t.Errorf("expected 0 skills, got %d", loaded)
 	}
 }
 // TestLoadAllWithSkills checks that LoadAll reports every skill directory it finds.
 func TestLoadAllWithSkills(t *testing.T) {
 	root := t.TempDir()
 	createTestSkill(t, root, "skill-a", "Skill A", []string{"alpha", "a"}, "# Skill A\nContent")
 	createTestSkill(t, root, "skill-b", "Skill B", []string{"beta", "b"}, "# Skill B\nContent")
 	mgr := NewManager(root)
 	loaded, err := mgr.LoadAll()
 	if err != nil {
 		t.Fatalf("LoadAll failed: %v", err)
 	}
 	if loaded != 2 {
 		t.Errorf("expected 2 skills, got %d", loaded)
 	}
 }
 // TestGetSkill verifies that a loaded skill can be fetched by name and
 // carries the name and description from its manifest.
 func TestGetSkill(t *testing.T) {
 	tmpDir := t.TempDir()
 	createTestSkill(t, tmpDir, "test-skill", "Test Skill", []string{"test"}, "# Test")
 	m := NewManager(tmpDir)
 	// Fail on a load error so it is not misreported as a missing skill.
 	if _, err := m.LoadAll(); err != nil {
 		t.Fatalf("LoadAll failed: %v", err)
 	}
 	skill, ok := m.GetSkill("test-skill")
 	if !ok {
 		t.Fatal("GetSkill returned false for existing skill")
 	}
 	if skill.Name != "test-skill" {
 		t.Errorf("expected name 'test-skill', got %q", skill.Name)
 	}
 	if skill.Description != "Test Skill" {
 		t.Errorf("expected description 'Test Skill', got %q", skill.Description)
 	}
 }
 // TestGetSkillNotFound verifies that GetSkill reports false for an unknown name.
 func TestGetSkillNotFound(t *testing.T) {
 	m := NewManager(t.TempDir())
 	if _, err := m.LoadAll(); err != nil {
 		t.Fatalf("LoadAll failed: %v", err)
 	}
 	if _, ok := m.GetSkill("nonexistent"); ok {
 		t.Error("expected false for nonexistent skill")
 	}
 }
 // TestListSkills verifies that ListSkills returns every loaded skill sorted
 // alphabetically by name, independent of creation order.
 func TestListSkills(t *testing.T) {
 	tmpDir := t.TempDir()
 	createTestSkill(t, tmpDir, "beta", "Beta", nil, "# Beta")
 	createTestSkill(t, tmpDir, "alpha", "Alpha", nil, "# Alpha")
 	m := NewManager(tmpDir)
 	if _, err := m.LoadAll(); err != nil {
 		t.Fatalf("LoadAll failed: %v", err)
 	}
 	skills := m.ListSkills()
 	want := []string{"alpha", "beta"}
 	if len(skills) != len(want) {
 		t.Fatalf("expected %d skills, got %d", len(want), len(skills))
 	}
 	// Should be sorted alphabetically
 	for i, name := range want {
 		if skills[i].Name != name {
 			t.Errorf("expected skill %d to be %q, got %q", i, name, skills[i].Name)
 		}
 	}
 }
 // TestListSkillsEmpty verifies that an empty skills directory yields an empty list.
 func TestListSkillsEmpty(t *testing.T) {
 	m := NewManager(t.TempDir())
 	if _, err := m.LoadAll(); err != nil {
 		t.Fatalf("LoadAll failed: %v", err)
 	}
 	skills := m.ListSkills()
 	if len(skills) != 0 {
 		t.Errorf("expected empty list, got %d skills", len(skills))
 	}
 }
 // TestFindSkill verifies that FindSkill returns the skill whose triggers
 // appear in the query and leaves out skills with unrelated triggers.
 func TestFindSkill(t *testing.T) {
 	tmpDir := t.TempDir()
 	createTestSkill(t, tmpDir, "browser", "Browser automation", []string{"browser", "navigate", "screenshot"}, "# Browser")
 	createTestSkill(t, tmpDir, "memory", "Project memory", []string{"memory", "remember"}, "# Memory")
 	createTestSkill(t, tmpDir, "convert", "File converter", []string{"convert", "pdf"}, "# Convert")
 	m := NewManager(tmpDir)
 	if _, err := m.LoadAll(); err != nil {
 		t.Fatalf("LoadAll failed: %v", err)
 	}
 	// Find by trigger matching "browser"
 	results := m.FindSkill("I need to use the browser to navigate")
 	if len(results) == 0 {
 		t.Fatal("expected at least 1 match for 'browser'")
 	}
 	found := false
 	for _, s := range results {
 		if s.Name == "browser" {
 			found = true
 			continue
 		}
 		// None of the other skills' triggers occur in the query.
 		t.Errorf("unexpected skill %q in results", s.Name)
 	}
 	if !found {
 		t.Error("expected 'browser' skill in results")
 	}
 }
 // TestFindSkillNoMatch verifies that a query containing no trigger returns nothing.
 func TestFindSkillNoMatch(t *testing.T) {
 	tmpDir := t.TempDir()
 	createTestSkill(t, tmpDir, "browser", "Browser", []string{"browser"}, "# Browser")
 	m := NewManager(tmpDir)
 	if _, err := m.LoadAll(); err != nil {
 		t.Fatalf("LoadAll failed: %v", err)
 	}
 	results := m.FindSkill("completely unrelated query")
 	if len(results) != 0 {
 		t.Errorf("expected 0 matches, got %d", len(results))
 	}
 }
 // TestFindSkillCaseInsensitive verifies that trigger matching ignores the
 // case of both the trigger and the query.
 func TestFindSkillCaseInsensitive(t *testing.T) {
 	tmpDir := t.TempDir()
 	createTestSkill(t, tmpDir, "browser", "Browser", []string{"Browser"}, "# Browser")
 	m := NewManager(tmpDir)
 	if _, err := m.LoadAll(); err != nil {
 		t.Fatalf("LoadAll failed: %v", err)
 	}
 	results := m.FindSkill("browser")
 	if len(results) != 1 {
 		t.Errorf("expected 1 match for lowercase 'browser', got %d", len(results))
 	}
 	results = m.FindSkill("BROWSER")
 	if len(results) != 1 {
 		t.Errorf("expected 1 match for uppercase 'BROWSER', got %d", len(results))
 	}
 }
 // TestFindSkillRelevanceOrder verifies that a skill with more triggers
 // present in the query is ranked ahead of one with fewer.
 func TestFindSkillRelevanceOrder(t *testing.T) {
 	tmpDir := t.TempDir()
 	createTestSkill(t, tmpDir, "multi-match", "Multiple matches", []string{"alpha", "beta", "gamma"}, "# Multi")
 	createTestSkill(t, tmpDir, "single-match", "Single match", []string{"alpha"}, "# Single")
 	m := NewManager(tmpDir)
 	if _, err := m.LoadAll(); err != nil {
 		t.Fatalf("LoadAll failed: %v", err)
 	}
 	// A query mentioning multiple triggers
 	results := m.FindSkill("alpha beta")
 	if len(results) != 2 {
 		t.Fatalf("expected 2 matches, got %d", len(results))
 	}
 	// The multi-match skill should come first (more trigger matches)
 	if results[0].Name != "multi-match" {
 		t.Errorf("expected 'multi-match' first (more relevance), got %q", results[0].Name)
 	}
 }
 // TestReload verifies that a skill added on disk after the initial load is
 // picked up by Reload.
 func TestReload(t *testing.T) {
 	tmpDir := t.TempDir()
 	createTestSkill(t, tmpDir, "initial", "Initial", []string{"init"}, "# Initial")
 	m := NewManager(tmpDir)
 	if _, err := m.LoadAll(); err != nil {
 		t.Fatalf("LoadAll failed: %v", err)
 	}
 	if n := len(m.ListSkills()); n != 1 {
 		t.Errorf("expected 1 skill after load, got %d", n)
 	}
 	// Add another skill
 	createTestSkill(t, tmpDir, "added", "Added later", []string{"new"}, "# New")
 	count, err := m.Reload()
 	if err != nil {
 		t.Fatalf("Reload failed: %v", err)
 	}
 	if count != 2 {
 		t.Errorf("expected 2 skills after reload, got %d", count)
 	}
 }
 // TestSkillMatchTrigger runs MatchTrigger over a table of queries, covering
 // substring hits, a case-differing hit, and a miss.
 func TestSkillMatchTrigger(t *testing.T) {
 	type matchCase struct {
 		query string
 		want  bool
 	}
 	subject := &Skill{Name: "test", Triggers: []string{"browser", "navigate"}}
 	cases := []matchCase{
 		{query: "I need to use the browser", want: true},
 		{query: "navigate to a page", want: true},
 		{query: "Browser automation", want: true},
 		{query: "something unrelated", want: false},
 	}
 	for i := range cases {
 		tc := cases[i]
 		if got := subject.MatchTrigger(tc.query); got != tc.want {
 			t.Errorf("MatchTrigger(%q) = %v, want %v", tc.query, got, tc.want)
 		}
 	}
 }
 // TestSkillHasScripts checks HasScripts with and without script entries.
 func TestSkillHasScripts(t *testing.T) {
 	without := &Skill{Name: "no-scripts"}
 	with := &Skill{Name: "has-scripts", Scripts: []string{"script.sh"}}
 	if got := without.HasScripts(); got {
 		t.Error("expected HasScripts() = false for empty scripts")
 	}
 	if got := with.HasScripts(); !got {
 		t.Error("expected HasScripts() = true for non-empty scripts")
 	}
 }
 // TestExpandHome verifies that "~/..." expands to a path under the user's
 // home directory and that paths without a leading tilde are untouched.
 func TestExpandHome(t *testing.T) {
 	home, err := os.UserHomeDir()
 	if err != nil {
 		t.Fatalf("failed to get home dir: %v", err)
 	}
 	// Compare the whole path: a prefix check would also accept a result
 	// whose remainder was mangled.
 	want := filepath.Join(home, "test", "path")
 	if got := expandHome("~/test/path"); got != want {
 		t.Errorf("expected %q, got %q", want, got)
 	}
 	// Non-tilde path should not change
 	if got := expandHome("/absolute/path"); got != "/absolute/path" {
 		t.Errorf("absolute path should not be modified, got %q", got)
 	}
 }
--- a/pkg/skill/parser.go
+++ b/pkg/skill/parser.go
@ -0,0 +1,246 @@
 package skill
 import (
 	"fmt"
 	"os"
 	"path/filepath"
 	"sort"
 	"strings"
 )
 // Delimiter constants for the YAML frontmatter in SKILL.md files.
 const (
 	// frontmatterDelim is the marker that opens and closes the frontmatter block.
 	frontmatterDelim = "---"
 )
 // ParseSkillFile reads the SKILL.md file at path and parses it into a Skill
 // via ParseSkillData. A read failure is wrapped and returned.
 //
 // The expected format is:
 //
 //	---
 //	name: my-skill
 //	description: Does something useful
 //	triggers: ["keyword1", "keyword2"]
 //	---
 //
 //	# My Skill
 //
 //	Detailed description...
 func ParseSkillFile(path string) (*Skill, error) {
 	raw, readErr := os.ReadFile(path)
 	if readErr == nil {
 		return ParseSkillData(path, raw)
 	}
 	return nil, fmt.Errorf("skill: cannot read %q: %w", path, readErr)
 }
 // ParseSkillData builds a Skill from the raw bytes of a SKILL.md file.
 //
 // path is stored on the Skill as given and is also used to derive the
 // sibling scripts/ directory. The frontmatter must provide a name; the text
 // after the frontmatter becomes the whitespace-trimmed Body. When the
 // scripts/ directory exists, the names of the files in it are recorded.
 func ParseSkillData(path string, data []byte) (*Skill, error) {
 	raw := string(data)
 	skill := &Skill{Path: path, Body: raw, Triggers: []string{}}
 	// Split off the frontmatter and fill in the metadata fields.
 	body, err := parseFrontmatter(raw, skill)
 	if err != nil {
 		return nil, err
 	}
 	skill.Body = strings.TrimSpace(body)
 	// A skill without a name cannot be registered.
 	if skill.Name == "" {
 		return nil, fmt.Errorf("skill: %q is missing 'name' in frontmatter", path)
 	}
 	// The scripts directory sits next to the manifest; it is optional.
 	skill.ScriptsDir = filepath.Join(filepath.Dir(path), "scripts")
 	info, statErr := os.Stat(skill.ScriptsDir)
 	if statErr != nil || !info.IsDir() {
 		return skill, nil
 	}
 	scripts, err := discoverScripts(skill.ScriptsDir)
 	if err != nil {
 		return nil, fmt.Errorf("skill: failed to discover scripts in %q: %w", skill.ScriptsDir, err)
 	}
 	skill.Scripts = scripts
 	return skill, nil
 }
 // parseFrontmatter extracts the frontmatter delimited by "---" markers,
 // populates skill from it, and returns the text following the closing marker.
 //
 // Content that does not start with "---" has no frontmatter and is returned
 // whole (whitespace-trimmed). The closing marker must start a line. An empty
 // frontmatter block, where the closing marker directly follows the opening
 // one, is accepted. An error is returned when no closing marker is found or
 // when the frontmatter itself is invalid.
 func parseFrontmatter(content string, skill *Skill) (string, error) {
 	content = strings.TrimSpace(content)
 	if !strings.HasPrefix(content, frontmatterDelim) {
 		// No frontmatter — treat entire content as body
 		return content, nil
 	}
 	// Skip the opening delimiter and the line break(s) after it.
 	rest := strings.TrimLeft(content[len(frontmatterDelim):], "\n\r")
 	closing := "\n" + frontmatterDelim
 	var frontmatter, body string
 	if endIdx := strings.Index(rest, closing); endIdx >= 0 {
 		frontmatter = rest[:endIdx]
 		body = rest[endIdx+len(closing):]
 	} else if strings.HasPrefix(rest, frontmatterDelim) {
 		// Empty frontmatter: the closing delimiter is the first thing left.
 		// There is no preceding newline to skip here, so the offset is just
 		// the delimiter length; skipping one more byte could slice past the
 		// end of rest.
 		body = rest[len(frontmatterDelim):]
 	} else {
 		return "", fmt.Errorf("skill: unclosed frontmatter in skill file")
 	}
 	// Parse the YAML frontmatter (simple key-value parser)
 	if err := parseSimpleYAML(frontmatter, skill); err != nil {
 		return "", err
 	}
 	return body, nil
 }
 // parseSimpleYAML parses the simplified YAML used in skill frontmatter and
 // stores the recognized keys on skill.
 //
 // Recognized keys are "name", "description" and "triggers"; other keys,
 // blank lines, "#" comment lines and lines without a colon are ignored.
 // Scalar values may be quoted. Triggers may be written inline
 // (triggers: ["a", "b"]) or as a block list:
 //
 //	triggers:
 //	  - a
 //	  - b
 //
 // An error is returned only when the triggers value cannot be parsed.
 func parseSimpleYAML(yaml string, skill *Skill) error {
 	// inTriggerList is true while consuming "- item" lines that follow a
 	// "triggers:" key with no inline value.
 	inTriggerList := false
 	for _, line := range strings.Split(yaml, "\n") {
 		line = strings.TrimSpace(line)
 		if line == "" || strings.HasPrefix(line, "#") {
 			continue
 		}
 		if inTriggerList {
 			if line == "-" || strings.HasPrefix(line, "- ") {
 				if item := trimQuotes(line[1:]); item != "" {
 					skill.Triggers = append(skill.Triggers, item)
 				}
 				continue
 			}
 			// Any other line ends the block list and is handled normally.
 			inTriggerList = false
 		}
 		colonIdx := strings.Index(line, ":")
 		if colonIdx < 0 {
 			continue
 		}
 		key := strings.TrimSpace(line[:colonIdx])
 		value := strings.TrimSpace(line[colonIdx+1:])
 		switch key {
 		case "name":
 			skill.Name = trimQuotes(value)
 		case "description":
 			skill.Description = trimQuotes(value)
 		case "triggers":
 			if value == "" {
 				// Block-style list: items follow on subsequent lines.
 				skill.Triggers = []string{}
 				inTriggerList = true
 				continue
 			}
 			triggers, err := parseYAMLArray(value)
 			if err != nil {
 				return fmt.Errorf("skill: invalid triggers format: %w", err)
 			}
 			skill.Triggers = triggers
 		}
 	}
 	return nil
 }
 // parseYAMLArray turns an inline YAML list such as '["a", "b", "c"]' or
 // '[a, b, c]' into a slice of unquoted strings.
 //
 // A value that is not wrapped in brackets is treated as a one-element list;
 // an empty value or an empty pair of brackets yields an empty, non-nil
 // slice. Dash-style block lists are not handled by this function. The error
 // result is currently always nil.
 func parseYAMLArray(value string) ([]string, error) {
 	value = strings.TrimSpace(value)
 	bracketed := strings.HasPrefix(value, "[") && strings.HasSuffix(value, "]")
 	switch {
 	case bracketed:
 		inner := value[1 : len(value)-1]
 		if strings.TrimSpace(inner) == "" {
 			return []string{}, nil
 		}
 		pieces := splitCommas(inner)
 		items := make([]string, 0, len(pieces))
 		for _, piece := range pieces {
 			items = append(items, trimQuotes(strings.TrimSpace(piece)))
 		}
 		return items, nil
 	case value == "":
 		return []string{}, nil
 	default:
 		// A bare scalar stands for a single-element list.
 		return []string{trimQuotes(value)}, nil
 	}
 }
 // splitCommas cuts s at every comma that is not inside a single- or
 // double-quoted section. Quote characters are kept in the returned pieces,
 // and a quoted section ends at the next occurrence of the character that
 // opened it. A trailing empty piece is dropped; empty pieces elsewhere are
 // kept. The result is nil for an empty input.
 func splitCommas(s string) []string {
 	var (
 		pieces []string
 		buf    strings.Builder
 		quote  byte // the quote character currently open; 0 when outside quotes
 	)
 	for _, ch := range []byte(s) {
 		switch {
 		case quote != 0:
 			buf.WriteByte(ch)
 			if ch == quote {
 				quote = 0
 			}
 		case ch == '"' || ch == '\'':
 			buf.WriteByte(ch)
 			quote = ch
 		case ch == ',':
 			pieces = append(pieces, buf.String())
 			buf.Reset()
 		default:
 			buf.WriteByte(ch)
 		}
 	}
 	if buf.Len() > 0 {
 		pieces = append(pieces, buf.String())
 	}
 	return pieces
 }
 // trimQuotes trims surrounding whitespace from s and then strips one pair of
 // matching single or double quotes if the value is wrapped in them.
 // Mismatched or lone quote characters are left in place.
 func trimQuotes(s string) string {
 	trimmed := strings.TrimSpace(s)
 	if len(trimmed) < 2 {
 		return trimmed
 	}
 	first, last := trimmed[0], trimmed[len(trimmed)-1]
 	if first == last && (first == '"' || first == '\'') {
 		return trimmed[1 : len(trimmed)-1]
 	}
 	return trimmed
 }
 // discoverScripts returns the sorted names of all non-directory entries
 // directly inside scriptsDir. Subdirectories are skipped and no permission
 // or file-type filtering is applied. The result is nil when there are no
 // such entries; a failure to read the directory is returned as-is.
 func discoverScripts(scriptsDir string) ([]string, error) {
 	dirEntries, err := os.ReadDir(scriptsDir)
 	if err != nil {
 		return nil, err
 	}
 	var names []string
 	for i := range dirEntries {
 		if item := dirEntries[i]; !item.IsDir() {
 			names = append(names, item.Name())
 		}
 	}
 	sort.Strings(names)
 	return names, nil
 }
 // LoadSkillFromDir parses the SKILL.md manifest located directly inside dir.
 // It returns an error when the manifest does not exist; otherwise the result
 // of ParseSkillFile is returned.
 func LoadSkillFromDir(dir string) (*Skill, error) {
 	manifest := filepath.Join(dir, "SKILL.md")
 	_, statErr := os.Stat(manifest)
 	if os.IsNotExist(statErr) {
 		return nil, fmt.Errorf("skill: no SKILL.md found in %q", dir)
 	}
 	return ParseSkillFile(manifest)
 }
--- a/pkg/skill/skill.go
+++ b/pkg/skill/skill.go
@ -0,0 +1,56 @@
 // Package skill provides the Skill definition and management system.
 //
 // Skills are composable capabilities loaded from ~/.agents/skills/.
 // Each skill has a SKILL.md manifest with YAML frontmatter and optional
 // scripts in a scripts/ subdirectory. Skills can be discovered and
 // invoked by trigger keywords.
 package skill
 import (
 	"fmt"
 	"strings"
 )
 // Skill represents a composable capability loaded from the skills directory.
 //
 // Each Skill is defined by a SKILL.md file with YAML frontmatter containing
 // metadata (name, description, triggers) and optional executable scripts
 // in a scripts/ subdirectory.
 type Skill struct {
 	// Name is the unique identifier for this skill (e.g., "dev-browser").
 	// It comes from the "name" frontmatter key and is required by the parser.
 	Name string `yaml:"name"`
 	// Description is a human-readable explanation of what this skill does.
 	Description string `yaml:"description"`
 	// Triggers are keywords that activate this skill from natural language.
 	// MatchTrigger compares them case-insensitively as substrings of a query.
 	Triggers []string `yaml:"triggers"`
 	// Scripts is the list of script file names in the scripts/ directory.
 	Scripts []string `yaml:"-"`
 	// ScriptsDir is the path to the scripts/ directory next to the SKILL.md
 	// file. It is derived from Path, so it is absolute only if Path is.
 	ScriptsDir string `yaml:"-"`
 	// Body is the markdown content after the YAML frontmatter.
 	Body string `yaml:"-"`
 	// Path is the path to the SKILL.md file as it was passed to the parser.
 	// NOTE(review): the parser does not convert it to an absolute path.
 	Path string `yaml:"-"`
 }
 // MatchTrigger reports whether any of the skill's triggers occurs in query.
 // Matching is case-insensitive and substring-based, so a trigger matches
 // when it appears anywhere inside the query. Empty triggers are ignored: an
 // empty string is a substring of every query and would otherwise make the
 // skill match unconditionally.
 func (s *Skill) MatchTrigger(query string) bool {
 	// Lowercase the query once; only the triggers vary per iteration.
 	query = strings.ToLower(query)
 	for _, trigger := range s.Triggers {
 		if trigger == "" {
 			continue
 		}
 		if strings.Contains(query, strings.ToLower(trigger)) {
 			return true
 		}
 	}
 	return false
 }
 // String formats the skill for logs and debugging, showing its quoted name,
 // its triggers, and the number of scripts.
 func (s *Skill) String() string {
 	scriptCount := len(s.Scripts)
 	return fmt.Sprintf("Skill{Name: %q, Triggers: %v, Scripts: %d}", s.Name, s.Triggers, scriptCount)
 }
 // HasScripts reports whether the skill's Scripts list is non-empty.
 func (s *Skill) HasScripts() bool {
 	return len(s.Scripts) != 0
 }
--- a/pkg/tool/builtin.go
+++ b/pkg/tool/builtin.go
@ -0,0 +1,433 @@
 package tool
 import (
 	"context"
 	"encoding/json"
 	"fmt"
 	"os"
 	"path/filepath"
 	"strings"
 	"time"
 	"github.com/orca/orca/pkg/sandbox"
 )
 // ---------------------------------------------------------------------------
 // exec — Execute a shell command via the sandbox
 // ---------------------------------------------------------------------------
 // execTool runs shell commands through a sandbox.Sandbox.
 type execTool struct {
 	sandbox sandbox.Sandbox
 }
 // NewExecTool creates a new exec tool backed by the given sandbox. A nil
 // sandbox is replaced with sandbox.NewProcessSandbox().
 func NewExecTool(sb sandbox.Sandbox) Tool {
 	if sb == nil {
 		sb = sandbox.NewProcessSandbox()
 	}
 	return &execTool{sandbox: sb}
 }
 // Name returns the tool identifier "exec".
 func (t *execTool) Name() string { return "exec" }
 // Description returns the human-readable summary of the exec tool.
 func (t *execTool) Description() string {
 	return "Execute a shell command and return its output. Use this for running scripts, " +
 		"installing packages, compiling code, or any command-line operation."
 }
 // Parameters describes the arguments accepted by Execute: a required
 // "command" plus optional "timeout" (seconds) and "workdir".
 func (t *execTool) Parameters() map[string]ParameterSchema {
 	return map[string]ParameterSchema{
 		"command": {
 			Type:        "string",
 			Description: "The shell command to execute (e.g., 'ls -la' or 'python script.py')",
 			Required:    true,
 		},
 		"timeout": {
 			Type:        "number",
 			Description: "Timeout in seconds for the command execution (default: 30)",
 			Required:    false,
 			Default:     float64(30),
 		},
 		"workdir": {
 			Type:        "string",
 			Description: "Working directory for the command (default: sandbox default)",
 			Required:    false,
 		},
 	}
 }
 // Execute runs args["command"] via `sh -c` in the sandbox.
 //
 // A missing or empty command yields a failed Result with a nil error. A
 // sandbox failure is returned as a wrapped Go error. Otherwise the Result
 // carries stdout, stderr and exit_code, and Success is true only when the
 // exit code is 0.
 func (t *execTool) Execute(ctx context.Context, args map[string]interface{}) (*Result, error) {
 	cmdStr, ok := args["command"].(string)
 	if !ok || cmdStr == "" {
 		return ErrorResult("'command' argument is required and must be a string"), nil
 	}
 	// Derive a deadline only for a positive, convertible "timeout"; any other
 	// value leaves the caller's context untouched.
 	// NOTE(review): the schema advertises a 30s default, but nothing here
 	// applies it when "timeout" is absent — confirm whether the sandbox
 	// enforces its own default.
 	execCtx := ctx
 	if timeoutVal, ok := args["timeout"]; ok {
 		if timeout, err := toFloat64(timeoutVal); err == nil && timeout > 0 {
 			var cancel context.CancelFunc
 			execCtx, cancel = context.WithTimeout(ctx, time.Duration(timeout*float64(time.Second)))
 			defer cancel()
 		}
 	}
 	// Apply the working directory for this call only. The sandbox is shared
 	// by every call made through this tool, so the previous directory is put
 	// back on return; otherwise one call's workdir would silently become the
 	// default for all later commands.
 	sb := t.sandbox
 	if wd, ok := args["workdir"].(string); ok && wd != "" {
 		if ps, ok := sb.(*sandbox.ProcessSandbox); ok {
 			prev := ps.WorkingDir
 			ps.WorkingDir = wd
 			defer func() { ps.WorkingDir = prev }()
 		}
 	}
 	// Execute the command via shell
 	result, err := sb.Execute(execCtx, "sh", "-c", cmdStr)
 	if err != nil {
 		return nil, fmt.Errorf("exec tool: %w", err)
 	}
 	return &Result{
 		Success: result.ExitCode == 0,
 		Data: map[string]interface{}{
 			"stdout":    result.Stdout,
 			"stderr":    result.Stderr,
 			"exit_code": result.ExitCode,
 		},
 	}, nil
 }
 // ---------------------------------------------------------------------------
 // read_file — Read the contents of a file
 // ---------------------------------------------------------------------------
 // readFileTool reads a whole regular file into memory.
 type readFileTool struct{}
 // NewReadFileTool creates the read_file tool.
 func NewReadFileTool() Tool { return &readFileTool{} }
 // Name returns the tool identifier "read_file".
 func (t *readFileTool) Name() string { return "read_file" }
 // Description returns the human-readable summary of the read_file tool.
 func (t *readFileTool) Description() string {
 	return "Read the contents of a file from the local filesystem. Returns the file content as a string."
 }
 // Parameters describes the single required "path" argument.
 func (t *readFileTool) Parameters() map[string]ParameterSchema {
 	return map[string]ParameterSchema{
 		"path": {
 			Type:        "string",
 			Description: "Absolute path to the file to read",
 			Required:    true,
 		},
 	}
 }
 // Execute reads the file at args["path"] and returns its path, content and
 // size in bytes. Every failure (bad argument, inaccessible path, directory,
 // non-regular file, read error) is reported as a failed Result with a nil
 // error.
 func (t *readFileTool) Execute(ctx context.Context, args map[string]interface{}) (*Result, error) {
 	path, ok := args["path"].(string)
 	if !ok || path == "" {
 		return ErrorResult("'path' argument is required and must be a string"), nil
 	}
 	// Only regular files are read. os.Stat follows symlinks, so a link to a
 	// regular file is accepted. This does not restrict which paths may be
 	// read; it only rejects file kinds that cannot be read to completion.
 	info, err := os.Stat(path)
 	if err != nil {
 		return ErrorResult(fmt.Sprintf("cannot access %q: %v", path, err)), nil
 	}
 	if info.IsDir() {
 		return ErrorResult(fmt.Sprintf("%q is a directory, not a file", path)), nil
 	}
 	// FIFOs, sockets and devices can block forever or never reach EOF.
 	if !info.Mode().IsRegular() {
 		return ErrorResult(fmt.Sprintf("%q is not a regular file", path)), nil
 	}
 	data, err := os.ReadFile(path)
 	if err != nil {
 		return ErrorResult(fmt.Sprintf("failed to read %q: %v", path, err)), nil
 	}
 	return SuccessResult(map[string]interface{}{
 		"path":    path,
 		"content": string(data),
 		"size":    len(data),
 	}), nil
 }
 // ---------------------------------------------------------------------------
 // write_file — Write content to a file
 // ---------------------------------------------------------------------------
 // writeFileTool writes string content to a path, creating parent directories.
 type writeFileTool struct{}
 // NewWriteFileTool creates the write_file tool.
 func NewWriteFileTool() Tool { return &writeFileTool{} }
 // Name returns the tool identifier "write_file".
 func (t *writeFileTool) Name() string { return "write_file" }
 // Description returns the human-readable summary of the write_file tool.
 func (t *writeFileTool) Description() string {
 	return "Write content to a file on the local filesystem. Creates parent directories if needed."
 }
 // Parameters describes the two required arguments, "path" and "content".
 func (t *writeFileTool) Parameters() map[string]ParameterSchema {
 	pathSchema := ParameterSchema{
 		Type:        "string",
 		Description: "Absolute path where the file should be written",
 		Required:    true,
 	}
 	contentSchema := ParameterSchema{
 		Type:        "string",
 		Description: "The content to write to the file",
 		Required:    true,
 	}
 	return map[string]ParameterSchema{
 		"path":    pathSchema,
 		"content": contentSchema,
 	}
 }
 // Execute writes args["content"] to args["path"] with mode 0644, creating
 // missing parent directories with mode 0755. Failures are reported as a
 // failed Result with a nil error; on success the Result holds the path and
 // the number of bytes in the content.
 func (t *writeFileTool) Execute(ctx context.Context, args map[string]interface{}) (*Result, error) {
 	target, isString := args["path"].(string)
 	if target == "" || !isString {
 		return ErrorResult("'path' argument is required and must be a string"), nil
 	}
 	// Empty content is allowed; only a missing or non-string value is rejected.
 	body, isString := args["content"].(string)
 	if !isString {
 		return ErrorResult("'content' argument is required and must be a string"), nil
 	}
 	if mkErr := os.MkdirAll(filepath.Dir(target), 0755); mkErr != nil {
 		msg := fmt.Sprintf("failed to create directories for %q: %v", target, mkErr)
 		return ErrorResult(msg), nil
 	}
 	if writeErr := os.WriteFile(target, []byte(body), 0644); writeErr != nil {
 		msg := fmt.Sprintf("failed to write %q: %v", target, writeErr)
 		return ErrorResult(msg), nil
 	}
 	summary := map[string]interface{}{
 		"path": target,
 		"size": len(body),
 	}
 	return SuccessResult(summary), nil
 }
 // ---------------------------------------------------------------------------
 // list_dir — List the contents of a directory
 // ---------------------------------------------------------------------------
 // listDirTool lists directory entries, optionally descending recursively.
 type listDirTool struct{}
 // NewListDirTool creates the list_dir tool.
 func NewListDirTool() Tool { return &listDirTool{} }
 // Name returns the tool identifier "list_dir".
 func (t *listDirTool) Name() string { return "list_dir" }
 // Description returns the human-readable summary of the list_dir tool.
 func (t *listDirTool) Description() string {
 	return "List files and directories in a given path. Returns names, sizes, and modification times."
 }
 // Parameters describes the required "path" and the optional "recursive" flag.
 func (t *listDirTool) Parameters() map[string]ParameterSchema {
 	return map[string]ParameterSchema{
 		"path": {
 			Type:        "string",
 			Description: "Absolute path to the directory to list",
 			Required:    true,
 		},
 		"recursive": {
 			Type:        "boolean",
 			Description: "Whether to list recursively (default: false)",
 			Required:    false,
 			Default:     false,
 		},
 	}
 }
 // Execute lists the directory at args["path"].
 //
 // With "recursive" set, every descendant is reported with a name relative to
 // the listed directory, and the walk stops with a failed Result on the first
 // error or once ctx is cancelled. Without it, only direct children are
 // reported and children whose metadata cannot be read are skipped. All
 // failures are returned as a failed Result with a nil error.
 func (t *listDirTool) Execute(ctx context.Context, args map[string]interface{}) (*Result, error) {
 	path, ok := args["path"].(string)
 	if !ok || path == "" {
 		return ErrorResult("'path' argument is required and must be a string"), nil
 	}
 	// An absent or non-boolean "recursive" value means a flat listing.
 	recursive, _ := args["recursive"].(bool)
 	info, err := os.Stat(path)
 	if err != nil {
 		return ErrorResult(fmt.Sprintf("cannot access %q: %v", path, err)), nil
 	}
 	if !info.IsDir() {
 		return ErrorResult(fmt.Sprintf("%q is not a directory", path)), nil
 	}
 	// Start from an empty, non-nil slice so that an empty directory is
 	// serialized as [] rather than null.
 	entries := []map[string]interface{}{}
 	if recursive {
 		walkErr := filepath.Walk(path, func(p string, fi os.FileInfo, err error) error {
 			if err != nil {
 				return err
 			}
 			// Stop promptly when the caller gives up on a large tree.
 			if ctxErr := ctx.Err(); ctxErr != nil {
 				return ctxErr
 			}
 			rel, relErr := filepath.Rel(path, p)
 			if relErr != nil {
 				return relErr
 			}
 			// The root itself is not an entry of its own listing.
 			if rel == "." {
 				return nil
 			}
 			entries = append(entries, entryToMap(p, rel, fi))
 			return nil
 		})
 		if walkErr != nil {
 			return ErrorResult(fmt.Sprintf("failed to list %q: %v", path, walkErr)), nil
 		}
 	} else {
 		files, readErr := os.ReadDir(path)
 		if readErr != nil {
 			return ErrorResult(fmt.Sprintf("failed to list %q: %v", path, readErr)), nil
 		}
 		for _, f := range files {
 			fi, infoErr := f.Info()
 			if infoErr != nil {
 				// Best effort: the entry may have vanished since ReadDir.
 				continue
 			}
 			fullPath := filepath.Join(path, f.Name())
 			entries = append(entries, entryToMap(fullPath, f.Name(), fi))
 		}
 	}
 	return SuccessResult(map[string]interface{}{
 		"path":    path,
 		"entries": entries,
 		"count":   len(entries),
 	}), nil
 }
 // entryToMap converts one directory entry into the map reported by list_dir:
 // the display name, the full path, and the size, directory flag, mode string
 // and modification time taken from fi.
 func entryToMap(fullPath, name string, fi os.FileInfo) map[string]interface{} {
 	entry := make(map[string]interface{}, 6)
 	entry["name"] = name
 	entry["path"] = fullPath
 	entry["size"] = fi.Size()
 	entry["is_dir"] = fi.IsDir()
 	entry["mode"] = fi.Mode().String()
 	// Timestamp layout with a numeric zone offset.
 	entry["modtime"] = fi.ModTime().Format("2006-01-02T15:04:05Z07:00")
 	return entry
 }
 // ---------------------------------------------------------------------------
 // search_files — Search for content in files
 // ---------------------------------------------------------------------------
 // searchFilesTool finds files under a directory whose content contains a
 // given substring.
 type searchFilesTool struct{}
 // NewSearchFilesTool creates the search_files tool.
 func NewSearchFilesTool() Tool { return &searchFilesTool{} }
 // Name returns the tool identifier "search_files".
 func (t *searchFilesTool) Name() string { return "search_files" }
 // Description returns the human-readable summary of the search_files tool.
 func (t *searchFilesTool) Description() string {
 	return "Search for a pattern in files within a directory. Supports simple substring matching."
 }
 // Parameters describes the required "pattern" and the optional "path" and
 // "include" arguments.
 func (t *searchFilesTool) Parameters() map[string]ParameterSchema {
 	return map[string]ParameterSchema{
 		"pattern": {
 			Type:        "string",
 			Description: "The text pattern to search for (substring match)",
 			Required:    true,
 		},
 		"path": {
 			Type:        "string",
 			Description: "Directory to search in (default: current directory)",
 			Required:    false,
 			Default:     ".",
 		},
 		"include": {
 			Type:        "string",
 			Description: "File glob pattern to include (e.g., '*.go', '*.{ts,tsx}')",
 			Required:    false,
 		},
 	}
 }
 // Execute walks args["path"] (default ".") and reports every file whose
 // content contains args["pattern"].
 //
 // The optional "include" glob is matched against the file's base name.
 // Brace alternatives such as '*.{ts,tsx}' are expanded first because
 // filepath.Match has no brace syntax, and a malformed glob is reported as a
 // failed Result rather than silently matching nothing. Only regular files,
 // or symlinks resolving to one, are read. Inaccessible or unreadable files
 // are skipped, and the walk stops once ctx is cancelled. All failures are
 // returned as a failed Result with a nil error.
 func (t *searchFilesTool) Execute(ctx context.Context, args map[string]interface{}) (*Result, error) {
 	pattern, ok := args["pattern"].(string)
 	if !ok || pattern == "" {
 		return ErrorResult("'pattern' argument is required and must be a string"), nil
 	}
 	searchPath := "."
 	if p, ok := args["path"].(string); ok && p != "" {
 		searchPath = p
 	}
 	include, _ := args["include"].(string)
 	var globs []string
 	if include != "" {
 		globs = expandBraces(include)
 		for _, g := range globs {
 			// Matching against "" is enough to surface a syntax error.
 			if _, err := filepath.Match(g, ""); err != nil {
 				return ErrorResult(fmt.Sprintf("invalid include pattern %q: %v", include, err)), nil
 			}
 		}
 	}
 	// included reports whether a base name passes the include filter.
 	included := func(name string) bool {
 		if len(globs) == 0 {
 			return true
 		}
 		for _, g := range globs {
 			if matched, err := filepath.Match(g, name); err == nil && matched {
 				return true
 			}
 		}
 		return false
 	}
 	// Verify search path exists
 	info, err := os.Stat(searchPath)
 	if err != nil {
 		return ErrorResult(fmt.Sprintf("cannot access search path %q: %v", searchPath, err)), nil
 	}
 	if !info.IsDir() {
 		return ErrorResult(fmt.Sprintf("%q is not a directory", searchPath)), nil
 	}
 	// Non-nil so that "no matches" is serialized as [] rather than null.
 	matches := []map[string]interface{}{}
 	err = filepath.Walk(searchPath, func(p string, fi os.FileInfo, walkErr error) error {
 		if ctxErr := ctx.Err(); ctxErr != nil {
 			return ctxErr
 		}
 		if walkErr != nil {
 			return nil // skip files we can't access
 		}
 		if fi.IsDir() || !included(fi.Name()) {
 			return nil
 		}
 		// Reading a FIFO, socket or device could block forever.
 		if !isSearchableFile(p, fi) {
 			return nil
 		}
 		data, readErr := os.ReadFile(p)
 		if readErr != nil {
 			return nil // skip unreadable files
 		}
 		if strings.Contains(string(data), pattern) {
 			matches = append(matches, map[string]interface{}{
 				"path": p,
 				"size": len(data),
 			})
 		}
 		return nil
 	})
 	if err != nil {
 		return ErrorResult(fmt.Sprintf("search failed: %v", err)), nil
 	}
 	return SuccessResult(map[string]interface{}{
 		"pattern": pattern,
 		"path":    searchPath,
 		"matches": matches,
 		"count":   len(matches),
 	}), nil
 }
 // isSearchableFile reports whether p is a regular file or a symlink that
 // resolves to one. fi is the entry's own (unresolved) metadata.
 func isSearchableFile(p string, fi os.FileInfo) bool {
 	if fi.Mode().IsRegular() {
 		return true
 	}
 	if fi.Mode()&os.ModeSymlink == 0 {
 		return false
 	}
 	target, err := os.Stat(p)
 	return err == nil && target.Mode().IsRegular()
 }
 // expandBraces expands "{a,b}" alternatives in a glob into the list of plain
 // patterns they stand for, handling nested groups recursively. A pattern
 // without a complete brace group is returned unchanged as the only element.
 func expandBraces(pattern string) []string {
 	open := strings.IndexByte(pattern, '{')
 	if open < 0 {
 		return []string{pattern}
 	}
 	// Locate the brace that closes the first group, honouring nesting.
 	end := -1
 	depth := 0
 	for i := open; i < len(pattern) && end < 0; i++ {
 		switch pattern[i] {
 		case '{':
 			depth++
 		case '}':
 			depth--
 			if depth == 0 {
 				end = i
 			}
 		}
 	}
 	if end < 0 {
 		return []string{pattern}
 	}
 	prefix, body, suffix := pattern[:open], pattern[open+1:end], pattern[end+1:]
 	// Split the group body on commas that are not inside a nested group.
 	var alternatives []string
 	depth = 0
 	start := 0
 	for i := 0; i < len(body); i++ {
 		switch body[i] {
 		case '{':
 			depth++
 		case '}':
 			depth--
 		case ',':
 			if depth == 0 {
 				alternatives = append(alternatives, body[start:i])
 				start = i + 1
 			}
 		}
 	}
 	alternatives = append(alternatives, body[start:])
 	var expanded []string
 	for _, alt := range alternatives {
 		// Each recursion consumes one group, so this terminates.
 		expanded = append(expanded, expandBraces(prefix+alt+suffix)...)
 	}
 	return expanded
 }
 // ---------------------------------------------------------------------------
 // Helpers
 // ---------------------------------------------------------------------------
 // toFloat64 converts an interface{} value to float64.
 //
 // It accepts every built-in float, signed and unsigned integer type, plus
 // json.Number. Any other type (including nil and numeric strings) yields an
 // error naming the offending type; a json.Number that does not parse yields
 // the parse error.
 func toFloat64(v interface{}) (float64, error) {
 	switch val := v.(type) {
 	case float64:
 		return val, nil
 	case float32:
 		return float64(val), nil
 	case int:
 		return float64(val), nil
 	case int8:
 		return float64(val), nil
 	case int16:
 		return float64(val), nil
 	case int32:
 		return float64(val), nil
 	case int64:
 		return float64(val), nil
 	case uint:
 		return float64(val), nil
 	case uint8:
 		return float64(val), nil
 	case uint16:
 		return float64(val), nil
 	case uint32:
 		return float64(val), nil
 	case uint64:
 		return float64(val), nil
 	case json.Number:
 		return val.Float64()
 	default:
 		return 0, fmt.Errorf("cannot convert %T to float64", v)
 	}
 }
 // Compile-time assertions that every built-in tool type implements Tool.
 var (
 	_ Tool = (*execTool)(nil)
 	_ Tool = (*readFileTool)(nil)
 	_ Tool = (*writeFileTool)(nil)
 	_ Tool = (*listDirTool)(nil)
 	_ Tool = (*searchFilesTool)(nil)
 )
--- a/pkg/tool/builtin_test.go
+++ b/pkg/tool/builtin_test.go
@ -0,0 +1,399 @@
 package tool
 import (
 	"context"
 	"os"
 	"path/filepath"
 	"strings"
 	"testing"
 	"github.com/orca/orca/pkg/sandbox"
 )
 func TestExecTool(t *testing.T) {
 	sb := sandbox.NewProcessSandbox()
 	execT := NewExecTool(sb)
 	if execT.Name() != "exec" {
 		t.Errorf("expected name 'exec', got %q", execT.Name())
 	}
 	if execT.Description() == "" {
 		t.Error("expected non-empty description")
 	}
 	params := execT.Parameters()
 	if _, ok := params["command"]; !ok {
 		t.Error("expected 'command' parameter")
 	}
 }
 // TestExecToolExecute runs `echo hello` through the exec tool and checks the
 // captured stdout. Each precondition is fatal and every type assertion is
 // checked, so a malformed Result fails this test instead of panicking and
 // aborting the whole test binary.
 func TestExecToolExecute(t *testing.T) {
 	sb := sandbox.NewProcessSandbox()
 	execT := NewExecTool(sb)
 	ctx := context.Background()
 	result, err := execT.Execute(ctx, map[string]interface{}{
 		"command": "echo hello",
 	})
 	if err != nil {
 		t.Fatalf("Execute failed: %v", err)
 	}
 	if !result.Success {
 		t.Fatalf("expected success, got error: %s", result.Error)
 	}
 	data, ok := result.Data.(map[string]interface{})
 	if !ok {
 		t.Fatalf("expected map data, got %T", result.Data)
 	}
 	stdout, ok := data["stdout"].(string)
 	if !ok {
 		t.Fatalf("expected string stdout, got %T", data["stdout"])
 	}
 	if strings.TrimSpace(stdout) != "hello" {
 		t.Errorf("expected stdout 'hello', got %q", stdout)
 	}
 }
 func TestExecToolMissingCommand(t *testing.T) {
 	sb := sandbox.NewProcessSandbox()
 	execT := NewExecTool(sb)
 	ctx := context.Background()
 	result, err := execT.Execute(ctx, map[string]interface{}{})
 	if err != nil {
 		t.Fatalf("Execute should not error for invalid args: %v", err)
 	}
 	if result.Success {
 		t.Error("expected failure for missing command")
 	}
 	if !strings.Contains(result.Error, "command") {
 		t.Errorf("error should mention 'command', got: %s", result.Error)
 	}
 }
 // TestReadFileTool verifies the name reported by the read_file tool.
 func TestReadFileTool(t *testing.T) {
 	if got := NewReadFileTool().Name(); got != "read_file" {
 		t.Errorf("expected name 'read_file', got %q", got)
 	}
 }
 // TestReadFileToolExecute writes a fixture file and checks that read_file
 // returns its exact content. The fixture lives in t.TempDir(), so it is
 // removed even when setup fails part-way, and type assertions are checked so
 // a malformed Result fails the test instead of panicking.
 func TestReadFileToolExecute(t *testing.T) {
 	content := "test content\nline 2\n"
 	fixture := filepath.Join(t.TempDir(), "orca-test.txt")
 	if err := os.WriteFile(fixture, []byte(content), 0644); err != nil {
 		t.Fatalf("failed to write temp file: %v", err)
 	}
 	readT := NewReadFileTool()
 	ctx := context.Background()
 	result, err := readT.Execute(ctx, map[string]interface{}{
 		"path": fixture,
 	})
 	if err != nil {
 		t.Fatalf("Execute failed: %v", err)
 	}
 	if !result.Success {
 		t.Fatalf("expected success, got error: %s", result.Error)
 	}
 	data, ok := result.Data.(map[string]interface{})
 	if !ok {
 		t.Fatalf("expected map data, got %T", result.Data)
 	}
 	gotContent, ok := data["content"].(string)
 	if !ok {
 		t.Fatalf("expected string content, got %T", data["content"])
 	}
 	if gotContent != content {
 		t.Errorf("expected content %q, got %q", content, gotContent)
 	}
 }
 // TestReadFileToolMissingPath checks that calling read_file without "path"
 // yields a failed Result and no Go error.
 func TestReadFileToolMissingPath(t *testing.T) {
 	noArgs := map[string]interface{}{}
 	res, execErr := NewReadFileTool().Execute(context.Background(), noArgs)
 	if execErr != nil {
 		t.Fatalf("Execute should not error for invalid args: %v", execErr)
 	}
 	if res.Success {
 		t.Error("expected failure for missing path")
 	}
 }
 // TestReadFileToolNonexistent checks that a path which does not exist is
 // reported as a failed Result rather than a Go error.
 func TestReadFileToolNonexistent(t *testing.T) {
 	missing := map[string]interface{}{
 		"path": "/nonexistent/path/that/does/not/exist.txt",
 	}
 	res, execErr := NewReadFileTool().Execute(context.Background(), missing)
 	if execErr != nil {
 		t.Fatalf("Execute should not error for missing file: %v", execErr)
 	}
 	if res.Success {
 		t.Error("expected failure for nonexistent file")
 	}
 }
 // TestWriteFileTool verifies the name reported by the write_file tool.
 func TestWriteFileTool(t *testing.T) {
 	if got := NewWriteFileTool().Name(); got != "write_file" {
 		t.Errorf("expected name 'write_file', got %q", got)
 	}
 }
 // TestWriteFileToolExecute writes to a path whose parent directory does not
 // exist yet and confirms that the file ends up on disk with the requested
 // content.
 func TestWriteFileToolExecute(t *testing.T) {
 	root, mkErr := os.MkdirTemp("", "orca-write-test-*")
 	if mkErr != nil {
 		t.Fatalf("failed to create temp dir: %v", mkErr)
 	}
 	defer os.RemoveAll(root)
 	const content = "hello world"
 	// "nested" is missing on purpose: the tool must create it.
 	testPath := filepath.Join(root, "nested", "test.txt")
 	callArgs := map[string]interface{}{
 		"path":    testPath,
 		"content": content,
 	}
 	res, execErr := NewWriteFileTool().Execute(context.Background(), callArgs)
 	if execErr != nil {
 		t.Fatalf("Execute failed: %v", execErr)
 	}
 	if !res.Success {
 		t.Errorf("expected success, got error: %s", res.Error)
 	}
 	// Verify the file was written
 	written, readErr := os.ReadFile(testPath)
 	if readErr != nil {
 		t.Fatalf("failed to read written file: %v", readErr)
 	}
 	if got := string(written); got != content {
 		t.Errorf("expected content %q, got %q", content, got)
 	}
 }
 // TestWriteFileToolMissingArgs checks that write_file rejects calls lacking
 // "path" or "content" with a failed Result and no Go error. The
 // missing-content case targets a path inside t.TempDir() rather than a fixed
 // /tmp location, so a validation regression cannot clobber a real file, and
 // the test also asserts that nothing was written.
 func TestWriteFileToolMissingArgs(t *testing.T) {
 	writeT := NewWriteFileTool()
 	ctx := context.Background()
 	// Missing path
 	result, err := writeT.Execute(ctx, map[string]interface{}{
 		"content": "test",
 	})
 	if err != nil {
 		t.Fatalf("Execute should not error for invalid args: %v", err)
 	}
 	if result.Success {
 		t.Error("expected failure for missing path")
 	}
 	// Missing content
 	target := filepath.Join(t.TempDir(), "test.txt")
 	result, err = writeT.Execute(ctx, map[string]interface{}{
 		"path": target,
 	})
 	if err != nil {
 		t.Fatalf("Execute should not error for invalid args: %v", err)
 	}
 	if result.Success {
 		t.Error("expected failure for missing content")
 	}
 	if _, statErr := os.Stat(target); statErr == nil {
 		t.Errorf("no file should be written when content is missing, but %q exists", target)
 	}
 }
 // TestListDirTool verifies the name reported by the list_dir tool.
 func TestListDirTool(t *testing.T) {
 	if got := NewListDirTool().Name(); got != "list_dir" {
 		t.Errorf("expected name 'list_dir', got %q", got)
 	}
 }
 // TestListDirToolExecute lists a directory holding two files and one
 // subdirectory and expects three entries. Fixture creation errors are fatal,
 // so a broken setup cannot be mistaken for a tool bug, and type assertions
 // are checked so a malformed Result fails the test instead of panicking.
 func TestListDirToolExecute(t *testing.T) {
 	tmpDir := t.TempDir()
 	// Create some test files
 	for name, content := range map[string]string{"a.txt": "a", "b.txt": "bb"} {
 		if err := os.WriteFile(filepath.Join(tmpDir, name), []byte(content), 0644); err != nil {
 			t.Fatalf("failed to create fixture %q: %v", name, err)
 		}
 	}
 	if err := os.Mkdir(filepath.Join(tmpDir, "subdir"), 0755); err != nil {
 		t.Fatalf("failed to create fixture directory: %v", err)
 	}
 	listT := NewListDirTool()
 	ctx := context.Background()
 	result, err := listT.Execute(ctx, map[string]interface{}{
 		"path": tmpDir,
 	})
 	if err != nil {
 		t.Fatalf("Execute failed: %v", err)
 	}
 	if !result.Success {
 		t.Fatalf("expected success, got error: %s", result.Error)
 	}
 	data, ok := result.Data.(map[string]interface{})
 	if !ok {
 		t.Fatalf("expected map data, got %T", result.Data)
 	}
 	count, ok := data["count"].(int)
 	if !ok {
 		t.Fatalf("expected int count, got %T", data["count"])
 	}
 	if count != 3 {
 		t.Errorf("expected 3 entries, got %d", count)
 	}
 }
 // TestListDirToolRecursive lists the tree a/b/c.txt recursively. The walk
 // reports a, a/b and a/b/c.txt, so exactly three entries are expected.
 // Fixture creation errors are fatal and type assertions are checked.
 func TestListDirToolRecursive(t *testing.T) {
 	tmpDir := t.TempDir()
 	if err := os.MkdirAll(filepath.Join(tmpDir, "a", "b"), 0755); err != nil {
 		t.Fatalf("failed to create fixture directories: %v", err)
 	}
 	if err := os.WriteFile(filepath.Join(tmpDir, "a", "b", "c.txt"), []byte("c"), 0644); err != nil {
 		t.Fatalf("failed to create fixture file: %v", err)
 	}
 	listT := NewListDirTool()
 	ctx := context.Background()
 	result, err := listT.Execute(ctx, map[string]interface{}{
 		"path":      tmpDir,
 		"recursive": true,
 	})
 	if err != nil {
 		t.Fatalf("Execute failed: %v", err)
 	}
 	if !result.Success {
 		t.Fatalf("expected success, got error: %s", result.Error)
 	}
 	data, ok := result.Data.(map[string]interface{})
 	if !ok {
 		t.Fatalf("expected map data, got %T", result.Data)
 	}
 	entries, ok := data["entries"].([]map[string]interface{})
 	if !ok {
 		t.Fatalf("expected entries slice, got %T", data["entries"])
 	}
 	if len(entries) != 3 {
 		t.Errorf("expected 3 recursive entries, got %d", len(entries))
 	}
 }
 // TestListDirToolNonexistent checks that listing a path which does not exist
 // is reported as a failed Result rather than a Go error.
 func TestListDirToolNonexistent(t *testing.T) {
 	missing := map[string]interface{}{
 		"path": "/nonexistent/path",
 	}
 	res, execErr := NewListDirTool().Execute(context.Background(), missing)
 	if execErr != nil {
 		t.Fatalf("Execute should not error for missing path: %v", execErr)
 	}
 	if res.Success {
 		t.Error("expected failure for nonexistent path")
 	}
 }
 // TestSearchFilesTool verifies the name reported by the search_files tool.
 func TestSearchFilesTool(t *testing.T) {
 	if got := NewSearchFilesTool().Name(); got != "search_files" {
 		t.Errorf("expected name 'search_files', got %q", got)
 	}
 }
 // TestSearchFilesToolExecute searches two fixture files for "hello" and
 // expects exactly one match. Fixture creation errors are fatal and type
 // assertions are checked, so a broken setup or malformed Result fails this
 // test cleanly instead of panicking.
 func TestSearchFilesToolExecute(t *testing.T) {
 	tmpDir := t.TempDir()
 	// Create test files
 	fixtures := map[string]string{
 		"findme.go": "package main\nfunc hello() {\n}\n",
 		"other.py":  "def world():\n    pass\n",
 	}
 	for name, content := range fixtures {
 		if err := os.WriteFile(filepath.Join(tmpDir, name), []byte(content), 0644); err != nil {
 			t.Fatalf("failed to create fixture %q: %v", name, err)
 		}
 	}
 	searchT := NewSearchFilesTool()
 	ctx := context.Background()
 	result, err := searchT.Execute(ctx, map[string]interface{}{
 		"pattern": "hello",
 		"path":    tmpDir,
 	})
 	if err != nil {
 		t.Fatalf("Execute failed: %v", err)
 	}
 	if !result.Success {
 		t.Fatalf("expected success, got error: %s", result.Error)
 	}
 	data, ok := result.Data.(map[string]interface{})
 	if !ok {
 		t.Fatalf("expected map data, got %T", result.Data)
 	}
 	count, ok := data["count"].(int)
 	if !ok {
 		t.Fatalf("expected int count, got %T", data["count"])
 	}
 	if count != 1 {
 		t.Errorf("expected 1 match for 'hello', got %d", count)
 	}
 }
 // TestSearchFilesToolNoMatch checks that a search with no hits still succeeds
 // and reports a count of zero. The fixture write is checked so the "no match"
 // outcome cannot be caused by a missing file, and type assertions are checked.
 func TestSearchFilesToolNoMatch(t *testing.T) {
 	tmpDir := t.TempDir()
 	if err := os.WriteFile(filepath.Join(tmpDir, "test.txt"), []byte("nothing here"), 0644); err != nil {
 		t.Fatalf("failed to create fixture file: %v", err)
 	}
 	searchT := NewSearchFilesTool()
 	ctx := context.Background()
 	result, err := searchT.Execute(ctx, map[string]interface{}{
 		"pattern": "nonexistent-pattern-xyz",
 		"path":    tmpDir,
 	})
 	if err != nil {
 		t.Fatalf("Execute failed: %v", err)
 	}
 	if !result.Success {
 		t.Fatalf("expected success even with no matches, got error: %s", result.Error)
 	}
 	data, ok := result.Data.(map[string]interface{})
 	if !ok {
 		t.Fatalf("expected map data, got %T", result.Data)
 	}
 	count, ok := data["count"].(int)
 	if !ok {
 		t.Fatalf("expected int count, got %T", data["count"])
 	}
 	if count != 0 {
 		t.Errorf("expected 0 matches, got %d", count)
 	}
 }
 // TestSearchFilesToolMissingPattern checks that calling search_files without
 // "pattern" yields a failed Result and no Go error.
 func TestSearchFilesToolMissingPattern(t *testing.T) {
 	noArgs := map[string]interface{}{}
 	res, execErr := NewSearchFilesTool().Execute(context.Background(), noArgs)
 	if execErr != nil {
 		t.Fatalf("Execute should not error for invalid args: %v", execErr)
 	}
 	if res.Success {
 		t.Error("expected failure for missing pattern")
 	}
 }
 func TestToolInterfaceSatisfied(t *testing.T) {
 	sb := sandbox.NewProcessSandbox()
 	tools := []Tool{
 		NewExecTool(sb),
 		NewReadFileTool(),
 		NewWriteFileTool(),
 		NewListDirTool(),
 		NewSearchFilesTool(),
 	}
 	names := []string{"exec", "read_file", "write_file", "list_dir", "search_files"}
 	for i, tool := range tools {
 		if tool.Name() != names[i] {
 			t.Errorf("expected name %q, got %q", names[i], tool.Name())
 		}
 		if tool.Description() == "" {
 			t.Errorf("tool %q has empty description", names[i])
 		}
 		if tool.Parameters() == nil {
 			t.Errorf("tool %q has nil parameters", names[i])
 		}
 	}
 }
--- a/pkg/tool/manager.go
+++ b/pkg/tool/manager.go
@ -0,0 +1,108 @@
 package tool
 import (
 	"context"
 	"fmt"
 	"sort"
 	"sync"
 )
 // Manager is a thread-safe registry that manages tool registration and execution.
 //
 // Tools are registered by name (case-sensitive) and can be discovered,
 // listed, and invoked through the Manager. Duplicate registration returns
 // an error. All access to the registry is guarded by an RWMutex. The zero
 // value is usable: the registry map is created on the first Register.
 type Manager struct {
 	mu    sync.RWMutex
 	tools map[string]Tool
 }
 // NewManager creates a new empty tool manager.
 func NewManager() *Manager {
 	return &Manager{
 		tools: make(map[string]Tool),
 	}
 }
 // Register adds a tool to the manager. It returns an error if tool is nil or
 // if a tool with the same name is already registered.
 func (m *Manager) Register(tool Tool) error {
 	// Reject nil up front; calling Name on a nil interface would panic.
 	if tool == nil {
 		return fmt.Errorf("cannot register a nil tool")
 	}
 	// Resolve the name before locking so tool code never runs under the lock.
 	name := tool.Name()
 	m.mu.Lock()
 	defer m.mu.Unlock()
 	if m.tools == nil {
 		// Lazily create the map so a zero-value Manager does not panic.
 		m.tools = make(map[string]Tool)
 	}
 	if _, exists := m.tools[name]; exists {
 		return fmt.Errorf("tool %q is already registered", name)
 	}
 	m.tools[name] = tool
 	return nil
 }
 // Unregister removes a tool from the manager by name. It returns an error if
 // no tool with that name is registered.
 func (m *Manager) Unregister(name string) error {
 	m.mu.Lock()
 	defer m.mu.Unlock()
 	if _, exists := m.tools[name]; !exists {
 		return fmt.Errorf("tool %q is not registered", name)
 	}
 	delete(m.tools, name)
 	return nil
 }
 // Get retrieves a tool by name. Returns false if not found.
 func (m *Manager) Get(name string) (Tool, bool) {
 	m.mu.RLock()
 	defer m.mu.RUnlock()
 	t, ok := m.tools[name]
 	return t, ok
 }
 // List returns all registered tools sorted by name. The returned slice is a
 // fresh copy, so callers may modify it freely.
 func (m *Manager) List() []Tool {
 	m.mu.RLock()
 	defer m.mu.RUnlock()
 	result := make([]Tool, 0, len(m.tools))
 	for _, t := range m.tools {
 		result = append(result, t)
 	}
 	// Map iteration order is random; sort for deterministic output.
 	sort.Slice(result, func(i, j int) bool {
 		return result[i].Name() < result[j].Name()
 	})
 	return result
 }
 // Execute looks up a tool by name and invokes it with the given arguments.
 // Returns an error if the tool is not found. The registry lock is released
 // before the tool runs, so a long-running tool does not block registration.
 //
 // Note that name precedes ctx in the parameter list; the order is kept for
 // compatibility with existing callers.
 func (m *Manager) Execute(name string, ctx context.Context, args map[string]interface{}) (*Result, error) {
 	tool, ok := m.Get(name)
 	if !ok {
 		return nil, fmt.Errorf("tool %q not found", name)
 	}
 	return tool.Execute(ctx, args)
 }
 // Count returns the number of registered tools.
 func (m *Manager) Count() int {
 	m.mu.RLock()
 	defer m.mu.RUnlock()
 	return len(m.tools)
 }
 // Names returns the names of all registered tools sorted alphabetically.
 func (m *Manager) Names() []string {
 	m.mu.RLock()
 	defer m.mu.RUnlock()
 	names := make([]string, 0, len(m.tools))
 	for name := range m.tools {
 		names = append(names, name)
 	}
 	sort.Strings(names)
 	return names
 }
--- a/pkg/tool/tool.go
+++ b/pkg/tool/tool.go
@ -0,0 +1,81 @@
 // Package tool defines the Tool interface and the tool management system.
 //
 // Tools are the atomic capabilities that can be invoked by agents or LLMs.
 // Each tool has a name, description, a parameter schema (for LLM function calling),
 // and an Execute method that performs the actual work.
 //
 // Built-in tools include file operations (read, write, list, search) and
 // command execution through the sandbox. Custom tools can be registered
 // via the Manager.
 package tool
 import (
 	"context"
 	"encoding/json"
 )
 // ParameterSchema describes a single parameter accepted by a tool. It is
 // serialized to JSON with the lowercase keys given in the struct tags;
 // the optional fields are omitted when empty.
 type ParameterSchema struct {
 	// Type is the parameter's type name, e.g. "string", "number" or "boolean".
 	Type string `json:"type"`
 	// Description is the human-readable explanation of the parameter.
 	Description string `json:"description"`
 	// Required marks the parameter as mandatory.
 	Required bool `json:"required"`
 	// Default is the documented default value, if any.
 	Default interface{} `json:"default,omitempty"`
 	// Properties holds nested schemas keyed by name — presumably for
 	// object-typed parameters; confirm against callers.
 	Properties map[string]ParameterSchema `json:"properties,omitempty"`
 	// Items is a nested schema — presumably the element schema of an
 	// array-typed parameter; confirm against callers.
 	Items *ParameterSchema `json:"items,omitempty"`
 	// Enum is a list of strings — presumably the allowed values; confirm
 	// against callers.
 	Enum []string `json:"enum,omitempty"`
 }
 // Result holds the output of a tool execution. It is serialized to JSON with
 // the lowercase keys given in the struct tags; every field except Success is
 // omitted when empty.
 type Result struct {
 	// Success reports whether the tool completed its work.
 	Success bool `json:"success"`
 	// Data is the tool-specific payload of the execution.
 	Data interface{} `json:"data,omitempty"`
 	// Error is the failure message of the execution.
 	Error string `json:"error,omitempty"`
 	// Metadata carries optional additional key/value information.
 	Metadata map[string]interface{} `json:"metadata,omitempty"`
 }
 // Tool is the contract every tool implements.
 //
 // A Tool is registered with a Manager, after which it can be looked up and
 // invoked by its name. Invocation passes a context, used for cancellation,
 // together with a map of arguments keyed by parameter name.
 type Tool interface {
 	// Name is the unique identifier under which the tool is registered.
 	Name() string
 	// Description explains, for a human reader, what the tool does.
 	Description() string
 	// Parameters is the schema of the arguments the tool accepts, keyed by
 	// argument name. It serves LLM function calling and validation.
 	Parameters() map[string]ParameterSchema
 	// Execute runs the tool with the supplied arguments. Cancellation and
 	// timeouts are governed by ctx.
 	Execute(ctx context.Context, args map[string]interface{}) (*Result, error)
 }
 // SuccessResult builds a Result marked as successful that carries data as
 // its payload.
 func SuccessResult(data interface{}) *Result {
 	res := new(Result)
 	res.Success = true
 	res.Data = data
 	return res
 }
 // ErrorResult builds a Result marked as failed whose Error field holds the
 // given message.
 func ErrorResult(err string) *Result {
 	// Success keeps its zero value, false.
 	failed := Result{Error: err}
 	return &failed
 }
 // MustMarshalArgs encodes an argument map as JSON and returns the bytes.
 // It panics when the map cannot be encoded, which makes it suitable for
 // logging and debugging only.
 func MustMarshalArgs(args map[string]interface{}) []byte {
 	encoded, marshalErr := json.Marshal(args)
 	if marshalErr == nil {
 		return encoded
 	}
 	panic("tool: failed to marshal args: " + marshalErr.Error())
 }
--- a/thoughts/shared/designs/2026-05-07-orca-agent-framework-design.md
+++ b/thoughts/shared/designs/2026-05-07-orca-agent-framework-design.md
@ -0,0 +1,416 @@
 ---
 date: 2026-05-07
 topic: "Go Agent Framework - Orca"
 status: validated
 ---
 # Go Agent Framework (Orca) 设计文档
 ## Problem Statement
 构建一个基于 Go 的基础 Agent 框架，支持多 Agent 协作、持久化会话记忆、Skill 技能自动识别、沙箱安全执行、自定义 Tool 注册扩展，并接入 Ollama 本地模型（gemma4:e4b）。
 **核心挑战：**
 - 如何在 Go 中实现轻量、高并发的多 Agent 系统
 - 如何安全地执行用户命令和 Skill 脚本
 - 如何设计可扩展的插件机制（Skill / Tool）
 - 如何管理会话上下文和记忆
 ## Constraints
 1. **语言约束：** 纯 Go 实现，最小化外部依赖
 2. **存储约束：** 使用 JSON Lines（无 SQLite/数据库依赖）
 3. **隔离约束：** 进程级限制（chroot + 资源限制），不依赖 Docker
 4. **模型约束：** 仅接入 Ollama 本地模型，默认 gemma4:e4b
 5. **Skill 目录：** 读取 `~/.agents/skills/` 下的 Skill 定义
 6. **部署约束：** 单二进制文件，零配置启动
 ## Approach
 ### 架构风格：微内核 + Actor 模型
 采用**微内核架构**作为基础，所有功能（Skill、Tool、LLM 驱动）都以**插件**形式注册到核心。
 每个 **Agent 实例是一个独立的 Actor**，通过 **消息总线（Message Bus）** 进行通信。这完美契合 Go 的 goroutine + channel 并发模型。
 **为什么选择这个组合？**
 - 微内核保证核心最小化，Skill 和 Tool 热插拔
 - Actor 模型天然支持高并发，避免共享状态
 - 两者结合 = 轻量级、高扩展、Go 原生友好
 **放弃的其他方案：**
 - Docker 沙箱：太重，违背最小依赖原则
 - SQLite 存储：增加依赖，JSONL 已足够
 - 中央协调器：单点瓶颈，不如 Actor 模型灵活
 ## Architecture
 ### 整体架构图
 ```
 ┌─────────────────────────────────────────────────────────────┐
 │                        CLI / API Layer                       │
 └─────────────────────────────────────────────────────────────┘
                              │
                              ▼
 ┌─────────────────────────────────────────────────────────────┐
 │                      Core Kernel (微内核)                     │
 │  ┌──────────────┐  ┌──────────────┐  ┌──────────────────┐  │
 │  │  Message Bus │  │  Plugin Reg  │  │  Session Manager │  │
 │  │  (channel)   │  │  (registry)  │  │   (JSONL-based)  │  │
 │  └──────────────┘  └──────────────┘  └──────────────────┘  │
 └─────────────────────────────────────────────────────────────┘
                              │
              ┌───────────────┼───────────────┐
              ▼               ▼               ▼
 ┌─────────────────┐ ┌─────────────────┐ ┌─────────────────┐
 │   Agent Actor   │ │   Agent Actor   │ │   Agent Actor   │
 │  (Specialist 1) │ │  (Specialist 2) │ │  (Orchestrator) │
 └────────┬────────┘ └────────┬────────┘ └────────┬────────┘
         │                   │                   │
         └───────────────────┼───────────────────┘
                             ▼
 ┌─────────────────────────────────────────────────────────────┐
 │                      Plugin Layer                            │
 │  ┌──────────┐  ┌──────────┐  ┌──────────┐  ┌──────────────┐│
 │  │  Skills  │  │  Tools   │  │  Ollama  │  │ Custom Tools ││
 │  │(SkillMgr)│  │(Tool Mgr)│  │ (Driver) │  │  (Registry)  ││
 │  └──────────┘  └──────────┘  └──────────┘  └──────────────┘│
 └─────────────────────────────────────────────────────────────┘
                              │
                              ▼
 ┌─────────────────────────────────────────────────────────────┐
 │                      Sandbox Layer                           │
 │         (Process-level isolation + Resource limits)          │
 └─────────────────────────────────────────────────────────────┘
 ```
 ### 模块职责
 | 模块 | 职责 |
 |------|------|
 | **Core Kernel** | 消息路由、插件生命周期管理、会话协调 |
 | **Message Bus** | 基于 Go channel 的异步消息传递系统 |
 | **Plugin Registry** | 统一的 Skill/Tool/LLM 驱动注册中心 |
 | **Session Manager** | 基于 JSONL 的会话历史读写和上下文窗口管理 |
 | **Agent Actor** | 独立 goroutine，持有状态，接收/发送消息 |
 | **Skill Manager** | 扫描 `~/.agents/skills/`，解析 SKILL.md，加载技能 |
 | **Tool Manager** | 管理内置工具和自定义工具的注册/调用 |
 | **Ollama Driver** | 封装 Ollama HTTP API，支持流式响应 |
 | **Sandbox** | 安全执行 shell 命令和脚本，限制资源和时间 |
 ## Components
 ### 1. Core Kernel (微内核)
 **职责：** 框架的最小化核心，只负责消息路由和插件生命周期。
 **设计要点：**
 - 使用 Go 的接口类型（`interface`）或泛型定义插件契约
 - 启动时加载所有已注册的插件
 - 提供事件总线供插件间通信
 - **不**包含任何业务逻辑（如 LLM 调用、命令执行）
 **核心接口：**
 ```
 // 所有插件必须实现
 Plugin interface {
    Name() string
    Init(kernel *Kernel) error
    Shutdown() error
 }
 // 消息总线
 MessageBus interface {
    Publish(topic string, msg Message) error
    Subscribe(topic string, handler Handler) (Subscription, error)
 }
 ```
 ### 2. Actor System (多 Agent 引擎)
 **职责：** 管理 Agent 生命周期和消息通信。
 **设计要点：**
 - 每个 Agent 是一个独立的 goroutine，通过 channel 接收消息
 - Agent 持有自己的状态（角色、上下文、工具列表）
 - 支持三种 Agent 类型：Orchestrator（协调者）、Worker（执行者）、Specialist（专家）
 - 消息类型：`TaskRequest`、`TaskResponse`、`ToolCall`、`Observation`、`Error`
 **Agent 状态机：**
 ```
 Idle → Processing → [ToolCall] → WaitingForTool → Processing → Completed
                    ↓
              [Error] → Failed
 ```
 ### 3. Session Manager (会话记忆)
 **职责：** 持久化会话历史，支持上下文窗口管理。
 **设计要点：**
 - 每个会话一个 JSONL 文件：`~/.orca/sessions/{session_id}.jsonl`
 - 每行一个 JSON 对象：`{role, content, timestamp, metadata}`
 - 提供 `GetContext(windowSize)` 方法，返回最近的 N 条消息
 - 支持会话列表、搜索、归档
 **为什么 JSON Lines？**
 - 追加写入 O(1)，无需加载整个文件
 - 人类可读，便于调试
 - 零依赖，无需数据库驱动
 - 通过简单文件锁保证并发安全
 ### 4. Skill Manager (技能系统)
 **职责：** 自动发现和加载 Skill。
 **设计要点：**
 - 启动时扫描 `~/.agents/skills/` 下的所有子目录
 - 解析每个 Skill 目录下的 `SKILL.md`
 - 提取元数据：`name`、`description`、`triggers`（触发词）
 - Skill 可以包含脚本文件（`scripts/` 目录）
 - 提供 `FindSkill(query string)` 方法，基于触发词匹配
 **Skill 结构：**
 ```yaml
 name: "md2pdf"
 description: "Convert Markdown to PDF..."
 triggers: ["pdf", "markdown", "export"]
 scripts:
  - "scripts/convert.py"
  - "scripts/setup.sh"
 ```
 ### 5. Tool Manager (工具系统)
 **职责：** 管理可执行工具的注册和调用。
 **设计要点：**
 - **内置工具：** `exec`（执行命令）、`read_file`、`write_file`、`list_dir`、`search_files`（文件内容搜索）
 - **Skill 工具：** 从 Skill 的 `scripts/` 目录自动注册
 - **自定义工具：** 通过代码注册，实现 `Tool` 接口
 - 每个工具定义：名称、描述、参数 schema、执行函数
 - LLM 通过 Function Calling 调用工具
 **Tool 接口：**
 ```
 Tool interface {
    Name() string
    Description() string
    Parameters() JSONSchema
    Execute(ctx Context, args map[string]any) (Result, error)
 }
 ```
 ### 6. Ollama Driver (LLM 驱动)
 **职责：** 封装 Ollama API，提供统一的 LLM 调用接口。
 **设计要点：**
 - 默认模型：`gemma4:e4b`
 - 支持流式响应（Ollama 以换行分隔的 JSON，即 NDJSON，逐块返回，而非 SSE）
 - 支持 Function Calling（通过 tools 参数）
 - 自动处理上下文窗口截断
 - 可配置参数：temperature、top_p、max_tokens
 **API 封装：**
 ```
 LLMClient interface {
    Chat(messages []Message, tools []Tool) (Response, error)
    ChatStream(messages []Message, tools []Tool) (Stream, error)
 }
 ```
 ### 7. Sandbox (沙箱执行)
 **职责：** 安全地执行终端命令和脚本。
 **设计要点：**
 - 使用 `os/exec` 创建子进程
 - 资源限制：CPU 时间、内存、输出大小
 - 超时控制：默认 30 秒，可配置
 - 工作目录限制：可选 chroot 或指定工作目录
 - 环境变量隔离：只允许白名单环境变量
 - **不**使用 Docker，保持轻量
 **安全策略：**
 ```yaml
 sandbox:
  timeout: 30s
  max_memory: 512MB
  max_output: 64KB
  allowed_env: [PATH, HOME, USER]
  working_dir: /tmp/orca-sandbox
  read_only_dirs: []
  blocked_commands: [rm -rf /, mkfs, dd]
 ```
 ## Data Flow
 ### 典型交互流程
 ```
 用户输入
    │
    ▼
 ┌─────────────┐
 │   CLI/API   │
 └──────┬──────┘
       │
       ▼
 ┌─────────────┐     ┌─────────────┐
 │ Session Mgr │────▶│ 加载历史上下文 │
 └──────┬──────┘     └─────────────┘
       │
       ▼
 ┌─────────────┐
 │ Orchestrator │ (Agent Actor)
 │   Agent      │
 └──────┬──────┘
       │
       ▼
 ┌─────────────┐     ┌─────────────┐
 │  Skill Mgr  │────▶│ 匹配相关 Skill │
 └──────┬──────┘     └─────────────┘
       │
       ▼
 ┌─────────────┐     ┌─────────────┐
 │ Ollama Driver│────▶│ 发送 prompt  │
 └──────┬──────┘     └─────────────┘
       │
       ▼
 ┌─────────────┐
 │ LLM Response │
 │ (Function    │
 │   Calling)   │
 └──────┬──────┘
       │
       ▼
 ┌─────────────┐     ┌─────────────┐
 │  Tool Call   │────▶│ 执行 Tool/   │
 │              │     │ 沙箱命令     │
 └──────┬──────┘     └─────────────┘
       │
       ▼
 ┌─────────────┐
 │ Observation  │ (工具执行结果)
 └──────┬──────┘
       │
       ▼
 ┌─────────────┐     ┌─────────────┐
 │ Orchestrator │────▶│ 决策：继续/完成 │
 └──────┬──────┘     └─────────────┘
       │
       ▼
 ┌─────────────┐
 │  保存会话     │
 │  返回结果     │
 └─────────────┘
 ```
 ### 消息类型定义
 ```go
 type Message struct {
    ID        string
    Type      MessageType // TaskRequest, TaskResponse, ToolCall, Observation, Error
    From      string      // Agent ID
    To        string      // Agent ID or "broadcast"
    Content   interface{} // 根据 Type 不同而变化
    Timestamp time.Time
 }
 type TaskRequest struct {
    Query    string
    SessionID string
    Context  []ChatMessage
 }
 type ToolCall struct {
    ToolName string
    Arguments map[string]interface{}
 }
 type Observation struct {
    ToolCallID string
    Output     string
    Error      string
 }
 ```
 ## Error Handling
 ### 策略
 1. **分层错误处理：**
   - **Kernel 层：** 插件加载失败 → 记录日志，跳过该插件，继续启动
   - **Agent 层：** 任务执行失败 → 返回错误消息，让 Orchestrator 决策重试或终止
   - **Tool 层：** 工具执行失败 → 返回结构化错误，LLM 可据此调整策略
   - **Sandbox 层：** 命令超时/内存超限 → 强制终止进程，返回错误
 2. **重试机制：**
   - LLM API 调用：指数退避重试 3 次
   - 工具执行：不重试（避免循环），由 LLM 决策
 3. **优雅降级：**
   - Ollama 不可用 → 提示用户检查服务
   - Skill 解析失败 → 跳过该 Skill，不影响其他
   - 沙箱执行失败 → 返回错误信息，LLM 可尝试其他工具
 ### 错误类型
 ```go
 type ErrorCategory int
 const (
    ErrCategoryKernel    ErrorCategory = iota // 内核错误
    ErrCategoryAgent                          // Agent 错误
    ErrCategoryTool                           // 工具错误
    ErrCategorySandbox                        // 沙箱错误
    ErrCategoryLLM                            // LLM 错误
    ErrCategoryNetwork                        // 网络错误
 )
 ```
 ## Testing Strategy
 ### 测试金字塔
 1. **单元测试（60%）：**
   - `Kernel`：插件注册/卸载、消息路由
   - `SessionManager`：JSONL 读写、上下文窗口截断
   - `SkillManager`：Skill 解析、触发词匹配
   - `Sandbox`：资源限制、超时控制
   - `OllamaDriver`：HTTP 请求封装（使用 mock server）
 2. **集成测试（30%）：**
   - Agent + Tool：端到端任务执行
   - Agent + LLM：使用 mock LLM 测试 Function Calling 流程
   - Skill + Sandbox：加载 Skill 并执行其脚本
 3. **E2E 测试（10%）：**
   - 完整 CLI 工作流
   - 多 Agent 协作场景
 ### Mock 策略
 - `LLMClient`：使用接口，测试时注入 mock
 - `Sandbox`：提供 `DryRun` 模式，记录命令但不执行
 - `MessageBus`：内存实现，用于测试
 ## Open Questions
 1. **Skill 执行方式：** Skill 脚本是用 Shell 调用还是直接在 Go 中执行？当前设计倾向 Shell 调用（通过 Sandbox），但 Python/Node 脚本需要对应运行时。
   - **假设：** 用户环境已安装所需运行时（Python、Node 等），Sandbox 只负责安全执行。
 2. **Function Calling 格式：** gemma4:e4b 对 Function Calling 的支持程度？
   - **假设：** 使用 Ollama 的 `tools` 参数格式，如果不支持则 fallback 到 prompt-based tool calling。
 3. **多 Agent 协作粒度：** Agent 之间是平等协作还是有层级？
   - **假设：** 支持两种模式：层级（Orchestrator + Workers）和平等（对等协作），由用户配置。
 4. **会话共享：** 多个 Agent 是否可以共享同一个会话上下文？
   - **假设：** 是，Session Manager 通过文件锁支持并发读取，但同一时间只有一个 Agent 写入。
 5. **Tool 参数 Schema：** 使用 JSON Schema 还是简化格式？
   - **假设：** 使用简化版 JSON Schema（支持 string/number/boolean/array/object + description）。
--- a/thoughts/shared/plans/2026-05-07-orca-agent-framework.md
+++ b/thoughts/shared/plans/2026-05-07-orca-agent-framework.md
@ -0,0 +1,373 @@
 ---
 date: 2026-05-07
 topic: "Go Agent Framework - Orca"
 status: draft
 ---
 # Orca Agent Framework - 实现计划
 ## 项目概览
 - **项目名称:** orca
 - **语言:** Go 1.22+
 - **路径:** /Users/wang/agent_dev/orca.ai/
 - **架构:** 微内核 + Actor 模型
 ## 实现阶段
 ### Phase 1: 项目骨架与核心基础设施（Day 1）
 **目标:** 建立项目结构，实现消息总线和插件注册机制。
 **任务清单:**
 1. **初始化 Go 模块**
   - `go mod init github.com/orca/orca`
   - 创建基础目录结构
 2. **目录结构**
   ```
   orca/
   ├── cmd/orca/              # CLI 入口
   ├── pkg/
   │   ├── kernel/            # 微内核核心
   │   ├── actor/             # Actor 系统
   │   ├── bus/               # 消息总线
   │   ├── plugin/            # 插件接口和注册
   │   ├── session/           # 会话管理 (JSONL)
   │   ├── skill/             # Skill 管理
   │   ├── tool/              # Tool 系统
   │   ├── llm/               # LLM 接口
   │   ├── ollama/            # Ollama 驱动
   │   └── sandbox/           # 沙箱执行
   ├── internal/
   │   ├── config/            # 配置管理
   │   └── util/              # 工具函数
   ├── plugins/
   │   ├── builtin/           # 内置插件
   │   └── tools/             # 内置工具
   ├── test/
   │   └── fixtures/          # 测试固件
   └── go.mod
   ```
 3. **核心接口定义**
   - `pkg/plugin/plugin.go`: Plugin 接口
   - `pkg/bus/bus.go`: MessageBus 接口和实现
   - `pkg/kernel/kernel.go`: Kernel 结构体，插件生命周期管理
 4. **消息总线实现**
   - 基于 Go channel 的发布/订阅
   - 支持同步和异步消息
   - 消息类型枚举定义
 **验收标准:**
 - `go build ./...` 成功
 - 消息总线单元测试通过（Publish/Subscribe）
 - 插件注册/卸载测试通过
 ---
 ### Phase 2: Actor 系统与会话管理（Day 2）
 **目标:** 实现多 Agent Actor 和 JSONL 会话存储。
 **任务清单:**
 1. **Actor 系统**
   - `pkg/actor/actor.go`: Agent Actor 接口
   - `pkg/actor/orchestrator.go`: 协调者 Agent
   - `pkg/actor/worker.go`: 工作者 Agent
   - `pkg/actor/system.go`: Actor 生命周期管理（创建、停止、监控）
   - 状态机实现：Idle → Processing → WaitingForTool → Completed/Failed
 2. **会话管理（JSONL）**
   - `pkg/session/store.go`: 存储接口
   - `pkg/session/jsonl.go`: JSONL 实现
   - `pkg/session/manager.go`: 会话管理器（创建、加载、归档）
   - 上下文窗口截断逻辑
   - 文件锁保证并发安全（`flock` 或简单文件锁）
 3. **配置系统**
   - `internal/config/config.go`: 配置结构体
   - 支持 YAML 配置文件（`~/.orca/config.yaml`）
   - 环境变量覆盖
   - 默认值设置
 **验收标准:**
 - 创建 10 个 Agent Actor 并发运行测试通过
 - 会话 CRUD 测试通过
 - 上下文窗口截断测试通过
 ---
 ### Phase 3: Skill 与 Tool 系统（Day 3）
 **目标:** 实现 Skill 自动发现和 Tool 注册执行。
 **任务清单:**
 1. **Skill 管理器**
   - `pkg/skill/manager.go`: Skill 扫描和加载
   - `pkg/skill/parser.go`: SKILL.md 解析器（提取 name, description, triggers）
   - `pkg/skill/skill.go`: Skill 结构体定义
   - 扫描目录：`~/.agents/skills/` 和 `~/.config/opencode/skills/`
   - 触发词匹配算法（简单关键词匹配或 TF-IDF）
 2. **Tool 系统**
   - `pkg/tool/tool.go`: Tool 接口定义
   - `pkg/tool/manager.go`: Tool 注册中心
   - `pkg/tool/registry.go`: 内置工具注册
   - **内置工具实现:**
     - `exec`: 执行 shell 命令（通过 sandbox）
     - `read_file`: 读取文件内容
     - `write_file`: 写入文件
     - `list_dir`: 列出目录
     - `search_files`: 文件内容搜索
 3. **自定义 Tool 注册**
   - 支持通过代码注册 Tool
   - Tool 参数 Schema 定义（简化版 JSON Schema）
   - Tool 执行上下文传递
 **验收标准:**
 - 扫描现有 `~/.agents/skills/` 目录，正确解析所有 Skill
 - 触发词匹配测试通过
 - 所有内置工具单元测试通过
 ---
 ### Phase 4: 沙箱与 Ollama 集成（Day 4）
 **目标:** 实现安全执行环境和 LLM 驱动。
 **任务清单:**
 1. **沙箱执行器**
   - `pkg/sandbox/sandbox.go`: Sandbox 接口
   - `pkg/sandbox/process.go`: 进程级实现
   - 资源限制：
     - 超时控制（context.WithTimeout）
     - 内存限制（通过 cgroup 或 ulimit，若不可用则软限制）
     - 输出大小限制
   - 工作目录隔离
   - 环境变量白名单
   - 危险命令黑名单
 2. **Ollama 驱动**
   - `pkg/ollama/client.go`: HTTP 客户端
   - `pkg/ollama/chat.go`: Chat API 封装
   - `pkg/ollama/stream.go`: 流式响应处理（NDJSON，逐行解析 JSON）
   - `pkg/ollama/tools.go`: Function Calling 支持
   - 模型配置：temperature、top_p、max_tokens
   - 自动重试机制（指数退避，3 次）
 3. **LLM 抽象层**
   - `pkg/llm/client.go`: LLMClient 接口
   - `pkg/llm/message.go`: Message 结构体定义
   - `pkg/llm/options.go`: 调用选项
 **验收标准:**
 - 沙箱执行命令并正确限制资源测试通过
 - 超时和内存限制测试通过
 - Ollama API 调用测试通过（需要本地 Ollama 服务）
 - Function Calling 格式正确
 ---
 ### Phase 5: CLI 与集成（Day 5）
 **目标:** 实现命令行界面和端到端集成。
 **任务清单:**
 1. **CLI 实现**
   - `cmd/orca/main.go`: 入口点
   - `cmd/orca/commands.go`: 子命令定义
   - 支持命令：
     - `orca chat`: 交互式对话
     - `orca run "query"`: 单次执行
     - `orca sessions`: 会话列表
     - `orca skills`: 已加载 Skill 列表
     - `orca tools`: 已注册 Tool 列表
     - `orca config`: 配置查看/设置
 2. **交互式对话**
   - 读取用户输入
   - 创建/恢复会话
   - 调用 Orchestrator Agent
   - 显示 Agent 思考过程和结果
   - 支持多轮对话
 3. **端到端集成测试**
   - 完整对话流程测试
   - Skill 触发和调用测试
   - Tool 调用链测试
   - 错误恢复测试
 **验收标准:**
 - `orca --help` 显示正确
 - `orca chat` 可以开始对话
 - 完整对话流程测试通过
 ---
 ### Phase 6: 多 Agent 协作与优化（Day 6-7）
 **目标:** 实现多 Agent 协作和性能优化。
 **任务清单:**
 1. **多 Agent 协作**
   - Orchestrator 任务分解逻辑
   - Worker Agent 分配策略
   - Agent 间消息传递
   - 结果汇总和冲突解决
 2. **性能优化**
   - 会话缓存（最近 N 个会话驻留内存）
   - Skill 索引（倒排索引加速匹配）
   - 连接池（Ollama HTTP 连接复用）
 3. **可观测性**
   - 结构化日志（slog）
   - Agent 执行追踪
   - 性能指标收集
 **验收标准:**
 - 多 Agent 协作测试通过
 - 性能基准测试通过（单次对话 < 5s）
 ---
 ## 依赖管理
 ### 外部依赖（最小化）
 | 依赖 | 用途 | 版本 |
 |------|------|------|
 | `github.com/spf13/cobra` | CLI 框架 | latest |
 | `github.com/spf13/viper` | 配置管理 | latest |
 | `github.com/stretchr/testify` | 测试 | latest |
 **原则:** 优先使用标准库，必要时才引入外部依赖。
 ### 内部依赖图
 ```
 kernel
 ├── bus
 ├── plugin
 ├── actor
 │   ├── bus
 │   ├── tool
 │   └── llm
 ├── session
 ├── skill
 ├── tool
 │   └── sandbox
 ├── llm
 │   └── ollama
 └── sandbox
 ```
 ## 关键接口定义
 ### Plugin 接口
 ```go
 type Plugin interface {
    Name() string
    Version() string
    Init(kernel *Kernel) error
    Shutdown() error
 }
 ```
 ### Agent 接口
 ```go
 type Agent interface {
    ID() string
    Role() string
    Process(ctx context.Context, msg Message) (Message, error)
    Stop() error
 }
 ```
 ### Tool 接口
 ```go
 type Tool interface {
    Name() string
    Description() string
    Parameters() ParameterSchema
    Execute(ctx context.Context, args map[string]interface{}) (ToolResult, error)
 }
 ```
 ### LLMClient 接口
 ```go
 type LLMClient interface {
    Chat(ctx context.Context, messages []Message, tools []Tool) (*ChatResponse, error)
    ChatStream(ctx context.Context, messages []Message, tools []Tool) (StreamReader, error)
 }
 ```
 ## 测试策略
 ### 单元测试覆盖目标
 | 模块 | 覆盖率目标 |
 |------|-----------|
 | bus | 90% |
 | kernel | 85% |
 | session | 90% |
 | skill | 85% |
 | tool | 90% |
 | sandbox | 80% |
 | ollama | 75% (mock) |
 ### Mock 实现
 ```go
 // MockLLMClient 用于测试
 type MockLLMClient struct {
    Responses []ChatResponse
    Index     int
 }
 func (m *MockLLMClient) Chat(ctx context.Context, messages []Message, tools []Tool) (*ChatResponse, error) {
    if m.Index >= len(m.Responses) {
        return nil, errors.New("no more mock responses")
    }
    resp := m.Responses[m.Index]
    m.Index++
    return &resp, nil
 }
 ```
 ## 风险与回退方案
 | 风险 | 影响 | 概率 | 回退方案 |
 |------|------|------|----------|
 | gemma4:e4b 不支持 Function Calling | 高 | 中 | 使用 prompt-based tool calling |
 | 进程级沙箱限制不足 | 中 | 低 | 增加可选的 Docker 沙箱支持 |
 | JSONL 性能瓶颈 | 中 | 低 | 迁移到 SQLite（保留接口） |
 | Actor 模型复杂度 | 中 | 中 | 简化为中央协调器模式 |
 ## 里程碑
 | 里程碑 | 时间 | 交付物 |
 |--------|------|--------|
 | M1 | Day 1 | 项目骨架 + 消息总线 + 插件系统 |
 | M2 | Day 2 | Actor 系统 + 会话管理 |
 | M3 | Day 3 | Skill + Tool 系统 |
 | M4 | Day 4 | 沙箱 + Ollama 集成 |
 | M5 | Day 5 | CLI + 端到端集成 |
 | M6 | Day 6-7 | 多 Agent + 优化 |
 ## 下一步
 执行 Phase 1，建立项目骨架。