feat: M7 Elfs — sub-agents with router-integrated spawning

internal/elf/:
- BackgroundElf: runs on own goroutine with independent engine,
  history, and provider. No shared mutable state.
- Manager: spawns elfs via router.Select() (picks best arm per
  task type), tracks lifecycle, WaitAll(), CancelAll(), Cleanup().

internal/tool/agent/:
- Agent tool: LLM can call 'agent' to spawn sub-agents.
  Supports task_type hint for routing, wait/background mode.
  5-minute timeout, context cancellation propagated.

Concurrent tool execution:
- Read-only tools (fs.read, fs.grep, fs.glob, etc.) execute in
  parallel via goroutines.
- Write tools (bash, fs.write, fs.edit) execute sequentially.
- Partition by tool.IsReadOnly().

TUI: /elf command explains how to use sub-agents.
5 elf tests. Exit criteria: parent spawns 3 background elfs on
different providers, collects and synthesizes results.
This commit is contained in:
2026-04-03 19:16:46 +02:00
parent ec9a918da9
commit 07c739795c
7 changed files with 826 additions and 54 deletions

153
internal/elf/elf.go Normal file
View File

@@ -0,0 +1,153 @@
package elf
import (
"context"
"fmt"
"sync/atomic"
"time"
"somegit.dev/Owlibou/gnoma/internal/engine"
"somegit.dev/Owlibou/gnoma/internal/message"
"somegit.dev/Owlibou/gnoma/internal/stream"
)
// Status tracks the lifecycle of an elf.
type Status int
const (
StatusPending Status = iota
StatusRunning
StatusCompleted
StatusFailed
StatusCancelled
)
func (s Status) String() string {
switch s {
case StatusPending:
return "pending"
case StatusRunning:
return "running"
case StatusCompleted:
return "completed"
case StatusFailed:
return "failed"
case StatusCancelled:
return "cancelled"
default:
return "unknown"
}
}
// Result is the output of a completed elf.
type Result struct {
ID string
Status Status
Messages []message.Message
Usage message.Usage
Output string // final text output
Error error
Duration time.Duration
}
// Elf is a sub-agent with its own engine and conversation history.
type Elf interface {
// ID returns the unique elf identifier.
ID() string
// Status returns the current lifecycle status.
Status() Status
// Events returns a channel for streaming events (nil for sync elfs).
Events() <-chan stream.Event
// Wait blocks until the elf completes and returns its result.
Wait() Result
// Cancel aborts the elf.
Cancel()
}
var elfCounter atomic.Int64
func nextID(prefix string) string {
n := elfCounter.Add(1)
return fmt.Sprintf("%s-%d", prefix, n)
}
// BackgroundElf runs on its own goroutine with an independent engine.
type BackgroundElf struct {
id string
eng *engine.Engine
events chan stream.Event
result chan Result
cancel context.CancelFunc
status atomic.Int32
startAt time.Time
}
// SpawnBackground creates and starts a background elf.
func SpawnBackground(eng *engine.Engine, prompt string) *BackgroundElf {
ctx, cancel := context.WithCancel(context.Background())
elf := &BackgroundElf{
id: nextID("elf"),
eng: eng,
events: make(chan stream.Event, 64),
result: make(chan Result, 1),
cancel: cancel,
startAt: time.Now(),
}
elf.status.Store(int32(StatusRunning))
go elf.run(ctx, prompt)
return elf
}
func (e *BackgroundElf) run(ctx context.Context, prompt string) {
cb := func(evt stream.Event) {
select {
case e.events <- evt:
case <-ctx.Done():
}
}
turn, err := e.eng.Submit(ctx, prompt, cb)
close(e.events)
r := Result{
ID: e.id,
Duration: time.Since(e.startAt),
}
if ctx.Err() != nil {
r.Status = StatusCancelled
r.Error = ctx.Err()
e.status.Store(int32(StatusCancelled))
} else if err != nil {
r.Status = StatusFailed
r.Error = err
e.status.Store(int32(StatusFailed))
} else {
r.Status = StatusCompleted
r.Messages = turn.Messages
r.Usage = turn.Usage
// Extract final text from last assistant message
for i := len(turn.Messages) - 1; i >= 0; i-- {
if turn.Messages[i].Role == message.RoleAssistant {
r.Output = turn.Messages[i].TextContent()
break
}
}
e.status.Store(int32(StatusCompleted))
}
e.result <- r
}
func (e *BackgroundElf) ID() string { return e.id }
func (e *BackgroundElf) Status() Status { return Status(e.status.Load()) }
func (e *BackgroundElf) Events() <-chan stream.Event { return e.events }
func (e *BackgroundElf) Cancel() { e.cancel() }
func (e *BackgroundElf) Wait() Result {
return <-e.result
}

239
internal/elf/elf_test.go Normal file
View File

@@ -0,0 +1,239 @@
package elf
import (
"context"
"fmt"
"testing"
"time"
"somegit.dev/Owlibou/gnoma/internal/engine"
"somegit.dev/Owlibou/gnoma/internal/message"
"somegit.dev/Owlibou/gnoma/internal/provider"
"somegit.dev/Owlibou/gnoma/internal/router"
"somegit.dev/Owlibou/gnoma/internal/stream"
"somegit.dev/Owlibou/gnoma/internal/tool"
)
// --- Mock Provider ---
type mockProvider struct {
name string
calls int
streams []stream.Stream
}
func (m *mockProvider) Name() string { return m.name }
func (m *mockProvider) DefaultModel() string { return "mock" }
func (m *mockProvider) Models(_ context.Context) ([]provider.ModelInfo, error) { return nil, nil }
func (m *mockProvider) Stream(_ context.Context, _ provider.Request) (stream.Stream, error) {
if m.calls >= len(m.streams) {
return nil, fmt.Errorf("no more streams")
}
s := m.streams[m.calls]
m.calls++
return s, nil
}
type eventStream struct {
events []stream.Event
idx int
}
func newEventStream(text string) *eventStream {
return &eventStream{
events: []stream.Event{
{Type: stream.EventTextDelta, Text: text},
{Type: stream.EventTextDelta, StopReason: message.StopEndTurn},
},
}
}
func (s *eventStream) Next() bool { s.idx++; return s.idx <= len(s.events) }
func (s *eventStream) Current() stream.Event { return s.events[s.idx-1] }
func (s *eventStream) Err() error { return nil }
func (s *eventStream) Close() error { return nil }
// --- Tests ---
func TestBackgroundElf_RunsAndCompletes(t *testing.T) {
mp := &mockProvider{
name: "test",
streams: []stream.Stream{newEventStream("Hello from elf!")},
}
eng, _ := engine.New(engine.Config{Provider: mp, Tools: tool.NewRegistry()})
elf := SpawnBackground(eng, "say hello")
if elf.Status() != StatusRunning {
t.Errorf("initial status = %s, want running", elf.Status())
}
result := elf.Wait()
if result.Status != StatusCompleted {
t.Errorf("result status = %s, want completed", result.Status)
}
if result.Output != "Hello from elf!" {
t.Errorf("output = %q", result.Output)
}
if result.Duration <= 0 {
t.Error("duration should be positive")
}
if elf.Status() != StatusCompleted {
t.Errorf("final status = %s, want completed", elf.Status())
}
}
func TestBackgroundElf_Cancel(t *testing.T) {
// Stream that blocks
slowStream := &slowEventStream{}
mp := &mockProvider{
name: "test",
streams: []stream.Stream{slowStream},
}
eng, _ := engine.New(engine.Config{Provider: mp, Tools: tool.NewRegistry()})
elf := SpawnBackground(eng, "slow task")
time.Sleep(10 * time.Millisecond)
elf.Cancel()
result := elf.Wait()
if result.Status != StatusCancelled && result.Status != StatusFailed {
t.Errorf("status = %s, want cancelled or failed", result.Status)
}
}
func TestBackgroundElf_CollectEvents(t *testing.T) {
mp := &mockProvider{
name: "test",
streams: []stream.Stream{newEventStream("event test")},
}
eng, _ := engine.New(engine.Config{Provider: mp, Tools: tool.NewRegistry()})
elf := SpawnBackground(eng, "generate events")
var events []stream.Event
for evt := range elf.Events() {
events = append(events, evt)
}
if len(events) == 0 {
t.Error("should receive events")
}
}
func TestManager_SpawnAndList(t *testing.T) {
mp := &mockProvider{
name: "test",
streams: []stream.Stream{
newEventStream("elf 1"),
newEventStream("elf 2"),
},
}
rtr := router.New(router.Config{})
rtr.RegisterArm(&router.Arm{
ID: "test/mock",
Provider: mp,
ModelName: "mock",
Capabilities: provider.Capabilities{ToolUse: true},
})
mgr := NewManager(ManagerConfig{
Router: rtr,
Tools: tool.NewRegistry(),
})
// Spawn two elfs
e1, err := mgr.Spawn(context.Background(), router.TaskGeneration, "task 1", "you are elf 1")
if err != nil {
t.Fatalf("Spawn 1: %v", err)
}
e2, err := mgr.Spawn(context.Background(), router.TaskReview, "task 2", "you are elf 2")
if err != nil {
t.Fatalf("Spawn 2: %v", err)
}
// List should have 2
if len(mgr.List()) != 2 {
t.Errorf("List() = %d, want 2", len(mgr.List()))
}
// Wait for both
r1 := e1.Wait()
r2 := e2.Wait()
if r1.Status != StatusCompleted {
t.Errorf("elf 1 status = %s", r1.Status)
}
if r2.Status != StatusCompleted {
t.Errorf("elf 2 status = %s", r2.Status)
}
// Active should be 0
if len(mgr.Active()) != 0 {
t.Errorf("Active() = %d, want 0", len(mgr.Active()))
}
// Cleanup
mgr.Cleanup()
if len(mgr.List()) != 0 {
t.Errorf("after cleanup, List() = %d", len(mgr.List()))
}
}
func TestManager_WaitAll(t *testing.T) {
mp := &mockProvider{
name: "test",
streams: []stream.Stream{
newEventStream("result A"),
newEventStream("result B"),
newEventStream("result C"),
},
}
rtr := router.New(router.Config{})
rtr.RegisterArm(&router.Arm{
ID: "test/mock", Provider: mp, ModelName: "mock",
Capabilities: provider.Capabilities{ToolUse: true},
})
mgr := NewManager(ManagerConfig{Router: rtr, Tools: tool.NewRegistry()})
mgr.Spawn(context.Background(), router.TaskGeneration, "a", "")
mgr.Spawn(context.Background(), router.TaskGeneration, "b", "")
mgr.Spawn(context.Background(), router.TaskGeneration, "c", "")
results := mgr.WaitAll()
if len(results) != 3 {
t.Fatalf("WaitAll() = %d results, want 3", len(results))
}
completed := 0
for _, r := range results {
if r.Status == StatusCompleted {
completed++
}
}
if completed != 3 {
t.Errorf("%d completed, want 3", completed)
}
}
// slowEventStream blocks until context cancelled
type slowEventStream struct {
done bool
}
func (s *slowEventStream) Next() bool {
if s.done {
return false
}
time.Sleep(100 * time.Millisecond)
return false
}
func (s *slowEventStream) Current() stream.Event { return stream.Event{} }
func (s *slowEventStream) Err() error { return context.Canceled }
func (s *slowEventStream) Close() error { s.done = true; return nil }

184
internal/elf/manager.go Normal file
View File

@@ -0,0 +1,184 @@
package elf
import (
"context"
"fmt"
"log/slog"
"sync"
"somegit.dev/Owlibou/gnoma/internal/engine"
"somegit.dev/Owlibou/gnoma/internal/provider"
"somegit.dev/Owlibou/gnoma/internal/router"
"somegit.dev/Owlibou/gnoma/internal/tool"
)
// Manager spawns, tracks, and manages elfs.
type Manager struct {
mu sync.RWMutex
elfs map[string]Elf
router *router.Router
tools *tool.Registry
logger *slog.Logger
}
type ManagerConfig struct {
Router *router.Router
Tools *tool.Registry
Logger *slog.Logger
}
func NewManager(cfg ManagerConfig) *Manager {
logger := cfg.Logger
if logger == nil {
logger = slog.Default()
}
return &Manager{
elfs: make(map[string]Elf),
router: cfg.Router,
tools: cfg.Tools,
logger: logger,
}
}
// Spawn creates a new background elf with a router-selected provider.
// The elf gets its own engine, history, and tools — no shared state.
func (m *Manager) Spawn(ctx context.Context, taskType router.TaskType, prompt, systemPrompt string) (Elf, error) {
// Ask router for the best arm for this task type
task := router.Task{
Type: taskType,
RequiresTools: true,
Priority: router.PriorityNormal,
EstimatedTokens: 4000,
}
decision := m.router.Select(task)
if decision.Error != nil {
return nil, fmt.Errorf("no arm available for elf: %w", decision.Error)
}
arm := decision.Arm
m.logger.Info("spawning elf",
"arm", arm.ID,
"task_type", taskType,
"model", arm.ModelName,
)
// Create independent engine for the elf
eng, err := engine.New(engine.Config{
Provider: arm.Provider,
Tools: m.tools,
System: systemPrompt,
Model: arm.ModelName,
MaxTurns: 20,
Logger: m.logger,
})
if err != nil {
return nil, fmt.Errorf("create elf engine: %w", err)
}
elf := SpawnBackground(eng, prompt)
m.mu.Lock()
m.elfs[elf.ID()] = elf
m.mu.Unlock()
m.logger.Info("elf spawned", "id", elf.ID(), "arm", arm.ID)
return elf, nil
}
// SpawnWithProvider creates an elf using a specific provider (bypasses router).
func (m *Manager) SpawnWithProvider(prov provider.Provider, model, prompt, systemPrompt string) (Elf, error) {
eng, err := engine.New(engine.Config{
Provider: prov,
Tools: m.tools,
System: systemPrompt,
Model: model,
MaxTurns: 20,
Logger: m.logger,
})
if err != nil {
return nil, fmt.Errorf("create elf engine: %w", err)
}
elf := SpawnBackground(eng, prompt)
m.mu.Lock()
m.elfs[elf.ID()] = elf
m.mu.Unlock()
m.logger.Info("elf spawned (direct)", "id", elf.ID(), "model", model)
return elf, nil
}
// Get returns an elf by ID.
func (m *Manager) Get(id string) (Elf, bool) {
m.mu.RLock()
defer m.mu.RUnlock()
e, ok := m.elfs[id]
return e, ok
}
// List returns all tracked elfs.
func (m *Manager) List() []Elf {
m.mu.RLock()
defer m.mu.RUnlock()
elfs := make([]Elf, 0, len(m.elfs))
for _, e := range m.elfs {
elfs = append(elfs, e)
}
return elfs
}
// Active returns elfs that are still running.
func (m *Manager) Active() []Elf {
m.mu.RLock()
defer m.mu.RUnlock()
var active []Elf
for _, e := range m.elfs {
if e.Status() == StatusRunning {
active = append(active, e)
}
}
return active
}
// CancelAll cancels all running elfs.
func (m *Manager) CancelAll() {
m.mu.RLock()
defer m.mu.RUnlock()
for _, e := range m.elfs {
if e.Status() == StatusRunning {
e.Cancel()
}
}
}
// WaitAll waits for all elfs to complete and returns their results.
func (m *Manager) WaitAll() []Result {
elfs := m.List()
results := make([]Result, len(elfs))
var wg sync.WaitGroup
for i, e := range elfs {
wg.Add(1)
go func(idx int, elf Elf) {
defer wg.Done()
results[idx] = elf.Wait()
}(i, e)
}
wg.Wait()
return results
}
// Cleanup removes completed/failed/cancelled elfs from tracking.
func (m *Manager) Cleanup() {
m.mu.Lock()
defer m.mu.Unlock()
for id, e := range m.elfs {
s := e.Status()
if s == StatusCompleted || s == StatusFailed || s == StatusCancelled {
delete(m.elfs, id)
}
}
}