fix(agent): improve ReAct parser and tool schemas for better LLM compatibility

- Fix ACTION_INPUT regex to properly capture multiline JSON responses
  - Changed from stopping at the first newline to capturing all remaining text
    (see the sketch below)
  - Resolves parsing errors when the LLM emits pretty-printed JSON with line breaks

- Enhance tool schemas with detailed descriptions and parameter specifications
  - Add comprehensive Message schema for generate_text tool
  - Clarify distinction between resources/get (file read) and resources/list (directory listing)
  - Include clear usage guidance in tool descriptions

- Set default model to llama3.2:latest instead of invalid "ollama"

- Add parse error debugging to help troubleshoot LLM response issues

The agent infrastructure now correctly handles multiline tool arguments and
provides better guidance to LLMs through improved tool schemas. Remaining
errors are due to LLM quality (model making poor tool choices or generating
malformed responses), not infrastructure bugs.

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude <noreply@anthropic.com>
commit 33d11ae223 (parent 05e90d3e2b)
Date: 2025-10-09 19:43:07 +02:00
25 changed files with 1348 additions and 121 deletions


@@ -12,9 +12,9 @@ serde_json = "1.0"
 anyhow = "1.0"
 tokio-stream = "0.1"
 
-[lib]
-path = "src/lib.rs"
-
 [[bin]]
 name = "owlen-mcp-llm-server"
 path = "src/lib.rs"
+
+[lib]
+path = "src/lib.rs"


@@ -38,16 +38,33 @@ struct GenerateTextArgs {
 fn generate_text_descriptor() -> McpToolDescriptor {
     McpToolDescriptor {
         name: "generate_text".to_string(),
-        description: "Generate text using Ollama LLM".to_string(),
-        // Very permissive schema; callers must supply proper fields
+        description: "Generate text using Ollama LLM. Each message must have 'role' (user/assistant/system) and 'content' (string) fields.".to_string(),
         input_schema: json!({
             "type": "object",
             "properties": {
-                "messages": {"type": "array"},
-                "temperature": {"type": ["number", "null"]},
-                "max_tokens": {"type": ["integer", "null"]},
-                "model": {"type": "string"},
-                "stream": {"type": "boolean"}
+                "messages": {
+                    "type": "array",
+                    "items": {
+                        "type": "object",
+                        "properties": {
+                            "role": {
+                                "type": "string",
+                                "enum": ["user", "assistant", "system"],
+                                "description": "The role of the message sender"
+                            },
+                            "content": {
+                                "type": "string",
+                                "description": "The message content"
+                            }
+                        },
+                        "required": ["role", "content"]
+                    },
+                    "description": "Array of message objects with role and content"
+                },
+                "temperature": {"type": ["number", "null"], "description": "Sampling temperature (0.0-2.0)"},
+                "max_tokens": {"type": ["integer", "null"], "description": "Maximum tokens to generate"},
+                "model": {"type": "string", "description": "Model name (e.g., llama3.2:latest)"},
+                "stream": {"type": "boolean", "description": "Whether to stream the response"}
             },
             "required": ["messages", "model", "stream"]
         }),
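
Under the tightened schema, a minimal valid argument object for generate_text
looks like this (a sketch; the values are illustrative):

    use serde_json::json; // serde_json = "1.0"

    fn main() {
        // Arguments that satisfy the new schema: messages with explicit
        // role/content, plus the required model and stream fields.
        let args = json!({
            "messages": [
                {"role": "system", "content": "You are a helpful assistant."},
                {"role": "user", "content": "Summarize what this repository does."}
            ],
            "model": "llama3.2:latest",
            "stream": false,
            "temperature": 0.2
        });
        println!("{}", serde_json::to_string_pretty(&args).unwrap());
    }
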
@@ -56,6 +73,39 @@ fn generate_text_descriptor() -> McpToolDescriptor {
     }
 }
 
+/// Tool descriptor for resources/get (read file)
+fn resources_get_descriptor() -> McpToolDescriptor {
+    McpToolDescriptor {
+        name: "resources/get".to_string(),
+        description: "Read and return the TEXT CONTENTS of a single FILE. Use this to read the contents of code files, config files, or text documents. Do NOT use for directories.".to_string(),
+        input_schema: json!({
+            "type": "object",
+            "properties": {
+                "path": {"type": "string", "description": "Path to the FILE (not directory) to read"}
+            },
+            "required": ["path"]
+        }),
+        requires_network: false,
+        requires_filesystem: vec!["read".to_string()],
+    }
+}
+
+/// Tool descriptor for resources/list (list directory)
+fn resources_list_descriptor() -> McpToolDescriptor {
+    McpToolDescriptor {
+        name: "resources/list".to_string(),
+        description: "List the NAMES of all files and directories in a directory. Use this to see what files exist in a folder, or to list directory contents. Returns an array of file/directory names.".to_string(),
+        input_schema: json!({
+            "type": "object",
+            "properties": {
+                "path": {"type": "string", "description": "Path to the DIRECTORY to list (use '.' for current directory)"}
+            }
+        }),
+        requires_network: false,
+        requires_filesystem: vec!["read".to_string()],
+    }
+}
+
 async fn handle_generate_text(args: GenerateTextArgs) -> Result<String, RpcError> {
     // Create provider with default local Ollama URL
     let provider = OllamaProvider::new("http://localhost:11434")
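
The two descriptors encode the file-vs-directory split the commit message
mentions; as a sketch, well-formed argument objects for each tool (the paths
are illustrative):

    use serde_json::json; // serde_json = "1.0"

    fn main() {
        // resources/get: the path must name a FILE whose text is returned.
        let get_args = json!({"path": "src/lib.rs"});
        // resources/list: the path names a DIRECTORY; "." lists the cwd.
        let list_args = json!({"path": "."});
        println!("{get_args}\n{list_args}");
    }
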
@@ -130,8 +180,12 @@ async fn handle_request(req: &RpcRequest) -> Result<Value, RpcError> {
             Ok(serde_json::to_value(result).unwrap())
         }
         methods::TOOLS_LIST => {
-            let desc = generate_text_descriptor();
-            Ok(json!([desc]))
+            let tools = vec![
+                generate_text_descriptor(),
+                resources_get_descriptor(),
+                resources_list_descriptor(),
+            ];
+            Ok(json!(tools))
         }
         // New method to list available Ollama models via the provider.
         methods::MODELS_LIST => {
@@ -213,8 +267,6 @@ async fn main() -> anyhow::Result<()> {
             }
         };
         // Dispatch based on the requested tool name.
-        // Debug tool name for troubleshooting
-        eprintln!("Tool name received: {}", call.name);
         // Handle resources tools manually.
         if call.name.starts_with("resources/get") {
             let path = call
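
For context, the end goal of the parser and schema changes together: a ReAct
turn like the one below (marker strings assume the usual ReAct prompt
template) now parses cleanly, multiline JSON included, and dispatches to the
right tool:

    Thought: I should see the project layout before reading any file.
    Action: resources/list
    Action Input: {
      "path": "."
    }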