add orchestrator tests

Raezil · Raezil · commit 1b97b50b44ec · 2025-11-19T12:57:22.000+01:00
diff --git a/src/plugins/codemode/codemode.go b/src/plugins/codemode/codemode.go
@@ -42,6 +42,8 @@ type CodeModeUTCP struct {
 	model  interface {
 		Generate(ctx context.Context, prompt string) (any, error)
 	}
+	// For testing purposes, to mock the Execute method.
+	executeFunc func(ctx context.Context, args CodeModeArgs) (CodeModeResult, error)
 }
 
 func NewCodeModeUTCP(client utcp.UtcpClientInterface, model interface {
@@ -243,6 +245,10 @@ func indent(s, prefix string) string {
 }
 
 func (c *CodeModeUTCP) Execute(ctx context.Context, args CodeModeArgs) (CodeModeResult, error) {
+	// Allow mocking for tests
+	if c.executeFunc != nil {
+		return c.executeFunc(ctx, args)
+	}
 
 	i, stdout, stderr := newInterpreter()
 
diff --git a/src/plugins/codemode/orchestrator_test.go b/src/plugins/codemode/orchestrator_test.go
@@ -0,0 +1,287 @@
+package codemode
+
+import (
+	"context"
+	"encoding/json"
+	"errors"
+	"fmt"
+	"strings"
+	"testing"
+
+	"github.com/stretchr/testify/assert"
+	"github.com/stretchr/testify/require"
+	"github.com/universal-tool-calling-protocol/go-utcp/src/tools"
+)
+
+// mockModel is a scriptable stand-in for the language model used by the code
+// under test. Each test supplies GenerateFunc to decide what a prompt returns.
+type mockModel struct {
+	// GenerateFunc, when non-nil, handles every Generate call.
+	GenerateFunc func(ctx context.Context, prompt string) (any, error)
+}
+
+// Generate forwards the call to GenerateFunc. When no GenerateFunc has been
+// configured it returns a nil response together with an error.
+func (m *mockModel) Generate(ctx context.Context, prompt string) (any, error) {
+	if m.GenerateFunc == nil {
+		return nil, errors.New("GenerateFunc not implemented")
+	}
+	return m.GenerateFunc(ctx, prompt)
+}
+
+func TestDecideIfToolsNeeded(t *testing.T) {
+	ctx := context.Background()
+
+	tests := []struct {
+		name           string
+		mockResponse   any
+		mockError      error
+		expectedNeeds  bool
+		expectedError  bool
+		responseIsJSON bool
+	}{
+		{
+			name:           "LLM decides tools are needed",
+			mockResponse:   `{"needs": true}`,
+			expectedNeeds:  true,
+			expectedError:  false,
+			responseIsJSON: true,
+		},
+		{
+			name:           "LLM decides tools are not needed",
+			mockResponse:   `{"needs": false}`,
+			expectedNeeds:  false,
+			expectedError:  false,
+			responseIsJSON: true,
+		},
+		{
+			name:          "LLM returns an error",
+			mockError:     errors.New("LLM error"),
+			expectedNeeds: false,
+			expectedError: true,
+		},
+		{
+			name:           "LLM returns invalid JSON",
+			mockResponse:   `{"needs": tru}`,
+			expectedNeeds:  false,
+			expectedError:  false,
+			responseIsJSON: true,
+		},
+		{
+			name:           "LLM returns non-JSON string",
+			mockResponse:   "I don't know.",
+			expectedNeeds:  false,
+			expectedError:  false,
+			responseIsJSON: false,
+		},
+	}
+
+	for _, tc := range tests {
+		t.Run(tc.name, func(t *testing.T) {
+			mock := &mockModel{
+				GenerateFunc: func(ctx context.Context, prompt string) (any, error) {
+					if tc.responseIsJSON {
+						return tc.mockResponse, tc.mockError
+					}
+					return fmt.Sprintf("%v", tc.mockResponse), tc.mockError
+				},
+			}
+			cm := CodeModeUTCP{model: mock}
+
+			needs, err := cm.decideIfToolsNeeded(ctx, "some query", "some tools")
+
+			if tc.expectedError {
+				require.Error(t, err)
+			} else {
+				require.NoError(t, err)
+				assert.Equal(t, tc.expectedNeeds, needs)
+			}
+		})
+	}
+}
+
+// TestSelectTools checks that selectTools returns the tool names listed in the
+// model's JSON reply.
+func TestSelectTools(t *testing.T) {
+	reply := func(ctx context.Context, prompt string) (any, error) {
+		return `{"tools": ["tool1", "tool2"]}`, nil
+	}
+	cm := &CodeModeUTCP{model: &mockModel{GenerateFunc: reply}}
+
+	selected, err := cm.selectTools(context.Background(), "some query", "some tools")
+	require.NoError(t, err)
+
+	want := []string{"tool1", "tool2"}
+	assert.Equal(t, want, selected)
+}
+
+// TestGenerateSnippet checks that generateSnippet returns the code and stream
+// flag carried in the model's JSON reply.
+func TestGenerateSnippet(t *testing.T) {
+	ctx := context.Background()
+	mockResp := struct {
+		Code   string `json:"code"`
+		Stream bool   `json:"stream"`
+	}{
+		Code:   `__out = "result"`,
+		Stream: false,
+	}
+	// Fail fast if the fixture itself cannot be encoded, rather than feeding
+	// an empty reply to the code under test.
+	respBytes, err := json.Marshal(mockResp)
+	require.NoError(t, err, "marshalling the scripted model reply")
+
+	mock := &mockModel{
+		GenerateFunc: func(ctx context.Context, prompt string) (any, error) {
+			return string(respBytes), nil
+		},
+	}
+	cm := &CodeModeUTCP{model: mock}
+
+	snippet, stream, err := cm.generateSnippet(ctx, "query", []string{"tool1"}, "specs")
+
+	require.NoError(t, err)
+	assert.Equal(t, mockResp.Code, snippet)
+	assert.Equal(t, mockResp.Stream, stream)
+}
+
+// TestRenderUtcpToolsForPrompt renders a single tool spec and checks that the
+// prompt text contains each expected heading and field line.
+func TestRenderUtcpToolsForPrompt(t *testing.T) {
+	tool := tools.Tool{
+		Name:        "test.tool",
+		Description: "A test tool.",
+		Inputs: tools.ToolInputOutputSchema{
+			Properties: map[string]any{
+				"arg1": map[string]any{"type": "string"},
+			},
+			Required: []string{"arg1"},
+		},
+		Outputs: tools.ToolInputOutputSchema{
+			Properties: map[string]any{
+				"result": map[string]any{"type": "string"},
+			},
+		},
+	}
+
+	rendered := renderUtcpToolsForPrompt([]tools.Tool{tool})
+
+	wantFragments := []string{
+		"TOOL: test.tool",
+		"DESCRIPTION: A test tool.",
+		"INPUT FIELDS (USE EXACTLY THESE KEYS):",
+		"- arg1: string",
+		"REQUIRED FIELDS:",
+		"FULL INPUT SCHEMA (JSON):",
+		"OUTPUT SCHEMA (EXACT SHAPE RETURNED BY TOOL):",
+	}
+	for _, fragment := range wantFragments {
+		assert.Contains(t, rendered, fragment)
+	}
+}
+
+func TestExtractJSON(t *testing.T) {
+	tests := []struct {
+		name     string
+		input    string
+		expected string
+	}{
+		{"pure json", `{"key": "value"}`, `{"key": "value"}`},
+		{"json with markdown", "```json\n{\"key\": \"value\"}\n```", `{"key": "value"}`},
+		{"json with markdown no lang", "```\n{\"key\": \"value\"}\n```", `{"key": "value"}`},
+		{"json with trailing text", `{"key": "value"} | some other text`, `{"key": "value"}`},
+		{"nested json", `{"key": {"nested_key": "nested_value"}}`, `{"key": {"nested_key": "nested_value"}}`},
+		{"text before json", `Here is the JSON: {"key": "value"}`, `{"key": "value"}`},
+		{"empty string", "", ""},
+		{"not a json", "just a string", ""},
+		{"incomplete json", `{"key":`, ""},
+		{"json with escaped quotes", `{"key": "value with \"quotes\""}`, `{"key": "value with \"quotes\""}`},
+	}
+
+	for _, tc := range tests {
+		t.Run(tc.name, func(t *testing.T) {
+			assert.Equal(t, tc.expected, extractJSON(tc.input))
+		})
+	}
+}
+
+// TestIsValidSnippet checks which generated snippets isValidSnippet accepts
+// and which it rejects.
+func TestIsValidSnippet(t *testing.T) {
+	cases := []struct {
+		name string
+		code string
+		want bool
+	}{
+		{"valid snippet", `__out, err := codemode.CallTool("test", nil)`, true},
+		{"valid snippet with assignment", `__out = "hello"`, true},
+		{"invalid due to map[value:]", `__out = map[value:"hello"]`, false},
+		{"invalid due to missing __out", `result, err := codemode.CallTool("test", nil)`, false},
+		{"empty code", "", false},
+	}
+
+	for _, c := range cases {
+		t.Run(c.name, func(t *testing.T) {
+			got := isValidSnippet(c.code)
+			assert.Equal(t, c.want, got)
+		})
+	}
+}
+
+// TestCallTool_NoToolsNeeded checks that CallTool reports needed=false, an
+// empty result, and no error when the model says no tools are required.
+func TestCallTool_NoToolsNeeded(t *testing.T) {
+	// This reply targets the decideIfToolsNeeded step.
+	declineTools := func(ctx context.Context, prompt string) (any, error) {
+		return `{"needs": false}`, nil
+	}
+	cm := &CodeModeUTCP{model: &mockModel{GenerateFunc: declineTools}}
+
+	needed, result, err := cm.CallTool(context.Background(), "a prompt that doesn't need tools")
+
+	require.NoError(t, err)
+	assert.False(t, needed)
+	assert.Equal(t, "", result)
+}
+
+// TestCallTool_ToolsNeededAndExecuted walks CallTool through the full path:
+// the model asks for tools, selects one, and produces a snippet, which is then
+// handed to a stubbed executor whose result CallTool is expected to return.
+func TestCallTool_ToolsNeededAndExecuted(t *testing.T) {
+	ctx := context.Background()
+
+	// 1. Mock LLM responses for each step of the orchestration, keyed on a
+	// distinctive phrase from each prompt.
+	mock := &mockModel{
+		GenerateFunc: func(ctx context.Context, prompt string) (any, error) {
+			switch {
+			case strings.Contains(prompt, "Decide if the following user query requires using ANY UTCP tools"):
+				return `{"needs": true}`, nil
+			case strings.Contains(prompt, "Select ALL UTCP tools that match the user's intent"):
+				return `{"tools": ["test.tool"]}`, nil
+			case strings.Contains(prompt, "Generate a Go snippet"):
+				return `{"code": "__out = \"success\""}`, nil
+			default:
+				return nil, fmt.Errorf("unexpected prompt: %s", prompt)
+			}
+		},
+	}
+
+	// 2. Create a CodeModeUTCP instance with the mock model and a stubbed
+	// Execute, so the real interpreter is not used. An executor interface
+	// would be a cleaner seam than the executeFunc hook.
+	executed := false
+	cm := &CodeModeUTCP{
+		model: mock,
+		executeFunc: func(ctx context.Context, args CodeModeArgs) (CodeModeResult, error) {
+			executed = true
+			// assert rather than require: FailNow must only be called from the
+			// goroutine running the test, and this callback's caller is not
+			// under the test's control.
+			assert.Equal(t, `__out = "success"`, args.Code, "Code passed to Execute should match the generated snippet")
+			return CodeModeResult{Value: "execution result"}, nil
+		},
+	}
+
+	// 3. Call the function and assert the results.
+	needed, result, err := cm.CallTool(ctx, "a prompt that needs tools")
+	require.NoError(t, err)
+	assert.True(t, needed, "Should indicate that tools were needed")
+	assert.True(t, executed, "Mocked Execute function should have been invoked")
+
+	// A checked type assertion fails the test with a message instead of
+	// panicking when the result has an unexpected type.
+	res, ok := result.(CodeModeResult)
+	require.True(t, ok, "CallTool should return a CodeModeResult, got %T", result)
+	assert.Equal(t, "execution result", res.Value, "Should return the result from the mocked Execute function")
+}

Original file line number	Diff line number	Diff line change
`@@ -42,6 +42,8 @@ type CodeModeUTCP struct {`
`42`	`42`	`model interface {`
`43`	`43`	`Generate(ctx context.Context, prompt string) (any, error)`
`44`	`44`	`}`
	`45`	`+ // For testing purposes, to mock the Execute method.`
	`46`	`+ executeFunc func(ctx context.Context, args CodeModeArgs) (CodeModeResult, error)`
`45`	`47`	`}`
`46`	`48`
`47`	`49`	`func NewCodeModeUTCP(client utcp.UtcpClientInterface, model interface {`
`@@ -243,6 +245,10 @@ func indent(s, prefix string) string {`
`243`	`245`	`}`
`244`	`246`
`245`	`247`	`func (c *CodeModeUTCP) Execute(ctx context.Context, args CodeModeArgs) (CodeModeResult, error) {`
	`248`	`+ // Allow mocking for tests`
	`249`	`+ if c.executeFunc != nil {`
	`250`	`+ return c.executeFunc(ctx, args)`
	`251`	`+ }`
`246`	`252`
`247`	`253`	`i, stdout, stderr := newInterpreter()`
`248`	`254`