  * Ollama provider implementation using the official Ollama npm package
  */
 
-import ollama, { Ollama, ChatResponse, Tool } from 'ollama';
+import {
+  ChatRequest as OllamaChatRequest,
+  ChatResponse as OllamaChatResponse,
+  Ollama,
+  ToolCall as OllamaToolCall,
+  Tool as OllamaTool,
+  Message as OllamaMessage,
+} from 'ollama';
+
 import { TokenUsage } from '../../tokens.js';
+import { ToolCall } from '../../types.js';
 import { LLMProvider } from '../provider.js';
 import {
-  FunctionDefinition,
   GenerateOptions,
   LLMResponse,
   Message,
   ProviderOptions,
+  FunctionDefinition,
 } from '../types.js';
 
 /**
@@ -31,9 +40,9 @@ export class OllamaProvider implements LLMProvider {
 
   constructor(model: string, options: OllamaOptions = {}) {
     this.model = model;
-    const baseUrl =
-      options.baseUrl ||
-      process.env.OLLAMA_BASE_URL ||
+    const baseUrl =
+      options.baseUrl ||
+      process.env.OLLAMA_BASE_URL ||
       'http://localhost:11434';
 
     this.client = new Ollama({ host: baseUrl });
@@ -57,133 +66,165 @@ export class OllamaProvider implements LLMProvider {
     // Format messages for Ollama API
     const formattedMessages = this.formatMessages(messages);
 
-    try {
-      // Prepare chat options
-      const ollamaOptions: Record<string, any> = {
-        temperature,
-      };
-
-      // Add optional parameters if provided
-      if (topP !== undefined) ollamaOptions.top_p = topP;
-      if (frequencyPenalty !== undefined) ollamaOptions.frequency_penalty = frequencyPenalty;
-      if (presencePenalty !== undefined) ollamaOptions.presence_penalty = presencePenalty;
-      if (maxTokens !== undefined) ollamaOptions.num_predict = maxTokens;
-      if (stopSequences && stopSequences.length > 0) ollamaOptions.stop = stopSequences;
-
-      // Prepare request parameters
-      const requestParams: any = {
-        model: this.model,
-        messages: formattedMessages,
-        stream: false,
-        options: ollamaOptions,
+    // Prepare request options
+    const requestOptions: OllamaChatRequest = {
+      model: this.model,
+      messages: formattedMessages,
+      stream: false,
+      options: {
+        temperature: temperature,
+        ...(topP !== undefined && { top_p: topP }),
+        ...(frequencyPenalty !== undefined && {
+          frequency_penalty: frequencyPenalty,
+        }),
+        ...(presencePenalty !== undefined && {
+          presence_penalty: presencePenalty,
+        }),
+        ...(stopSequences &&
+          stopSequences.length > 0 && { stop: stopSequences }),
+      },
+    };
+
+    // Add max_tokens if provided
+    if (maxTokens !== undefined) {
+      requestOptions.options = {
+        ...requestOptions.options,
+        num_predict: maxTokens,
       };
+    }
 
-      // Add functions/tools if provided
-      if (functions && functions.length > 0) {
-        requestParams.tools = this.convertFunctionsToTools(functions);
-      }
+    // Add functions/tools if provided
+    if (functions && functions.length > 0) {
+      requestOptions.tools = this.convertFunctionsToTools(functions);
+    }
 
-      // Make the API request using the Ollama client
-      const response = await this.client.chat(requestParams);
+    // Make the API request using the Ollama client
+    const response: OllamaChatResponse = await this.client.chat({
+      ...requestOptions,
+      stream: false,
+    });
 
-      // Extract content from response
-      const content = response.message?.content || '';
-
-      // Process tool calls if present
-      const toolCalls = this.processToolCalls(response);
+    // Extract content and tool calls
+    const content = response.message?.content || '';
 
-      // Create token usage from response data
-      const tokenUsage = new TokenUsage();
-      if (response.prompt_eval_count) {
-        tokenUsage.input = response.prompt_eval_count;
-      }
-      if (response.eval_count) {
-        tokenUsage.output = response.eval_count;
-      }
+    // Handle tool calls if present
+    const toolCalls = this.extractToolCalls(response);
 
-      return {
-        text: content,
-        toolCalls: toolCalls,
-        tokenUsage: tokenUsage,
-      };
-    } catch (error) {
-      throw new Error(`Error calling Ollama API: ${(error as Error).message}`);
-    }
+    // Create token usage from response data
+    const tokenUsage = new TokenUsage();
+    tokenUsage.output = response.eval_count || 0;
+    tokenUsage.input = response.prompt_eval_count || 0;
+
+    return {
+      text: content,
+      toolCalls: toolCalls,
+      tokenUsage: tokenUsage,
+    };
   }
 
+  /*
+  For reference, Ollama's Tool type has the following shape:
+
+  interface Tool {
+    type: string;
+    function: {
+      name: string;
+      description: string;
+      parameters: {
+        type: string;
+        required: string[];
+        properties: {
+          [key: string]: {
+            type: string;
+            description: string;
+            enum?: string[];
+          };
+        };
+      };
+    };
+  }
+  */
+
   /**
-   * Convert our FunctionDefinition format to Ollama's Tool format
+   * Convert our function definitions to Ollama tool format
    */
-  private convertFunctionsToTools(functions: FunctionDefinition[]): Tool[] {
-    return functions.map((fn) => ({
-      type: 'function',
-      function: {
-        name: fn.name,
-        description: fn.description,
-        parameters: fn.parameters,
-      }
-    }));
+  private convertFunctionsToTools(
+    functions: FunctionDefinition[],
+  ): OllamaTool[] {
+    return functions.map(
+      (fn) =>
+        ({
+          type: 'function',
+          function: {
+            name: fn.name,
+            description: fn.description,
+            parameters: fn.parameters,
+          },
+        }) as OllamaTool,
+    );
   }
 
   /**
-   * Process tool calls from the Ollama response
+   * Extract tool calls from Ollama response
    */
-  private processToolCalls(response: ChatResponse): any[] {
-    if (!response.message?.tool_calls || response.message.tool_calls.length === 0) {
+  private extractToolCalls(response: OllamaChatResponse): ToolCall[] {
+    if (!response.message?.tool_calls) {
       return [];
     }
 
-    return response.message.tool_calls.map((toolCall) => ({
-      id: toolCall.function?.name
-        ? `tool-${Date.now()}-${Math.random().toString(36).substring(2, 11)}`
-        : toolCall.id,
-      name: toolCall.function?.name,
-      content: JSON.stringify(toolCall.function?.arguments || {}),
-    }));
+    return response.message.tool_calls.map((toolCall: OllamaToolCall) => {
+      return {
+        id: `tool-${Date.now()}-${Math.random().toString(36).substring(2, 11)}`,
+        name: toolCall.function?.name,
+        content:
+          typeof toolCall.function?.arguments === 'string'
+            ? toolCall.function.arguments
+            : JSON.stringify(toolCall.function?.arguments || {}),
+      };
+    });
   }
 
   /**
    * Format messages for Ollama API
    */
-  private formatMessages(messages: Message[]): any[] {
-    return messages.map((msg) => {
-      if (
-        msg.role === 'user' ||
-        msg.role === 'assistant' ||
-        msg.role === 'system'
-      ) {
-        return {
-          role: msg.role,
-          content: msg.content,
-        };
-      } else if (msg.role === 'tool_result') {
-        // Ollama expects tool results as a 'tool' role
-        return {
-          role: 'tool',
-          content: msg.content,
-          tool_call_id: msg.tool_use_id,
-        };
-      } else if (msg.role === 'tool_use') {
-        // We'll convert tool_use to assistant messages with tool_calls
-        return {
-          role: 'assistant',
-          content: '',
-          tool_calls: [
+  private formatMessages(messages: Message[]): OllamaMessage[] {
+    const output: OllamaMessage[] = [];
+
+    messages.forEach((msg) => {
+      switch (msg.role) {
+        case 'user':
+        case 'assistant':
+        case 'system':
+          output.push({
+            role: msg.role,
+            content: msg.content,
+          } satisfies OllamaMessage);
+          break;
+        case 'tool_result':
+          // Ollama expects tool results as a 'tool' role
+          output.push({
+            role: 'tool',
+            content:
+              typeof msg.content === 'string'
+                ? msg.content
+                : JSON.stringify(msg.content),
+          } as OllamaMessage);
+          break;
+        case 'tool_use': {
+          // Ollama expects tool calls to be part of the assistant message,
+          // so append this tool call to the most recent message in the output
+          const lastMessage: OllamaMessage = output[output.length - 1]!;
+          lastMessage.tool_calls = [
             {
-              id: msg.id,
               function: {
                 name: msg.name,
-                arguments: msg.content,
-              }
+                arguments: JSON.parse(msg.content),
+              },
             },
-          ],
-        };
+          ];
+          break;
+        }
       }
-      // Default fallback for unknown message types
-      return {
-        role: 'user',
-        content: (msg as any).content || '',
-      };
     });
+
+    return output;
   }
-}
+}
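
For context, here is a minimal usage sketch of the provider after this change. It is a sketch only: the import path, the generateText method name, and the exact GenerateOptions field names are assumptions inferred from the types referenced in this diff, not confirmed by it.

// Hypothetical usage sketch -- import path, method name, and option
// names are assumptions based on the types referenced in the diff.
import { OllamaProvider } from './providers/ollama/ollama.js';

const provider = new OllamaProvider('llama3.2', {
  // Optional; falls back to OLLAMA_BASE_URL, then http://localhost:11434
  baseUrl: 'http://localhost:11434',
});

const result = await provider.generateText({
  messages: [
    { role: 'system', content: 'You are a helpful assistant.' },
    { role: 'user', content: 'Say hello.' },
  ],
  temperature: 0.7,
  maxTokens: 256, // mapped to Ollama's num_predict option
});

console.log(result.text);
console.log(result.tokenUsage); // input = prompt_eval_count, output = eval_count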