Skip to content

Commit 3603dc0

Browse files
ptitjes, Ololoshechkin
authored and committed
Enhance the Ollama model definitions (#149)
1 parent ed30412 commit 3603dc0

File tree

6 files changed

+43
-131
lines changed

6 files changed

+43
-131
lines changed

prompt/prompt-executor/prompt-executor-clients/prompt-executor-ollama-client/src/commonMain/kotlin/ai/koog/prompt/executor/ollama/client/OllamaClient.kt

Lines changed: 9 additions & 22 deletions
Original file line numberDiff line numberDiff line change
@@ -7,6 +7,7 @@ import ai.koog.prompt.executor.clients.LLMClient
77
import ai.koog.prompt.executor.clients.LLMEmbeddingProvider
88
import ai.koog.prompt.executor.ollama.client.dto.*
99
import ai.koog.prompt.llm.LLMCapability
10+
import ai.koog.prompt.llm.LLMProvider
1011
import ai.koog.prompt.llm.LLModel
1112
import ai.koog.prompt.message.Message
1213
import io.ktor.client.*
@@ -30,13 +31,11 @@ import kotlinx.serialization.json.Json
3031
* @property baseUrl The base URL of the Ollama API server.
3132
* @property baseClient The HTTP client used for making requests.
3233
* @property timeoutConfig Timeout configuration for HTTP requests.
33-
* @property enableDynamicModels Whether to enable dynamic model resolution.
3434
*/
3535
public class OllamaClient(
3636
private val baseUrl: String = "http://localhost:11434",
3737
baseClient: HttpClient = HttpClient(engineFactoryProvider()),
3838
timeoutConfig: ConnectionTimeoutConfig = ConnectionTimeoutConfig(),
39-
private val enableDynamicModels: Boolean = true
4039
): LLMClient, LLMEmbeddingProvider {
4140

4241
private val ollamaJson = Json {
@@ -65,17 +64,13 @@ public class OllamaClient(
6564
model: LLModel,
6665
tools: List<ToolDescriptor>
6766
): List<Message.Response> {
68-
val ollamaModelName = if (enableDynamicModels) {
69-
modelResolver.resolveToOllamaName(model)
70-
} else {
71-
model.toOllamaModelId()
72-
}
67+
require(model.provider == LLMProvider.Ollama) { "Model not supported by Ollama" }
7368

7469
val response = client.post("$baseUrl/api/chat") {
7570
contentType(ContentType.Application.Json)
7671
setBody(
7772
OllamaChatRequestDTO(
78-
model = ollamaModelName,
73+
model = model.id,
7974
messages = prompt.toOllamaChatMessages(),
8075
stream = false,
8176
tools = if (tools.isNotEmpty()) tools.map { it.toOllamaTool() } else null
@@ -97,17 +92,13 @@ public class OllamaClient(
9792
prompt: Prompt,
9893
model: LLModel
9994
): Flow<String> = flow {
100-
val ollamaModelName = if (enableDynamicModels) {
101-
modelResolver.resolveToOllamaName(model)
102-
} else {
103-
model.toOllamaModelId()
104-
}
95+
require(model.provider == LLMProvider.Ollama) { "Model not supported by Ollama" }
10596

10697
val response = client.post("$baseUrl/api/chat") {
10798
contentType(ContentType.Application.Json)
10899
setBody(
109100
OllamaChatRequestDTO(
110-
model = ollamaModelName,
101+
model = model.id,
111102
messages = prompt.toOllamaChatMessages(),
112103
stream = true,
113104
)
@@ -127,7 +118,7 @@ public class OllamaClient(
127118
emit(content)
128119
}
129120
}
130-
} catch (e: Exception) {
121+
} catch (_: Exception) {
131122
// Skip malformed JSON lines
132123
continue
133124
}
@@ -143,19 +134,15 @@ public class OllamaClient(
143134
* @throws IllegalArgumentException if the model does not have the Embed capability.
144135
*/
145136
override suspend fun embed(text: String, model: LLModel): List<Double> {
137+
require(model.provider == LLMProvider.Ollama) { "Model not supported by Ollama" }
138+
146139
if (!model.capabilities.contains(LLMCapability.Embed)) {
147140
throw IllegalArgumentException("Model ${model.id} does not have the Embed capability")
148141
}
149142

150-
val ollamaModelName = if (enableDynamicModels) {
151-
modelResolver.resolveToOllamaName(model)
152-
} else {
153-
model.id
154-
}
155-
156143
val response = client.post("$baseUrl/api/embeddings") {
157144
contentType(ContentType.Application.Json)
158-
setBody(EmbeddingRequest(model = ollamaModelName, prompt = text))
145+
setBody(EmbeddingRequest(model = model.id, prompt = text))
159146
}
160147

161148
val embeddingResponse = response.body<EmbeddingResponse>()

prompt/prompt-executor/prompt-executor-clients/prompt-executor-ollama-client/src/commonMain/kotlin/ai/koog/prompt/executor/ollama/client/OllamaModelManager.kt

Lines changed: 6 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -91,9 +91,9 @@ public class OllamaModelManager(
9191
val capabilities = detectCapabilities(matchedModel)
9292

9393
return LLModel(
94-
provider = LLMProvider.Meta, // Default to Meta for now
95-
id = "ollama-${matchedModel.name}",
96-
capabilities = capabilities
94+
provider = LLMProvider.Ollama,
95+
id = matchedModel.name,
96+
capabilities = capabilities,
9797
)
9898
}
9999

@@ -122,8 +122,6 @@ public class OllamaModelManager(
122122
return null
123123
}
124124

125-
126-
127125
/**
128126
* Detects capabilities based on model information - purely dynamic.
129127
*/
@@ -189,9 +187,9 @@ public class OllamaModelManager(
189187
val capabilities = getCapabilitiesForFamily(family)
190188

191189
return LLModel(
192-
provider = LLMProvider.Meta, // Default provider
193-
id = "ollama-dynamic-$modelName",
194-
capabilities = capabilities
190+
provider = LLMProvider.Ollama,
191+
id = modelName,
192+
capabilities = capabilities,
195193
)
196194
}
197195

prompt/prompt-executor/prompt-executor-clients/prompt-executor-ollama-client/src/commonMain/kotlin/ai/koog/prompt/executor/ollama/client/OllamaModelResolver.kt

Lines changed: 0 additions & 54 deletions
Original file line numberDiff line numberDiff line change
@@ -10,60 +10,6 @@ import io.github.oshai.kotlinlogging.KotlinLogging
1010
public class OllamaModelResolver(
1111
private val modelManager: OllamaModelManager
1212
) {
13-
private val logger = KotlinLogging.logger { }
14-
15-
/**
16-
* Only the absolute minimum static mappings for backward compatibility.
17-
* These are for the existing hardcoded models in the codebase.
18-
*/
19-
private val backwardCompatibilityMappings = mapOf(
20-
"meta-llama-3-2" to "llama3.2",
21-
"alibaba-qwq" to "qwq",
22-
"alibaba-qwen-coder-2-5-32b" to "qwen2.5-coder:32b"
23-
)
24-
25-
/**
26-
* Resolves an LLModel to the actual Ollama model name - fully dynamic.
27-
*/
28-
public suspend fun resolveToOllamaName(model: LLModel): String {
29-
// Check backward compatibility mappings first (only for existing hardcoded models)
30-
backwardCompatibilityMappings[model.id]?.let {
31-
logger.debug { "Resolved ${model.id} to $it via backward compatibility mapping" }
32-
return it
33-
}
34-
35-
// If the model ID starts with "ollama-", extract the actual model name
36-
if (model.id.startsWith("ollama-")) {
37-
val extractedName = model.id.removePrefix("ollama-")
38-
if (extractedName.startsWith("dynamic-")) {
39-
return extractedName.removePrefix("dynamic-")
40-
}
41-
return extractedName
42-
}
43-
44-
// Try to find the model in available models by exact match
45-
val availableModels = modelManager.getAvailableModels()
46-
47-
// First try exact match
48-
availableModels.find { it.name.equals(model.id, ignoreCase = true) }?.let {
49-
logger.debug { "Found exact match for ${model.id} as ${it.name}" }
50-
return it.name
51-
}
52-
53-
// Try to find by partial match
54-
availableModels.find {
55-
it.name.contains(model.id, ignoreCase = true) ||
56-
it.model.contains(model.id, ignoreCase = true)
57-
}?.let {
58-
logger.debug { "Found partial match for ${model.id} as ${it.name}" }
59-
return it.name
60-
}
61-
62-
// As a last resort, use the model ID directly
63-
logger.warn { "No mapping found for model ${model.id}, using ID directly" }
64-
return model.id
65-
}
66-
6713
/**
6814
* Attempts to resolve a model name and create an LLModel if it doesn't exist.
6915
*/

prompt/prompt-executor/prompt-executor-clients/prompt-executor-ollama-client/src/commonMain/kotlin/ai/koog/prompt/executor/ollama/client/dto/OllamaConverters.kt

Lines changed: 0 additions & 32 deletions
Original file line numberDiff line numberDiff line change
@@ -3,42 +3,10 @@ package ai.koog.prompt.executor.ollama.client.dto
33
import ai.koog.agents.core.tools.ToolDescriptor
44
import ai.koog.prompt.dsl.Prompt
55
import ai.koog.prompt.executor.ollama.tools.json.toJSONSchema
6-
import ai.koog.prompt.llm.LLModel
7-
import ai.koog.prompt.llm.OllamaModels
86
import ai.koog.prompt.message.Message
97
import kotlinx.serialization.encodeToString
108
import kotlinx.serialization.json.Json
119

12-
/**
13-
* Converts LLModel to Ollama model ID string.
14-
* This function provides backward compatibility for hardcoded models.
15-
* For dynamic model resolution, use OllamaModelResolver instead.
16-
*/
17-
internal fun LLModel.toOllamaModelId(): String = when (this.id) {
18-
OllamaModels.Meta.LLAMA_3_2.id -> "llama3.2"
19-
OllamaModels.Alibaba.QWQ.id -> "qwq"
20-
OllamaModels.Alibaba.QWEN_CODER_2_5_32B.id -> "qwen2.5-coder:32b"
21-
else -> {
22-
// Try to extract model name from dynamic model IDs
23-
when {
24-
this.id.startsWith("ollama-") -> {
25-
val extractedName = this.id.removePrefix("ollama-")
26-
if (extractedName.startsWith("dynamic-")) {
27-
extractedName.removePrefix("dynamic-")
28-
} else {
29-
extractedName
30-
}
31-
}
32-
33-
else -> {
34-
// Log warning and use ID directly as fallback
35-
println("Warning: Unknown model ID ${this.id}, using ID directly. Consider using OllamaModelResolver for dynamic model support.")
36-
this.id
37-
}
38-
}
39-
}
40-
}
41-
4210
/**
4311
* Converts a Prompt to a list of ChatMessage objects for the Ollama API.
4412
*/

prompt/prompt-llm/src/commonMain/kotlin/ai/koog/prompt/llm/LLMProvider.kt

Lines changed: 14 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -70,7 +70,7 @@ public sealed class LLMProvider(public val id: String, public val display: Strin
7070
*/
7171
@Serializable
7272
public data object Alibaba : LLMProvider("alibaba", "Alibaba")
73-
73+
7474
/**
7575
* Represents the OpenRouter provider within the available set of large language model providers.
7676
*
@@ -83,4 +83,17 @@ public sealed class LLMProvider(public val id: String, public val display: Strin
8383
*/
8484
@Serializable
8585
public data object OpenRouter : LLMProvider("openrouter", "OpenRouter")
86+
87+
/**
88+
* Represents the Ollama provider within the available set of large language model providers.
89+
*
90+
* Ollama is identified by its unique ID ("ollama") and display name ("Ollama").
91+
* It extends the `LLMProvider` sealed class, which serves as a base class for all supported language model providers.
92+
*
93+
* This data object adheres to the structure and serialization requirements defined by the parent class.
94+
* It is part of the available LLM provider hierarchy, which is used to configure and identify specific
95+
* providers for large language model functionalities and capabilities.
96+
*/
97+
@Serializable
98+
public data object Ollama : LLMProvider("ollama", "Ollama")
8699
}

prompt/prompt-llm/src/commonMain/kotlin/ai/koog/prompt/llm/OllamaModels.kt

Lines changed: 14 additions & 14 deletions
Original file line numberDiff line numberDiff line change
@@ -1,20 +1,20 @@
11
package ai.koog.prompt.llm
22

33
/**
4-
* Represents a collection of predefined Large Language Models (LLM) categorized by providers.
5-
* Each provider contains specific models with configurations such as unique identifiers and capabilities.
4+
* Represents a collection of predefined Large Language Models (LLM) categorized by makers.
5+
* Each maker contains specific models with configurations such as unique identifiers and capabilities.
66
*/
77
public object OllamaModels {
88
/**
9-
* The `Meta` object represents the configuration for the Meta-provided large language models (LLMs).
9+
* The `Meta` object represents the configuration for the Meta large language models (LLMs).
1010
* It contains the predefined model specifications for Meta's LLMs, including their identifiers
1111
* and supported capabilities.
1212
*/
1313
public object Meta {
1414
/**
1515
* Represents the LLAMA version 3.2 model provided by Meta.
1616
*
17-
* This variable defines an instance of the `LLModel` class with the Meta provider, a unique identifier "meta-llama-3-2",
17+
* This variable defines an instance of the `LLModel` class with the Ollama provider, a unique identifier "llama3.2",
1818
* and a set of capabilities. The supported capabilities include:
1919
* - Temperature adjustment.
2020
* - JSON Schema-based tasks (Simple Schema).
@@ -24,8 +24,8 @@ public object OllamaModels {
2424
* that require dynamic behavior adjustments, schema adherence, and tool-based interactions.
2525
*/
2626
public val LLAMA_3_2: LLModel = LLModel(
27-
provider = LLMProvider.Meta,
28-
id = "meta-llama-3-2",
27+
provider = LLMProvider.Ollama,
28+
id = "llama3.2",
2929
capabilities = listOf(
3030
LLMCapability.Temperature,
3131
LLMCapability.Schema.JSON.Simple,
@@ -35,16 +35,16 @@ public object OllamaModels {
3535
}
3636

3737
/**
38-
* Represents an object that contains predefined Large Language Models (LLMs) provided by Alibaba.
38+
* Represents an object that contains predefined Large Language Models (LLMs) made by Alibaba.
3939
*
4040
* The `Alibaba` object provides access to multiple LLM instances, each with specific identifiers and capabilities.
41-
* These models are configured with Alibaba as the provider and are characterized by their unique capabilities.
41+
* These models are configured with Ollama as the provider and are characterized by their unique capabilities.
4242
*/
4343
public object Alibaba {
4444
/**
4545
* Represents the `QWQ` language model instance provided by Alibaba with specific capabilities.
4646
*
47-
* The model is identified by its unique `id` "alibaba-qwq". It belongs to the Alibaba provider
47+
* The model is identified by its unique `id` "qwq". It belongs to the Ollama provider
4848
* and supports multiple advanced capabilities:
4949
* - Temperature Adjustment: Enables control over the randomness of the model's output.
5050
* - JSON Schema (Simple): Supports tasks structured through simple JSON schemas.
@@ -54,8 +54,8 @@ public object OllamaModels {
5454
* require these capabilities for varied and advanced tasks.
5555
*/
5656
public val QWQ: LLModel = LLModel(
57-
provider = LLMProvider.Alibaba,
58-
id = "alibaba-qwq",
57+
provider = LLMProvider.Ollama,
58+
id = "qwq",
5959
capabilities = listOf(
6060
LLMCapability.Temperature,
6161
LLMCapability.Schema.JSON.Simple,
@@ -71,11 +71,11 @@ public object OllamaModels {
7171
* - `Schema.JSON.Simple`: Supports tasks requiring JSON schema validation and handling in a simplified manner.
7272
* - `Tools`: Enables interaction with external tools or functionalities within the model's ecosystem.
7373
*
74-
* The model is identified by the unique ID "alibaba-qwen-coder-2-5-32b" and categorized under the Alibaba provider.
74+
* The model is identified by the unique ID "qwen2.5-coder:32b" and categorized under the Ollama provider.
7575
*/
7676
public val QWEN_CODER_2_5_32B: LLModel = LLModel(
77-
provider = LLMProvider.Alibaba,
78-
id = "alibaba-qwen-coder-2-5-32b",
77+
provider = LLMProvider.Ollama,
78+
id = "qwen2.5-coder:32b",
7979
capabilities = listOf(
8080
LLMCapability.Temperature,
8181
LLMCapability.Schema.JSON.Simple,

0 commit comments

Comments (0)