JetBrains
diff --git a/integration-tests/src/jvmTest/kotlin/ai/koog/integration/tests/AIAgentIntegrationTest.kt b/integration-tests/src/jvmTest/kotlin/ai/koog/integration/tests/AIAgentIntegrationTest.kt
Lines changed: 14 additions & 9 deletions
diff --git a/integration-tests/src/jvmTest/kotlin/ai/koog/integration/tests/MultipleLLMPromptExecutorIntegrationTest.kt b/integration-tests/src/jvmTest/kotlin/ai/koog/integration/tests/MultipleLLMPromptExecutorIntegrationTest.kt
Lines changed: 83 additions & 74 deletions
@@ -31,6 +31,7 @@ import ai.koog.integration.tests.utils.TestUtils.readTestGoogleAIKeyFromEnv
 import ai.koog.integration.tests.utils.TestUtils.readTestOpenAIKeyFromEnv
 import ai.koog.prompt.dsl.prompt
 import ai.koog.prompt.executor.clients.anthropic.AnthropicModels
+import ai.koog.prompt.executor.clients.google.GoogleModels
 import ai.koog.prompt.executor.clients.openai.OpenAIModels
 import ai.koog.prompt.executor.llms.SingleLLMPromptExecutor
 import ai.koog.prompt.executor.llms.all.simpleAnthropicExecutor
@@ -639,7 +640,7 @@ class AIAgentIntegrationTest {
         val bye = "Bye"
 
         val checkpointStrategy = strategy("checkpoint-strategy") {
-            val nodeHello by node<String, String>(hello) { input ->
+            val nodeHello by node<String, String>(hello) {
                 sayHello
             }
 
@@ -656,7 +657,7 @@ class AIAgentIntegrationTest {
                 savedMessage
             }
 
-            val nodeBye by node<String, String>(bye) { input ->
+            val nodeBye by node<String, String>(bye) {
                 sayBye
             }
 
@@ -744,7 +745,7 @@ class AIAgentIntegrationTest {
         val executionLog = StringBuilder()
 
         val rollbackStrategy = strategy("rollback-strategy") {
-            val nodeHello by node<String, String>(hello) { input ->
+            val nodeHello by node<String, String>(hello) {
                 executionLog.append(sayHelloLog)
                 sayHello
             }
@@ -762,12 +763,12 @@ class AIAgentIntegrationTest {
                 saySave
             }
 
-            val nodeBye by node<String, String>(bye) { input ->
+            val nodeBye by node<String, String>(bye) {
                 executionLog.append(sayByeLog)
                 sayBye
             }
 
-            val rollbackNode by node<String, String>(rollback) { input ->
+            val rollbackNode by node<String, String>(rollback) {
                 // Use a shared variable to prevent infinite rollbacks
                 // Only roll back once, then continue
                 if (!hasRolledBack) {
@@ -856,15 +857,15 @@ class AIAgentIntegrationTest {
         val noCheckpointByeError = "No checkpoint for Node Bye"
 
         val simpleStrategy = strategy(strategyName) {
-            val nodeHello by node<String, String>(hello) { input ->
+            val nodeHello by node<String, String>(hello) {
                 sayHello
             }
 
-            val nodeWorld by node<String, String>(world) { input ->
+            val nodeWorld by node<String, String>(world) {
                 sayWorld
             }
 
-            val node3 by node<String, String>(bye) { input ->
+            val node3 by node<String, String>(bye) {
                 sayBye
             }
 
@@ -929,7 +930,7 @@ class AIAgentIntegrationTest {
             JVMFilePersistencyStorageProvider(tempDir, "integration_AgentCheckpointStorageProvidersTest")
 
         val simpleStrategy = strategy(strategyName) {
-            val nodeHello by node<String, String>(hello) { input ->
+            val nodeHello by node<String, String>(hello) {
                 sayHello
             }
 
@@ -980,6 +981,10 @@ class AIAgentIntegrationTest {
     @MethodSource("openAIModels", "anthropicModels", "googleModels")
     fun integration_AgentWithToolsWithoutParamsTest(model: LLModel) = runTest(timeout = 120.seconds) {
         assumeTrue(model.capabilities.contains(LLMCapability.Tools), "Model $model does not support tools")
+        assumeTrue(
+            model.id != GoogleModels.Gemini2_0Flash.id,
+            "gemini-2.0-flash-001 returns flaky results and fails to call tools on a permanent basis"
+        )
 
         val registry = ToolRegistry {
             tool(CalculatorToolNoArgs)
 
@@ -43,7 +43,7 @@ import org.junit.jupiter.params.provider.Arguments
 import org.junit.jupiter.params.provider.MethodSource
 import java.nio.file.Path
 import java.nio.file.Paths
-import java.util.*
+import java.util.Base64
 import java.util.stream.Stream
 import kotlin.io.path.pathString
 import kotlin.io.path.readBytes
@@ -670,8 +670,6 @@ class MultipleLLMPromptExecutorIntegrationTest {
         }
     }
 
-    // ToDo add video & pdf specific scenarios
-
     @ParameterizedTest
     @MethodSource("markdownScenarioModelCombinations")
     fun integration_testMarkdownProcessingBasic(
@@ -681,35 +679,36 @@ class MultipleLLMPromptExecutorIntegrationTest {
         runTest(timeout = 300.seconds) {
             Models.assumeAvailable(model.provider)
             val file = MediaTestUtils.createMarkdownFileForScenario(scenario, testResourcesDir)
-            val prompt = if (model.capabilities.contains(LLMCapability.Document)) {
-                prompt("markdown-test-${scenario.name.lowercase()}") {
-                    system("You are a helpful assistant that can analyze markdown files.")
-
-                    user {
-                        markdown {
-                            "I'm sending you a markdown file with different markdown elements. "
-                            +"Please list all the markdown elements used in it and describe its structure clearly."
-                        }
+            val prompt =
+                if (model.capabilities.contains(LLMCapability.Document) && model.provider != LLMProvider.OpenAI) {
+                    prompt("markdown-test-${scenario.name.lowercase()}") {
+                        system("You are a helpful assistant that can analyze markdown files.")
+
+                        user {
+                            markdown {
+                                +"I'm sending you a markdown file with different markdown elements. "
+                                +"Please list all the markdown elements used in it and describe its structure clearly."
+                            }
 
-                        attachments {
-                            file(file.pathString, "text/markdown")
+                            attachments {
+                                textFile(KtPath(file.pathString), "text/plain")
+                            }
                         }
                     }
-                }
-            } else {
-                prompt("markdown-test-${scenario.name.lowercase()}") {
-                    system("You are a helpful assistant that can analyze markdown files.")
-
-                    user {
-                        markdown {
-                            "I'm sending you a markdown file with different markdown elements. "
-                            +"Please list all the markdown elements used in it and describe its structure clearly."
-                            newline()
-                            +file.readText()
+                } else {
+                    prompt("markdown-test-${scenario.name.lowercase()}") {
+                        system("You are a helpful assistant that can analyze markdown files.")
+
+                        user {
+                            markdown {
+                                +"I'm sending you a markdown file with different markdown elements. "
+                                +"Please list all the markdown elements used in it and describe its structure clearly."
+                                newline()
+                                +file.readText()
+                            }
                         }
                     }
                 }
-            }
 
             withRetry {
                 try {
@@ -787,32 +786,36 @@ class MultipleLLMPromptExecutorIntegrationTest {
                     // For some edge cases, exceptions are expected
                     when (scenario) {
                         ImageTestScenario.LARGE_IMAGE_ANTHROPIC, ImageTestScenario.LARGE_IMAGE -> {
-                            assertTrue(
-                                e.message?.contains("400 Bad Request") == true,
+                            assertEquals(
+                                e.message?.contains("400 Bad Request"),
+                                true,
                                 "Expected exception for a large image [400 Bad Request] was not found, got [${e.message}] instead"
                             )
-                            assertTrue(
-                                e.message?.contains("image exceeds") == true,
+                            assertEquals(
+                                e.message?.contains("image exceeds"),
+                                true,
                                 "Expected exception for a large image [image exceeds] was not found, got [${e.message}] instead"
                             )
                         }
 
                         ImageTestScenario.CORRUPTED_IMAGE, ImageTestScenario.EMPTY_IMAGE -> {
-                            assertTrue(
-                                e.message?.contains("400 Bad Request") == true,
+                            assertEquals(
+                                e.message?.contains("400 Bad Request"),
+                                true,
                                 "Expected exception for a corrupted image [400 Bad Request] was not found, got [${e.message}] instead"
                             )
                             if (model.provider == LLMProvider.Anthropic) {
-                                assertTrue(
-                                    e.message?.contains("Could not process image") == true,
+                                assertEquals(
+                                    e.message?.contains("Could not process image"),
+                                    true,
                                     "Expected exception for a corrupted image [Could not process image] was not found, got [${e.message}] instead"
                                 )
                             } else if (model.provider == LLMProvider.OpenAI) {
-                                assertTrue(
+                                assertEquals(
                                     e.message?.contains(
                                         "You uploaded an unsupported image. Please make sure your image is valid."
-                                    ) ==
-                                        true,
+                                    ),
+                                    true,
                                     "Expected exception for a corrupted image [You uploaded an unsupported image. Please make sure your image is valid.] was not found, got [${e.message}] instead"
                                 )
                             }
@@ -831,37 +834,37 @@ class MultipleLLMPromptExecutorIntegrationTest {
     fun integration_testTextProcessingBasic(scenario: TextTestScenario, model: LLModel) =
         runTest(timeout = 300.seconds) {
             Models.assumeAvailable(model.provider)
-            assumeTrue(model.provider != LLMProvider.OpenAI, "File format txt not supported for OpenAI")
 
             val file = MediaTestUtils.createTextFileForScenario(scenario, testResourcesDir)
 
-            val prompt = if (model.capabilities.contains(LLMCapability.Document)) {
-                prompt("text-test-${scenario.name.lowercase()}") {
-                    system("You are a helpful assistant that can analyze and process text.")
+            val prompt =
+                if (model.capabilities.contains(LLMCapability.Document) && model.provider != LLMProvider.OpenAI) {
+                    prompt("text-test-${scenario.name.lowercase()}") {
+                        system("You are a helpful assistant that can analyze and process text.")
 
-                    user {
-                        markdown {
-                            "I'm sending you a text file. Please analyze it and summarize its content."
-                        }
+                        user {
+                            markdown {
+                                +"I'm sending you a text file. Please analyze it and summarize its content."
+                            }
 
-                        attachments {
-                            textFile(KtPath(file.pathString), "text/plain")
+                            attachments {
+                                textFile(KtPath(file.pathString), "text/plain")
+                            }
                         }
                     }
-                }
-            } else {
-                prompt("text-test-${scenario.name.lowercase()}") {
-                    system("You are a helpful assistant that can analyze and process text.")
-
-                    user {
-                        markdown {
-                            +"I'm sending you a text file. Please analyze it and summarize its content."
-                            newline()
-                            +file.readText()
+                } else {
+                    prompt("text-test-${scenario.name.lowercase()}") {
+                        system("You are a helpful assistant that can analyze and process text.")
+
+                        user {
+                            markdown {
+                                +"I'm sending you a text file. Please analyze it and summarize its content."
+                                newline()
+                                +file.readText()
+                            }
                         }
                     }
                 }
-            }
 
             withRetry {
                 try {
@@ -871,28 +874,31 @@ class MultipleLLMPromptExecutorIntegrationTest {
                     when (scenario) {
                         TextTestScenario.EMPTY_TEXT -> {
                             if (model.provider == LLMProvider.Google) {
-                                assertTrue(
-                                    e.message?.contains("400 Bad Request") == true,
+                                assertEquals(
+                                    e.message?.contains("400 Bad Request"),
+                                    true,
                                     "Expected exception for empty text [400 Bad Request] was not found, got [${e.message}] instead"
                                 )
-                                assertTrue(
+                                assertEquals(
                                     e.message?.contains(
                                         "Unable to submit request because it has an empty inlineData parameter. Add a value to the parameter and try again."
-                                    ) ==
-                                        true,
+                                    ),
+                                    true,
                                     "Expected exception for empty text [Unable to submit request because it has an empty inlineData parameter. Add a value to the parameter and try again] was not found, got [${e.message}] instead"
                                 )
                             }
                         }
 
                         TextTestScenario.LONG_TEXT_5_MB -> {
                             if (model.provider == LLMProvider.Anthropic) {
-                                assertTrue(
-                                    e.message?.contains("400 Bad Request") == true,
+                                assertEquals(
+                                    e.message?.contains("400 Bad Request"),
+                                    true,
                                     "Expected exception for long text [400 Bad Request] was not found, got [${e.message}] instead"
                                 )
-                                assertTrue(
-                                    e.message?.contains("prompt is too long") == true,
+                                assertEquals(
+                                    e.message?.contains("prompt is too long"),
+                                    true,
                                     "Expected exception for long text [prompt is too long:] was not found, got [${e.message}] instead"
                                 )
                             } else if (model.provider == LLMProvider.Google) {
@@ -925,7 +931,7 @@ class MultipleLLMPromptExecutorIntegrationTest {
 
                 user {
                     markdown {
-                        "I'm sending you an audio file. Please tell me a couple of words about it."
+                        +"I'm sending you an audio file. Please tell me a couple of words about it."
                     }
 
                     attachments {
@@ -940,18 +946,21 @@ class MultipleLLMPromptExecutorIntegrationTest {
                     checkExecutorMediaResponse(response)
                 } catch (e: Exception) {
                     if (scenario == AudioTestScenario.CORRUPTED_AUDIO) {
-                        assertTrue(
-                            e.message?.contains("400 Bad Request") == true,
+                        assertEquals(
+                            e.message?.contains("400 Bad Request"),
+                            true,
                             "Expected exception for empty text [400 Bad Request] was not found, got [${e.message}] instead"
                         )
                         if (model.provider == LLMProvider.OpenAI) {
-                            assertTrue(
-                                e.message?.contains("This model does not support the format you provided.") == true,
+                            assertEquals(
+                                e.message?.contains("This model does not support the format you provided."),
+                                true,
                                 "Expected exception for corrupted audio [This model does not support the format you provided.]"
                             )
                         } else if (model.provider == LLMProvider.Google) {
-                            assertTrue(
-                                e.message?.contains("Request contains an invalid argument.") == true,
+                            assertEquals(
+                                e.message?.contains("Request contains an invalid argument."),
+                                true,
                                 "Expected exception for corrupted audio [Request contains an invalid argument.]"
                             )
                         }