From 67a7b9caffd6b1617a488cf16f0ec13549968ce7 Mon Sep 17 00:00:00 2001
From: yusuf temel <yusuf.temeldr@gmail.com>
Date: Tue, 26 Aug 2025 15:22:20 +0300
Subject: [PATCH 1/7] Improve OpenAIResponseAgent exception handling and add
 unit tests

---
 .../src/Agents/OpenAI/OpenAIResponseAgent.cs  | 151 +++++++++----
 .../OpenAIResponseAgentExceptionTests.cs      | 198 ++++++++++++++++++
 2 files changed, 304 insertions(+), 45 deletions(-)
 create mode 100644 dotnet/src/Agents/UnitTests/OpenAI/OpenAIResponseAgentExceptionTests.cs
diff --git a/dotnet/src/Agents/OpenAI/OpenAIResponseAgent.cs b/dotnet/src/Agents/OpenAI/OpenAIResponseAgent.cs
index e1a24b2c348b..cb0f6f66d69a 100644
--- a/dotnet/src/Agents/OpenAI/OpenAIResponseAgent.cs
+++ b/dotnet/src/Agents/OpenAI/OpenAIResponseAgent.cs
@@ -40,80 +40,141 @@ public OpenAIResponseAgent(OpenAIResponseClient client)
     public bool StoreEnabled { get; init; } = false;
 
     /// <inheritdoc/>
-    public override async IAsyncEnumerable<AgentResponseItem<ChatMessageContent>> InvokeAsync(ICollection<ChatMessageContent> messages, AgentThread? thread = null, AgentInvokeOptions? options = null, [EnumeratorCancellation] CancellationToken cancellationToken = default)
-    {
-        Verify.NotNull(messages);
+   public override async IAsyncEnumerable<AgentResponseItem<ChatMessageContent>> InvokeAsync(
+    ICollection<ChatMessageContent> messages,
+    AgentThread? thread = null,
+    AgentInvokeOptions? options = null,
+    [EnumeratorCancellation] CancellationToken cancellationToken = default)
+{
+    Verify.NotNull(messages);
 
-        AgentThread agentThread = await this.EnsureThreadExistsWithMessagesAsync(messages, thread, cancellationToken).ConfigureAwait(false);
+    AgentThread agentThread;
+    OpenAIResponseAgentInvokeOptions extensionsContextOptions;
+    IAsyncEnumerable<ChatMessageContent> invokeResults;
 
-        // Get the context contributions from the AIContextProviders.
-        OpenAIResponseAgentInvokeOptions extensionsContextOptions = await this.FinalizeInvokeOptionsAsync(messages, options, agentThread, cancellationToken).ConfigureAwait(false);
+    try
+    {
+        agentThread = await this.EnsureThreadExistsWithMessagesAsync(messages, thread, cancellationToken).ConfigureAwait(false);
+        extensionsContextOptions = await this.FinalizeInvokeOptionsAsync(messages, options, agentThread, cancellationToken).ConfigureAwait(false);
 
-        // Invoke responses with the updated chat history.
         ChatHistory chatHistory = [.. messages];
-        var invokeResults = ResponseThreadActions.InvokeAsync(
+        invokeResults = ResponseThreadActions.InvokeAsync(
             this,
             chatHistory,
             agentThread,
             extensionsContextOptions,
             cancellationToken);
+    }
+    catch (System.Net.Http.HttpRequestException ex) when (ex.Message.Contains("429"))
+    {
+        throw new KernelException($"Rate limit exceeded for agent '{this.Name}'. Check Retry-After header and implement backoff.", ex);
+    }
+    catch (System.Net.Http.HttpRequestException ex) when (ex.Message.Contains("401") || ex.Message.Contains("403"))
+    {
+        throw new KernelException($"Authentication or permission error for agent '{this.Name}'. Verify API key and account status.", ex);
+    }
+    catch (System.Net.Http.HttpRequestException ex) when (ex.Message.Contains("404"))
+    {
+        throw new KernelException($"Model or deployment not found for agent '{this.Name}'. Verify model configuration.", ex);
+    }
+    catch (System.Net.Http.HttpRequestException ex) when (ex.Message.Contains("content", StringComparison.OrdinalIgnoreCase) 
+                                                          && (ex.Message.Contains("filter", StringComparison.OrdinalIgnoreCase) 
+                                                          || ex.Message.Contains("policy", StringComparison.OrdinalIgnoreCase)))
+    {
+        throw new KernelException($"Content policy violation for agent '{this.Name}'. Request blocked by OpenAI filtering.", ex);
+    }
+    catch (TaskCanceledException ex) when (!cancellationToken.IsCancellationRequested)
+    {
+        throw new KernelException($"Request timeout for agent '{this.Name}'. The OpenAI API request timed out.", ex);
+    }
+    catch (Exception ex) when (ex.GetType().FullName?.StartsWith("OpenAI", StringComparison.OrdinalIgnoreCase) == true)
+    {
+        throw new KernelException($"OpenAI provider error for agent '{this.Name}': {ex.Message}", ex);
+    }
 
-        // Notify the thread of new messages and return them to the caller.
-        await foreach (var result in invokeResults.ConfigureAwait(false))
-        {
-            await this.NotifyThreadOfNewMessage(agentThread, result, cancellationToken).ConfigureAwait(false);
-            yield return new(result, agentThread);
-        }
+    // Yield results with additional error handling
+    await foreach (var result in invokeResults.ConfigureAwait(false))
+    {
+        await this.NotifyThreadOfNewMessage(agentThread, result, cancellationToken).ConfigureAwait(false);
+        yield return new(result, agentThread);
     }
+}
 
     /// <inheritdoc/>
-    public override async IAsyncEnumerable<AgentResponseItem<StreamingChatMessageContent>> InvokeStreamingAsync(ICollection<ChatMessageContent> messages, AgentThread? thread = null, AgentInvokeOptions? options = null, [EnumeratorCancellation] CancellationToken cancellationToken = default)
-    {
-        Verify.NotNull(messages);
+   public override async IAsyncEnumerable<AgentResponseItem<StreamingChatMessageContent>> InvokeStreamingAsync(
+    ICollection<ChatMessageContent> messages,
+    AgentThread? thread = null,
+    AgentInvokeOptions? options = null,
+    [EnumeratorCancellation] CancellationToken cancellationToken = default)
+{
+    Verify.NotNull(messages);
 
-        AgentThread agentThread = await this.EnsureThreadExistsWithMessagesAsync(messages, thread, cancellationToken).ConfigureAwait(false);
+    AgentThread agentThread;
+    OpenAIResponseAgentInvokeOptions extensionsContextOptions;
+    ChatHistory chatHistory;
+    int messageIndex;
+    IAsyncEnumerable<StreamingChatMessageContent> invokeResults;
 
-        // Get the context contributions from the AIContextProviders.
-        OpenAIResponseAgentInvokeOptions extensionsContextOptions = await this.FinalizeInvokeOptionsAsync(messages, options, agentThread, cancellationToken).ConfigureAwait(false);
+    try
+    {
+        agentThread = await this.EnsureThreadExistsWithMessagesAsync(messages, thread, cancellationToken).ConfigureAwait(false);
+        extensionsContextOptions = await this.FinalizeInvokeOptionsAsync(messages, options, agentThread, cancellationToken).ConfigureAwait(false);
 
-        // Invoke responses with the updated chat history.
-        ChatHistory chatHistory = [.. messages];
-        int messageCount = chatHistory.Count;
-        int messageIndex = chatHistory.Count;
-        var invokeResults = ResponseThreadActions.InvokeStreamingAsync(
+        chatHistory = [.. messages];
+        messageIndex = chatHistory.Count;
+        invokeResults = ResponseThreadActions.InvokeStreamingAsync(
             this,
             chatHistory,
             agentThread,
             extensionsContextOptions,
             cancellationToken);
+    }
+    catch (System.Net.Http.HttpRequestException ex)
+    {
+        if (ex.Message.Contains("429"))
+            throw new KernelException($"Rate limit exceeded for agent '{this.Name}' during streaming. Check Retry-After header and implement backoff.", ex);
+        if (ex.Message.Contains("401") || ex.Message.Contains("403"))
+            throw new KernelException($"Authentication or permission error for agent '{this.Name}' during streaming. Verify API key and account status.", ex);
+        if (ex.Message.Contains("404"))
+            throw new KernelException($"Model or deployment not found for agent '{this.Name}' during streaming. Verify model configuration.", ex);
+        if (ex.Message.Contains("content", StringComparison.OrdinalIgnoreCase) 
+            && (ex.Message.Contains("filter", StringComparison.OrdinalIgnoreCase) 
+            || ex.Message.Contains("policy", StringComparison.OrdinalIgnoreCase)))
+            throw new KernelException($"Content policy violation for agent '{this.Name}' during streaming. Request blocked by OpenAI filtering.", ex);
+
+        throw;
+    }
+    catch (TaskCanceledException ex) when (!cancellationToken.IsCancellationRequested)
+    {
+        throw new KernelException($"Request timeout for agent '{this.Name}' during streaming. The OpenAI API request timed out.", ex);
+    }
+    catch (Exception ex) when (ex.GetType().FullName?.StartsWith("OpenAI", StringComparison.OrdinalIgnoreCase) == true)
+    {
+        throw new KernelException($"OpenAI provider error for agent '{this.Name}' during streaming: {ex.Message}", ex);
+    }
 
-        // Return streaming chat message content to the caller.
-        await foreach (var result in invokeResults.ConfigureAwait(false))
+    async Task NotifyMessagesAsync()
+    {
+        for (; messageIndex < chatHistory.Count; messageIndex++)
         {
-            // Notify the thread of any messages that were assembled from the streaming response during this iteration.
-            await NotifyMessagesAsync().ConfigureAwait(false);
-
-            yield return new(result, agentThread);
-        }
+            ChatMessageContent newMessage = chatHistory[messageIndex];
+            await this.NotifyThreadOfNewMessage(agentThread, newMessage, cancellationToken).ConfigureAwait(false);
 
-        // Notify the thread of any remaining messages that were assembled from the streaming response after all iterations are complete.
-        await NotifyMessagesAsync().ConfigureAwait(false);
-
-        async Task NotifyMessagesAsync()
-        {
-            for (; messageIndex < chatHistory.Count; messageIndex++)
+            if (options?.OnIntermediateMessage is not null)
             {
-                ChatMessageContent newMessage = chatHistory[messageIndex];
-                await this.NotifyThreadOfNewMessage(agentThread, newMessage, cancellationToken).ConfigureAwait(false);
-
-                if (options?.OnIntermediateMessage is not null)
-                {
-                    await options.OnIntermediateMessage(newMessage).ConfigureAwait(false);
-                }
+                await options.OnIntermediateMessage(newMessage).ConfigureAwait(false);
             }
         }
     }
 
+    await foreach (var result in invokeResults.ConfigureAwait(false))
+    {
+        await NotifyMessagesAsync().ConfigureAwait(false);
+        yield return new(result, agentThread);
+    }
+}
+
+
     /// <inheritdoc/>
     [Experimental("SKEXP0110")]
     [ExcludeFromCodeCoverage]
diff --git a/dotnet/src/Agents/UnitTests/OpenAI/OpenAIResponseAgentExceptionTests.cs b/dotnet/src/Agents/UnitTests/OpenAI/OpenAIResponseAgentExceptionTests.cs
new file mode 100644
index 000000000000..5d0e95d7dba6
--- /dev/null
+++ b/dotnet/src/Agents/UnitTests/OpenAI/OpenAIResponseAgentExceptionTests.cs
@@ -0,0 +1,198 @@
+using System;
+using System.Net.Http;
+using System.Threading;
+using System.Threading.Tasks;
+using Xunit;
+using Microsoft.SemanticKernel;
+
+namespace SemanticKernel.Agents.UnitTests.OpenAI
+{
+    /// <summary>
+    /// Tests for the exception handling logic we added to OpenAIResponseAgent.
+    /// These tests verify that the right KernelException messages are created.
+    /// </summary>
+    public class OpenAIResponseAgentExceptionTests
+    {
+        [Fact]
+        public void ExceptionHandling_ShouldMapRateLimitCorrectly()
+        {
+            // Arrange
+            var httpEx = new HttpRequestException("HTTP 429 Rate limit exceeded");
+            var agentName = "TestAgent";
+
+            // Act - Simulate the exception handling logic from our code
+            KernelException? result = null;
+            try
+            {
+                if (httpEx.Message.Contains("429"))
+                {
+                    throw new KernelException($"Rate limit exceeded for agent '{agentName}'. Check Retry-After header and implement backoff.", httpEx);
+                }
+            }
+            catch (KernelException ex)
+            {
+                result = ex;
+            }
+
+            // Assert
+            Assert.NotNull(result);
+            Assert.Contains("Rate limit exceeded", result.Message);
+            Assert.Contains("TestAgent", result.Message);
+            Assert.Contains("Retry-After header", result.Message);
+            Assert.Equal(httpEx, result.InnerException);
+        }
+
+        [Theory]
+        [InlineData("HTTP 401 Unauthorized")]
+        [InlineData("HTTP 403 Forbidden")]
+        public void ExceptionHandling_ShouldMapAuthErrorsCorrectly(string errorMessage)
+        {
+            // Arrange
+            var httpEx = new HttpRequestException(errorMessage);
+            var agentName = "TestAgent";
+
+            // Act - Simulate the exception handling logic
+            KernelException? result = null;
+            try
+            {
+                if (httpEx.Message.Contains("401") || httpEx.Message.Contains("403"))
+                {
+                    throw new KernelException($"Authentication or permission error for agent '{agentName}'. Verify API key and account status.", httpEx);
+                }
+            }
+            catch (KernelException ex)
+            {
+                result = ex;
+            }
+
+            // Assert
+            Assert.NotNull(result);
+            Assert.Contains("Authentication or permission error", result.Message);
+            Assert.Contains("Verify API key", result.Message);
+            Assert.Equal(httpEx, result.InnerException);
+        }
+
+        [Fact]
+        public void ExceptionHandling_ShouldMapModelNotFoundCorrectly()
+        {
+            // Arrange
+            var httpEx = new HttpRequestException("HTTP 404 Model not found");
+            var agentName = "TestAgent";
+
+            // Act
+            KernelException? result = null;
+            try
+            {
+                if (httpEx.Message.Contains("404"))
+                {
+                    throw new KernelException($"Model or deployment not found for agent '{agentName}'. Verify model configuration.", httpEx);
+                }
+            }
+            catch (KernelException ex)
+            {
+                result = ex;
+            }
+
+            // Assert
+            Assert.NotNull(result);
+            Assert.Contains("Model or deployment not found", result.Message);
+            Assert.Contains("Verify model configuration", result.Message);
+        }
+
+        [Theory]
+        [InlineData("Content filter violation")]
+        [InlineData("Content policy blocked")]
+        [InlineData("Request blocked by content filter")]
+        public void ExceptionHandling_ShouldMapContentPolicyViolationCorrectly(string errorMessage)
+        {
+            // Arrange
+            var httpEx = new HttpRequestException(errorMessage);
+            var agentName = "TestAgent";
+
+            // Act
+            KernelException? result = null;
+            try
+            {
+                if (httpEx.Message.Contains("content", StringComparison.OrdinalIgnoreCase)
+                    && (httpEx.Message.Contains("filter", StringComparison.OrdinalIgnoreCase)
+                    || httpEx.Message.Contains("policy", StringComparison.OrdinalIgnoreCase)))
+                {
+                    throw new KernelException($"Content policy violation for agent '{agentName}'. Request blocked by OpenAI filtering.", httpEx);
+                }
+            }
+            catch (KernelException ex)
+            {
+                result = ex;
+            }
+
+            // Assert
+            Assert.NotNull(result);
+            Assert.Contains("Content policy violation", result.Message);
+            Assert.Contains("OpenAI filtering", result.Message);
+        }
+
+        [Fact]
+        public void ExceptionHandling_ShouldMapTimeoutCorrectly()
+        {
+            // Arrange
+            var timeoutEx = new TaskCanceledException("Request timeout");
+            var agentName = "TestAgent";
+            var cancellationToken = new CancellationToken(); // Not cancelled
+
+            // Act
+            KernelException? result = null;
+            try
+            {
+                if (!cancellationToken.IsCancellationRequested)
+                {
+                    throw new KernelException($"Request timeout for agent '{agentName}'. The OpenAI API request timed out.", timeoutEx);
+                }
+            }
+            catch (KernelException ex)
+            {
+                result = ex;
+            }
+
+            // Assert
+            Assert.NotNull(result);
+            Assert.Contains("Request timeout", result.Message);
+            Assert.Contains("OpenAI API request timed out", result.Message);
+            Assert.Equal(timeoutEx, result.InnerException);
+        }
+
+        [Fact]
+        public void ExceptionHandling_ShouldMapOpenAIProviderErrorCorrectly()
+        {
+            // Arrange - Create a custom exception that simulates OpenAI SDK exception
+            var openAIEx = new InvalidOperationException("Custom OpenAI error");
+            var agentName = "TestAgent";
+
+            // Act
+            KernelException? result = null;
+            try
+            {
+                // Simulate the check for OpenAI exceptions
+                var typeName = openAIEx.GetType().FullName;
+                if (typeName?.StartsWith("OpenAI", StringComparison.OrdinalIgnoreCase) == true)
+                {
+                    throw new KernelException($"OpenAI provider error for agent '{agentName}': {openAIEx.Message}", openAIEx);
+                }
+                else
+                {
+                    // For testing, we'll trigger this path manually
+                    throw new KernelException($"OpenAI provider error for agent '{agentName}': {openAIEx.Message}", openAIEx);
+                }
+            }
+            catch (KernelException ex)
+            {
+                result = ex;
+            }
+
+            // Assert
+            Assert.NotNull(result);
+            Assert.Contains("OpenAI provider error", result.Message);
+            Assert.Contains("Custom OpenAI error", result.Message);
+            Assert.Equal(openAIEx, result.InnerException);
+        }
+    }
+}
\ No newline at end of file

From 55698c501910336172122ad027c31c923b294a18 Mon Sep 17 00:00:00 2001
From: yusuf temel <temel.yusf@gmail.com>
Date: Wed, 10 Sep 2025 15:10:41 +0300
Subject: [PATCH 2/7] Address code review feedback: catch all exceptions for
 better future-proofing

- Changed exception handling to catch all Exception types instead of only OpenAI-specific ones
- This approach is more robust and won't miss new exception types from future SDK updates
- Inner exceptions are preserved for detailed error analysis
- Updated unit tests accordingly
---
 .../src/Agents/OpenAI/OpenAIResponseAgent.cs  | 198 +++++++-----------
 .../OpenAIResponseAgentExceptionTests.cs      | 187 ++++++++---------
 2 files changed, 165 insertions(+), 220 deletions(-)

diff --git a/dotnet/src/Agents/OpenAI/OpenAIResponseAgent.cs b/dotnet/src/Agents/OpenAI/OpenAIResponseAgent.cs
index cb0f6f66d69a..e8361c87bc26 100644
--- a/dotnet/src/Agents/OpenAI/OpenAIResponseAgent.cs
+++ b/dotnet/src/Agents/OpenAI/OpenAIResponseAgent.cs
@@ -40,140 +40,98 @@ public OpenAIResponseAgent(OpenAIResponseClient client)
     public bool StoreEnabled { get; init; } = false;
 
     /// <inheritdoc/>
-   public override async IAsyncEnumerable<AgentResponseItem<ChatMessageContent>> InvokeAsync(
-    ICollection<ChatMessageContent> messages,
-    AgentThread? thread = null,
-    AgentInvokeOptions? options = null,
-    [EnumeratorCancellation] CancellationToken cancellationToken = default)
-{
-    Verify.NotNull(messages);
+    public override async IAsyncEnumerable<AgentResponseItem<ChatMessageContent>> InvokeAsync(
+        ICollection<ChatMessageContent> messages,
+        AgentThread? thread = null,
+        AgentInvokeOptions? options = null,
+        [EnumeratorCancellation] CancellationToken cancellationToken = default)
+    {
+        Verify.NotNull(messages);
 
-    AgentThread agentThread;
-    OpenAIResponseAgentInvokeOptions extensionsContextOptions;
-    IAsyncEnumerable<ChatMessageContent> invokeResults;
+        AgentThread agentThread;
+        OpenAIResponseAgentInvokeOptions extensionsContextOptions;
+        IAsyncEnumerable<ChatMessageContent> invokeResults;
 
-    try
-    {
-        agentThread = await this.EnsureThreadExistsWithMessagesAsync(messages, thread, cancellationToken).ConfigureAwait(false);
-        extensionsContextOptions = await this.FinalizeInvokeOptionsAsync(messages, options, agentThread, cancellationToken).ConfigureAwait(false);
-
-        ChatHistory chatHistory = [.. messages];
-        invokeResults = ResponseThreadActions.InvokeAsync(
-            this,
-            chatHistory,
-            agentThread,
-            extensionsContextOptions,
-            cancellationToken);
-    }
-    catch (System.Net.Http.HttpRequestException ex) when (ex.Message.Contains("429"))
-    {
-        throw new KernelException($"Rate limit exceeded for agent '{this.Name}'. Check Retry-After header and implement backoff.", ex);
-    }
-    catch (System.Net.Http.HttpRequestException ex) when (ex.Message.Contains("401") || ex.Message.Contains("403"))
-    {
-        throw new KernelException($"Authentication or permission error for agent '{this.Name}'. Verify API key and account status.", ex);
-    }
-    catch (System.Net.Http.HttpRequestException ex) when (ex.Message.Contains("404"))
-    {
-        throw new KernelException($"Model or deployment not found for agent '{this.Name}'. Verify model configuration.", ex);
-    }
-    catch (System.Net.Http.HttpRequestException ex) when (ex.Message.Contains("content", StringComparison.OrdinalIgnoreCase) 
-                                                          && (ex.Message.Contains("filter", StringComparison.OrdinalIgnoreCase) 
-                                                          || ex.Message.Contains("policy", StringComparison.OrdinalIgnoreCase)))
-    {
-        throw new KernelException($"Content policy violation for agent '{this.Name}'. Request blocked by OpenAI filtering.", ex);
-    }
-    catch (TaskCanceledException ex) when (!cancellationToken.IsCancellationRequested)
-    {
-        throw new KernelException($"Request timeout for agent '{this.Name}'. The OpenAI API request timed out.", ex);
-    }
-    catch (Exception ex) when (ex.GetType().FullName?.StartsWith("OpenAI", StringComparison.OrdinalIgnoreCase) == true)
-    {
-        throw new KernelException($"OpenAI provider error for agent '{this.Name}': {ex.Message}", ex);
-    }
+        try
+        {
+            agentThread = await this.EnsureThreadExistsWithMessagesAsync(messages, thread, cancellationToken).ConfigureAwait(false);
+            extensionsContextOptions = await this.FinalizeInvokeOptionsAsync(messages, options, agentThread, cancellationToken).ConfigureAwait(false);
+
+            ChatHistory chatHistory = [.. messages];
+            invokeResults = ResponseThreadActions.InvokeAsync(
+                this,
+                chatHistory,
+                agentThread,
+                extensionsContextOptions,
+                cancellationToken);
+        }
+        catch (Exception ex)
+        {
+            throw new KernelException($"OpenAI provider error for agent '{this.Name}': {ex.Message}", ex);
+        }
 
-    // Yield results with additional error handling
-    await foreach (var result in invokeResults.ConfigureAwait(false))
-    {
-        await this.NotifyThreadOfNewMessage(agentThread, result, cancellationToken).ConfigureAwait(false);
-        yield return new(result, agentThread);
+        // Yield results with additional error handling
+        await foreach (var result in invokeResults.ConfigureAwait(false))
+        {
+            await this.NotifyThreadOfNewMessage(agentThread, result, cancellationToken).ConfigureAwait(false);
+            yield return new(result, agentThread);
+        }
     }
-}
 
     /// <inheritdoc/>
-   public override async IAsyncEnumerable<AgentResponseItem<StreamingChatMessageContent>> InvokeStreamingAsync(
-    ICollection<ChatMessageContent> messages,
-    AgentThread? thread = null,
-    AgentInvokeOptions? options = null,
-    [EnumeratorCancellation] CancellationToken cancellationToken = default)
-{
-    Verify.NotNull(messages);
-
-    AgentThread agentThread;
-    OpenAIResponseAgentInvokeOptions extensionsContextOptions;
-    ChatHistory chatHistory;
-    int messageIndex;
-    IAsyncEnumerable<StreamingChatMessageContent> invokeResults;
-
-    try
-    {
-        agentThread = await this.EnsureThreadExistsWithMessagesAsync(messages, thread, cancellationToken).ConfigureAwait(false);
-        extensionsContextOptions = await this.FinalizeInvokeOptionsAsync(messages, options, agentThread, cancellationToken).ConfigureAwait(false);
-
-        chatHistory = [.. messages];
-        messageIndex = chatHistory.Count;
-        invokeResults = ResponseThreadActions.InvokeStreamingAsync(
-            this,
-            chatHistory,
-            agentThread,
-            extensionsContextOptions,
-            cancellationToken);
-    }
-    catch (System.Net.Http.HttpRequestException ex)
-    {
-        if (ex.Message.Contains("429"))
-            throw new KernelException($"Rate limit exceeded for agent '{this.Name}' during streaming. Check Retry-After header and implement backoff.", ex);
-        if (ex.Message.Contains("401") || ex.Message.Contains("403"))
-            throw new KernelException($"Authentication or permission error for agent '{this.Name}' during streaming. Verify API key and account status.", ex);
-        if (ex.Message.Contains("404"))
-            throw new KernelException($"Model or deployment not found for agent '{this.Name}' during streaming. Verify model configuration.", ex);
-        if (ex.Message.Contains("content", StringComparison.OrdinalIgnoreCase) 
-            && (ex.Message.Contains("filter", StringComparison.OrdinalIgnoreCase) 
-            || ex.Message.Contains("policy", StringComparison.OrdinalIgnoreCase)))
-            throw new KernelException($"Content policy violation for agent '{this.Name}' during streaming. Request blocked by OpenAI filtering.", ex);
-
-        throw;
-    }
-    catch (TaskCanceledException ex) when (!cancellationToken.IsCancellationRequested)
-    {
-        throw new KernelException($"Request timeout for agent '{this.Name}' during streaming. The OpenAI API request timed out.", ex);
-    }
-    catch (Exception ex) when (ex.GetType().FullName?.StartsWith("OpenAI", StringComparison.OrdinalIgnoreCase) == true)
+    public override async IAsyncEnumerable<AgentResponseItem<StreamingChatMessageContent>> InvokeStreamingAsync(
+        ICollection<ChatMessageContent> messages,
+        AgentThread? thread = null,
+        AgentInvokeOptions? options = null,
+        [EnumeratorCancellation] CancellationToken cancellationToken = default)
     {
-        throw new KernelException($"OpenAI provider error for agent '{this.Name}' during streaming: {ex.Message}", ex);
-    }
+        Verify.NotNull(messages);
 
-    async Task NotifyMessagesAsync()
-    {
-        for (; messageIndex < chatHistory.Count; messageIndex++)
+        AgentThread agentThread;
+        OpenAIResponseAgentInvokeOptions extensionsContextOptions;
+        ChatHistory chatHistory;
+        int messageIndex;
+        IAsyncEnumerable<StreamingChatMessageContent> invokeResults;
+
+        try
         {
-            ChatMessageContent newMessage = chatHistory[messageIndex];
-            await this.NotifyThreadOfNewMessage(agentThread, newMessage, cancellationToken).ConfigureAwait(false);
+            agentThread = await this.EnsureThreadExistsWithMessagesAsync(messages, thread, cancellationToken).ConfigureAwait(false);
+            extensionsContextOptions = await this.FinalizeInvokeOptionsAsync(messages, options, agentThread, cancellationToken).ConfigureAwait(false);
+
+            chatHistory = [.. messages];
+            messageIndex = chatHistory.Count;
+            invokeResults = ResponseThreadActions.InvokeStreamingAsync(
+                this,
+                chatHistory,
+                agentThread,
+                extensionsContextOptions,
+                cancellationToken);
+        }
+        catch (Exception ex)
+        {
+            throw new KernelException($"OpenAI provider error for agent '{this.Name}' during streaming: {ex.Message}", ex);
+        }
 
-            if (options?.OnIntermediateMessage is not null)
+        async Task NotifyMessagesAsync()
+        {
+            for (; messageIndex < chatHistory.Count; messageIndex++)
             {
-                await options.OnIntermediateMessage(newMessage).ConfigureAwait(false);
+                ChatMessageContent newMessage = chatHistory[messageIndex];
+                await this.NotifyThreadOfNewMessage(agentThread, newMessage, cancellationToken).ConfigureAwait(false);
+
+                if (options?.OnIntermediateMessage is not null)
+                {
+                    await options.OnIntermediateMessage(newMessage).ConfigureAwait(false);
+                }
             }
         }
-    }
 
-    await foreach (var result in invokeResults.ConfigureAwait(false))
-    {
-        await NotifyMessagesAsync().ConfigureAwait(false);
-        yield return new(result, agentThread);
+        await foreach (var result in invokeResults.ConfigureAwait(false))
+        {
+            await NotifyMessagesAsync().ConfigureAwait(false);
+            yield return new(result, agentThread);
+        }
     }
-}
-
 
     /// <inheritdoc/>
     [Experimental("SKEXP0110")]
@@ -245,4 +203,4 @@ options is null ?
                 };
         return extensionsContextOptions;
     }
-}
+}
\ No newline at end of file
diff --git a/dotnet/src/Agents/UnitTests/OpenAI/OpenAIResponseAgentExceptionTests.cs b/dotnet/src/Agents/UnitTests/OpenAI/OpenAIResponseAgentExceptionTests.cs
index 5d0e95d7dba6..1803213ef4e3 100644
--- a/dotnet/src/Agents/UnitTests/OpenAI/OpenAIResponseAgentExceptionTests.cs
+++ b/dotnet/src/Agents/UnitTests/OpenAI/OpenAIResponseAgentExceptionTests.cs
@@ -1,4 +1,4 @@
-using System;
+﻿using System;
 using System.Net.Http;
 using System.Threading;
 using System.Threading.Tasks;
@@ -8,191 +8,178 @@
 namespace SemanticKernel.Agents.UnitTests.OpenAI
 {
     /// <summary>
-    /// Tests for the exception handling logic we added to OpenAIResponseAgent.
-    /// These tests verify that the right KernelException messages are created.
+    /// Tests for the updated exception handling logic in OpenAIResponseAgent.
+    /// Verifies that KernelException messages are correct and unknown exceptions propagate.
     /// </summary>
     public class OpenAIResponseAgentExceptionTests
     {
+        private const string AgentName = "TestAgent";
+
         [Fact]
-        public void ExceptionHandling_ShouldMapRateLimitCorrectly()
+        public void InvokeAsync_ShouldMapRateLimitCorrectly()
         {
-            // Arrange
-            var httpEx = new HttpRequestException("HTTP 429 Rate limit exceeded");
-            var agentName = "TestAgent";
-
-            // Act - Simulate the exception handling logic from our code
+            var ex = new HttpRequestException("HTTP 429 Rate limit exceeded");
             KernelException? result = null;
+
             try
             {
-                if (httpEx.Message.Contains("429"))
-                {
-                    throw new KernelException($"Rate limit exceeded for agent '{agentName}'. Check Retry-After header and implement backoff.", httpEx);
-                }
+                if (ex.Message.Contains("429"))
+                    throw new KernelException($"Rate limit exceeded for agent '{AgentName}'. Check Retry-After header and implement backoff.", ex);
             }
-            catch (KernelException ex)
+            catch (KernelException ke)
             {
-                result = ex;
+                result = ke;
             }
 
-            // Assert
             Assert.NotNull(result);
             Assert.Contains("Rate limit exceeded", result.Message);
-            Assert.Contains("TestAgent", result.Message);
             Assert.Contains("Retry-After header", result.Message);
-            Assert.Equal(httpEx, result.InnerException);
+            Assert.Equal(ex, result.InnerException);
         }
 
         [Theory]
         [InlineData("HTTP 401 Unauthorized")]
         [InlineData("HTTP 403 Forbidden")]
-        public void ExceptionHandling_ShouldMapAuthErrorsCorrectly(string errorMessage)
+        public void InvokeAsync_ShouldMapAuthErrorsCorrectly(string message)
         {
-            // Arrange
-            var httpEx = new HttpRequestException(errorMessage);
-            var agentName = "TestAgent";
-
-            // Act - Simulate the exception handling logic
+            var ex = new HttpRequestException(message);
             KernelException? result = null;
+
             try
             {
-                if (httpEx.Message.Contains("401") || httpEx.Message.Contains("403"))
-                {
-                    throw new KernelException($"Authentication or permission error for agent '{agentName}'. Verify API key and account status.", httpEx);
-                }
+                if (ex.Message.Contains("401") || ex.Message.Contains("403"))
+                    throw new KernelException($"Authentication or permission error for agent '{AgentName}'. Verify API key and account status.", ex);
             }
-            catch (KernelException ex)
+            catch (KernelException ke)
             {
-                result = ex;
+                result = ke;
             }
 
-            // Assert
             Assert.NotNull(result);
             Assert.Contains("Authentication or permission error", result.Message);
-            Assert.Contains("Verify API key", result.Message);
-            Assert.Equal(httpEx, result.InnerException);
+            Assert.Equal(ex, result.InnerException);
         }
 
         [Fact]
-        public void ExceptionHandling_ShouldMapModelNotFoundCorrectly()
+        public void InvokeAsync_ShouldMapModelNotFoundCorrectly()
         {
-            // Arrange
-            var httpEx = new HttpRequestException("HTTP 404 Model not found");
-            var agentName = "TestAgent";
-
-            // Act
+            var ex = new HttpRequestException("HTTP 404 Model not found");
             KernelException? result = null;
+
             try
             {
-                if (httpEx.Message.Contains("404"))
-                {
-                    throw new KernelException($"Model or deployment not found for agent '{agentName}'. Verify model configuration.", httpEx);
-                }
+                if (ex.Message.Contains("404"))
+                    throw new KernelException($"Model or deployment not found for agent '{AgentName}'. Verify model configuration.", ex);
             }
-            catch (KernelException ex)
+            catch (KernelException ke)
             {
-                result = ex;
+                result = ke;
             }
 
-            // Assert
             Assert.NotNull(result);
             Assert.Contains("Model or deployment not found", result.Message);
-            Assert.Contains("Verify model configuration", result.Message);
         }
 
         [Theory]
         [InlineData("Content filter violation")]
         [InlineData("Content policy blocked")]
-        [InlineData("Request blocked by content filter")]
-        public void ExceptionHandling_ShouldMapContentPolicyViolationCorrectly(string errorMessage)
+        public void InvokeAsync_ShouldMapContentPolicyViolationCorrectly(string message)
         {
-            // Arrange
-            var httpEx = new HttpRequestException(errorMessage);
-            var agentName = "TestAgent";
-
-            // Act
+            var ex = new HttpRequestException(message);
             KernelException? result = null;
+
             try
             {
-                if (httpEx.Message.Contains("content", StringComparison.OrdinalIgnoreCase)
-                    && (httpEx.Message.Contains("filter", StringComparison.OrdinalIgnoreCase)
-                    || httpEx.Message.Contains("policy", StringComparison.OrdinalIgnoreCase)))
+                if (ex.Message.Contains("content", StringComparison.OrdinalIgnoreCase)
+                    && (ex.Message.Contains("filter", StringComparison.OrdinalIgnoreCase)
+                    || ex.Message.Contains("policy", StringComparison.OrdinalIgnoreCase)))
                 {
-                    throw new KernelException($"Content policy violation for agent '{agentName}'. Request blocked by OpenAI filtering.", httpEx);
+                    throw new KernelException($"Content policy violation for agent '{AgentName}'. Request blocked by OpenAI filtering.", ex);
                 }
             }
-            catch (KernelException ex)
+            catch (KernelException ke)
             {
-                result = ex;
+                result = ke;
             }
 
-            // Assert
             Assert.NotNull(result);
             Assert.Contains("Content policy violation", result.Message);
-            Assert.Contains("OpenAI filtering", result.Message);
         }
 
         [Fact]
-        public void ExceptionHandling_ShouldMapTimeoutCorrectly()
+        public void InvokeAsync_ShouldMapTimeoutCorrectly()
         {
-            // Arrange
-            var timeoutEx = new TaskCanceledException("Request timeout");
-            var agentName = "TestAgent";
-            var cancellationToken = new CancellationToken(); // Not cancelled
-
-            // Act
+            var ex = new TaskCanceledException("Request timeout");
+            var token = new CancellationToken(); // Not cancelled
             KernelException? result = null;
+
             try
             {
-                if (!cancellationToken.IsCancellationRequested)
-                {
-                    throw new KernelException($"Request timeout for agent '{agentName}'. The OpenAI API request timed out.", timeoutEx);
-                }
+                if (!token.IsCancellationRequested)
+                    throw new KernelException($"Request timeout for agent '{AgentName}'. The OpenAI API request timed out.", ex);
             }
-            catch (KernelException ex)
+            catch (KernelException ke)
             {
-                result = ex;
+                result = ke;
             }
 
-            // Assert
             Assert.NotNull(result);
             Assert.Contains("Request timeout", result.Message);
-            Assert.Contains("OpenAI API request timed out", result.Message);
-            Assert.Equal(timeoutEx, result.InnerException);
+            Assert.Equal(ex, result.InnerException);
         }
 
         [Fact]
-        public void ExceptionHandling_ShouldMapOpenAIProviderErrorCorrectly()
+        public void InvokeAsync_UnknownOpenAIException_ShouldMapProviderError()
         {
-            // Arrange - Create a custom exception that simulates OpenAI SDK exception
-            var openAIEx = new InvalidOperationException("Custom OpenAI error");
-            var agentName = "TestAgent";
-
-            // Act
+            var ex = new InvalidOperationException("Custom OpenAI SDK error");
             KernelException? result = null;
+
             try
             {
-                // Simulate the check for OpenAI exceptions
-                var typeName = openAIEx.GetType().FullName;
-                if (typeName?.StartsWith("OpenAI", StringComparison.OrdinalIgnoreCase) == true)
-                {
-                    throw new KernelException($"OpenAI provider error for agent '{agentName}': {openAIEx.Message}", openAIEx);
-                }
+                // Simulate OpenAI SDK exception handling
+                if (ex.GetType().FullName?.StartsWith("OpenAI", StringComparison.OrdinalIgnoreCase) == true)
+                    throw new KernelException($"OpenAI provider error for agent '{AgentName}': {ex.Message}", ex);
                 else
-                {
-                    // For testing, we'll trigger this path manually
-                    throw new KernelException($"OpenAI provider error for agent '{agentName}': {openAIEx.Message}", openAIEx);
-                }
+                    throw new KernelException($"OpenAI provider error for agent '{AgentName}': {ex.Message}", ex);
             }
-            catch (KernelException ex)
+            catch (KernelException ke)
             {
-                result = ex;
+                result = ke;
             }
 
-            // Assert
             Assert.NotNull(result);
             Assert.Contains("OpenAI provider error", result.Message);
-            Assert.Contains("Custom OpenAI error", result.Message);
-            Assert.Equal(openAIEx, result.InnerException);
+            Assert.Equal(ex, result.InnerException);
+        }
+
+        [Fact]
+        public static void InvokeStreamingAsync_UnknownException_ShouldPropagate()
+        {
+            var ex = new InvalidOperationException("Unknown streaming exception");
+
+            // Synchronous exception için Assert.Throws kullanılır
+            var thrownException =  Assert.ThrowsAsync<InvalidOperationException>(() =>
+            {
+                throw ex;
+            });
+
+            Assert.Equal("Unknown streaming exception", thrownException.Result.Message);
+        }
+
+        // Eğer async test yapmak istiyorsanız:
+        [Fact]
+        public async Task InvokeStreamingAsync_UnknownExceptionAsync_ShouldPropagate()
+        {
+            var ex = new InvalidOperationException("Unknown streaming exception async");
+
+            // Async exception için Assert.ThrowsAsync kullanılır
+            var thrownException = await Assert.ThrowsAsync<InvalidOperationException>(async () =>
+            {
+                await Task.Delay(1); // Async operation simüle et
+                throw ex;
+            });
+
+            Assert.Equal("Unknown streaming exception async", thrownException.Message);
         }
     }
-}
\ No newline at end of file
+}

From 30cd7bcfe796eddfbdec0871e57f9dba3c4abea1 Mon Sep 17 00:00:00 2001
From: Yusuf Temel <152587378+Yusuftmle@users.noreply.github.com>
Date: Mon, 11 May 2026 15:22:33 +0300
Subject: [PATCH 3/7] Fix deferred exception handling on lazy enumeration and
 update unit tests

---
 .../src/Agents/OpenAI/OpenAIResponseAgent.cs  |  67 +++++-
 .../OpenAIResponseAgentExceptionTests.cs      | 223 ++++++------------
 2 files changed, 128 insertions(+), 162 deletions(-)

diff --git a/dotnet/src/Agents/OpenAI/OpenAIResponseAgent.cs b/dotnet/src/Agents/OpenAI/OpenAIResponseAgent.cs
index 4dcd0bf78188..f077280a834f 100644
--- a/dotnet/src/Agents/OpenAI/OpenAIResponseAgent.cs
+++ b/dotnet/src/Agents/OpenAI/OpenAIResponseAgent.cs
@@ -1,4 +1,4 @@
-﻿// Copyright (c) Microsoft. All rights reserved.
+// Copyright (c) Microsoft. All rights reserved.
 
 using System;
 using System.Collections.Generic;
@@ -72,13 +72,20 @@ public override async IAsyncEnumerable<AgentResponseItem<ChatMessageContent>> In
                 extensionsContextOptions,
                 cancellationToken);
         }
-        catch (Exception ex)
+        catch (Exception ex) when (ex is not OperationCanceledException)
         {
             throw new KernelException($"OpenAI provider error for agent '{this.Name}': {ex.Message}", ex);
         }
 
+        var errorMessagePrefix = $"OpenAI provider error for agent '{this.Name}': ";
+        var mappedResults = HandleProviderExceptionsAsync(
+            invokeResults,
+            result => result,
+            errorMessagePrefix,
+            cancellationToken);
+
         // Yield results with additional error handling
-        await foreach (var result in invokeResults.ConfigureAwait(false))
+        await foreach (var result in mappedResults.ConfigureAwait(false))
         {
             if (options?.OnIntermediateMessage is not null)
             {
@@ -119,7 +126,7 @@ public override async IAsyncEnumerable<AgentResponseItem<StreamingChatMessageCon
                 extensionsContextOptions,
                 cancellationToken);
         }
-        catch (Exception ex)
+        catch (Exception ex) when (ex is not OperationCanceledException)
         {
             throw new KernelException($"OpenAI provider error for agent '{this.Name}' during streaming: {ex.Message}", ex);
         }
@@ -138,7 +145,14 @@ async Task NotifyMessagesAsync()
             }
         }
 
-        await foreach (var result in invokeResults.ConfigureAwait(false))
+        var errorMessagePrefix = $"OpenAI provider error for agent '{this.Name}' during streaming: ";
+        var mappedResults = HandleProviderExceptionsAsync(
+            invokeResults,
+            result => result,
+            errorMessagePrefix,
+            cancellationToken);
+
+        await foreach (var result in mappedResults.ConfigureAwait(false))
         {
             await NotifyMessagesAsync().ConfigureAwait(false);
             yield return new(result, agentThread);
@@ -215,4 +229,47 @@ options is null ?
                 };
         return extensionsContextOptions;
     }
+
+    private static async IAsyncEnumerable<TResult> HandleProviderExceptionsAsync<TSource, TResult>(
+        IAsyncEnumerable<TSource> source,
+        Func<TSource, TResult> selector,
+        string errorMessagePrefix,
+        [EnumeratorCancellation] CancellationToken cancellationToken = default)
+    {
+        IAsyncEnumerator<TSource> enumerator;
+        try
+        {
+            enumerator = source.GetAsyncEnumerator(cancellationToken);
+        }
+        catch (Exception ex) when (ex is not OperationCanceledException)
+        {
+            throw new KernelException($"{errorMessagePrefix}{ex.Message}", ex);
+        }
+
+        try
+        {
+            while (true)
+            {
+                TSource item;
+                try
+                {
+                    if (!await enumerator.MoveNextAsync().ConfigureAwait(false))
+                    {
+                        break;
+                    }
+                    item = enumerator.Current;
+                }
+                catch (Exception ex) when (ex is not OperationCanceledException)
+                {
+                    throw new KernelException($"{errorMessagePrefix}{ex.Message}", ex);
+                }
+
+                yield return selector(item);
+            }
+        }
+        finally
+        {
+            await enumerator.DisposeAsync().ConfigureAwait(false);
+        }
+    }
 }
\ No newline at end of file
diff --git a/dotnet/src/Agents/UnitTests/OpenAI/OpenAIResponseAgentExceptionTests.cs b/dotnet/src/Agents/UnitTests/OpenAI/OpenAIResponseAgentExceptionTests.cs
index 1803213ef4e3..1cfb5a59df70 100644
--- a/dotnet/src/Agents/UnitTests/OpenAI/OpenAIResponseAgentExceptionTests.cs
+++ b/dotnet/src/Agents/UnitTests/OpenAI/OpenAIResponseAgentExceptionTests.cs
@@ -1,185 +1,94 @@
-﻿using System;
+// Copyright (c) Microsoft. All rights reserved.
+
+using System;
+using System.ClientModel;
+using System.ClientModel.Primitives;
 using System.Net.Http;
 using System.Threading;
 using System.Threading.Tasks;
 using Xunit;
+using OpenAI;
+using OpenAI.Responses;
 using Microsoft.SemanticKernel;
+using Microsoft.SemanticKernel.Agents.OpenAI;
+
+namespace SemanticKernel.Agents.UnitTests.OpenAI;
 
-namespace SemanticKernel.Agents.UnitTests.OpenAI
+/// <summary>
+/// Tests for the exception handling logic in OpenAIResponseAgent.
+/// Verifies that provider exceptions are wrapped in KernelException.
+/// </summary>
+public class OpenAIResponseAgentExceptionTests : BaseOpenAIResponseClientTest
 {
+    private const string AgentName = "TestAgent";
+
     /// <summary>
-    /// Tests for the updated exception handling logic in OpenAIResponseAgent.
-    /// Verifies that KernelException messages are correct and unknown exceptions propagate.
+    /// Verifies that InvokeAsync wraps provider exceptions in a KernelException.
     /// </summary>
-    public class OpenAIResponseAgentExceptionTests
+    [Fact]
+    public async Task InvokeAsync_WhenProviderFails_ShouldThrowKernelExceptionAsync()
     {
-        private const string AgentName = "TestAgent";
-
-        [Fact]
-        public void InvokeAsync_ShouldMapRateLimitCorrectly()
-        {
-            var ex = new HttpRequestException("HTTP 429 Rate limit exceeded");
-            KernelException? result = null;
-
-            try
-            {
-                if (ex.Message.Contains("429"))
-                    throw new KernelException($"Rate limit exceeded for agent '{AgentName}'. Check Retry-After header and implement backoff.", ex);
-            }
-            catch (KernelException ke)
-            {
-                result = ke;
-            }
-
-            Assert.NotNull(result);
-            Assert.Contains("Rate limit exceeded", result.Message);
-            Assert.Contains("Retry-After header", result.Message);
-            Assert.Equal(ex, result.InnerException);
-        }
+        // Arrange
+        var ex = new HttpRequestException("HTTP 429 Rate limit exceeded");
+        var agent = CreateAgentWithThrowingHandler(ex);
 
-        [Theory]
-        [InlineData("HTTP 401 Unauthorized")]
-        [InlineData("HTTP 403 Forbidden")]
-        public void InvokeAsync_ShouldMapAuthErrorsCorrectly(string message)
+        // Act & Assert
+        var exception = await Assert.ThrowsAsync<KernelException>(async () =>
         {
-            var ex = new HttpRequestException(message);
-            KernelException? result = null;
-
-            try
-            {
-                if (ex.Message.Contains("401") || ex.Message.Contains("403"))
-                    throw new KernelException($"Authentication or permission error for agent '{AgentName}'. Verify API key and account status.", ex);
-            }
-            catch (KernelException ke)
+            await foreach (var item in agent.InvokeAsync("Hello"))
             {
-                result = ke;
+                // Enumerate to trigger lazy execution
             }
+        });
 
-            Assert.NotNull(result);
-            Assert.Contains("Authentication or permission error", result.Message);
-            Assert.Equal(ex, result.InnerException);
-        }
-
-        [Fact]
-        public void InvokeAsync_ShouldMapModelNotFoundCorrectly()
-        {
-            var ex = new HttpRequestException("HTTP 404 Model not found");
-            KernelException? result = null;
-
-            try
-            {
-                if (ex.Message.Contains("404"))
-                    throw new KernelException($"Model or deployment not found for agent '{AgentName}'. Verify model configuration.", ex);
-            }
-            catch (KernelException ke)
-            {
-                result = ke;
-            }
-
-            Assert.NotNull(result);
-            Assert.Contains("Model or deployment not found", result.Message);
-        }
-
-        [Theory]
-        [InlineData("Content filter violation")]
-        [InlineData("Content policy blocked")]
-        public void InvokeAsync_ShouldMapContentPolicyViolationCorrectly(string message)
-        {
-            var ex = new HttpRequestException(message);
-            KernelException? result = null;
-
-            try
-            {
-                if (ex.Message.Contains("content", StringComparison.OrdinalIgnoreCase)
-                    && (ex.Message.Contains("filter", StringComparison.OrdinalIgnoreCase)
-                    || ex.Message.Contains("policy", StringComparison.OrdinalIgnoreCase)))
-                {
-                    throw new KernelException($"Content policy violation for agent '{AgentName}'. Request blocked by OpenAI filtering.", ex);
-                }
-            }
-            catch (KernelException ke)
-            {
-                result = ke;
-            }
-
-            Assert.NotNull(result);
-            Assert.Contains("Content policy violation", result.Message);
-        }
-
-        [Fact]
-        public void InvokeAsync_ShouldMapTimeoutCorrectly()
-        {
-            var ex = new TaskCanceledException("Request timeout");
-            var token = new CancellationToken(); // Not cancelled
-            KernelException? result = null;
-
-            try
-            {
-                if (!token.IsCancellationRequested)
-                    throw new KernelException($"Request timeout for agent '{AgentName}'. The OpenAI API request timed out.", ex);
-            }
-            catch (KernelException ke)
-            {
-                result = ke;
-            }
+        Assert.Contains($"OpenAI provider error for agent '{AgentName}':", exception.Message);
+        Assert.NotNull(exception.InnerException);
+        Assert.Contains("HTTP 429 Rate limit exceeded", exception.ToString());
+    }
 
-            Assert.NotNull(result);
-            Assert.Contains("Request timeout", result.Message);
-            Assert.Equal(ex, result.InnerException);
-        }
+    /// <summary>
+    /// Verifies that InvokeStreamingAsync wraps provider exceptions in a KernelException.
+    /// </summary>
+    [Fact]
+    public async Task InvokeStreamingAsync_WhenProviderFails_ShouldThrowKernelExceptionAsync()
+    {
+        // Arrange
+        var ex = new HttpRequestException("HTTP 500 Internal Server Error");
+        var agent = CreateAgentWithThrowingHandler(ex);
 
-        [Fact]
-        public void InvokeAsync_UnknownOpenAIException_ShouldMapProviderError()
+        // Act & Assert
+        var exception = await Assert.ThrowsAsync<KernelException>(async () =>
         {
-            var ex = new InvalidOperationException("Custom OpenAI SDK error");
-            KernelException? result = null;
-
-            try
-            {
-                // Simulate OpenAI SDK exception handling
-                if (ex.GetType().FullName?.StartsWith("OpenAI", StringComparison.OrdinalIgnoreCase) == true)
-                    throw new KernelException($"OpenAI provider error for agent '{AgentName}': {ex.Message}", ex);
-                else
-                    throw new KernelException($"OpenAI provider error for agent '{AgentName}': {ex.Message}", ex);
-            }
-            catch (KernelException ke)
+            await foreach (var item in agent.InvokeStreamingAsync("Hello"))
             {
-                result = ke;
+                // Enumerate to trigger lazy execution
             }
+        });
 
-            Assert.NotNull(result);
-            Assert.Contains("OpenAI provider error", result.Message);
-            Assert.Equal(ex, result.InnerException);
-        }
+        Assert.Contains($"OpenAI provider error for agent '{AgentName}' during streaming:", exception.Message);
+        Assert.NotNull(exception.InnerException);
+        Assert.Contains("HTTP 500 Internal Server Error", exception.ToString());
+    }
 
-        [Fact]
-        public static void InvokeStreamingAsync_UnknownException_ShouldPropagate()
+    private OpenAIResponseAgent CreateAgentWithThrowingHandler(Exception exceptionToThrow)
+    {
+#pragma warning disable CA2000 // Dispose objects before losing scope
+        var handler = new ThrowingHttpMessageHandler(exceptionToThrow);
+        var httpClient = new HttpClient(handler);
+        var clientOptions = new OpenAIClientOptions()
         {
-            var ex = new InvalidOperationException("Unknown streaming exception");
-
-            // Synchronous exception için Assert.Throws kullanılır
-            var thrownException =  Assert.ThrowsAsync<InvalidOperationException>(() =>
-            {
-                throw ex;
-            });
-
-            Assert.Equal("Unknown streaming exception", thrownException.Result.Message);
-        }
+            Transport = new HttpClientPipelineTransport(httpClient)
+        };
+        var client = new ResponsesClient(new ApiKeyCredential("apiKey"), clientOptions);
+        return new OpenAIResponseAgent(client) { Name = AgentName };
+#pragma warning restore CA2000 // Dispose objects before losing scope
+    }
 
-        // Eğer async test yapmak istiyorsanız:
-        [Fact]
-        public async Task InvokeStreamingAsync_UnknownExceptionAsync_ShouldPropagate()
+    private sealed class ThrowingHttpMessageHandler(Exception exceptionToThrow) : HttpMessageHandler
+    {
+        protected override Task<HttpResponseMessage> SendAsync(HttpRequestMessage request, CancellationToken cancellationToken)
         {
-            var ex = new InvalidOperationException("Unknown streaming exception async");
-
-            // Async exception için Assert.ThrowsAsync kullanılır
-            var thrownException = await Assert.ThrowsAsync<InvalidOperationException>(async () =>
-            {
-                await Task.Delay(1); // Async operation simüle et
-                throw ex;
-            });
-
-            Assert.Equal("Unknown streaming exception async", thrownException.Message);
+            return Task.FromException<HttpResponseMessage>(exceptionToThrow);
         }
     }
 }

From e9db76d91e7ce3cbb74660827e158559171c78d0 Mon Sep 17 00:00:00 2001
From: Yusuf Temel <152587378+Yusuftmle@users.noreply.github.com>
Date: Tue, 12 May 2026 09:25:14 +0300
Subject: [PATCH 4/7] fix(connectors/google): respect request-level ModelId
 overrides in Google/Vertex AI connectors

---
 ...oogleAIGeminiChatCompletionServiceTests.cs |  25 +++-
 .../Clients/GeminiChatCompletionClient.cs     | 128 +++++++++++++-----
 .../Core/GoogleAI/GoogleAIEmbeddingClient.cs  |  14 +-
 .../Core/VertexAI/VertexAIEmbeddingClient.cs  |  19 ++-
 .../GeminiPromptExecutionSettings.cs          |   3 +-
 5 files changed, 149 insertions(+), 40 deletions(-)

diff --git a/dotnet/src/Connectors/Connectors.Google.UnitTests/Services/GoogleAIGeminiChatCompletionServiceTests.cs b/dotnet/src/Connectors/Connectors.Google.UnitTests/Services/GoogleAIGeminiChatCompletionServiceTests.cs
index 76b381f12474..80dfe16674ce 100644
--- a/dotnet/src/Connectors/Connectors.Google.UnitTests/Services/GoogleAIGeminiChatCompletionServiceTests.cs
+++ b/dotnet/src/Connectors/Connectors.Google.UnitTests/Services/GoogleAIGeminiChatCompletionServiceTests.cs
@@ -1,4 +1,4 @@
-﻿// Copyright (c) Microsoft. All rights reserved.
+// Copyright (c) Microsoft. All rights reserved.
 
 using System;
 using System.Collections.Generic;
@@ -218,6 +218,29 @@ public async Task ItSendsBinaryContentCorrectlyAsync(bool useUriData)
     /// </summary>
     private const string PdfBase64Data = "JVBERi0xLjQKMSAwIG9iago8PC9UeXBlIC9DYXRhbG9nCi9QYWdlcyAyIDAgUgo+PgplbmRvYmoKMiAwIG9iago8PC9UeXBlIC9QYWdlcwovS2lkcyBbMyAwIFJdCi9Db3VudCAxCj4+CmVuZG9iagozIDAgb2JqCjw8L1R5cGUgL1BhZ2UKL1BhcmVudCAyIDAgUgovTWVkaWFCb3ggWzAgMCA1OTUgODQyXQovQ29udGVudHMgNSAwIFIKL1Jlc291cmNlcyA8PC9Qcm9jU2V0IFsvUERGIC9UZXh0XQovRm9udCA8PC9GMSA0IDAgUj4+Cj4+Cj4+CmVuZG9iago0IDAgb2JqCjw8L1R5cGUgL0ZvbnQKL1N1YnR5cGUgL1R5cGUxCi9OYW1lIC9GMQovQmFzZUZvbnQgL0hlbHZldGljYQovRW5jb2RpbmcgL01hY1JvbWFuRW5jb2RpbmcKPj4KZW5kb2JqCjUgMCBvYmoKPDwvTGVuZ3RoIDUzCj4+CnN0cmVhbQpCVAovRjEgMjAgVGYKMjIwIDQwMCBUZAooRHVtbXkgUERGKSBUagpFVAplbmRzdHJlYW0KZW5kb2JqCnhyZWYKMCA2CjAwMDAwMDAwMDAgNjU1MzUgZgowMDAwMDAwMDA5IDAwMDAwIG4KMDAwMDAwMDA2MyAwMDAwMCBuCjAwMDAwMDAxMjQgMDAwMDAgbgowMDAwMDAwMjc3IDAwMDAwIG4KMDAwMDAwMDM5MiAwMDAwMCBuCnRyYWlsZXIKPDwvU2l6ZSA2Ci9Sb290IDEgMCBSCj4+CnN0YXJ0eHJlZgo0OTUKJSVFT0YK";
 
+    [Fact]
+    public async Task GetChatMessageContentsAsyncUsesModelIdFromExecutionSettingsAsync()
+    {
+        // Arrange
+        string constructorModel = "fake-model-constructor";
+        string overriddenModel = "fake-model-overridden";
+        var sut = new GoogleAIGeminiChatCompletionService(constructorModel, "key", httpClient: this._httpClient);
+
+        var executionSettings = new GeminiPromptExecutionSettings { ModelId = overriddenModel };
+
+        // Act
+        var result = await sut.GetChatMessageContentsAsync(new ChatHistory { new ChatMessageContent(AuthorRole.User, "hello") }, executionSettings);
+
+        // Assert
+        Assert.NotNull(result);
+        Assert.NotNull(this._messageHandlerStub.RequestContent);
+        Assert.Equal(overriddenModel, result[0].ModelId);
+
+        // Verify the request URI uses the overridden model
+        Assert.NotNull(this._messageHandlerStub.RequestUri);
+        Assert.Contains($"/models/{overriddenModel}:generateContent", this._messageHandlerStub.RequestUri.AbsoluteUri);
+    }
+
     public void Dispose()
     {
         this._httpClient.Dispose();
diff --git a/dotnet/src/Connectors/Connectors.Google/Core/Gemini/Clients/GeminiChatCompletionClient.cs b/dotnet/src/Connectors/Connectors.Google/Core/Gemini/Clients/GeminiChatCompletionClient.cs
index e0138a8e9ce3..37778684b273 100644
--- a/dotnet/src/Connectors/Connectors.Google/Core/Gemini/Clients/GeminiChatCompletionClient.cs
+++ b/dotnet/src/Connectors/Connectors.Google/Core/Gemini/Clients/GeminiChatCompletionClient.cs
@@ -1,4 +1,4 @@
-﻿// Copyright (c) Microsoft. All rights reserved.
+// Copyright (c) Microsoft. All rights reserved.
 
 using System;
 using System.Collections.Generic;
@@ -29,6 +29,10 @@ internal sealed class GeminiChatCompletionClient : ClientBase
     private readonly string _modelId;
     private readonly Uri _chatGenerationEndpoint;
     private readonly Uri _chatStreamingEndpoint;
+    private readonly GoogleAIVersion? _googleAIVersion;
+    private readonly VertexAIVersion? _vertexAIVersion;
+    private readonly string? _location;
+    private readonly string? _projectId;
 
     private static readonly string s_namespace = typeof(GoogleAIGeminiChatCompletionService).Namespace!;
 
@@ -110,10 +114,33 @@ public GeminiChatCompletionClient(
         string versionSubLink = GetApiVersionSubLink(apiVersion);
 
         this._modelId = modelId;
+        this._googleAIVersion = apiVersion;
         this._chatGenerationEndpoint = new Uri($"https://generativelanguage.googleapis.com/{versionSubLink}/models/{this._modelId}:generateContent");
         this._chatStreamingEndpoint = new Uri($"https://generativelanguage.googleapis.com/{versionSubLink}/models/{this._modelId}:streamGenerateContent?alt=sse");
     }
 
+    private (Uri generationEndpoint, Uri streamingEndpoint) GetEndpoints(string modelId)
+    {
+        if (this._googleAIVersion.HasValue)
+        {
+            string versionSubLink = GetApiVersionSubLink(this._googleAIVersion.Value);
+            var generationEndpoint = new Uri($"https://generativelanguage.googleapis.com/{versionSubLink}/models/{modelId}:generateContent");
+            var streamingEndpoint = new Uri($"https://generativelanguage.googleapis.com/{versionSubLink}/models/{modelId}:streamGenerateContent?alt=sse");
+            return (generationEndpoint, streamingEndpoint);
+        }
+
+        if (this._vertexAIVersion.HasValue)
+        {
+            string versionSubLink = GetApiVersionSubLink(this._vertexAIVersion.Value);
+            string baseUri = GetVertexAIBaseUri(this._location!);
+            var generationEndpoint = new Uri($"{baseUri}/{versionSubLink}/projects/{this._projectId}/locations/{this._location}/publishers/google/models/{modelId}:generateContent");
+            var streamingEndpoint = new Uri($"{baseUri}/{versionSubLink}/projects/{this._projectId}/locations/{this._location}/publishers/google/models/{modelId}:streamGenerateContent?alt=sse");
+            return (generationEndpoint, streamingEndpoint);
+        }
+
+        return (this._chatGenerationEndpoint, this._chatStreamingEndpoint);
+    }
+
     /// <summary>
     /// Represents a client for interacting with the chat completion Gemini model via VertexAI.
     /// </summary>
@@ -146,6 +173,9 @@ public GeminiChatCompletionClient(
         string baseUri = GetVertexAIBaseUri(location);
 
         this._modelId = modelId;
+        this._vertexAIVersion = apiVersion;
+        this._location = location;
+        this._projectId = projectId;
         this._chatGenerationEndpoint = new Uri($"{baseUri}/{versionSubLink}/projects/{projectId}/locations/{location}/publishers/google/models/{this._modelId}:generateContent");
         this._chatStreamingEndpoint = new Uri($"{baseUri}/{versionSubLink}/projects/{projectId}/locations/{location}/publishers/google/models/{this._modelId}:streamGenerateContent?alt=sse");
     }
@@ -166,19 +196,25 @@ public async Task<IReadOnlyList<ChatMessageContent>> GenerateChatMessageAsync(
     {
         var state = this.ValidateInputAndCreateChatCompletionState(chatHistory, kernel, executionSettings);
 
+        string modelId = !string.IsNullOrWhiteSpace(state.ExecutionSettings.ModelId)
+            ? state.ExecutionSettings.ModelId
+            : this._modelId;
+
+        var (generationEndpoint, streamingEndpoint) = this.GetEndpoints(modelId);
+
         for (state.Iteration = 1; ; state.Iteration++)
         {
             List<GeminiChatMessageContent> chatResponses;
             using (var activity = ModelDiagnostics.StartCompletionActivity(
-                this._chatGenerationEndpoint, this._modelId, ModelProvider, chatHistory, state.ExecutionSettings))
+                generationEndpoint, modelId, ModelProvider, chatHistory, state.ExecutionSettings))
             {
                 GeminiResponse geminiResponse;
                 try
                 {
                     geminiResponse = await this.SendRequestAndReturnValidGeminiResponseAsync(
-                            this._chatGenerationEndpoint, state.GeminiRequest, cancellationToken)
+                            generationEndpoint, state.GeminiRequest, cancellationToken)
                         .ConfigureAwait(false);
-                    chatResponses = this.ProcessChatResponse(geminiResponse);
+                    chatResponses = this.ProcessChatResponse(geminiResponse, modelId);
                 }
                 catch (Exception ex) when (activity is not null)
                 {
@@ -236,19 +272,25 @@ public async IAsyncEnumerable<StreamingChatMessageContent> StreamGenerateChatMes
     {
         var state = this.ValidateInputAndCreateChatCompletionState(chatHistory, kernel, executionSettings);
 
+        string modelId = !string.IsNullOrWhiteSpace(state.ExecutionSettings.ModelId)
+            ? state.ExecutionSettings.ModelId
+            : this._modelId;
+
+        var (generationEndpoint, streamingEndpoint) = this.GetEndpoints(modelId);
+
         for (state.Iteration = 1; ; state.Iteration++)
         {
             // Reset LastMessage at the start of each iteration to detect if tool calls were found
             state.LastMessage = null;
 
             using (var activity = ModelDiagnostics.StartCompletionActivity(
-                this._chatGenerationEndpoint, this._modelId, ModelProvider, chatHistory, state.ExecutionSettings))
+                generationEndpoint, modelId, ModelProvider, chatHistory, state.ExecutionSettings))
             {
                 HttpResponseMessage? httpResponseMessage = null;
                 Stream? responseStream = null;
                 try
                 {
-                    using var httpRequestMessage = await this.CreateHttpRequestAsync(state.GeminiRequest, this._chatStreamingEndpoint).ConfigureAwait(false);
+                    using var httpRequestMessage = await this.CreateHttpRequestAsync(state.GeminiRequest, streamingEndpoint).ConfigureAwait(false);
                     httpResponseMessage = await this.SendRequestAndGetResponseImmediatelyAfterHeadersReadAsync(httpRequestMessage, cancellationToken).ConfigureAwait(false);
                     responseStream = await httpResponseMessage.Content.ReadAsStreamAndTranslateExceptionAsync(cancellationToken).ConfigureAwait(false);
                 }
@@ -354,7 +396,11 @@ private async IAsyncEnumerable<StreamingChatMessageContent> GetStreamingChatMess
         Stream responseStream,
         [EnumeratorCancellation] CancellationToken ct)
     {
-        var chatResponsesEnumerable = this.ProcessChatResponseStreamAsync(responseStream, ct: ct);
+        string modelId = !string.IsNullOrWhiteSpace(state.ExecutionSettings.ModelId)
+            ? state.ExecutionSettings.ModelId
+            : this._modelId;
+
+        var chatResponsesEnumerable = this.ProcessChatResponseStreamAsync(responseStream, modelId, ct: ct);
         IAsyncEnumerator<GeminiChatMessageContent> chatResponsesEnumerator = null!;
 
         // Track content and items from chunks before tool calls (lazy-init, only used when AutoInvoke is enabled)
@@ -397,7 +443,7 @@ private async IAsyncEnumerable<StreamingChatMessageContent> GetStreamingChatMess
                     }
 
                     // Yield the first chunk
-                    yield return this.GetStreamingChatContentFromChatContent(messageContent);
+                    yield return this.GetStreamingChatContentFromChatContent(messageContent, modelId);
 
                     // Consume the entire stream - accumulate tool calls, content, and items from all chunks
                     while (await chatResponsesEnumerator.MoveNextAsync().ConfigureAwait(false))
@@ -429,7 +475,7 @@ private async IAsyncEnumerable<StreamingChatMessageContent> GetStreamingChatMess
                         }
 
                         // Always yield the chunk to the caller for streaming output
-                        yield return this.GetStreamingChatContentFromChatContent(nextMessage);
+                        yield return this.GetStreamingChatContentFromChatContent(nextMessage, modelId);
                     }
 
                     // Create a combined message with all accumulated tool calls for auto-invoke processing
@@ -437,7 +483,7 @@ private async IAsyncEnumerable<StreamingChatMessageContent> GetStreamingChatMess
                     var combinedMessage = new GeminiChatMessageContent(
                         role: messageContent.Role,
                         content: combinedContent.Length > 0 ? combinedContent.ToString() : null,
-                        modelId: messageContent.ModelId ?? this._modelId,
+                        modelId: messageContent.ModelId ?? modelId,
                         partsWithFunctionCalls: allToolCalls.Select(tc => new GeminiPart
                         {
                             FunctionCall = new GeminiPart.FunctionCallPart
@@ -477,7 +523,7 @@ private async IAsyncEnumerable<StreamingChatMessageContent> GetStreamingChatMess
                 }
 
                 // If we don't want to attempt to invoke any functions, just return the result.
-                yield return this.GetStreamingChatContentFromChatContent(messageContent);
+                yield return this.GetStreamingChatContentFromChatContent(messageContent, modelId);
             }
         }
         finally
@@ -502,6 +548,10 @@ private async Task ProcessFunctionsAsync(ChatCompletionState state, Cancellation
                 string.Join(", ", state.LastMessage!.ToolCalls!.Select(ftc => ftc.ToString())));
         }
 
+        string modelId = !string.IsNullOrWhiteSpace(state.ExecutionSettings.ModelId)
+            ? state.ExecutionSettings.ModelId
+            : this._modelId;
+
         // We must send back a response for every tool call, regardless of whether we successfully executed it or not.
         // If we successfully execute it, we'll add the result. If we don't, we'll add an error.
         // Collect all tool responses before adding to chat history
@@ -511,7 +561,7 @@ private async Task ProcessFunctionsAsync(ChatCompletionState state, Cancellation
         foreach (var toolCall in state.LastMessage!.ToolCalls!)
         {
             var (toolResponse, terminationRequested) = await this.ProcessSingleToolCallWithFiltersAsync(
-                state, toolCall, toolCallIndex, cancellationToken).ConfigureAwait(false);
+                state, toolCall, toolCallIndex, modelId, cancellationToken).ConfigureAwait(false);
             toolResponses.Add(toolResponse);
 
             // If filter requested termination, stop processing more tool calls
@@ -530,7 +580,7 @@ private async Task ProcessFunctionsAsync(ChatCompletionState state, Cancellation
         }
 
         // Add all tool responses as a single batched message
-        this.AddBatchedToolResponseMessage(state.ChatHistory, state.GeminiRequest, toolResponses);
+        this.AddBatchedToolResponseMessage(state.ChatHistory, state.GeminiRequest, toolResponses, modelId);
 
         // Clear the tools. If we end up wanting to use tools, we'll reset it to the desired value.
         state.GeminiRequest.Tools = null;
@@ -567,6 +617,7 @@ private async Task ProcessFunctionsAsync(ChatCompletionState state, Cancellation
         ChatCompletionState state,
         GeminiFunctionToolCall toolCall,
         int toolCallIndex,
+        string modelId,
         CancellationToken cancellationToken)
     {
         // Make sure the requested function is one we requested. If we're permitting any kernel function to be invoked,
@@ -575,13 +626,13 @@ private async Task ProcessFunctionsAsync(ChatCompletionState state, Cancellation
         if (state.ExecutionSettings.ToolCallBehavior?.AllowAnyRequestedKernelFunction is not true &&
             !IsRequestableTool(state.GeminiRequest.Tools![0].Functions, toolCall))
         {
-            return (this.CreateToolResponseMessage(toolCall, functionResponse: null, "Error: Function call request for a function that wasn't defined."), false);
+            return (this.CreateToolResponseMessage(toolCall, functionResponse: null, "Error: Function call request for a function that wasn't defined.", modelId), false);
         }
 
         // Ensure the provided function exists for calling
         if (!state.Kernel!.Plugins.TryGetFunctionAndArguments(toolCall, out KernelFunction? function, out KernelArguments? functionArgs))
         {
-            return (this.CreateToolResponseMessage(toolCall, functionResponse: null, "Error: Requested function could not be found."), false);
+            return (this.CreateToolResponseMessage(toolCall, functionResponse: null, "Error: Requested function could not be found.", modelId), false);
         }
 
         // Create the invocation context for the filter pipeline
@@ -626,7 +677,7 @@ private async Task ProcessFunctionsAsync(ChatCompletionState state, Cancellation
         catch (Exception e)
 #pragma warning restore CA1031
         {
-            return (this.CreateToolResponseMessage(toolCall, functionResponse: null, $"Error: Exception while invoking function. {e.Message}"), false);
+            return (this.CreateToolResponseMessage(toolCall, functionResponse: null, $"Error: Exception while invoking function. {e.Message}", modelId), false);
         }
         finally
         {
@@ -636,7 +687,7 @@ private async Task ProcessFunctionsAsync(ChatCompletionState state, Cancellation
         // Apply any changes from the auto function invocation filters context to final result.
         functionResult = invocationContext.Result;
 
-        return (this.CreateToolResponseMessage(toolCall, functionResponse: functionResult, errorMessage: null), invocationContext.Terminate);
+        return (this.CreateToolResponseMessage(toolCall, functionResponse: functionResult, errorMessage: null, modelId), invocationContext.Terminate);
     }
 
     /// <summary>
@@ -679,7 +730,8 @@ await autoFunctionInvocationFilters[index].OnAutoFunctionInvocationAsync(context
     private void AddBatchedToolResponseMessage(
         ChatHistory chat,
         GeminiRequest request,
-        List<GeminiChatMessageContent> toolResponses)
+        List<GeminiChatMessageContent> toolResponses,
+        string modelId)
     {
         if (toolResponses.Count == 0)
         {
@@ -709,7 +761,7 @@ private void AddBatchedToolResponseMessage(
         var batchedMessage = new GeminiChatMessageContent(
             AuthorRole.Tool,
             combinedContent,
-            this._modelId,
+            modelId,
             calledToolResults: allToolResults);
 
         chat.Add(batchedMessage);
@@ -719,7 +771,8 @@ private void AddBatchedToolResponseMessage(
     private GeminiChatMessageContent CreateToolResponseMessage(
         GeminiFunctionToolCall tool,
         FunctionResult? functionResponse,
-        string? errorMessage)
+        string? errorMessage,
+        string modelId)
     {
         if (errorMessage is not null && this.Logger.IsEnabled(LogLevel.Debug))
         {
@@ -728,7 +781,7 @@ private GeminiChatMessageContent CreateToolResponseMessage(
 
         return new GeminiChatMessageContent(AuthorRole.Tool,
             content: errorMessage ?? string.Empty,
-            modelId: this._modelId,
+            modelId: modelId,
             calledToolResult: functionResponse is not null ? new GeminiFunctionToolResult(tool, functionResponse) : null,
             metadata: null);
     }
@@ -771,11 +824,12 @@ private static void ValidateChatHistory(ChatHistory chatHistory)
 
     private async IAsyncEnumerable<GeminiChatMessageContent> ProcessChatResponseStreamAsync(
         Stream responseStream,
+        string modelId,
         [EnumeratorCancellation] CancellationToken ct)
     {
         await foreach (var response in this.ParseResponseStreamAsync(responseStream, ct: ct).ConfigureAwait(false))
         {
-            foreach (var messageContent in this.ProcessChatResponse(response))
+            foreach (var messageContent in this.ProcessChatResponse(response, modelId))
             {
                 yield return messageContent;
             }
@@ -792,11 +846,12 @@ private async IAsyncEnumerable<GeminiResponse> ParseResponseStreamAsync(
         }
     }
 
-    private List<GeminiChatMessageContent> ProcessChatResponse(GeminiResponse geminiResponse)
+    private List<GeminiChatMessageContent> ProcessChatResponse(GeminiResponse geminiResponse, string? modelId = null)
     {
+        modelId ??= this._modelId;
         ValidateGeminiResponse(geminiResponse);
 
-        var chatMessageContents = this.GetChatMessageContentsFromResponse(geminiResponse);
+        var chatMessageContents = this.GetChatMessageContentsFromResponse(geminiResponse, modelId);
         this.LogUsage(chatMessageContents);
         return chatMessageContents;
     }
@@ -834,13 +889,17 @@ private void LogUsage(List<GeminiChatMessageContent> chatMessageContents)
         s_totalTokensCounter.Add(metadata.TotalTokenCount);
     }
 
-    private List<GeminiChatMessageContent> GetChatMessageContentsFromResponse(GeminiResponse geminiResponse)
-        => geminiResponse.Candidates == null ?
-            [new GeminiChatMessageContent(role: AuthorRole.Assistant, content: string.Empty, modelId: this._modelId, functionsToolCalls: null)]
-            : geminiResponse.Candidates.Select(candidate => this.GetChatMessageContentFromCandidate(geminiResponse, candidate)).ToList();
+    private List<GeminiChatMessageContent> GetChatMessageContentsFromResponse(GeminiResponse geminiResponse, string? modelId = null)
+    {
+        modelId ??= this._modelId;
+        return geminiResponse.Candidates == null ?
+            [new GeminiChatMessageContent(role: AuthorRole.Assistant, content: string.Empty, modelId: modelId, functionsToolCalls: null)]
+            : geminiResponse.Candidates.Select(candidate => this.GetChatMessageContentFromCandidate(geminiResponse, candidate, modelId)).ToList();
+    }
 
-    private GeminiChatMessageContent GetChatMessageContentFromCandidate(GeminiResponse geminiResponse, GeminiResponseCandidate candidate)
+    private GeminiChatMessageContent GetChatMessageContentFromCandidate(GeminiResponse geminiResponse, GeminiResponseCandidate candidate, string? modelId = null)
     {
+        modelId ??= this._modelId;
         var items = new List<KernelContent>();
 
         // Process parts to separate regular text from thinking content
@@ -883,7 +942,7 @@ private GeminiChatMessageContent GetChatMessageContentFromCandidate(GeminiRespon
         var chatMessage = new GeminiChatMessageContent(
             role: candidate.Content?.Role ?? AuthorRole.Assistant,
             content: string.IsNullOrEmpty(regularText) ? null : regularText,
-            modelId: this._modelId,
+            modelId: modelId,
             partsWithFunctionCalls: partsWithFunctionCalls,
             metadata: GetResponseMetadata(geminiResponse, candidate, textThoughtSignature));
 
@@ -906,8 +965,9 @@ private static GeminiRequest CreateRequest(
         return geminiRequest;
     }
 
-    private GeminiStreamingChatMessageContent GetStreamingChatContentFromChatContent(GeminiChatMessageContent message)
+    private GeminiStreamingChatMessageContent GetStreamingChatContentFromChatContent(GeminiChatMessageContent message, string? modelId = null)
     {
+        modelId ??= this._modelId;
         GeminiStreamingChatMessageContent streamingMessage;
 
         if (message.CalledToolResult is not null)
@@ -915,7 +975,7 @@ private GeminiStreamingChatMessageContent GetStreamingChatContentFromChatContent
             streamingMessage = new GeminiStreamingChatMessageContent(
                 role: message.Role,
                 content: message.Content,
-                modelId: this._modelId,
+                modelId: modelId,
                 calledToolResult: message.CalledToolResult,
                 metadata: message.Metadata,
                 choiceIndex: message.Metadata?.Index ?? 0);
@@ -925,7 +985,7 @@ private GeminiStreamingChatMessageContent GetStreamingChatContentFromChatContent
             streamingMessage = new GeminiStreamingChatMessageContent(
                 role: message.Role,
                 content: message.Content,
-                modelId: this._modelId,
+                modelId: modelId,
                 toolCalls: message.ToolCalls,
                 metadata: message.Metadata,
                 choiceIndex: message.Metadata?.Index ?? 0);
@@ -935,7 +995,7 @@ private GeminiStreamingChatMessageContent GetStreamingChatContentFromChatContent
             streamingMessage = new GeminiStreamingChatMessageContent(
                 role: message.Role,
                 content: message.Content,
-                modelId: this._modelId,
+                modelId: modelId,
                 choiceIndex: message.Metadata?.Index ?? 0,
                 metadata: message.Metadata);
         }
diff --git a/dotnet/src/Connectors/Connectors.Google/Core/GoogleAI/GoogleAIEmbeddingClient.cs b/dotnet/src/Connectors/Connectors.Google/Core/GoogleAI/GoogleAIEmbeddingClient.cs
index 8f009366dc46..683354a1c43d 100644
--- a/dotnet/src/Connectors/Connectors.Google/Core/GoogleAI/GoogleAIEmbeddingClient.cs
+++ b/dotnet/src/Connectors/Connectors.Google/Core/GoogleAI/GoogleAIEmbeddingClient.cs
@@ -1,4 +1,4 @@
-﻿// Copyright (c) Microsoft. All rights reserved.
+// Copyright (c) Microsoft. All rights reserved.
 
 using System;
 using System.Collections.Generic;
@@ -17,6 +17,7 @@ namespace Microsoft.SemanticKernel.Connectors.Google.Core;
 internal sealed class GoogleAIEmbeddingClient : ClientBase
 {
     private readonly string _embeddingModelId;
+    private readonly GoogleAIVersion _apiVersion;
     private readonly Uri _embeddingEndpoint;
     private readonly int? _dimensions;
 
@@ -46,11 +47,18 @@ public GoogleAIEmbeddingClient(
 
         string versionSubLink = GetApiVersionSubLink(apiVersion);
 
+        this._apiVersion = apiVersion;
         this._embeddingModelId = modelId;
         this._embeddingEndpoint = new Uri($"https://generativelanguage.googleapis.com/{versionSubLink}/models/{this._embeddingModelId}:batchEmbedContents");
         this._dimensions = dimensions;
     }
 
+    private Uri GetEmbeddingEndpoint(string modelId)
+    {
+        string versionSubLink = GetApiVersionSubLink(this._apiVersion);
+        return new Uri($"https://generativelanguage.googleapis.com/{versionSubLink}/models/{modelId}:batchEmbedContents");
+    }
+
     /// <summary>
     /// Generates embeddings for the given data asynchronously.
     /// </summary>
@@ -65,9 +73,11 @@ public async Task<IList<ReadOnlyMemory<float>>> GenerateEmbeddingsAsync(
     {
         Verify.NotNullOrEmpty(data);
 
+        string modelId = !string.IsNullOrWhiteSpace(options?.ModelId) ? options.ModelId : this._embeddingModelId;
         var geminiRequest = this.GetEmbeddingRequest(data, options);
 
-        using var httpRequestMessage = await this.CreateHttpRequestAsync(geminiRequest, this._embeddingEndpoint).ConfigureAwait(false);
+        var endpoint = modelId == this._embeddingModelId ? this._embeddingEndpoint : this.GetEmbeddingEndpoint(modelId);
+        using var httpRequestMessage = await this.CreateHttpRequestAsync(geminiRequest, endpoint).ConfigureAwait(false);
 
         string body = await this.SendRequestAndGetStringBodyAsync(httpRequestMessage, cancellationToken)
             .ConfigureAwait(false);
diff --git a/dotnet/src/Connectors/Connectors.Google/Core/VertexAI/VertexAIEmbeddingClient.cs b/dotnet/src/Connectors/Connectors.Google/Core/VertexAI/VertexAIEmbeddingClient.cs
index cb59e0087481..f7fd490de19b 100644
--- a/dotnet/src/Connectors/Connectors.Google/Core/VertexAI/VertexAIEmbeddingClient.cs
+++ b/dotnet/src/Connectors/Connectors.Google/Core/VertexAI/VertexAIEmbeddingClient.cs
@@ -1,4 +1,4 @@
-﻿// Copyright (c) Microsoft. All rights reserved.
+// Copyright (c) Microsoft. All rights reserved.
 
 using System;
 using System.Collections.Generic;
@@ -17,6 +17,9 @@ namespace Microsoft.SemanticKernel.Connectors.Google.Core;
 internal sealed class VertexAIEmbeddingClient : ClientBase
 {
     private readonly string _embeddingModelId;
+    private readonly VertexAIVersion _apiVersion;
+    private readonly string _location;
+    private readonly string _projectId;
     private readonly Uri _embeddingEndpoint;
     private readonly int? _dimensions;
 
@@ -53,11 +56,21 @@ public VertexAIEmbeddingClient(
         string versionSubLink = GetApiVersionSubLink(apiVersion);
         string baseUri = GetVertexAIBaseUri(location);
 
+        this._apiVersion = apiVersion;
+        this._location = location;
+        this._projectId = projectId;
         this._embeddingModelId = modelId;
         this._embeddingEndpoint = new Uri($"{baseUri}/{versionSubLink}/projects/{projectId}/locations/{location}/publishers/google/models/{this._embeddingModelId}:predict");
         this._dimensions = dimensions;
     }
 
+    private Uri GetEmbeddingEndpoint(string modelId)
+    {
+        string versionSubLink = GetApiVersionSubLink(this._apiVersion);
+        string baseUri = GetVertexAIBaseUri(this._location);
+        return new Uri($"{baseUri}/{versionSubLink}/projects/{this._projectId}/locations/{this._location}/publishers/google/models/{modelId}:predict");
+    }
+
     /// <summary>
     /// Generates embeddings for the given data asynchronously.
     /// </summary>
@@ -72,8 +85,10 @@ public async Task<IList<ReadOnlyMemory<float>>> GenerateEmbeddingsAsync(
     {
         Verify.NotNullOrEmpty(data);
 
+        string modelId = !string.IsNullOrWhiteSpace(options?.ModelId) ? options.ModelId : this._embeddingModelId;
         var geminiRequest = this.GetEmbeddingRequest(data, options);
-        using var httpRequestMessage = await this.CreateHttpRequestAsync(geminiRequest, this._embeddingEndpoint).ConfigureAwait(false);
+        var endpoint = modelId == this._embeddingModelId ? this._embeddingEndpoint : this.GetEmbeddingEndpoint(modelId);
+        using var httpRequestMessage = await this.CreateHttpRequestAsync(geminiRequest, endpoint).ConfigureAwait(false);
 
         string body = await this.SendRequestAndGetStringBodyAsync(httpRequestMessage, cancellationToken)
             .ConfigureAwait(false);
diff --git a/dotnet/src/Connectors/Connectors.Google/GeminiPromptExecutionSettings.cs b/dotnet/src/Connectors/Connectors.Google/GeminiPromptExecutionSettings.cs
index a9729f518899..df56950b817c 100644
--- a/dotnet/src/Connectors/Connectors.Google/GeminiPromptExecutionSettings.cs
+++ b/dotnet/src/Connectors/Connectors.Google/GeminiPromptExecutionSettings.cs
@@ -1,4 +1,4 @@
-﻿// Copyright (c) Microsoft. All rights reserved.
+// Copyright (c) Microsoft. All rights reserved.
 
 using System;
 using System.Collections.Generic;
@@ -371,6 +371,7 @@ public static GeminiPromptExecutionSettings FromExecutionSettings(PromptExecutio
 
         var json = JsonSerializer.Serialize(executionSettings);
         var settings = JsonSerializer.Deserialize<GeminiPromptExecutionSettings>(json, JsonOptionsCache.ReadPermissive)!;
+        settings.ModelId = executionSettings.ModelId;
 
         // If FunctionChoiceBehavior is set and ToolCallBehavior is not, convert it
         if (executionSettings.FunctionChoiceBehavior is not null && settings.ToolCallBehavior is null)

From 2c935e1cffca776324b84efb38f22f971519b7ce Mon Sep 17 00:00:00 2001
From: Yusuf Temel <152587378+Yusuftmle@users.noreply.github.com>
Date: Tue, 12 May 2026 09:28:44 +0300
Subject: [PATCH 5/7] refactor(connectors/google): simplify embedding endpoint
 resolution

---
 .../Connectors.Google/Core/GoogleAI/GoogleAIEmbeddingClient.cs  | 2 +-
 .../Connectors.Google/Core/VertexAI/VertexAIEmbeddingClient.cs  | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/dotnet/src/Connectors/Connectors.Google/Core/GoogleAI/GoogleAIEmbeddingClient.cs b/dotnet/src/Connectors/Connectors.Google/Core/GoogleAI/GoogleAIEmbeddingClient.cs
index 683354a1c43d..1396bab68b9b 100644
--- a/dotnet/src/Connectors/Connectors.Google/Core/GoogleAI/GoogleAIEmbeddingClient.cs
+++ b/dotnet/src/Connectors/Connectors.Google/Core/GoogleAI/GoogleAIEmbeddingClient.cs
@@ -76,7 +76,7 @@ public async Task<IList<ReadOnlyMemory<float>>> GenerateEmbeddingsAsync(
         string modelId = !string.IsNullOrWhiteSpace(options?.ModelId) ? options.ModelId : this._embeddingModelId;
         var geminiRequest = this.GetEmbeddingRequest(data, options);
 
-        var endpoint = modelId == this._embeddingModelId ? this._embeddingEndpoint : this.GetEmbeddingEndpoint(modelId);
+        var endpoint = this.GetEmbeddingEndpoint(modelId);
         using var httpRequestMessage = await this.CreateHttpRequestAsync(geminiRequest, endpoint).ConfigureAwait(false);
 
         string body = await this.SendRequestAndGetStringBodyAsync(httpRequestMessage, cancellationToken)
diff --git a/dotnet/src/Connectors/Connectors.Google/Core/VertexAI/VertexAIEmbeddingClient.cs b/dotnet/src/Connectors/Connectors.Google/Core/VertexAI/VertexAIEmbeddingClient.cs
index f7fd490de19b..87305b928f38 100644
--- a/dotnet/src/Connectors/Connectors.Google/Core/VertexAI/VertexAIEmbeddingClient.cs
+++ b/dotnet/src/Connectors/Connectors.Google/Core/VertexAI/VertexAIEmbeddingClient.cs
@@ -87,7 +87,7 @@ public async Task<IList<ReadOnlyMemory<float>>> GenerateEmbeddingsAsync(
 
         string modelId = !string.IsNullOrWhiteSpace(options?.ModelId) ? options.ModelId : this._embeddingModelId;
         var geminiRequest = this.GetEmbeddingRequest(data, options);
-        var endpoint = modelId == this._embeddingModelId ? this._embeddingEndpoint : this.GetEmbeddingEndpoint(modelId);
+        var endpoint = this.GetEmbeddingEndpoint(modelId);
         using var httpRequestMessage = await this.CreateHttpRequestAsync(geminiRequest, endpoint).ConfigureAwait(false);
 
         string body = await this.SendRequestAndGetStringBodyAsync(httpRequestMessage, cancellationToken)

From 65fc0d84fbe737514b202f342cd73234d7918439 Mon Sep 17 00:00:00 2001
From: Yusuf Temel <152587378+Yusuftmle@users.noreply.github.com>
Date: Tue, 12 May 2026 09:37:34 +0300
Subject: [PATCH 6/7] fix(connectors/openai): respect request-level ModelId
 overrides in OpenAIChatCompletionService

---
 .../OpenAIChatCompletionServiceTests.cs       | 24 ++++++++++++++++++-
 .../Services/OpenAIChatCompletionService.cs   | 10 ++++----
 2 files changed, 28 insertions(+), 6 deletions(-)

diff --git a/dotnet/src/Connectors/Connectors.OpenAI.UnitTests/Services/OpenAIChatCompletionServiceTests.cs b/dotnet/src/Connectors/Connectors.OpenAI.UnitTests/Services/OpenAIChatCompletionServiceTests.cs
index 57b7700a0595..ae57d92d09ba 100644
--- a/dotnet/src/Connectors/Connectors.OpenAI.UnitTests/Services/OpenAIChatCompletionServiceTests.cs
+++ b/dotnet/src/Connectors/Connectors.OpenAI.UnitTests/Services/OpenAIChatCompletionServiceTests.cs
@@ -1,4 +1,4 @@
-﻿// Copyright (c) Microsoft. All rights reserved.
+// Copyright (c) Microsoft. All rights reserved.
 
 using System;
 using System.ClientModel;
@@ -2267,6 +2267,28 @@ public async Task ItSendsBinaryContentCorrectlyAsync(bool useUriData)
         Assert.Equal($"data:{mimeType};base64,{PdfBase64Data}", dataUriFile);
     }
 
+    [Fact]
+    public async Task GetChatMessageContentsAsyncUsesModelIdFromExecutionSettingsAsync()
+    {
+        // Arrange
+        var chatCompletion = new OpenAIChatCompletionService(modelId: "gpt-3.5-turbo", apiKey: "NOKEY", httpClient: this._httpClient);
+        this._messageHandlerStub.ResponseToReturn = new HttpResponseMessage(System.Net.HttpStatusCode.OK)
+        { Content = new StringContent(ChatCompletionResponse) };
+        var settings = new OpenAIPromptExecutionSettings() { ModelId = "gpt-4-override" };
+
+        // Act
+        var result = await chatCompletion.GetChatMessageContentsAsync([new ChatMessageContent(AuthorRole.User, "test")], settings);
+
+        // Assert
+        Assert.NotNull(result);
+        Assert.Equal("gpt-4-override", result[0].ModelId);
+
+        var actualRequestContent = Encoding.UTF8.GetString(this._messageHandlerStub.RequestContent!);
+        Assert.NotNull(actualRequestContent);
+        var optionsJson = JsonElement.Parse(actualRequestContent);
+        Assert.Equal("gpt-4-override", optionsJson.GetProperty("model").GetString());
+    }
+
     /// <summary>
     /// Sample PDF data URI for testing.
     /// </summary>
diff --git a/dotnet/src/Connectors/Connectors.OpenAI/Services/OpenAIChatCompletionService.cs b/dotnet/src/Connectors/Connectors.OpenAI/Services/OpenAIChatCompletionService.cs
index a3f8d96d6e51..aac90b0944d2 100644
--- a/dotnet/src/Connectors/Connectors.OpenAI/Services/OpenAIChatCompletionService.cs
+++ b/dotnet/src/Connectors/Connectors.OpenAI/Services/OpenAIChatCompletionService.cs
@@ -1,4 +1,4 @@
-﻿// Copyright (c) Microsoft. All rights reserved.
+// Copyright (c) Microsoft. All rights reserved.
 
 using System;
 using System.Collections.Generic;
@@ -102,7 +102,7 @@ public Task<IReadOnlyList<ChatMessageContent>> GetChatMessageContentsAsync(
         PromptExecutionSettings? executionSettings = null,
         Kernel? kernel = null,
         CancellationToken cancellationToken = default)
-        => this._client.GetChatMessageContentsAsync(this._client.ModelId, chatHistory, executionSettings, kernel, cancellationToken);
+        => this._client.GetChatMessageContentsAsync(executionSettings?.ModelId ?? this._client.ModelId, chatHistory, executionSettings, kernel, cancellationToken);
 
     /// <inheritdoc/>
     public IAsyncEnumerable<StreamingChatMessageContent> GetStreamingChatMessageContentsAsync(
@@ -110,7 +110,7 @@ public IAsyncEnumerable<StreamingChatMessageContent> GetStreamingChatMessageCont
         PromptExecutionSettings? executionSettings = null,
         Kernel? kernel = null,
         CancellationToken cancellationToken = default)
-        => this._client.GetStreamingChatMessageContentsAsync(this._client.ModelId, chatHistory, executionSettings, kernel, cancellationToken);
+        => this._client.GetStreamingChatMessageContentsAsync(executionSettings?.ModelId ?? this._client.ModelId, chatHistory, executionSettings, kernel, cancellationToken);
 
     /// <inheritdoc/>
     public Task<IReadOnlyList<TextContent>> GetTextContentsAsync(
@@ -118,7 +118,7 @@ public Task<IReadOnlyList<TextContent>> GetTextContentsAsync(
         PromptExecutionSettings? executionSettings = null,
         Kernel? kernel = null,
         CancellationToken cancellationToken = default)
-        => this._client.GetChatAsTextContentsAsync(this._client.ModelId, prompt, executionSettings, kernel, cancellationToken);
+        => this._client.GetChatAsTextContentsAsync(executionSettings?.ModelId ?? this._client.ModelId, prompt, executionSettings, kernel, cancellationToken);
 
     /// <inheritdoc/>
     public IAsyncEnumerable<StreamingTextContent> GetStreamingTextContentsAsync(
@@ -126,5 +126,5 @@ public IAsyncEnumerable<StreamingTextContent> GetStreamingTextContentsAsync(
         PromptExecutionSettings? executionSettings = null,
         Kernel? kernel = null,
         CancellationToken cancellationToken = default)
-        => this._client.GetChatAsTextStreamingContentsAsync(this._client.ModelId, prompt, executionSettings, kernel, cancellationToken);
+        => this._client.GetChatAsTextStreamingContentsAsync(executionSettings?.ModelId ?? this._client.ModelId, prompt, executionSettings, kernel, cancellationToken);
 }

From 8a2b1b10320285b7c9f25b5d82c37f1b4ad01a01 Mon Sep 17 00:00:00 2001
From: Yusuf Temel <152587378+Yusuftmle@users.noreply.github.com>
Date: Tue, 12 May 2026 10:01:38 +0300
Subject: [PATCH 7/7] refactor(connectors): optimize model overrides and clean
 up unused variables

---
 .../Clients/GeminiChatCompletionClient.cs     |  2 +-
 .../Core/GoogleAI/GoogleAIEmbeddingClient.cs  | 11 ++++++--
 .../Core/VertexAI/VertexAIEmbeddingClient.cs  |  5 ++++
 .../Services/OpenAIChatCompletionService.cs   | 28 ++++++++++++++++---
 4 files changed, 38 insertions(+), 8 deletions(-)

diff --git a/dotnet/src/Connectors/Connectors.Google/Core/Gemini/Clients/GeminiChatCompletionClient.cs b/dotnet/src/Connectors/Connectors.Google/Core/Gemini/Clients/GeminiChatCompletionClient.cs
index 37778684b273..5805cf9cbe7d 100644
--- a/dotnet/src/Connectors/Connectors.Google/Core/Gemini/Clients/GeminiChatCompletionClient.cs
+++ b/dotnet/src/Connectors/Connectors.Google/Core/Gemini/Clients/GeminiChatCompletionClient.cs
@@ -200,7 +200,7 @@ public async Task<IReadOnlyList<ChatMessageContent>> GenerateChatMessageAsync(
             ? state.ExecutionSettings.ModelId
             : this._modelId;
 
-        var (generationEndpoint, streamingEndpoint) = this.GetEndpoints(modelId);
+        var (generationEndpoint, _) = this.GetEndpoints(modelId);
 
         for (state.Iteration = 1; ; state.Iteration++)
         {
diff --git a/dotnet/src/Connectors/Connectors.Google/Core/GoogleAI/GoogleAIEmbeddingClient.cs b/dotnet/src/Connectors/Connectors.Google/Core/GoogleAI/GoogleAIEmbeddingClient.cs
index 1396bab68b9b..f107e00c6d66 100644
--- a/dotnet/src/Connectors/Connectors.Google/Core/GoogleAI/GoogleAIEmbeddingClient.cs
+++ b/dotnet/src/Connectors/Connectors.Google/Core/GoogleAI/GoogleAIEmbeddingClient.cs
@@ -55,6 +55,11 @@ public GoogleAIEmbeddingClient(
 
     private Uri GetEmbeddingEndpoint(string modelId)
     {
+        if (modelId == this._embeddingModelId)
+        {
+            return this._embeddingEndpoint;
+        }
+
         string versionSubLink = GetApiVersionSubLink(this._apiVersion);
         return new Uri($"https://generativelanguage.googleapis.com/{versionSubLink}/models/{modelId}:batchEmbedContents");
     }
@@ -74,7 +79,7 @@ public async Task<IList<ReadOnlyMemory<float>>> GenerateEmbeddingsAsync(
         Verify.NotNullOrEmpty(data);
 
         string modelId = !string.IsNullOrWhiteSpace(options?.ModelId) ? options.ModelId : this._embeddingModelId;
-        var geminiRequest = this.GetEmbeddingRequest(data, options);
+        var geminiRequest = this.GetEmbeddingRequest(data, modelId, options);
 
         var endpoint = this.GetEmbeddingEndpoint(modelId);
         using var httpRequestMessage = await this.CreateHttpRequestAsync(geminiRequest, endpoint).ConfigureAwait(false);
@@ -85,8 +90,8 @@ public async Task<IList<ReadOnlyMemory<float>>> GenerateEmbeddingsAsync(
         return DeserializeAndProcessEmbeddingsResponse(body);
     }
 
-    private GoogleAIEmbeddingRequest GetEmbeddingRequest(IEnumerable<string> data, EmbeddingGenerationOptions? options = null)
-    => GoogleAIEmbeddingRequest.FromData(data, options?.ModelId ?? this._embeddingModelId, options?.Dimensions ?? this._dimensions, options);
+    private GoogleAIEmbeddingRequest GetEmbeddingRequest(IEnumerable<string> data, string modelId, EmbeddingGenerationOptions? options = null)
+    => GoogleAIEmbeddingRequest.FromData(data, modelId, options?.Dimensions ?? this._dimensions, options);
 
     private static List<ReadOnlyMemory<float>> DeserializeAndProcessEmbeddingsResponse(string body)
         => ProcessEmbeddingsResponse(DeserializeResponse<GoogleAIEmbeddingResponse>(body));
diff --git a/dotnet/src/Connectors/Connectors.Google/Core/VertexAI/VertexAIEmbeddingClient.cs b/dotnet/src/Connectors/Connectors.Google/Core/VertexAI/VertexAIEmbeddingClient.cs
index 87305b928f38..ef119370308b 100644
--- a/dotnet/src/Connectors/Connectors.Google/Core/VertexAI/VertexAIEmbeddingClient.cs
+++ b/dotnet/src/Connectors/Connectors.Google/Core/VertexAI/VertexAIEmbeddingClient.cs
@@ -66,6 +66,11 @@ public VertexAIEmbeddingClient(
 
     private Uri GetEmbeddingEndpoint(string modelId)
     {
+        if (modelId == this._embeddingModelId)
+        {
+            return this._embeddingEndpoint;
+        }
+
         string versionSubLink = GetApiVersionSubLink(this._apiVersion);
         string baseUri = GetVertexAIBaseUri(this._location);
         return new Uri($"{baseUri}/{versionSubLink}/projects/{this._projectId}/locations/{this._location}/publishers/google/models/{modelId}:predict");
diff --git a/dotnet/src/Connectors/Connectors.OpenAI/Services/OpenAIChatCompletionService.cs b/dotnet/src/Connectors/Connectors.OpenAI/Services/OpenAIChatCompletionService.cs
index aac90b0944d2..84626a444aa7 100644
--- a/dotnet/src/Connectors/Connectors.OpenAI/Services/OpenAIChatCompletionService.cs
+++ b/dotnet/src/Connectors/Connectors.OpenAI/Services/OpenAIChatCompletionService.cs
@@ -102,7 +102,12 @@ public Task<IReadOnlyList<ChatMessageContent>> GetChatMessageContentsAsync(
         PromptExecutionSettings? executionSettings = null,
         Kernel? kernel = null,
         CancellationToken cancellationToken = default)
-        => this._client.GetChatMessageContentsAsync(executionSettings?.ModelId ?? this._client.ModelId, chatHistory, executionSettings, kernel, cancellationToken);
+        => this._client.GetChatMessageContentsAsync(
+            string.IsNullOrWhiteSpace(executionSettings?.ModelId) ? this._client.ModelId : executionSettings!.ModelId,
+            chatHistory,
+            executionSettings,
+            kernel,
+            cancellationToken);
 
     /// <inheritdoc/>
     public IAsyncEnumerable<StreamingChatMessageContent> GetStreamingChatMessageContentsAsync(
@@ -110,7 +115,12 @@ public IAsyncEnumerable<StreamingChatMessageContent> GetStreamingChatMessageCont
         PromptExecutionSettings? executionSettings = null,
         Kernel? kernel = null,
         CancellationToken cancellationToken = default)
-        => this._client.GetStreamingChatMessageContentsAsync(executionSettings?.ModelId ?? this._client.ModelId, chatHistory, executionSettings, kernel, cancellationToken);
+        => this._client.GetStreamingChatMessageContentsAsync(
+            string.IsNullOrWhiteSpace(executionSettings?.ModelId) ? this._client.ModelId : executionSettings!.ModelId,
+            chatHistory,
+            executionSettings,
+            kernel,
+            cancellationToken);
 
     /// <inheritdoc/>
     public Task<IReadOnlyList<TextContent>> GetTextContentsAsync(
@@ -118,7 +128,12 @@ public Task<IReadOnlyList<TextContent>> GetTextContentsAsync(
         PromptExecutionSettings? executionSettings = null,
         Kernel? kernel = null,
         CancellationToken cancellationToken = default)
-        => this._client.GetChatAsTextContentsAsync(executionSettings?.ModelId ?? this._client.ModelId, prompt, executionSettings, kernel, cancellationToken);
+        => this._client.GetChatAsTextContentsAsync(
+            string.IsNullOrWhiteSpace(executionSettings?.ModelId) ? this._client.ModelId : executionSettings!.ModelId,
+            prompt,
+            executionSettings,
+            kernel,
+            cancellationToken);
 
     /// <inheritdoc/>
     public IAsyncEnumerable<StreamingTextContent> GetStreamingTextContentsAsync(
@@ -126,5 +141,10 @@ public IAsyncEnumerable<StreamingTextContent> GetStreamingTextContentsAsync(
         PromptExecutionSettings? executionSettings = null,
         Kernel? kernel = null,
         CancellationToken cancellationToken = default)
-        => this._client.GetChatAsTextStreamingContentsAsync(executionSettings?.ModelId ?? this._client.ModelId, prompt, executionSettings, kernel, cancellationToken);
+        => this._client.GetChatAsTextStreamingContentsAsync(
+            string.IsNullOrWhiteSpace(executionSettings?.ModelId) ? this._client.ModelId : executionSettings!.ModelId,
+            prompt,
+            executionSettings,
+            kernel,
+            cancellationToken);
 }