microsoft
diff --git a/‎samples/cs/Directory.Packages.props‎
Lines changed: 1 addition & 1 deletion b/‎samples/cs/Directory.Packages.props‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎samples/cs/README.md‎
Lines changed: 1 addition & 0 deletions b/‎samples/cs/README.md‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎samples/cs/responses-foundry-local-web-server/Program.cs‎
Lines changed: 180 additions & 0 deletions b/‎samples/cs/responses-foundry-local-web-server/Program.cs‎
Lines changed: 180 additions & 0 deletions
diff --git a/‎samples/cs/responses-foundry-local-web-server/ResponsesFoundryLocalWebServer.csproj‎
Lines changed: 54 additions & 0 deletions b/‎samples/cs/responses-foundry-local-web-server/ResponsesFoundryLocalWebServer.csproj‎
Lines changed: 54 additions & 0 deletions
diff --git a/‎sdk/cs/src/Detail/Model.cs‎
Lines changed: 0 additions & 5 deletions b/‎sdk/cs/src/Detail/Model.cs‎
Lines changed: 0 additions & 5 deletions
diff --git a/‎sdk/cs/src/Detail/ModelVariant.cs‎
Lines changed: 0 additions & 28 deletions b/‎sdk/cs/src/Detail/ModelVariant.cs‎
Lines changed: 0 additions & 28 deletions
diff --git a/‎sdk/cs/src/FoundryLocalManager.cs‎
Lines changed: 0 additions & 19 deletions b/‎sdk/cs/src/FoundryLocalManager.cs‎
Lines changed: 0 additions & 19 deletions
diff --git a/‎sdk/cs/src/IModel.cs‎
Lines changed: 0 additions & 7 deletions b/‎sdk/cs/src/IModel.cs‎
Lines changed: 0 additions & 7 deletions
diff --git a/‎sdk/cs/src/Microsoft.AI.Foundry.Local.csproj‎
Lines changed: 7 additions & 5 deletions b/‎sdk/cs/src/Microsoft.AI.Foundry.Local.csproj‎
Lines changed: 7 additions & 5 deletions
@@ -10,6 +10,6 @@
     <PackageVersion Include="Microsoft.Extensions.Logging" Version="9.0.10" />
     <PackageVersion Include="Microsoft.Extensions.Logging.Console" Version="9.0.10" />
     <PackageVersion Include="NAudio" Version="2.2.1" />
-    <PackageVersion Include="OpenAI" Version="2.5.0" />
+    <PackageVersion Include="OpenAI" Version="2.10.0" />
   </ItemGroup>
 </Project>
@@ -15,6 +15,7 @@ Both packages provide the same APIs, so the same source code works on all platfo
 | [embeddings](embeddings/) | Generate single and batch text embeddings using the Foundry Local SDK. |
 | [audio-transcription-example](audio-transcription-example/) | Transcribe audio files using the Foundry Local SDK. |
 | [foundry-local-web-server](foundry-local-web-server/) | Set up a local OpenAI-compliant web server. |
+| [responses-foundry-local-web-server](responses-foundry-local-web-server/) | Use the OpenAI Responses API (non-streaming, streaming, tool calling) against the local web server. |
 | [tool-calling-foundry-local-sdk](tool-calling-foundry-local-sdk/) | Use tool calling with native chat completions. |
 | [tool-calling-foundry-local-web-server](tool-calling-foundry-local-web-server/) | Use tool calling with the local web server. |
 | [model-management-example](model-management-example/) | Manage models, variant selection, and updates. |
 
@@ -0,0 +1,180 @@
+// <complete_code>
+// Demonstrates the OpenAI Responses API against the Foundry Local OpenAI-compatible web service.
+//
+// SDK responsibilities (Foundry Local):
+//   - SDK initialization
+//   - EP download/registration
+//   - model lookup, download, load
+//   - starting/stopping the local web service
+//
+// Responses API calls go through the official OpenAI .NET package's `ResponsesClient`
+// pointed at the local web service, mirroring how `foundry-local-web-server` uses
+// `OpenAIClient.GetChatClient(...)`.
+
+using System.ClientModel;
+using System.Text;
+using System.Text.Json;
+
+using Microsoft.AI.Foundry.Local;
+
+using OpenAI;
+using OpenAI.Responses;
+
+var config = new Configuration
+{
+    AppName = "foundry_local_samples",
+    LogLevel = Microsoft.AI.Foundry.Local.LogLevel.Information,
+    Web = new Configuration.WebService
+    {
+        Urls = "http://127.0.0.1:52495"
+    }
+};
+
+// Initialize the singleton instance.
+await FoundryLocalManager.CreateAsync(config, Utils.GetAppLogger());
+var mgr = FoundryLocalManager.Instance;
+
+// Download and register every execution provider, rendering one in-place progress line per provider.
+var activeEp = string.Empty;
+await mgr.DownloadAndRegisterEpsAsync((epName, percent) =>
+{
+    // A change of provider name means the previous provider's progress line is complete.
+    var switchedProvider = epName != activeEp;
+    if (switchedProvider && activeEp != string.Empty)
+    {
+        Console.WriteLine();
+    }
+
+    if (switchedProvider)
+    {
+        activeEp = epName;
+    }
+
+    // The carriage return rewinds to the start of the line so the percentage updates in place.
+    Console.Write($"\r  {epName.PadRight(30)}  {percent,6:F1}%");
+});
+
+// Terminate the last progress line, but only if at least one provider reported progress.
+if (activeEp != string.Empty)
+{
+    Console.WriteLine();
+}
+
+// Get the model catalog
+var catalog = await mgr.GetCatalogAsync();
+
+// Get a model using an alias
+var model = await catalog.GetModelAsync("qwen2.5-0.5b") ?? throw new Exception("Model not found");
+
+// Download the model (the method skips download if already cached)
+await model.DownloadAsync(progress =>
+{
+    Console.Write($"\rDownloading model: {progress:F2}%");
+    if (progress >= 100f)
+    {
+        Console.WriteLine();
+    }
+});
+
+// Load the model
+Console.Write($"Loading model {model.Id}...");
+await model.LoadAsync();
+Console.WriteLine("done.");
+
+// Start the web service
+Console.Write($"Starting web service on {config.Web.Urls}...");
+await mgr.StartWebServiceAsync();
+Console.WriteLine("done.");
+
+// <<<<<< OPEN AI RESPONSES SDK USAGE >>>>>>
+// Use the OpenAI Responses client to call the local Foundry web service.
+ApiKeyCredential key = new ApiKeyCredential("notneeded");
+OpenAIClient openai = new OpenAIClient(key, new OpenAIClientOptions
+{
+    Endpoint = new Uri(config.Web.Urls + "/v1"),
+});
+ResponsesClient responses = openai.GetResponsesClient();
+
+// 1) Non-streaming
+Console.WriteLine("\n=== Non-streaming ===");
+ResponseResult simple = await responses.CreateResponseAsync(model.Id, "What is 2 + 2? Respond with just the number.");
+Console.WriteLine($"[ASSISTANT]: {simple.GetOutputText()}");
+
+// 2) Streaming: write each text delta to the console as soon as it arrives.
+Console.WriteLine("\n=== Streaming ===");
+Console.Write("[ASSISTANT]: ");
+var streamedUpdates = responses.CreateResponseStreamingAsync(model.Id, "Count from 1 to 3.");
+await foreach (StreamingResponseUpdate streamed in streamedUpdates)
+{
+    // Print only non-empty text deltas; every other update type is ignored.
+    if (streamed is StreamingResponseOutputTextDeltaUpdate { Delta: { Length: > 0 } textChunk })
+    {
+        Console.Write(textChunk);
+    }
+}
+Console.WriteLine();
+
+// 3) Function/tool calling — full round-trip using previous_response_id.
+Console.WriteLine("\n=== Function calling ===");
+// JSON Schema for the `get_weather` arguments. The tool is registered with
+// `strictModeEnabled: true`, and OpenAI strict mode requires object schemas to list every
+// property as required and to set "additionalProperties": false.
+var weatherSchema = BinaryData.FromString("""
+    {
+        "type": "object",
+        "properties": {
+            "city": { "type": "string", "description": "The city to look up" }
+        },
+        "required": ["city"],
+        "additionalProperties": false
+    }
+    """);
+
+var toolOptions = new CreateResponseOptions(
+    model.Id,
+    new[] { ResponseItem.CreateUserMessageItem("Use get_weather to look up the weather in Seattle, then summarize it.") })
+{
+    StoredOutputEnabled = true,
+    ToolChoice = ResponseToolChoice.CreateRequiredChoice(),
+};
+toolOptions.Tools.Add(ResponseTool.CreateFunctionTool(
+    functionName: "get_weather",
+    functionParameters: weatherSchema,
+    strictModeEnabled: true,
+    functionDescription: "Get the current weather for a given city."));
+
+ResponseResult toolCallResponse = await responses.CreateResponseAsync(toolOptions);
+
+// Pick the first `get_weather` function call among the response's output items (null if none).
+FunctionCallResponseItem? functionCall = toolCallResponse.OutputItems
+    .OfType<FunctionCallResponseItem>()
+    .FirstOrDefault(candidate => candidate.FunctionName == "get_weather");
+
+// Complete the tool round-trip: run the (stubbed) weather tool for the model's function call
+// and send its output back so the model can produce the final answer.
+if (functionCall is null)
+{
+    Console.WriteLine("Model did not produce a function call; skipping tool round-trip.");
+}
+else
+{
+    // The model may emit empty, malformed, or unexpectedly shaped arguments, so every
+    // failure mode below falls back to "unknown" instead of crashing the sample.
+    var argsJson = functionCall.FunctionArguments?.ToString() ?? "{}";
+    var city = "unknown";
+    try
+    {
+        // JsonDocument is IDisposable; release it as soon as the value has been extracted.
+        using var argsDoc = JsonDocument.Parse(argsJson);
+        var root = argsDoc.RootElement;
+
+        // TryGetProperty/ValueKind checks avoid the KeyNotFoundException and
+        // InvalidOperationException that GetProperty/GetString throw on unexpected shapes.
+        if (root.ValueKind == JsonValueKind.Object
+            && root.TryGetProperty("city", out var cityElement)
+            && cityElement.ValueKind == JsonValueKind.String)
+        {
+            city = cityElement.GetString() ?? "unknown";
+        }
+    }
+    catch (JsonException) { /* arguments were not valid JSON; keep the fallback city */ }
+
+    Console.WriteLine($"Tool call: get_weather(city=\"{city}\")");
+
+    // JSON-escape the city so quotes or backslashes in model output cannot corrupt the payload.
+    var toolOutput = $$$"""{"city": "{{{JsonEncodedText.Encode(city)}}}", "temperatureF": 68, "summary": "partly cloudy"}""";
+    Console.WriteLine($"Tool output: {toolOutput}");
+
+    // Submit the tool's output and ask the model to continue using `previous_response_id`.
+    var followUpOptions = new CreateResponseOptions(
+        model.Id,
+        new[] { ResponseItem.CreateFunctionCallOutputItem(functionCall.CallId, toolOutput) })
+    {
+        PreviousResponseId = toolCallResponse.Id,
+        StoredOutputEnabled = true,
+    };
+    followUpOptions.Tools.Add(ResponseTool.CreateFunctionTool(
+        functionName: "get_weather",
+        functionParameters: weatherSchema,
+        strictModeEnabled: true,
+        functionDescription: "Get the current weather for a given city."));
+
+    ResponseResult finalResponse = await responses.CreateResponseAsync(followUpOptions);
+    Console.WriteLine($"[ASSISTANT]: {finalResponse.GetOutputText()}");
+}
+// <<<<<< END OPEN AI RESPONSES SDK USAGE >>>>>>
+
+// Tidy up
+await mgr.StopWebServiceAsync();
+await model.UnloadAsync();
+// </complete_code>
@@ -0,0 +1,54 @@
+<Project Sdk="Microsoft.NET.Sdk">
+
+  <PropertyGroup>
+    <OutputType>Exe</OutputType>
+    <ImplicitUsings>enable</ImplicitUsings>
+    <Nullable>enable</Nullable>
+    <!-- OpenAI Responses APIs are experimental in the official OpenAI .NET package. -->
+    <NoWarn>$(NoWarn);OPENAI001</NoWarn>
+  </PropertyGroup>
+
+  <!-- Windows: target Windows SDK for WinML hardware acceleration -->
+  <PropertyGroup Condition="$([MSBuild]::IsOSPlatform('Windows'))">
+    <TargetFramework>net9.0-windows10.0.26100</TargetFramework>
+    <WindowsAppSDKSelfContained>false</WindowsAppSDKSelfContained>
+    <Platforms>ARM64;x64</Platforms>
+    <WindowsPackageType>None</WindowsPackageType>
+    <EnableCoreMrtTooling>false</EnableCoreMrtTooling>
+  </PropertyGroup>
+
+  <!-- Non-Windows: standard .NET -->
+  <PropertyGroup Condition="!$([MSBuild]::IsOSPlatform('Windows'))">
+    <TargetFramework>net9.0</TargetFramework>
+  </PropertyGroup>
+
+  <PropertyGroup Condition="'$(RuntimeIdentifier)'==''">
+    <RuntimeIdentifier>$(NETCoreSdkRuntimeIdentifier)</RuntimeIdentifier>
+  </PropertyGroup>
+
+  <!-- Windows: WinML for hardware acceleration -->
+  <ItemGroup Condition="$([MSBuild]::IsOSPlatform('Windows'))">
+    <PackageReference Include="Microsoft.AI.Foundry.Local.WinML" />
+  </ItemGroup>
+
+  <!-- Non-Windows: standard SDK -->
+  <ItemGroup Condition="!$([MSBuild]::IsOSPlatform('Windows'))">
+    <PackageReference Include="Microsoft.AI.Foundry.Local" />
+  </ItemGroup>
+
+  <!-- Linux GPU support -->
+  <ItemGroup Condition="'$(RuntimeIdentifier)' == 'linux-x64'">
+    <PackageReference Include="Microsoft.ML.OnnxRuntime.Gpu" />
+    <PackageReference Include="Microsoft.ML.OnnxRuntimeGenAI.Cuda" />
+  </ItemGroup>
+
+  <ItemGroup>
+    <PackageReference Include="OpenAI" />
+  </ItemGroup>
+
+  <!-- Shared utilities -->
+  <ItemGroup>
+    <Compile Include="../Shared/*.cs" />
+  </ItemGroup>
+
+</Project>
@@ -104,11 +104,6 @@ public async Task<OpenAIEmbeddingClient> GetEmbeddingClientAsync(CancellationTok
         return await SelectedVariant.GetEmbeddingClientAsync(ct).ConfigureAwait(false);
     }
 
-    public async Task<OpenAIResponsesClient> GetResponsesClientAsync(CancellationToken? ct = null)
-    {
-        return await SelectedVariant.GetResponsesClientAsync(ct).ConfigureAwait(false);
-    }
-
     public async Task UnloadAsync(CancellationToken? ct = null)
     {
         await SelectedVariant.UnloadAsync(ct).ConfigureAwait(false);
 
@@ -109,13 +109,6 @@ public async Task<OpenAIEmbeddingClient> GetEmbeddingClientAsync(CancellationTok
                                                     .ConfigureAwait(false);
     }
 
-    public async Task<OpenAIResponsesClient> GetResponsesClientAsync(CancellationToken? ct = null)
-    {
-        return await Utils.CallWithExceptionHandling(() => GetResponsesClientImplAsync(ct),
-                                                     "Error getting responses client for model", _logger)
-                                                    .ConfigureAwait(false);
-    }
-
     private async Task<bool> IsLoadedImplAsync(CancellationToken? ct = null)
     {
         var loadedModels = await _modelLoadManager.ListLoadedModelsAsync(ct).ConfigureAwait(false);
@@ -217,27 +210,6 @@ private async Task<OpenAIEmbeddingClient> GetEmbeddingClientImplAsync(Cancellati
         return new OpenAIEmbeddingClient(Id);
     }
 
-    private async Task<OpenAIResponsesClient> GetResponsesClientImplAsync(CancellationToken? ct = null)
-    {
-        if (!await IsLoadedAsync(ct))
-        {
-            throw new FoundryLocalException($"Model {Id} is not loaded. Call LoadAsync first.");
-        }
-
-        var manager = FoundryLocalManager.Instance;
-        if (manager.Urls == null || manager.Urls.Length == 0)
-        {
-            await manager.StartWebServiceAsync(ct).ConfigureAwait(false);
-        }
-
-        if (manager.Urls == null || manager.Urls.Length == 0)
-        {
-            throw new FoundryLocalException("Web service is not running. Call StartWebServiceAsync first.");
-        }
-
-        return new OpenAIResponsesClient(manager.Urls[0], Id);
-    }
-
     public void SelectVariant(IModel variant)
     {
         throw new FoundryLocalException(
 
@@ -460,23 +460,4 @@ public void Dispose()
         Dispose(disposing: true);
         GC.SuppressFinalize(this);
     }
-
-    /// <summary>
-    /// Get an HTTP client for the OpenAI Responses API.
-    /// </summary>
-    /// <remarks>
-    /// The web service must be started first (see <see cref="StartWebServiceAsync"/>).
-    /// </remarks>
-    /// <param name="modelId">Optional default model id used when callers don't supply one.</param>
-    /// <returns>A new <see cref="OpenAIResponsesClient"/>.</returns>
-    /// <exception cref="FoundryLocalException">If the web service has not been started.</exception>
-    public OpenAIResponsesClient GetResponsesClient(string? modelId = null)
-    {
-        if (Urls == null || Urls.Length == 0)
-        {
-            throw new FoundryLocalException("Web service is not running. Call StartWebServiceAsync first.");
-        }
-
-        return new OpenAIResponsesClient(Urls[0], modelId);
-    }
 }
@@ -77,13 +77,6 @@ Task DownloadAsync(Action<float>? downloadProgress = null,
     /// <returns>OpenAI.EmbeddingClient</returns>
     Task<OpenAIEmbeddingClient> GetEmbeddingClientAsync(CancellationToken? ct = null);
 
-    /// <summary>
-    /// Get an HTTP client for the OpenAI Responses API.
-    /// </summary>
-    /// <param name="ct">Optional cancellation token.</param>
-    /// <returns>An <see cref="OpenAIResponsesClient"/> bound to this model.</returns>
-    Task<OpenAIResponsesClient> GetResponsesClientAsync(CancellationToken? ct = null);
-
     /// <summary>
     /// Variants of the model that are available. Variants of the model are optimized for different devices.
     /// </summary>
 
@@ -72,7 +72,8 @@
     <!-- This target runs automatically after package assets are resolved and prints the exact version of the Core package that was selected. -->
     <Target Name="PrintResolvedVersions" AfterTargets="ResolvePackageAssets">
         <Message Importance="High" Text="Resolved Dependencies:" />
-        <Message Importance="High" Text="  %(PackageDependencies.Identity) : %(PackageDependencies.Version)" Condition="$([System.String]::Copy('%(PackageDependencies.Identity)').StartsWith('Microsoft.AI.Foundry.Local.Core'))" />
+        <Message Importance="High" Text="  %(PackageDependencies.Identity) : %(PackageDependencies.Version)" 
+                 Condition="$([System.String]::Copy('%(PackageDependencies.Identity)').StartsWith('Microsoft.AI.Foundry.Local.Core'))" />
     </Target>
 
     <ItemGroup>
@@ -120,13 +121,14 @@
       <NoWarn>$(NoWarn);NU1604</NoWarn>
     </PropertyGroup>
     <ItemGroup>
-      <PackageReference Condition="'$(UseWinML)' == 'true'" Include="Microsoft.AI.Foundry.Local.Core.WinML" Version="$(FoundryLocalCoreWinMLVersion)" />
-      <PackageReference Condition="'$(UseWinML)' != 'true'" Include="Microsoft.AI.Foundry.Local.Core" Version="$(FoundryLocalCoreVersion)" />
+      <PackageReference Condition="'$(UseWinML)' == 'true'"
+                        Include="Microsoft.AI.Foundry.Local.Core.WinML" Version="$(FoundryLocalCoreWinMLVersion)" />
+      <PackageReference Condition="'$(UseWinML)' != 'true'"
+                        Include="Microsoft.AI.Foundry.Local.Core" Version="$(FoundryLocalCoreVersion)" />
 
       <PackageReference Include="Betalgo.Ranul.OpenAI" Version="9.1.0" />
       <PackageReference Include="Microsoft.Extensions.Logging" Version="9.0.9" />
       <!-- specify PrivateAssets to exclude from nuget dependencies -->
-      <PackageReference Include="IDisposableAnalyzers" Version="4.0.8" PrivateAssets="all" />
-      <PackageReference Include="OpenAI" Version="2.10.0" />
+      <PackageReference Include="IDisposableAnalyzers" Version="4.0.8" PrivateAssets="all"/>
     </ItemGroup>
 </Project>
Original file line number	Diff line number	Diff line change
`@@ -104,11 +104,6 @@ public async Task<OpenAIEmbeddingClient> GetEmbeddingClientAsync(CancellationTok`
`104`	`104`	`return await SelectedVariant.GetEmbeddingClientAsync(ct).ConfigureAwait(false);`
`105`	`105`	`}`
`106`	`106`
`107`		`- public async Task<OpenAIResponsesClient> GetResponsesClientAsync(CancellationToken? ct = null)`
`108`		`- {`
`109`		`- return await SelectedVariant.GetResponsesClientAsync(ct).ConfigureAwait(false);`
`110`		`- }`
`111`		`-`
`112`	`107`	`public async Task UnloadAsync(CancellationToken? ct = null)`
`113`	`108`	`{`
`114`	`109`	`await SelectedVariant.UnloadAsync(ct).ConfigureAwait(false);`