diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml index 2c68e17..269eb5b 100644 --- a/.github/workflows/ci.yml +++ b/.github/workflows/ci.yml @@ -8,8 +8,8 @@ on: branches: [ "main", "master" ] paths: [ 'src/**' ] -jobs: +jobs: build: runs-on: ubuntu-latest @@ -45,7 +45,7 @@ jobs: run: dotnet build --no-restore --configuration=Release /p:Version=${{steps.gitversion.outputs.semVer}} - name: Test - run: dotnet test --no-build --configuration=Release --verbosity normal + run: dotnet test --no-build --configuration=Release --verbosity normal --filter 'FullyQualifiedName!~FunctionalTests' - name: pack nuget packages run: dotnet pack --output nupkgs --configuration=Release --no-restore --no-build /p:PackageVersion=${{steps.gitversion.outputs.semVer}} @@ -59,4 +59,4 @@ jobs: - name: upload nuget package if: github.event_name != 'pull_request' - run: dotnet nuget push nupkgs/OllamaSharp*.nupkg -k ${{ secrets.NUGET_API_KEY }} -s https://api.nuget.org/v3/index.json + run: dotnet nuget push nupkgs/OllamaSharp*.nupkg -k ${{ secrets.NUGET_API_KEY }} -s https://api.nuget.org/v3/index.json \ No newline at end of file diff --git a/.github/workflows/docs.yml b/.github/workflows/docs.yml new file mode 100644 index 0000000..74de1ce --- /dev/null +++ b/.github/workflows/docs.yml @@ -0,0 +1,40 @@ +name: docfx Build and Deploy + +on: + push: + branches: [ "main" ] + workflow_dispatch: + +permissions: + actions: read + pages: write + id-token: write + +concurrency: + group: "pages" + cancel-in-progress: false + +jobs: + publish-docs: + environment: + name: github-pages + url: ${{ steps.deployment.outputs.page_url }} + runs-on: ubuntu-latest + steps: + - name: Checkout + uses: actions/checkout@v3 + - name: Dotnet Setup + uses: actions/setup-dotnet@v3 + with: + dotnet-version: 8.x + + - run: dotnet tool update -g docfx + - run: docfx ./docfx.json + + - name: Upload artifact + uses: actions/upload-pages-artifact@v3 + with: + path: './_site' + - name: Deploy to GitHub Pages + id: deployment + uses: actions/deploy-pages@v4 \ No newline at end of file diff --git a/.gitignore b/.gitignore index f08db5b..240577a 100644 --- a/.gitignore +++ b/.gitignore @@ -396,4 +396,8 @@ FodyWeavers.xsd # JetBrains Rider *.sln.iml -/.idea \ No newline at end of file +/.idea + +# DocFX +_site/ +api/ \ No newline at end of file diff --git a/demo/Demos/ToolConsole.cs b/demo/Demos/ToolConsole.cs index e154626..9574da9 100644 --- a/demo/Demos/ToolConsole.cs +++ b/demo/Demos/ToolConsole.cs @@ -93,7 +93,7 @@ public override async Task Run() } } - private static IEnumerable GetTools() => [new WeatherTool(), new NewsTool()]; + private static Tool[] GetTools() => [new WeatherTool(), new NewsTool()]; private sealed class WeatherTool : Tool { diff --git a/doc-template/public/main.css b/doc-template/public/main.css new file mode 100644 index 0000000..98b5285 --- /dev/null +++ b/doc-template/public/main.css @@ -0,0 +1,9 @@ +.flex-row { + display: flex; + flex-direction: row; +} + +.flex-column { + display: flex; + flex-direction: column; +} \ No newline at end of file diff --git a/doc-template/public/main.js b/doc-template/public/main.js new file mode 100644 index 0000000..b0feb6f --- /dev/null +++ b/doc-template/public/main.js @@ -0,0 +1,10 @@ +export default { + defaultTheme: 'dark', + iconLinks: [ + { + icon: 'github', + href: 'https://github.com/awaescher/OllamaSharp', + title: 'GitHub' + } + ] +} \ No newline at end of file diff --git a/docfx.json b/docfx.json new file mode 100644 index 0000000..05f021e --- /dev/null +++ 
b/docfx.json @@ -0,0 +1,52 @@ +{ + "metadata": [ + { + "src": [ + { + "src": "./src", + "files": [ + "**/*.csproj" + ] + } + ], + "dest": "api" + } + ], + "build": { + "content": [ + { + "files": [ + "**/*.{md,yml}" + ], + "exclude": [ + "_site/**" + ] + } + ], + "markdownEngineProperties": { + "markdigExtensions": [ + "CustomContainers" + ] + }, + "resource": [ + { + "files": [ + "images/**" + ] + } + ], + "output": "_site", + "template": [ + "default", + "modern", + "doc-template" + ], + "globalMetadata": { + "_appName": "OllamaSharp", + "_appTitle": "OllamaSharp", + "_appLogoPath": "images/0.png", + "_enableSearch": true, + "pdf": true + } + } +} \ No newline at end of file diff --git a/docs/getting-started.md b/docs/getting-started.md new file mode 100644 index 0000000..c2b1357 --- /dev/null +++ b/docs/getting-started.md @@ -0,0 +1,64 @@ +# Getting Started + +[OllamaSharp](https://github.com/awaescher/OllamaSharp) provides .NET bindings for the Ollama API, simplifying interactions with Ollama both locally and remotely. It provides asynchronous streaming, progress reporting, and convenience classes and functions to simplify common use cases. + +Getting started with OllamaSharp only requires a running Ollama server and a supported version of [.NET](https://dotnet.microsoft.com/en-us/download). + +## Prerequisites + +- [Ollama](https://ollama.com/) +- [.NET](https://dotnet.microsoft.com/en-us/download) + +## Pulling a model + +To use Ollama, you will need to specify a large language model to talk with. You can download a model from the [Ollama model hub](https://ollama.com/models). Below is a code snippet illustrating how to connect to an Ollama server and pull a model: + +```csharp +using OllamaSharp; + +// if you are running Ollama locally on the default port: +var uri = new Uri("http://localhost:11434"); +var ollama = new OllamaApiClient(uri); + +// pull the model, and print the status of the pull operation. +await foreach (var status in ollama.PullModelAsync("llama3.2-vision")) + Console.WriteLine($"{status.Percent}% {status.Status}"); + +Console.WriteLine("Model pulled successfully."); +``` + +This should result in an output like this: + +``` +100% pulling manifest +100% pulling 11f274007f09 +100% pulling ece5e659647a +100% pulling 715415638c9c +100% pulling 0b4284c1f870 +100% pulling fefc914e46e6 +100% pulling fbd313562bb7 +100% verifying sha256 digest +100% writing manifest +100% success +Model pulled successfully. +``` + +## Talking to a model + +After obtaining a model, you can begin interacting with Ollama. The following code snippet demonstrates how to connect to an Ollama server, load a model, and initiate a conversation: + +```csharp +using OllamaSharp; + +var uri = new Uri("http://localhost:11434"); +var model = "llama3.2-vision"; + +var ollama = new OllamaApiClient(uri, model); + +var request = "Write a deep, beautiful song for me about AI and the future."; + +await foreach (var stream in ollama.GenerateAsync(request)) + Console.Write(stream.Response); +``` + +The model's answer should be streamed directly into your console window. \ No newline at end of file diff --git a/docs/introduction.md b/docs/introduction.md new file mode 100644 index 0000000..9698310 --- /dev/null +++ b/docs/introduction.md @@ -0,0 +1,5 @@ +# Introduction + +[Ollama](https://ollama.com/) is a [Go](https://go.dev/)-based, open-source server for interacting with local large language models using Georgi Gerganov's [llama.cpp](https://github.com/ggerganov/llama.cpp) library.
Ollama provides first-class support for various models, including [llama3.2](https://ollama.com/library/llama3.2), [phi3.5](https://ollama.com/library/phi3.5), [mistral](https://ollama.com/library/mistral), and many more. It provides support for pulling, running, creating, pushing, and interacting with models. + +[OllamaSharp](https://github.com/awaescher/OllamaSharp) provides .NET bindings for the Ollama API, simplifying interactions with Ollama both locally and remotely. It provides asynchronous streaming, progress reporting, and convenience classes and functions to simplify common use cases. \ No newline at end of file diff --git a/docs/toc.yml b/docs/toc.yml new file mode 100644 index 0000000..d7e9ea8 --- /dev/null +++ b/docs/toc.yml @@ -0,0 +1,4 @@ +- name: Introduction + href: introduction.md +- name: Getting Started + href: getting-started.md \ No newline at end of file diff --git a/images/0.png b/images/0.png new file mode 100644 index 0000000..bdb78b2 Binary files /dev/null and b/images/0.png differ diff --git a/images/dotnet@0.1x.png b/images/dotnet@0.1x.png new file mode 100644 index 0000000..1420f88 Binary files /dev/null and b/images/dotnet@0.1x.png differ diff --git a/images/logo.png b/images/logo.png new file mode 100644 index 0000000..85dd87b Binary files /dev/null and b/images/logo.png differ diff --git a/images/logo@0.1x.png b/images/logo@0.1x.png new file mode 100644 index 0000000..eb7374f Binary files /dev/null and b/images/logo@0.1x.png differ diff --git a/index.md b/index.md new file mode 100644 index 0000000..8f52f86 --- /dev/null +++ b/index.md @@ -0,0 +1,53 @@ +--- +_layout: landing +--- + +::::flex-row + +:::col + +![Ollama Logo](images/logo@0.1x.png) ➕ ![.NET Logo](images/dotnet@0.1x.png) + +# Build AI-powered applications with Ollama and .NET 🦙 + +OllamaSharp provides .NET bindings for the [Ollama API](https://github.com/jmorganca/ollama/blob/main/docs/api.md), simplifying interactions with Ollama both locally and remotely. + +It supports interacting with Ollama directly or through the [Microsoft.Extensions.AI](https://devblogs.microsoft.com/dotnet/introducing-microsoft-extensions-ai-preview/) +and [Microsoft Semantic Kernel](https://github.com/microsoft/semantic-kernel/pull/7362) libraries. +::: +:::col + +### Add OllamaSharp to your project +```bash +dotnet add package OllamaSharp +``` + +### Start talking to Ollama +```csharp +using OllamaSharp; + +var uri = new Uri("http://localhost:11434"); +var ollama = new OllamaApiClient(uri, "llama3.2"); + +// messages including their roles and tool calls will automatically +// be tracked within the chat object and are accessible via the Messages property +var chat = new Chat(ollama); + +Console.WriteLine("You're now talking with Ollama. Hit Ctrl+C to exit."); + +while (true) +{ + Console.Write("You: "); + var input = Console.ReadLine(); + + Console.Write("Assistant: "); + await foreach (var stream in chat.SendAsync(input)) + Console.Write(stream); + + Console.WriteLine(""); +} +``` + +::: + +:::: \ No newline at end of file diff --git a/src/AsyncEnumerableExtensions/ChatResponseStreamAppender.cs b/src/AsyncEnumerableExtensions/ChatResponseStreamAppender.cs index af25c7e..9c76d20 100644 --- a/src/AsyncEnumerableExtensions/ChatResponseStreamAppender.cs +++ b/src/AsyncEnumerableExtensions/ChatResponseStreamAppender.cs @@ -4,15 +4,16 @@ namespace OllamaSharp.AsyncEnumerableExtensions; /// -/// Appender to stream IAsyncEnumerable(ChatResponseStream) to build up one single ChatDoneResponseStream object +/// Appender to stream to +/// build up one single object /// -public class ChatResponseStreamAppender : IAppender +internal class ChatResponseStreamAppender : IAppender { private readonly MessageBuilder _messageBuilder = new(); private ChatDoneResponseStream? _lastItem; /// - /// Appends a given ChatResponseStream item to build a single return object + /// Appends a given item to build a single return object /// /// The item to append public void Append(ChatResponseStream? item) { @@ -24,8 +25,10 @@ public void Append(ChatResponseStream? item) } /// - /// Builds up one single ChatDoneResponseStream object from the previously streamed ChatResponseStream items + /// Builds up one single object from the + /// previously streamed items /// + /// The completed consolidated object public ChatDoneResponseStream? Complete() { if (_lastItem is null) diff --git a/src/AsyncEnumerableExtensions/GenerateResponseStreamAppender.cs b/src/AsyncEnumerableExtensions/GenerateResponseStreamAppender.cs index 4ee4694..11e1649 100644 --- a/src/AsyncEnumerableExtensions/GenerateResponseStreamAppender.cs +++ b/src/AsyncEnumerableExtensions/GenerateResponseStreamAppender.cs @@ -5,15 +5,16 @@ namespace OllamaSharp.AsyncEnumerableExtensions; /// -/// Appender to stream IAsyncEnumerable(GenerateResponseStream) to build up one single GenerateDoneResponseStream object +/// Appender to stream +/// to build up one single object /// -public class GenerateResponseStreamAppender : IAppender +internal class GenerateResponseStreamAppender : IAppender { private readonly StringBuilder _builder = new(); private GenerateDoneResponseStream? _lastItem; /// - /// Appends a given GenerateResponseStream item to build a single return object + /// Appends a given item to build a single return object /// /// The item to append public void Append(GenerateResponseStream? item) { @@ -25,8 +26,10 @@ public void Append(GenerateResponseStream? item) } /// - /// Builds up one single GenerateDoneResponseStream object from the previously streamed GenerateResponseStream items + /// Builds up one single object + /// from the previously streamed items /// + /// The completed, consolidated object public GenerateDoneResponseStream?
Complete() { if (_lastItem is null) diff --git a/src/AsyncEnumerableExtensions/IAppender.cs b/src/AsyncEnumerableExtensions/IAppender.cs index db819b1..99f9ae8 100644 --- a/src/AsyncEnumerableExtensions/IAppender.cs +++ b/src/AsyncEnumerableExtensions/IAppender.cs @@ -5,7 +5,7 @@ namespace OllamaSharp.AsyncEnumerableExtensions; /// /// The type of the items of the IAsyncEnumerable /// The return type after the IAsyncEnumerable was streamed to the end -public interface IAppender +internal interface IAppender { /// /// Appends an item to build up the return value diff --git a/src/AsyncEnumerableExtensions/IAsyncEnumerableExtensions.cs b/src/AsyncEnumerableExtensions/IAsyncEnumerableExtensions.cs index cf118f3..3a93901 100644 --- a/src/AsyncEnumerableExtensions/IAsyncEnumerableExtensions.cs +++ b/src/AsyncEnumerableExtensions/IAsyncEnumerableExtensions.cs @@ -19,7 +19,7 @@ public static partial class IAsyncEnumerableExtensions { /// /// The IAsyncEnumerable to stream /// An optional callback to additionally process every single item from the IAsyncEnumerable - /// A single response stream appened from every IAsyncEnumerable item + /// A single response stream appended from every IAsyncEnumerable item public static Task StreamToEndAsync(this IAsyncEnumerable stream, Action? itemCallback = null) => stream.StreamToEndAsync(new StringAppender(), itemCallback); @@ -48,7 +48,7 @@ public static Task StreamToEndAsync(this IAsyncEnumerable stream /// The appender instance used to build up one single response value /// An optional callback to additionally process every single item from the IAsyncEnumerable /// A single ChatDoneResponseStream built up from every single IAsyncEnumerable item - public static async Task StreamToEndAsync(this IAsyncEnumerable stream, IAppender appender, Action? itemCallback = null) + internal static async Task StreamToEndAsync(this IAsyncEnumerable stream, IAppender appender, Action? itemCallback = null) { await foreach (var item in stream.ConfigureAwait(false)) { diff --git a/src/AsyncEnumerableExtensions/StringAppender.cs b/src/AsyncEnumerableExtensions/StringAppender.cs index abd99ed..6b3dd1d 100644 --- a/src/AsyncEnumerableExtensions/StringAppender.cs +++ b/src/AsyncEnumerableExtensions/StringAppender.cs @@ -3,9 +3,9 @@ namespace OllamaSharp.AsyncEnumerableExtensions; /// -/// Appender to stream IAsyncEnumerable(string) to build up one single result string +/// Appender to stream to build up one single result string /// -public class StringAppender : IAppender +internal class StringAppender : IAppender { private readonly StringBuilder _builder = new(); diff --git a/src/ByteArrayExtensions.cs b/src/ByteArrayExtensions.cs index ce11a7e..ffea185 100644 --- a/src/ByteArrayExtensions.cs +++ b/src/ByteArrayExtensions.cs @@ -7,17 +7,20 @@ namespace OllamaSharp; /// /// Extensions for byte arrays /// -public static class ByteArrayExtensions +internal static class ByteArrayExtensions { /// - /// Converts a series of bytes to a base64 string + /// Converts a sequence of bytes to its equivalent string representation encoded in base-64. /// - /// The bytes to convert to base64 - public static string ToBase64(this IEnumerable? bytes) => Convert.ToBase64String(bytes.ToArray()); + /// The sequence of bytes to convert to a base-64 string. + /// A base-64 encoded string representation of the input byte sequence.
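+ /// <example>A minimal usage sketch (the file name is illustrative): <code>var base64Image = File.ReadAllBytes("cat.jpg").ToBase64();</code></example>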
+ public static string ToBase64(this IEnumerable bytes) => Convert.ToBase64String(bytes.ToArray()); + /// - /// Converts multiple series of bytes to multiple base64 strings, one for each. + /// Converts a collection of byte arrays to a collection of base64 strings. /// - /// The series of bytes to convert to base64 - public static IEnumerable? ToBase64(this IEnumerable>? byteArrays) => byteArrays?.Select(ToBase64); + /// The collection of byte arrays to convert to base64 strings. + /// A collection of base64 strings, or null if the input is null. + public static IEnumerable? ToBase64(this IEnumerable>? byteArrays) => byteArrays?.Select(bytes => bytes.ToBase64()); } \ No newline at end of file diff --git a/src/Chat.cs b/src/Chat.cs index 0d0e0e2..65c18e5 100644 --- a/src/Chat.cs +++ b/src/Chat.cs @@ -12,6 +12,31 @@ namespace OllamaSharp; /// /// A chat helper that handles the chat logic internally and /// automatically extends the message history. +/// +/// +/// A simple interactive chat can be implemented in just a handful of lines: +/// +/// var ollama = new OllamaApiClient("http://localhost:11434", "llama3.2-vision:latest"); +/// var chat = new Chat(ollama); +/// // ... +/// while (true) +/// { +/// Console.Write("You: "); +/// var message = Console.ReadLine()!; +/// Console.Write("Ollama: "); +/// await foreach (var answerToken in chat.SendAsync(message)) +/// Console.Write(answerToken); +/// // ... +/// Console.WriteLine(); +/// } +/// // ... +/// // Output: +/// // You: Write a haiku about AI models +/// // Ollama: Code whispers secrets +/// // Intelligent designs unfold +/// // Minds beyond our own +/// +/// /// public class Chat { @@ -40,7 +65,17 @@ public class Chat /// /// The Ollama client to use for the chat /// An optional system prompt to define the behavior of the chat assistant - /// + /// + /// If the client is null, an is thrown. + /// + /// + /// Setting up a chat with a system prompt: + /// + /// var client = new OllamaApiClient("http://localhost:11434", "llama3.2-vision:latest"); + /// var prompt = "You are a helpful assistant that will answer any question you are asked."; + /// var chat = new Chat(client, prompt); + /// + /// public Chat(IOllamaApiClient client, string systemPrompt = "") { Client = client ?? throw new ArgumentNullException(nameof(client)); @@ -55,6 +90,15 @@ public Chat(IOllamaApiClient client, string systemPrompt = "") /// /// The message to send /// The token to cancel the operation with + /// An that streams the response. + /// + /// Getting a response from the model: + /// + /// var response = chat.SendAsync("Write a haiku about AI models"); + /// await foreach (var answerToken in response) + /// Console.WriteLine(answerToken); + /// + /// public IAsyncEnumerable SendAsync(string message, CancellationToken cancellationToken = default) => SendAsync(message, tools: null, imagesAsBase64: null, cancellationToken); /// @@ -64,7 +108,25 @@ public IAsyncEnumerable SendAsync(string message, CancellationToken canc /// The message to send /// Images in byte representation to send to the model /// The token to cancel the operation with - public IAsyncEnumerable SendAsync(string message, IEnumerable> imagesAsBytes, CancellationToken cancellationToken = default) + /// An that streams the response.
+ /// + /// Getting a response from the model with an image: + /// + /// var client = new HttpClient(); + /// var cat = await client.GetByteArrayAsync("https://cataas.com/cat"); + /// var ollama = new OllamaApiClient("http://localhost:11434", "llama3.2-vision:latest"); + /// var chat = new Chat(ollama); + /// var response = chat.SendAsync("What do you see?", [cat]); + /// await foreach (var answerToken in response) Console.Write(answerToken); + /// + /// // Output: The image shows a white kitten with black markings on its + /// // head and tail, sitting next to an orange tabby cat. The kitten + /// // is looking at the camera while the tabby cat appears to be + /// // sleeping or resting with its eyes closed. The two cats are + /// // lying in a blanket that has been rumpled up. + /// + /// + public IAsyncEnumerable SendAsync(string message, IEnumerable>? imagesAsBytes, CancellationToken cancellationToken = default) => SendAsync(message, imagesAsBytes?.ToBase64() ?? [], cancellationToken); /// @@ -73,7 +135,26 @@ public IAsyncEnumerable SendAsync(string message, IEnumerableThe message to send /// Base64 encoded images to send to the model /// The token to cancel the operation with - public IAsyncEnumerable SendAsync(string message, IEnumerable imagesAsBase64, CancellationToken cancellationToken = default) + /// An that streams the response. + /// + /// Getting a response from the model with an image: + /// + /// var client = new HttpClient(); + /// var cat = await client.GetByteArrayAsync("https://cataas.com/cat"); + /// var base64Cat = Convert.ToBase64String(cat); + /// var ollama = new OllamaApiClient("http://localhost:11434", "llama3.2-vision:latest"); + /// var chat = new Chat(ollama); + /// var response = chat.SendAsync("What do you see?", [base64Cat]); + /// await foreach (var answerToken in response) Console.Write(answerToken); + /// + /// // Output: + /// // The image shows a cat lying on the floor next to an iPad. The cat is looking + /// // at the screen, which displays a game with fish and other sea creatures. The + /// // cat's paw is touching the screen, as if it is playing the game. The background + /// // of the image is a wooden floor. + /// + /// + public IAsyncEnumerable SendAsync(string message, IEnumerable? imagesAsBase64, CancellationToken cancellationToken = default) => SendAsync(message, [], imagesAsBase64, cancellationToken); /// @@ -83,7 +164,7 @@ public IAsyncEnumerable SendAsync(string message, IEnumerable im /// Tools that the model can make use of, see https://ollama.com/blog/tool-support. By using tools, response streaming is automatically turned off /// Base64 encoded images to send to the model /// The token to cancel the operation with - public IAsyncEnumerable SendAsync(string message, IEnumerable? tools, IEnumerable? imagesAsBase64 = default, CancellationToken cancellationToken = default) + public IAsyncEnumerable SendAsync(string message, IReadOnlyCollection? tools, IEnumerable? 
imagesAsBase64 = default, CancellationToken cancellationToken = default) => SendAsAsync(ChatRole.User, message, tools, imagesAsBase64, cancellationToken); /// @@ -102,7 +183,7 @@ public IAsyncEnumerable SendAsAsync(ChatRole role, string message, Cance /// The message to send /// Images in byte representation to send to the model /// The token to cancel the operation with - public IAsyncEnumerable SendAsAsync(ChatRole role, string message, IEnumerable> imagesAsBytes, CancellationToken cancellationToken = default) + public IAsyncEnumerable SendAsAsync(ChatRole role, string message, IEnumerable>? imagesAsBytes, CancellationToken cancellationToken = default) => SendAsAsync(role, message, imagesAsBytes?.ToBase64() ?? [], cancellationToken); /// @@ -112,7 +193,7 @@ public IAsyncEnumerable SendAsAsync(ChatRole role, string message, IEnum /// The message to send /// Base64 encoded images to send to the model /// The token to cancel the operation with - public IAsyncEnumerable SendAsAsync(ChatRole role, string message, IEnumerable imagesAsBase64, CancellationToken cancellationToken = default) + public IAsyncEnumerable SendAsAsync(ChatRole role, string message, IEnumerable? imagesAsBase64, CancellationToken cancellationToken = default) => SendAsAsync(role, message, [], imagesAsBase64, cancellationToken); /// @@ -123,7 +204,7 @@ public IAsyncEnumerable SendAsAsync(ChatRole role, string message, IEnum /// Tools that the model can make use of, see https://ollama.com/blog/tool-support. By using tools, response streaming is automatically turned off /// Base64 encoded images to send to the model /// The token to cancel the operation with - public async IAsyncEnumerable SendAsAsync(ChatRole role, string message, IEnumerable? tools, IEnumerable? imagesAsBase64 = default, [EnumeratorCancellation] CancellationToken cancellationToken = default) + public async IAsyncEnumerable SendAsAsync(ChatRole role, string message, IReadOnlyCollection? tools, IEnumerable? imagesAsBase64 = default, [EnumeratorCancellation] CancellationToken cancellationToken = default) { Messages.Add(new Message(role, message, imagesAsBase64?.ToArray())); diff --git a/src/HttpRequestMessageExtensions.cs b/src/HttpRequestMessageExtensions.cs index e8f2163..264721d 100644 --- a/src/HttpRequestMessageExtensions.cs +++ b/src/HttpRequestMessageExtensions.cs @@ -1,20 +1,21 @@ using System.Collections.Generic; using System.Net.Http; +using System.Net.Http.Headers; using OllamaSharp.Models; namespace OllamaSharp; /// -/// Extension methods for the http request message +/// Provides extension methods for the class. /// -public static class HttpRequestMessageExtensions +internal static class HttpRequestMessageExtensions { /// - /// Applies default headers from the OllamaApiClient and optional Ollama requests + /// Applies custom headers to the instance. /// - /// The http request message to set the headers on - /// The headers to set on the request message - /// The request to the Ollama API to get the custom headers from + /// The to set the headers on. + /// A dictionary containing the headers to set on the request message. + /// An optional to get additional custom headers from. public static void ApplyCustomHeaders(this HttpRequestMessage requestMessage, Dictionary headers, OllamaRequest? 
ollamaRequest) { foreach (var header in headers) @@ -27,7 +28,13 @@ public static void ApplyCustomHeaders(this HttpRequestMessage requestMessage, Di } } - private static void AddOrUpdateHeaderValue(System.Net.Http.Headers.HttpRequestHeaders requestMessageHeaders, string headerKey, string headerValue) + /// + /// Adds or updates a header value in the collection. + /// + /// The collection to update. + /// The key of the header to add or update. + /// The value of the header to add or update. + private static void AddOrUpdateHeaderValue(HttpRequestHeaders requestMessageHeaders, string headerKey, string headerValue) { if (requestMessageHeaders.Contains(headerKey)) requestMessageHeaders.Remove(headerKey); diff --git a/src/IOllamaApiClient.cs b/src/IOllamaApiClient.cs index 8f2ddf3..a9f3686 100644 --- a/src/IOllamaApiClient.cs +++ b/src/IOllamaApiClient.cs @@ -16,9 +16,9 @@ namespace OllamaSharp; public interface IOllamaApiClient { /// - /// Gets the endpoint uri used by the api client + /// Gets the endpoint URI used by the API client. /// - public Uri Uri { get; } + Uri Uri { get; } /// /// Gets or sets the name of the model to run requests on. @@ -27,12 +27,11 @@ public interface IOllamaApiClient /// /// Sends a request to the /api/chat endpoint and streams the response of the chat. - /// To implement a fully interactive chat, you should make use of the Chat class with "new Chat(...)" /// - /// The request to send to Ollama - /// The token to cancel the operation with + /// The request to send to Ollama. + /// The token to cancel the operation with. /// - /// An asynchronous enumerable that yields ChatResponseStream. Each item + /// An asynchronous enumerable that yields . Each item /// represents a message in the chat response stream. Returns null when the /// stream is completed. /// @@ -43,54 +42,57 @@ public interface IOllamaApiClient IAsyncEnumerable ChatAsync(ChatRequest request, [EnumeratorCancellation] CancellationToken cancellationToken = default); /// - /// Sends a request to the /api/copy endpoint to copy a model + /// Sends a request to the /api/copy endpoint to copy a model. /// - /// The parameters required to copy a model - /// The token to cancel the operation with + /// The parameters required to copy a model. + /// The token to cancel the operation with. Task CopyModelAsync(CopyModelRequest request, CancellationToken cancellationToken = default); /// - /// Sends a request to the /api/create endpoint to create a model + /// Sends a request to the /api/create endpoint to create a model. /// - /// The request object containing the model details - /// The token to cancel the operation with - /// An asynchronous enumerable of the model creation status + /// The request object containing the model details. + /// The token to cancel the operation with. + /// An asynchronous enumerable of the model creation status. IAsyncEnumerable CreateModelAsync(CreateModelRequest request, [EnumeratorCancellation] CancellationToken cancellationToken = default); /// - /// Sends a request to the /api/delete endpoint to delete a model + /// Sends a request to the /api/delete endpoint to delete a model. /// - /// The request containing the model to delete - /// The token to cancel the operation with + /// The request containing the model to delete. + /// The token to cancel the operation with. 
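+ /// <example>A hypothetical call, assuming a connected client (the model name is illustrative): <code>await client.DeleteModelAsync(new DeleteModelRequest { Model = "llama3.2:1b" }, CancellationToken.None);</code></example>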
Task DeleteModelAsync(DeleteModelRequest request, CancellationToken cancellationToken = default); /// - /// Sends a request to the /api/embed endpoint to generate embeddings + /// Sends a request to the /api/embed endpoint to generate embeddings. /// - /// The parameters to generate embeddings for - /// The token to cancel the operation with + /// The parameters to generate embeddings for. + /// The token to cancel the operation with. + /// A task that represents the asynchronous operation. The task result contains the . Task EmbedAsync(EmbedRequest request, CancellationToken cancellationToken = default); /// - /// Sends a request to the /api/tags endpoint to get all models that are available locally + /// Sends a request to the /api/tags endpoint to get all models that are available locally. /// - /// The token to cancel the operation with + /// The token to cancel the operation with. + /// A task that represents the asynchronous operation. The task result contains a collection of . Task> ListLocalModelsAsync(CancellationToken cancellationToken = default); /// - /// Sends a request to the /api/ps endpoint to get the running models + /// Sends a request to the /api/ps endpoint to get the running models. /// - /// The token to cancel the operation with + /// The token to cancel the operation with. + /// A task that represents the asynchronous operation. The task result contains a collection of . Task> ListRunningModelsAsync(CancellationToken cancellationToken = default); /// - /// Sends a request to the /api/pull endpoint to pull a new model + /// Sends a request to the /api/pull endpoint to pull a new model. /// - /// The request specifying the model name and whether to use insecure connection - /// The token to cancel the operation with + /// The request specifying the model name and whether to use an insecure connection. + /// The token to cancel the operation with. /// - /// Async enumerable of PullStatus objects representing the status of the - /// model pull operation + /// An asynchronous enumerable of objects representing the status of the + /// model pull operation. /// IAsyncEnumerable PullModelAsync(PullModelRequest request, [EnumeratorCancellation] CancellationToken cancellationToken = default); @@ -106,11 +108,11 @@ public interface IOllamaApiClient IAsyncEnumerable PushModelAsync(PushModelRequest request, [EnumeratorCancellation] CancellationToken cancellationToken = default); /// - /// Sends a request to the /api/show endpoint to show the information of a model + /// Sends a request to the /api/show endpoint to show the information of a model. /// - /// The request containing the name of the model the get the information for - /// The token to cancel the operation with - /// The model information + /// The request containing the name of the model to get the information for. + /// The token to cancel the operation with. + /// A task that represents the asynchronous operation. The task result contains the . Task ShowModelAsync(ShowModelRequest request, CancellationToken cancellationToken = default); /// @@ -118,18 +120,20 @@ public interface IOllamaApiClient /// /// The request containing the parameters for the completion. /// The token to cancel the operation with. - /// An asynchronous enumerable of completion response streams. + /// An asynchronous enumerable of . 
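+ /// <example>A minimal sketch, assuming a connected client with a selected model: <code>await foreach (var chunk in client.GenerateAsync(new GenerateRequest { Prompt = "Why is the sky blue?" })) Console.Write(chunk?.Response);</code></example>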
IAsyncEnumerable GenerateAsync(GenerateRequest request, [EnumeratorCancellation] CancellationToken cancellationToken = default); /// - /// Sends a query to check whether the Ollama api is running or not + /// Sends a query to check whether the Ollama API is running or not. /// - /// The token to cancel the operation with + /// The token to cancel the operation with. + /// A task that represents the asynchronous operation. The task result contains a boolean indicating whether the API is running. Task IsRunningAsync(CancellationToken cancellationToken = default); /// - /// Get the version of Ollama + /// Gets the version of Ollama. /// - /// The token to cancel the operation with + /// The token to cancel the operation with. + /// A task that represents the asynchronous operation. The task result contains the . Task GetVersionAsync(CancellationToken cancellationToken = default); } \ No newline at end of file diff --git a/src/MicrosoftAi/AbstractionMapper.cs b/src/MicrosoftAi/AbstractionMapper.cs index f9e1c1a..04e905e 100644 --- a/src/MicrosoftAi/AbstractionMapper.cs +++ b/src/MicrosoftAi/AbstractionMapper.cs @@ -12,13 +12,14 @@ namespace OllamaSharp.MicrosoftAi; /// /// Provides mapping functionality between OllamaSharp and Microsoft.Extensions.AI models. /// -public static class AbstractionMapper +internal static class AbstractionMapper { /// /// Maps a and to a . /// /// The response stream with completion data. /// The used model. This has to be a separate argument because there might be fallbacks from the calling method. + /// A object containing the mapped data. public static ChatCompletion? ToChatCompletion(ChatDoneResponseStream? stream, string? usedModel) { if (stream is null) @@ -40,21 +41,23 @@ public static class AbstractionMapper } /// - /// Converts Microsoft.Extensions.AI messages and options to an OllamaSharp chat request. + /// Converts Microsoft.Extensions.AI objects and + /// an option instance to an OllamaSharp . /// /// A list of chat messages. /// Optional chat options to configure the request. /// Indicates if the request should be streamed. /// Serializer options + /// A object containing the converted data. public static ChatRequest ToOllamaSharpChatRequest(IList chatMessages, ChatOptions? options, bool stream, JsonSerializerOptions serializerOptions) { var request = new ChatRequest { - Format = options?.ResponseFormat == ChatResponseFormat.Json ? "json" : null, + Format = Equals(options?.ResponseFormat, ChatResponseFormat.Json) ? "json" : null, KeepAlive = null, Messages = ToOllamaSharpMessages(chatMessages, serializerOptions), Model = options?.ModelId ?? "", // will be set OllamaApiClient.SelectedModel if not set - Options = new Models.RequestOptions + Options = new RequestOptions { FrequencyPenalty = options?.FrequencyPenalty, PresencePenalty = options?.PresencePenalty, @@ -115,7 +118,7 @@ public static ChatRequest ToOllamaSharpChatRequest(IList chatMessag /// The chat options from the Microsoft abstraction /// The Ollama setting to add /// The setter to set the Ollama option if available in the chat options - private static void TryAddOllamaOption(ChatOptions microsoftChatOptions, OllamaOption option, Action optionSetter) + private static void TryAddOllamaOption(ChatOptions? microsoftChatOptions, OllamaOption option, Action optionSetter) { if ((microsoftChatOptions?.AdditionalProperties?.TryGetValue(option.Name, out var value) ?? 
false) && value is not null) optionSetter(value); @@ -125,6 +128,7 @@ private static void TryAddOllamaOption(ChatOptions microsoftChatOptions, Olla /// Converts a collection of Microsoft.Extensions.AI. to a collection of OllamaSharp tools. /// /// The tools to convert. + /// An enumeration of objects containing the converted data. private static IEnumerable? ToOllamaSharpTools(IEnumerable? tools) { return tools?.Select(ToOllamaSharpTool) @@ -133,9 +137,13 @@ private static void TryAddOllamaOption(ChatOptions microsoftChatOptions, Olla } /// - /// Converts an Microsoft.Extensions.AI. to an OllamaSharp tool. + /// Converts a Microsoft.Extensions.AI. to an OllamaSharp . /// /// The tool to convert. + /// + /// If parseable, a object containing the converted data, + /// otherwise . + /// private static Tool? ToOllamaSharpTool(AITool tool) { if (tool is AIFunction f) @@ -148,7 +156,8 @@ private static void TryAddOllamaOption(ChatOptions microsoftChatOptions, Olla /// Converts to a . /// /// The function metadata to convert. - private static Tool? ToOllamaSharpTool(AIFunctionMetadata functionMetadata) + /// A object containing the converted data. + private static Tool ToOllamaSharpTool(AIFunctionMetadata functionMetadata) { return new Tool { @@ -176,7 +185,8 @@ private static void TryAddOllamaOption(ChatOptions microsoftChatOptions, Olla /// Converts parameter schema object to a function type string. /// /// The schema object holding schema type information. - private static IEnumerable? GetPossibleValues(JsonObject? schema) + /// A collection of strings containing the function types. + private static IEnumerable GetPossibleValues(JsonObject? schema) { return []; // TODO others supported? } @@ -185,6 +195,7 @@ private static void TryAddOllamaOption(ChatOptions microsoftChatOptions, Olla /// Converts parameter schema object to a function type string. /// /// The schema object holding schema type information. + /// A string containing the function type. private static string ToFunctionTypeString(JsonObject? schema) { return "string"; // TODO others supported? @@ -195,6 +206,7 @@ private static string ToFunctionTypeString(JsonObject? schema) /// /// The chat messages to convert. /// Serializer options + /// An enumeration of objects containing the converted data. private static IEnumerable ToOllamaSharpMessages(IList chatMessages, JsonSerializerOptions serializerOptions) { foreach (var cm in chatMessages) @@ -236,7 +248,8 @@ private static IEnumerable ToOllamaSharpMessages(IList cha /// Converts a Microsoft.Extensions.AI. to a base64 image string. /// /// The data content to convert. - private static string ToOllamaImage(ImageContent content) + /// A string containing the base64 image data. + private static string ToOllamaImage(ImageContent? content) { if (content is null) return string.Empty; @@ -251,6 +264,7 @@ private static string ToOllamaImage(ImageContent content) /// Converts a Microsoft.Extensions.AI. to a . /// /// The function call content to convert. + /// A object containing the converted data. private static Message.ToolCall ToOllamaSharpToolCall(FunctionCallContent functionCall) { return new Message.ToolCall @@ -267,14 +281,15 @@ private static Message.ToolCall ToOllamaSharpToolCall(FunctionCallContent functi /// Maps a to an . /// /// The chat role to map. + /// A object containing the mapped role. 
private static Models.Chat.ChatRole ToOllamaSharpRole(Microsoft.Extensions.AI.ChatRole role) { return role.Value switch { - "assistant" => OllamaSharp.Models.Chat.ChatRole.Assistant, - "system" => OllamaSharp.Models.Chat.ChatRole.System, - "user" => OllamaSharp.Models.Chat.ChatRole.User, - "tool" => OllamaSharp.Models.Chat.ChatRole.Tool, + "assistant" => Models.Chat.ChatRole.Assistant, + "system" => Models.Chat.ChatRole.System, + "user" => Models.Chat.ChatRole.User, + "tool" => Models.Chat.ChatRole.Tool, _ => new OllamaSharp.Models.Chat.ChatRole(role.Value), }; } @@ -283,6 +298,7 @@ private static Models.Chat.ChatRole ToOllamaSharpRole(Microsoft.Extensions.AI.Ch /// Maps an to a . /// /// The chat role to map. + /// A object containing the mapped role. private static Microsoft.Extensions.AI.ChatRole ToAbstractionRole(OllamaSharp.Models.Chat.ChatRole? role) { if (role is null) @@ -302,6 +318,7 @@ private static Microsoft.Extensions.AI.ChatRole ToAbstractionRole(OllamaSharp.Mo /// Converts a to a . /// /// The response stream to convert. + /// A object containing the latest chat completion chunk. public static StreamingChatCompletionUpdate ToStreamingChatCompletionUpdate(ChatResponseStream? response) { return new StreamingChatCompletionUpdate @@ -312,6 +329,7 @@ public static StreamingChatCompletionUpdate ToStreamingChatCompletionUpdate(Chat CreatedAt = response?.CreatedAt, FinishReason = response?.Done == true ? ChatFinishReason.Stop : null, RawRepresentation = response, + // TODO: Check if "Message" can ever actually be null. If not, remove the null-coalescing operator Text = response?.Message?.Content ?? string.Empty, Role = ToAbstractionRole(response?.Message?.Role), ModelId = response?.Model @@ -322,6 +340,7 @@ public static StreamingChatCompletionUpdate ToStreamingChatCompletionUpdate(Chat /// Converts a to a . /// /// The message to convert. + /// A object containing the converted data. public static ChatMessage ToChatMessage(Message message) { var contents = new List(); @@ -350,7 +369,8 @@ public static ChatMessage ToChatMessage(Message message) /// Parses additional properties from a . /// /// The response to parse. - private static AdditionalPropertiesDictionary? ParseOllamaChatResponseProps(ChatDoneResponseStream response) + /// An object containing the parsed additional properties. + private static AdditionalPropertiesDictionary ParseOllamaChatResponseProps(ChatDoneResponseStream response) { const double NANOSECONDS_PER_MILLISECOND = 1_000_000; @@ -367,7 +387,8 @@ public static ChatMessage ToChatMessage(Message message) /// Parses additional properties from a . /// /// The response to parse. - private static AdditionalPropertiesDictionary? ParseOllamaEmbedResponseProps(EmbedResponse response) + /// An object containing the parsed additional properties. + private static AdditionalPropertiesDictionary ParseOllamaEmbedResponseProps(EmbedResponse response) { const double NANOSECONDS_PER_MILLISECOND = 1_000_000; @@ -382,6 +403,7 @@ public static ChatMessage ToChatMessage(Message message) /// Maps a string representation of a finish reason to a . /// /// The finish reason string. + /// A object containing the chat finish reason. private static ChatFinishReason? ToFinishReason(string? ollamaDoneReason) { return ollamaDoneReason switch @@ -414,10 +436,11 @@ public static ChatMessage ToChatMessage(Message message) } /// - /// Gets an embedding request for the Ollama API + /// Gets an for the Ollama API. 
/// - /// The values to get embeddings for - /// The options for the embeddings + /// The values to get embeddings for. + /// The options for the embeddings. + /// An object containing the request data. public static EmbedRequest ToOllamaEmbedRequest(IEnumerable values, EmbeddingGenerationOptions? options) { var request = new EmbedRequest() @@ -439,13 +462,15 @@ public static EmbedRequest ToOllamaEmbedRequest(IEnumerable values, Embe } /// - /// Gets Microsoft GeneratedEmbeddings mapped from Ollama embeddings + /// Gets Microsoft GeneratedEmbeddings mapped from Ollama embeddings. /// - /// The original Ollama request that was used to generate the embeddings - /// The response from Ollama containing the embeddings + /// The original Ollama request that was used to generate the embeddings. + /// The response from Ollama containing the embeddings. /// The used model. This has to be a separate argument because there might be fallbacks from the calling method. + /// A object containing the mapped embeddings. public static GeneratedEmbeddings> ToGeneratedEmbeddings(EmbedRequest ollamaRequest, EmbedResponse ollamaResponse, string? usedModel) { + // TODO: Check if this can ever actually be null. If not, remove the null-coalescing operator var mapped = (ollamaResponse.Embeddings ?? []).Select(vector => new Embedding(vector) { CreatedAt = DateTimeOffset.UtcNow, diff --git a/src/MicrosoftAi/ChatOptionsExtensions.cs b/src/MicrosoftAi/ChatOptionsExtensions.cs index 8b50fc6..31fee77 100644 --- a/src/MicrosoftAi/ChatOptionsExtensions.cs +++ b/src/MicrosoftAi/ChatOptionsExtensions.cs @@ -12,11 +12,12 @@ public static class ChatOptionsExtensions { /// /// Adds Ollama specific options to the additional properties of ChatOptions. - /// These can be interpreted sent to the Ollama API by OllamaSharp. + /// These can be interpreted and sent to the Ollama API by OllamaSharp. /// /// The chat options to set Ollama options on /// The Ollama option to set, like OllamaOption.NumCtx for the option 'num_ctx' /// The value for the option + /// The with the Ollama option set public static ChatOptions AddOllamaOption(this ChatOptions chatOptions, OllamaOption option, object value) { chatOptions.AdditionalProperties ??= []; diff --git a/src/MicrosoftAi/IAsyncEnumerableExtensions.cs b/src/MicrosoftAi/IAsyncEnumerableExtensions.cs index 3cb2ff1..43bf37a 100644 --- a/src/MicrosoftAi/IAsyncEnumerableExtensions.cs +++ b/src/MicrosoftAi/IAsyncEnumerableExtensions.cs @@ -13,11 +13,11 @@ namespace OllamaSharp; public static partial class IAsyncEnumerableExtensions { /// - /// Streams a given IAsyncEnumerable of response chunks to its end and builds one single StreamingChatCompletionUpdate out of them. + /// Streams a given of response chunks to its end and builds one single out of them. /// - /// The IAsyncEnumerable to stream + /// The to stream /// An optional callback to additionally process every single item from the IAsyncEnumerable - /// A single StreamingChatCompletionUpdate built up from every single IAsyncEnumerable item + /// A single built up from every single IAsyncEnumerable item public static Task StreamToEndAsync(this IAsyncEnumerable stream, Action? 
itemCallback = null) => stream.StreamToEndAsync(new MicrosoftAi.StreamingChatCompletionUpdateAppender(), itemCallback); } diff --git a/src/MicrosoftAi/OllamaFunctionResultContent.cs b/src/MicrosoftAi/OllamaFunctionResultContent.cs index efe4853..e36f393 100644 --- a/src/MicrosoftAi/OllamaFunctionResultContent.cs +++ b/src/MicrosoftAi/OllamaFunctionResultContent.cs @@ -2,8 +2,21 @@ namespace OllamaSharp.MicrosoftAi; using System.Text.Json; +/// +/// A holder for the result of an Ollama function call. +/// internal sealed class OllamaFunctionResultContent { + /// + /// The function call ID for which this is the result. + /// public string? CallId { get; set; } + + /// + /// This element value may be if the function returned , + /// if the function was void-returning and thus had no result, or if the function call failed. + /// Typically, however, in order to provide meaningfully representative information to an AI service, + /// a human-readable representation of those conditions should be supplied. + /// public JsonElement Result { get; set; } } \ No newline at end of file diff --git a/src/MicrosoftAi/StreamingChatCompletionUpdateAppender.cs b/src/MicrosoftAi/StreamingChatCompletionUpdateAppender.cs index 906b44e..1ab216c 100644 --- a/src/MicrosoftAi/StreamingChatCompletionUpdateAppender.cs +++ b/src/MicrosoftAi/StreamingChatCompletionUpdateAppender.cs @@ -3,20 +3,22 @@ namespace OllamaSharp.MicrosoftAi; /// -/// Appender to stream IAsyncEnumerable(StreamingChatCompletionUpdate) to build up one single StreamingChatCompletionUpdate object +/// Appender to stream +/// to build up one consolidated object /// -public class StreamingChatCompletionUpdateAppender : IAppender +internal class StreamingChatCompletionUpdateAppender : IAppender { private readonly StreamingChatCompletionUpdateBuilder _messageBuilder = new(); /// - /// Appends a given StreamingChatCompletionUpdate item to build a single return object + /// Appends a given item to build a single return object /// /// The item to append public void Append(StreamingChatCompletionUpdate? item) => _messageBuilder.Append(item); /// - /// Builds up one single StreamingChatCompletionUpdate object from the previously streamed items + /// Builds up one final, single object from the previously streamed items /// + /// The completed, consolidated object public StreamingChatCompletionUpdate? Complete() => _messageBuilder.Complete(); } \ No newline at end of file diff --git a/src/MicrosoftAi/StreamingChatCompletionUpdateBuilder.cs b/src/MicrosoftAi/StreamingChatCompletionUpdateBuilder.cs index bc007d1..0a37613 100644 --- a/src/MicrosoftAi/StreamingChatCompletionUpdateBuilder.cs +++ b/src/MicrosoftAi/StreamingChatCompletionUpdateBuilder.cs @@ -5,9 +5,9 @@ namespace OllamaSharp.MicrosoftAi; /// -/// A builder that can append streamed completion updates to one single completion update +/// A builder that can append to one single completion update /// -public class StreamingChatCompletionUpdateBuilder +internal class StreamingChatCompletionUpdateBuilder { private readonly StringBuilder _contentBuilder = new(); private StreamingChatCompletionUpdate? _first; @@ -36,13 +36,16 @@ public void Append(StreamingChatCompletionUpdate? update) //_first.Contents and .Text will be set in Complete() with values collected from each update //_first.RawRepresentation makes no sense + // TODO: Check if this can ever be null. The docs imply not. 
if (update.Contents is not null) Contents.AddRange(update.Contents); } /// - /// Builds the final completion update out of the streamed updates that were appended before + /// Builds the final consolidated out of the streamed + /// updates that were appended before /// + /// The final consolidated object public StreamingChatCompletionUpdate? Complete() { if (_first is null) @@ -57,5 +60,6 @@ public void Append(StreamingChatCompletionUpdate? update) /// /// Gets or sets the list of all content elements received from completion updates /// + /// A of elements public List Contents { get; set; } = []; } \ No newline at end of file diff --git a/src/Models/CopyModel.cs b/src/Models/CopyModel.cs index c3676b2..164b88b 100644 --- a/src/Models/CopyModel.cs +++ b/src/Models/CopyModel.cs @@ -3,7 +3,8 @@ namespace OllamaSharp.Models; /// -/// https://github.com/jmorganca/ollama/blob/main/docs/api.md#copy-a-model +/// Copy a model. Creates a model with another name from an existing model. +/// Ollama API docs /// public class CopyModelRequest : OllamaRequest { diff --git a/src/Models/CreateModel.cs b/src/Models/CreateModel.cs index f40f470..4d18694 100644 --- a/src/Models/CreateModel.cs +++ b/src/Models/CreateModel.cs @@ -3,7 +3,14 @@ namespace OllamaSharp.Models; /// -/// https://github.com/jmorganca/ollama/blob/main/docs/api.md#create-a-model +/// Create a model from a Modelfile. It is recommended to set to the +/// content of the Modelfile rather than just set path. This is a requirement +/// for remote create. Remote model creation must also create any file blobs, +/// fields such as FROM and ADAPTER, explicitly with the server using Create a +/// Blob and the value to the path indicated in the response. +/// +/// Ollama API docs +/// /// [JsonUnmappedMemberHandling(JsonUnmappedMemberHandling.Skip)] public class CreateModelRequest : OllamaRequest diff --git a/src/Models/DeleteModel.cs b/src/Models/DeleteModel.cs index ff76be8..9d450c1 100644 --- a/src/Models/DeleteModel.cs +++ b/src/Models/DeleteModel.cs @@ -3,7 +3,9 @@ namespace OllamaSharp.Models; /// -/// https://github.com/jmorganca/ollama/blob/main/docs/api.md#delete-a-model +/// Delete a model and its data. +/// +/// Ollama API docs /// [JsonUnmappedMemberHandling(JsonUnmappedMemberHandling.Skip)] public class DeleteModelRequest : OllamaRequest diff --git a/src/Models/Embed.cs b/src/Models/Embed.cs index 1c39a24..2d58ca7 100644 --- a/src/Models/Embed.cs +++ b/src/Models/Embed.cs @@ -4,7 +4,9 @@ namespace OllamaSharp.Models; /// -/// https://github.com/jmorganca/ollama/blob/main/docs/api.md#generate-embeddings +/// Generate embeddings from a model. +/// +/// Ollama API docs /// public class EmbedRequest : OllamaRequest { diff --git a/src/Models/Generate.cs b/src/Models/Generate.cs index 3aa1fa7..f42b8e2 100644 --- a/src/Models/Generate.cs +++ b/src/Models/Generate.cs @@ -4,7 +4,11 @@ namespace OllamaSharp.Models; /// -/// https://github.com/jmorganca/ollama/blob/main/docs/api.md#generate-a-completion +/// Generate a response for a given prompt with a provided model. This is a +/// streaming endpoint, so there will be a series of responses. The final +/// response object will include statistics and additional data from the request. 
+/// +/// Ollama API docs /// public class GenerateRequest : OllamaRequest { diff --git a/src/Models/ListModels.cs b/src/Models/ListModels.cs index 8b7ddaa..72a888b 100644 --- a/src/Models/ListModels.cs +++ b/src/Models/ListModels.cs @@ -5,8 +5,9 @@ namespace OllamaSharp.Models; /// -/// Represents the response from the API call to list local models. -/// +/// List models that are available locally. +/// +/// Ollama API docs /// public class ListModelsResponse { diff --git a/src/Models/ListRunningModels.cs b/src/Models/ListRunningModels.cs index bd17cb8..682a376 100644 --- a/src/Models/ListRunningModels.cs +++ b/src/Models/ListRunningModels.cs @@ -5,7 +5,9 @@ namespace OllamaSharp.Models; /// -/// A response from the /api/ps endpoint. +/// List models that are currently loaded into memory. +/// +/// Ollama API docs /// [JsonUnmappedMemberHandling(JsonUnmappedMemberHandling.Skip)] public class ListRunningModelsResponse diff --git a/src/Models/PullModel.cs b/src/Models/PullModel.cs index c3d30b0..69b1953 100644 --- a/src/Models/PullModel.cs +++ b/src/Models/PullModel.cs @@ -3,8 +3,10 @@ namespace OllamaSharp.Models; /// -/// Represents a request to pull a model from the API. -/// +/// Download a model from the ollama library. Cancelled pulls are resumed from +/// where they left off, and multiple calls will share the same download progress. +/// +/// Ollama API docs /// public class PullModelRequest : OllamaRequest { diff --git a/src/Models/PushModel.cs b/src/Models/PushModel.cs index 67b4c24..61495f0 100644 --- a/src/Models/PushModel.cs +++ b/src/Models/PushModel.cs @@ -3,7 +3,10 @@ namespace OllamaSharp.Models; /// -/// Represents a request to push a model. +/// Upload a model to a model library. Requires registering for ollama.ai and +/// adding a public key first. +/// +/// Ollama API docs /// public class PushModelRequest : OllamaRequest { diff --git a/src/Models/ShowModel.cs b/src/Models/ShowModel.cs index 72a61d0..d77cdb2 100644 --- a/src/Models/ShowModel.cs +++ b/src/Models/ShowModel.cs @@ -4,7 +4,10 @@ namespace OllamaSharp.Models; /// -/// Represents a request to show model information. +/// Show information about a model including details, modelfile, template, +/// parameters, license, system prompt. +/// +/// Ollama API docs /// [JsonUnmappedMemberHandling(JsonUnmappedMemberHandling.Skip)] public class ShowModelRequest : OllamaRequest diff --git a/src/OllamaApiClient.cs b/src/OllamaApiClient.cs index 982ad31..249a6f4 100644 --- a/src/OllamaApiClient.cs +++ b/src/OllamaApiClient.cs @@ -52,7 +52,7 @@ public class OllamaApiClient : IOllamaApiClient, IChatClient, IEmbeddingGenerato public string SelectedModel { get; set; } /// - /// Gets the HTTP client that is used to communicate with the Ollama API. + /// Gets the used to communicate with the Ollama API. /// private readonly HttpClient _client; @@ -221,7 +221,8 @@ public async Task IsRunningAsync(CancellationToken cancellationToken = def public async Task GetVersionAsync(CancellationToken cancellationToken = default) { var data = await GetAsync("api/version", cancellationToken).ConfigureAwait(false); - return Version.Parse(data["version"]?.ToString()); + var versionString = data["version"]?.ToString() ?? 
throw new InvalidOperationException("Could not get version from response."); + return Version.Parse(versionString); } private async IAsyncEnumerable GenerateCompletionAsync(GenerateRequest generateRequest, [EnumeratorCancellation] CancellationToken cancellationToken) diff --git a/src/OllamaApiClientExtensions.cs b/src/OllamaApiClientExtensions.cs index 7d1dc13..e5000d1 100644 --- a/src/OllamaApiClientExtensions.cs +++ b/src/OllamaApiClientExtensions.cs @@ -17,6 +17,7 @@ public static class OllamaApiClientExtensions /// The name of the existing model to copy. /// The name the copied model should get. /// The token to cancel the operation with. + /// A task that represents the asynchronous operation. public static Task CopyModelAsync(this IOllamaApiClient client, string source, string destination, CancellationToken cancellationToken = default) => client.CopyModelAsync(new CopyModelRequest { Source = source, Destination = destination }, cancellationToken); @@ -30,6 +31,7 @@ public static Task CopyModelAsync(this IOllamaApiClient client, string source, s /// See . /// /// The token to cancel the operation with. + /// An async enumerable that can be used to iterate over the streamed responses. See . public static IAsyncEnumerable CreateModelAsync(this IOllamaApiClient client, string name, string modelFileContent, CancellationToken cancellationToken = default) { var request = new CreateModelRequest @@ -52,6 +54,7 @@ public static Task CopyModelAsync(this IOllamaApiClient client, string source, s /// /// The name path to the model file. /// The token to cancel the operation with. + /// An async enumerable that can be used to iterate over the streamed responses. See . public static IAsyncEnumerable CreateModelAsync(this IOllamaApiClient client, string name, string modelFileContent, string path, CancellationToken cancellationToken = default) { var request = new CreateModelRequest @@ -70,6 +73,7 @@ public static Task CopyModelAsync(this IOllamaApiClient client, string source, s /// The client used to execute the command. /// The name of the model to delete. /// The token to cancel the operation with. + /// A task that represents the asynchronous operation. public static Task DeleteModelAsync(this IOllamaApiClient client, string model, CancellationToken cancellationToken = default) => client.DeleteModelAsync(new DeleteModelRequest { Model = model }, cancellationToken); @@ -79,6 +83,7 @@ public static Task DeleteModelAsync(this IOllamaApiClient client, string model, /// The client used to execute the command. /// The name of the model to pull. /// The token to cancel the operation with. + /// An async enumerable that can be used to iterate over the streamed responses. See . public static IAsyncEnumerable PullModelAsync(this IOllamaApiClient client, string model, CancellationToken cancellationToken = default) => client.PullModelAsync(new PullModelRequest { Model = model }, cancellationToken); @@ -88,6 +93,7 @@ public static Task DeleteModelAsync(this IOllamaApiClient client, string model, /// The client used to execute the command. /// The name of the model to push. /// The token to cancel the operation with. + /// An async enumerable that can be used to iterate over the streamed responses. See . 
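+ /// <example>A sketch, assuming the model was already tagged for a registry account (the name is illustrative): <code>await foreach (var status in client.PushModelAsync("myaccount/mymodel:latest")) Console.WriteLine(status);</code></example>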
public static IAsyncEnumerable PushModelAsync(this IOllamaApiClient client, string name, CancellationToken cancellationToken = default) => client.PushModelAsync(new PushModelRequest { Model = name, Stream = true }, cancellationToken); @@ -97,6 +103,7 @@ public static Task DeleteModelAsync(this IOllamaApiClient client, string model, /// The client used to execute the command. /// The input text to generate embeddings for. /// The token to cancel the operation with. + /// An EmbedResponse containing the embeddings. public static Task EmbedAsync(this IOllamaApiClient client, string input, CancellationToken cancellationToken = default) { var request = new EmbedRequest @@ -118,7 +125,7 @@ public static Task EmbedAsync(this IOllamaApiClient client, strin /// Should reuse the result from earlier calls if these calls belong together. Can be null initially. /// /// The token to cancel the operation with. - /// An async enumerable that can be used to iterate over the streamed responses. + /// An async enumerable that can be used to iterate over the streamed responses. See GenerateResponseStream. public static IAsyncEnumerable GenerateAsync(this IOllamaApiClient client, string prompt, ConversationContext? context = null, CancellationToken cancellationToken = default) { var request = new GenerateRequest @@ -137,7 +144,7 @@ public static Task EmbedAsync(this IOllamaApiClient client, strin /// The client used to execute the command. /// The name of the model to get the information for. /// The token to cancel the operation with. - /// The model information. + /// A task that represents the asynchronous operation. The task result contains the ShowModelResponse with the model information. public static Task ShowModelAsync(this IOllamaApiClient client, string model, CancellationToken cancellationToken = default) => client.ShowModelAsync(new ShowModelRequest { Model = model }, cancellationToken); } diff --git a/src/OllamaSharp.csproj b/src/OllamaSharp.csproj index 04c8775..65f4ed5 100644 --- a/src/OllamaSharp.csproj +++ b/src/OllamaSharp.csproj @@ -37,9 +37,14 @@ + + + <_Parameter1>Tests, PublicKey=0024000004800000940000000602000000240000525341310004000001000100a171f1618f5d4caf94ac5e1323ed80e3e2b686509951a686b66491108cf673ec16a8507ae06e7a4cc81ac14b057659e84401f1d56e17023037c160f4e3e35f6de81c479a778c78a184d15b4ccce943d2202eeeaec0c63028e1061ef5ca236b7a7d7fc52eef66d1fc65ebb89560b8dffb2353dfd2394ef2b1ec41bc3accab7df0 + + + - - + \ No newline at end of file diff --git a/test/FunctionalTests/ChatTests.cs b/test/FunctionalTests/ChatTests.cs new file mode 100644 index 0000000..9bd8368 --- /dev/null +++ b/test/FunctionalTests/ChatTests.cs @@ -0,0 +1,53 @@ +using FluentAssertions; +using Microsoft.Extensions.AI; +using NUnit.Framework; +using OllamaSharp; + +namespace Tests.FunctionalTests; + +public class ChatTests +{ + private readonly Uri _baseUri = new("http://localhost:11434"); + private readonly string _model = "llama3.2:1b"; + +#pragma warning disable NUnit1032 + private OllamaApiClient _client = null!; + private Chat _chat = null!; +#pragma warning restore NUnit1032 + + [SetUp] + public async Task Setup() + { + _client = new OllamaApiClient(_baseUri); + _chat = new Chat(_client); + + var modelExists = (await _client.ListLocalModelsAsync()).Any(m => m.Name == _model); + if (!modelExists) + await _client.PullModelAsync(_model).ToListAsync(); + } + + [TearDown] + public Task Teardown() + { + ((IChatClient?)_client)?.Dispose(); + return Task.CompletedTask; + } + + + [Test] + public async Task SendAsync_ShouldSucceed() + { + _client.SelectedModel = _model; + + var response = await _chat + .SendAsync("What is the ultimate answer to " + + "life, the universe, and everything, as specified in " + + "The Hitchhiker's Guide to the Galaxy. " + + "Provide only the answer.", + CancellationToken.None) + .StreamToEndAsync(); + + response.Should().NotBeNullOrEmpty(); + response.Should().ContainAny("42", "forty-two", "forty two"); + } +} \ No newline at end of file diff --git a/test/FunctionalTests/OllamaApiClientTests.cs b/test/FunctionalTests/OllamaApiClientTests.cs new file mode 100644 index 0000000..9da4348 --- /dev/null +++ b/test/FunctionalTests/OllamaApiClientTests.cs @@ -0,0 +1,262 @@ +using FluentAssertions; +using Microsoft.Extensions.AI; +using NUnit.Framework; +using OllamaSharp; +using OllamaSharp.Models; +using OllamaSharp.Models.Chat; +using ChatRole = OllamaSharp.Models.Chat.ChatRole; + +namespace Tests.FunctionalTests; + +public class OllamaApiClientTests +{ + private readonly Uri _baseUri = new("http://localhost:11434"); + private readonly string _model = "llama3.2:1b"; + private readonly string _localModel = "OllamaSharpTest"; + private readonly string _embeddingModel = "all-minilm:22m"; + +#pragma warning disable NUnit1032 + private OllamaApiClient _client = null!; +#pragma warning restore NUnit1032 + + [SetUp] + public async Task Setup() + { + _client = new OllamaApiClient(_baseUri); + await CleanupModel(_localModel); + } + + [TearDown] + public async Task Teardown() + { + await CleanupModel(_localModel); + ((IChatClient?)_client)?.Dispose(); + } + + private async Task CleanupModel(string? model = null) + { + var modelExists = (await _client.ListLocalModelsAsync()).Any(m => m.Name == (model ?? _model)); + + if (modelExists) + await _client.DeleteModelAsync(new DeleteModelRequest { Model = model ?? _model }); + } + + private async Task PullIfNotExists(string model) + { + var modelExists = (await _client.ListLocalModelsAsync()).Any(m => m.Name == model); + + if (!modelExists) + await _client.PullModelAsync(new PullModelRequest { Model = model }).ToListAsync(); + } + + + [Test, Order(1), Ignore("Prevent the model from being downloaded each test run")] + public async Task PullModel() + { + var response = await _client + .PullModelAsync(new PullModelRequest { Model = _model }) + .ToListAsync(); + + var models = await _client.ListLocalModelsAsync(); + models.Should().Contain(m => m.Name == _model); + + response.Should().NotBeEmpty(); + response.Should().Contain(r => r!.Status == "pulling manifest"); + response.Should().Contain(r => r!.Status == "success"); + } + + [Test, Order(2)] + public async Task CreateModel() + { + await PullIfNotExists(_localModel); + + var model = new CreateModelRequest + { + Model = _localModel, + ModelFileContent = + """ + FROM llama3.2 + PARAMETER temperature 0.3 + PARAMETER num_ctx 100 + + # sets a custom system message to specify the behavior of the chat assistant + SYSTEM You are a concise model that tries to return yes or no answers. 
+ """ + }; + + var response = await _client + .CreateModelAsync(model) + .ToListAsync(); + + var models = await _client.ListLocalModelsAsync(); + models.Should().Contain(m => m.Name.StartsWith(_localModel)); + + response.Should().NotBeEmpty(); + response.Should().Contain(r => r!.Status == "success"); + } + + [Test, Order(3)] + public async Task CopyModel() + { + await PullIfNotExists(_localModel); + + var model = new CopyModelRequest { Source = _localModel, Destination = $"{_localModel}-copy" }; + + await _client.CopyModelAsync(model); + + var models = await _client.ListLocalModelsAsync(); + models.Should().Contain(m => m.Name == $"{_localModel}-copy:latest"); + + await _client.DeleteModelAsync(new DeleteModelRequest { Model = $"{_localModel}-copy:latest" }); + } + + [Test] + public async Task Embed() + { + await PullIfNotExists(_embeddingModel); + + var request = new EmbedRequest { Model = _embeddingModel, Input = ["Hello, world!"] }; + + var response = await _client.EmbedAsync(request); + + response.Should().NotBeNull(); + response.Embeddings.Should().NotBeEmpty(); + response.LoadDuration.Should().BeGreaterThan(100, "Because loading the model should take some time"); + response.TotalDuration.Should().BeGreaterThan(100, "Because generating embeddings should take some time"); + } + + [Test] + public async Task ListLocalModels() + { + var models = (await _client.ListLocalModelsAsync()).ToList(); + + models.Should().NotBeEmpty(); + models.Should().Contain(m => m.Name == _model); + } + + [Test] + public async Task ListRunningModels() + { + await PullIfNotExists(_model); + var backgroundTask = Task.Run(async () => + { + var generate = _client + .GenerateAsync(new GenerateRequest { Model = _model, Prompt = "Write a long song." }) + .ToListAsync(); + + await Task.Yield(); + + await generate; + }); + + var modelsTask = _client.ListRunningModelsAsync(); + await Task.WhenAll(backgroundTask, modelsTask); + + var models = modelsTask.Result.ToList(); + models.Should().NotBeEmpty(); + models.Should().Contain(m => m.Name == _model); + } + + [Test] + public async Task ShowModel() + { + await PullIfNotExists(_model); + + var response = await _client.ShowModelAsync(new ShowModelRequest { Model = _model }); + + response.Should().NotBeNull(); + response.Info.Should().NotBeNull(); + response.Info.Architecture.Should().Be("llama"); + response.Details.Should().NotBeNull(); + response.Details.Format.Should().NotBeNullOrEmpty(); + response.Details.Family.Should().Be("llama"); + } + + [Test] + public async Task DeleteModel() + { + await PullIfNotExists(_localModel); + await _client.CopyModelAsync(new CopyModelRequest + { + Source = _localModel, + Destination = $"{_localModel}-copy" + }); + + var exists = (await _client.ListLocalModelsAsync()).Any(m => m.Name == $"{_localModel}-copy:latest"); + + exists.Should().BeTrue(); + + await _client.DeleteModelAsync(new DeleteModelRequest { Model = $"{_localModel}-copy:latest" }); + + var models = await _client.ListLocalModelsAsync(); + models.Should().NotContain(m => m.Name == $"{_localModel}-copy:latest"); + } + + [Test] + public async Task GenerateAsync() + { + await PullIfNotExists(_model); + + var response = await _client.GenerateAsync(new GenerateRequest + { + Model = _model, + Prompt = + "What is the meaning to life, the universe, and everything according to the Hitchhikers Guide to the Galaxy?" 
+ }) + .ToListAsync(); + + var joined = string.Join("", response.Select(r => r.Response)); + + response.Should().NotBeEmpty(); + joined.Should().Contain("42"); + } + + [Test] + public async Task ChatAsync() + { + await PullIfNotExists(_model); + + var response = await _client.ChatAsync(new ChatRequest + { + Model = _model, + Messages = new[] + { + new Message + { + Role = ChatRole.User, + Content = "What is the meaning to life, the universe, and everything according to the Hitchhikers Guide to the Galaxy?" + }, + new Message + { + Role = ChatRole.System, + Content = "According to the Hitchhikers Guide to the Galaxy, the meaning to life, the universe, and everything is 42." + }, + new Message + { + Role = ChatRole.User, + Content = "Who is the author of the Hitchhikers Guide to the Galaxy?" + } + } + }) + .ToListAsync(); + + var joined = string.Join("", response.Select(r => r.Message.Content)); + + response.Should().NotBeEmpty(); + joined.Should().Contain("Douglas Adams"); + } + + [Test] + public async Task IsRunningAsync() + { + var response = await _client.IsRunningAsync(); + response.Should().BeTrue(); + } + + [Test] + public async Task GetVersionAsync() + { + var response = await _client.GetVersionAsync(); + response.Should().NotBeNull(); + } +} \ No newline at end of file diff --git a/test/OllamaApiClientTests.cs b/test/OllamaApiClientTests.cs index 44a4cda..eb5e360 100644 --- a/test/OllamaApiClientTests.cs +++ b/test/OllamaApiClientTests.cs @@ -1,525 +1,524 @@ -using System.IO; -using System.Net; -using System.Text; -using System.Text.Json; -using FluentAssertions; -using Microsoft.Extensions.AI; -using Moq; -using Moq.Protected; -using NUnit.Framework; -using OllamaSharp; -using OllamaSharp.Models; -using OllamaSharp.Models.Chat; -using OllamaSharp.Models.Exceptions; -using ChatRole = OllamaSharp.Models.Chat.ChatRole; - -namespace Tests; - -public class OllamaApiClientTests -{ - private OllamaApiClient _client; - private HttpResponseMessage? _response; - private HttpRequestMessage? _request; - private string? _requestContent; - private Dictionary? _expectedRequestHeaders; - - [OneTimeSetUp] - public void OneTimeSetUp() - { - var mockHandler = new Mock(MockBehavior.Strict); - - mockHandler - .Protected() - .Setup>( - "SendAsync", - ItExpr.Is(r => ValidateExpectedRequestHeaders(r)), - ItExpr.IsAny()) - .ReturnsAsync(() => _response); - - var httpClient = new HttpClient(mockHandler.Object) { BaseAddress = new Uri("http://empty") }; - _client = new OllamaApiClient(httpClient); - - _client.DefaultRequestHeaders["default_header"] = "ok"; - } - - [SetUp] - public void SetUp() - { - _expectedRequestHeaders = null; - } - - [OneTimeTearDown] - public void OneTimeTearDown() - { - ((IDisposable)_client).Dispose(); - } - - /// - /// Validates if the http request message has the same headers as defined in _expectedRequestHeaders. - /// This method does nothing if _expectedRequestHeaders is null. 
- /// - private bool ValidateExpectedRequestHeaders(HttpRequestMessage request) - { - _request = request; - _requestContent = request.Content?.ReadAsStringAsync().GetAwaiter().GetResult(); - - if (_expectedRequestHeaders is null) - return true; - - if (_expectedRequestHeaders.Count != request.Headers.Count()) - throw new InvalidOperationException($"Expected {_expectedRequestHeaders.Count} request header(s) but found {request.Headers.Count()}!"); - - foreach (var expectedHeader in _expectedRequestHeaders) - { - if (!request.Headers.Contains(expectedHeader.Key)) - throw new InvalidOperationException($"Expected request header '{expectedHeader.Key}' was not found!"); - - var actualHeaderValue = request.Headers.GetValues(expectedHeader.Key).Single(); - if (!string.Equals(actualHeaderValue, expectedHeader.Value)) - throw new InvalidOperationException($"Request request header '{expectedHeader.Key}' has value '{actualHeaderValue}' while '{expectedHeader.Value}' was expected!"); - } - - return true; - } - - public class CreateModelMethod : OllamaApiClientTests - { - [Test, NonParallelizable] - public async Task Streams_Status_Updates() - { - await using var stream = new MemoryStream(); - - _response = new HttpResponseMessage - { - StatusCode = HttpStatusCode.OK, - Content = new StreamContent(stream) - }; - - await using var writer = new StreamWriter(stream, leaveOpen: true); - writer.AutoFlush = true; - await writer.WriteLineAsync("{\"status\": \"Creating model\"}"); - await writer.WriteLineAsync("{\"status\": \"Downloading model\"}"); - await writer.WriteLineAsync("{\"status\": \"Model created\"}"); - stream.Seek(0, SeekOrigin.Begin); - - var builder = new StringBuilder(); - var modelStream = _client.CreateModelAsync(new CreateModelRequest(), CancellationToken.None); - - await foreach (var status in modelStream) - builder.Append(status?.Status); - - builder.ToString().Should().Be("Creating modelDownloading modelModel created"); - } - - /// - /// Applies to all methods on the OllamaApiClient - /// - [Test, NonParallelizable] - public async Task Sends_Default_Request_Headers() - { - _expectedRequestHeaders = new Dictionary - { - ["default_header"] = "ok" // set as default on the OllamaApiClient (see above) - }; - - _response = new HttpResponseMessage - { - StatusCode = HttpStatusCode.OK, - Content = new StreamContent(new MemoryStream()) - }; - - var builder = new StringBuilder(); - await foreach (var status in _client.CreateModelAsync(new CreateModelRequest(), CancellationToken.None)) - builder.Append(status?.Status); - - builder.Length.Should().Be(0); // assert anything, the test will fail if the expected headers are not available - } - - /// - /// Applies to all methods on the OllamaApiClient - /// - [Test, NonParallelizable] - public async Task Sends_Custom_Request_Headers() - { - _expectedRequestHeaders = new Dictionary - { - ["default_header"] = "ok", // set as default on the OllamaApiClient (see above) - ["api_method"] = "create" // set as custom request header (see below) - }; - - _response = new HttpResponseMessage - { - StatusCode = HttpStatusCode.OK, - Content = new StreamContent(new MemoryStream()) - }; - - var request = new CreateModelRequest(); - request.CustomHeaders["api_method"] = "create"; // set custom request headers - - var builder = new StringBuilder(); - await foreach (var status in _client.CreateModelAsync(request, CancellationToken.None)) - builder.Append(status?.Status); - - builder.Length.Should().Be(0); // assert anything, the test will fail if the expected headers are not 
available - } - - /// - /// Applies to all methods on the OllamaApiClient - /// - [Test, NonParallelizable] - public async Task Overwrites_Http_Headers() - { - _expectedRequestHeaders = new Dictionary - { - ["default_header"] = "overwritten" // default header value on the OllamaApiClient is 1, but it's overwritten below - }; - - _response = new HttpResponseMessage - { - StatusCode = HttpStatusCode.OK, - Content = new StreamContent(new MemoryStream()) - }; - - var request = new CreateModelRequest(); - request.CustomHeaders["default_header"] = "overwritten"; // overwrites the default header defined on the OllamaApiClient - - var builder = new StringBuilder(); - await foreach (var status in _client.CreateModelAsync(request, CancellationToken.None)) - builder.Append(status?.Status); - - builder.Length.Should().Be(0); // assert anything, the test will fail if the expected headers are not available - } - } - - public class GenerateMethod : OllamaApiClientTests - { - [Test, NonParallelizable] - public async Task Returns_Streamed_Responses_At_Once() - { - await using var stream = new MemoryStream(); - - _response = new HttpResponseMessage - { - StatusCode = HttpStatusCode.OK, - Content = new StreamContent(stream) - }; - - await using var writer = new StreamWriter(stream, leaveOpen: true); - writer.AutoFlush = true; - await writer.WriteCompletionStreamResponse("The "); - await writer.WriteCompletionStreamResponse("sky "); - await writer.WriteCompletionStreamResponse("is "); - await writer.FinishCompletionStreamResponse("blue.", context: [1, 2, 3]); - stream.Seek(0, SeekOrigin.Begin); - - var context = await _client.GenerateAsync("prompt").StreamToEndAsync(); - - context.Should().NotBeNull(); - context.Response.Should().Be("The sky is blue."); - var expectation = new int[] { 1, 2, 3 }; - context.Context.Should().BeEquivalentTo(expectation); - } - } - - public class CompleteMethod : OllamaApiClientTests - { - [Test, NonParallelizable] - public async Task Sends_Parameters_With_Request() - { - var payload = """ - { - "model": "llama2", - "created_at": "2024-07-12T12:34:39.63897616Z", - "message": { - "role": "assistant", - "content": "Test content." 
- }, - "done_reason": "stop", - "done": true, - "total_duration": 137729492272, - "load_duration": 133071702768, - "prompt_eval_count": 26, - "prompt_eval_duration": 35137000, - "eval_count": 323, - "eval_duration": 4575154000 - } - """.ReplaceLineEndings(""); // the JSON stream reader reads by line, so we need to make this one single line - - await using var stream = new MemoryStream(); - - await using var writer = new StreamWriter(stream, leaveOpen: true); - writer.AutoFlush = true; - await writer.WriteAsync(payload); - stream.Seek(0, SeekOrigin.Begin); - - _response = new HttpResponseMessage - { - StatusCode = HttpStatusCode.OK, - Content = new StreamContent(stream) - }; - - List chatHistory = []; - chatHistory.Add(new(Microsoft.Extensions.AI.ChatRole.User, "Why?")); - chatHistory.Add(new(Microsoft.Extensions.AI.ChatRole.Assistant, "Because!")); - chatHistory.Add(new(Microsoft.Extensions.AI.ChatRole.User, "And where?")); - - var chatClient = _client as Microsoft.Extensions.AI.IChatClient; - - var options = new ChatOptions - { - ModelId = "model", - TopP = 100, - TopK = 50, - Temperature = 0.5f, - FrequencyPenalty = 0.1f, - PresencePenalty = 0.2f, - StopSequences = ["stop me"], - }; - - await chatClient.CompleteAsync(chatHistory, options, CancellationToken.None); - - _request.Should().NotBeNull(); - _requestContent.Should().NotBeNull(); - - _requestContent.Should().Contain("Why?"); - _requestContent.Should().Contain("Because!"); - _requestContent.Should().Contain("And where?"); - _requestContent.Should().Contain("\"top_p\":100"); - _requestContent.Should().Contain("\"top_k\":50"); - _requestContent.Should().Contain("\"temperature\":0.5"); - _requestContent.Should().Contain("\"frequency_penalty\":0.1"); - _requestContent.Should().Contain("\"presence_penalty\":0.2"); - _requestContent.Should().Contain("\"stop\":[\"stop me\"]"); - - // Ensure that the request does not contain any other properties when not provided. - _requestContent.Should().NotContain("tools"); - _requestContent.Should().NotContain("tool_calls"); - _requestContent.Should().NotContain("images"); - } - } - - public class ChatMethod : OllamaApiClientTests - { - [Test, NonParallelizable] - public async Task Receives_Response_Message_With_Metadata() - { - var payload = """ - { - "model": "llama2", - "created_at": "2024-07-12T12:34:39.63897616Z", - "message": { - "role": "assistant", - "content": "Test content." 
- }, - "done_reason": "stop", - "done": true, - "total_duration": 137729492272, - "load_duration": 133071702768, - "prompt_eval_count": 26, - "prompt_eval_duration": 35137000, - "eval_count": 323, - "eval_duration": 4575154000 - } - """.ReplaceLineEndings(""); // the JSON stream reader reads by line, so we need to make this one single line - - await using var stream = new MemoryStream(); - - await using var writer = new StreamWriter(stream, leaveOpen: true); - writer.AutoFlush = true; - await writer.WriteAsync(payload); - stream.Seek(0, SeekOrigin.Begin); - - _response = new HttpResponseMessage - { - StatusCode = HttpStatusCode.OK, - Content = new StreamContent(stream) - }; - - var chat = new ChatRequest - { - Model = "model", - Messages = [ - new(ChatRole.User, "Why?"), - new(ChatRole.Assistant, "Because!"), - new(ChatRole.User, "And where?")] - }; - - var result = await _client.ChatAsync(chat, CancellationToken.None).StreamToEndAsync(); - - result.Should().NotBeNull(); - result.Message.Role.Should().Be(ChatRole.Assistant); - result.Message.Content.Should().Be("Test content."); - result.Done.Should().BeTrue(); - result.DoneReason.Should().Be("stop"); - result.TotalDuration.Should().Be(137729492272); - result.LoadDuration.Should().Be(133071702768); - result.PromptEvalCount.Should().Be(26); - result.PromptEvalDuration.Should().Be(35137000); - result.EvalCount.Should().Be(323); - result.EvalDuration.Should().Be(4575154000); - } - - [Test, NonParallelizable] - public async Task Receives_Response_Message_With_ToolsCalls() - { - var payload = """ - { - "model": "llama3.1:latest", - "created_at": "2024-09-01T16:12:28.639564938Z", - "message": { - "role": "assistant", - "content": "", - "tool_calls": [ - { - "function": { - "name": "get_current_weather", - "arguments": { - "format": "celsius", - "location": "Los Angeles, CA", - "number": 42 - } - } - } - ] - }, - "done_reason": "stop", - "done": true, - "total_duration": 24808639002, - "load_duration": 5084890970, - "prompt_eval_count": 311, - "prompt_eval_duration": 15120086000, - "eval_count": 28, - "eval_duration": 4602334000 - } +using System.Net; +using System.Text; +using System.Text.Json; +using FluentAssertions; +using Microsoft.Extensions.AI; +using Moq; +using Moq.Protected; +using NUnit.Framework; +using OllamaSharp; +using OllamaSharp.Models; +using OllamaSharp.Models.Chat; +using OllamaSharp.Models.Exceptions; +using ChatRole = OllamaSharp.Models.Chat.ChatRole; + +namespace Tests; + +public class OllamaApiClientTests +{ + private OllamaApiClient _client; + private HttpResponseMessage? _response; + private HttpRequestMessage? _request; + private string? _requestContent; + private Dictionary? _expectedRequestHeaders; + + [OneTimeSetUp] + public void OneTimeSetUp() + { + var mockHandler = new Mock(MockBehavior.Strict); + + mockHandler + .Protected() + .Setup>( + "SendAsync", + ItExpr.Is(r => ValidateExpectedRequestHeaders(r)), + ItExpr.IsAny()) + .ReturnsAsync(() => _response); + + var httpClient = new HttpClient(mockHandler.Object) { BaseAddress = new Uri("http://empty") }; + _client = new OllamaApiClient(httpClient); + + _client.DefaultRequestHeaders["default_header"] = "ok"; + } + + [SetUp] + public void SetUp() + { + _expectedRequestHeaders = null; + } + + [OneTimeTearDown] + public void OneTimeTearDown() + { + ((IDisposable)_client).Dispose(); + } + + /// + /// Validates if the http request message has the same headers as defined in _expectedRequestHeaders. + /// This method does nothing if _expectedRequestHeaders is null. 
+ /// + private bool ValidateExpectedRequestHeaders(HttpRequestMessage request) + { + _request = request; + _requestContent = request.Content?.ReadAsStringAsync().GetAwaiter().GetResult(); + + if (_expectedRequestHeaders is null) + return true; + + if (_expectedRequestHeaders.Count != request.Headers.Count()) + throw new InvalidOperationException($"Expected {_expectedRequestHeaders.Count} request header(s) but found {request.Headers.Count()}!"); + + foreach (var expectedHeader in _expectedRequestHeaders) + { + if (!request.Headers.Contains(expectedHeader.Key)) + throw new InvalidOperationException($"Expected request header '{expectedHeader.Key}' was not found!"); + + var actualHeaderValue = request.Headers.GetValues(expectedHeader.Key).Single(); + if (!string.Equals(actualHeaderValue, expectedHeader.Value)) + throw new InvalidOperationException($"Request header '{expectedHeader.Key}' has value '{actualHeaderValue}' while '{expectedHeader.Value}' was expected!"); + } + + return true; + } + + public class CreateModelMethod : OllamaApiClientTests + { + [Test, NonParallelizable] + public async Task Streams_Status_Updates() + { + await using var stream = new MemoryStream(); + + _response = new HttpResponseMessage + { + StatusCode = HttpStatusCode.OK, + Content = new StreamContent(stream) + }; + + await using var writer = new StreamWriter(stream, leaveOpen: true); + writer.AutoFlush = true; + await writer.WriteLineAsync("{\"status\": \"Creating model\"}"); + await writer.WriteLineAsync("{\"status\": \"Downloading model\"}"); + await writer.WriteLineAsync("{\"status\": \"Model created\"}"); + stream.Seek(0, SeekOrigin.Begin); + + var builder = new StringBuilder(); + var modelStream = _client.CreateModelAsync(new CreateModelRequest(), CancellationToken.None); + + await foreach (var status in modelStream) + builder.Append(status?.Status); + + builder.ToString().Should().Be("Creating modelDownloading modelModel created"); + } + + /// + /// Applies to all methods on the OllamaApiClient + /// + [Test, NonParallelizable] + public async Task Sends_Default_Request_Headers() + { + _expectedRequestHeaders = new Dictionary + { + ["default_header"] = "ok" // set as default on the OllamaApiClient (see above) + }; + + _response = new HttpResponseMessage + { + StatusCode = HttpStatusCode.OK, + Content = new StreamContent(new MemoryStream()) + }; + + var builder = new StringBuilder(); + await foreach (var status in _client.CreateModelAsync(new CreateModelRequest(), CancellationToken.None)) + builder.Append(status?.Status); + + builder.Length.Should().Be(0); // assert anything, the test will fail if the expected headers are not available + } + + /// + /// Applies to all methods on the OllamaApiClient + /// + [Test, NonParallelizable] + public async Task Sends_Custom_Request_Headers() + { + _expectedRequestHeaders = new Dictionary + { + ["default_header"] = "ok", // set as default on the OllamaApiClient (see above) + ["api_method"] = "create" // set as custom request header (see below) + }; + + _response = new HttpResponseMessage + { + StatusCode = HttpStatusCode.OK, + Content = new StreamContent(new MemoryStream()) + }; + + var request = new CreateModelRequest(); + request.CustomHeaders["api_method"] = "create"; // set custom request headers + + var builder = new StringBuilder(); + await foreach (var status in _client.CreateModelAsync(request, CancellationToken.None)) + builder.Append(status?.Status); + + builder.Length.Should().Be(0); // assert anything, the test will fail if the expected headers are not available + } + + /// + /// Applies to all methods on the OllamaApiClient + /// + [Test, NonParallelizable] + public async Task Overwrites_Http_Headers() + { + _expectedRequestHeaders = new Dictionary + { + ["default_header"] = "overwritten" // default header value on the OllamaApiClient is "ok", but it's overwritten below + }; + + _response = new HttpResponseMessage + { + StatusCode = HttpStatusCode.OK, + Content = new StreamContent(new MemoryStream()) + }; + + var request = new CreateModelRequest(); + request.CustomHeaders["default_header"] = "overwritten"; // overwrites the default header defined on the OllamaApiClient + + var builder = new StringBuilder(); + await foreach (var status in _client.CreateModelAsync(request, CancellationToken.None)) + builder.Append(status?.Status); + + builder.Length.Should().Be(0); // assert anything, the test will fail if the expected headers are not available + } + } + + public class GenerateMethod : OllamaApiClientTests + { + [Test, NonParallelizable] + public async Task Returns_Streamed_Responses_At_Once() + { + await using var stream = new MemoryStream(); + + _response = new HttpResponseMessage + { + StatusCode = HttpStatusCode.OK, + Content = new StreamContent(stream) + }; + + await using var writer = new StreamWriter(stream, leaveOpen: true); + writer.AutoFlush = true; + await writer.WriteCompletionStreamResponse("The "); + await writer.WriteCompletionStreamResponse("sky "); + await writer.WriteCompletionStreamResponse("is "); + await writer.FinishCompletionStreamResponse("blue.", context: [1, 2, 3]); + stream.Seek(0, SeekOrigin.Begin); + + var context = await _client.GenerateAsync("prompt").StreamToEndAsync(); + + context.Should().NotBeNull(); + context.Response.Should().Be("The sky is blue."); + var expectation = new int[] { 1, 2, 3 }; + context.Context.Should().BeEquivalentTo(expectation); + } + } + + public class CompleteMethod : OllamaApiClientTests + { + [Test, NonParallelizable] + public async Task Sends_Parameters_With_Request() + { + var payload = """ + { + "model": "llama2", + "created_at": "2024-07-12T12:34:39.63897616Z", + "message": { + "role": "assistant", + "content": "Test content." 
+ }, + "done_reason": "stop", + "done": true, + "total_duration": 137729492272, + "load_duration": 133071702768, + "prompt_eval_count": 26, + "prompt_eval_duration": 35137000, + "eval_count": 323, + "eval_duration": 4575154000 + } + """.ReplaceLineEndings(""); // the JSON stream reader reads by line, so we need to make this one single line + + await using var stream = new MemoryStream(); + + await using var writer = new StreamWriter(stream, leaveOpen: true); + writer.AutoFlush = true; + await writer.WriteAsync(payload); + stream.Seek(0, SeekOrigin.Begin); + + _response = new HttpResponseMessage + { + StatusCode = HttpStatusCode.OK, + Content = new StreamContent(stream) + }; + + List chatHistory = []; + chatHistory.Add(new(Microsoft.Extensions.AI.ChatRole.User, "Why?")); + chatHistory.Add(new(Microsoft.Extensions.AI.ChatRole.Assistant, "Because!")); + chatHistory.Add(new(Microsoft.Extensions.AI.ChatRole.User, "And where?")); + + var chatClient = _client as Microsoft.Extensions.AI.IChatClient; + + var options = new ChatOptions + { + ModelId = "model", + TopP = 100, + TopK = 50, + Temperature = 0.5f, + FrequencyPenalty = 0.1f, + PresencePenalty = 0.2f, + StopSequences = ["stop me"], + }; + + await chatClient.CompleteAsync(chatHistory, options, CancellationToken.None); + + _request.Should().NotBeNull(); + _requestContent.Should().NotBeNull(); + + _requestContent.Should().Contain("Why?"); + _requestContent.Should().Contain("Because!"); + _requestContent.Should().Contain("And where?"); + _requestContent.Should().Contain("\"top_p\":100"); + _requestContent.Should().Contain("\"top_k\":50"); + _requestContent.Should().Contain("\"temperature\":0.5"); + _requestContent.Should().Contain("\"frequency_penalty\":0.1"); + _requestContent.Should().Contain("\"presence_penalty\":0.2"); + _requestContent.Should().Contain("\"stop\":[\"stop me\"]"); + + // Ensure that the request does not contain any other properties when not provided. + _requestContent.Should().NotContain("tools"); + _requestContent.Should().NotContain("tool_calls"); + _requestContent.Should().NotContain("images"); + } + } + + public class ChatMethod : OllamaApiClientTests + { + [Test, NonParallelizable] + public async Task Receives_Response_Message_With_Metadata() + { + var payload = """ + { + "model": "llama2", + "created_at": "2024-07-12T12:34:39.63897616Z", + "message": { + "role": "assistant", + "content": "Test content." 
+ }, + "done_reason": "stop", + "done": true, + "total_duration": 137729492272, + "load_duration": 133071702768, + "prompt_eval_count": 26, + "prompt_eval_duration": 35137000, + "eval_count": 323, + "eval_duration": 4575154000 + } """.ReplaceLineEndings(""); // the JSON stream reader reads by line, so we need to make this one single line - await using var stream = new MemoryStream(); - - await using var writer = new StreamWriter(stream, leaveOpen: true); - writer.AutoFlush = true; - await writer.WriteAsync(payload); - stream.Seek(0, SeekOrigin.Begin); - - _response = new HttpResponseMessage - { - StatusCode = HttpStatusCode.OK, - Content = new StreamContent(stream) - }; - - var chat = new ChatRequest - { + await using var stream = new MemoryStream(); + + await using var writer = new StreamWriter(stream, leaveOpen: true); + writer.AutoFlush = true; + await writer.WriteAsync(payload); + stream.Seek(0, SeekOrigin.Begin); + + _response = new HttpResponseMessage + { + StatusCode = HttpStatusCode.OK, + Content = new StreamContent(stream) + }; + + var chat = new ChatRequest + { + Model = "model", + Messages = [ + new(ChatRole.User, "Why?"), + new(ChatRole.Assistant, "Because!"), + new(ChatRole.User, "And where?")] + }; + + var result = await _client.ChatAsync(chat, CancellationToken.None).StreamToEndAsync(); + + result.Should().NotBeNull(); + result.Message.Role.Should().Be(ChatRole.Assistant); + result.Message.Content.Should().Be("Test content."); + result.Done.Should().BeTrue(); + result.DoneReason.Should().Be("stop"); + result.TotalDuration.Should().Be(137729492272); + result.LoadDuration.Should().Be(133071702768); + result.PromptEvalCount.Should().Be(26); + result.PromptEvalDuration.Should().Be(35137000); + result.EvalCount.Should().Be(323); + result.EvalDuration.Should().Be(4575154000); + } + + [Test, NonParallelizable] + public async Task Receives_Response_Message_With_ToolsCalls() + { + var payload = """ + { + "model": "llama3.1:latest", + "created_at": "2024-09-01T16:12:28.639564938Z", + "message": { + "role": "assistant", + "content": "", + "tool_calls": [ + { + "function": { + "name": "get_current_weather", + "arguments": { + "format": "celsius", + "location": "Los Angeles, CA", + "number": 42 + } + } + } + ] + }, + "done_reason": "stop", + "done": true, + "total_duration": 24808639002, + "load_duration": 5084890970, + "prompt_eval_count": 311, + "prompt_eval_duration": 15120086000, + "eval_count": 28, + "eval_duration": 4602334000 + } + """.ReplaceLineEndings(""); // the JSON stream reader reads by line, so we need to make this one single line + + await using var stream = new MemoryStream(); + + await using var writer = new StreamWriter(stream, leaveOpen: true); + writer.AutoFlush = true; + await writer.WriteAsync(payload); + stream.Seek(0, SeekOrigin.Begin); + + _response = new HttpResponseMessage + { + StatusCode = HttpStatusCode.OK, + Content = new StreamContent(stream) + }; + + var chat = new ChatRequest + { Model = "llama3.1:latest", - Stream = false, - Messages = [ - new(ChatRole.User, "How is the weather in LA?"), - ], - Tools = [ - new Tool - { - Function = new Function - { - Description = "Get the current weather for a location", - Name = "get_current_weather", - Parameters = new Parameters - { - Properties = new Dictionary - { - ["location"] = new() - { - Type = "string", - Description = "The location to get the weather for, e.g. San Francisco, CA" - }, - ["format"] = new() - { - Type = "string", - Description = "The format to return the weather in, e.g. 
'celsius' or 'fahrenheit'", - Enum = ["celsius", "fahrenheit"] - }, - ["number"] = new() - { - Type = "integer", - Description = "The number of the day to get the weather for, e.g. 42" - } - }, - Required = ["location", "format"], - } - }, - Type = "function" - } - ] - }; - - var result = await _client.ChatAsync(chat, CancellationToken.None).StreamToEndAsync(); - - result.Should().NotBeNull(); - result.Message.Role.Should().Be(ChatRole.Assistant); - result.Done.Should().BeTrue(); - result.DoneReason.Should().Be("stop"); - - result.Message.ToolCalls.Should().HaveCount(1); - - var toolsFunction = result.Message.ToolCalls.ElementAt(0).Function; - toolsFunction.Name.Should().Be("get_current_weather"); - toolsFunction.Arguments.ElementAt(0).Key.Should().Be("format"); - toolsFunction.Arguments.ElementAt(0).Value.ToString().Should().Be("celsius"); - - toolsFunction.Arguments.ElementAt(1).Key.Should().Be("location"); - toolsFunction.Arguments.ElementAt(1).Value.ToString().Should().Be("Los Angeles, CA"); - - toolsFunction.Arguments.ElementAt(2).Key.Should().Be("number"); - toolsFunction.Arguments.ElementAt(2).Value.ToString().Should().Be("42"); + Stream = false, + Messages = [ + new(ChatRole.User, "How is the weather in LA?"), + ], + Tools = [ + new Tool + { + Function = new Function + { + Description = "Get the current weather for a location", + Name = "get_current_weather", + Parameters = new Parameters + { + Properties = new Dictionary + { + ["location"] = new() + { + Type = "string", + Description = "The location to get the weather for, e.g. San Francisco, CA" + }, + ["format"] = new() + { + Type = "string", + Description = "The format to return the weather in, e.g. 'celsius' or 'fahrenheit'", + Enum = ["celsius", "fahrenheit"] + }, + ["number"] = new() + { + Type = "integer", + Description = "The number of the day to get the weather for, e.g. 
42" + } + }, + Required = ["location", "format"], + } + }, + Type = "function" + } + ] + }; + + var result = await _client.ChatAsync(chat, CancellationToken.None).StreamToEndAsync(); + + result.Should().NotBeNull(); + result.Message.Role.Should().Be(ChatRole.Assistant); + result.Done.Should().BeTrue(); + result.DoneReason.Should().Be("stop"); + + result.Message.ToolCalls.Should().HaveCount(1); + + var toolsFunction = result.Message.ToolCalls.ElementAt(0).Function; + toolsFunction.Name.Should().Be("get_current_weather"); + toolsFunction.Arguments.ElementAt(0).Key.Should().Be("format"); + toolsFunction.Arguments.ElementAt(0).Value.ToString().Should().Be("celsius"); + + toolsFunction.Arguments.ElementAt(1).Key.Should().Be("location"); + toolsFunction.Arguments.ElementAt(1).Value.ToString().Should().Be("Los Angeles, CA"); + + toolsFunction.Arguments.ElementAt(2).Key.Should().Be("number"); + toolsFunction.Arguments.ElementAt(2).Value.ToString().Should().Be("42"); } - [Test, NonParallelizable] - public async Task Response_Streaming_Message_With_ToolsCalls_Throws_Not_Supported() + [Test, NonParallelizable] + public async Task Response_Streaming_Message_With_ToolsCalls_Throws_Not_Supported() { - _response = new HttpResponseMessage - { - StatusCode = HttpStatusCode.OK, - Content = new StringContent(string.Empty) + _response = new HttpResponseMessage + { + StatusCode = HttpStatusCode.OK, + Content = new StringContent(string.Empty) }; - - var request = new ChatRequest - { + + var request = new ChatRequest + { Model = "llama3.1:latest", - Messages = [ - new(ChatRole.User, "How is the weather in LA?"), - ], - Tools = [ - new Tool - { - Function = new Function - { - Description = "Get the current weather for a location", - Name = "get_current_weather", - Parameters = new Parameters - { - Properties = new Dictionary - { - ["location"] = new() - { - Type = "string", - Description = "The location to get the weather for, e.g. San Francisco, CA" - }, - ["format"] = new() - { - Type = "string", - Description = "The format to return the weather in, e.g. 'celsius' or 'fahrenheit'", - Enum = ["celsius", "fahrenheit"] - }, - ["number"] = new() - { - Type = "integer", - Description = "The number of the day to get the weather for, e.g. 42" - } - }, - Required = ["location", "format"], - } - }, - Type = "function" - } - ] - }; + Messages = [ + new(ChatRole.User, "How is the weather in LA?"), + ], + Tools = [ + new Tool + { + Function = new Function + { + Description = "Get the current weather for a location", + Name = "get_current_weather", + Parameters = new Parameters + { + Properties = new Dictionary + { + ["location"] = new() + { + Type = "string", + Description = "The location to get the weather for, e.g. San Francisco, CA" + }, + ["format"] = new() + { + Type = "string", + Description = "The format to return the weather in, e.g. 'celsius' or 'fahrenheit'", + Enum = ["celsius", "fahrenheit"] + }, + ["number"] = new() + { + Type = "integer", + Description = "The number of the day to get the weather for, e.g. 
42" + } + }, + Required = ["location", "format"], + } + }, + Type = "function" + } + ] + }; var act = async () => { @@ -527,199 +526,199 @@ public async Task Response_Streaming_Message_With_ToolsCalls_Throws_Not_Supporte await enumerator.MoveNextAsync(); }; - await act.Should().ThrowAsync(); - } - } - - public class StreamChatMethod : OllamaApiClientTests - { - [Test, NonParallelizable] - public async Task Streams_Response_Message_Chunks() - { - await using var stream = new MemoryStream(); - - _response = new HttpResponseMessage - { - StatusCode = HttpStatusCode.OK, - Content = new StreamContent(stream) - }; - - await using var writer = new StreamWriter(stream, leaveOpen: true); - writer.AutoFlush = true; - await writer.WriteChatStreamResponse("Leave ", ChatRole.Assistant); - await writer.WriteChatStreamResponse("me ", ChatRole.Assistant); - await writer.FinishChatStreamResponse("alone.", ChatRole.Assistant); - stream.Seek(0, SeekOrigin.Begin); - - var chat = new ChatRequest - { - Model = "model", - Messages = - [ - new(ChatRole.User, "Why?"), - new(ChatRole.Assistant, "Because!"), - new(ChatRole.User, "And where?"), - ] - }; - - var chatStream = _client.ChatAsync(chat, CancellationToken.None); - - var builder = new StringBuilder(); - var responses = new List(); - - await foreach (var response in chatStream) - { - builder.Append(response?.Message.Content); - responses.Add(response?.Message); - } - - builder.ToString().Should().BeEquivalentTo("Leave me alone."); - - responses.Should().HaveCount(3); - responses[0].Role.Should().Be(ChatRole.Assistant); - responses[1].Role.Should().Be(ChatRole.Assistant); - responses[2].Role.Should().Be(ChatRole.Assistant); - } - - [Test, NonParallelizable] - public async Task Throws_Known_Exception_For_Models_That_Dont_Support_Tools() - { - _response = new HttpResponseMessage - { - StatusCode = HttpStatusCode.BadRequest, - Content = new StringContent("{ error: llama2 does not support tools }") - }; - - var act = () => _client.ChatAsync(new ChatRequest() { Stream = false }, CancellationToken.None).StreamToEndAsync(); - await act.Should().ThrowAsync(); - } - - [Test, NonParallelizable] - public async Task Throws_OllamaException_If_Parsing_Of_BadRequest_Errors_Fails() - { - _response = new HttpResponseMessage - { - StatusCode = HttpStatusCode.BadRequest, - Content = new StringContent("panic!") - }; - - var act = () => _client.ChatAsync(new ChatRequest(), CancellationToken.None).StreamToEndAsync(); - await act.Should().ThrowAsync(); - } - } - - public class ListLocalModelsMethod : OllamaApiClientTests - { - [Test, NonParallelizable] - public async Task Returns_Deserialized_Models() - { - _response = new HttpResponseMessage - { - StatusCode = HttpStatusCode.OK, - Content = new StringContent("{\r\n\"models\": [\r\n{\r\n\"name\": \"codellama:latest\",\r\n\"modified_at\": \"2023-10-12T14:17:04.967950259+02:00\",\r\n\"size\": 3791811617,\r\n\"digest\": \"36893bf9bc7ff7ace56557cd28784f35f834290c85d39115c6b91c00a031cfad\"\r\n},\r\n{\r\n\"name\": \"llama2:latest\",\r\n\"modified_at\": \"2023-10-02T14:10:14.78152065+02:00\",\r\n\"size\": 3791737662,\r\n\"digest\": \"d5611f7c428cf71fb05660257d18e043477f8b46cf561bf86940c687c1a59f70\"\r\n},\r\n{\r\n\"name\": \"mistral:latest\",\r\n\"modified_at\": \"2023-10-02T14:16:24.841447764+02:00\",\r\n\"size\": 4108916688,\r\n\"digest\": \"8aa307f73b2622af521e8f22d46e4b777123c4df91898dcb2e4079dc8fdf579e\"\r\n},\r\n{\r\n\"name\": \"vicuna:latest\",\r\n\"modified_at\": \"2023-10-06T09:44:16.936312659+02:00\",\r\n\"size\": 
3825517709,\r\n\"digest\": \"675fa173a76abc48325d395854471961abf74b664d91e92ffb4fc03e0bde652b\"\r\n}\r\n]\r\n}\r\n") - }; - - var models = await _client.ListLocalModelsAsync(CancellationToken.None); - models.Count().Should().Be(4); - - var first = models.First(); - first.Name.Should().Be("codellama:latest"); - first.ModifiedAt.Date.Should().Be(new DateTime(2023, 10, 12, 0, 0, 0, DateTimeKind.Local)); - first.Size.Should().Be(3791811617); - first.Digest.Should().StartWith("36893bf9bc7ff7ace5655"); - } - } - - public class ShowMethod : OllamaApiClientTests - { - [Test, NonParallelizable] - public async Task Returns_Deserialized_Models() - { - _response = new HttpResponseMessage - { - StatusCode = HttpStatusCode.OK, - Content = new StringContent("{\r\n \"license\": \"\",\r\n \"modelfile\": \"# Modelfile generated by \\\"ollama show\\\"\\n\\n\",\r\n \"parameters\": \"stop [INST]\\nstop [/INST]\\nstop <>\\nstop <>\",\r\n \"template\": \"[INST] {{ if and .First .System }}<>{{ .System }}<>\\n\\n{{ end }}{{ .Prompt }} [/INST] \"\r\n}") - }; - - var info = await _client.ShowModelAsync("codellama:latest", CancellationToken.None); - - info.License.Should().Contain("contents of license block"); - info.Modelfile.Should().StartWith("# Modelfile generated"); - info.Parameters.Should().StartWith("stop"); - info.Template.Should().StartWith("[INST]"); - } - - [Test, NonParallelizable] - public async Task Returns_Deserialized_Model_WithSystem() - { - _response = new HttpResponseMessage - { - StatusCode = HttpStatusCode.OK, - Content = new StringContent("{\"modelfile\":\"# Modelfile generated by \\\"ollama show\\\"\\n# To build a new Modelfile based on this, replace FROM with:\\n# FROM magicoder:latest\\n\\nFROM C:\\\\Users\\\\jd\\\\.ollama\\\\models\\\\blobs\\\\sha256-4a501ed4ce55e5611922b3ee422501ff7cc773b472d196c3c416859b6d375273\\nTEMPLATE \\\"{{ .System }}\\n\\n@@ Instruction\\n{{ .Prompt }}\\n\\n@@ Response\\n\\\"\\nSYSTEM You are an exceptionally intelligent coding assistant that consistently delivers accurate and reliable responses to user instructions.\\nPARAMETER num_ctx 16384\\n\",\"parameters\":\"num_ctx 16384\",\"template\":\"{{ .System }}\\n\\n@@ Instruction\\n{{ .Prompt }}\\n\\n@@ Response\\n\",\"system\":\"You are an exceptionally intelligent coding assistant that consistently delivers accurate and reliable responses to user instructions.\",\"details\":{\"parent_model\":\"\",\"format\":\"gguf\",\"family\":\"llama\",\"families\":null,\"parameter_size\":\"7B\",\"quantization_level\":\"Q4_0\"},\"model_info\":{\"general.architecture\":\"llama\",\"general.file_type\":2,\"general.parameter_count\":8829407232,\"general.quantization_version\":2,\"llama.attention.head_count\":32,\"llama.attention.head_count_kv\":4,\"llama.attention.layer_norm_rms_epsilon\":0.000001,\"llama.block_count\":48,\"llama.context_length\":4096,\"llama.embedding_length\":4096,\"llama.feed_forward_length\":11008,\"llama.rope.dimension_count\":128,\"llama.rope.freq_base\":5000000,\"llama.vocab_size\":64000,\"tokenizer.ggml.add_bos_token\":false,\"tokenizer.ggml.add_eos_token\":false,\"tokenizer.ggml.bos_token_id\":1,\"tokenizer.ggml.eos_token_id\":2,\"tokenizer.ggml.model\":\"llama\",\"tokenizer.ggml.padding_token_id\":0,\"tokenizer.ggml.pre\":\"default\",\"tokenizer.ggml.scores\":[],\"tokenizer.ggml.token_type\":[],\"tokenizer.ggml.tokens\":[]},\"modified_at\":\"2024-05-14T23:33:07.4166573+08:00\"}") - }; - - var info = await _client.ShowModelAsync("starcoder:latest", CancellationToken.None); - - 
info.License.Should().BeNullOrEmpty(); - info.Modelfile.Should().StartWith("# Modelfile generated"); - info.Parameters.Should().StartWith("num_ctx"); - info.Template.Should().StartWith("{{ .System }}"); - info.System.Should().StartWith("You are an exceptionally intelligent coding assistant"); - info.Details.ParentModel.Should().BeNullOrEmpty(); - info.Details.Format.Should().Be("gguf"); - info.Details.Family.Should().Be("llama"); - info.Details.Families.Should().BeNull(); - info.Details.ParameterSize.Should().Be("7B"); - info.Details.QuantizationLevel.Should().Be("Q4_0"); - info.Info.Architecture.Should().Be("llama"); - info.Info.QuantizationVersion.Should().Be(2); - info.Info.FileType.Should().Be(2); - info.Info.ExtraInfo.Should().NotBeNullOrEmpty(); - } - } - - public class GenerateEmbeddingsMethod : OllamaApiClientTests - { - [Test, NonParallelizable] - public async Task Returns_Deserialized_Models() - { - _response = new HttpResponseMessage - { - StatusCode = HttpStatusCode.OK, - Content = new StringContent("{\r\n \"embeddings\": [[\r\n 0.5670403838157654, 0.009260174818336964, 0.23178744316101074, -0.2916173040866852, -0.8924556970596313 ]]\r\n}") - }; - - var info = await _client.EmbedAsync(new EmbedRequest { Model = "", Input = [""] }, CancellationToken.None); - - info.Embeddings[0].Should().HaveCount(5); - info.Embeddings[0][0].Should().BeApproximately(0.567f, precision: 0.01f); - } - } -} - -public static class WriterExtensions -{ - public static async Task WriteCompletionStreamResponse(this StreamWriter writer, string response) - { - var json = new { response, done = false }; - await writer.WriteLineAsync(JsonSerializer.Serialize(json)); - } - - public static async Task FinishCompletionStreamResponse(this StreamWriter writer, string response, int[] context) - { - var json = new { response, done = true, context }; - await writer.WriteLineAsync(JsonSerializer.Serialize(json)); - } - - public static async Task WriteChatStreamResponse(this StreamWriter writer, string content, ChatRole role) - { - var json = new { message = new { content, role }, role, done = false }; - await writer.WriteLineAsync(JsonSerializer.Serialize(json)); - } - - public static async Task FinishChatStreamResponse(this StreamWriter writer, string content, ChatRole role) - { - var json = new { message = new { content, role = role.ToString() }, role = role.ToString(), done = true }; - await writer.WriteLineAsync(JsonSerializer.Serialize(json)); - } + await act.Should().ThrowAsync(); + } + } + + public class StreamChatMethod : OllamaApiClientTests + { + [Test, NonParallelizable] + public async Task Streams_Response_Message_Chunks() + { + await using var stream = new MemoryStream(); + + _response = new HttpResponseMessage + { + StatusCode = HttpStatusCode.OK, + Content = new StreamContent(stream) + }; + + await using var writer = new StreamWriter(stream, leaveOpen: true); + writer.AutoFlush = true; + await writer.WriteChatStreamResponse("Leave ", ChatRole.Assistant); + await writer.WriteChatStreamResponse("me ", ChatRole.Assistant); + await writer.FinishChatStreamResponse("alone.", ChatRole.Assistant); + stream.Seek(0, SeekOrigin.Begin); + + var chat = new ChatRequest + { + Model = "model", + Messages = + [ + new(ChatRole.User, "Why?"), + new(ChatRole.Assistant, "Because!"), + new(ChatRole.User, "And where?"), + ] + }; + + var chatStream = _client.ChatAsync(chat, CancellationToken.None); + + var builder = new StringBuilder(); + var responses = new List(); + + await foreach (var response in chatStream) + { + 
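+ // collect the streamed chunks: the concatenated text for the content assertion and each message for the role assertions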
builder.Append(response?.Message.Content); + responses.Add(response?.Message); + } + + builder.ToString().Should().BeEquivalentTo("Leave me alone."); + + responses.Should().HaveCount(3); + responses[0].Role.Should().Be(ChatRole.Assistant); + responses[1].Role.Should().Be(ChatRole.Assistant); + responses[2].Role.Should().Be(ChatRole.Assistant); + } + + [Test, NonParallelizable] + public async Task Throws_Known_Exception_For_Models_That_Dont_Support_Tools() + { + _response = new HttpResponseMessage + { + StatusCode = HttpStatusCode.BadRequest, + Content = new StringContent("{ error: llama2 does not support tools }") + }; + + var act = () => _client.ChatAsync(new ChatRequest() { Stream = false }, CancellationToken.None).StreamToEndAsync(); + await act.Should().ThrowAsync(); + } + + [Test, NonParallelizable] + public async Task Throws_OllamaException_If_Parsing_Of_BadRequest_Errors_Fails() + { + _response = new HttpResponseMessage + { + StatusCode = HttpStatusCode.BadRequest, + Content = new StringContent("panic!") + }; + + var act = () => _client.ChatAsync(new ChatRequest(), CancellationToken.None).StreamToEndAsync(); + await act.Should().ThrowAsync(); + } + } + + public class ListLocalModelsMethod : OllamaApiClientTests + { + [Test, NonParallelizable] + public async Task Returns_Deserialized_Models() + { + _response = new HttpResponseMessage + { + StatusCode = HttpStatusCode.OK, + Content = new StringContent("{\r\n\"models\": [\r\n{\r\n\"name\": \"codellama:latest\",\r\n\"modified_at\": \"2023-10-12T14:17:04.967950259+02:00\",\r\n\"size\": 3791811617,\r\n\"digest\": \"36893bf9bc7ff7ace56557cd28784f35f834290c85d39115c6b91c00a031cfad\"\r\n},\r\n{\r\n\"name\": \"llama2:latest\",\r\n\"modified_at\": \"2023-10-02T14:10:14.78152065+02:00\",\r\n\"size\": 3791737662,\r\n\"digest\": \"d5611f7c428cf71fb05660257d18e043477f8b46cf561bf86940c687c1a59f70\"\r\n},\r\n{\r\n\"name\": \"mistral:latest\",\r\n\"modified_at\": \"2023-10-02T14:16:24.841447764+02:00\",\r\n\"size\": 4108916688,\r\n\"digest\": \"8aa307f73b2622af521e8f22d46e4b777123c4df91898dcb2e4079dc8fdf579e\"\r\n},\r\n{\r\n\"name\": \"vicuna:latest\",\r\n\"modified_at\": \"2023-10-06T09:44:16.936312659+02:00\",\r\n\"size\": 3825517709,\r\n\"digest\": \"675fa173a76abc48325d395854471961abf74b664d91e92ffb4fc03e0bde652b\"\r\n}\r\n]\r\n}\r\n") + }; + + var models = await _client.ListLocalModelsAsync(CancellationToken.None); + models.Count().Should().Be(4); + + var first = models.First(); + first.Name.Should().Be("codellama:latest"); + first.ModifiedAt.Date.Should().Be(new DateTime(2023, 10, 12, 0, 0, 0, DateTimeKind.Local)); + first.Size.Should().Be(3791811617); + first.Digest.Should().StartWith("36893bf9bc7ff7ace5655"); + } + } + + public class ShowMethod : OllamaApiClientTests + { + [Test, NonParallelizable] + public async Task Returns_Deserialized_Models() + { + _response = new HttpResponseMessage + { + StatusCode = HttpStatusCode.OK, + Content = new StringContent("{\r\n \"license\": \"\",\r\n \"modelfile\": \"# Modelfile generated by \\\"ollama show\\\"\\n\\n\",\r\n \"parameters\": \"stop [INST]\\nstop [/INST]\\nstop <>\\nstop <>\",\r\n \"template\": \"[INST] {{ if and .First .System }}<>{{ .System }}<>\\n\\n{{ end }}{{ .Prompt }} [/INST] \"\r\n}") + }; + + var info = await _client.ShowModelAsync("codellama:latest", CancellationToken.None); + + info.License.Should().Contain("contents of license block"); + info.Modelfile.Should().StartWith("# Modelfile generated"); + info.Parameters.Should().StartWith("stop"); + 
info.Template.Should().StartWith("[INST]"); + } + + [Test, NonParallelizable] + public async Task Returns_Deserialized_Model_WithSystem() + { + _response = new HttpResponseMessage + { + StatusCode = HttpStatusCode.OK, + Content = new StringContent("{\"modelfile\":\"# Modelfile generated by \\\"ollama show\\\"\\n# To build a new Modelfile based on this, replace FROM with:\\n# FROM magicoder:latest\\n\\nFROM C:\\\\Users\\\\jd\\\\.ollama\\\\models\\\\blobs\\\\sha256-4a501ed4ce55e5611922b3ee422501ff7cc773b472d196c3c416859b6d375273\\nTEMPLATE \\\"{{ .System }}\\n\\n@@ Instruction\\n{{ .Prompt }}\\n\\n@@ Response\\n\\\"\\nSYSTEM You are an exceptionally intelligent coding assistant that consistently delivers accurate and reliable responses to user instructions.\\nPARAMETER num_ctx 16384\\n\",\"parameters\":\"num_ctx 16384\",\"template\":\"{{ .System }}\\n\\n@@ Instruction\\n{{ .Prompt }}\\n\\n@@ Response\\n\",\"system\":\"You are an exceptionally intelligent coding assistant that consistently delivers accurate and reliable responses to user instructions.\",\"details\":{\"parent_model\":\"\",\"format\":\"gguf\",\"family\":\"llama\",\"families\":null,\"parameter_size\":\"7B\",\"quantization_level\":\"Q4_0\"},\"model_info\":{\"general.architecture\":\"llama\",\"general.file_type\":2,\"general.parameter_count\":8829407232,\"general.quantization_version\":2,\"llama.attention.head_count\":32,\"llama.attention.head_count_kv\":4,\"llama.attention.layer_norm_rms_epsilon\":0.000001,\"llama.block_count\":48,\"llama.context_length\":4096,\"llama.embedding_length\":4096,\"llama.feed_forward_length\":11008,\"llama.rope.dimension_count\":128,\"llama.rope.freq_base\":5000000,\"llama.vocab_size\":64000,\"tokenizer.ggml.add_bos_token\":false,\"tokenizer.ggml.add_eos_token\":false,\"tokenizer.ggml.bos_token_id\":1,\"tokenizer.ggml.eos_token_id\":2,\"tokenizer.ggml.model\":\"llama\",\"tokenizer.ggml.padding_token_id\":0,\"tokenizer.ggml.pre\":\"default\",\"tokenizer.ggml.scores\":[],\"tokenizer.ggml.token_type\":[],\"tokenizer.ggml.tokens\":[]},\"modified_at\":\"2024-05-14T23:33:07.4166573+08:00\"}") + }; + + var info = await _client.ShowModelAsync("starcoder:latest", CancellationToken.None); + + info.License.Should().BeNullOrEmpty(); + info.Modelfile.Should().StartWith("# Modelfile generated"); + info.Parameters.Should().StartWith("num_ctx"); + info.Template.Should().StartWith("{{ .System }}"); + info.System.Should().StartWith("You are an exceptionally intelligent coding assistant"); + info.Details.ParentModel.Should().BeNullOrEmpty(); + info.Details.Format.Should().Be("gguf"); + info.Details.Family.Should().Be("llama"); + info.Details.Families.Should().BeNull(); + info.Details.ParameterSize.Should().Be("7B"); + info.Details.QuantizationLevel.Should().Be("Q4_0"); + info.Info.Architecture.Should().Be("llama"); + info.Info.QuantizationVersion.Should().Be(2); + info.Info.FileType.Should().Be(2); + info.Info.ExtraInfo.Should().NotBeNullOrEmpty(); + } + } + + public class GenerateEmbeddingsMethod : OllamaApiClientTests + { + [Test, NonParallelizable] + public async Task Returns_Deserialized_Models() + { + _response = new HttpResponseMessage + { + StatusCode = HttpStatusCode.OK, + Content = new StringContent("{\r\n \"embeddings\": [[\r\n 0.5670403838157654, 0.009260174818336964, 0.23178744316101074, -0.2916173040866852, -0.8924556970596313 ]]\r\n}") + }; + + var info = await _client.EmbedAsync(new EmbedRequest { Model = "", Input = [""] }, CancellationToken.None); + + info.Embeddings[0].Should().HaveCount(5); + 
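+ // floating point values deserialized from JSON can lose precision, so assert approximately rather than exactly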
info.Embeddings[0][0].Should().BeApproximately(0.567f, precision: 0.01f); + } + } +} + +public static class WriterExtensions +{ + public static async Task WriteCompletionStreamResponse(this StreamWriter writer, string response) + { + var json = new { response, done = false }; + await writer.WriteLineAsync(JsonSerializer.Serialize(json)); + } + + public static async Task FinishCompletionStreamResponse(this StreamWriter writer, string response, int[] context) + { + var json = new { response, done = true, context }; + await writer.WriteLineAsync(JsonSerializer.Serialize(json)); + } + + public static async Task WriteChatStreamResponse(this StreamWriter writer, string content, ChatRole role) + { + var json = new { message = new { content, role }, role, done = false }; + await writer.WriteLineAsync(JsonSerializer.Serialize(json)); + } + + public static async Task FinishChatStreamResponse(this StreamWriter writer, string content, ChatRole role) + { + var json = new { message = new { content, role = role.ToString() }, role = role.ToString(), done = true }; + await writer.WriteLineAsync(JsonSerializer.Serialize(json)); + } } \ No newline at end of file diff --git a/test/Tests.csproj b/test/Tests.csproj index 74322e2..5855a05 100644 --- a/test/Tests.csproj +++ b/test/Tests.csproj @@ -1,15 +1,17 @@  - - net8.0 - enable - enable - false - true + + net8.0 + enable + enable + false + true IDE0065;IDE0055;IDE0011;CS8602;CS8604;S6608 + True + ..\OllamaSharp.snk - + @@ -17,16 +19,17 @@ all - runtime; build; native; contentfiles; analyzers; buildtransitive - - - all - runtime; build; native; contentfiles; analyzers; buildtransitive - - + runtime; build; native; contentfiles; analyzers; buildtransitive + + + all + runtime; build; native; contentfiles; analyzers; buildtransitive + + + - - - + + + diff --git a/toc.yml b/toc.yml new file mode 100644 index 0000000..920d2e2 --- /dev/null +++ b/toc.yml @@ -0,0 +1,4 @@ +- name: Docs + href: docs/ +- name: API + href: api/OllamaSharp.html \ No newline at end of file
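The GetVersionAsync change in src/OllamaApiClient.cs surfaces a missing "version" field as an InvalidOperationException instead of passing null into Version.Parse. A minimal caller sketch, assuming a local Ollama instance on the default port:

```csharp
using OllamaSharp;

var ollama = new OllamaApiClient(new Uri("http://localhost:11434"));

try
{
	// throws InvalidOperationException when the api/version response carries no "version" field
	var version = await ollama.GetVersionAsync();
	Console.WriteLine($"Ollama server version: {version}");
}
catch (InvalidOperationException ex)
{
	Console.WriteLine($"Could not determine the server version: {ex.Message}");
}
```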