Added Fireworks provider (#43)
SommerEngineering authored Jul 25, 2024
1 parent 4f58152 commit 9267ef8
Showing 19 changed files with 335 additions and 38 deletions.
2 changes: 1 addition & 1 deletion README.md
@@ -5,7 +5,7 @@ MindWork AI Studio is a desktop application available for macOS, Windows, and Li

**Key advantages:**
- **Free of charge**: The app is free to use, both for personal and commercial purposes.
- **Independence**: Users are not tied to any single provider. Instead, they can choose the provider that best suits their needs. Right now, we support OpenAI (GPT4o etc.), Mistral, Anthropic (Claude), and self-hosted models using [llama.cpp](https://github.com/ggerganov/llama.cpp), [ollama](https://github.com/ollama/ollama), or [LM Studio](https://lmstudio.ai/). Support for Google Gemini, [Replicate](https://replicate.com/), and [Fireworks](https://fireworks.ai/) is planned.
- **Independence**: You are not tied to any single provider. Instead, you can choose the provider that best suits your needs. Right now, we support OpenAI (GPT4o etc.), Mistral, Anthropic (Claude), and self-hosted models using [llama.cpp](https://github.com/ggerganov/llama.cpp), [ollama](https://github.com/ollama/ollama), [LM Studio](https://lmstudio.ai/), or [Fireworks](https://fireworks.ai/). Support for Google Gemini and [Replicate](https://replicate.com/) is planned.
- **Unrestricted usage**: Unlike services like ChatGPT, which impose limits after intensive use, MindWork AI Studio offers unlimited usage through the providers API.
- **Cost-effective**: You only pay for what you use, which can be cheaper than monthly subscription services like ChatGPT Plus, especially if used infrequently. But beware, here be dragons: For extremely intensive usage, the API costs can be significantly higher. Unfortunately, providers currently do not offer a way to display current costs in the app. Therefore, check your account with the respective provider to see how your costs are developing. When available, use prepaid and set a cost limit.
- **Privacy**: The data entered into the app is not used for training by the providers since we are using the provider's API.
1 change: 1 addition & 0 deletions app/MindWork AI Studio/Components/Blocks/Changelog.Logs.cs
@@ -13,6 +13,7 @@ public readonly record struct Log(int Build, string Display, string Filename)

public static readonly Log[] LOGS =
[
new (165, "v0.8.3, build 165 (2024-07-25 13:25 UTC)", "v0.8.3.md"),
new (164, "v0.8.2, build 164 (2024-07-16 18:03 UTC)", "v0.8.2.md"),
new (163, "v0.8.1, build 163 (2024-07-16 08:32 UTC)", "v0.8.1.md"),
new (162, "v0.8.0, build 162 (2024-07-14 19:39 UTC)", "v0.8.0.md"),
2 changes: 1 addition & 1 deletion app/MindWork AI Studio/Components/Pages/Home.razor.cs
@@ -31,7 +31,7 @@ private async Task ReadLastChangeAsync()
private static readonly TextItem[] ITEMS_ADVANTAGES =
[
new TextItem("Free of charge", "The app is free to use, both for personal and commercial purposes."),
new TextItem("Independence", "You are not tied to any single provider. Instead, you might choose the provider that best suits your needs. Right now, we support OpenAI (GPT4o etc.), Mistral, Anthropic (Claude), and self-hosted models using llama.cpp, ollama, or LM Studio. Support for Google Gemini, Replicate, and Fireworks is planned."),
new TextItem("Independence", "You are not tied to any single provider. Instead, you might choose the provider that best suits your needs. Right now, we support OpenAI (GPT4o etc.), Mistral, Anthropic (Claude), and self-hosted models using llama.cpp, ollama, LM Studio, or Fireworks. Support for Google Gemini and Replicate is planned."),
new TextItem("Unrestricted usage", "Unlike services like ChatGPT, which impose limits after intensive use, MindWork AI Studio offers unlimited usage through the providers API."),
new TextItem("Cost-effective", "You only pay for what you use, which can be cheaper than monthly subscription services like ChatGPT Plus, especially if used infrequently. But beware, here be dragons: For extremely intensive usage, the API costs can be significantly higher. Unfortunately, providers currently do not offer a way to display current costs in the app. Therefore, check your account with the respective provider to see how your costs are developing. When available, use prepaid and set a cost limit."),
new TextItem("Privacy", "The data entered into the app is not used for training by the providers since we are using the provider's API."),
2 changes: 1 addition & 1 deletion app/MindWork AI Studio/Components/Pages/Settings.razor
@@ -41,7 +41,7 @@
}
</MudTd>
<MudTd Style="text-align: left;">
<MudButton Variant="Variant.Filled" Color="Color.Info" StartIcon="@Icons.Material.Filled.OpenInBrowser" Class="ma-2" Href="@this.GetProviderDashboardURL(context.UsedProvider)" Target="_blank" Disabled="@(context.UsedProvider is Providers.NONE or Providers.SELF_HOSTED)">
<MudButton Variant="Variant.Filled" Color="Color.Info" StartIcon="@Icons.Material.Filled.OpenInBrowser" Class="ma-2" Href="@this.GetProviderDashboardURL(context.UsedProvider)" Target="_blank" Disabled="@(!this.HasDashboard(context.UsedProvider))">
Open Dashboard
</MudButton>
<MudButton Variant="Variant.Filled" Color="Color.Info" StartIcon="@Icons.Material.Filled.Edit" Class="ma-2" OnClick="() => this.EditProvider(context)">
11 changes: 11 additions & 0 deletions app/MindWork AI Studio/Components/Pages/Settings.razor.cs
@@ -102,11 +102,22 @@ private async Task DeleteProvider(AIStudio.Settings.Provider provider)
await this.MessageBus.SendMessage<bool>(this, Event.CONFIGURATION_CHANGED);
}

private bool HasDashboard(Providers provider) => provider switch
{
Providers.OPEN_AI => true,
Providers.MISTRAL => true,
Providers.ANTHROPIC => true,
Providers.FIREWORKS => true,

_ => false,
};

private string GetProviderDashboardURL(Providers provider) => provider switch
{
Providers.OPEN_AI => "https://platform.openai.com/usage",
Providers.MISTRAL => "https://console.mistral.ai/usage/",
Providers.ANTHROPIC => "https://console.anthropic.com/settings/plans",
Providers.FIREWORKS => "https://fireworks.ai/account/billing",

_ => string.Empty,
};
13 changes: 13 additions & 0 deletions app/MindWork AI Studio/Provider/Fireworks/ChatRequest.cs
@@ -0,0 +1,13 @@
namespace AIStudio.Provider.Fireworks;

/// <summary>
/// The Fireworks chat request model.
/// </summary>
/// <param name="Model">Which model to use for chat completion.</param>
/// <param name="Messages">The chat messages.</param>
/// <param name="Stream">Whether to stream the chat completion.</param>
public readonly record struct ChatRequest(
string Model,
IList<Message> Messages,
bool Stream
);
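
For illustration only (not part of the commit): a minimal sketch of how this request model serializes under the snake_case naming policy that ProviderFireworks configures below. The model path and message text are made-up examples.

using System.Text.Json;

using AIStudio.Provider.Fireworks;

// Hypothetical sketch: serialize a ChatRequest the same way ProviderFireworks does.
var options = new JsonSerializerOptions { PropertyNamingPolicy = JsonNamingPolicy.SnakeCaseLower };

var request = new ChatRequest(
    Model: "accounts/fireworks/models/llama-v3p1-8b-instruct", // example model id (assumption)
    Messages: [ new Message(Content: "Hello!", Role: "user") ],
    Stream: true);

// Produces JSON along the lines of:
// {"model":"accounts/...","messages":[{"content":"Hello!","role":"user"}],"stream":true}
Console.WriteLine(JsonSerializer.Serialize(request, options));
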
8 changes: 8 additions & 0 deletions app/MindWork AI Studio/Provider/Fireworks/Message.cs
@@ -0,0 +1,8 @@
namespace AIStudio.Provider.Fireworks;

/// <summary>
/// Chat message model.
/// </summary>
/// <param name="Content">The text content of the message.</param>
/// <param name="Role">The role of the message.</param>
public readonly record struct Message(string Content, string Role);
160 changes: 160 additions & 0 deletions app/MindWork AI Studio/Provider/Fireworks/ProviderFireworks.cs
@@ -0,0 +1,160 @@
using System.Net.Http.Headers;
using System.Runtime.CompilerServices;
using System.Text;
using System.Text.Json;

using AIStudio.Chat;
using AIStudio.Settings;

namespace AIStudio.Provider.Fireworks;

public class ProviderFireworks() : BaseProvider("https://api.fireworks.ai/inference/v1/"), IProvider
{
private static readonly JsonSerializerOptions JSON_SERIALIZER_OPTIONS = new()
{
PropertyNamingPolicy = JsonNamingPolicy.SnakeCaseLower,
};

#region Implementation of IProvider

/// <inheritdoc />
public string Id => "Fireworks.ai";

/// <inheritdoc />
public string InstanceName { get; set; } = "Fireworks.ai";

/// <inheritdoc />
public async IAsyncEnumerable<string> StreamChatCompletion(IJSRuntime jsRuntime, SettingsManager settings, Model chatModel, ChatThread chatThread, [EnumeratorCancellation] CancellationToken token = default)
{
// Get the API key:
var requestedSecret = await settings.GetAPIKey(jsRuntime, this);
if(!requestedSecret.Success)
yield break;

// Prepare the system prompt:
var systemPrompt = new Message
{
Role = "system",
Content = chatThread.SystemPrompt,
};

// Prepare the Fireworks HTTP chat request:
var fireworksChatRequest = JsonSerializer.Serialize(new ChatRequest
{
Model = chatModel.Id,

// Build the messages:
// - First of all the system prompt
// - Then non-empty user and AI messages
Messages = [systemPrompt, ..chatThread.Blocks.Where(n => n.ContentType is ContentType.TEXT && !string.IsNullOrWhiteSpace((n.Content as ContentText)?.Text)).Select(n => new Message
{
Role = n.Role switch
{
ChatRole.USER => "user",
ChatRole.AI => "assistant",
ChatRole.SYSTEM => "system",
_ => "user",
},
Content = n.Content switch
{
ContentText text => text.Text,
_ => string.Empty,
}
}).ToList()],

// Right now, we only support streaming completions:
Stream = true,
}, JSON_SERIALIZER_OPTIONS);

// Build the HTTP post request:
var request = new HttpRequestMessage(HttpMethod.Post, "chat/completions");

// Set the authorization header:
request.Headers.Authorization = new AuthenticationHeaderValue("Bearer", requestedSecret.Secret);

// Set the content:
request.Content = new StringContent(fireworksChatRequest, Encoding.UTF8, "application/json");

// Send the request with the ResponseHeadersRead option.
// This allows us to read the stream as soon as the headers are received.
// This is important because we want to stream the responses.
var response = await this.httpClient.SendAsync(request, HttpCompletionOption.ResponseHeadersRead, token);

// Open the response stream:
var fireworksStream = await response.Content.ReadAsStreamAsync(token);

// Add a stream reader to read the stream, line by line:
var streamReader = new StreamReader(fireworksStream);

// Read the stream, line by line:
while(!streamReader.EndOfStream)
{
// Check if the token is canceled:
if(token.IsCancellationRequested)
yield break;

// Read the next line:
var line = await streamReader.ReadLineAsync(token);

// Skip empty lines:
if(string.IsNullOrWhiteSpace(line))
continue;

// Skip lines that do not start with "data: ". According
// to the specification, we only want to read the data lines:
if(!line.StartsWith("data: ", StringComparison.InvariantCulture))
continue;

// Check if the line is the end of the stream:
if (line.StartsWith("data: [DONE]", StringComparison.InvariantCulture))
yield break;

ResponseStreamLine fireworksResponse;
try
{
// We know that the line starts with "data: ". Hence, we can
// skip the first 6 characters to get the JSON data after that.
var jsonData = line[6..];

// Deserialize the JSON data:
fireworksResponse = JsonSerializer.Deserialize<ResponseStreamLine>(jsonData, JSON_SERIALIZER_OPTIONS);
}
catch
{
// Skip invalid JSON data:
continue;
}

// Skip empty responses:
if(fireworksResponse == default || fireworksResponse.Choices.Count == 0)
continue;

// Yield the response:
yield return fireworksResponse.Choices[0].Delta.Content;
}
}

#pragma warning disable CS1998 // Async method lacks 'await' operators and will run synchronously
/// <inheritdoc />
public async IAsyncEnumerable<ImageURL> StreamImageCompletion(IJSRuntime jsRuntime, SettingsManager settings, Model imageModel, string promptPositive, string promptNegative = FilterOperator.String.Empty, ImageURL referenceImageURL = default, [EnumeratorCancellation] CancellationToken token = default)
{
yield break;
}
#pragma warning restore CS1998 // Async method lacks 'await' operators and will run synchronously

/// <inheritdoc />
public Task<IEnumerable<Model>> GetTextModels(IJSRuntime jsRuntime, SettingsManager settings, string? apiKeyProvisional = null, CancellationToken token = default)
{
return Task.FromResult(Enumerable.Empty<Model>());
}

/// <inheritdoc />
public Task<IEnumerable<Model>> GetImageModels(IJSRuntime jsRuntime, SettingsManager settings, string? apiKeyProvisional = null, CancellationToken token = default)
{
return Task.FromResult(Enumerable.Empty<Model>());
}

#endregion
}
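
For orientation (not part of the commit): a hedged sketch of how the streamed deltas from StreamChatCompletion could be consumed. The helper class, its name, and the instance name are invented for illustration; the caller is assumed to supply the JS runtime, settings manager, selected model, and chat thread from the surrounding app, and the Model type is assumed to live in AIStudio.Provider.

using System.Text;

using AIStudio.Chat;
using AIStudio.Provider;
using AIStudio.Provider.Fireworks;
using AIStudio.Settings;

using Microsoft.JSInterop;

// Hypothetical usage sketch: accumulate the streamed answer into one string.
public static class FireworksUsageSketch
{
    public static async Task<string> ReadAnswerAsync(IJSRuntime jsRuntime, SettingsManager settings, Model chatModel, ChatThread chatThread, CancellationToken token)
    {
        var provider = new ProviderFireworks { InstanceName = "My Fireworks" };
        var answer = new StringBuilder();

        // Each yielded string is one delta parsed from the SSE response:
        await foreach (var delta in provider.StreamChatCompletion(jsRuntime, settings, chatModel, chatThread, token))
            answer.Append(delta);

        return answer.ToString();
    }
}
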
24 changes: 24 additions & 0 deletions app/MindWork AI Studio/Provider/Fireworks/ResponseStreamLine.cs
@@ -0,0 +1,24 @@
namespace AIStudio.Provider.Fireworks;

/// <summary>
/// Data model for a line in the response stream, for streaming completions.
/// </summary>
/// <param name="Id">The id of the response.</param>
/// <param name="Object">The object describing the response.</param>
/// <param name="Created">The timestamp of the response.</param>
/// <param name="Model">The model used for the response.</param>
/// <param name="Choices">The choices made by the AI.</param>
public readonly record struct ResponseStreamLine(string Id, string Object, uint Created, string Model, IList<Choice> Choices);

/// <summary>
/// Data model for a choice made by the AI.
/// </summary>
/// <param name="Index">The index of the choice.</param>
/// <param name="Delta">The delta text of the choice.</param>
public readonly record struct Choice(int Index, Delta Delta);

/// <summary>
/// The delta text of a choice.
/// </summary>
/// <param name="Content">The content of the delta text.</param>
public readonly record struct Delta(string Content);
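
For illustration only (not part of the commit): a hedged sketch of deserializing a single SSE "data:" line into these records, mirroring what the read loop in ProviderFireworks does. The sample payload is an assumption modeled on OpenAI-compatible streaming chunks, not captured Fireworks output.

using System.Text.Json;

using AIStudio.Provider.Fireworks;

// Hypothetical sample line; real chunks may carry additional fields,
// which System.Text.Json simply ignores when mapping onto these records.
var line = """data: {"id":"abc123","object":"chat.completion.chunk","created":1721912345,"model":"accounts/fireworks/models/llama-v3p1-8b-instruct","choices":[{"index":0,"delta":{"content":"Hello"}}]}""";

var options = new JsonSerializerOptions { PropertyNamingPolicy = JsonNamingPolicy.SnakeCaseLower };

// Strip the "data: " prefix (6 characters), as the provider's read loop does:
var chunk = JsonSerializer.Deserialize<ResponseStreamLine>(line[6..], options);

Console.WriteLine(chunk.Choices[0].Delta.Content); // prints: Hello
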
2 changes: 1 addition & 1 deletion app/MindWork AI Studio/Provider/OpenAI/ProviderOpenAI.cs
@@ -97,7 +97,7 @@ public async IAsyncEnumerable<string> StreamChatCompletion(IJSRuntime jsRuntime,
// Read the stream, line by line:
while(!streamReader.EndOfStream)
{
// Check if the token is cancelled:
// Check if the token is canceled:
if(token.IsCancellationRequested)
yield break;

21 changes: 14 additions & 7 deletions app/MindWork AI Studio/Provider/Providers.cs
@@ -1,4 +1,5 @@
using AIStudio.Provider.Anthropic;
using AIStudio.Provider.Fireworks;
using AIStudio.Provider.Mistral;
using AIStudio.Provider.OpenAI;
using AIStudio.Provider.SelfHosted;
@@ -10,13 +11,15 @@ namespace AIStudio.Provider;
/// </summary>
public enum Providers
{
NONE,
NONE = 0,

OPEN_AI,
ANTHROPIC,
MISTRAL,
OPEN_AI = 1,
ANTHROPIC = 2,
MISTRAL = 3,

SELF_HOSTED,
FIREWORKS = 5,

SELF_HOSTED = 4,
}

/// <summary>
@@ -37,6 +40,8 @@ public static class ExtensionsProvider
Providers.ANTHROPIC => "Anthropic",
Providers.MISTRAL => "Mistral",

Providers.FIREWORKS => "Fireworks.ai",

Providers.SELF_HOSTED => "Self-hosted",

_ => "Unknown",
@@ -56,9 +61,11 @@ public static IProvider CreateProvider(this Settings.Provider providerSettings)
Providers.OPEN_AI => new ProviderOpenAI { InstanceName = providerSettings.InstanceName },
Providers.ANTHROPIC => new ProviderAnthropic { InstanceName = providerSettings.InstanceName },
Providers.MISTRAL => new ProviderMistral { InstanceName = providerSettings.InstanceName },


Providers.FIREWORKS => new ProviderFireworks { InstanceName = providerSettings.InstanceName },

Providers.SELF_HOSTED => new ProviderSelfHosted(providerSettings) { InstanceName = providerSettings.InstanceName },

_ => new NoProvider(),
};
}
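
As a rough check (not part of the commit): the extended factory now resolves the new enum value to the Fireworks implementation. A trimmed, stand-alone version of that dispatch, using only names visible in this diff:

using AIStudio.Provider;
using AIStudio.Provider.Fireworks;

// Hypothetical sketch of the dispatch added above, outside the extension method:
static IProvider Create(Providers usedProvider, string instanceName) => usedProvider switch
{
    Providers.FIREWORKS => new ProviderFireworks { InstanceName = instanceName },
    _ => new NoProvider(),
};

var provider = Create(Providers.FIREWORKS, "My Fireworks"); // yields a ProviderFireworks instance
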