AI-Studio/app/MindWork AI Studio/Provider/OpenAI/ProviderOpenAI.cs

167 lines
6.6 KiB
C#
Raw Normal View History

2024-05-04 09:11:23 +00:00
using System.Net.Http.Headers;
using System.Runtime.CompilerServices;
using System.Text;
using System.Text.Json;
using AIStudio.Chat;
using AIStudio.Settings;
2024-05-04 09:11:23 +00:00
namespace AIStudio.Provider.OpenAI;
/// <summary>
/// The OpenAI provider.
/// </summary>
2024-12-03 14:24:40 +00:00
public sealed class ProviderOpenAI(ILogger logger) : BaseProvider("https://api.openai.com/v1/", logger)
2024-05-04 09:11:23 +00:00
{
#region Implementation of IProvider
/// <inheritdoc />
2024-12-03 14:24:40 +00:00
public override string Id => LLMProviders.OPEN_AI.ToName();
2024-05-04 09:11:23 +00:00
/// <inheritdoc />
2024-12-03 14:24:40 +00:00
public override string InstanceName { get; set; } = "OpenAI";
2024-05-04 09:11:23 +00:00
/// <inheritdoc />
public override async IAsyncEnumerable<string> StreamChatCompletion(Model chatModel, ChatThread chatThread, SettingsManager settingsManager, [EnumeratorCancellation] CancellationToken token = default)
2024-05-04 09:11:23 +00:00
{
// Get the API key:
2024-09-01 18:10:03 +00:00
var requestedSecret = await RUST_SERVICE.GetAPIKey(this);
2024-05-04 09:11:23 +00:00
if(!requestedSecret.Success)
yield break;
2025-01-01 19:11:42 +00:00
// Unfortunately, OpenAI changed the name of the system prompt based on the model.
// All models that start with "o" (the omni aka reasoning models) and all GPT4o models
// have the system prompt named "developer". All other models have the system prompt
// named "system". We need to check this to get the correct system prompt.
//
// To complicate it even more: The early versions of reasoning models, which are released
// before the 17th of December 2024, have no system prompt at all. We need to check this
// as well.
// Apply the basic rule first:
var systemPromptRole = chatModel.Id.StartsWith('o') || chatModel.Id.Contains("4o") ? "developer" : "system";
// Check if the model is an early version of the reasoning models:
systemPromptRole = chatModel.Id switch
{
"o1-mini" => "user",
"o1-mini-2024-09-12" => "user",
"o1-preview" => "user",
"o1-preview-2024-09-12" => "user",
_ => systemPromptRole,
};
this.logger.LogInformation($"Using the system prompt role '{systemPromptRole}' for model '{chatModel.Id}'.");
2024-05-04 09:11:23 +00:00
// Prepare the system prompt:
var systemPrompt = new Message
{
2025-01-01 19:11:42 +00:00
Role = systemPromptRole,
Content = chatThread.PrepareSystemPrompt(settingsManager, chatThread, this.logger),
2024-05-04 09:11:23 +00:00
};
// Prepare the OpenAI HTTP chat request:
var openAIChatRequest = JsonSerializer.Serialize(new ChatRequest
{
Model = chatModel.Id,
// Build the messages:
// - First of all the system prompt
// - Then none-empty user and AI messages
Messages = [systemPrompt, ..chatThread.Blocks.Where(n => n.ContentType is ContentType.TEXT && !string.IsNullOrWhiteSpace((n.Content as ContentText)?.Text)).Select(n => new Message
{
Role = n.Role switch
{
ChatRole.USER => "user",
ChatRole.AI => "assistant",
ChatRole.AGENT => "assistant",
2025-01-01 19:11:42 +00:00
ChatRole.SYSTEM => systemPromptRole,
2024-05-04 09:11:23 +00:00
_ => "user",
},
Content = n.Content switch
{
ContentText text => text.Text,
_ => string.Empty,
}
}).ToList()],
Seed = chatThread.Seed,
// Right now, we only support streaming completions:
Stream = true,
}, JSON_SERIALIZER_OPTIONS);
2025-01-04 13:11:32 +00:00
async Task<HttpRequestMessage> RequestBuilder()
2025-01-01 14:49:27 +00:00
{
2025-01-04 13:11:32 +00:00
// Build the HTTP post request:
var request = new HttpRequestMessage(HttpMethod.Post, "chat/completions");
2025-01-01 14:49:27 +00:00
2025-01-04 13:11:32 +00:00
// Set the authorization header:
request.Headers.Authorization = new AuthenticationHeaderValue("Bearer", await requestedSecret.Secret.Decrypt(ENCRYPTION));
2025-01-01 14:49:27 +00:00
2025-01-04 13:11:32 +00:00
// Set the content:
request.Content = new StringContent(openAIChatRequest, Encoding.UTF8, "application/json");
return request;
}
2024-05-04 09:11:23 +00:00
2025-01-04 13:11:32 +00:00
await foreach (var content in this.StreamChatCompletionInternal<ResponseStreamLine>("OpenAI", RequestBuilder, token))
yield return content;
2024-05-04 09:11:23 +00:00
}
#pragma warning disable CS1998 // Async method lacks 'await' operators and will run synchronously
/// <inheritdoc />
2024-12-03 14:24:40 +00:00
public override async IAsyncEnumerable<ImageURL> StreamImageCompletion(Model imageModel, string promptPositive, string promptNegative = FilterOperator.String.Empty, ImageURL referenceImageURL = default, [EnumeratorCancellation] CancellationToken token = default)
2024-05-04 09:11:23 +00:00
{
yield break;
}
#pragma warning restore CS1998 // Async method lacks 'await' operators and will run synchronously
/// <inheritdoc />
2024-12-03 14:24:40 +00:00
public override Task<IEnumerable<Model>> GetTextModels(string? apiKeyProvisional = null, CancellationToken token = default)
2024-05-04 09:11:23 +00:00
{
2024-09-12 20:58:32 +00:00
return this.LoadModels(["gpt-", "o1-"], token, apiKeyProvisional);
2024-05-04 09:11:23 +00:00
}
/// <inheritdoc />
2024-12-03 14:24:40 +00:00
public override Task<IEnumerable<Model>> GetImageModels(string? apiKeyProvisional = null, CancellationToken token = default)
2024-05-04 09:11:23 +00:00
{
2024-09-12 20:58:32 +00:00
return this.LoadModels(["dall-e-"], token, apiKeyProvisional);
2024-05-04 09:11:23 +00:00
}
2024-12-03 14:24:40 +00:00
/// <inheritdoc />
public override Task<IEnumerable<Model>> GetEmbeddingModels(string? apiKeyProvisional = null, CancellationToken token = default)
{
return this.LoadModels(["text-embedding-"], token, apiKeyProvisional);
}
2024-05-04 09:11:23 +00:00
#endregion
2024-09-12 20:58:32 +00:00
private async Task<IEnumerable<Model>> LoadModels(string[] prefixes, CancellationToken token, string? apiKeyProvisional = null)
2024-05-04 09:11:23 +00:00
{
2024-06-03 17:42:53 +00:00
var secretKey = apiKeyProvisional switch
{
not null => apiKeyProvisional,
2024-09-01 18:10:03 +00:00
_ => await RUST_SERVICE.GetAPIKey(this) switch
2024-06-03 17:42:53 +00:00
{
2024-09-01 18:10:03 +00:00
{ Success: true } result => await result.Secret.Decrypt(ENCRYPTION),
2024-06-03 17:42:53 +00:00
_ => null,
}
};
if (secretKey is null)
2024-05-19 14:14:49 +00:00
return [];
2024-05-04 09:11:23 +00:00
var request = new HttpRequestMessage(HttpMethod.Get, "models");
2024-06-03 17:42:53 +00:00
request.Headers.Authorization = new AuthenticationHeaderValue("Bearer", secretKey);
2024-05-19 14:14:49 +00:00
2024-05-04 09:11:23 +00:00
var response = await this.httpClient.SendAsync(request, token);
if(!response.IsSuccessStatusCode)
2024-05-19 14:14:49 +00:00
return [];
2024-05-04 09:11:23 +00:00
var modelResponse = await response.Content.ReadFromJsonAsync<ModelsResponse>(token);
2024-09-12 20:58:32 +00:00
return modelResponse.Data.Where(model => prefixes.Any(prefix => model.Id.StartsWith(prefix, StringComparison.InvariantCulture)));
2024-05-04 09:11:23 +00:00
}
}