using System.Net.Http.Headers;
using System.Runtime.CompilerServices;
using System.Text;
using System.Text.Json;

using AIStudio.Chat;
using AIStudio.Settings;

namespace AIStudio.Provider.OpenAI;

/// <summary>
/// The OpenAI provider.
/// </summary>
public sealed class ProviderOpenAI() : BaseProvider("https://api.openai.com/v1/", LOGGER)
{
    private static readonly ILogger<ProviderOpenAI> LOGGER = Program.LOGGER_FACTORY.CreateLogger<ProviderOpenAI>();

    #region Implementation of IProvider

    /// <inheritdoc />
    public override string Id => LLMProviders.OPEN_AI.ToName();

    /// <inheritdoc />
    public override string InstanceName { get; set; } = "OpenAI";

    /// <inheritdoc />
    public override async IAsyncEnumerable<ContentStreamChunk> StreamChatCompletion(Model chatModel, ChatThread chatThread, SettingsManager settingsManager, [EnumeratorCancellation] CancellationToken token = default)
    {
        // Get the API key:
        var requestedSecret = await RUST_SERVICE.GetAPIKey(this);
        if(!requestedSecret.Success)
            yield break;

        // Unfortunately, OpenAI changed the role name of the system prompt depending on the model.
        // All models that start with "o" (the reasoning models), all GPT-4o (omni) models, and all
        // newer models use the role "developer" for the system prompt. All other models use the
        // role "system". We need to check this to send the correct role.
        //
        // To complicate things even more: the early reasoning models, released before
        // December 17, 2024, do not support a system prompt at all. We need to check
        // this as well.

        // Apply the basic rule first:
        var systemPromptRole =
            chatModel.Id.StartsWith('o') ||
            chatModel.Id.StartsWith("gpt-5", StringComparison.Ordinal) ||
            chatModel.Id.Contains("4o") ? "developer" : "system";

        // Check if the model is an early version of the reasoning models:
        systemPromptRole = chatModel.Id switch
        {
            "o1-mini" => "user",
            "o1-mini-2024-09-12" => "user",
            "o1-preview" => "user",
            "o1-preview-2024-09-12" => "user",

            _ => systemPromptRole,
        };
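        // For example: "o3-mini" and "gpt-4o" get the "developer" role, "gpt-4-turbo" keeps the
        // classic "system" role, and "o1-mini" falls back to "user" because these early
        // reasoning models accept no system prompt at all.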

        // Read the model capabilities:
        var modelCapabilities = this.GetModelCapabilities(chatModel);

        // Check if we are using the Responses API or the Chat Completion API:
        var usingResponsesAPI = modelCapabilities.Contains(Capability.RESPONSES_API);

        // Prepare the request path based on the API we are using:
        var requestPath = usingResponsesAPI ? "responses" : "chat/completions";

        LOGGER.LogInformation("Using the system prompt role '{SystemPromptRole}' and the '{RequestPath}' API for model '{ChatModelId}'.", systemPromptRole, requestPath, chatModel.Id);

        // Prepare the system prompt:
        var systemPrompt = new Message
        {
            Role = systemPromptRole,
            Content = chatThread.PrepareSystemPrompt(settingsManager, chatThread),
        };

        //
        // Prepare the tools we want to use:
        //
        IList<Tool> tools = modelCapabilities.Contains(Capability.WEB_SEARCH) switch
        {
            true => [ Tools.WEB_SEARCH ],
            _ => []
        };
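        // Note: this tool list is only attached to the Responses API request below;
        // the Chat Completion API request does not carry a tools field.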

        //
        // Create the request: either for the Responses API or the Chat Completion API
        //
        var openAIChatRequest = usingResponsesAPI switch
        {
            // Chat Completion API request:
            false => JsonSerializer.Serialize(new ChatCompletionAPIRequest
            {
                Model = chatModel.Id,

                // Build the messages:
                // - First of all the system prompt
                // - Then the non-empty user and AI messages
                Messages = [systemPrompt, ..chatThread.Blocks.Where(n => n.ContentType is ContentType.TEXT && !string.IsNullOrWhiteSpace((n.Content as ContentText)?.Text)).Select(n => new Message
                {
                    Role = n.Role switch
                    {
                        ChatRole.USER => "user",
                        ChatRole.AI => "assistant",
                        ChatRole.AGENT => "assistant",
                        ChatRole.SYSTEM => systemPromptRole,

                        _ => "user",
                    },

                    Content = n.Content switch
                    {
                        ContentText text => text.Text,
                        _ => string.Empty,
                    }
                }).ToList()],

                // Right now, we only support streaming completions:
                Stream = true,
            }, JSON_SERIALIZER_OPTIONS),

            // Responses API request:
            true => JsonSerializer.Serialize(new ResponsesAPIRequest
            {
                Model = chatModel.Id,

                // Build the messages:
                // - First of all the system prompt
                // - Then the non-empty user and AI messages
                Input = [systemPrompt, ..chatThread.Blocks.Where(n => n.ContentType is ContentType.TEXT && !string.IsNullOrWhiteSpace((n.Content as ContentText)?.Text)).Select(n => new Message
                {
                    Role = n.Role switch
                    {
                        ChatRole.USER => "user",
                        ChatRole.AI => "assistant",
                        ChatRole.AGENT => "assistant",
                        ChatRole.SYSTEM => systemPromptRole,

                        _ => "user",
                    },

                    Content = n.Content switch
                    {
                        ContentText text => text.Text,
                        _ => string.Empty,
                    }
                }).ToList()],

                // Right now, we only support streaming completions:
                Stream = true,

                // We do not want to store any data on OpenAI's servers:
                Store = false,

                // Tools we want to use:
                Tools = tools,

            }, JSON_SERIALIZER_OPTIONS),
        };
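        // Both payloads carry the same message list; the Responses API request additionally
        // disables server-side storage and attaches the tool list from above.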

        async Task<HttpRequestMessage> RequestBuilder()
        {
            // Build the HTTP post request:
            var request = new HttpRequestMessage(HttpMethod.Post, requestPath);

            // Set the authorization header:
            request.Headers.Authorization = new AuthenticationHeaderValue("Bearer", await requestedSecret.Secret.Decrypt(ENCRYPTION));

            // Set the content:
            request.Content = new StringContent(openAIChatRequest, Encoding.UTF8, "application/json");
            return request;
        }
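        // The streaming helpers take this builder rather than a finished request because an
        // HttpRequestMessage instance can only be sent once.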

        if (usingResponsesAPI)
            await foreach (var content in this.StreamResponsesInternal<ResponsesDeltaStreamLine, ResponsesAnnotationStreamLine>("OpenAI", RequestBuilder, token))
                yield return content;

        else
            await foreach (var content in this.StreamChatCompletionInternal<ChatCompletionDeltaStreamLine, ChatCompletionAnnotationStreamLine>("OpenAI", RequestBuilder, token))
                yield return content;
    }

    #pragma warning disable CS1998 // Async method lacks 'await' operators and will run synchronously

    /// <inheritdoc />
    public override async IAsyncEnumerable<ImageURL> StreamImageCompletion(Model imageModel, string promptPositive, string promptNegative = FilterOperator.String.Empty, ImageURL referenceImageURL = default, [EnumeratorCancellation] CancellationToken token = default)
    {
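        // Image generation is not implemented for this provider; no results are streamed.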
        yield break;
    }

    #pragma warning restore CS1998 // Async method lacks 'await' operators and will run synchronously

    /// <inheritdoc />
    public override async Task<IEnumerable<Model>> GetTextModels(string? apiKeyProvisional = null, CancellationToken token = default)
    {
        var models = await this.LoadModels(["chatgpt-", "gpt-", "o1-", "o3-", "o4-"], token, apiKeyProvisional);
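        // Filter out models that share these prefixes but are not chat models
        // (image generation, realtime, audio, TTS, and transcription models):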
        return models.Where(model => !model.Id.Contains("image", StringComparison.OrdinalIgnoreCase) &&
                                     !model.Id.Contains("realtime", StringComparison.OrdinalIgnoreCase) &&
                                     !model.Id.Contains("audio", StringComparison.OrdinalIgnoreCase) &&
                                     !model.Id.Contains("tts", StringComparison.OrdinalIgnoreCase) &&
                                     !model.Id.Contains("transcribe", StringComparison.OrdinalIgnoreCase));
    }

    /// <inheritdoc />
    public override Task<IEnumerable<Model>> GetImageModels(string? apiKeyProvisional = null, CancellationToken token = default)
    {
        return this.LoadModels(["dall-e-", "gpt-image"], token, apiKeyProvisional);
    }

    /// <inheritdoc />
    public override Task<IEnumerable<Model>> GetEmbeddingModels(string? apiKeyProvisional = null, CancellationToken token = default)
    {
        return this.LoadModels(["text-embedding-"], token, apiKeyProvisional);
    }
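
    /// <inheritdoc />
    /// <remarks>
    /// More specific model IDs are matched before their generic prefixes
    /// (e.g., "o1-mini" before "o1", "gpt-5-nano" before "gpt-5").
    /// </remarks>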
    public override IReadOnlyCollection<Capability> GetModelCapabilities(Model model)
    {
        var modelName = model.Id.ToLowerInvariant().AsSpan();

        if (modelName is "gpt-4o-search-preview")
            return
            [
                Capability.TEXT_INPUT,
                Capability.TEXT_OUTPUT,

                Capability.WEB_SEARCH,
                Capability.CHAT_COMPLETION_API,
            ];

        if (modelName is "gpt-4o-mini-search-preview")
            return
            [
                Capability.TEXT_INPUT,
                Capability.TEXT_OUTPUT,

                Capability.WEB_SEARCH,
                Capability.CHAT_COMPLETION_API,
            ];

        if (modelName.StartsWith("o1-mini"))
            return
            [
                Capability.TEXT_INPUT,
                Capability.TEXT_OUTPUT,

                Capability.ALWAYS_REASONING,
                Capability.CHAT_COMPLETION_API,
            ];

        if(modelName is "gpt-3.5-turbo")
            return
            [
                Capability.TEXT_INPUT,
                Capability.TEXT_OUTPUT,
                Capability.RESPONSES_API,
            ];

        if(modelName.StartsWith("gpt-3.5"))
            return
            [
                Capability.TEXT_INPUT,
                Capability.TEXT_OUTPUT,
                Capability.CHAT_COMPLETION_API,
            ];

        if (modelName.StartsWith("chatgpt-4o-"))
            return
            [
                Capability.TEXT_INPUT, Capability.MULTIPLE_IMAGE_INPUT,
                Capability.TEXT_OUTPUT,
                Capability.RESPONSES_API,
            ];

        if (modelName.StartsWith("o3-mini"))
            return
            [
                Capability.TEXT_INPUT,
                Capability.TEXT_OUTPUT,

                Capability.ALWAYS_REASONING, Capability.FUNCTION_CALLING,
                Capability.RESPONSES_API,
            ];

        if (modelName.StartsWith("o4-mini") || modelName.StartsWith("o3"))
            return
            [
                Capability.TEXT_INPUT, Capability.MULTIPLE_IMAGE_INPUT,
                Capability.TEXT_OUTPUT,

                Capability.ALWAYS_REASONING, Capability.FUNCTION_CALLING,
                Capability.WEB_SEARCH,
                Capability.RESPONSES_API,
            ];

        if (modelName.StartsWith("o1"))
            return
            [
                Capability.TEXT_INPUT, Capability.MULTIPLE_IMAGE_INPUT,
                Capability.TEXT_OUTPUT,

                Capability.ALWAYS_REASONING, Capability.FUNCTION_CALLING,
                Capability.RESPONSES_API,
            ];

        if(modelName.StartsWith("gpt-4-turbo"))
            return
            [
                Capability.TEXT_INPUT, Capability.MULTIPLE_IMAGE_INPUT,
                Capability.TEXT_OUTPUT,

                Capability.FUNCTION_CALLING,
                Capability.RESPONSES_API,
            ];

        if(modelName is "gpt-4" || modelName.StartsWith("gpt-4-"))
            return
            [
                Capability.TEXT_INPUT,
                Capability.TEXT_OUTPUT,
                Capability.RESPONSES_API,
            ];

        if(modelName.StartsWith("gpt-5-nano"))
            return
            [
                Capability.TEXT_INPUT, Capability.MULTIPLE_IMAGE_INPUT,
                Capability.TEXT_OUTPUT,

                Capability.FUNCTION_CALLING, Capability.ALWAYS_REASONING,
                Capability.RESPONSES_API,
            ];

        if(modelName is "gpt-5" || modelName.StartsWith("gpt-5-"))
            return
            [
                Capability.TEXT_INPUT, Capability.MULTIPLE_IMAGE_INPUT,
                Capability.TEXT_OUTPUT,

                Capability.FUNCTION_CALLING, Capability.ALWAYS_REASONING,
                Capability.WEB_SEARCH,
                Capability.RESPONSES_API,
            ];

        return
        [
            Capability.TEXT_INPUT, Capability.MULTIPLE_IMAGE_INPUT,
            Capability.TEXT_OUTPUT,

            Capability.FUNCTION_CALLING,
            Capability.RESPONSES_API,
        ];
    }

    #endregion
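
    /// <summary>
    /// Loads the available models from OpenAI's <c>models</c> endpoint and keeps only those
    /// whose ID starts with one of the given prefixes. Returns an empty list when no API key
    /// is available or the request fails.
    /// </summary>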
    private async Task<IEnumerable<Model>> LoadModels(string[] prefixes, CancellationToken token, string? apiKeyProvisional = null)
    {
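        // Prefer the provisional API key when one was handed in; otherwise decrypt the stored secret: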
        var secretKey = apiKeyProvisional switch
        {
            not null => apiKeyProvisional,
            _ => await RUST_SERVICE.GetAPIKey(this) switch
            {
                { Success: true } result => await result.Secret.Decrypt(ENCRYPTION),
                _ => null,
            }
        };

        if (secretKey is null)
            return [];

        using var request = new HttpRequestMessage(HttpMethod.Get, "models");
        request.Headers.Authorization = new AuthenticationHeaderValue("Bearer", secretKey);

        using var response = await this.httpClient.SendAsync(request, token);
        if(!response.IsSuccessStatusCode)
            return [];

        var modelResponse = await response.Content.ReadFromJsonAsync<ModelsResponse>(token);
        return modelResponse.Data.Where(model => prefixes.Any(prefix => model.Id.StartsWith(prefix, StringComparison.InvariantCulture)));
    }
}