From 6bcbe286f34b828672a7bbdffbfa7b3548259642 Mon Sep 17 00:00:00 2001 From: Enrico Ros Date: Mon, 13 May 2024 11:47:55 -0700 Subject: [PATCH] OpenAI: add support for 'o' models --- src/modules/llms/server/openai/models.data.ts | 30 ++++++++++++++++++- 1 file changed, 29 insertions(+), 1 deletion(-) diff --git a/src/modules/llms/server/openai/models.data.ts b/src/modules/llms/server/openai/models.data.ts index d26b451664..aed9b3b3d7 100644 --- a/src/modules/llms/server/openai/models.data.ts +++ b/src/modules/llms/server/openai/models.data.ts @@ -11,11 +11,39 @@ import { wireTogetherAIListOutputSchema } from './togetherai.wiretypes'; // [Azure] / [OpenAI] const _knownOpenAIChatModels: ManualMappings = [ + // GPT-4o -> 2024-05-13 + { + idPrefix: 'gpt-4o', + label: 'GPT-4o', + description: 'Currently points to gpt-4o-2024-05-13.', + symLink: 'gpt-4o-2024-05-13', + hidden: true, + // copied from symlinked + contextWindow: 128000, + maxCompletionTokens: 4096, + trainingDataCutoff: 'Oct 2023', + interfaces: [LLM_IF_OAI_Chat, LLM_IF_OAI_Vision, LLM_IF_OAI_Fn, LLM_IF_OAI_Json], + pricing: { chatIn: 5, chatOut: 15 }, + benchmark: { cbaElo: 1310 }, + }, + { + isLatest: true, + idPrefix: 'gpt-4o-2024-05-13', + label: 'GPT-4o (2024-05-13)', + description: 'Advanced, multimodal flagship model that’s cheaper and faster than GPT-4 Turbo.', + contextWindow: 128000, + maxCompletionTokens: 4096, + trainingDataCutoff: 'Oct 2023', + interfaces: [LLM_IF_OAI_Chat, LLM_IF_OAI_Vision, LLM_IF_OAI_Fn, LLM_IF_OAI_Json], + pricing: { chatIn: 5, chatOut: 15 }, + benchmark: { cbaElo: 1310 }, + }, + // GPT4 Turbo with Vision -> 2024-04-09 { idPrefix: 'gpt-4-turbo', label: 'GPT-4 Turbo', - description: 'GPT-4 Turbo with Vision. The latest GPT-4 Turbo model with vision capabilities. Vision requests can now use JSON mode and function calling. Currently points to gpt-4-turbo-2024-04-09.', + description: 'New GPT-4 Turbo with Vision. The latest GPT-4 Turbo model with vision capabilities. Vision requests can now use JSON mode and function calling. Currently points to gpt-4-turbo-2024-04-09.', symLink: 'gpt-4-turbo-2024-04-09', hidden: true, // copied from symlinked