From dd8625f8cac4b8f2c8411c7fbec45b1914d13de6 Mon Sep 17 00:00:00 2001 From: Ankur Goyal Date: Sat, 4 Jan 2025 12:10:26 -0800 Subject: [PATCH] Add deepseek models --- packages/proxy/schema/index.ts | 2 ++ packages/proxy/schema/models.ts | 14 ++++++++++++++ 2 files changed, 16 insertions(+) diff --git a/packages/proxy/schema/index.ts b/packages/proxy/schema/index.ts index dde6156..9e7cf54 100644 --- a/packages/proxy/schema/index.ts +++ b/packages/proxy/schema/index.ts @@ -181,6 +181,7 @@ export const AvailableEndpointTypes: { [name: string]: ModelEndpointType[] } = { "NousResearch/Nous-Hermes-2-Yi-34B": ["together"], "deepseek-ai/deepseek-coder-33b-instruct": ["together"], "meta-llama/Llama-3.3-70B-Instruct-Turbo": ["together"], + "deepseek-ai/DeepSeek-V3": ["together"], "mistral-large-latest": ["mistral"], "open-mistral-nemo": ["mistral"], "codestral-latest": ["mistral"], @@ -212,6 +213,7 @@ export const AvailableEndpointTypes: { [name: string]: ModelEndpointType[] } = { "accounts/fireworks/models/llama-v3p1-70b-instruct": ["fireworks"], "accounts/fireworks/models/llama-v3p2-90b-vision-instruct": ["fireworks"], "accounts/fireworks/models/llama-v3p1-405b-instruct": ["fireworks"], + "accounts/fireworks/models/deepseek-v3": ["fireworks"], "anthropic.claude-3-5-sonnet-20241022-v2:0": ["bedrock"], "anthropic.claude-3-opus-20240229-v1:0": ["bedrock"], "anthropic.claude-3-haiku-20240307-v1:0": ["bedrock"], diff --git a/packages/proxy/schema/models.ts b/packages/proxy/schema/models.ts index cf80991..d0292cf 100644 --- a/packages/proxy/schema/models.ts +++ b/packages/proxy/schema/models.ts @@ -712,6 +712,13 @@ export const AvailableModels: { [name: string]: ModelSpec } = { output_cost_per_mil_tokens: 0.8, displayName: "Nous Hermes 2 Yi 34B", }, + "deepseek-ai/DeepSeek-V3": { + format: "openai", + flavor: "chat", + input_cost_per_mil_tokens: 2.5, + output_cost_per_mil_tokens: 2.5, + displayName: "DeepSeek V3", + }, "deepseek-ai/deepseek-coder-33b-instruct": { format: "openai", flavor: "chat", @@ -930,6 +937,13 @@ export const AvailableModels: { [name: string]: ModelSpec } = { input_cost_per_mil_tokens: 3, output_cost_per_mil_tokens: 3, }, + "accounts/fireworks/models/deepseek-v3": { + format: "openai", + flavor: "chat", + displayName: "DeepSeek v3", + input_cost_per_mil_tokens: 0.9, + output_cost_per_mil_tokens: 0.9, + }, // CEREBRAS MODELS "llama3.1-8b": {