Skip to content

Commit

Permalink
Add deepseek v3
Browse files: browse the repository at this point in the history
  • Loading branch information
mythz committed Dec 31, 2024
1 parent 554c15c commit fabd3a7
Show file tree
Hide file tree
Showing 4 changed files with 15 additions and 4 deletions.
4 changes: 2 additions & 2 deletions AiServer.Tests/TestUtils.cs
Original file line number Diff line number Diff line change
@@ -133,7 +133,7 @@ public static JsonApiClient CreateSystemClient()
  ["mistral-nemo:12b"] = "mistralai/mistral-nemo",
  ["gemma:7b"] = "google/gemma-7b-it",
  ["gemma2:9b"] = "google/gemma-2-9b-it",
- ["gemma2:27"] = "google/gemma-2-27b-it",
+ ["gemma2:27b"] = "google/gemma-2-27b-it",
  ["mixtral:8x7b"] = "mistralai/mixtral-8x7b-instruct",
  ["mixtral:8x22b"] = "mistralai/mixtral-8x22b-instruct",
  ["llama3:8b"] = "meta-llama/llama-3-8b-instruct",
@@ -313,7 +313,7 @@ public static JsonApiClient CreateSystemClient()
  [
  // new() { Model = "gemma:7b", },
  new() { Model = "gemma2:9b", },
- new() { Model = "gemma2:27", },
+ new() { Model = "gemma2:27b", },
  new() { Model = "mixtral:8x22b", },
  new() { Model = "llama3:8b" },
  new() { Model = "llama3:70b" },
Expand Down
Binary file added AiServer/wwwroot/img/models/deepseek-3.jpg
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
10 changes: 10 additions & 0 deletions AiServer/wwwroot/lib/data/ai-models.json
Original file line number Diff line number Diff line change
@@ -173,6 +173,16 @@
  "description": "A strong, economical, and efficient Mixture-of-Experts language model.",
  "icon": "/img/models/deepseek-coder.jpg"
  },
+ {
+ "id": "deepseek-v3",
+ "tags": [
+ "671b"
+ ],
+ "latest": "671b",
+ "website": "https://openrouter.ai/deepseek/deepseek-chat",
+ "description": "DeepSeek-V3 is the latest model from the DeepSeek team, building upon the instruction following and coding abilities of the previous versions. Pre-trained on nearly 15 trillion tokens, the reported evaluations reveal that the model outperforms other open-source models and rivals leading closed-source models.",
+ "icon": "/img/models/deepseek-3.jpg"
+ },
  {
  "id": "dolphin-llama3",
  "tags": [
Expand Down
5 changes: 3 additions & 2 deletions AiServer/wwwroot/lib/data/ai-types.json
Original file line number Diff line number Diff line change
@@ -20,13 +20,13 @@
  "command-r-plus:104b": "cohere/command-r-plus",
  "dbrx:132b": "databricks/dbrx-instruct",
  "deepseek-coder-v2:236b": "deepseek/deepseek-coder",
- "deepseek-v2:236b": "deepseek/deepseek-chat",
+ "deepseek-v3:671b": "deepseek/deepseek-chat",
  "dolphin-llama3:70b": "cognitivecomputations/dolphin-llama-3-70b",
  "dolphin-mixtral:8x7b": "cognitivecomputations/dolphin-mixtral-8x7b",
  "dolphin-mixtral:8x22b": "cognitivecomputations/dolphin-mixtral-8x22b",
  "gemma:7b": "google/gemma-7b-it",
  "gemma2:9b": "google/gemma-2-9b-it",
- "gemma2:27": "google/gemma-2-27b-it",
+ "gemma2:27b": "google/gemma-2-27b-it",
  "llama3.1:8b": "meta-llama/llama-3.1-8b-instruct",
  "llama3.1:70b": "meta-llama/llama-3.1-70b-instruct",
  "llama3.1:405b": "meta-llama/llama-3.1-405b-instruct",
@@ -59,6 +59,7 @@
  "qwen2-5:7b": "qwen/qwen-2.5-7b-instruct",
  "qwen2-5:72b": "qwen/qwen-2.5-72b-instruct",
  "qwen2.5-coder:32b": "qwen/qwen-2.5-coder-32b-instruct",
+ "qwq:32b": "qwen/qwq-32b-preview",
  "wizardlm2:7b": "microsoft/wizardlm-2-7b",
  "wizardlm2:8x22b": "microsoft/wizardlm-2-8x22b",
  "zephyr:7b": "huggingfaceh4/zephyr-7b-beta:free",
Expand Down

0 comments on commit fabd3a7

Please sign in to comment.