Add deepseek v3 (also fix gemma2:27b tag and add qwq:32b mapping)

ServiceStack · Dec 31, 2024 · fabd3a7
1 parent 554c15c
commit fabd3a7
Show file tree

Hide file tree

Showing 4 changed files with 15 additions and 4 deletions.
diff --git a/AiServer.Tests/TestUtils.cs b/AiServer.Tests/TestUtils.cs
@@ -133,7 +133,7 @@ public static JsonApiClient CreateSystemClient()
             ["mistral-nemo:12b"] = "mistralai/mistral-nemo",
             ["gemma:7b"] = "google/gemma-7b-it",
             ["gemma2:9b"] = "google/gemma-2-9b-it",
-            ["gemma2:27"] = "google/gemma-2-27b-it",
+            ["gemma2:27b"] = "google/gemma-2-27b-it",
             ["mixtral:8x7b"] = "mistralai/mixtral-8x7b-instruct",
             ["mixtral:8x22b"] = "mistralai/mixtral-8x22b-instruct",
             ["llama3:8b"] = "meta-llama/llama-3-8b-instruct",
@@ -313,7 +313,7 @@ public static JsonApiClient CreateSystemClient()
         [
             // new() { Model = "gemma:7b", },
             new() { Model = "gemma2:9b", },
-            new() { Model = "gemma2:27", },
+            new() { Model = "gemma2:27b", },
             new() { Model = "mixtral:8x22b", },
             new() { Model = "llama3:8b" },
             new() { Model = "llama3:70b" },

diff --git a/AiServer/wwwroot/img/models/deepseek-3.jpg b/AiServer/wwwroot/img/models/deepseek-3.jpg
diff --git a/AiServer/wwwroot/lib/data/ai-models.json b/AiServer/wwwroot/lib/data/ai-models.json
@@ -173,6 +173,16 @@
     "description": "A strong, economical, and efficient Mixture-of-Experts language model.",
     "icon": "/img/models/deepseek-coder.jpg"
   },
+  {
+    "id": "deepseek-v3",
+    "tags": [
+      "671b"
+    ],
+    "latest": "671b",
+    "website": "https://openrouter.ai/deepseek/deepseek-chat",
+    "description": "DeepSeek-V3 is the latest model from the DeepSeek team, building upon the instruction following and coding abilities of the previous versions. Pre-trained on nearly 15 trillion tokens, the reported evaluations reveal that the model outperforms other open-source models and rivals leading closed-source models.",
+    "icon": "/img/models/deepseek-3.jpg"
+  },
   {
     "id": "dolphin-llama3",
     "tags": [

diff --git a/AiServer/wwwroot/lib/data/ai-types.json b/AiServer/wwwroot/lib/data/ai-types.json
@@ -20,13 +20,13 @@
       "command-r-plus:104b": "cohere/command-r-plus",
       "dbrx:132b": "databricks/dbrx-instruct",
       "deepseek-coder-v2:236b": "deepseek/deepseek-coder",
-      "deepseek-v2:236b": "deepseek/deepseek-chat",
+      "deepseek-v3:671b": "deepseek/deepseek-chat",
       "dolphin-llama3:70b": "cognitivecomputations/dolphin-llama-3-70b",
       "dolphin-mixtral:8x7b": "cognitivecomputations/dolphin-mixtral-8x7b",
       "dolphin-mixtral:8x22b": "cognitivecomputations/dolphin-mixtral-8x22b",
       "gemma:7b": "google/gemma-7b-it",
       "gemma2:9b": "google/gemma-2-9b-it",
-      "gemma2:27": "google/gemma-2-27b-it",
+      "gemma2:27b": "google/gemma-2-27b-it",
       "llama3.1:8b": "meta-llama/llama-3.1-8b-instruct",
       "llama3.1:70b": "meta-llama/llama-3.1-70b-instruct",
       "llama3.1:405b": "meta-llama/llama-3.1-405b-instruct",
@@ -59,6 +59,7 @@
       "qwen2-5:7b": "qwen/qwen-2.5-7b-instruct",
       "qwen2-5:72b": "qwen/qwen-2.5-72b-instruct",
       "qwen2.5-coder:32b": "qwen/qwen-2.5-coder-32b-instruct",
+      "qwq:32b": "qwen/qwq-32b-preview",
       "wizardlm2:7b": "microsoft/wizardlm-2-7b",
       "wizardlm2:8x22b": "microsoft/wizardlm-2-8x22b",
       "zephyr:7b": "huggingfaceh4/zephyr-7b-beta:free",