Add thudm glm + phi-4 reasoning models

mythz · mythz · commit 7ee1e66943d6 · 2025-05-02T19:16:53.000+08:00
diff --git a/AiServer/wwwroot/img/models/thudm.webp b/AiServer/wwwroot/img/models/thudm.webp
diff --git a/AiServer/wwwroot/lib/data/ai-models.json b/AiServer/wwwroot/lib/data/ai-models.json
@@ -805,6 +805,26 @@
     "description": "Phi 4 is a 14B parameter, state-of-the-art open model from Microsoft.",
     "icon": "/img/models/phi4.svg"
   },
+  {
+    "id": "phi-4-reasoning",
+    "tags": [
+      "14b"
+    ],
+    "latest": "14b",
+    "website": "https://openrouter.ai/microsoft/phi-4-reasoning",
+    "description": "Phi-4-reasoning is a 14B parameter dense decoder-only transformer developed by Microsoft, fine-tuned from Phi-4 to enhance complex reasoning capabilities. It uses a combination of supervised fine-tuning on chain-of-thought traces and reinforcement learning, targeting math, science, and code reasoning tasks. With a 32k context window and high inference efficiency, it is optimized for structured responses in a two-part format: reasoning trace followed by a final solution.",
+    "icon": "/img/models/phi4.svg"
+  },
+  {
+    "id": "phi-4-reasoning-plus",
+    "tags": [
+      "14b"
+    ],
+    "latest": "14b",
+    "website": "https://openrouter.ai/microsoft/phi-4-reasoning-plus",
+    "description": "Phi-4-reasoning-plus is an enhanced 14B parameter model from Microsoft, fine-tuned from Phi-4 with additional reinforcement learning to boost accuracy on math, science, and code reasoning tasks. It uses the same dense decoder-only transformer architecture as Phi-4, but generates longer, more comprehensive outputs structured into a step-by-step reasoning trace and final answer.",
+    "icon": "/img/models/phi4.svg"
+  },
   {
     "id": "phind-codellama",
     "tags": [
@@ -1389,5 +1409,12 @@
     "website": "https://openrouter.ai/amazon/nova-pro-v1",
     "description": "A capable multimodal model from Amazon focused on providing a combination of accuracy, speed, and cost for a wide range of tasks. As of December 2024, it achieves state-of-the-art performance on key benchmarks including visual question answering (TextVQA) and video understanding (VATEX).",
     "icon": "/img/models/aws.svg"
+  },
+  {
+    "id": "glm-4-32b",
+    "tags": [],
+    "website": "https://openrouter.ai/thudm/glm-4-32b",
+    "description": "GLM-4-32B-0414 is a 32B bilingual (Chinese-English) open-weight language model optimized for code generation, function calling, and agent-style tasks. Pretrained on 15T tokens of high-quality and reasoning-heavy data, it was further refined using human preference alignment, rejection sampling, and reinforcement learning. The model excels in complex reasoning, artifact generation, and structured output tasks, achieving performance comparable to GPT-4o and DeepSeek-V3-0324 across several benchmarks.",
+    "icon": "/img/models/thudm.webp"
   }
 ]
diff --git a/AiServer/wwwroot/lib/data/ai-types.json b/AiServer/wwwroot/lib/data/ai-types.json
@@ -53,6 +53,8 @@
       "phi3:3.8b": "microsoft/phi-3-mini-128k-instruct",
       "phi3:14b": "microsoft/phi-3-medium-128k-instruct",
       "phi4:14b": "microsoft/phi-4",
+      "phi-4-reasoning:14b": "microsoft/phi-4-reasoning",
+      "phi-4-reasoning-plus:14b": "microsoft/phi-4-reasoning-plus",
       "qwen2:7b": "qwen/qwen-2-7b-instruct",
       "qwen2:72b": "qwen/qwen-2-72b-instruct",
       "qwen2-5:7b": "qwen/qwen-2.5-7b-instruct",
@@ -93,7 +95,8 @@
       "claude-3-sonnet": "anthropic/claude-3-sonnet",
       "claude-3-opus": "anthropic/claude-3-opus",
       "claude-3-5-sonnet": "anthropic/claude-3.5-sonnet",
-      "yi-large": "01-ai/yi-large"
+      "yi-large": "01-ai/yi-large",
+      "glm-4-32b": "thudm/glm-4-32b"
     }
   },
   {
@@ -119,14 +122,17 @@
       "deepseek-r1-zero:671b": "deepseek/deepseek-r1-zero:free",
       "phi3:3.8b": "microsoft/phi-3-mini-128k-instruct:free",
       "phi3:14b": "microsoft/phi-3-medium-128k-instruct:free",
+      "phi-4-reasoning:14b": "microsoft/phi-4-reasoning:free",
+      "phi-4-reasoning-plus:14b": "microsoft/phi-4-reasoning-plus:free",
       "qwen-vl-plus": "qwen/qwen-vl-plus:free",
       "qwq:32b": "qwen/qwq-32b:free",
       "qwen3:8b": "qwen/qwen3-8b:free",
       "qwen3:30b": "qwen/qwen3-30b-a3b:free",
       "qwen3:32b": "qwen/qwen3-32b:free",
       "qwen3:235b": "qwen/qwen3-235b-a22b:free",
       "gemini-pro": "google/gemini-2.5-pro-exp-03-25:free",
-      "gemini-pro-2.5": "google/gemini-2.5-pro-exp-03-25:free"
+      "gemini-pro-2.5": "google/gemini-2.5-pro-exp-03-25:free",
+      "glm-4-32b": "thudm/glm-4-32b:free"
     }
   },
   {
diff --git a/AiServer/wwwroot/lib/data/media-models.json b/AiServer/wwwroot/lib/data/media-models.json
@@ -116,7 +116,7 @@
     "dependencies": [
       "clip_l.safetensors",
       "clip_g.safetensors",
-      "t5xxl_fp8_e4m3fn_scaled.safetensors"
+      "t5xxl_fp8_e4m3fn.safetensors"
     ],
     "installer": "Text to Image (15G Stable Diffusion 3.5 FP8)",
     "path": "/data/models/checkpoints/sd3.5_large_fp8_scaled.safetensors",
@@ -134,8 +134,37 @@
     "url": "https://huggingface.co/Comfy-Org/stable-diffusion-3.5-fp8"
   },
   {
-    "id": "hidream_i1_dev",
-    "name": "HiDream I1 Dev",
+    "id": "hidream_i1_fast_fp8",
+    "name": "HiDream I1 Fast FP8",
+    "type": "TextToImage",
+    "apiModels": {
+      "ComfyUI": "hidream_i1_fast_fp8.safetensors"
+    },
+    "installer": "Text to Image (17G HiDream I1 Fast FP8)",
+    "path": "/data/models/checkpoints/hidream_i1_fast_fp8.safetensors",
+    "dependencies": [
+      "clip_l_hidream.safetensors",
+      "clip_g_hidream.safetensors",
+      "t5xxl_fp8_e4m3fn.safetensors",
+      "llama_3.1_8b_instruct_fp8_scaled.safetensors",
+      "ae.safetensors"
+    ],
+    "workflow": "text-to-image/hidream.json",
+    "workflowVars": {
+      "cfgScale": 1,
+      "steps": 28,
+      "scheduler": "normal",
+      "sampler": "lcm",
+      "width": 1024,
+      "height": 1024,
+      "batchSize": 1
+    },
+    "downloadUrl": "https://huggingface.co/Comfy-Org/HiDream-I1_ComfyUI/resolve/main/split_files/diffusion_models/hidream_i1_fast_fp8.safetensors",
+    "url": "https://comfyanonymous.github.io/ComfyUI_examples/hidream/"
+  },
+  {
+    "id": "hidream_i1_dev_fp8",
+    "name": "HiDream I1 Dev FP8",
     "type": "TextToImage",
     "apiModels": {
       "ComfyUI": "hidream_i1_dev_fp8.safetensors"