Skip to content

Commit 0d6d026

Browse files
committed
Use 4-bit quantized models
1 parent 91449cf commit 0d6d026

File tree

2 files changed

+8
-8
lines changed

2 files changed

+8
-8
lines changed

Libraries/MLXVLM/VLMModelFactory.swift

Lines changed: 6 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -169,14 +169,14 @@ public class VLMRegistry: AbstractModelRegistry, @unchecked Sendable {
169 169   extraEOSTokens: ["<end_of_turn>"]
170 170   )
171 171
172     - static public let gemma3n_E2B_instruct = ModelConfiguration(
173     - id: "mlx-community/gemma-3n-E2B-it-bf16",
    172 + static public let gemma3n_E2B = ModelConfiguration(
    173 + id: "mlx-community/gemma-3n-E2B-it-4bit",
174 174   defaultPrompt: "Describe this image.",
175 175   extraEOSTokens: ["<end_of_turn>"]
176 176   )
177 177
178     - static public let gemma3n_E4B_instruct = ModelConfiguration(
179     - id: "mlx-community/gemma-3n-E4B-it-bf16",
    178 + static public let gemma3n_E4B = ModelConfiguration(
    179 + id: "mlx-community/gemma-3n-E4B-it-4bit",
180 180   defaultPrompt: "Describe this image.",
181 181   extraEOSTokens: ["<end_of_turn>"]
182 182   )
@@ -196,8 +196,8 @@ public class VLMRegistry: AbstractModelRegistry, @unchecked Sendable {
196 196   gemma3_4B_qat_4bit,
197 197   gemma3_12B_qat_4bit,
198 198   gemma3_27B_qat_4bit,
199     - gemma3n_E2B_instruct,
200     - gemma3n_E4B_instruct,
    199 + gemma3n_E2B,
    200 + gemma3n_E4B,
201 201   smolvlm,
202 202   ]
203 203   }

Tools/llm-tool/LLMTool.swift

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -302,9 +302,9 @@ struct EvaluateCommand: AsyncParsableCommand {
302 302   let modelFactory: ModelFactory
303 303   let defaultModel: ModelConfiguration
304 304
305     - // Always use VLM factory and gemma3n_E2B_instruct for testing
    305 + // Always use VLM factory and gemma3n_E2B for testing
306 306   modelFactory = VLMModelFactory.shared
307     - defaultModel = MLXVLM.VLMRegistry.gemma3n_E2B_instruct
    307 + defaultModel = MLXVLM.VLMRegistry.gemma3n_E2B
308 308
309 309   // Load the model
310 310   let modelContainer = try await memory.start { [args] in

0 commit comments

Comments
 (0)