From 604e43b28d12677c96675ba368eee20a2bed2c24 Mon Sep 17 00:00:00 2001 From: Patrick Devine Date: Tue, 18 Nov 2025 22:03:50 -0800 Subject: [PATCH] models: enable deepseek2 (deepseek v3.1 w/ MLA) on the new engine (#13151) --- fs/ggml/ggml.go | 1 + model/models/deepseek2/model.go | 5 +++++ 2 files changed, 6 insertions(+) diff --git a/fs/ggml/ggml.go b/fs/ggml/ggml.go index 205279c6..dcd1234d 100644 --- a/fs/ggml/ggml.go +++ b/fs/ggml/ggml.go @@ -250,6 +250,7 @@ func (kv KV) OllamaEngineRequired() bool { "qwen3", "qwen3moe", "qwen3vl", "qwen3vlmoe", "deepseekocr", + "deepseek2", }, kv.Architecture()) } diff --git a/model/models/deepseek2/model.go b/model/models/deepseek2/model.go index c1251ecf..99c57959 100644 --- a/model/models/deepseek2/model.go +++ b/model/models/deepseek2/model.go @@ -236,6 +236,11 @@ type Model struct { } func New(c fs.Config) (model.Model, error) { + if c.Uint("attention.key_length_mla") == 0 { + // non-MLA models aren't yet supported + return nil, model.ErrUnsupportedModel + } + layers := make([]Layer, c.Uint("block_count")) firstDenseLayerIndex := int(c.Uint("leading_dense_block_count"))