Unverified commit 604e43b2, authored by Patrick Devine and committed by GitHub
Browse files

models: enable deepseek2 (deepseek v3.1 w/ MLA) on the new engine (#13151)

parent 53985b3c
...@@ -250,6 +250,7 @@ func (kv KV) OllamaEngineRequired() bool { ...@@ -250,6 +250,7 @@ func (kv KV) OllamaEngineRequired() bool {
"qwen3", "qwen3moe", "qwen3", "qwen3moe",
"qwen3vl", "qwen3vlmoe", "qwen3vl", "qwen3vlmoe",
"deepseekocr", "deepseekocr",
"deepseek2",
}, kv.Architecture()) }, kv.Architecture())
} }
......
...@@ -236,6 +236,11 @@ type Model struct { ...@@ -236,6 +236,11 @@ type Model struct {
} }
func New(c fs.Config) (model.Model, error) { func New(c fs.Config) (model.Model, error) {
if c.Uint("attention.key_length_mla") == 0 {
// non-MLA models aren't yet supported
return nil, model.ErrUnsupportedModel
}
layers := make([]Layer, c.Uint("block_count")) layers := make([]Layer, c.Uint("block_count"))
firstDenseLayerIndex := int(c.Uint("leading_dense_block_count")) firstDenseLayerIndex := int(c.Uint("leading_dense_block_count"))
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment