Unverified commit 9a3c8003, authored by Michael Yang, committed by GitHub
Browse files

Merge pull request #4624 from ollama/mxyng/fix-5

fix q5_0, q5_1
parents 4cc3be30 d51f1525
...@@ -125,9 +125,9 @@ type Tensor struct { ...@@ -125,9 +125,9 @@ type Tensor struct {
func (t Tensor) blockSize() uint64 { func (t Tensor) blockSize() uint64 {
switch t.Kind { switch t.Kind {
case 0, 1, 24, 25, 26, 27, 28, 31: // F32, F16, I8, I16, I32, I64, F64, BF16 case 0, 1, 24, 25, 26, 27, 28, 30: // F32, F16, I8, I16, I32, I64, F64, BF16
return 1 return 1
case 2, 3, 8, 9, 20: // Q4_0, Q4_1, Q8_0, Q8_1, IQ4_NL case 2, 3, 4, 5, 6, 7, 8, 9, 20: // Q4_0, Q4_1, Q5_0, Q5_1, Q8_0, Q8_1, IQ4_NL
return 32 return 32
default: // All others default: // All others
return 256 return 256
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment