mirror of
https://github.com/ollama/ollama.git
synced 2026-04-27 19:25:55 +02:00
mlx: int4 groupsize 64 (#14682)
Change affine 4-bit integer (int4) quantization to use a group size of 64 instead of 32.
This commit is contained in:
@@ -21,7 +21,7 @@ var quantizeParams = map[string]struct {
|
||||
bits int
|
||||
mode string
|
||||
}{
|
||||
"int4": {32, 4, "affine"},
|
||||
"int4": {64, 4, "affine"},
|
||||
"nvfp4": {16, 4, "nvfp4"},
|
||||
"int8": {64, 8, "affine"},
|
||||
"mxfp8": {32, 8, "mxfp8"},
|
||||
|
||||
Reference in New Issue
Block a user