mirror of
https://github.com/ollama/ollama.git
synced 2026-04-17 19:54:03 +02:00
mlx: additional gemma4 cache fixes (#15607)
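Harden additional corner cases: RotatingKVCache.State() now slices keys and values to min(c.offset, c.keys.Dim(2)) rather than to c.offset directly.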
This commit is contained in:
5
x/mlxrunner/cache/cache.go
vendored
5
x/mlxrunner/cache/cache.go
vendored
@@ -337,9 +337,10 @@ func (c *RotatingKVCache) State() []*mlx.Array {
|
|||||||
if c.keys == nil || c.values == nil {
|
if c.keys == nil || c.values == nil {
|
||||||
return nil
|
return nil
|
||||||
}
|
}
|
||||||
|
liveLen := min(c.offset, c.keys.Dim(2))
|
||||||
return []*mlx.Array{
|
return []*mlx.Array{
|
||||||
c.keys.Slice(mlx.Slice(), mlx.Slice(), mlx.Slice(0, c.offset), mlx.Slice()),
|
c.keys.Slice(mlx.Slice(), mlx.Slice(), mlx.Slice(0, liveLen), mlx.Slice()),
|
||||||
c.values.Slice(mlx.Slice(), mlx.Slice(), mlx.Slice(0, c.offset), mlx.Slice()),
|
c.values.Slice(mlx.Slice(), mlx.Slice(), mlx.Slice(0, liveLen), mlx.Slice()),
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|||||||
Reference in New Issue
Block a user