mirror of
https://github.com/ollama/ollama.git
synced 2026-04-18 09:03:35 -04:00
use 4096 kvcache.NewSWAMemCache
This commit is contained in:
@@ -5,7 +5,6 @@ import (
|
||||
"fmt"
|
||||
"image"
|
||||
"log/slog"
|
||||
- "math"
|
||||
"slices"
|
||||
"time"
|
||||
|
||||
@@ -114,7 +113,7 @@ func New(c fs.Config) (model.Model, error) {
|
||||
|
||||
slidingWindowLen := int32(c.Uint("attention.sliding_window"))
|
||||
m.Cache = kvcache.NewWrapperCache(
|
||||
- kvcache.NewSWAMemCache(slidingWindowLen, math.MaxInt32, m.Shift),
|
||||
+ kvcache.NewSWAMemCache(slidingWindowLen, 4096, m.Shift),
|
||||
kvcache.NewCausalCache(m.Shift),
|
||||
)
|
||||
|
||||
|
||||
Reference in New Issue
Block a user