diff --git a/llm/memory.go b/llm/memory.go index b5a8dd5c6..b11d4144e 100644 --- a/llm/memory.go +++ b/llm/memory.go @@ -415,7 +415,7 @@ func projectorMemoryRequirements(filename string) (weights uint64) { } defer file.Close() - ggml, _, err := ggml.Decode(file, 1024) + ggml, _, err := ggml.Decode(file, 0) if err != nil { return 0 } diff --git a/server/create.go b/server/create.go index 68e003dfd..e46779c7f 100644 --- a/server/create.go +++ b/server/create.go @@ -467,7 +467,7 @@ func quantizeLayer(layer *layerGGML, quantizeType string, fn func(resp api.Progr return nil, err } - f, _, err := ggml.Decode(temp, 1024) + f, _, err := ggml.Decode(temp, 0) if err != nil { slog.Error(fmt.Sprintf("error decoding ggml: %s\n", err)) return nil, err diff --git a/server/images.go b/server/images.go index 352f10f2b..1a711f237 100644 --- a/server/images.go +++ b/server/images.go @@ -75,7 +75,7 @@ func (m *Model) Capabilities() []model.Capability { if err == nil { defer r.Close() - f, _, err := ggml.Decode(r, 1024) + f, _, err := ggml.Decode(r, 0) if err == nil { if _, ok := f.KV()[fmt.Sprintf("%s.pooling_type", f.KV().Architecture())]; ok { capabilities = append(capabilities, model.CapabilityEmbedding)