load arrays with up to 1024 elements when estimating

This mirrors the old behavior from before #10382.
This commit is contained in:
Devon Rifkin 2025-04-27 13:45:13 -07:00 committed by Ryan Schumacher
parent 558c1920fa
commit dd8d037c16
No known key found for this signature in database
1 changed file with 1 addition and 1 deletion

View File

@@ -191,7 +191,7 @@ func (s *Scheduler) processPending(ctx context.Context) {
}
// Load model for fitting
-ggml, err := llm.LoadModel(pending.model.ModelPath, 0)
+ggml, err := llm.LoadModel(pending.model.ModelPath, 1024)
if err != nil {
pending.errCh <- err
break