From 8ba9ef83a3796cf98d5f5f04d4c8def42c8ec4ca Mon Sep 17 00:00:00 2001
From: jaakko
Date: Tue, 14 Apr 2026 09:49:30 +0300
Subject: [PATCH] =?UTF-8?q?CodeBench:=20num=5Fctx=2016384=20=E2=80=94=20ra?=
 =?UTF-8?q?joita=20konteksti-ikkuna=20VRAM-s=C3=A4=C3=A4st=C3=B6ksi?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

256K konteksti varaa ~15 GB KV-cachea vaikka benchmark käyttää ~3K.
16K riittää hyvin ja säästää merkittävästi VRAM:ia.
---
 kipina-codebench/benchmark.mjs | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/kipina-codebench/benchmark.mjs b/kipina-codebench/benchmark.mjs
index 2bad71c..76cf37c 100644
--- a/kipina-codebench/benchmark.mjs
+++ b/kipina-codebench/benchmark.mjs
@@ -104,7 +104,7 @@ async function ollamaChat(model, prompt, systemPrompt, maxTokens = 2048) {
       messages,
       stream: false,
       think: false,
-      options: { num_predict: maxTokens, temperature: 0.7, top_k: 40, repeat_penalty: 1.15 },
+      options: { num_predict: maxTokens, num_ctx: 16384, temperature: 0.7, top_k: 40, repeat_penalty: 1.15 },
     }),
   });
   if (!resp.ok) throw new Error(`Ollama HTTP ${resp.status}: ${await resp.text()}`);