max_tokens per vaihe: manageri 200, koodari 512, testaaja 200, QA 512, DevOps 256

Hub ja natiivisolmu tukevat nyt max_tokens-kenttää API-pyynnöissä.
Pipeline-vaiheet käyttävät sopivan kokoisia token-rajoja.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
This commit is contained in:
2026-04-06 22:03:26 +03:00
parent e6e1f60935
commit 1ef7f7c956
3 changed files with 16 additions and 10 deletions

View File

@@ -326,9 +326,10 @@ async fn main() {
if let Some(ref mut engine) = llm {
busy = true;
-tracing::info!("Generoidaan (task_id: {}): \"{}\"", task_id, prompt);
+let max_tokens = task.get("max_tokens").and_then(|v| v.as_u64()).unwrap_or(512) as usize;
+tracing::info!("Generoidaan (task_id: {}, max_tokens: {}): \"{}\"", task_id, max_tokens, prompt);
-match engine.generate(prompt, 512) {
+match engine.generate(prompt, max_tokens) {
Ok(result) => {
tracing::info!(
"Tulos: {} tokenia | {:.0}ms | {:.1} tok/s | \"{}\"",