Files
agentic-studio/kipina-codebench/results/2026-04-14T11-06.json
jaakko 5d0baf3ff1 CodeBench: combined-readme.md — todo + blog golden example 8b:lle
Molemmat esimerkit (single entity + FK relaatio) yhdessä tiedostossa.
1699 tokenia, 10.4% kontekstista. 8b näkee konkreettisen FK-patternen.
2026-04-14 14:54:12 +03:00

71 lines
1.5 KiB
JSON

[
{
"model": "qwen3:8b",
"scenario": "blog",
"reqOk": true,
"specOk": true,
"specEntities": 2,
"validationIssues": 0,
"fixRounds": 3,
"testsTotal": 12,
"testsPassed": 10,
"testsFailed": 2,
"totalDurationMs": 139308,
"totalTokens": 11782,
"avgTokPerSec": 96.85039238572556,
"promptChars": 11148,
"promptTokensEst": 2787,
"score": 70,
"stars": "★★★★☆",
"error": null,
"profile": "small",
"promptName": "code-small",
"round": 1
},
{
"model": "qwen3:8b",
"scenario": "blog",
"reqOk": true,
"specOk": true,
"specEntities": 2,
"validationIssues": 0,
"fixRounds": 3,
"testsTotal": 1,
"testsPassed": 0,
"testsFailed": 1,
"totalDurationMs": 132306,
"totalTokens": 11671,
"avgTokPerSec": 96.88921767777383,
"promptChars": 11267,
"promptTokensEst": 2817,
"score": 20,
"stars": "★☆☆☆☆",
"error": "Syntaksivirhe",
"profile": "small",
"promptName": "code-small",
"round": 2
},
{
"model": "qwen3:8b",
"scenario": "blog",
"reqOk": true,
"specOk": true,
"specEntities": 2,
"validationIssues": 0,
"fixRounds": 3,
"testsTotal": 12,
"testsPassed": 11,
"testsFailed": 1,
"totalDurationMs": 126092,
"totalTokens": 11132,
"avgTokPerSec": 96.98598556369416,
"promptChars": 11292,
"promptTokensEst": 2823,
"score": 75,
"stars": "★★★★☆",
"error": null,
"profile": "small",
"promptName": "code-small",
"round": 3
}
]