docs
evals
scenario-1
scenario-10
scenario-2
scenario-3
scenario-4
scenario-5
scenario-6
scenario-7
scenario-8
scenario-9
{
"context": "Evaluates how well the solution uses Chalk to build nested, multi-line status output for labels, headers, and highlighted message parts. Scoring prioritizes correct chaining, nesting, and multi-argument rendering rather than general code quality. Only Chalk usage and its output handling are assessed.",
"type": "weighted_checklist",
"checklist": [
{
"name": "Chalk import",
"description": "Uses the Chalk package (default export or `new Chalk({level})`) as the styling engine instead of manual ANSI escape codes.",
"max_score": 20
},
{
"name": "Chained base style",
"description": "Builds the base label/message styling with Chalk's chainable helpers (e.g., `chalk.bold`, `chalk.greenBright`, `chalk.dim`) rather than composing raw strings or separate escapes.",
"max_score": 20
},
{
"name": "Nested highlight",
"description": "Wraps highlighted message segments with a distinct Chalk style (e.g., `chalk.cyanBright` or `chalk.inverse`) nested inside the base style, relying on Chalk to reopen/close sequences correctly instead of manual resets.",
"max_score": 25
},
{
"name": "Multi-argument render",
"description": "Passes multiple message parts as separate arguments to a single Chalk call (e.g., `chalk.dim(part1, part2, part3)`) instead of pre-joining them into one string, demonstrating use of Chalk's multi-argument rendering (arguments are joined with spaces).",
"max_score": 15
},
{
"name": "Layered header",
"description": "Applies stacked Chalk styles for the optional header (outer accent plus inner emphasis such as `chalk.bgYellow.black.bold`) rather than a single flat color or unstyled text.",
"max_score": 10
},
{
"name": "Per-line styling",
"description": "Styles each output line through Chalk calls so styles do not leak across lines, avoiding manual resets and relying on Chalk to close and reopen style codes around newlines.",
"max_score": 10
}
]
}