docs
evals
scenario-1
scenario-10
scenario-2
scenario-3
scenario-4
scenario-5
scenario-6
scenario-7
scenario-8
scenario-9
{
"context": "This evaluation assesses how well the engineer uses picocolors' basic foreground color functions to implement a status logger. The focus is on proper usage of the color functions (red, yellow, green, cyan, magenta, gray, black, white) to format terminal output appropriately.",
"type": "weighted_checklist",
"checklist": [
{
"name": "Import picocolors",
"description": "Correctly imports the picocolors library using appropriate import or require syntax",
"max_score": 5
},
{
"name": "Use red() function",
"description": "Uses picocolors' red() function to display error messages in red",
"max_score": 15
},
{
"name": "Use yellow() function",
"description": "Uses picocolors' yellow() function to display warning messages in yellow",
"max_score": 15
},
{
"name": "Use green() function",
"description": "Uses picocolors' green() function to display success messages in green",
"max_score": 15
},
{
"name": "Use cyan() function",
"description": "Uses picocolors' cyan() function to display info messages in cyan",
"max_score": 10
},
{
"name": "Use magenta() function",
"description": "Uses picocolors' magenta() function to display debug messages in magenta",
"max_score": 10
},
{
"name": "Use gray() function",
"description": "Uses picocolors' gray() function to display trace messages in gray",
"max_score": 10
},
{
"name": "Use black() function",
"description": "Uses picocolors' black() function to display critical messages in black",
"max_score": 10
},
{
"name": "Use white() function",
"description": "Uses picocolors' white() function to display messages with unknown severity levels in white",
"max_score": 10
}
]
}