docs
evals
scenario-1
scenario-10
scenario-2
scenario-3
scenario-4
scenario-5
scenario-6
scenario-7
scenario-8
scenario-9
{
"context": "These criteria evaluate how well an engineer uses the cli package's progress bar display functionality to implement a file download simulator. The focus is on proper usage of cli.progress() and related methods for visual feedback.",
"type": "weighted_checklist",
"checklist": [
{
"name": "Uses cli.progress()",
"description": "The implementation calls the cli.progress() method to display progress updates during the file download simulation",
"max_score": 40
},
{
"name": "Correct progress values",
"description": "Progress values passed to cli.progress() are fractions on the 0 to 1 scale (0 = not started, 1 = complete) and accurately reflect the proportion of the download completed",
"max_score": 25
},
{
"name": "Progressive updates",
"description": "The progress bar is updated multiple times during the download process (not just at 0% and 100%), showing intermediate progress states",
"max_score": 20
},
{
"name": "CLI package import",
"description": "The cli package is properly imported/required at the beginning of the implementation file",
"max_score": 15
}
]
}