docs
evals
scenario-1
scenario-10
scenario-2
scenario-3
scenario-4
scenario-5
scenario-6
scenario-7
scenario-8
scenario-9
{
"context": "These criteria evaluate how well the engineer uses chardet's statistical byte analysis pipeline to detect and rank character encodings. The focus is on proper usage of both single encoding detection and multi-encoding analysis capabilities with confidence-based sorting.",
"type": "weighted_checklist",
"checklist": [
{
"name": "Primary encoding detection",
"description": "Uses chardet.detect() or chardet.detectFile() to identify the most likely encoding for the input file",
"max_score": 25
},
{
"name": "Multi-encoding analysis",
"description": "Uses chardet.analyse() or equivalent to retrieve all possible encoding matches with confidence scores",
"max_score": 30
},
{
"name": "Confidence-based sorting",
"description": "Properly displays encoding alternatives sorted by confidence score in descending order, leveraging chardet's built-in ranking",
"max_score": 20
},
{
"name": "Match metadata extraction",
"description": "Correctly extracts and displays all properties of each match in chardet's AnalyseResult array, including name, confidence, and the optional language code",
"max_score": 15
},
{
"name": "File I/O handling",
"description": "Properly uses chardet's file detection methods (detectFile or detectFileSync) rather than manually reading files and calling detect()",
"max_score": 10
}
]
}