Auto-generated tile from GitHub (10 skills)
92
94%
Does it follow best practices?
Impact
92%
1.16x
Average score across 44 eval scenarios
Advisory
Suggest reviewing before use
{
"context": "Tests whether the agent correctly diagnoses libuv thread pool saturation caused by dns.lookup() and large file readFile(), replaces them with thread-pool-avoiding alternatives (dns.resolve4, streaming), and configures UV_THREADPOOL_SIZE correctly before Node.js starts rather than at runtime.",
"type": "weighted_checklist",
"checklist": [
{
"name": "dns.resolve4 instead of dns.lookup",
"description": "fixed-service.js uses `dns.resolve4()` (or `dns.promises.resolve4()` or another `dns.resolve*` method) instead of `dns.lookup()` for hostname resolution",
"max_score": 14
},
{
"name": "No dns.lookup in fixed code",
"description": "fixed-service.js does NOT contain any call to `dns.lookup()` or `dns.promises.lookup()`",
"max_score": 10
},
{
"name": "Streaming for large file",
"description": "fixed-service.js uses a streaming approach (e.g., `createReadStream`, `pipeline`, or async iteration over a stream) to read the large config/data file, NOT `readFile()` or `promises.readFile()`",
"max_score": 12
},
{
"name": "UV_THREADPOOL_SIZE in startup script",
"description": "start.sh sets UV_THREADPOOL_SIZE as an environment variable before `node` starts (e.g., `UV_THREADPOOL_SIZE=N node service.js` or `export UV_THREADPOOL_SIZE=N` before the node command)",
"max_score": 14
},
{
"name": "UV_THREADPOOL_SIZE value > 4",
"description": "The UV_THREADPOOL_SIZE value set in start.sh is greater than 4 (the default), appropriate for an I/O-heavy service",
"max_score": 8
},
{
"name": "No runtime process.env assignment",
"description": "fixed-service.js does NOT contain `process.env.UV_THREADPOOL_SIZE = ...` (setting the value at runtime, which is unreliable because libuv reads it only once, when the thread pool is first initialized)",
"max_score": 14
},
{
"name": "monitorEventLoopDelay used",
"description": "monitoring.js uses `monitorEventLoopDelay` from `node:perf_hooks` (or `perf_hooks`) to measure event loop lag",
"max_score": 14
},
{
"name": "p99 latency check",
"description": "monitoring.js reads the p99 percentile from the histogram (calls `.percentile(99)`) as an indicator of thread pool saturation",
"max_score": 14
}
]
}
evals
scenario-1
scenario-2
scenario-3
scenario-4
scenario-5
scenario-6
scenario-7
scenario-8
scenario-9
scenario-10
scenario-11
scenario-12
scenario-13
scenario-14
scenario-15
scenario-16
scenario-17
scenario-18
scenario-19
scenario-20
scenario-21
scenario-22
scenario-23
scenario-24
scenario-25
scenario-26
scenario-27
scenario-28
scenario-29
scenario-30
scenario-31
scenario-32
scenario-33
scenario-34
scenario-35
scenario-36
scenario-37
scenario-38
scenario-39
scenario-40
scenario-41
scenario-42
scenario-43
scenario-44
skills
documentation
fastify
init
linting-neostandard-eslint9
node
nodejs-core
rules
oauth
octocat
snipgrapher