eigent/backend/benchmark/dataset/0.json
bytecii f7bf29a40a
benchmark: update benchmark (#1207)
Co-authored-by: bytecii <bytecii@users.noreply.github.com>
Co-authored-by: Wendong-Fan <w3ndong.fan@gmail.com>
Co-authored-by: Wendong-Fan <133094783+Wendong-Fan@users.noreply.github.com>
2026-02-12 16:35:18 +08:00

22 lines
1,015 B
JSON

{
"metadata": {
"difficulty": "easy",
"description": "1) search tool usage and choosing the appropriate website from results, 2) interpreting advanced obfuscated Python code patterns (requires deep coding comprehension), 3) strict instruction following with implicit output modification instead of directly copying code from the website.",
"tags": [
"instruction-following",
"browser",
"coding",
"python",
"target-searching"
]
},
"data": {
"name": "0",
"question": "Find 'obscure hello world program' from mathspp, read the page, and write a Python script named 'hello_world.py' that faithfully reproduces the obfuscated Hello World program shown on that page. Do not simplify or rewrite it, just use the same structure, tricks, and naming conventions used by the author. Notice that the script MUST print 'Hello, WORLD!' when run.",
"env": {}
},
"tests": {
"checker": ["benchmark/checker/0.py"],
"grader": ["benchmark/grader/0.py"]
}
}