eigent/backend/benchmark/dataset/0.json
bytecii eadc6ee56b
test: add basic benchmark (#1138)
Co-authored-by: bytecii <bytecii@users.noreply.github.com>
Co-authored-by: Tong Chen <web_chentong@163.com>
2026-02-05 01:15:55 -08:00

20 lines
965 B
JSON

{
"metadata": {
"difficulty": "easy",
"description": "Google a specific blog post on mathspp.com about obfuscated Python, read and understand the code tricks, then faithfully reproduce the exact program as hello_world.py.",
"tags": ["browser", "coding", "python", "target-searching"]
},
"data": {
"name": "0",
"question": "Google search 'The most obscure Hello, world! program', choose the link from the website mathspp, read the page, and write a Python script named 'hello_world.py' that faithfully reproduces the exact obfuscated Hello World program shown on that page. Do not simplify or rewrite it — copy the same structure, tricks, and naming conventions used by the author. The script must print 'Hello, World!' when run.",
"env": {}
},
"model_kwargs": {
"model_platform": "openai",
"model_type": "gpt-5.2"
},
"tests": {
"checker": ["benchmark/checker/0.py"],
"grader": ["benchmark/grader/0.py"]
}
}