{ "category": [ "code", "iterate" ], "cutoff": 75, "dependencies": [ "TestReadFile" ], "eval_id": "a758335b-539b-4d8a-b90e-cf7036952294", "ground": { "answer": "[0, 1] [2, 5] [0, 3]", "eval": { "type": "python" }, "files": [ "test.py" ], "should_contain": [ "[0, 1]", "[2, 5]", "[0, 3]" ], "should_not_contain": [] }, "info": { "description": "Tests the agent's ability to debug Python code that contains a simple typo.", "difficulty": "novice", "side_effects": [] }, "name": "DebugSimpleTypoWithGuidance", "task": "1- Run test.py.\n2- Read sample_code.py.\n3- Modify sample_code.py.\nRepeat step 1, 2 and 3 until test.py runs without errors.\n" }