{ "category": [ "code", "iterate" ], "cutoff": 75, "dependencies": [ "TestDebugSimpleTypoWithGuidance" ], "eval_id": "1d171b68-0374-4b08-ae6a-c7223f89ecc1", "ground": { "answer": "[0, 1] [2, 5] [0, 3]", "eval": { "type": "python" }, "files": [ "test.py" ], "should_contain": [ "[0, 1]", "[2, 5]", "[0, 3]" ], "should_not_contain": [] }, "info": { "description": "Tests the agent's ability to debug Python code with a simple typo in it, using a very broad prompt without guidance", "difficulty": "intermediate", "side_effects": [] }, "name": "DebugSimpleTypoWithoutGuidance", "task": "Make test.py run without errors." }