{ "name": "debug_simple_typo_without_guidance", "category": ["code"], "task": "Make test.py run without errors.", "dependencies": [], "ground": { "answer": "[0, 1] [2, 5] [0, 3]", "should_contain": ["[0, 1]", "[2, 5]", "[0, 3]"], "should_not_contain": [], "files": ["test.py"], "type": "execute_python_code" }, "mock": { "mock_func": null, "mock_task": null }, "info": { "difficulty": "basic", "description": "Tests the agent's ability to debug Python code containing a simple typo when given only a very broad prompt with no guidance", "side_effects": ["tests if there is in fact an LLM attached"] } }