Files
Auto-GPT/benchmark/agbenchmark/challenges/deprecated/code/d2.1_guided/data.json
merwanehamadi f4d319cee4 Refactor benchmark (#5247)
Signed-off-by: Merwane Hamadi <merwanehamadi@gmail.com>
2023-09-17 06:55:20 -07:00

22 lines
640 B
JSON

{
"name": "DebugSimpleTypoWithGuidance",
"category": ["code", "iterate"],
"task": "1- Run test.py.\n2- Read sample_code.py.\n3- Modify sample_code.py.\nRepeat step 1, 2 and 3 until test.py runs without errors.\n",
"dependencies": ["ReadFile"],
"cutoff": 75,
"ground": {
"answer": "[0, 1] [2, 5] [0, 3]",
"should_contain": ["[0, 1]", "[2, 5]", "[0, 3]"],
"should_not_contain": [],
"files": ["test.py"],
"eval": {
"type": "python"
}
},
"info": {
"difficulty": "novice",
"description": "Tests the agent's ability to debug Python code with a simple typo in it.",
"side_effects": []
}
}