Files
Auto-GPT/agbenchmark/reports/mini-agi/12_TestDebugSimpleTypoWithGuidance.json

32 lines
980 B
JSON

{
"command": "agbenchmark start --test TestDebugSimpleTypoWithGuidance",
"completion_time": "2023-07-17-21:44",
"metrics": {
"run_time": "63.37 seconds",
"highest_difficulty": "No successful tests"
},
"tests": {
"TestDebugSimpleTypoWithGuidance": {
"data_path": "agbenchmark/challenges/code/d1",
"is_regression": false,
"task": "1- Run test.py.\n2- Read code.py.\n3- Modify code.py.\nRepeat step 1, 2 and 3 until test.py runs without errors.\n",
"answer": "[0, 1] [2, 5] [0, 3]",
"description": "Tests ability for the agent to debug python code with a simple typo in it.",
"metrics": {
"difficulty": "basic",
"success": false,
"fail_reason": "assert 1 in [0.0]",
"success_%": 0.0,
"run_time": "63.125 seconds"
},
"reached_cutoff": true
}
},
"config": {
"workspace": "${os.path.join(Path.home(), 'miniagi')}"
},
"additional": {
"model": "gpt-4"
}
}