mirror of
https://github.com/aljazceru/Auto-GPT.git
synced 2026-01-25 08:54:28 +01:00
Make agbenchmark a proxy of the evaluated agent (#5279)
Make agbenchmark a Proxy of the evaluated agent Signed-off-by: Merwane Hamadi <merwanehamadi@gmail.com>
This commit is contained in:
@@ -1,21 +1,31 @@
|
||||
{
|
||||
"name": "ReturnCodeWrite",
|
||||
"category": ["code", "iterate"],
|
||||
"task": "Add a function called multiply_int in sample_code.py that multiplies numbers by 2. You can make sure you have correctly done this by running test.py",
|
||||
"dependencies": ["ReturnCodeSimple"],
|
||||
"cutoff": 120,
|
||||
"ground": {
|
||||
"answer": "Just a simple multiple by 2 function. Num is 4 so answer is 8",
|
||||
"should_contain": ["8"],
|
||||
"should_not_contain": [],
|
||||
"files": ["test.py"],
|
||||
"eval": {
|
||||
"type": "python"
|
||||
}
|
||||
},
|
||||
"info": {
|
||||
"difficulty": "novice",
|
||||
"description": "Small step up, just writing the function with a name as well as the return statement.",
|
||||
"side_effects": []
|
||||
}
|
||||
}
|
||||
"name": "ReturnCodeWrite",
|
||||
"category": [
|
||||
"code",
|
||||
"iterate"
|
||||
],
|
||||
"task": "Add a function called multiply_int in sample_code.py that multiplies numbers by 2. You can make sure you have correctly done this by running test.py",
|
||||
"dependencies": [
|
||||
"ReturnCodeSimple"
|
||||
],
|
||||
"cutoff": 120,
|
||||
"ground": {
|
||||
"answer": "Just a simple multiple by 2 function. Num is 4 so answer is 8",
|
||||
"should_contain": [
|
||||
"8"
|
||||
],
|
||||
"should_not_contain": [],
|
||||
"files": [
|
||||
"test.py"
|
||||
],
|
||||
"eval": {
|
||||
"type": "python"
|
||||
}
|
||||
},
|
||||
"info": {
|
||||
"difficulty": "novice",
|
||||
"description": "Small step up, just writing the function with a name as well as the return statement.",
|
||||
"side_effects": []
|
||||
},
|
||||
"eval_id": "d36bf9f5-ee0f-4d84-b4d8-71f20e8454d5"
|
||||
}
|
||||
Reference in New Issue
Block a user