mirror of
https://github.com/aljazceru/Auto-GPT.git
synced 2026-01-10 09:44:26 +01:00
* WIP Signed-off-by: Merwane Hamadi <merwanehamadi@gmail.com> * WIP Signed-off-by: Merwane Hamadi <merwanehamadi@gmail.com> * Update config for benchmark changes (#4883) * Add Helicone * Add reports, consolidate, update benchmark files (#4941) * updating config * add reports, consolidate, update benchmark files * Update benchmarks.py * Change entrypath and add __init__.py * Remove Helicone integration because we now have proxy at the system level * Support more regression tests * Fix Auto-GPT/benchmark integration Signed-off-by: Merwane Hamadi <merwanehamadi@gmail.com> * Remove cutoff * Install agbenchmark and make continuous mode dynamic Signed-off-by: Merwane Hamadi <merwanehamadi@gmail.com> --------- Signed-off-by: Merwane Hamadi <merwanehamadi@gmail.com> Co-authored-by: Silen Naihin <silen.naihin@gmail.com>
25 lines
628 B
JSON
25 lines
628 B
JSON
{
|
|
"TestBasicCodeGeneration": {
|
|
"difficulty": "basic",
|
|
"dependencies": [
|
|
"TestWriteFile"
|
|
],
|
|
"data_path": "agbenchmark/challenges/code/d3"
|
|
},
|
|
"TestBasicMemory": {
|
|
"difficulty": "basic",
|
|
"data_path": "agbenchmark/challenges/memory/m1"
|
|
},
|
|
"TestReadFile": {
|
|
"difficulty": "basic",
|
|
"dependencies": [
|
|
"TestWriteFile"
|
|
],
|
|
"data_path": "agbenchmark/challenges/interface/read_file"
|
|
},
|
|
"TestWriteFile": {
|
|
"dependencies": [],
|
|
"data_path": "agbenchmark/challenges/interface/write_file"
|
|
}
|
|
}
|