mirror of
https://github.com/aljazceru/Auto-GPT.git
synced 2025-12-31 21:04:25 +01:00
Use artifacts out instead of python code (#72)
This commit is contained in:
@@ -0,0 +1 @@
|
||||
2314
|
||||
@@ -0,0 +1,4 @@
|
||||
3145
|
||||
3791
|
||||
9317
|
||||
9471
|
||||
@@ -0,0 +1,4 @@
|
||||
3145
|
||||
3791
|
||||
9317
|
||||
9471
|
||||
@@ -0,0 +1,4 @@
|
||||
The purple elephant danced on a rainbow while eating a taco
|
||||
The sneaky toaster stole my socks and ran away to Hawaii
|
||||
My pet rock sings better than Beyoncé on Tuesdays
|
||||
The giant hamster rode a unicycle through the crowded mall
|
||||
@@ -0,0 +1 @@
|
||||
25.89
|
||||
@@ -0,0 +1 @@
|
||||
81,462 Millions
|
||||
@@ -0,0 +1,15 @@
|
||||
15 Millions
|
||||
112 Millions
|
||||
117 Millions
|
||||
204 Millions
|
||||
413 Millions
|
||||
2,014 Millions
|
||||
3,198 Millions
|
||||
4,046 Millions
|
||||
7,000 Millions
|
||||
11,759 Millions
|
||||
21,461 Millions
|
||||
24,578 Millions
|
||||
31,536 Millions
|
||||
53,823 Millions
|
||||
81,462 Millions
|
||||
@@ -1,14 +1,13 @@
|
||||
from typing import Any, Dict, Optional
|
||||
|
||||
import agbenchmark.mocks.tests.basic_mocks as basic_mocks
|
||||
import agbenchmark.mocks.tests.retrieval_mocks as retrieval_mocks
|
||||
|
||||
|
||||
class MockManager:
|
||||
def __init__(self, task: Optional[str], config: Dict[str, Any]) -> None:
|
||||
self.task = task
|
||||
self.workspace = config["workspace"]
|
||||
self.modules = [basic_mocks, retrieval_mocks]
|
||||
self.modules = [basic_mocks]
|
||||
|
||||
def delegate(self, mock_function_name: Any, *args: Any, **kwargs: Any) -> None:
|
||||
if hasattr(self, mock_function_name):
|
||||
|
||||
@@ -1,78 +1,12 @@
|
||||
from agbenchmark.challenge import Challenge
|
||||
|
||||
|
||||
def basic_write_file_mock(task: str, workspace: str) -> None:
|
||||
def example_mock(task: str, workspace: str) -> None:
|
||||
"""
|
||||
This mock writes to a file (creates one if it doesn't exist)
|
||||
"""
|
||||
Challenge.write_to_file(
|
||||
workspace,
|
||||
"file_to_check.txt",
|
||||
"Washington DC is the capital of the United States of America",
|
||||
)
|
||||
|
||||
|
||||
def basic_retrieval_mock(task: str, workspace: str) -> None:
|
||||
"""
|
||||
This mock writes to a file (creates one if it doesn't exist)
|
||||
"""
|
||||
Challenge.write_to_file(
|
||||
workspace,
|
||||
"file_to_check.txt",
|
||||
"25.89",
|
||||
)
|
||||
|
||||
|
||||
def basic_retrieval_2_mock(task: str, workspace: str) -> None:
|
||||
"""
|
||||
This mock writes to a file (creates one if it doesn't exist)
|
||||
"""
|
||||
Challenge.write_to_file(
|
||||
workspace,
|
||||
"file_to_check.txt",
|
||||
"81,462",
|
||||
)
|
||||
|
||||
|
||||
def basic_retrieval_3_mock(task: str, workspace: str) -> None:
|
||||
"""
|
||||
This mock writes to a file (creates one if it doesn't exist)
|
||||
"""
|
||||
Challenge.write_to_file(
|
||||
workspace,
|
||||
"file_to_check.txt",
|
||||
"15 Millions\n112 Millions\n117 Millions\n204 Millions\n413 Millions\n2,014 Millions\n3,198 Millions\n4,046 Millions\n7,000 Millions\n11,759 Millions\n21,461 Millions\n24,578 Millions\n31,536 Millions\n53,823 Millions\n81,462 Millions",
|
||||
)
|
||||
|
||||
|
||||
def basic_memory_mock(task: str, workspace: str) -> None:
|
||||
"""
|
||||
This mock writes to a file (creates one if it doesn't exist)
|
||||
"""
|
||||
Challenge.write_to_file(
|
||||
workspace,
|
||||
"file_to_check.txt",
|
||||
"2314",
|
||||
)
|
||||
|
||||
|
||||
def remember_multiple_ids_mock(task: str, workspace: str) -> None:
|
||||
"""
|
||||
This mock writes to a file (creates one if it doesn't exist)
|
||||
"""
|
||||
Challenge.write_to_file(
|
||||
workspace,
|
||||
"file_to_check.txt",
|
||||
"3145\n3791\n9317\n9471",
|
||||
)
|
||||
|
||||
|
||||
def remember_multiple_phrases_with_noise_mock(task: str, workspace: str) -> None:
|
||||
"""
|
||||
This mock writes to a file (creates one if it doesn't exist)
|
||||
"""
|
||||
Challenge.write_to_file(
|
||||
workspace,
|
||||
"file_to_check.txt",
|
||||
"The purple elephant danced on a rainbow while eating a taco\nThe sneaky toaster stole my socks and ran away to Hawaii\nMy pet rock sings better than Beyoncé on Tuesdays\nThe giant hamster rode a unicycle through the crowded mall",
|
||||
"This is an example showing how you can use mocks but here you can use artifacts_out folder instead of a mock.",
|
||||
)
|
||||
|
||||
@@ -1,5 +0,0 @@
|
||||
# TODO: Make it so that you can specify for tests to only run if their prerequisites are met.
|
||||
# Prerequisites here would be writing to a file (basic_abilities test).
|
||||
# Should also check if prerequisites exist in the regression file
|
||||
def retrieval_1_mock(task: str, workspace: str) -> None:
|
||||
pass
|
||||
@@ -0,0 +1 @@
|
||||
Washington
|
||||
@@ -4,6 +4,11 @@
|
||||
"dependencies": [],
|
||||
"test": "agbenchmark/challenges/code/d1/debug_simple_typo_with_guidance_test.py"
|
||||
},
|
||||
"TestDebugSimpleTypoWithoutGuidance": {
|
||||
"difficulty": "basic",
|
||||
"dependencies": [],
|
||||
"test": "agbenchmark/challenges/code/d2/d2_test.py"
|
||||
},
|
||||
"TestBasicMemory": {
|
||||
"difficulty": "basic",
|
||||
"dependencies": [],
|
||||
@@ -19,11 +24,6 @@
|
||||
"dependencies": [],
|
||||
"test": "agbenchmark/challenges/memory/m3/remember_multiple_ids_with_noise_test.py"
|
||||
},
|
||||
"TestRememberMultiplePhrasesWithNoise": {
|
||||
"difficulty": "medium",
|
||||
"dependencies": [],
|
||||
"test": "agbenchmark/challenges/memory/m4/remember_multiple_phrases_with_noise_test.py"
|
||||
},
|
||||
"TestRetrieval": {
|
||||
"difficulty": "basic",
|
||||
"dependencies": [],
|
||||
@@ -39,11 +39,6 @@
|
||||
"dependencies": [],
|
||||
"test": "agbenchmark/challenges/retrieval/r2/r2_test.py"
|
||||
},
|
||||
"TestRetrieval3": {
|
||||
"difficulty": "basic",
|
||||
"dependencies": [],
|
||||
"test": "agbenchmark/challenges/retrieval/r3/r3_test.py"
|
||||
},
|
||||
"TestReadFile": {
|
||||
"difficulty": "basic",
|
||||
"dependencies": [
|
||||
@@ -51,9 +46,14 @@
|
||||
],
|
||||
"test": "agbenchmark/tests/basic_abilities/read_file/read_file_test.py"
|
||||
},
|
||||
"TestDebugSimpleTypoWithoutGuidance": {
|
||||
"TestRetrieval3": {
|
||||
"difficulty": "basic",
|
||||
"dependencies": [],
|
||||
"test": "agbenchmark/challenges/code/d2/d2_test.py"
|
||||
"test": "agbenchmark/challenges/retrieval/r3/r3_test.py"
|
||||
},
|
||||
"TestRememberMultiplePhrasesWithNoise": {
|
||||
"difficulty": "medium",
|
||||
"dependencies": [],
|
||||
"test": "agbenchmark/challenges/memory/m4/remember_multiple_phrases_with_noise_test.py"
|
||||
}
|
||||
}
|
||||
Reference in New Issue
Block a user