Mirror of https://github.com/aljazceru/Auto-GPT.git (synced 2025-12-21 16:04:21 +01:00)

Feature/llm data structs (#3486)

* Organize all the llm stuff into a subpackage
* Add structs for interacting with llms
autogpt/agent/agent_manager.py
@@ -4,9 +4,8 @@ from __future__ import annotations
 from typing import List

 from autogpt.config.config import Config
-from autogpt.llm import create_chat_completion
+from autogpt.llm import Message, create_chat_completion
 from autogpt.singleton import Singleton
-from autogpt.types.openai import Message


 class AgentManager(metaclass=Singleton):
autogpt/llm/__init__.py
@@ -1,4 +1,13 @@
 from autogpt.llm.api_manager import ApiManager
+from autogpt.llm.base import (
+    ChatModelInfo,
+    ChatModelResponse,
+    EmbeddingModelInfo,
+    EmbeddingModelResponse,
+    LLMResponse,
+    Message,
+    ModelInfo,
+)
 from autogpt.llm.chat import chat_with_ai, create_chat_message, generate_context
 from autogpt.llm.llm_utils import (
     call_ai_function,
@@ -10,6 +19,13 @@ from autogpt.llm.token_counter import count_message_tokens, count_string_tokens

 __all__ = [
     "ApiManager",
+    "Message",
+    "ModelInfo",
+    "ChatModelInfo",
+    "EmbeddingModelInfo",
+    "LLMResponse",
+    "ChatModelResponse",
+    "EmbeddingModelResponse",
     "create_chat_message",
     "generate_context",
     "chat_with_ai",
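With these re-exports in place, downstream code can pull the message type and the model structs from the package root instead of reaching into autogpt.types.openai. A minimal sketch (illustrative only, not part of the diff):

from typing import List

from autogpt.llm import Message

# Message is a TypedDict, so plain dicts with these keys type-check.
messages: List[Message] = [{"role": "user", "content": "ping"}]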
autogpt/llm/base.py (new file, 65 lines)
@@ -0,0 +1,65 @@
+from dataclasses import dataclass, field
+from typing import List, TypedDict
+
+
+class Message(TypedDict):
+    """OpenAI Message object containing a role and the message content"""
+
+    role: str
+    content: str
+
+
+@dataclass
+class ModelInfo:
+    """Struct for model information.
+
+    Would be lovely to eventually get this directly from APIs, but needs to be
+    scraped from websites for now.
+    """
+
+    name: str
+    prompt_token_cost: float
+    completion_token_cost: float
+    max_tokens: int
+
+
+@dataclass
+class ChatModelInfo(ModelInfo):
+    """Struct for chat model information."""
+
+    pass
+
+
+@dataclass
+class EmbeddingModelInfo(ModelInfo):
+    """Struct for embedding model information."""
+
+    embedding_dimensions: int
+
+
+@dataclass
+class LLMResponse:
+    """Standard response struct for a response from an LLM model."""
+
+    model_info: ModelInfo
+    prompt_tokens_used: int = 0
+    completion_tokens_used: int = 0
+
+
+@dataclass
+class EmbeddingModelResponse(LLMResponse):
+    """Standard response struct for a response from an embedding model."""
+
+    embedding: List[float] = field(default_factory=list)
+
+    def __post_init__(self):
+        if self.completion_tokens_used:
+            raise ValueError("Embeddings should not have completion tokens used.")
+
+
+@dataclass
+class ChatModelResponse(LLMResponse):
+    """Standard response struct for a response from an LLM model."""
+
+    content: str = None
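A quick sketch of how the new structs compose, with hypothetical token counts (this snippet is not part of the diff):

from autogpt.llm.base import ChatModelInfo, ChatModelResponse, EmbeddingModelResponse

gpt4 = ChatModelInfo(
    name="gpt-4",
    prompt_token_cost=0.03,
    completion_token_cost=0.06,
    max_tokens=8192,
)
response = ChatModelResponse(
    model_info=gpt4,
    prompt_tokens_used=120,
    completion_tokens_used=80,
    content="Hello!",
)

# __post_init__ guards the embedding invariant: this would raise ValueError.
# EmbeddingModelResponse(model_info=gpt4, completion_tokens_used=1)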
autogpt/llm/chat.py
@@ -5,13 +5,13 @@ from openai.error import RateLimitError

 from autogpt.config import Config
 from autogpt.llm.api_manager import ApiManager
+from autogpt.llm.base import Message
 from autogpt.llm.llm_utils import create_chat_completion
 from autogpt.llm.token_counter import count_message_tokens
 from autogpt.logs import logger
 from autogpt.memory_management.store_memory import (
     save_memory_trimmed_from_context_window,
 )
-from autogpt.types.openai import Message

 cfg = Config()
autogpt/llm/llm_utils.py
@@ -10,8 +10,8 @@ from openai.error import APIError, RateLimitError, Timeout

 from autogpt.config import Config
 from autogpt.llm.api_manager import ApiManager
+from autogpt.llm.base import Message
 from autogpt.logs import logger
-from autogpt.types.openai import Message


 def retry_openai_api(
autogpt/llm/providers/__init__.py (new file, 0 lines)

autogpt/llm/providers/openai.py (new file, 37 lines)
@@ -0,0 +1,37 @@
+from autogpt.llm.base import ChatModelInfo, EmbeddingModelInfo
+
+OPEN_AI_CHAT_MODELS = {
+    "gpt-3.5-turbo": ChatModelInfo(
+        name="gpt-3.5-turbo",
+        prompt_token_cost=0.002,
+        completion_token_cost=0.002,
+        max_tokens=4096,
+    ),
+    "gpt-4": ChatModelInfo(
+        name="gpt-4",
+        prompt_token_cost=0.03,
+        completion_token_cost=0.06,
+        max_tokens=8192,
+    ),
+    "gpt-4-32k": ChatModelInfo(
+        name="gpt-4-32k",
+        prompt_token_cost=0.06,
+        completion_token_cost=0.12,
+        max_tokens=32768,
+    ),
+}
+
+OPEN_AI_EMBEDDING_MODELS = {
+    "text-embedding-ada-002": EmbeddingModelInfo(
+        name="text-embedding-ada-002",
+        prompt_token_cost=0.0004,
+        completion_token_cost=0.0,
+        max_tokens=8191,
+        embedding_dimensions=1536,
+    ),
+}
+
+OPEN_AI_MODELS = {
+    **OPEN_AI_CHAT_MODELS,
+    **OPEN_AI_EMBEDDING_MODELS,
+}
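These tables turn cost accounting into a dictionary lookup. A hedged sketch of the arithmetic (per-1,000-token pricing is an assumption here, matching OpenAI's published rates at the time; the snippet is not part of the diff):

from autogpt.llm.providers.openai import OPEN_AI_CHAT_MODELS

model = OPEN_AI_CHAT_MODELS["gpt-4"]
prompt_tokens, completion_tokens = 1000, 500
cost = (
    prompt_tokens * model.prompt_token_cost
    + completion_tokens * model.completion_token_cost
) / 1000
print(f"${cost:.4f}")  # -> $0.0600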
autogpt/llm/token_counter.py
@@ -5,8 +5,8 @@ from typing import List

 import tiktoken

+from autogpt.llm.base import Message
 from autogpt.logs import logger
-from autogpt.types.openai import Message


 def count_message_tokens(
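Token counting now consumes the package's own Message type directly. An illustrative call (the full signature is truncated in this diff, so the model keyword below is an assumption):

from autogpt.llm import Message, count_message_tokens

messages = [
    Message(role="system", content="You are a helpful assistant."),
    Message(role="user", content="Hello!"),
]
# Assumed shape: count_message_tokens(messages, model) -> int
num_tokens = count_message_tokens(messages, model="gpt-3.5-turbo")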
autogpt/types/openai.py (deleted, 9 lines)
@@ -1,9 +0,0 @@
-"""Type helpers for working with the OpenAI library"""
-from typing import TypedDict
-
-
-class Message(TypedDict):
-    """OpenAI Message object containing a role and the message content"""
-
-    role: str
-    content: str