enable milvus as memory backend

2025-12-18 22:44:21 +01:00 · 2023-04-11 19:36:41 +08:00
parent 1073954fb7
commit 395d9d0481
6 changed files with 145 additions and 9 deletions
--- a/.env.template
+++ b/.env.template
@@ -77,6 +77,13 @@ REDIS_PASSWORD=
 WIPE_REDIS_ON_START=False
 MEMORY_INDEX=auto-gpt
 ### MILVUS
 # MILVUS_ADDR - Milvus remote address (e.g. localhost:19530)
 # MILVUS_COLLECTION - Milvus collection, 
 # change it if you want to start a new memory and retain the old memory.
 MILVUS_ADDR=your-milvus-cluster-host-port
 MILVUS_COLLECTION=autogpt
 ################################################################################
 ### IMAGE GENERATION PROVIDER
 ################################################################################
--- a/README.md
+++ b/README.md
@@ -35,22 +35,27 @@ Your support is greatly appreciated
 ## Table of Contents
 - [Auto-GPT: An Autonomous GPT-4 Experiment](#auto-gpt-an-autonomous-gpt-4-experiment)
-  - [Demo (30/03/2023):](#demo-30032023)
+    - [🔴 🔴 🔴  Urgent: USE `stable` not `master`  🔴 🔴 🔴](#----urgent-use-stable-not-master----)
    - [Demo (30/03/2023):](#demo-30032023)
  - [Table of Contents](#table-of-contents)
  - [🚀 Features](#-features)
  - [📋 Requirements](#-requirements)
  - [💾 Installation](#-installation)
  - [🔧 Usage](#-usage)
    - [Logs](#logs)
    - [Docker](#docker)
    - [Command Line Arguments](#command-line-arguments)
  - [🗣️ Speech Mode](#️-speech-mode)
  - [🔍 Google API Keys Configuration](#-google-api-keys-configuration)
    - [Setting up environment variables](#setting-up-environment-variables)
-  - [Redis Setup](#redis-setup)
+  - [Memory Backend Setup](#memory-backend-setup)
-  - [🌲 Pinecone API Key Setup](#-pinecone-api-key-setup)
+    - [Redis Setup](#redis-setup)
    - [🌲 Pinecone API Key Setup](#-pinecone-api-key-setup)
    - [Milvus Setup](#milvus-setup)
    - [Setting up environment variables](#setting-up-environment-variables-1)
  - [Setting Your Cache Type](#setting-your-cache-type)
  - [View Memory Usage](#view-memory-usage)
-  - [🧠 Memory pre-seeding](#memory-pre-seeding)
+  - [🧠 Memory pre-seeding](#-memory-pre-seeding)
  - [💀 Continuous Mode ⚠️](#-continuous-mode-️)
  - [GPT3.5 ONLY Mode](#gpt35-only-mode)
  - [🖼 Image Generation](#-image-generation)
@@ -75,10 +80,11 @@ Your support is greatly appreciated
  - [Python 3.8 or later](https://www.tutorialspoint.com/how-to-install-python-in-windows)
 - [OpenAI API key](https://platform.openai.com/account/api-keys)
 Optional:
- [PINECONE API key](https://www.pinecone.io/) (If you want Pinecone backed memory)
+- Memory backend
  - [PINECONE API key](https://www.pinecone.io/) (If you want Pinecone backed memory)
  - [Milvus](https://milvus.io/) (If you want Milvus as memory backend)
 - ElevenLabs Key (If you want the AI to speak)
 ## 💾 Installation
@@ -209,7 +215,11 @@ export CUSTOM_SEARCH_ENGINE_ID="YOUR_CUSTOM_SEARCH_ENGINE_ID"
 ```
-## Redis Setup
+## Memory Backend Setup
 Setup any one backend to persist memory.
 ### Redis Setup
 Install docker desktop.
@@ -246,7 +256,7 @@ You can specify the memory index for redis using the following:
 MEMORY_INDEX=whatever
 ```
-## 🌲 Pinecone API Key Setup
+### 🌲 Pinecone API Key Setup
 Pinecone enables the storage of vast amounts of vector-based memory, allowing for only relevant memories to be loaded for the agent at any given time.
@@ -254,6 +264,18 @@ Pinecone enables the storage of vast amounts of vector-based memory, allowing fo
 2. Choose the `Starter` plan to avoid being charged.
 3. Find your API key and region under the default project in the left sidebar.
 ### Milvus Setup
 [Milvus](https://milvus.io/) is a open-source, high scalable vector database to storage huge amount of vector-based memory and provide fast relevant search.
 - setup milvus database, keep your pymilvus version and milvus version same to avoid compatible issues.
  - setup by open source [Install Milvus](https://milvus.io/docs/install_standalone-operator.md)
  - or setup by [Zilliz Cloud](https://zilliz.com/cloud)
 - set `MILVUS_ADDR` in `.env` to your milvus address `host:ip`.
 - set `MEMORY_BACKEND` in `.env` to `milvus` to enable milvus as backend.
 - optional
  - set `MILVUS_COLLECTION` in `.env` to change milvus collection name as you want, `autogpt` is the default name.
 ### Setting up environment variables
 In the `.env` file set:
--- a/autogpt/config/config.py
+++ b/autogpt/config/config.py
@@ -62,6 +62,10 @@ class Config(metaclass=Singleton):
        self.pinecone_api_key = os.getenv("PINECONE_API_KEY")
        self.pinecone_region = os.getenv("PINECONE_ENV")
        # milvus configuration, e.g., localhost:19530.
        self.milvus_addr = os.getenv("MILVUS_ADDR", "localhost:19530")
        self.milvus_collection = os.getenv("MILVUS_COLLECTION", "autogpt")
        self.image_provider = os.getenv("IMAGE_PROVIDER")
        self.huggingface_api_token = os.getenv("HUGGINGFACE_API_TOKEN")
--- a/autogpt/memory/init.py
+++ b/autogpt/memory/init.py
@@ -21,6 +21,12 @@ except ImportError:
    print("Pinecone not installed. Skipping import.")
    PineconeMemory = None
 try:
    from memory.milvus import MilvusMemory
 except ImportError:
    print("pymilvus not installed. Skipping import.")
    MilvusMemory = None
 def get_memory(cfg, init=False):
    memory = None
@@ -44,6 +50,12 @@ def get_memory(cfg, init=False):
            memory = RedisMemory(cfg)
    elif cfg.memory_backend == "no_memory":
        memory = NoMemory(cfg)
    elif cfg.memory_backend == "milvus":
        if not MilvusMemory:
            print("Error: Milvus sdk is not installed."
                  "Please install pymilvus to use Milvus as memory backend.")
        else:
            memory = MilvusMemory(cfg)
    if memory is None:
        memory = LocalCache(cfg)
@@ -56,4 +68,4 @@ def get_supported_memory_backends():
    return supported_memory
-__all__ = ["get_memory", "LocalCache", "RedisMemory", "PineconeMemory", "NoMemory"]
+__all__ = ["get_memory", "LocalCache", "RedisMemory", "PineconeMemory", "NoMemory", "MilvusMemory"]
--- a/requirements.txt
+++ b/requirements.txt
@@ -12,6 +12,7 @@ docker
 duckduckgo-search
 google-api-python-client #(https://developers.google.com/custom-search/v1/overview)
 pinecone-client==2.2.1
 pymilvus==2.2.4
 redis
 orjson
 Pillow
--- a/scripts/memory/milvus.py
+++ b/scripts/memory/milvus.py
@@ -0,0 +1,90 @@
 from pymilvus import (
    connections,
    FieldSchema,
    CollectionSchema,
    DataType,
    Collection,
 )
 from memory.base import MemoryProviderSingleton, get_ada_embedding
 class MilvusMemory(MemoryProviderSingleton):
    def __init__(self, cfg):
        """ Construct a milvus memory storage connection.
        Args:
            cfg (Config): Auto-GPT global config.
        """
        # connect to milvus server.
        connections.connect(address=cfg.milvus_addr)
        fields = [
            FieldSchema(name="pk", dtype=DataType.INT64,
                        is_primary=True, auto_id=True),
            FieldSchema(name="embeddings",
                        dtype=DataType.FLOAT_VECTOR, dim=1536),
            FieldSchema(name="raw_text", dtype=DataType.VARCHAR,
                        max_length=65535)
        ]
        # create collection if not exist and load it.
        schema = CollectionSchema(fields, "auto-gpt memory storage")
        self.collection = Collection(cfg.milvus_collection, schema)
        # create index if not exist.
        if not self.collection.has_index(index_name="embeddings"):
            self.collection.release()
            self.collection.create_index("embeddings", {
                "index_type": "IVF_FLAT",
                "metric_type": "IP",
                "params": {"nlist": 128},
            }, index_name="embeddings")
        self.collection.load()
    def add(self, data):
        """ Add a embedding of data into memory.
        Args:
            data (str): The raw text to construct embedding index.
        Returns:
            str: log.
        """
        embedding = get_ada_embedding(data)
        result = self.collection.insert([[embedding], [data]])
        _text = f"Inserting data into memory at primary key: {result.primary_keys[0]}:\n data: {data}"
        return _text
    def get(self, data):
        """ Return the most relevant data in memory.
        Args:
            data: The data to compare to.
        """
        return self.get_relevant(data, 1)
    def clear(self):
        """ Drop the index in memory.
        """
        self.collection.drop()
        return "Obliviated"
    def get_relevant(self, data, num_relevant=5):
        """ Return the top-k relevant data in memory.
        Args:
            data: The data to compare to.
            num_relevant (int, optional): The max number of relevant data. Defaults to 5.
        """
        # search the embedding and return the most relevant text.
        embedding = get_ada_embedding(data)
        search_params = {
            "metrics_type": "IP",
            "params": {"nprobe": 8},
        }
        result = self.collection.search(
            [embedding], "embeddings", search_params, num_relevant, output_fields=["raw_text"])
        return [item.entity.value_of_field("raw_text") for item in result[0]]
    def get_stats(self):
        """
        Returns: The stats of the milvus cache.
        """
        return f"Entities num: {self.collection.num_entities}"