Updates to the api + refactor

This commit is contained in:
Vasilije 2023-08-25 11:48:43 +02:00
parent 32d3bd026a
commit fd9d4952ee
3 changed files with 71 additions and 29 deletions

View file

@ -24,21 +24,43 @@ Initial code lets you do three operations:
## Usage
The FastAPI endpoint accepts prompts and PDF files and returns a JSON object with the generated text.
The FastAPI endpoint accepts prompts and stores data with the help of the Memory Manager.
The available memory types are: Episodic, Semantic, and Buffer.
Endpoint Overview
The Memory API provides the following endpoints:
- /[memory_type]/add-memory (POST)
- /[memory_type]/fetch-memory (POST)
- /[memory_type]/delete-memory (POST)
- /available-buffer-actions (GET)
- /run-buffer (POST)
- /buffer/create-context (POST)
Here is a payload example:
```curl
-X POST
-F "prompt=The quick brown fox"
-F "file=@/path/to/file.pdf"
http://localhost:8000/upload/
```
{
"payload": {
"user_id": "681",
"session_id": "471",
"model_speed": "slow",
"prompt": "Temperature=Cold;Food Type=Ice Cream",
"pdf_url": "https://www.w3.org/WAI/ER/tests/xhtml/testfiles/resources/pdf/dummy.pdf"
"prompt": "I want ",
"pdf_url": "https://www.w3.org/WAI/ER/tests/xhtml/testfiles/resources/pdf/dummy.pdf",
"params": {
"version": "1.0",
"agreement_id": "AG123456",
"privacy_policy": "https://example.com/privacy",
"terms_of_service": "https://example.com/terms",
"format": "json",
"schema_version": "1.1",
"checksum": "a1b2c3d4e5f6",
"owner": "John Doe",
"license": "MIT",
"validity_start": "2023-08-01",
"validity_end": "2024-07-31"
}
}
}
}
```

View file

@ -242,7 +242,7 @@ async def available_buffer_actions(
await Memory_.async_init()
# memory_class = getattr(Memory_, f"_delete_{memory_type}_memory", None)
output = Memory_._available_operations()
output = await Memory_._available_operations()
return JSONResponse(content={"response": output}, status_code=200)
except Exception as e:
@ -263,13 +263,35 @@ async def available_buffer_actions(
await Memory_.async_init()
# memory_class = getattr(Memory_, f"_delete_{memory_type}_memory", None)
output = Memory_._run_buffer(user_input=decoded_payload['prompt'], params=decoded_payload['params'])
output = await Memory_._run_buffer(user_input=decoded_payload['prompt'], params=decoded_payload['params'])
return JSONResponse(content={"response": output}, status_code=200)
except Exception as e:
return JSONResponse(content={"response": {"error": str(e)}}, status_code=503)
@app.post("/buffer/create-context", response_model=dict)
async def available_buffer_actions(
    payload: Payload,
    # files: List[UploadFile] = File(...),
):
    """Create the buffer context for a user's prompt.

    Reads ``user_id``, ``prompt`` and ``params`` out of ``payload.payload``,
    initialises a :class:`Memory` instance for that user, and returns the
    generated buffer context wrapped in a JSON response.
    """
    try:
        data = payload.payload
        memory = Memory(user_id=data['user_id'])
        await memory.async_init()
        context = await memory._create_buffer_context(
            user_input=data['prompt'], params=data['params']
        )
        return JSONResponse(content={"response": context}, status_code=200)
    except Exception as err:
        # Boundary handler: report any failure as a structured 503 payload.
        return JSONResponse(content={"response": {"error": str(err)}}, status_code=503)
#
# # Process each uploaded PDF file
# results = []

View file

@ -490,17 +490,12 @@ class EpisodicBuffer(BaseMemory):
return ["translate", "structure", "load to database", "load to semantic memory", "load to episodic memory",
"load to buffer"]
async def main_buffer(self, user_input=None, content=None, params=None):
"""AI buffer to understand user PDF query, prioritize memory info and process it based on available operations"""
async def buffer_context(self, user_input=None, content=None, params=None):
"""Generates the context to be used for the buffer and passed to the agent"""
# we get a list of available operations for our buffer to consider
# these operations are what we can do with the data, in the context of PDFs (load, translate, structure, etc)
list_of_operations = await self.available_operations()
memory = Memory(user_id=self.user_id)
await memory.async_init()
try:
# we delete all memories in the episodic buffer, so we can start fresh
await self.delete_memories()
@ -530,8 +525,6 @@ class EpisodicBuffer(BaseMemory):
context.append(frequency)
# fix this so it actually filters
else:
# defaults to semantic search if we don't want to apply algorithms on the vectordb data
memory = Memory(user_id=self.user_id)
@ -616,7 +609,15 @@ class EpisodicBuffer(BaseMemory):
# Extract the list of tasks
tasks_list = data["tasks"]
return tasks_list
async def main_buffer(self, user_input=None, content=None, params=None):
"""AI buffer to understand user PDF query, prioritize memory info and process it based on available operations"""
memory = Memory(user_id=self.user_id)
await memory.async_init()
tasks_list = await self.buffer_context(user_input=user_input, content=content, params=params)
result_tasks = []
for task in tasks_list:
@ -716,20 +717,13 @@ class EpisodicBuffer(BaseMemory):
)
_input = prompt.format_prompt(query=user_input, steps=str(tasks_list), buffer=buffer_result)
#
# print("a few things to do like load episodic memory in a structured format")
#
# return "a few things to do like load episodic memory in a structured format"
output = self.llm_base(_input.to_string())
result_parsing = parser.parse(output)
print("here is the parsing result", result_parsing)
#
lookup_value = await memory._add_episodic_memory(observation=str(output), params=params)
# now we clean up buffer memory
await self.delete_memories()
return lookup_value
@ -857,6 +851,10 @@ class Memory:
return await self.short_term_memory.episodic_buffer.delete_memories(
params=params
)
async def _create_buffer_context(self, user_input: str, content: str = None, params:str=None):
return await self.short_term_memory.episodic_buffer.buffer_context(
user_input=user_input, content=content, params=params
)
async def _available_operations(self):
return await self.long_term_memory.episodic_buffer.available_operations()