Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Improvements to JSON handling for local LLMs #269

Merged
merged 4 commits into from
Nov 3, 2023
Merged
Show file tree
Hide file tree
Changes from 2 commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
63 changes: 63 additions & 0 deletions memgpt/local_llm/json_parser.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,63 @@
import json


def extract_first_json(string):
    """Return the first complete JSON object parsed out of *string*.

    Handles the case of two JSON objects back-to-back ("run-on JSON") by
    counting opening vs closing braces to find where the first object ends.

    NOTE(review): braces inside JSON string values are not accounted for —
    a value like ``{"a": "}"}`` will confuse the depth counter.

    Args:
        string: Raw text expected to contain at least one JSON object.

    Returns:
        The decoded first JSON object (typically a dict).

    Raises:
        json.JSONDecodeError: If no opening brace is found, or if the
            brace-matched span fails to decode.
    """
    depth = 0
    start_index = None

    for i, char in enumerate(string):
        if char == "{":
            if depth == 0:
                start_index = i
            depth += 1
        elif char == "}":
            depth -= 1
            if depth == 0 and start_index is not None:
                try:
                    return json.loads(string[start_index : i + 1])
                except json.JSONDecodeError as e:
                    # BUG FIX: JSONDecodeError.__init__ requires (msg, doc, pos);
                    # the original passed only a message, which itself raised
                    # TypeError instead of the intended decode error.
                    raise json.JSONDecodeError(
                        f"Matched closing bracket, but decode failed with error: {str(e)}",
                        string,
                        start_index,
                    ) from e

    print("No valid JSON object found.")
    raise json.JSONDecodeError("Couldn't find starting bracket", string, 0)


def add_missing_heartbeat(llm_json):
    """Insert a heartbeat request into an assistant message that needs one.

    Heuristic: when the assistant calls a function other than send_message
    immediately after a user message (prev message['role'] == 'user'), the
    call is probably a retrieval or insertion step, so we likely want a
    heartbeat so that MemGPT can eventually reply with send_message.

    Expected message shape::

        {
            "role": "assistant",
            "content": ...,
            "function_call": {
                "name": ...,
                "arguments": {
                    "arg1": val1,
                    ...
                }
            }
        }

    Raises:
        NotImplementedError: Always — implementation deferred to a follow-up PR.
    """
    raise NotImplementedError
Copy link
Collaborator Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Add this in a separate PR to address #245



def clean_json(raw_llm_output, messages=None, functions=None):
    """Try a series of fallback hacks to parse the data coming out of the LLM.

    Args:
        raw_llm_output: Raw string emitted by the LLM, hopefully containing JSON.
        messages: Currently unused; presumably reserved for context-aware
            repairs (e.g. heartbeat insertion) — TODO confirm.
        functions: Currently unused; same as ``messages``.

    Returns:
        The decoded JSON object.

    Raises:
        json.JSONDecodeError: If every repair strategy fails.
    """
    try:
        # Fast path: output is already valid JSON.
        return json.loads(raw_llm_output)
    except json.JSONDecodeError:
        pass

    try:
        # Common local-LLM failure mode: the final closing brace got truncated.
        return json.loads(raw_llm_output + "}")
    except json.JSONDecodeError:
        pass

    # Last resort: brace-match to pull the first complete object out of a
    # possible "run-on" of concatenated JSON objects (with the closing-brace
    # patch applied here too). Original wrapped this in a pointless
    # `except: raise`; let its error propagate directly instead.
    return extract_first_json(raw_llm_output + "}")
12 changes: 5 additions & 7 deletions memgpt/local_llm/llm_chat_completion_wrappers/airoboros.py
Original file line number Diff line number Diff line change
@@ -1,6 +1,7 @@
import json

from .wrapper_base import LLMChatCompletionWrapper
from ..json_parser import clean_json
from ...errors import LLMJSONParsingError


Expand Down Expand Up @@ -184,9 +185,9 @@ def output_to_chat_completion_response(self, raw_llm_output):
raw_llm_output = "{" + raw_llm_output

try:
function_json_output = json.loads(raw_llm_output)
function_json_output = clean_json(raw_llm_output)
Copy link
Collaborator Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Actually this should be added to the other wrappers too

except Exception as e:
raise Exception(f"Failed to decode JSON from LLM output:\n{raw_llm_output}")
raise Exception(f"Failed to decode JSON from LLM output:\n{raw_llm_output} - error\n{str(e)}")
try:
function_name = function_json_output["function"]
function_parameters = function_json_output["params"]
Expand Down Expand Up @@ -393,12 +394,9 @@ def output_to_chat_completion_response(self, raw_llm_output):
raw_llm_output = "{" + raw_llm_output

try:
function_json_output = json.loads(raw_llm_output)
function_json_output = clean_json(raw_llm_output)
except Exception as e:
try:
function_json_output = json.loads(raw_llm_output + "\n}")
except:
raise Exception(f"Failed to decode JSON from LLM output:\n{raw_llm_output}")
raise Exception(f"Failed to decode JSON from LLM output:\n{raw_llm_output} - error\n{str(e)}")
try:
function_name = function_json_output["function"]
function_parameters = function_json_output["params"]
Expand Down
Loading