Add retries for gpt-4o performance tests
mattzh72 committed Dec 21, 2024
1 parent 6bb64af commit 17796ed
Showing 2 changed files with 38 additions and 5 deletions.
8 changes: 4 additions & 4 deletions letta/server/rest_api/routers/v1/sources.py
@@ -130,9 +130,8 @@ def attach_source_to_agent(
Attach a data source to an existing agent.
"""
actor = server.user_manager.get_user_or_default(user_id=user_id)

- source = server.agent_manager.attach_source(source_id=source_id, agent_id=agent_id, actor=actor)
- return source
+ server.agent_manager.attach_source(source_id=source_id, agent_id=agent_id, actor=actor)
+ return server.source_manager.get_source_by_id(source_id=source_id, actor=actor)


@router.post("/{source_id}/detach", response_model=Source, operation_id="detach_agent_from_source")
@@ -146,7 +145,8 @@ def detach_source_from_agent(
Detach a data source from an existing agent.
"""
actor = server.user_manager.get_user_or_default(user_id=user_id)
- return server.agent_manager.detach_source(agent_id=agent_id, source_id=source_id, actor=actor)
+ server.agent_manager.detach_source(agent_id=agent_id, source_id=source_id, actor=actor)
+ return server.source_manager.get_source_by_id(source_id=source_id, actor=actor)


@router.post("/{source_id}/upload", response_model=Job, operation_id="upload_file_to_source")
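Aside: the sources.py change above follows a mutate-then-re-fetch pattern: the attach/detach call on the agent manager performs the state change, and the handler then rebuilds its response from the source manager, so the client always receives the canonical Source record rather than whatever the mutation call returned. A minimal sketch of that pattern, using hypothetical stand-in manager classes rather than Letta's real implementations:

```python
# Illustrative sketch only: SourceManager and AgentManager here are hypothetical
# stand-ins for Letta's managers; they just demonstrate "mutate, then re-fetch".
from dataclasses import dataclass
from typing import Dict, Set


@dataclass
class Source:
    id: str
    name: str


class SourceManager:
    """Owns the canonical Source records."""

    def __init__(self) -> None:
        self._sources: Dict[str, Source] = {"src-1": Source(id="src-1", name="docs")}

    def get_source_by_id(self, source_id: str) -> Source:
        return self._sources[source_id]


class AgentManager:
    """Tracks which sources are attached to which agents."""

    def __init__(self) -> None:
        self._attached: Dict[str, Set[str]] = {}

    def attach_source(self, source_id: str, agent_id: str) -> None:
        self._attached.setdefault(agent_id, set()).add(source_id)


def attach_source_to_agent(agents: AgentManager, sources: SourceManager,
                           source_id: str, agent_id: str) -> Source:
    # Mutate first, then re-fetch the canonical record to build the response,
    # mirroring the handler change in the diff above.
    agents.attach_source(source_id=source_id, agent_id=agent_id)
    return sources.get_source_by_id(source_id=source_id)


if __name__ == "__main__":
    print(attach_source_to_agent(AgentManager(), SourceManager(), "src-1", "agent-1"))
```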
35 changes: 34 additions & 1 deletion tests/test_model_letta_perfomance.py
@@ -56,17 +56,43 @@ def wrapper(*args, **kwargs):
return decorator_retry


def retry_until_success(max_attempts=10, sleep_time_seconds=4):
"""
Decorator to retry a function until it succeeds or the maximum number of attempts is reached.
:param max_attempts: Maximum number of attempts to retry the function.
:param sleep_time_seconds: Time to wait between attempts, in seconds.
"""

def decorator_retry(func):
@functools.wraps(func)
def wrapper(*args, **kwargs):
for attempt in range(1, max_attempts + 1):
try:
return func(*args, **kwargs)
except Exception as e:
print(f"\033[93mAttempt {attempt} failed with error:\n{e}\033[0m")
if attempt == max_attempts:
raise
time.sleep(sleep_time_seconds)

return wrapper

return decorator_retry


# ======================================================================================================================
# OPENAI TESTS
# ======================================================================================================================
@retry_until_threshold(threshold=0.75, max_attempts=4)
@retry_until_success(max_attempts=5, sleep_time_seconds=2)
def test_openai_gpt_4o_returns_valid_first_message():
filename = os.path.join(llm_config_dir, "openai-gpt-4o.json")
response = check_first_response_is_valid_for_llm_endpoint(filename)
# Log out successful response
print(f"Got successful response from client: \n\n{response}")


@retry_until_success(max_attempts=5, sleep_time_seconds=2)
def test_openai_gpt_4o_returns_keyword():
keyword = "banana"
filename = os.path.join(llm_config_dir, "openai-gpt-4o.json")
@@ -75,47 +101,54 @@ def test_openai_gpt_4o_returns_keyword():
print(f"Got successful response from client: \n\n{response}")


@retry_until_success(max_attempts=5, sleep_time_seconds=2)
def test_openai_gpt_4o_uses_external_tool():
filename = os.path.join(llm_config_dir, "openai-gpt-4o.json")
response = check_agent_uses_external_tool(filename)
# Log out successful response
print(f"Got successful response from client: \n\n{response}")


@retry_until_success(max_attempts=5, sleep_time_seconds=2)
def test_openai_gpt_4o_recall_chat_memory():
filename = os.path.join(llm_config_dir, "openai-gpt-4o.json")
response = check_agent_recall_chat_memory(filename)
# Log out successful response
print(f"Got successful response from client: \n\n{response}")


@retry_until_success(max_attempts=5, sleep_time_seconds=2)
def test_openai_gpt_4o_archival_memory_retrieval():
filename = os.path.join(llm_config_dir, "openai-gpt-4o.json")
response = check_agent_archival_memory_retrieval(filename)
# Log out successful response
print(f"Got successful response from client: \n\n{response}")


@retry_until_success(max_attempts=5, sleep_time_seconds=2)
def test_openai_gpt_4o_archival_memory_insert():
filename = os.path.join(llm_config_dir, "openai-gpt-4o.json")
response = check_agent_archival_memory_insert(filename)
# Log out successful response
print(f"Got successful response from client: \n\n{response}")


@retry_until_success(max_attempts=5, sleep_time_seconds=2)
def test_openai_gpt_4o_edit_core_memory():
filename = os.path.join(llm_config_dir, "openai-gpt-4o.json")
response = check_agent_edit_core_memory(filename)
# Log out successful response
print(f"Got successful response from client: \n\n{response}")


@retry_until_success(max_attempts=5, sleep_time_seconds=2)
def test_openai_gpt_4o_summarize_memory():
filename = os.path.join(llm_config_dir, "openai-gpt-4o.json")
response = check_agent_summarize_memory_simple(filename)
print(f"Got successful response from client: \n\n{response}")


@retry_until_success(max_attempts=5, sleep_time_seconds=2)
def test_embedding_endpoint_openai():
filename = os.path.join(embedding_config_dir, "openai_embed.json")
run_embedding_endpoint(filename)
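For reference, the retry_until_success decorator added in this commit is self-contained and can be exercised outside pytest. A small standalone sketch under that assumption, reproducing the decorator (minus the terminal color codes) and applying it to flaky_call, a made-up function that fails twice before succeeding:

```python
import functools
import time


def retry_until_success(max_attempts=10, sleep_time_seconds=4):
    """Retry the wrapped function until it succeeds or max_attempts is reached."""

    def decorator_retry(func):
        @functools.wraps(func)
        def wrapper(*args, **kwargs):
            for attempt in range(1, max_attempts + 1):
                try:
                    return func(*args, **kwargs)
                except Exception as e:
                    print(f"Attempt {attempt} failed with error:\n{e}")
                    if attempt == max_attempts:
                        raise  # out of attempts: surface the last failure
                    time.sleep(sleep_time_seconds)

        return wrapper

    return decorator_retry


# Hypothetical flaky function, used only to demonstrate the retry loop.
_calls = {"count": 0}


@retry_until_success(max_attempts=5, sleep_time_seconds=0)
def flaky_call():
    _calls["count"] += 1
    if _calls["count"] < 3:
        raise RuntimeError("transient failure")
    return "ok"


if __name__ == "__main__":
    print(flaky_call())  # prints two failure messages, then "ok"
```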
