From dc7c3b1f641898dc588afaffa35f68e36e5ca01b Mon Sep 17 00:00:00 2001
From: Alexander Dibrov <108030031+dibrale@users.noreply.github.com>
Date: Thu, 27 Apr 2023 19:37:28 -0500
Subject: [PATCH 1/2] Fix for silent llama

Fix for prioritization agent deleting priority list when returning empty output. Prompt engineering and parameter improvements to reduce number of empty responses from llama models. More debug output.
---
 babyagi.py | 85 ++++++++++++++++++++++++++++++++++--------------------
 1 file changed, 54 insertions(+), 31 deletions(-)

diff --git a/babyagi.py b/babyagi.py
index bcc44306..594e278a 100755
--- a/babyagi.py
+++ b/babyagi.py
@@ -46,6 +46,7 @@
 # Model configuration
 OPENAI_TEMPERATURE = float(os.getenv("OPENAI_TEMPERATURE", 0.0))
 
+
 # Extensions support begin
 
 def can_import(module_name):
@@ -66,6 +67,7 @@ def can_import(module_name):
 if ENABLE_COMMAND_LINE_ARGS:
     if can_import("extensions.argparseext"):
         from extensions.argparseext import parse_arguments
+
         OBJECTIVE, INITIAL_TASK, LLM_MODEL, DOTENV_EXTENSIONS, INSTANCE_NAME, COOPERATIVE_MODE, JOIN_EXISTING_OBJECTIVE = parse_arguments()
 
 # Human mode extension
@@ -80,6 +82,7 @@ def can_import(module_name):
 if DOTENV_EXTENSIONS:
     if can_import("extensions.dotenvext"):
         from extensions.dotenvext import load_dotenv_extensions
+
         load_dotenv_extensions(DOTENV_EXTENSIONS)
 
 # TODO: There's still work to be done here to enable people to get
@@ -106,22 +109,26 @@ def can_import(module_name):
         print(f"LLAMA : {LLAMA_MODEL_PATH}" + "\n")
         assert os.path.exists(LLAMA_MODEL_PATH), "\033[91m\033[1m" + f"Model can't be found." + "\033[0m\033[0m"
 
-        CTX_MAX = 2048
+        CTX_MAX = 1024
         LLAMA_THREADS_NUM = int(os.getenv("LLAMA_THREADS_NUM", 8))
+
+        print('Initialize model for evaluation')
         llm = Llama(
             model_path=LLAMA_MODEL_PATH,
             n_ctx=CTX_MAX,
             n_threads=LLAMA_THREADS_NUM,
             n_batch=512,
-            use_mlock=True,
+            use_mlock=False,
         )
+
+        print('\nInitialize model for embedding')
         llm_embed = Llama(
             model_path=LLAMA_MODEL_PATH,
             n_ctx=CTX_MAX,
             n_threads=LLAMA_THREADS_NUM,
             n_batch=512,
             embedding=True,
-            use_mlock=True,
+            use_mlock=False,
         )
 
         print(
@@ -284,8 +291,10 @@ def get_task_names(self):
     if can_import("extensions.ray_tasks"):
         import sys
         from pathlib import Path
+
         sys.path.append(str(Path(__file__).resolve().parent))
         from extensions.ray_tasks import CooperativeTaskListStorage
+
         tasks_storage = CooperativeTaskListStorage(OBJECTIVE)
         print("\nReplacing tasks storage: " + "\033[93m\033[1m" + "Ray" + "\033[0m\033[0m")
 elif COOPERATIVE_MODE in ['d', 'distributed']:
@@ -314,8 +323,18 @@ def openai_call(
     while True:
         try:
             if model.lower().startswith("llama"):
-                result = llm(prompt[:CTX_MAX], stop=["### Human"], echo=False, temperature=0.2)
-                return str(result['choices'][0]['text'].strip())
+                result = llm(prompt[:CTX_MAX],
+                             stop=["### Human"],
+                             echo=False,
+                             temperature=0.2,
+                             top_k=40,
+                             top_p=0.95,
+                             repeat_penalty=1.05,
+                             max_tokens=200)
+                # print('\n*****RESULT JSON DUMP*****\n')
+                # print(json.dumps(result))
+                # print('\n')
+                return result['choices'][0]['text'].strip()
             elif model.lower().startswith("human"):
                 return user_input_await(prompt)
             elif not model.lower().startswith("gpt-"):
@@ -384,7 +403,6 @@ def openai_call(
 def task_creation_agent(
         objective: str, result: Dict, task_description: str, task_list: List[str]
 ):
-
     prompt = f"""
 You are to use the result from an execution agent to create new tasks with the following objective: {objective}.
 The last completed task has the result: \n{result["data"]}
@@ -392,22 +410,22 @@ def task_creation_agent(
 
     if task_list:
         prompt += f"These are incomplete tasks: {', '.join(task_list)}\n"
-    prompt += "Based on the result, create a list of new tasks to be completed in order to meet the objective. "
+    prompt += "Based on the result, return a list of tasks to be completed in order to meet the objective. "
     if task_list:
         prompt += "These new tasks must not overlap with incomplete tasks. "
 
     prompt += """
-Return all the new tasks, with one task per line in your response. The result must be a numbered list in the format:
-    
+Return one task per line in your response. The result must be a numbered list in the format:
+
 #. First task
 #. Second task
-        
-The number of each entry must be followed by a period.
-Do not include any headers before your numbered list. Do not follow your numbered list with any other output."""
 
-    print(f'\n************** TASK CREATION AGENT PROMPT *************\n{prompt}\n')
+The number of each entry must be followed by a period. If your list is empty, write "There are no tasks to add at this time."
+Unless your list is empty, do not include any headers before your numbered list or follow your numbered list with any other output."""
+
+    print(f'\n*****TASK CREATION AGENT PROMPT****\n{prompt}\n')
     response = openai_call(prompt, max_tokens=2000)
-    print(f'\n************* TASK CREATION AGENT RESPONSE ************\n{response}\n')
+    print(f'\n****TASK CREATION AGENT RESPONSE****\n{response}\n')
     new_tasks = response.split('\n')
     new_tasks_list = []
     for task_string in new_tasks:
@@ -426,23 +444,26 @@ def task_creation_agent(
 def prioritization_agent():
     task_names = tasks_storage.get_task_names()
     next_task_id = tasks_storage.next_task_id()
+    bullet_string = '\n'
 
     prompt = f"""
-You are tasked with cleaning the format and re-prioritizing the following tasks: {', '.join(task_names)}.
+You are tasked with prioritizing the following tasks: {bullet_string + bullet_string.join(task_names)}
 Consider the ultimate objective of your team: {OBJECTIVE}.
-Tasks should be sorted from highest to lowest priority. 
-Higher-priority tasks are those that act as pre-requisites or are more essential for meeting the objective.
-Do not remove any tasks. Return the result as a numbered list in the format:
+Tasks should be sorted from highest to lowest priority, where higher-priority tasks are those that act as pre-requisites or are more essential for meeting the objective.
+Do not remove any tasks. Return the ranked tasks as a numbered list in the format:
 
 #. First task
 #. Second task
 
-The entries are consecutively numbered, starting with 1. The number of each entry must be followed by a period.
-Do not include any headers before your numbered list. Do not follow your numbered list with any other output."""
+The entries must be consecutively numbered, starting with 1. The number of each entry must be followed by a period.
+Do not include any headers before your ranked list or follow your list with any other output."""
 
-    print(f'\n************** TASK PRIORITIZATION AGENT PROMPT *************\n{prompt}\n')
+    print(f'\n****TASK PRIORITIZATION AGENT PROMPT****\n{prompt}\n')
     response = openai_call(prompt, max_tokens=2000)
-    print(f'\n************* TASK PRIORITIZATION AGENT RESPONSE ************\n{response}\n')
+    print(f'\n****TASK PRIORITIZATION AGENT RESPONSE****\n{response}\n')
+    if not response:
+        print('Received empty response from priotritization agent. Keeping task list unchanged.')
+        return
     new_tasks = response.split("\n") if "\n" in response else [response]
     new_tasks_list = []
     for task_string in new_tasks:
@@ -453,7 +474,7 @@ def prioritization_agent():
             if task_name.strip():
                 new_tasks_list.append({"task_id": task_id, "task_name": task_name})
 
-    tasks_storage.replace(new_tasks_list)
+    return new_tasks_list
 
 
 # Execute a task based on the objective and five previous tasks
@@ -469,15 +490,14 @@ def execution_agent(objective: str, task: str) -> str:
         str: The response generated by the AI for the given task.
 
     """
-    
+
     context = context_agent(query=objective, top_results_num=5)
-    # print("\n*******RELEVANT CONTEXT******\n")
+    # print("\n****RELEVANT CONTEXT****\n")
     # print(context)
     # print('')
     prompt = f'Perform one task based on the following objective: {objective}.\n'
     if context:
-        prompt += 'Take into account these previously completed tasks:' + '\n'.join(context)\
-
+        prompt += 'Take into account these previously completed tasks:' + '\n'.join(context)
     prompt += f'\nYour task: {task}\nResponse:'
     return openai_call(prompt, max_tokens=2000)
 
@@ -496,7 +516,7 @@ def context_agent(query: str, top_results_num: int):
 
     """
     results = results_storage.query(query=query, top_results_num=top_results_num)
-    # print("***** RESULTS *****")
+    # print("****RESULTS****")
     # print(results)
     return results
 
@@ -537,7 +557,7 @@ def main():
             }
             # extract the actual result from the dictionary
             # since we don't do enrichment currently
-            # vector = enriched_result["data"]  
+            # vector = enriched_result["data"]
 
             result_id = f"result_{task['task_id']}"
 
@@ -558,9 +578,12 @@ def main():
                 print(str(new_task))
                 tasks_storage.append(new_task)
 
-            if not JOIN_EXISTING_OBJECTIVE: prioritization_agent()
+            if not JOIN_EXISTING_OBJECTIVE:
+                prioritized_tasks = prioritization_agent()
+                if prioritized_tasks:
+                    tasks_storage.replace(prioritized_tasks)
 
-        # Sleep a bit before checking the task list again
+            # Sleep a bit before checking the task list again
             time.sleep(5)
         else:
             print('Done.')

From e3d0f479135b84d0b46c0fcf06913cfd8cf375ad Mon Sep 17 00:00:00 2001
From: Alexander Dibrov <108030031+dibrale@users.noreply.github.com>
Date: Sun, 30 Apr 2023 21:09:48 -0500
Subject: [PATCH 2/2] Revert prompt changes

At the request of the maintainer
---
 babyagi.py | 29 ++++++++++++++++-------------
 1 file changed, 16 insertions(+), 13 deletions(-)

diff --git a/babyagi.py b/babyagi.py
index f4638789..af5ca683 100755
--- a/babyagi.py
+++ b/babyagi.py
@@ -1,5 +1,6 @@
 #!/usr/bin/env python3
 from dotenv import load_dotenv
+
 # Load default environment variables (.env)
 load_dotenv()
 
@@ -18,8 +19,8 @@
 
 # default opt out of chromadb telemetry.
 from chromadb.config import Settings
-client = chromadb.Client(Settings(anonymized_telemetry=False))
 
+client = chromadb.Client(Settings(anonymized_telemetry=False))
 
 # Engine configuration
 
@@ -175,6 +176,8 @@ def can_import(module_name):
 class LlamaEmbeddingFunction(EmbeddingFunction):
     def __init__(self):
         return
+
+
     def __call__(self, texts: Documents) -> Embeddings:
         embeddings = []
         for t in texts:
@@ -424,18 +427,18 @@ def task_creation_agent(
 
     if task_list:
         prompt += f"These are incomplete tasks: {', '.join(task_list)}\n"
-    prompt += "Based on the result, return a list of tasks to be completed in order to meet the objective. "
+    prompt += "Based on the result, create a list of new tasks to be completed in order to meet the objective. "
     if task_list:
         prompt += "These new tasks must not overlap with incomplete tasks. "
 
     prompt += """
-Return one task per line in your response. The result must be a numbered list in the format:
-
+Return all the new tasks, with one task per line in your response. The result must be a numbered list in the format:
+    
 #. First task
 #. Second task
-
-The number of each entry must be followed by a period. If your list is empty, write "There are no tasks to add at this time."
-Unless your list is empty, do not include any headers before your numbered list or follow your numbered list with any other output."""
+        
+The number of each entry must be followed by a period.
+Do not include any headers before your numbered list. Do not follow your numbered list with any other output."""
 
     print(f'\n*****TASK CREATION AGENT PROMPT****\n{prompt}\n')
     response = openai_call(prompt, max_tokens=2000)
@@ -458,19 +461,19 @@ def task_creation_agent(
 def prioritization_agent():
     task_names = tasks_storage.get_task_names()
     next_task_id = tasks_storage.next_task_id()
-    bullet_string = '\n'
 
     prompt = f"""
-You are tasked with prioritizing the following tasks: {bullet_string + bullet_string.join(task_names)}
+You are tasked with cleaning the format and re-prioritizing the following tasks: {', '.join(task_names)}.
 Consider the ultimate objective of your team: {OBJECTIVE}.
-Tasks should be sorted from highest to lowest priority, where higher-priority tasks are those that act as pre-requisites or are more essential for meeting the objective.
-Do not remove any tasks. Return the ranked tasks as a numbered list in the format:
+Tasks should be sorted from highest to lowest priority. 
+Higher-priority tasks are those that act as pre-requisites or are more essential for meeting the objective.
+Do not remove any tasks. Return the result as a numbered list in the format:
 
 #. First task
 #. Second task
 
-The entries must be consecutively numbered, starting with 1. The number of each entry must be followed by a period.
-Do not include any headers before your ranked list or follow your list with any other output."""
+The entries are consecutively numbered, starting with 1. The number of each entry must be followed by a period.
+Do not include any headers before your numbered list. Do not follow your numbered list with any other output."""
 
     print(f'\n****TASK PRIORITIZATION AGENT PROMPT****\n{prompt}\n')
     response = openai_call(prompt, max_tokens=2000)