jefcoder
diff --git a/‎README.md‎
Lines changed: 9 additions & 4 deletions b/‎README.md‎
Lines changed: 9 additions & 4 deletions
diff --git a/‎code_agent/__pycache__/agent_subtask_executor.cpython-311.pyc‎
33 Bytes b/‎code_agent/__pycache__/agent_subtask_executor.cpython-311.pyc‎
33 Bytes
diff --git a/‎code_agent/__pycache__/function_validator.cpython-311.pyc‎
2.15 KB b/‎code_agent/__pycache__/function_validator.cpython-311.pyc‎
2.15 KB
diff --git a/‎code_agent/__pycache__/logging_handler.cpython-311.pyc‎
0 Bytes b/‎code_agent/__pycache__/logging_handler.cpython-311.pyc‎
0 Bytes
diff --git a/‎code_agent/agent_subtask_executor.py‎
Lines changed: 92 additions & 81 deletions b/‎code_agent/agent_subtask_executor.py‎
Lines changed: 92 additions & 81 deletions
@@ -54,13 +54,20 @@ AutoCodeAgent allows you to handle complex tasks such as:
 
 - *"I want to review the picture on Wikipedia for three different actors. Use browser_navigation to visit each actor's Wikipedia page, and please use your vision capability to guess the actor's age in the picture. Your goal is to guess the actor's age in the picture. Then, create a summary in which you compare the age guessed from the picture with the actor's actual age. Once you have completed the report, send it by email to (your_email). The actors are: Brad Pitt, Robert De Niro, Marlon Brando. Good luck!"*
 
-- *"Visit 4 different electronics e-commerce sites to get the average price of the top 3 search results for the query: iPhone 13 Pro. The websites are: https://www.bestbuy.com/, https://www.croma.com/, https://www.mediaworld.it/, https://www.boulanger.com/. Then, provide me with a price comparison report. If you find a currency other than the euro, search Google for the latest exchange rate and convert the prices. Finally, save the report in the simple rag database and send me the same report via email to (your_email)"*
+- *"Navigate with the browser to different electronics e-commerce sites to get the average price of the top 3 search results for the query: iPhone 13 Pro. The websites are: https://www.bestbuy.com/, https://www.croma.com/, https://www.mediaworld.it/, https://www.boulanger.com/. Then, provide me with a price comparison report. If you find a currency other than the euro, search Google for the latest exchange rate and convert the prices. Finally, save the report in the LlamaIndex database and send me the same report via email to (your_email)"*
 
 - *"Go to LinkedIn Feed and log in using your email (your_email) and password (your_password). Scroll down to the first post and leave a comment that is both intelligent and contextually relevant, taking into account the text and image. Your comment must contain at least 40 words. Once you have posted your comment, email the execution result to (your_email)."*
 
 - *"Please visit Booking.com and search for a hotel in Milan that is available from June 1st to June 10th. Extract the name and price of the first hotel in the results. Then save it in the simple RAG database and send an email to (your_email) with the hotel's name and price."*
 
-- *"Calculate the area of the triangle formed by Paris, Moscow, and Rome in square kilometers, and send me an email at samuele.giampieri1@gmail.com with the coordinates of the cities and the calculated area."*
+- *"Calculate the area of the triangle formed by Paris, Moscow, and Rome in square kilometers, and send me an email at your_email@gmail.com with the coordinates of the cities and the calculated area."*
+
+- *"Search for the latest news about OpenAI, summarize it, and send me an email at your_email@gmail.com with the summary."*
+
+- *"Search for the latest articles on cybersecurity, extract full-page content along with any notable images and captions using your web search and browser navigation tools, compile everything into an HTML report, and send it via email to my team at your_email@gmail.com with the subject 'Cybersecurity Trends Update'."*
+
+- *"Search for the latest news about the latest Ferrari model, summarize it, and save it in the LlamaIndex database. After that, make 3 different queries on the database to check if the information was stored correctly. Finally, send me a report by email to your_email@gmail.com"*
+
 
 AutoCodeAgent 2.0 introduces RAG (Retrieval-Augmented Generation) capabilities, empowering the system with multiple RAG techniques, each having its own ingestion and retrieval tools.
 The system uses several persistent databases integrated in Docker, such as ChromaDB (vector), Neo4j (graph), and others.
@@ -634,5 +641,3 @@ We welcome contributions from the community! If you'd like to contribute, please
 By contributing, you agree that your changes will be licensed under the same license as the project.
 
 Thank you for helping improve this project! 🚀
-
-
 
@@ -1,5 +1,5 @@
 import json
-import traceback
+import re
 import inspect
 from .function_validator import FunctionValidator
 from models.models import call_model
@@ -19,43 +19,97 @@ def __init__(self, agent):
             lib_name for tool in self.agent.tools for lib_name in tool["lib_names"]
         ]
 
+
+ 
     def execute_subtasks(self):
-        """
-        Iterates over the subtasks in the JSON plan, validates each subtask’s code,
-        attempts to execute it (with regeneration on error), and then calls the subtask function.
+            """
+            Iterates over the subtasks in the JSON plan, validates each subtask’s code,
+            executes it (with regeneration on error based on in-memory log inspection),
+            and then calls the subtask function.
 
-        :return: A dictionary with the results of the executed subtasks.
-        """
-        results = {}
-        subtasks = self.agent.json_plan.get("subtasks", [])
-
-        for index, subtask in enumerate(subtasks):
-            # --- Step 1: Validate subtask code ---
-            output_validator, subtask = self._validate_subtask_code(subtask, index, results)
-            code_string = output_validator["code_string"]
-
-            # --- Step 2: Execute the subtask code (with retries) ---
-            temp_namespace, code_string = self._execute_subtask_code(subtask, code_string, index)
-
-            # --- Step 3: Run the subtask function from the namespace ---
-            subtask_name = subtask["subtask_name"]
-            input_tool_name = subtask.get("input_from_subtask", "")
-            if subtask_name in temp_namespace:
-                tool_func = temp_namespace[subtask_name]
-                sig = inspect.signature(tool_func)
-                if index > 0:
-                    previous_result = results.get(input_tool_name, {})
-                    result = tool_func(previous_result)
-                else:
-                    if "previous_output" in sig.parameters:
-                        result = tool_func({})
+            :return: A dictionary with the results of the executed subtasks.
+            """
+            results = {}
+            subtasks = self.agent.json_plan.get("subtasks", [])
+
+            error_pattern = re.compile(r"\[ERROR\]")
+
+            for index, subtask in enumerate(subtasks):
+                # --- Step 1: Validate subtask code ---
+                output_validator, subtask = self._validate_subtask_code(subtask, index, results)
+                code_string = output_validator["code_string"]
+
+                subtask_name = subtask["subtask_name"]
+                input_tool_name = subtask.get("input_from_subtask", "")
+                attempts = 0
+                success = False
+
+                # Regeneration loop for execution errors (based on log inspection)
+                while attempts < self.execution_max_regeneration_attempts and not success:
+                    # --- Step 2: Execute the subtask code ---
+                    temp_namespace, code_string = self._execute_subtask_code(subtask, code_string, index)
+
+                    if subtask_name not in temp_namespace:
+                        error_msg = f"Subtask '{subtask_name}' not found in the execution namespace."
+                        self.agent.logger.error(
+                            self.agent.enrich_log(error_msg, "add_red_divider"),
+                            extra={'no_memory': True}
+                        )
+                        raise Exception(error_msg)
+
+                    tool_func = temp_namespace[subtask_name]
+                    sig = inspect.signature(tool_func)
+
+                    log_start_index = len(self.agent.execution_logs)
+
+                    # --- Step 3: Call the subtask function ---
+                    if index > 0:
+                        previous_result = results.get(input_tool_name, {})
+                        result = tool_func(previous_result)
+                    else:
+                        if "previous_output" in sig.parameters:
+                            result = tool_func({})
+                        else:
+                            result = tool_func()
+                    results[subtask_name] = result
+
+                    # After calling the function, retrieve new log entries.
+                    new_logs = self.agent.execution_logs[log_start_index:]
+                    if any(error_pattern.search(log) for log in new_logs):
+                        error_message = "\n".join(new_logs)
+                        self.agent.logger.error(
+                            self.agent.enrich_log(
+                                f"❌ Errors found after executing subtask '{subtask_name}' "
+                                f"(attempt {attempts + 1}/{self.execution_max_regeneration_attempts}):\n{error_message}",
+                                "add_red_divider"
+                            ),
+                            extra={'no_memory': True} 
+                        )
+                        # Regenerate the subtask code based on the error logs.
+                        regen_subtask = self.regenerate_subtask(error_message, subtask)
+                        self._update_subtask_in_plan(subtask_name, regen_subtask)
+                        subtask = regen_subtask
+                        code_string = subtask["code"]
+                        attempts += 1
                     else:
-                        result = tool_func()
-                results[subtask_name] = result
+                        success = True
+
+                if not success:
+                    error_msg = (
+                        f"❌❌❌ Subtask '{subtask_name}' still fails after {attempts} execution regeneration attempts."
+                    )
+                    self.agent.logger.error(
+                        self.agent.enrich_log(error_msg, "add_red_divider"),
+                        extra={'no_memory': True}
+                    )
+                    raise Exception(error_msg)
 
-                results_str = json.dumps(results, indent=4) 
+                # --- Logging the successful execution ---
+                results_str = json.dumps(results, indent=4)
                 if index == len(subtasks) - 1:
-                    self.agent.logger.info(f"✅ Last subtask '{subtask_name}' executed successfully. this is the final result: {results_str}")
+                    self.agent.logger.info(
+                        f"✅ Last subtask '{subtask_name}' executed successfully. This is the final result: {results_str}"
+                    )
                 if len(results_str) > 500:
                     results_str = results_str[:500] + "... [truncated]"
 
@@ -68,15 +122,9 @@ def execute_subtasks(self):
                     ),
                     extra={'no_memory': True}
                 )
-            else:
-                error_msg = f"Subtask '{subtask_name}' not found in the execution namespace."
-                self.agent.logger.error(
-                    self.agent.enrich_log(error_msg, "add_red_divider"),
-                    extra={'no_memory': True}
-                )
-                raise Exception(error_msg)
 
-        return results
+            return results
+
 
     def _update_subtask_in_plan(self, subtask_name, new_subtask):
         """
@@ -170,18 +218,7 @@ def _validate_subtask_code(self, subtask, index, results):
         return output_validator, subtask
 
     def _execute_subtask_code(self, subtask, code_string, index):
-        """
-        Executes the code string within a dedicated namespace and attempts regeneration if an error occurs.
-
-        :param subtask: The current subtask (a dict).
-        :param code_string: The Python code (as a string) to execute.
-        :param index: The index of the current subtask.
-        :return: A tuple (temp_namespace, code_string) where temp_namespace is the dictionary in which the code was executed.
-        :raises Exception: If execution fails after the maximum regeneration attempts.
-        """
-        attempts = 0
         temp_namespace = {"logger": self.agent.logger}
-
         self.agent.logger.info(
             self.agent.enrich_log(
                 f"⌛ Executing subtask nr.{index + 1} of {len(self.agent.json_plan.get('subtasks', []))}: {subtask['subtask_name']}",
@@ -190,35 +227,9 @@ def _execute_subtask_code(self, subtask, code_string, index):
             extra={'no_memory': True}
         )
 
-        while attempts < self.execution_max_regeneration_attempts:
-            try:
-                exec(code_string, temp_namespace)
-                return temp_namespace, code_string
-            except Exception:
-                error_message = traceback.format_exc()
-                self.agent.logger.error(
-                    self.agent.enrich_log(
-                        f"❌ Error during execution of subtask '{subtask['subtask_name']}' "
-                        f"(attempt {attempts + 1}/{self.execution_max_regeneration_attempts}):\n{error_message}",
-                        "add_red_divider"
-                    ),
-                    extra={'no_memory': True}
-                )
-                regen_subtask = self.regenerate_subtask(error_message, subtask)
-                self._update_subtask_in_plan(subtask["subtask_name"], regen_subtask)
-                # In this case we assume that the regenerated subtask has an updated "code" field.
-                code_string = regen_subtask["code"]
-                attempts += 1
-
-        error_msg = (
-            f"❌❌❌ Subtask '{subtask['subtask_name']}' still fails after "
-            f"{attempts} execution regeneration attempts."
-        )
-        self.agent.logger.error(
-            self.agent.enrich_log(error_msg, "add_red_divider"),
-            extra={'no_memory': True}
-        )
-        raise Exception(error_msg)
+        exec(code_string, temp_namespace)
+        return temp_namespace, code_string
+
 
     def regenerate_subtask(self, subtask_errors, subtask):
         """