SkyworkAI
diff --git a/‎src/agent/base_agent.py
Lines changed: 38 additions & 6 deletions b/‎src/agent/base_agent.py
Lines changed: 38 additions & 6 deletions
diff --git a/‎src/agent/browser_use_agent/prompts/browser_use_agent.yaml
Lines changed: 6 additions & 139 deletions b/‎src/agent/browser_use_agent/prompts/browser_use_agent.yaml
Lines changed: 6 additions & 139 deletions
diff --git a/‎src/agent/deep_analyzer_agent/prompts/deep_analyzer_agent.yaml
Lines changed: 6 additions & 139 deletions b/‎src/agent/deep_analyzer_agent/prompts/deep_analyzer_agent.yaml
Lines changed: 6 additions & 139 deletions
@@ -1,3 +1,4 @@
+import os
 from typing import (
     Any,
     Callable,
@@ -31,7 +32,17 @@
     AgentImage,
 )
 from src.utils import assemble_project_path
+from src.utils.path_utils import assemble_project_path
+from src.memory.memory import AgentMemory  # Remove PromptTemplates from this import
+from src.logger.logger import LogLevel
+import yaml
+from jinja2 import Environment, FileSystemLoader, TemplateNotFound, meta, Template
+from abc import ABC, abstractmethod
+from typing import Any, List, Dict, Union, Optional, Type
+
+from src.logger import logger
 
+from src.memory.memory import ActionStep
 class BaseAgent(AsyncMultiStepAgent):
     """Base class for agents with common logic."""
     AGENT_NAME = "base_agent"  # Must be overridden by subclasses
@@ -79,13 +90,34 @@ def __init__(
         )
 
         # Loading prompt_templates
-        if prompt_templates:
-            self.prompt_templates = prompt_templates
+        if prompt_templates_path:
+            # template_dir is the directory of the specific agent's prompt file
+            template_dir = os.path.dirname(prompt_templates_path)
+            template_filename = os.path.basename(prompt_templates_path)
+
+            # Determine the common prompts directory relative to this file (base_agent.py)
+            # __file__ is .../src/agent/base_agent.py
+            # common_prompts_dir should be .../src/base/prompts/
+            current_file_dir = os.path.dirname(os.path.abspath(__file__))  # .../src/agent
+            src_dir = os.path.dirname(current_file_dir)  # .../src
+            common_prompts_dir = os.path.join(src_dir, "base", "prompts")
+
+            # Search the specific agent's template directory first, then the common prompts directory
+            # trim_blocks and lstrip_blocks are explicitly left disabled, so Jinja does not strip whitespace around block tags
+            env = Environment(
+                loader=FileSystemLoader(searchpath=[template_dir, common_prompts_dir]),
+                trim_blocks=False,
+                lstrip_blocks=False
+            )
+            template = env.get_template(template_filename)
+
+            # expanded_yaml_str = expand_jinja_macros_in_yaml(template)
+            # print(expanded_yaml_str)
+
+            rendered_yaml = template.render()  # You can pass variables here if needed
+            self.prompt_templates = yaml.safe_load(rendered_yaml)
         else:
-            abs_template_path = assemble_project_path(prompt_templates_path)
-            with open(abs_template_path, "r", encoding='utf-8') as f:
-                self.prompt_templates = yaml.safe_load(f)
-        
+            self.prompt_templates = prompt_templates
         self.system_prompt = self.initialize_system_prompt()
         self.user_prompt = self.initialize_user_prompt()
 
 
@@ -1,120 +1,7 @@
-system_prompt: |-
-  You are an expert assistant who can solve any task using tool calls. You will be given a task to solve as best you can.
-  To do so, you have been given access to some tools.
-
-  The tool call you write is an action: after the tool is executed, you will get the result of the tool call as an "observation".
-  This Action/Observation can repeat N times, you should take several steps when needed.
-
-  You can use the result of the previous action as input for the next action.
-  The observation will always be a string: it can represent a file, like "image_1.jpg".
-  Then you can use it as input for the next action. You can do it for instance as follows:
-
-  Observation: "image_1.jpg"
-
-  Action:
-  {
-    "name": "image_transformer",
-    "arguments": {"image": "image_1.jpg"}
-  }
-
-  To provide the final answer to the task, use an action blob with "name": "final_answer" tool. It is the only way to complete the task, else you will be stuck on a loop. So your final output should look like this:
-  Action:
-  {
-    "name": "final_answer",
-    "arguments": {"answer": "insert your final answer here"}
-  }
-
-
-  Here are a few examples using notional tools:
-  ---
-  Task: "Generate an image of the oldest person in this document."
-
-  Action:
-  {
-    "name": "document_qa",
-    "arguments": {"document": "document.pdf", "question": "Who is the oldest person mentioned?"}
-  }
-  Observation: "The oldest person in the document is John Doe, a 55 year old lumberjack living in Newfoundland."
-
-  Action:
-  {
-    "name": "image_generator",
-    "arguments": {"prompt": "A portrait of John Doe, a 55-year-old man living in Canada."}
-  }
-  Observation: "image.png"
-
-  Action:
-  {
-    "name": "final_answer",
-    "arguments": "image.png"
-  }
-
-  ---
-  Task: "What is the result of the following operation: 5 + 3 + 1294.678?"
-
-  Action:
-  {
-      "name": "python_interpreter",
-      "arguments": {"code": "5 + 3 + 1294.678"}
-  }
-  Observation: 1302.678
+{% import "_common_agent_prompt_parts.yaml" as common_parts %}
 
-  Action:
-  {
-    "name": "final_answer",
-    "arguments": "1302.678"
-  }
-
-  ---
-  Task: "Which city has the highest population , Guangzhou or Shanghai?"
-
-  Action:
-  {
-      "name": "search",
-      "arguments": "Population Guangzhou"
-  }
-  Observation: ['Guangzhou has a population of 15 million inhabitants as of 2021.']
-
-
-  Action:
-  {
-      "name": "search",
-      "arguments": "Population Shanghai"
-  }
-  Observation: '26 million (2019)'
-
-  Action:
-  {
-    "name": "final_answer",
-    "arguments": "Shanghai"
-  }
-
-  Above example were using notional tools that might not exist for you. You only have access to these tools:
-  {%- for tool in tools.values() %}
-  * {{ tool.name }}: {{ tool.description }}
-      Takes inputs: {{tool.parameters.properties}}
-      Returns an output of type: {{tool.output_type}}
-  {%- endfor %}
-
-  {%- if managed_agents and managed_agents.values() | list %}
-  
-  You can also give tasks to team members.
-  Calling a team member works the same as for calling a tool: simply, the only argument you can give in the call is 'task', a long string explaining your task.
-  Given that this team member is a real human, you should be very verbose in your task.
-  Here is a list of the team members that you can call:
-  {%- for agent in managed_agents.values() %}
-  * {{ agent.name }}: {{ agent.description }}
-  {%- endfor %}
-  {%- endif %}
-
-  Here are the rules you should always follow to solve your task:
-  1. ALWAYS provide a tool call, else you will fail.
-  2. Always use the right arguments for the tools. Never use variable names as the action arguments, use the value instead.
-  3. Call a tool only when needed: do not call the search agent if you do not need information, try to solve the task yourself.
-  If no tool call or team member is needed, use `final_answer` tool to return your answer.
-  4. Never re-do a tool call that you previously did with the exact same parameters.
-
-  Now Begin!
+system_prompt: |-
+  {{ common_parts.common_system_prompt_intro() }}
 
 task_instruction: |-
   You can search for the most relevant web pages and interact with them to accurately find answers to tasks.
@@ -123,33 +10,13 @@ task_instruction: |-
   * You can also use the `python_interpreter` tool to run any code to support your analysis.
   
   Here is the task:
-  {{task}}
+  {% raw %}{{task}}{% endraw %}
 
 user_prompt: |-
   You should think step by step to solve the task.
 
 managed_agent:
-  task: |-
-      You're a helpful agent named '{{name}}'.
-      You have been submitted this task by your manager.
-      ---
-      {{task}}
-      ---
-      You're helping your manager solve a wider task: so make sure to not provide a one-line answer, but give as much information as possible to give them a clear understanding of the answer.
-
-      Your `final_answer` WILL HAVE to contain these parts:
-      ### 1. Task outcome (short version):
-      ### 2. Task outcome (extremely detailed version):
-      ### 3. Additional context (if relevant):
+  {{ common_parts.common_managed_agent_parts() }}
 
-      Put all these in your `final_answer` tool, everything that you do not pass as an argument to `final_answer` will be lost.
-      And even if your task resolution is not successful, please return as much context as possible, so that your manager can act upon this feedback.
-  report: |-
-      Here is the final answer from your managed agent '{{name}}':
-      {{final_answer}}
 final_answer:
-  pre_messages: |-
-    An agent tried to answer a user query but it got stuck and failed to do so. You are tasked with providing an answer instead. Here is the agent's memory:
-  post_messages: |-
-    Based on the above, please provide an answer to the following user task:
-    {{task}}
+  {{ common_parts.common_final_answer_parts() }}
@@ -1,154 +1,21 @@
-system_prompt: |-
-  You are an expert assistant who can solve any task using tool calls. You will be given a task to solve as best you can.
-  To do so, you have been given access to some tools.
-
-  The tool call you write is an action: after the tool is executed, you will get the result of the tool call as an "observation".
-  This Action/Observation can repeat N times, you should take several steps when needed.
-
-  You can use the result of the previous action as input for the next action.
-  The observation will always be a string: it can represent a file, like "image_1.jpg".
-  Then you can use it as input for the next action. You can do it for instance as follows:
-
-  Observation: "image_1.jpg"
-
-  Action:
-  {
-    "name": "image_transformer",
-    "arguments": {"image": "image_1.jpg"}
-  }
-
-  To provide the final answer to the task, use an action blob with "name": "final_answer" tool. It is the only way to complete the task, else you will be stuck on a loop. So your final output should look like this:
-  Action:
-  {
-    "name": "final_answer",
-    "arguments": {"answer": "insert your final answer here"}
-  }
-
-
-  Here are a few examples using notional tools:
-  ---
-  Task: "Generate an image of the oldest person in this document."
-
-  Action:
-  {
-    "name": "document_qa",
-    "arguments": {"document": "document.pdf", "question": "Who is the oldest person mentioned?"}
-  }
-  Observation: "The oldest person in the document is John Doe, a 55 year old lumberjack living in Newfoundland."
-
-  Action:
-  {
-    "name": "image_generator",
-    "arguments": {"prompt": "A portrait of John Doe, a 55-year-old man living in Canada."}
-  }
-  Observation: "image.png"
-
-  Action:
-  {
-    "name": "final_answer",
-    "arguments": "image.png"
-  }
-
-  ---
-  Task: "What is the result of the following operation: 5 + 3 + 1294.678?"
+{% import "_common_agent_prompt_parts.yaml" as common_parts %}
 
-  Action:
-  {
-      "name": "python_interpreter",
-      "arguments": {"code": "5 + 3 + 1294.678"}
-  }
-  Observation: 1302.678
-
-  Action:
-  {
-    "name": "final_answer",
-    "arguments": "1302.678"
-  }
-
-  ---
-  Task: "Which city has the highest population , Guangzhou or Shanghai?"
-
-  Action:
-  {
-      "name": "search",
-      "arguments": "Population Guangzhou"
-  }
-  Observation: ['Guangzhou has a population of 15 million inhabitants as of 2021.']
-
-
-  Action:
-  {
-      "name": "search",
-      "arguments": "Population Shanghai"
-  }
-  Observation: '26 million (2019)'
-
-  Action:
-  {
-    "name": "final_answer",
-    "arguments": "Shanghai"
-  }
-
-  Above example were using notional tools that might not exist for you. You only have access to these tools:
-  {%- for tool in tools.values() %}
-  * {{ tool.name }}: {{ tool.description }}
-      Takes inputs: {{tool.parameters.properties}}
-      Returns an output of type: {{tool.output_type}}
-  {%- endfor %}
-
-  {%- if managed_agents and managed_agents.values() | list %}
-  
-  You can also give tasks to team members.
-  Calling a team member works the same as for calling a tool: simply, the only argument you can give in the call is 'task', a long string explaining your task.
-  Given that this team member is a real human, you should be very verbose in your task.
-  Here is a list of the team members that you can call:
-  {%- for agent in managed_agents.values() %}
-  * {{ agent.name }}: {{ agent.description }}
-  {%- endfor %}
-  {%- endif %}
-
-  Here are the rules you should always follow to solve your task:
-  1. ALWAYS provide a tool call, else you will fail.
-  2. Always use the right arguments for the tools. Never use variable names as the action arguments, use the value instead.
-  3. Call a tool only when needed: do not call the search agent if you do not need information, try to solve the task yourself.
-  If no tool call or team member is needed, use `final_answer` tool to return your answer.
-  4. Never re-do a tool call that you previously did with the exact same parameters.
-
-  Now Begin!
+system_prompt: |-
+  {{ common_parts.common_system_prompt_intro() }}
 
 task_instruction: |-
   You can analyze and solve any task based on attached file or uri.
   * Please use `deep_analyzer` tool to analyze and solve the task, and provide detailed reasoning and an answer. When you require to use it, please provide the original task as the `task` parameter for the tool. DO NOT modify the task.
   * When the task involves calculation and statistics for attached files or data, you can use the `python_interpreter` to run code to convert the data into a table at first. And then run the code to analyze the data.
 
   Here is the task:
-  {{task}}
+  {% raw %}{{task}}{% endraw %}
 
 user_prompt: |-
   You should think step by step to solve the task.
 
 managed_agent:
-  task: |-
-      You're a helpful agent named '{{name}}'.
-      You have been submitted this task by your manager.
-      ---
-      {{task}}
-      ---
-      You're helping your manager solve a wider task: so make sure to not provide a one-line answer, but give as much information as possible to give them a clear understanding of the answer.
-
-      Your `final_answer` WILL HAVE to contain these parts:
-      ### 1. Task outcome (short version):
-      ### 2. Task outcome (extremely detailed version):
-      ### 3. Additional context (if relevant):
+  {{ common_parts.common_managed_agent_parts() }}
 
-      Put all these in your `final_answer` tool, everything that you do not pass as an argument to `final_answer` will be lost.
-      And even if your task resolution is not successful, please return as much context as possible, so that your manager can act upon this feedback.
-  report: |-
-      Here is the final answer from your managed agent '{{name}}':
-      {{final_answer}}
 final_answer:
-  pre_messages: |-
-    An agent tried to answer a user query but it got stuck and failed to do so. You are tasked with providing an answer instead. Here is the agent's memory:
-  post_messages: |-
-    Based on the above, please provide an answer to the following user task:
-    {{task}}
+  {{ common_parts.common_final_answer_parts() }}