MiroMindAI
diff --git a/config/fangda_agent_gaia-validation-text-only_mirothinker_single_agent_rollback_new_tools_toolblacklist.yaml b/config/fangda_agent_gaia-validation-text-only_mirothinker_single_agent_rollback_new_tools_toolblacklist.yaml
Lines changed: 46 additions & 0 deletions
diff --git a/config/fangda_agent_gaia-validation_mirothinker_single_agent_rollback_new_tools_toolblacklist.yaml b/config/fangda_agent_gaia-validation_mirothinker_single_agent_rollback_new_tools_toolblacklist.yaml
Lines changed: 46 additions & 0 deletions
diff --git a/config/prompts/binwang_prompt_main_agent_0128.yaml b/config/prompts/binwang_prompt_main_agent_0128.yaml
Lines changed: 209 additions & 0 deletions
@@ -0,0 +1,46 @@
+# Hydra defaults list: compose the benchmark group, switch Hydra's job logging
+# to its `none` option, and list `_self_` last so the keys in this file are
+# merged after the composed defaults.
+defaults:
+  - benchmark: 'gaia-validation-text-only'
+  - override hydra/job_logging: 'none'
+  - _self_
+
+# Entry point; the value matches the `main_agent` key defined right below.
+entrypoint: main_agent
+main_agent:
+  name: main_agent
+  type: IterativeAgentWithToolAndRollback
+  # Loop limits for the agent.
+  max_consecutive_rollbacks: 3
+  max_turns: 200
+  llm:
+    _base_: config/llm/base_mirothinker.yaml
+  # NOTE(review): the change set that adds this config also adds
+  # config/prompts/binwang_prompt_main_agent_0128.yaml, not the fangda_ file
+  # referenced here -- confirm the referenced prompt exists in the repository.
+  prompt: config/prompts/fangda_prompt_main_agent_0128.yaml
+  tools:
+    - config/tool/tool-search-and-scrape-webpage.yaml
+    - config/tool/tool-jina-scrape-llm-summary.yaml
+    - config/tool/tool-python.yaml
+  # One (server, tool) pair per entry.
+  tool_blacklist:
+    - {server: tool-search-and-scrape-webpage, tool: sogou_search}
+    - {server: tool-python, tool: download_file_from_sandbox_to_local}
+  # Processors are pulled in by interpolation from the top-level nodes of the
+  # same names; the output processors are listed in sequence.
+  input_processor: ['${input-message-generator}']
+  output_processor:
+    - '${output-summary}'
+    - '${output-final-answer-extraction}'
+    - '${output-exceed-max-turn-summary}'
+
+# Processor nodes referenced from main_agent through ${...} interpolation.
+input-message-generator: {type: InputMessageGenerator}
+output-summary: {type: SummaryGenerator}
+output-final-answer-extraction: {type: RegexBoxedExtractor}
+# Unlike the nodes above, this one carries its own prompt and LLM settings.
+# NOTE(review): same fangda_ prompt path as main_agent.prompt -- confirm the
+# file exists alongside the binwang_ prompt added in this change set.
+output-exceed-max-turn-summary:
+  type: ExceedMaxTurnSummaryGenerator
+  prompt: config/prompts/fangda_prompt_main_agent_0128.yaml
+  llm:
+    _base_: config/llm/base_mirothinker.yaml
+
+output_dir: 'logs/'
+# Taken from the DATA_DIR environment variable; falls back to `data`.
+data_dir: '${oc.env:DATA_DIR,data}'
+
+
@@ -0,0 +1,46 @@
+# Hydra defaults list: compose the benchmark group, switch Hydra's job logging
+# to its `none` option, and list `_self_` last so the keys in this file are
+# merged after the composed defaults.
+defaults:
+  - benchmark: 'gaia-validation'
+  - override hydra/job_logging: 'none'
+  - _self_
+
+# Entry point; the value matches the `main_agent` key defined right below.
+entrypoint: main_agent
+main_agent:
+  name: main_agent
+  type: IterativeAgentWithToolAndRollback
+  # Loop limits for the agent.
+  max_consecutive_rollbacks: 3
+  max_turns: 200
+  llm:
+    _base_: config/llm/base_mirothinker.yaml
+  # NOTE(review): the change set that adds this config also adds
+  # config/prompts/binwang_prompt_main_agent_0128.yaml, not the fangda_ file
+  # referenced here -- confirm the referenced prompt exists in the repository.
+  prompt: config/prompts/fangda_prompt_main_agent_0128.yaml
+  tools:
+    - config/tool/tool-search-and-scrape-webpage.yaml
+    - config/tool/tool-jina-scrape-llm-summary.yaml
+    - config/tool/tool-python.yaml
+  # One (server, tool) pair per entry.
+  tool_blacklist:
+    - {server: tool-search-and-scrape-webpage, tool: sogou_search}
+    - {server: tool-python, tool: download_file_from_sandbox_to_local}
+  # Processors are pulled in by interpolation from the top-level nodes of the
+  # same names; the output processors are listed in sequence.
+  input_processor: ['${input-message-generator}']
+  output_processor:
+    - '${output-summary}'
+    - '${output-final-answer-extraction}'
+    - '${output-exceed-max-turn-summary}'
+
+# Processor nodes referenced from main_agent through ${...} interpolation.
+input-message-generator: {type: InputMessageGenerator}
+output-summary: {type: SummaryGenerator}
+output-final-answer-extraction: {type: RegexBoxedExtractor}
+# Unlike the nodes above, this one carries its own prompt and LLM settings.
+# NOTE(review): same fangda_ prompt path as main_agent.prompt -- confirm the
+# file exists alongside the binwang_ prompt added in this change set.
+output-exceed-max-turn-summary:
+  type: ExceedMaxTurnSummaryGenerator
+  prompt: config/prompts/fangda_prompt_main_agent_0128.yaml
+  llm:
+    _base_: config/llm/base_mirothinker.yaml
+
+output_dir: 'logs/'
+# Taken from the DATA_DIR environment variable; falls back to `data`.
+data_dir: '${oc.env:DATA_DIR,data}'
+
+
@@ -0,0 +1,209 @@
+# Jinja prompt templates. Each section names its `components` together with
+# the required/optional context variables that those components reference.
+template:
+  # First user message: task text plus optional file note, format guidance,
+  # Chinese-context guidance and task hints.
+  initial_user_text:
+    components:
+      - task_description
+      - file_input_prompt
+      - task_guidance
+      - chinese_context_extra_prompt
+      - task_hint
+
+    required_context:
+      - task_description
+
+    optional_context:
+      - file_input
+      - chinese_context
+      - task_hint
+
+    task_description: |
+      {{ task_description }}
+
+    # Literal block scalars do not interpret backslash escapes, so the blank
+    # line after the note is written as a real blank line (a trailing "\n\n"
+    # would be rendered verbatim into the prompt).
+    file_input_prompt: |
+      {% if file_input is defined and file_input is not none and file_input.file_name is defined and file_input.file_name %}
+      Note: A {{ file_input.file_type }} file '{{ file_input.file_name }}' is associated with this task. If you need worker agent to read its content, you should provide the complete local system file path: {{ file_input.absolute_file_path }}.
+
+      {% endif %}
+
+    # A single backslash: backslashes are kept verbatim in a literal block
+    # scalar, and this matches the \boxed{} wording used by summarize_prompt.
+    task_guidance: |
+      You should follow the format instruction in the request strictly and wrap the final answer in \boxed{}.
+
+    # Rendered only when `chinese_context` is defined and truthy.
+    chinese_context_extra_prompt: |
+      {% if chinese_context is defined and chinese_context %}
+      ## 中文任务处理指导
+      If the task involves Chinese context, please follow the following instructions:
+      - **信息收集策略**：使用中文关键词进行网络搜索，优先浏览中文网页，以获取更准确和全面的中文资源
+      - **思考过程**：所有分析、推理、判断等思考过程都应使用中文表达，保持语义的一致性
+      - **候选答案收集**：对于中文问题，收集所有可能的中文答案选项，包括不同的表达方式和格式
+      - **证据文档化**：保持中文资源的原始格式，避免不必要的翻译或改写，确保信息的准确性
+      - **不确定性标注**：使用中文清晰地标记任何不确定性、冲突信息或需要进一步验证的内容
+      - **结果组织**：以中文组织和呈现最终报告，使用恰当的中文术语和表达习惯
+      - **过程透明化**：所有步骤描述、状态更新、中间结果等都应使用中文，确保用户理解
+      {% endif %}
+
+    # Rendered only when `task_hint` is defined and truthy.
+    task_hint: |
+      {% if task_hint is defined and task_hint %}
+      Before you begin, please review the following preliminary notes highlighting subtle or easily misunderstood points in the question, which might help you avoid common pitfalls during your analysis (for reference only; these may not be exhaustive):
+      {{ task_hint }}
+      {% endif %}
+
+  # System prompt: tool-use protocol, tool definitions and agent objective,
+  # followed by optional Chinese-context guidance.
+  system_prompt:
+    components:
+      - basic_system_prompt
+      - chinese_context_extra_prompt
+
+    required_context:
+      - formatted_date
+      - mcp_server_definitions
+
+    optional_context:
+      - chinese_context
+
+    # The usage example has to render as valid JSON, as the `arguments`
+    # parameter description demands. Inside the Jinja raw block braces are
+    # emitted verbatim, and a literal block scalar keeps backslashes verbatim,
+    # so the example uses single braces and a single backslash before each
+    # embedded quote (doubled forms would reach the model unchanged).
+    basic_system_prompt: |
+      In this environment you have access to a set of tools you can use to answer the user's question. 
+
+      You only have access to the tools provided below. You can only use one tool per message, and will receive the result of that tool in the user's next response. You use tools step-by-step to accomplish a given task, with each tool-use informed by the result of the previous tool-use. Today is: {{ formatted_date }}
+
+      # Tool-Use Formatting Instructions 
+
+      Tool-use is formatted using XML-style tags. The tool-use is enclosed in <use_mcp_tool></use_mcp_tool> and each parameter is similarly enclosed within its own set of tags.
+
+      The Model Context Protocol (MCP) connects to servers that provide additional tools and resources to extend your capabilities. You can use the server's tools via the `use_mcp_tool`.
+
+      Description: 
+      Request to use a tool provided by a MCP server. Each MCP server can provide multiple tools with different capabilities. Tools have defined input schemas that specify required and optional parameters.
+
+      Parameters:
+      - server_name: (required) The name of the MCP server providing the tool
+      - tool_name: (required) The name of the tool to execute
+      - arguments: (required) A JSON object containing the tool's input parameters, following the tool's input schema, quotes within string must be properly escaped, ensure it's valid JSON
+
+      Usage:
+      <use_mcp_tool>
+      <server_name>server name here</server_name>
+      <tool_name>tool name here</tool_name>
+      <arguments>
+      {% raw %}
+      {
+      "param1": "value1",
+      "param2": "value2 \"escaped string\""
+      }
+      {% endraw %}
+      </arguments>
+      </use_mcp_tool>
+
+      Important Notes:
+      - Tool-use must be placed **at the end** of your response, **top-level**, and not nested within other tags.
+      - Always adhere to this format for the tool use to ensure proper parsing and execution.
+
+      String and scalar parameters should be specified as is, while lists and objects should use JSON format. Note that spaces for string values are not stripped. The output is not expected to be valid XML and is parsed with regular expressions.
+      Here are the functions available in JSONSchema format:
+
+      {{ mcp_server_definitions }}
+
+      # General Objective
+
+      You accomplish a given task iteratively, breaking it down into clear steps and working through them methodically.
+
+      # Agent Specific Objective
+
+      You are a task-solving agent that uses tools step-by-step to answer the user's question. Your goal is to provide complete, accurate and well-reasoned answers using additional tools.
+
+    # Rendered only when `chinese_context` is defined and truthy.
+    chinese_context_extra_prompt: |
+      {% if chinese_context is defined and chinese_context %}
+      ## 中文语境处理指导
+
+      当处理中文相关的任务时：
+      1. **子任务委托 (Subtask Delegation)**：向worker代理委托的子任务应使用中文描述，确保任务内容准确传达
+      2. **搜索策略 (Search Strategy)**：搜索关键词应使用中文，以获取更准确的中文内容和信息
+      3. **问题分析 (Question Analysis)**：对中文问题的分析和理解应保持中文语境
+      4. **思考过程 (Thinking Process)**：内部分析、推理、总结等思考过程都应使用中文，保持语义表达的一致性
+      5. **信息整理 (Information Organization)**：从中文资源获取的信息应保持中文原文，避免不必要的翻译
+      6. **各种输出 (All Outputs)**：所有输出内容包括步骤说明、状态更新、中间结果等都应使用中文
+      7. **最终答案 (Final Answer)**：对于中文语境的问题，最终答案应使用中文回应
+      {% endif %}
+
+  summarize_prompt:  # asks for a summary plus the final answer in \boxed{}
+    components:
+      - basic_summarize_prompt
+      - chinese_context_extra_prompt
+
+    required_context:
+      - task_description
+      
+    optional_context:
+      - chinese_context
+      - task_failed  # NOTE(review): not referenced by either template in this section
+        
+    basic_summarize_prompt: |
+      Summarize the above conversation, and output the FINAL ANSWER to the original question.
+
+      If a clear answer has already been provided earlier in the conversation, do not rethink or recalculate it — simply extract that answer and reformat it to match the required format below.
+      If a definitive answer could not be determined, make a well-informed educated guess based on the conversation.
+
+      The original question is repeated here for reference:
+
+      "{{ task_description }}"
+
+      Wrap your final answer in \boxed{}.
+      Your final answer should be:
+      - a number, OR
+      - as few words as possible, OR
+      - a comma-separated list of numbers and/or strings.
+
+      ADDITIONALLY, your final answer MUST strictly follow any formatting instructions in the original question — such as alphabetization, sequencing, units, rounding, decimal places, etc.
+      If you are asked for a number, express it numerically (i.e., with digits rather than words), don't use commas, and DO NOT INCLUDE UNITS such as $ or USD or percent signs unless specified otherwise.
+      If you are asked for a string, don't use articles or abbreviations (e.g. for cities), unless specified otherwise. Don't output any final sentence punctuation such as '.', '!', or '?'.
+      If you are asked for a comma-separated list, apply the above rules depending on whether the elements are numbers or strings.
+      Do NOT include any punctuation such as '.', '!', or '?' at the end of the answer.
+      Do NOT include any invisible or non-printable characters in the answer output.
+
+    chinese_context_extra_prompt: |  # rendered only when chinese_context is defined and truthy
+      {% if chinese_context is defined and chinese_context %}
+      ## 中文总结要求
+      If the task involves Chinese context:
+      - **总结语言**：使用中文进行总结和回答
+      - **思考过程**：回顾和总结思考过程时也应使用中文表达
+      - **信息组织**：保持中文信息的原始格式和表达方式
+      - **过程描述**：对工作历史、步骤描述、结果分析等各种输出都应使用中文
+      {% endif %}
+
+  hint_generation_prompt:  # asks the model to flag pitfalls in the question without solving it
+    components:
+      - basic_hint_generation_prompt  # sole component; the Chinese guidance is inlined at its end
+
+    required_context:
+      - task_description
+
+    optional_context:
+      - chinese_context  # gates the trailing Chinese block of basic_hint_generation_prompt
+
+    basic_hint_generation_prompt: |
+      Carefully analyze the given task description (question) without attempting to solve it directly. Your role is to identify potential challenges and areas that require special attention during the solving process, and provide practical guidance for someone who will solve this task by actively gathering and analyzing information from the web.
+
+      Identify and concisely list key points in the question that could potentially impact subsequent information collection or the accuracy and completeness of the problem solution, especially those likely to cause mistakes, carelessness, or confusion during problem-solving.
+
+      The question author does not intend to set traps or intentionally create confusion. Interpret the question in the most common, reasonable, and straightforward manner, without speculating about hidden meanings or unlikely scenarios. However, be aware that mistakes, imprecise wording, or inconsistencies may exist due to carelessness or limited subject expertise, rather than intentional ambiguity.
+
+      Additionally, when considering potential answers or interpretations, note that question authors typically favor more common and familiar expressions over overly technical, formal, or obscure terminology. They generally prefer straightforward and common-sense interpretations rather than being excessively cautious or academically rigorous in their wording choices.
+
+      Also, consider additional flagging issues such as:
+      - Potential mistakes or oversights introduced unintentionally by the question author due to his misunderstanding, carelessness, or lack of attention to detail.
+      - Terms or instructions that might have multiple valid interpretations due to ambiguity, imprecision, outdated terminology, or subtle wording nuances.
+      - Numeric precision, rounding requirements, formatting, or units that might be unclear, erroneous, or inconsistent with standard practices or provided examples.
+      - Contradictions or inconsistencies between explicit textual instructions and examples or contextual clues provided within the question itself.
+
+      Do NOT attempt to guess or infer correct answers, as complete factual information is not yet available. Your responsibility is purely analytical, proactively flagging points that deserve special attention or clarification during subsequent information collection and task solving. Avoid overanalyzing or listing trivial details that would not materially affect the task outcome.
+
+      Here is the question:
+        {{ task_description }}
+
+      {% if chinese_context is defined and chinese_context %}
+      ## 中文分析指导
+      如果问题涉及中文语境，请特别注意：
+      - **语言理解**：识别可能存在的中文表达歧义、方言差异或特定语境下的含义
+      - **文化背景**：考虑可能需要中文文化背景知识才能正确理解的术语或概念
+      - **信息获取**：标注需要使用中文搜索关键词才能获得准确信息的方面
+      - **格式要求**：识别中文特有的格式要求、表达习惯或答案形式 
+      - **翻译风险**：标记直接翻译可能导致误解或信息丢失的关键术语
+      - **时效性**：注意中文信息源的时效性和地域性特征
+      - **分析输出**：使用中文进行分析和提示，确保语言一致性 
+      {% endif %}