# p2p-stabletoolbench/pipeline/prompt_builder.py
# Dwootton: "Add prompt_builder.py" (a5eff80, verified)
"""Prompt builder for StableToolBench ReAct evaluation.
Constructs system + user prompts for each P2P condition, with pluggable
tool descriptions and in-context examples.
"""
import json
from typing import Dict, List, Optional, Any
def build_task_description(tool_descriptions):
    """Build the task description that lists the available tools.

    The header wording follows StableToolBench's rapidapi.py and is kept
    verbatim (including its original spelling), because it is prompt text
    sent to the model.

    Args:
        tool_descriptions: Either an iterable of ``(std_name, description)``
            pairs or a mapping of ``std_name -> description``. ``None`` is
            treated as "no tools". When a name appears more than once, the
            first description wins.

    Returns:
        The header followed by one numbered ``"k.name: description"`` line
        per distinct tool. Each description is cut to its first 512
        characters, has newlines removed and is stripped; a missing or
        blank description is rendered as the literal text ``None``.
    """
    header = (
        'You should use functions to help handle the real time user querys. Remember:\n'
        '1.ALWAYS call "Finish" function at the end of the task. And the final answer '
        'should contain enough information to show to the user,If you can\'t handle the '
        'task, or you find that function calls always fail(the function is not valid now), '
        'use function Finish->give_up_and_restart.\n'
        '2.Do not use origin tool names, use only subfunctions\' names.\n'
        'You have access of the following tools:\n'
    )

    # Normalise the accepted input shapes to an iterable of (name, desc) pairs.
    if tool_descriptions is None:
        pairs = ()
    elif isinstance(tool_descriptions, dict):
        pairs = tool_descriptions.items()
    else:
        pairs = tool_descriptions

    # Dicts keep insertion order, so this de-duplicates while preserving the
    # order in which each tool was first seen.
    first_seen = {}
    for std_name, tool_des in pairs:
        first_seen.setdefault(std_name, tool_des)

    tool_lines = []
    for position, (std_name, tool_des) in enumerate(first_seen.items(), start=1):
        # Truncate first, then drop newlines and surrounding whitespace.
        cleaned = tool_des[:512].replace('\n', '').strip() if tool_des else ""
        tool_lines.append(f"{position}.{std_name}: {cleaned or 'None'}\n")

    return header + "".join(tool_lines)
def build_system_prompt(task_description):
    """Return the ReAct system message (FORMAT_INSTRUCTIONS_SYSTEM_FUNCTION).

    The fixed instruction text is emitted verbatim, one entry per output
    line, and ``task_description`` is interpolated into the final line.
    The spelling of the instructions is intentionally left untouched because
    the text is sent to the model as-is.
    """
    prompt_lines = [
        "You are AutoGPT, you can use many tools(functions) to do the following task.",
        "First I will give you the task description, and your task start.",
        (
            "At each step, you need to give your thought to analyze the status now and "
            "what to do next, with a function call to actually excute your step."
        ),
        "After the call, you will get the call result, and you are now in a new state.",
        "Then you will analyze your status now, then decide what to do next...",
        (
            "After many (Thought-call) pairs, you finally perform the task, then you can "
            "give your finial answer."
        ),
        # The trailing space after the colon is part of the prompt text.
        "Remember: ",
        (
            "1.the state change is irreversible, you can't go back to one of the former state, "
            'if you want to restart the task, say "I give up and restart".'
        ),
        "2.All the thought is short, at most in 5 sentence.",
        (
            "3.You can do more then one trys, so if your plan is to continusly try some "
            "conditions, you can do one of the conditions per try."
        ),
        "Let's Begin!",
        f"Task description: {task_description}",
    ]
    return "\n".join(prompt_lines)
def build_user_prompt(query, examples=None):
    """Assemble the first user message, with optional in-context examples.

    When ``examples`` is non-empty, each example is rendered as a numbered
    block (instruction, JSON-encoded tool call, tool result cut to 512
    characters, answer), wrapped between an intro line and a
    "Now handle the following real task" line. The query and a ``Begin!``
    marker always close the message.
    """
    pieces = []
    if examples:
        pieces.append("Here are some examples of how to use the available tools:\n\n")
        for number, example in enumerate(examples, start=1):
            instruction = example['instruction']
            call_json = json.dumps(example['fn_call'])
            # Only the first 512 characters of the stringified result are shown.
            result_preview = str(example['tool_results'])[:512]
            answer = example['answer']
            pieces.append(
                f"Example {number}:\nUser: {instruction}\n"
                f"Tool call: {call_json}\n"
                f"Tool result: {result_preview}\n"
                f"Answer: {answer}\n\n"
            )
        pieces.append("Now handle the following real task:\n\n")
    pieces.append(f"{query}\nBegin!\n")
    return "".join(pieces)
def build_initial_messages(query, tool_descriptions, examples=None):
    """Return the opening ``[system, user]`` messages of a ReAct conversation.

    The system message embeds the task description built from
    ``tool_descriptions``; the user message carries ``query`` and any
    in-context ``examples``.
    """
    system_content = build_system_prompt(build_task_description(tool_descriptions))
    user_content = build_user_prompt(query, examples)
    return [
        {"role": role, "content": content}
        for role, content in (("system", system_content), ("user", user_content))
    ]
def get_condition_config(condition, p2p_descriptions=None, p2p_examples=None):
    """Return the settings dict for one P2P condition.

    condition: One of 'baseline', 'p2p_desc', 'p2p_demo', 'p2p_full'.
    Returns a dict with the keys use_custom_descriptions,
    custom_descriptions, use_examples and examples. A feature that is
    switched off carries ``None`` as its payload; a feature that is switched
    on carries the supplied object, or an empty dict when nothing (or a
    falsy value) was supplied.
    Raises ValueError for an unknown condition.
    """
    # Resolve both payloads up front, whichever condition is requested.
    descriptions = p2p_descriptions or {}
    examples = p2p_examples or {}

    # condition -> (use custom descriptions?, use examples?)
    switches = {
        "baseline": (False, False),
        "p2p_desc": (True, False),
        "p2p_demo": (False, True),
        "p2p_full": (True, True),
    }
    if condition not in switches:
        raise ValueError(f"Unknown condition: {condition}. Must be one of {list(switches.keys())}")

    with_descriptions, with_examples = switches[condition]
    return {
        "use_custom_descriptions": with_descriptions,
        "custom_descriptions": descriptions if with_descriptions else None,
        "use_examples": with_examples,
        "examples": examples if with_examples else None,
    }
def gather_examples_for_query(tool_names, api_name_reflect, functions, all_examples, max_per_tool=1):
    """Gather in-context examples relevant to a specific query's tools.

    Args:
        tool_names: Accepted for interface compatibility; not used here.
        api_name_reflect: Accepted for interface compatibility; not used here.
        functions: Iterable of function specs; each must expose its name at
            ``spec["function"]["name"]``. The ``"Finish"`` function is
            always skipped.
        all_examples: Mapping of function name -> list of examples. ``None``
            or an empty mapping yields no examples.
        max_per_tool: Upper bound on examples taken per function. ``None``
            means no limit; zero or a negative value yields no examples
            (a negative value is clamped so it cannot act as a negative
            slice bound and return "all but the last N").

    Returns:
        A flat list of the selected examples, in the order of ``functions``.
    """
    if not all_examples or not functions:
        return []

    limit = None if max_per_tool is None else max(max_per_tool, 0)

    gathered = []
    for func in functions:
        func_name = func["function"]["name"]
        if func_name == "Finish":
            continue
        if func_name in all_examples:
            # Tolerate a None entry for a function that has no examples.
            candidates = all_examples[func_name] or []
            gathered.extend(candidates[:limit])
    return gathered