You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
316 lines
12 KiB
316 lines
12 KiB
"""Run your code assistant agent in a sandbox environment.
|
|
|
|
This example demonstrates how to create a code assistant agent that can execute code
|
|
in a sandbox environment. The agent can execute Python and JavaScript code blocks
|
|
and provide the output to the user. The agent can also check the correctness of the
|
|
code execution results and provide feedback to the user.
|
|
|
|
|
|
You can limit the memory and file system resources available to the code execution
|
|
environment. The code execution environment is isolated from the host system,
|
|
preventing access to the internet and other external resources.
|
|
"""
|
|
|
|
import asyncio
|
|
import logging
|
|
import os
|
|
from typing import Optional, Tuple
|
|
|
|
from dbgpt.agent import (
|
|
Action,
|
|
ActionOutput,
|
|
AgentContext,
|
|
AgentMemory,
|
|
AgentMemoryFragment,
|
|
AgentMessage,
|
|
AgentResource,
|
|
ConversableAgent,
|
|
HybridMemory,
|
|
LLMConfig,
|
|
ProfileConfig,
|
|
UserProxyAgent,
|
|
)
|
|
from dbgpt.agent.expand.code_assistant_agent import CHECK_RESULT_SYSTEM_MESSAGE
|
|
from dbgpt.core import ModelMessageRoleType
|
|
from dbgpt.util.code_utils import UNKNOWN, extract_code, infer_lang
|
|
from dbgpt.util.string_utils import str_to_bool
|
|
from dbgpt.util.utils import colored
|
|
from dbgpt.vis.tags.vis_code import Vis, VisCode
|
|
|
|
logger = logging.getLogger(__name__)
|
|
|
|
|
|
class SandboxCodeAction(Action[None]):
|
|
"""Code Action Module."""
|
|
|
|
def __init__(self, **kwargs):
|
|
"""Code action init."""
|
|
super().__init__(**kwargs)
|
|
self._render_protocol = VisCode()
|
|
self._code_execution_config = {}
|
|
|
|
@property
|
|
def render_protocol(self) -> Optional[Vis]:
|
|
"""Return the render protocol."""
|
|
return self._render_protocol
|
|
|
|
async def run(
|
|
self,
|
|
ai_message: str,
|
|
resource: Optional[AgentResource] = None,
|
|
rely_action_out: Optional[ActionOutput] = None,
|
|
need_vis_render: bool = True,
|
|
**kwargs,
|
|
) -> ActionOutput:
|
|
"""Perform the action."""
|
|
try:
|
|
code_blocks = extract_code(ai_message)
|
|
if len(code_blocks) < 1:
|
|
logger.info(
|
|
f"No executable code found in answer,{ai_message}",
|
|
)
|
|
return ActionOutput(
|
|
is_exe_success=False, content="No executable code found in answer."
|
|
)
|
|
elif len(code_blocks) > 1 and code_blocks[0][0] == UNKNOWN:
|
|
# found code blocks, execute code and push "last_n_messages" back
|
|
logger.info(
|
|
f"Missing available code block type, unable to execute code,"
|
|
f"{ai_message}",
|
|
)
|
|
return ActionOutput(
|
|
is_exe_success=False,
|
|
content="Missing available code block type, "
|
|
"unable to execute code.",
|
|
)
|
|
exitcode, logs = await self.execute_code_blocks(code_blocks)
|
|
exit_success = exitcode == 0
|
|
|
|
content = (
|
|
logs
|
|
if exit_success
|
|
else f"exitcode: {exitcode} (execution failed)\n {logs}"
|
|
)
|
|
|
|
param = {
|
|
"exit_success": exit_success,
|
|
"language": code_blocks[0][0],
|
|
"code": code_blocks,
|
|
"log": logs,
|
|
}
|
|
if not self.render_protocol:
|
|
raise NotImplementedError("The render_protocol should be implemented.")
|
|
view = await self.render_protocol.display(content=param)
|
|
return ActionOutput(
|
|
is_exe_success=exit_success,
|
|
content=content,
|
|
view=view,
|
|
thoughts=ai_message,
|
|
observations=content,
|
|
)
|
|
except Exception as e:
|
|
logger.exception("Code Action Run Failed!")
|
|
return ActionOutput(
|
|
is_exe_success=False, content="Code execution exception," + str(e)
|
|
)
|
|
|
|
async def execute_code_blocks(self, code_blocks):
|
|
"""Execute the code blocks and return the result."""
|
|
from lyric import (
|
|
PyTaskFsConfig,
|
|
PyTaskMemoryConfig,
|
|
PyTaskResourceConfig,
|
|
)
|
|
|
|
from dbgpt.util.code.server import get_code_server
|
|
|
|
fs = PyTaskFsConfig(
|
|
preopens=[
|
|
# Mount the /tmp directory to the /tmp directory in the sandbox
|
|
# Directory permissions are set to 3 (read and write)
|
|
# File permissions are set to 3 (read and write)
|
|
("/tmp", "/tmp", 3, 3),
|
|
# Mount the current directory to the /home directory in the sandbox
|
|
# Directory and file permissions are set to 1 (read)
|
|
(".", "/home", 1, 1),
|
|
]
|
|
)
|
|
memory = PyTaskMemoryConfig(memory_limit=50 * 1024 * 1024) # 50MB in bytes
|
|
resources = PyTaskResourceConfig(
|
|
fs=fs,
|
|
memory=memory,
|
|
env_vars=[
|
|
("TEST_ENV", "hello, im an env var"),
|
|
("TEST_ENV2", "hello, im another env var"),
|
|
],
|
|
)
|
|
|
|
code_server = await get_code_server()
|
|
logs_all = ""
|
|
exitcode = -1
|
|
for i, code_block in enumerate(code_blocks):
|
|
lang, code = code_block
|
|
if not lang:
|
|
lang = infer_lang(code)
|
|
print(
|
|
colored(
|
|
f"\n>>>>>>>> EXECUTING CODE BLOCK {i} "
|
|
f"(inferred language is {lang})...",
|
|
"red",
|
|
),
|
|
flush=True,
|
|
)
|
|
if lang in ["python", "Python"]:
|
|
result = await code_server.exec(code, "python", resources=resources)
|
|
exitcode = result.exit_code
|
|
logs = result.logs
|
|
elif lang in ["javascript", "JavaScript"]:
|
|
result = await code_server.exec(code, "javascript", resources=resources)
|
|
exitcode = result.exit_code
|
|
logs = result.logs
|
|
else:
|
|
# In case the language is not supported, we return an error message.
|
|
exitcode, logs = (
|
|
1,
|
|
f"unknown language {lang}",
|
|
)
|
|
|
|
logs_all += "\n" + logs
|
|
if exitcode != 0:
|
|
return exitcode, logs_all
|
|
return exitcode, logs_all
|
|
|
|
|
|
class SandboxCodeAssistantAgent(ConversableAgent):
|
|
"""Code Assistant Agent."""
|
|
|
|
profile: ProfileConfig = ProfileConfig(
|
|
name="Turing",
|
|
role="CodeEngineer",
|
|
goal=(
|
|
"使用您的编码和语言技能解决任务。\n"
|
|
"在以下情况下,建议用户执行python代码(在python编码块中)或javascript。\n"
|
|
" 1. 当你需要收集信息时,使用代码输出你需要的信息,例如,获取当前日期/时间,检查操作系统。在打印出足够的信息并且任务已准备好根据您的语言技能解决后,您可以自己解决任务。\n"
|
|
" 2. 当您需要使用代码执行某些任务时,请使用代码执行任务并输出结果。聪明地完成任务。"
|
|
),
|
|
constraints=[
|
|
"The user cannot provide any other feedback or perform any other "
|
|
"action beyond executing the code you suggest. The user can't modify "
|
|
"your code. So do not suggest incomplete code which requires users to "
|
|
"modify. Don't use a code block if it's not intended to be executed "
|
|
"by the user.Don't ask users to copy and paste results. Instead, "
|
|
"the 'Print' function must be used for output when relevant.",
|
|
"When using code, you must indicate the script type in the code block. "
|
|
"Please don't include multiple code blocks in one response.",
|
|
"If you receive user input that indicates an error in the code "
|
|
"execution, fix the error and output the complete code again. It is "
|
|
"recommended to use the complete code rather than partial code or "
|
|
"code changes. If the error cannot be fixed, or the task is not "
|
|
"resolved even after the code executes successfully, analyze the "
|
|
"problem, revisit your assumptions, gather additional information you "
|
|
"need from historical conversation records, and consider trying a "
|
|
"different approach.",
|
|
"Unless necessary, give priority to solving problems with python code.",
|
|
"The output content of the 'print' function will be passed to other "
|
|
"LLM agents as dependent data. Please control the length of the "
|
|
"output content of the 'print' function. The 'print' function only "
|
|
"outputs part of the key data information that is relied on, "
|
|
"and is as concise as possible.",
|
|
"Your code will by run in a sandbox environment(supporting python and "
|
|
"javascript), which means you can't access the internet or use any "
|
|
"libraries that are not in standard library.",
|
|
"It is prohibited to fabricate non-existent data to achieve goals.",
|
|
],
|
|
desc=(
|
|
"Can independently write and execute python/shell code to solve various"
|
|
" problems"
|
|
),
|
|
)
|
|
|
|
def __init__(self, **kwargs):
|
|
"""Create a new CodeAssistantAgent instance."""
|
|
super().__init__(**kwargs)
|
|
self._init_actions([SandboxCodeAction])
|
|
|
|
async def correctness_check(
|
|
self, message: AgentMessage
|
|
) -> Tuple[bool, Optional[str]]:
|
|
"""Verify whether the current execution results meet the target expectations."""
|
|
task_goal = message.current_goal
|
|
action_report = message.action_report
|
|
if not action_report:
|
|
return False, "No execution solution results were checked"
|
|
check_result, model = await self.thinking(
|
|
messages=[
|
|
AgentMessage(
|
|
role=ModelMessageRoleType.HUMAN,
|
|
content="Please understand the following task objectives and "
|
|
f"results and give your judgment:\n"
|
|
f"Task goal: {task_goal}\n"
|
|
f"Execution Result: {action_report.content}",
|
|
)
|
|
],
|
|
prompt=CHECK_RESULT_SYSTEM_MESSAGE,
|
|
)
|
|
success = str_to_bool(check_result)
|
|
fail_reason = None
|
|
if not success:
|
|
fail_reason = (
|
|
f"Your answer was successfully executed by the agent, but "
|
|
f"the goal cannot be completed yet. Please regenerate based on the "
|
|
f"failure reason:{check_result}"
|
|
)
|
|
return success, fail_reason
|
|
|
|
|
|
async def main():
|
|
from dbgpt.model.proxy.llms.siliconflow import SiliconFlowLLMClient
|
|
|
|
llm_client = SiliconFlowLLMClient(
|
|
model_alias=os.getenv(
|
|
"SILICONFLOW_MODEL_VERSION", "Qwen/Qwen2.5-Coder-32B-Instruct"
|
|
),
|
|
)
|
|
context: AgentContext = AgentContext(conv_id="test123")
|
|
|
|
# TODO Embedding and Rerank model refactor
|
|
from dbgpt.rag.embedding import OpenAPIEmbeddings
|
|
|
|
silicon_embeddings = OpenAPIEmbeddings(
|
|
api_url=os.getenv("SILICONFLOW_API_BASE") + "/embeddings",
|
|
api_key=os.getenv("SILICONFLOW_API_KEY"),
|
|
model_name="BAAI/bge-large-zh-v1.5",
|
|
)
|
|
agent_memory = AgentMemory(
|
|
HybridMemory[AgentMemoryFragment].from_chroma(
|
|
embeddings=silicon_embeddings,
|
|
)
|
|
)
|
|
agent_memory.gpts_memory.init("test123")
|
|
|
|
coder = (
|
|
await SandboxCodeAssistantAgent()
|
|
.bind(context)
|
|
.bind(LLMConfig(llm_client=llm_client))
|
|
.bind(agent_memory)
|
|
.build()
|
|
)
|
|
|
|
user_proxy = await UserProxyAgent().bind(context).bind(agent_memory).build()
|
|
|
|
# First case: The user asks the agent to calculate 321 * 123
|
|
await user_proxy.initiate_chat(
|
|
recipient=coder,
|
|
reviewer=user_proxy,
|
|
message="计算下321 * 123等于多少",
|
|
)
|
|
|
|
await user_proxy.initiate_chat(
|
|
recipient=coder,
|
|
reviewer=user_proxy,
|
|
message="Calculate 100 * 99, must use javascript code block",
|
|
)
|
|
|
|
|
|
if __name__ == "__main__":
|
|
asyncio.run(main())
|
|
|