import asyncio
import json
import re

from gradio import ChatMessage

from src.agent.mistral_agent import MistralAgent
from src.agent.utils.call import call_tool

agent = MistralAgent()

# Locks that serialise access to the Mistral API and to tool execution.
api_lock = asyncio.Lock()
tool_lock = asyncio.Lock()

with open("./prompt.md", encoding="utf-8") as f:
    SYSTEM_PROMPT = f.read()
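

# NOTE: prompt.md is assumed to instruct the model to structure its replies with
# "THINK:", "ACT:", "OBSERVE:" and "FINAL ANSWER:" markers; the helpers below rely
# on those markers to split and stream each phase.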
def extract_phases(text):
    """Split the content into THINK / ACT / OBSERVE / FINAL ANSWER phases."""
    phases = {'think': '', 'act': '', 'observe': '', 'final': ''}
    matches = list(re.finditer(r'(THINK:|ACT:|OBSERVE:|FINAL ANSWER:)', text))
    for i, match in enumerate(matches):
        phase = match.group(1).lower().replace(":", "").replace("final answer", "final")
        start = match.end()
        end = matches[i + 1].start() if i + 1 < len(matches) else len(text)
        phases[phase] = text[start:end].strip()
    return phases
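

# The responder below drives a small ReAct-style loop: each phase (think, act,
# observe, final) is produced by one streaming call to the Mistral agent, the
# partial text is pushed to the Gradio chat as it arrives, and assistant
# messages flagged with "prefix": True are used to steer what the model should
# continue with on the next call.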
async def respond(message, history=None):
    """Stream an agent response to the Gradio chat as a THINK / ACT / OBSERVE / FINAL ANSWER loop."""
    if history is None:
        history = []
    # Reuse the last pending assistant bubble, otherwise open a new "Thinking..." one.
    if not history or history[-1].role != "assistant" or history[-1].metadata.get("status") == "done":
        history.append(ChatMessage(role="assistant", content="", metadata={"title": "Thinking...", "status": "pending"}))
    yield history

    messages = [
        {"role": "system", "content": SYSTEM_PROMPT},
        {"role": "user", "content": message},
        {"role": "assistant", "content": "THINK: Let's start thinking, ", "prefix": True},
    ]
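
    # Mistral's chat API lets the last assistant message carry "prefix": True so the
    # model continues from that partial text; the seed above nudges the first call to
    # start in the THINK phase.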
    phase_order = ["think", "act", "observe", "final"]
    current_phase_index = 0
    done = False
    final_full = ""

    while not done:
        current_phase = phase_order[current_phase_index]
        # Every phase streams into a fresh buffer, except the final phase which keeps accumulating.
        if current_phase != "final":
            full = ""
        else:
            full = final_full
        print('\n', '---' * 15)
        print(f">>> messages before payload [phase {current_phase_index}] :", json.dumps([m for m in messages if m.get("role") != "system"], indent=2))

        payload = {
            "agent_id": agent.agent_id,
            "messages": messages,
            "stream": True,
            "max_tokens": None,
            "tools": agent.tools,
            "tool_choice": "auto",
            "presence_penalty": 0,
            "frequency_penalty": 0,
            "n": 1,
        }
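
        # One streaming completion per phase; api_lock keeps concurrent chat sessions
        # from interleaving their requests to the agent.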
        async with api_lock:
            response = await agent.client.agents.stream_async(**payload)
            async for chunk in response:
                delta = chunk.data.choices[0].delta
                content = delta.content or ""
                full += content
                if current_phase == "final":
                    final_full = full
                phases = extract_phases(full)
                buffer = phases.get(current_phase, "")
                if current_phase == "think":
                    history[-1] = ChatMessage(role="assistant", content=buffer, metadata={"title": "Thinking...", "status": "pending"})
                elif current_phase == "act":
                    history[-1] = ChatMessage(role="assistant", content=buffer, metadata={"title": "Acting...", "status": "pending"})
                elif current_phase == "observe":
                    history[-1] = ChatMessage(role="assistant", content=buffer, metadata={"title": "Observing...", "status": "pending"})
                yield history
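
        # Once the stream for this phase has ended, the final phase is checked for a
        # parsed FINAL ANSWER: an empty last delta plus a non-empty buffer ends the loop.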
        if current_phase == "final":
            delta_content = delta.content or ""
            final_full += delta_content
            phases = extract_phases(final_full)
            buffer = phases.get("final", "")
            yield history
            if delta_content == "" and buffer:
                done = True
                break
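
        # Rebuild the transcript for the next call: phase 0 re-seeds the prefix with the
        # THINK output and an ACT prompt, phases 1-2 promote the prefix to a permanent
        # message, and phase 2 additionally seeds an OBSERVE stub to continue from.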
        if current_phase_index == 0:
            # Drop the seed prefix, then re-seed with the full THINK output plus an ACT prompt.
            messages = [msg for msg in messages if not msg.get("prefix")]
            if buffer:
                prefix_label = current_phase.upper() if current_phase != "final" else "FINAL ANSWER"
                messages.append({
                    "role": "assistant",
                    "content": f"{prefix_label}: {buffer}\n\nACT: Let's use some tools to solve the problem.",
                    "prefix": True
                })
        elif current_phase_index == 1:
            # Promote the think/act prefix message to a permanent assistant turn.
            for msg in messages:
                if "prefix" in msg:
                    del msg["prefix"]
        if current_phase_index == 2:
            for msg in messages:
                if "prefix" in msg:
                    del msg["prefix"]
            # Re-seed with an OBSERVE stub as the assistant prefix for the next call.
            messages.append({
                "role": "assistant",
                "content": "OBSERVE: Based on the results, let's observe the situation and see if we need to adjust our approach.",
                "prefix": True
            })
        yield history

        if current_phase == "act":
            # Run any tool calls carried by the streamed delta and surface the last tool
            # result in the chat bubble.
            tool_calls = getattr(delta, "tool_calls", None)
            if tool_calls and tool_calls != [] and str(tool_calls) != "Unset()":
                async with tool_lock:
                    messages = call_tool(
                        agent,
                        tool_calls,
                        messages,
                    )
                last_tool_response = next((m for m in reversed(messages) if m["role"] == "tool"), None)
                if last_tool_response and last_tool_response.get("content"):
                    buffer += "\n\n" + last_tool_response["content"]
                    history[-1] = ChatMessage(role="assistant", content=buffer, metadata={"title": "Acting...", "status": "pending"})
                    yield history
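
        # Advance to the next phase; once the index runs past "final" the loop stops
        # and the transcript below is finalised.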
        if not done:
            current_phase_index += 1
            if current_phase_index >= len(phase_order):
                done = True

    # After the loop: mark the last observation step as done and post the final answer
    # as its own chat message.
    observe_text = phases.get("observe", "")
    final_text = phases.get("final", "")
    if observe_text:
        history[-1] = ChatMessage(role="assistant", content=observe_text, metadata={"title": "Observing...", "status": "done"})
    if final_text:
        history.append(ChatMessage(role="assistant", content=final_text))
    yield history