tech-envision committed
Commit 10ac258 · 1 Parent(s): 4b17985

Insert system prompt at runtime

Files changed (2):
  1. README.md    +3 -2
  2. src/chat.py  +11 -11
README.md CHANGED
@@ -11,8 +11,9 @@ conversations can be resumed with context. One example tool is included:
 returned. The VM is created when a chat session starts and reused for all
 subsequent tool calls.
 
-The application now injects a system prompt that instructs the model to chain
-multiple tools when required. This prompt ensures the assistant can orchestrate
+The application injects a system prompt on each request that instructs the
+model to chain multiple tools when required. This prompt is **not** stored in
+the chat history but is provided at runtime so the assistant can orchestrate
 tool calls in sequence to satisfy the user's request.
 
 ## Usage
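
As a quick illustration of the behaviour the README describes (not part of the commit), here is a minimal sketch of prepending a system prompt at request time. The helper name `with_system_prompt` is hypothetical, and the `SYSTEM_PROMPT` text and `Msg` shape are assumed to mirror `src/chat.py`:

```python
# Minimal sketch of runtime system-prompt injection, assuming a Msg shape of
# {"role": ..., "content": ...} and a SYSTEM_PROMPT constant as in src/chat.py.
from typing import Dict, List

Msg = Dict[str, str]

# Placeholder text; the real prompt lives in the application source.
SYSTEM_PROMPT = "Chain multiple tool calls when one call cannot satisfy the request."


def with_system_prompt(messages: List[Msg]) -> List[Msg]:
    """Return the outgoing payload with the system prompt prepended at runtime.

    The prompt lives only in the request payload; it is never written to the
    persisted conversation history.
    """
    if messages and messages[0].get("role") == "system":
        return list(messages)  # caller already supplied a system prompt
    return [{"role": "system", "content": SYSTEM_PROMPT}, *messages]
```

Because the prompt is attached per request rather than persisted, any change to `SYSTEM_PROMPT` takes effect immediately for existing conversations, with no history migration required.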
src/chat.py CHANGED
@@ -50,7 +50,6 @@ class ChatSession:
         )
         self._vm = None
         self._messages: List[Msg] = self._load_history()
-        self._ensure_system_prompt()
 
     async def __aenter__(self) -> "ChatSession":
         self._vm = VMRegistry.acquire(self._user.username)
@@ -82,18 +81,12 @@ class ChatSession:
         add_document(self._user.username, str(target), src.name)
         return f"/data/{src.name}"
 
-    def _ensure_system_prompt(self) -> None:
-        if any(m.get("role") == "system" for m in self._messages):
-            return
-
-        DBMessage.create(
-            conversation=self._conversation, role="system", content=SYSTEM_PROMPT
-        )
-        self._messages.insert(0, {"role": "system", "content": SYSTEM_PROMPT})
-
     def _load_history(self) -> List[Msg]:
         messages: List[Msg] = []
         for msg in self._conversation.messages.order_by(DBMessage.created_at):
+            if msg.role == "system":
+                # Skip persisted system prompts from older versions
+                continue
             if msg.role == "assistant":
                 try:
                     calls = json.loads(msg.content)
@@ -124,9 +117,16 @@ class ChatSession:
         DBMessage.create(conversation=conversation, role="assistant", content=content)
 
     async def ask(self, messages: List[Msg], *, think: bool = True) -> ChatResponse:
+        """Send a chat request, automatically prepending the system prompt."""
+
+        if not messages or messages[0].get("role") != "system":
+            payload = [{"role": "system", "content": SYSTEM_PROMPT}, *messages]
+        else:
+            payload = messages
+
         return await self._client.chat(
             self._model,
-            messages=messages,
+            messages=payload,
             think=think,
             tools=[execute_terminal],
             options={"num_ctx": NUM_CTX},
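
The two changes work together: `ask` injects the prompt into the payload sent to the model, while `_load_history` drops any system rows persisted by older versions. A hypothetical check of that combined effect (not in this commit) might look like the sketch below; the `src.chat` import path and the direct use of `ChatSession` internals (`_client`, `_messages`) are assumptions based on the diff above:

```python
# Hypothetical verification sketch; ChatSession internals (_client, _messages)
# and the src.chat import path are assumed from the diff above.
from unittest.mock import AsyncMock

from src.chat import SYSTEM_PROMPT, ChatSession


async def check_runtime_prompt(session: ChatSession) -> None:
    session._client.chat = AsyncMock()  # stub out the real model call
    await session.ask([{"role": "user", "content": "list the files in /data"}])

    sent = session._client.chat.call_args.kwargs["messages"]
    # The payload starts with the runtime-injected system prompt...
    assert sent[0] == {"role": "system", "content": SYSTEM_PROMPT}
    # ...while the loaded history contains no system messages at all.
    assert all(m.get("role") != "system" for m in session._messages)
```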