ai_agent_course_final_project

Sleeping

App Files Files Community

keynes42 committed on May 27

Commit

679d19e

verified ·

1 Parent(s): 01a0138

Update app.py

Browse files

Files changed (1) hide show

app.py +45 -2

app.py CHANGED Viewed

@@ -1,4 +1,5 @@
 import os, sys
 from enum import Enum
 import gradio as gr
 import requests
@@ -14,7 +15,6 @@ from transformers import AutoTokenizer, AutoModelForCausalLM, pipeline, BitsAndB
 from smolagents import CodeAgent, VisitWebpageTool, WebSearchTool, WikipediaSearchTool, PythonInterpreterTool
 from smolagents.models import ChatMessage
 from custom_tools import WebpageStructureAnalyzerTool
-from system_prompts import CODE_AGENT_DEFAULT_SYSTEM_PROMPTS
 subprocess.run(["playwright", "install"], check=True)
@@ -48,6 +48,45 @@ class PreloadedPythonTool(PythonInterpreterTool):
         )
         return super().run(preamble + code)
 def check_token_access():
     token = os.environ.get("HF_TOKEN", "")
     if not token:
@@ -199,6 +238,10 @@ def run_and_submit_all( profile: gr.OAuthProfile | None):
         python_tool = PythonInterpreterTool()
         html_parse_tool = VisitWebpageTool()
         # (3) Create the system prompt
         my_added_prompts = """
         When you receive output from a tool (like wiki_tool or html_parse_tool), do not include the entire raw output in your next thought if it is very long.
         Instead, first analyze it (possibly using another tool or by writing code to extract key parts) and only include essential snippets, summaries, or the extracted data relevant to your current plan in your thoughts and observations.
@@ -207,7 +250,7 @@ def run_and_submit_all( profile: gr.OAuthProfile | None):
         Your thoughts and reasoning should precede the code block.
         For web pages, always use web_structure_analyzer_tool to understand the page's layout before attempting to write detailed parsing code with bs4.
         """
-        combined_system_prompt = CODE_AGENT_DEFAULT_SYSTEM_PROMPTS + "\n\n" + added_prompts
         # (4) Create the CodeAgent, passing the LLM wrapper and tools
         agent = CodeAgent(model=llm_model,
                           tools=[web_structure_analyzer_tool, wiki_tool, search_tool, python_tool, html_parse_tool],

 import os, sys
+import yaml
 from enum import Enum
 import gradio as gr
 import requests
 from smolagents import CodeAgent, VisitWebpageTool, WebSearchTool, WikipediaSearchTool, PythonInterpreterTool
 from smolagents.models import ChatMessage
 from custom_tools import WebpageStructureAnalyzerTool
 subprocess.run(["playwright", "install"], check=True)
         )
         return super().run(preamble + code)
+# In your app.py (or a helper module like your system_prompts.py)
+import yaml
+import os
+# --- Function to load the prompt from your YAML file ---
def load_prompt_from_yaml(
    file_path: str,
    *,
    key: str = "system_prompt",
    fallback: str = "Fallback default system prompt: You are a helpful AI.",
) -> str:
    """Load a system prompt string from a YAML file.

    The parsed YAML document may be either:

    * a bare (possibly multi-line) string, which is returned as-is, or
    * a mapping, in which case the string stored under ``key`` is returned.

    Failures (missing file, unreadable or unparsable YAML, unexpected
    document shape, missing key, non-string value) are reported with
    ``print`` and ``fallback`` is returned instead of raising.

    Args:
        file_path: Path of the YAML file to read (decoded as UTF-8).
        key: Mapping key that holds the prompt when the document is a mapping.
        fallback: Prompt returned when the file cannot be used.

    Returns:
        The prompt text from the file, or ``fallback`` on any failure.
    """
    # Keep the try body limited to the operations that can actually fail:
    # opening/reading the file and parsing it.
    try:
        with open(file_path, "r", encoding="utf-8") as f:
            data = yaml.safe_load(f)
    except FileNotFoundError:
        print(f"ERROR: YAML prompt file not found at {file_path}")
        return fallback
    except Exception as e:
        # Deliberately broad: any read or parse failure degrades to the
        # fallback prompt rather than propagating to the caller.
        print(f"ERROR: Could not load or parse YAML prompt file {file_path}: {e}")
        return fallback

    # Whole document is the prompt.
    if isinstance(data, str):
        return data

    if isinstance(data, dict):
        if key not in data:
            problem = "Key for system prompt not found in YAML dictionary."
        elif isinstance(data[key], str):
            return data[key]
        else:
            # e.g. `system_prompt:` with no value parses to None; returning it
            # would break the declared `str` return type for callers.
            problem = f"Value under key {key!r} is not a string."
    else:
        # Covers an empty file (None), lists, numbers, etc.
        problem = "YAML content is not in an expected format (string or dict)."

    print(f"ERROR: Could not load or parse YAML prompt file {file_path}: {problem}")
    return fallback
 def check_token_access():
     token = os.environ.get("HF_TOKEN", "")
     if not token:
         python_tool = PythonInterpreterTool()
         html_parse_tool = VisitWebpageTool()
         # (3) Create the system prompt
+        # Assuming 'default_system_prompt.yaml' is in the same directory as app.py
+        current_dir = os.path.dirname(os.path.abspath(__file__))
+        prompt_yaml_file = os.path.join(current_dir, "default_system_prompt.yaml")
+        default_system_prompt = load_prompt_from_yaml(prompt_yaml_file)
         my_added_prompts = """
         When you receive output from a tool (like wiki_tool or html_parse_tool), do not include the entire raw output in your next thought if it is very long.
         Instead, first analyze it (possibly using another tool or by writing code to extract key parts) and only include essential snippets, summaries, or the extracted data relevant to your current plan in your thoughts and observations.
         Your thoughts and reasoning should precede the code block.
         For web pages, always use web_structure_analyzer_tool to understand the page's layout before attempting to write detailed parsing code with bs4.
         """
+        combined_system_prompt = default_system_prompt + "\n\n" + added_prompts
         # (4) Create the CodeAgent, passing the LLM wrapper and tools
         agent = CodeAgent(model=llm_model,
                           tools=[web_structure_analyzer_tool, wiki_tool, search_tool, python_tool, html_parse_tool],