Final_Assignment_AgentJasper

Running

App Files Files Community

Chi-AI-Rookie committed on Jun 17

Commit

9738813

1 Parent(s): 81917a3

The initial update from Qi, which solves 2 questions for the time being

Browse files

Files changed (4) hide show

.gitignore +40 -0
agent.py +208 -0
app.py +41 -14
requirements.txt +8 -1

.gitignore ADDED Viewed

	@@ -0,0 +1,40 @@

+# Python
+__pycache__/
+*.py[cod]
+*$py.class
+*.so
+.Python
+build/
+develop-eggs/
+dist/
+downloads/
+eggs/
+.eggs/
+lib/
+lib64/
+parts/
+sdist/
+var/
+wheels/
+*.egg-info/
+.installed.cfg
+*.egg
+# Virtual environments
+venv/
+env/
+ENV/
+# Environment variables
+.env
+.env.local
+# IDE
+.vscode/
+.idea/
+*.swp
+*.swo
+# OS
+.DS_Store
+Thumbs.db

agent.py ADDED Viewed

	@@ -0,0 +1,208 @@

+from typing import TypedDict, Annotated
+import os
+from langchain_community.tools import DuckDuckGoSearchRun
+from langchain_community.document_loaders import WikipediaLoader, YoutubeLoader
+from langchain_community.document_loaders.youtube import TranscriptFormat
+from pytube import YouTube
+from langgraph.graph.message import add_messages
+from langchain_core.messages import AnyMessage, HumanMessage, AIMessage
+from langgraph.prebuilt import ToolNode
+from langchain_openai import ChatOpenAI
+from langgraph.graph import START, StateGraph
+from langfuse.langchain import CallbackHandler
+from langgraph.prebuilt import tools_condition
+from langchain_huggingface import HuggingFaceEndpoint, ChatHuggingFace
+from langchain_core.tools import tool
+# Web search tool using DuckDuckGo; this module-level instance is placed in the
+# tool list assembled inside build_jasper()
+search_tool = DuckDuckGoSearchRun()
+# Create Wikipedia search tool using WikipediaLoader
+@tool
+def search_wikipedia(query: str) -> str:
+    """Search Wikipedia for information about a topic.
+    Args:
+        query: The search query or topic to look up on Wikipedia
+    Returns:
+        str: The Wikipedia content related to the query
+    """
+    try:
+        # Load Wikipedia documents for the query
+        loader = WikipediaLoader(query=query, load_max_docs=2)
+        docs = loader.load()
+        if not docs:
+            return f"No Wikipedia articles found for query: {query}"
+        # Combine the content from the documents
+        content = ""
+        for doc in docs:
+            content += f"Title: {doc.metadata.get('title', 'Unknown')}\n"
+            content += f"Content: {doc.page_content}...\n\n"
+        return content
+    except Exception as e:
+        return f"Error searching Wikipedia: {str(e)}"
+# Create YouTube transcript analysis tool
+@tool
+def analyze_youtube_video(video_url: str) -> str:
+    """Analyze a YouTube video by loading and processing its transcript.
+    Args:
+        video_url: The YouTube video URL to analyze
+    Returns:
+        str: The transcript content of the YouTube video
+    """
+    # try:
+        # # Method 1: Try with basic YoutubeLoader first
+        # try:
+        #     loader = YoutubeLoader.from_youtube_url(
+        #         video_url,
+        #         add_video_info=True,
+        #         language=["en", "en-US", "en-GB"]  # Try multiple English variants
+        #     )
+        #     docs = loader.load()
+        #     if docs:
+        #         content = ""
+        #         for doc in docs:
+        #             title = doc.metadata.get('title', 'Unknown Video')
+        #             author = doc.metadata.get('author', 'Unknown Author')
+        #             length = doc.metadata.get('length', 'Unknown')
+        #             content += f"Video Title: {title}\n"
+        #             content += f"Author: {author}\n"
+        #             content += f"Length: {length} seconds\n"
+        #             content += f"Transcript:\n{doc.page_content}\n\n"
+        #         return content
+        # except Exception as e1:
+        #     print(f"Method 1 failed: {e1}")
+            # Method 2: Try without video info
+            # try:
+            #     loader = YoutubeLoader.from_youtube_url(
+            #         video_url,
+            #         add_video_info=False,
+            #         language=["en"]
+            #     )
+            #     docs = loader.load()
+            #     if docs:
+            #         content = f"Video URL: {video_url}\n"
+            #         content += f"Transcript:\n{docs[0].page_content}\n\n"
+            #         return content
+            # except Exception as e2:
+            #     print(f"Method 2 failed: {e2}")
+            #     # Method 3: Try with chunked format
+    try:
+        loader = YoutubeLoader.from_youtube_url(
+            video_url,
+            add_video_info=False,
+            transcript_format=TranscriptFormat.CHUNKS,
+            chunk_size_seconds=60
+        )
+        docs = loader.load()
+        if docs:
+            content = f"Video URL: {video_url}\n"
+            content += "Transcript (Chunked):\n"
+            for i, doc in enumerate(docs[:5]):  # Limit to first 5 chunks
+                content += f"Chunk {i+1}: {doc.page_content}\n"
+            return content
+    except Exception as e:
+        print(f"Analyze video failed: {e}")
+# Langfuse CallbackHandler factory (a new handler is created on each call)
+def get_langfuse_handler():
+    """Get configured Langfuse handler"""
+    # Langfuse will automatically read LANGFUSE_PUBLIC_KEY, LANGFUSE_SECRET_KEY, and LANGFUSE_HOST from environment
+    return CallbackHandler()
+def build_jasper():
+    # Generate the chat interface, including the tools
+    # llm = HuggingFaceEndpoint(
+    #     repo_id="Qwen/Qwen2.5-Coder-32B-Instruct",
+    #     huggingfacehub_api_token=os.getenv("HUGGINGFACE_API_TOKEN"),
+    # )
+    tools = [search_tool, search_wikipedia, analyze_youtube_video]
+    # llm = HuggingFaceEndpoint(
+    #     repo_id="Qwen/Qwen2.5-Omni-3B",
+    #     huggingfacehub_api_token=os.getenv("HUGGINGFACE_API_TOKEN"),
+    # )
+    # chat = ChatHuggingFace(llm=llm, verbose=True)
+    # chat_with_tools = chat.bind_tools(tools)
+    # Set your OpenAI API key here
+    llm = ChatOpenAI(
+    model="gpt-4o",
+    temperature=0,
+    api_key=os.getenv("OPENAI_API_KEY")
+    )
+    chat_with_tools = llm.bind_tools(tools, parallel_tool_calls=False)
+    # Generate the AgentState and Agent graph
+    class AgentState(TypedDict):
+        messages: Annotated[list[AnyMessage], add_messages]
+    def assistant(state: AgentState):
+        return {
+            "messages": [chat_with_tools.invoke(state["messages"])],
+        }
+    ## The graph
+    builder = StateGraph(AgentState)
+    # Define nodes: these do the work
+    builder.add_node("assistant", assistant)
+    builder.add_node("tools", ToolNode(tools))
+    # Define edges: these determine how the control flow moves
+    builder.add_edge(START, "assistant")
+    builder.add_conditional_edges(
+        "assistant",
+        # If the latest message requires a tool, route to tools
+        # Otherwise, provide a direct response
+        tools_condition,
+    )
+    builder.add_edge("tools", "assistant")
+    # Compile the graph without callback parameter
+    jasper = builder.compile()
+    print("Langfuse tracing enabled - traces will be available in your Langfuse dashboard")
+    return jasper
+def run_jasper():
+    jasper = build_jasper()
+    messages = [HumanMessage(content="Examine the video at https://www.youtube.com/watch?v=1htKBjuUWec.\n\nWhat does Teal'c say in response to the question \"Isn't that hot?\"")]
+    # Get Langfuse handler for tracing
+    langfuse_handler = get_langfuse_handler()
+    # Add trace metadata for this specific run
+    response = jasper.invoke(
+        {"messages": messages},
+        config={
+            "callbacks": [langfuse_handler],
+            "metadata": {
+                "trace_name": "YouTube_Video_Analysis",
+                "user_id": "jasper-user",
+                "session_id": "jasper-agent-session"
+            }
+        }
+    )
+    print("Jasper's Response:")
+    print(response['messages'][-1].content)
+# Script entry point: run the sample query only when executed directly.
+if __name__ == "__main__":
+    run_jasper()

app.py CHANGED Viewed

@@ -3,25 +3,49 @@ import gradio as gr
 import requests
 import inspect
 import pandas as pd
 # (Keep Constants as is)
 # --- Constants ---
 DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"
-# --- Basic Agent Definition ---
 # ----- THIS IS WHERE YOU CAN BUILD WHAT YOU WANT ------
-class BasicAgent:
     def __init__(self):
-        print("BasicAgent initialized.")
-    def __call__(self, question: str) -> str:
-        print(f"Agent received question (first 50 chars): {question[:50]}...")
-        fixed_answer = "This is a default answer."
-        print(f"Agent returning fixed answer: {fixed_answer}")
-        return fixed_answer
 def run_and_submit_all( profile: gr.OAuthProfile | None):
     """
-    Fetches all questions, runs the BasicAgent on them, submits all answers,
     and displays the results.
     """
     # --- Determine HF Space Runtime URL and Repo URL ---
@@ -40,7 +64,7 @@ def run_and_submit_all( profile: gr.OAuthProfile | None):
     # 1. Instantiate Agent ( modify this part to create your agent)
     try:
-        agent = BasicAgent()
     except Exception as e:
         print(f"Error instantiating agent: {e}")
         return f"Error initializing agent: {e}", None
@@ -80,7 +104,8 @@ def run_and_submit_all( profile: gr.OAuthProfile | None):
             print(f"Skipping item with missing task_id or question: {item}")
             continue
         try:
-            submitted_answer = agent(question_text)
             answers_payload.append({"task_id": task_id, "submitted_answer": submitted_answer})
             results_log.append({"Task ID": task_id, "Question": question_text, "Submitted Answer": submitted_answer})
         except Exception as e:
@@ -107,7 +132,8 @@ def run_and_submit_all( profile: gr.OAuthProfile | None):
             f"User: {result_data.get('username')}\n"
             f"Overall Score: {result_data.get('score', 'N/A')}% "
             f"({result_data.get('correct_count', '?')}/{result_data.get('total_attempted', '?')} correct)\n"
-            f"Message: {result_data.get('message', 'No message received.')}"
         )
         print("Submission successful.")
         results_df = pd.DataFrame(results_log)
@@ -142,7 +168,7 @@ def run_and_submit_all( profile: gr.OAuthProfile | None):
 # --- Build Gradio Interface using Blocks ---
 with gr.Blocks() as demo:
-    gr.Markdown("# Basic Agent Evaluation Runner")
     gr.Markdown(
         """
         **Instructions:**
@@ -150,6 +176,7 @@ with gr.Blocks() as demo:
         1.  Please clone this space, then modify the code to define your agent's logic, the tools, the necessary packages, etc ...
         2.  Log in to your Hugging Face account using the button below. This uses your HF username for submission.
         3.  Click 'Run Evaluation & Submit All Answers' to fetch questions, run your agent, submit answers, and see the score.
         ---
         **Disclaimers:**
@@ -192,5 +219,5 @@ if __name__ == "__main__":
     print("-"*(60 + len(" App Starting ")) + "\n")
-    print("Launching Gradio Interface for Basic Agent Evaluation...")
     demo.launch(debug=True, share=False)

 import requests
 import inspect
 import pandas as pd
+from agent import build_jasper, get_langfuse_handler
+from langchain_core.messages import HumanMessage
 # (Keep Constants as is)
 # --- Constants ---
 DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"
+# --- Jasper Agent Definition ---
 # ----- THIS IS WHERE YOU CAN BUILD WHAT YOU WANT ------
+class JasperAgent:
+    """Callable wrapper that runs the compiled Jasper graph on one question at a time."""
     def __init__(self):
+        # The graph and the Langfuse handler are created once here and reused
+        # by every __call__.
+        print("JasperAgent initialized.")
+        self.jasper = build_jasper()
+        self.langfuse_handler = get_langfuse_handler()
+    def __call__(self, question: str, task_id: str = None) -> str:
+        """Answer a single question.
+
+        Args:
+            question: The question text, sent to the graph as one HumanMessage.
+            task_id: Optional identifier, used only in the tracing metadata.
+
+        Returns:
+            The content of the last message in the graph's response, or an
+            "Error processing question: ..." string if anything raises.
+        """
+        print(f"Agent received question: {question}.")
+        try:
+            messages = [HumanMessage(content=question)]
+            # Add Langfuse tracing metadata
+            config = {
+                "callbacks": [self.langfuse_handler],
+                "metadata": {
+                    "trace_name": f"Evaluation_Task_{task_id}" if task_id else "Agent_Query",
+                    "user_id": "evaluation-user",
+                    "session_id": "evaluation-session",
+                    "task_id": task_id,
+                    # NOTE(review): despite the key name, the full question
+                    # text is stored here, not a shortened preview.
+                    "question_preview": question
+                }
+            }
+            response = self.jasper.invoke({"messages": messages}, config=config)
+            answer = response['messages'][-1].content
+            print(f"Agent returning answer: {answer}.")
+            return answer
+        except Exception as e:
+            # Best-effort: the error text is returned as the answer instead of
+            # propagating the exception to the caller.
+            print(f"Error in agent processing: {e}")
+            return f"Error processing question: {str(e)}"
 def run_and_submit_all( profile: gr.OAuthProfile | None):
     """
+    Fetches all questions, runs the JasperAgent on them, submits all answers,
     and displays the results.
     """
     # --- Determine HF Space Runtime URL and Repo URL ---
     # 1. Instantiate Agent ( modify this part to create your agent)
     try:
+        agent = JasperAgent()
     except Exception as e:
         print(f"Error instantiating agent: {e}")
         return f"Error initializing agent: {e}", None
             print(f"Skipping item with missing task_id or question: {item}")
             continue
         try:
+            # Pass task_id for better tracing
+            submitted_answer = agent(question_text, task_id=task_id)
             answers_payload.append({"task_id": task_id, "submitted_answer": submitted_answer})
             results_log.append({"Task ID": task_id, "Question": question_text, "Submitted Answer": submitted_answer})
         except Exception as e:
             f"User: {result_data.get('username')}\n"
             f"Overall Score: {result_data.get('score', 'N/A')}% "
             f"({result_data.get('correct_count', '?')}/{result_data.get('total_attempted', '?')} correct)\n"
+            f"Message: {result_data.get('message', 'No message received.')}\n"
+            f"📊 View detailed traces in your Langfuse dashboard"
         )
         print("Submission successful.")
         results_df = pd.DataFrame(results_log)
 # --- Build Gradio Interface using Blocks ---
 with gr.Blocks() as demo:
+    gr.Markdown("# Jasper Agent Evaluation Runner")
     gr.Markdown(
         """
         **Instructions:**
         1.  Please clone this space, then modify the code to define your agent's logic, the tools, the necessary packages, etc ...
         2.  Log in to your Hugging Face account using the button below. This uses your HF username for submission.
         3.  Click 'Run Evaluation & Submit All Answers' to fetch questions, run your agent, submit answers, and see the score.
+        4.  **Langfuse Tracing**: All agent operations are traced with Langfuse for detailed analysis and debugging.
         ---
         **Disclaimers:**
     print("-"*(60 + len(" App Starting ")) + "\n")
+    print("Launching Gradio Interface for Jasper Agent Evaluation...")
     demo.launch(debug=True, share=False)

requirements.txt CHANGED Viewed

@@ -1,2 +1,9 @@
 gradio
-requests

 gradio
+requests
+langchain-community
+langchain-huggingface
+langgraph
+langfuse
+langchain-openai
+youtube-transcript-api
+pytube