Final_Assignment_Submission

Sleeping

App Files Files Community

Sonu313131 committed on Jun 28

Commit

8753522

verified ·

1 Parent(s): 254e51c

Update app.py

Browse files

Files changed (1) hide show

app.py +20 -14

app.py CHANGED Viewed

@@ -20,14 +20,18 @@ import re
 from youtube_transcript_api import YouTubeTranscriptApi
 from smolagents import Tool
-class YouTubeCaptionTool(Tool):
-    name = "youtube_caption_reader"
-    description = "Extracts captions from a YouTube video given its URL and returns the transcript or a segment."
     inputs = {
         "url": {
             "type": "string",
-            "description": "Full YouTube video URL (e.g., https://www.youtube.com/watch?v=abc123)"
         }
     }
@@ -35,19 +39,21 @@ class YouTubeCaptionTool(Tool):
     def forward(self, url: str) -> str:
         try:
-            # Extract the video ID from the URL
-            match = re.search(r"(?:v=|youtu.be/)([\w-]+)", url)
-            if not match:
-                return "Could not extract video ID from URL."
-            video_id = match.group(1)
-            transcript = YouTubeTranscriptApi.get_transcript(video_id)
-            full_text = " ".join([entry['text'] for entry in transcript])
-            return full_text[:3000]  # return first 3000 characters
         except Exception as e:
-            return f"Failed to retrieve transcript: {str(e)}"
 ##Tool 2
@@ -121,7 +127,7 @@ async def run_and_submit_all(profile: gr.OAuthProfile | None):
                 model=OpenAIServerModel(model_id="gpt-4o-mini",
                                         api_key=os.environ["OPENAI_API_KEY"],
                                        temperature=0.0),
-            max_steps=12,
             verbosity_level=2
         )
     except Exception as e:

 from youtube_transcript_api import YouTubeTranscriptApi
 from smolagents import Tool
+from smolagents import Tool
+from youtube_transcript_api import YouTubeTranscriptApi
+from urllib.parse import urlparse, parse_qs
+class YouTubeTranscriptTool(Tool):
+    name = "youtube_transcript"
+    description = "Fetches the full transcript of a YouTube video from its URL."
     inputs = {
         "url": {
             "type": "string",
+            "description": "The full YouTube video URL"
         }
     }
     def forward(self, url: str) -> str:
         try:
+            # Extract video ID from URL
+            parsed = urlparse(url)
+            video_id = parse_qs(parsed.query).get("v", [None])[0]
+            if not video_id:
+                return "Error: Invalid YouTube URL or missing video ID."
+            # Fetch the transcript
+            transcript_list = YouTubeTranscriptApi.get_transcript(video_id)
+            transcript_text = " ".join(entry["text"] for entry in transcript_list)
+            return transcript_text[:5000]  # Optional: truncate to 5000 chars
         except Exception as e:
+            return f"Error retrieving transcript: {str(e)}"
 ##Tool 2
                 model=OpenAIServerModel(model_id="gpt-4o-mini",
                                         api_key=os.environ["OPENAI_API_KEY"],
                                        temperature=0.0),
+            max_steps=18,
             verbosity_level=2
         )
     except Exception as e: