Final_Assignment_Template / video_translation.py
Synnove's picture
Create video_translation.py
5fe9041 verified
raw
history blame
628 Bytes
from smolagents.tools import Tool
from huggingface_hub import InferenceClient
class AudioTranscriptionTool(Tool):
name = "audio_transcription"
description = "Transcribes speech from an audio file (e.g., MP3)"
inputs = {"audio_path": {"type": "string", "description": "Path to the audio file"}}
output_type = "string"
def __init__(self):
super().__init__()
self.client = InferenceClient("openai/whisper-large-v3")
def forward(self, audio_path: str) -> str:
with open(audio_path, "rb") as f:
transcript = self.client.audio_to_text(f)
return transcript["text"]