Spaces:
Sleeping
Sleeping
File size: 628 Bytes
5fe9041 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 |
from smolagents.tools import Tool
from huggingface_hub import InferenceClient
class AudioTranscriptionTool(Tool):
name = "audio_transcription"
description = "Transcribes speech from an audio file (e.g., MP3)"
inputs = {"audio_path": {"type": "string", "description": "Path to the audio file"}}
output_type = "string"
def __init__(self):
super().__init__()
self.client = InferenceClient("openai/whisper-large-v3")
def forward(self, audio_path: str) -> str:
with open(audio_path, "rb") as f:
transcript = self.client.audio_to_text(f)
return transcript["text"] |