whisperturbo / app.py
yasserrmd's picture
Update app.py
d0d0cf3 verified
raw
history blame
747 Bytes
import gradio as gr
from transformers import pipeline
import spaces
# Load the Whisper model from Hugging Face
model = pipeline("automatic-speech-recognition", model="ylacombe/whisper-large-v3-turbo", chunk_length_s=30, device=0)
# Function to process audio input and transcribe it
@spaces.GPU
def transcribe(audio):
# Load and preprocess the audio
transcription = model(audio,batch_size=1000, generate_kwargs={"task": "transcribe"}, return_timestamps=True)["text"]
return transcription
# Gradio interface
interface = gr.Interface(
fn=transcribe,
inputs=gr.Audio(sources="microphone", type="filepath"),
outputs="text",
title="Whisper Voice Transcription with Hugging Face"
)
# Launch the app
interface.launch()