File size: 557 Bytes
2f82e01
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
import nemo.collections.asr as nemo_asr
import gradio as gr


# Name of the pretrained checkpoint requested from NeMo.
_PRETRAINED_MODEL_NAME = "QuartzNet15x5Base-En"

# Load the model once at import time; `transcribe` below reuses this instance.
asr_model = nemo_asr.models.ASRModel.from_pretrained(
    model_name=_PRETRAINED_MODEL_NAME,
)


def transcribe(audio):
    """Transcribe a single recorded audio clip to text.

    Args:
        audio: Path to the recorded audio file (the Gradio audio input is
            configured with ``type="filepath"``). May be ``None`` or empty
            when nothing was recorded.

    Returns:
        The text of the first transcription result, or an empty string when
        no audio was provided.
    """
    # Nothing was recorded: skip the model call instead of letting it fail
    # on an invalid path and surface an error in the UI.
    if not audio:
        return ""

    # The model API takes a batch of paths; we send a batch of one.
    transcription = asr_model.transcribe([audio])
    first = transcription[0]

    # Plain strings pass through unchanged; result objects that carry the
    # decoded text in a `.text` attribute are unwrapped to that text.
    # NOTE(review): newer NeMo releases appear to return Hypothesis objects
    # here -- confirm against the installed NeMo version.
    return getattr(first, "text", first)


# Microphone recording, delivered to the callback as a path to the audio file.
# NOTE(review): `gr.inputs` looks like the legacy component namespace in later
# Gradio releases -- confirm the pinned Gradio version still provides it.
microphone_input = gr.inputs.Audio(source="microphone", type="filepath")

# Wire the microphone input to `transcribe` and show its result as plain text.
iface = gr.Interface(
    fn=transcribe,
    inputs=microphone_input,
    outputs="text",
    title="ASR with NeMo",
    description="Speak into your microphone and get a transcription using NVIDIA NeMo QuartzNet ASR.",
)


# Start the Gradio app.
iface.launch()