Spaces:

Hunzla
/

whisperaudio

Runtime error

Hunzla committed on Aug 9, 2023

Commit

37ad5f1

•

1 Parent(s): 7c81e92

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -11,7 +11,7 @@ diarization_pipe = Pipeline.from_pretrained("pyannote/speaker-diarization@2.1",
 # Load the speech-to-text model (Whisper)
-asr_pipe = pipeline("automatic-speech-recognition", model="SyedAunZaidi/whisper-small-hi")
 def transcribe_with_diarization(audio_path):
     # Get speaker segments using the diarization model
@@ -51,9 +51,12 @@ def transcribe_with_diarization(audio_path):
 iface = gr.Interface(
     fn=transcribe_with_diarization,
-    inputs=gr.Audio(source="microphone", type="filepath", filetype="wav"),
     outputs="text",
-    title="Whisper Large Hindi with Speaker Diarization",
     description="Real-time demo for Hindi speech recognition using a fine-tuned Whisper large model with speaker diarization.",
 )

 # Load the speech-to-text model (Whisper)
+asr_pipe = pipeline("automatic-speech-recognition", model="openai/whisper-tiny")
 def transcribe_with_diarization(audio_path):
     # Get speaker segments using the diarization model
 iface = gr.Interface(
     fn=transcribe_with_diarization,
+    inputs=[
+        gr.File(label="Audio File"),
+        gr.Audio(source="microphone", type="filepath", filetype="wav")
+    ],
     outputs="text",
+    title="Whisper small Hindi with Speaker Diarization",
     description="Real-time demo for Hindi speech recognition using a fine-tuned Whisper large model with speaker diarization.",
 )