on1onmangoes committed on
Commit
9324d2a
1 Parent(s): d23a170

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +16 -7
app.py CHANGED
@@ -32,9 +32,18 @@ def transcribe(audio_path, task="transcribe", group_by_speaker=True, progress=gr
32
  print(diarization)
33
  #segments = diarization.for_json()["content"]
34
  #segments = str(diarization)
35
- transcription = "this is a test"
36
  return transcription
37
 
 
 
 
 
 
 
 
 
 
38
  audio_file = gr.Interface(
39
  fn=transcribe,
40
  inputs=[
@@ -43,12 +52,12 @@ audio_file = gr.Interface(
43
  gr.inputs.Checkbox(default=True, label="Group by speaker"),
44
  ],
45
  outputs=[
46
- gr.outputs.Textbox(label="Transcription")
47
- ]
48
- # allow_flagging="never",
49
- # title=title,
50
- # description=description,
51
- # article=article,
52
  )
53
 
54
  demo = gr.Blocks()
 
32
  print(diarization)
33
  #segments = diarization.for_json()["content"]
34
  #segments = str(diarization)
35
+ transcription = "SAML Output"
36
  return transcription
37
 
38
+ title = "SAML Speaker Diarization ⚡️"
39
+
40
+ description = """Combine the speed of Whisper JAX with pyannote speaker diarization to transcribe meetings in super fast time. Demo uses Whisper JAX as an [endpoint](https://twitter.com/sanchitgandhi99/status/1656665496463495168) and pyannote speaker diarization running locally. The Whisper JAX endpoint is run asynchronously, meaning speaker diarization is run in parallel to the speech transcription. The diarized timestamps are aligned with the Whisper output to give the final speaker-segmented transcription.
41
+ To duplicate the demo, first accept the pyannote terms of use for the [speaker diarization](https://huggingface.co/pyannote/speaker-diarization) and [segmentation](https://huggingface.co/pyannote/segmentation) models. Then, click [here](https://huggingface.co/spaces/sanchit-gandhi/whisper-jax-diarization?duplicate=true) to duplicate the demo, and enter your Hugging Face access token as a Space secret when prompted.
42
+ """
43
+
44
+ article = "Whisper large-v2 model by OpenAI. Speaker diarization model by pyannote. Whisper JAX backend running JAX on a TPU v4-8 through the generous support of the [TRC](https://sites.research.google/trc/about/) programme. Whisper JAX [code](https://github.com/sanchit-gandhi/whisper-jax) and Gradio demo by 🤗 Hugging Face."
45
+
46
+
47
  audio_file = gr.Interface(
48
  fn=transcribe,
49
  inputs=[
 
52
  gr.inputs.Checkbox(default=True, label="Group by speaker"),
53
  ],
54
  outputs=[
55
+ gr.outputs.Textbox(label="Transcription").style(show_copy_button=True)
56
+ ],
57
+ allow_flagging="never",
58
+ title=title,
59
+ description=description,
60
+ article=article,
61
  )
62
 
63
  demo = gr.Blocks()