Spaces:

kevinwang676
/

Bark-Voice-Cloning

Runtime error

App Files Community

kevinwang676 committed on Jun 12, 2023

Commit

974e687

•

1 Parent(s): 6fe5d0a

Update app.py

Browse files

Files changed (1) hide show

app.py +27 -28

app.py CHANGED Viewed

@@ -321,35 +321,11 @@ while run_server:
                 with gr.Column():
                     placeholder = "Enter text here."
                     input_text = gr.Textbox(label="Input Text", lines=4, placeholder=placeholder)
                 with gr.Column():
                         seedcomponent = gr.Number(label="Seed (default -1 = Random)", precision=0, value=-1)
                         batchcount = gr.Number(label="Batch count", precision=0, value=1)
-            with gr.Row():
-                with gr.Column():
-                    examples = [
-                        "Special meanings: [laughter] [laughs] [sighs] [music] [gasps] [clears throat] MAN: WOMAN:",
-                       "♪ Never gonna make you cry, never gonna say goodbye, never gonna tell a lie and hurt you ♪",
-                       "And now — a picture of a larch [laughter]",
-                       """
-                            WOMAN: I would like an oatmilk latte please.
-                            MAN: Wow, that's expensive!
-                       """,
-                       """<?xml version="1.0"?>
-    <speak version="1.0" xmlns="http://www.w3.org/2001/10/synthesis"
-             xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
-             xsi:schemaLocation="http://www.w3.org/2001/10/synthesis
-                       http://www.w3.org/TR/speech-synthesis/synthesis.xsd"
-             xml:lang="en-US">
-    <voice name="/v2/en_speaker_9">Look at that drunk guy!</voice>
-    <voice name="/v2/en_speaker_3">Who is he?</voice>
-    <voice name="/v2/en_speaker_9">WOMAN: [clears throat] 10 years ago, he proposed me and I rejected him.</voice>
-    <voice name="/v2/en_speaker_3">Oh my God [laughs] he is still celebrating</voice>
-    </speak>"""
-                       ]
-                    examples = gr.Examples(examples=examples, inputs=input_text)
-                with gr.Column():
-                    convert_to_ssml_button = gr.Button("Convert Input Text to SSML")
             with gr.Row():
                 with gr.Column():
                     gr.Markdown("[Voice Prompt Library](https://suno-ai.notion.site/8b8e8749ed514b0cbf3f699013548683?v=bc67cff786b04b50b3ceb756fd05f68c)")
@@ -376,7 +352,30 @@ while run_server:
             with gr.Row():
                 output_audio = gr.Audio(label="Generated Audio", type="filepath")
-        with gr.Tab("Swap Voice"):
             with gr.Row():
                  swap_audio_filename = gr.Audio(label="Input audio.wav to swap voice", source="upload", type="filepath")
             with gr.Row():
@@ -387,7 +386,7 @@ while run_server:
                      speaker_swap = gr.Dropdown(speakers_list, value=speakers_list[0], label="Voice")
                      swap_batchcount = gr.Number(label="Batch count", precision=0, value=1)
             with gr.Row():
-                swap_voice_button = gr.Button("Swap Voice")
             with gr.Row():
                 output_swap = gr.Audio(label="Generated Audio", type="filepath")

                 with gr.Column():
                     placeholder = "Enter text here."
                     input_text = gr.Textbox(label="Input Text", lines=4, placeholder=placeholder)
+                    convert_to_ssml_button = gr.Button("Convert Input Text to SSML")
                 with gr.Column():
                         seedcomponent = gr.Number(label="Seed (default -1 = Random)", precision=0, value=-1)
                         batchcount = gr.Number(label="Batch count", precision=0, value=1)
             with gr.Row():
                 with gr.Column():
                     gr.Markdown("[Voice Prompt Library](https://suno-ai.notion.site/8b8e8749ed514b0cbf3f699013548683?v=bc67cff786b04b50b3ceb756fd05f68c)")
             with gr.Row():
                 output_audio = gr.Audio(label="Generated Audio", type="filepath")
+            with gr.Row():
+                examples = [
+                    "Special meanings: [laughter] [laughs] [sighs] [music] [gasps] [clears throat] MAN: WOMAN:",
+                    "♪ Never gonna make you cry, never gonna say goodbye, never gonna tell a lie and hurt you ♪",
+                    "And now — a picture of a larch [laughter]",
+                    """
+                        WOMAN: I would like an oatmilk latte please.
+                        MAN: Wow, that's expensive!
+                    """,
+                    """<?xml version="1.0"?>
+<speak version="1.0" xmlns="http://www.w3.org/2001/10/synthesis"
+            xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
+            xsi:schemaLocation="http://www.w3.org/2001/10/synthesis
+                    http://www.w3.org/TR/speech-synthesis/synthesis.xsd"
+            xml:lang="en-US">
+<voice name="/v2/en_speaker_9">Look at that drunk guy!</voice>
+<voice name="/v2/en_speaker_3">Who is he?</voice>
+<voice name="/v2/en_speaker_9">WOMAN: [clears throat] 10 years ago, he proposed me and I rejected him.</voice>
+<voice name="/v2/en_speaker_3">Oh my God [laughs] he is still celebrating</voice>
+</speak>"""
+                    ]
+                examples = gr.Examples(examples=examples, inputs=input_text)
+        with gr.Tab("Voice Conversion"):
             with gr.Row():
                  swap_audio_filename = gr.Audio(label="Input audio.wav to swap voice", source="upload", type="filepath")
             with gr.Row():
                      speaker_swap = gr.Dropdown(speakers_list, value=speakers_list[0], label="Voice")
                      swap_batchcount = gr.Number(label="Batch count", precision=0, value=1)
             with gr.Row():
+                swap_voice_button = gr.Button("Voice Conversion")
             with gr.Row():
                 output_swap = gr.Audio(label="Generated Audio", type="filepath")