voice_clone_v2

Paused

App Files Files Community

ahassoun committed on Sep 13, 2023

Commit

b4f3031

1 Parent(s): 9a1196d

Update app.py

Browse files

Files changed (1) hide show

app.py +1 -68

app.py CHANGED Viewed

@@ -352,14 +352,7 @@ with gr.Blocks(css=css) as demo:
     with gr.Column(elem_id="col-container"):
         gr.Markdown("""
-        <h1 style="text-align: center;">Coqui + Bark Voice Cloning</h1>
-        <p style="text-align: center;">
-        Mimic any voice character in less than 2 minutes with this <a href="https://tts.readthedocs.io/en/dev/models/bark.html" target="_blank">Coqui TTS + Bark</a> demo ! <br />
-        Upload a clean 20 seconds WAV file of the vocal persona you want to mimic, <br />
-        type your text-to-speech prompt and hit submit ! <br />
-        </p>
-        [![Duplicate this Space](https://huggingface.co/datasets/huggingface/badges/raw/main/duplicate-this-space-sm.svg#center)](https://huggingface.co/spaces/fffiloni/instant-TTS-Bark-cloning?duplicate=true)
         """)
         with gr.Row():
             with gr.Column():
@@ -378,7 +371,6 @@ with gr.Blocks(css=css) as demo:
                     source="upload",
                     interactive = False
                 )
-                clean_sample = gr.Checkbox(label="Clean sample ?", value=False)
                 hidden_audio_numpy = gr.Audio(type="numpy", visible=False)
                 submit_btn = gr.Button("Submit")
@@ -415,20 +407,6 @@ with gr.Blocks(css=css) as demo:
                 audio_in.upload(fn=load_hidden, inputs=[audio_in], outputs=[hidden_audio_numpy], queue=False)
                 micro_in.stop_recording(fn=load_hidden_mic, inputs=[micro_in], outputs=[hidden_audio_numpy], queue=False)
-                with gr.Tab("Voices Characters"):
-                    selected_state = gr.State()
-                    gallery_in = gr.Gallery(
-                                label="Character Gallery",
-                                value=[(item["image"], item["title"]) for item in characters],
-                                interactive = True,
-                                allow_preview=False,
-                                columns=3,
-                                elem_id="gallery",
-                                show_share_button=False
-                            )
-                    c_submit_btn = gr.Button("Submit")
             with gr.Column():
@@ -450,34 +428,8 @@ with gr.Blocks(css=css) as demo:
                 folder_path = gr.Textbox(visible=False)
-                character_name = gr.Textbox(
-                    label="Character Name",
-                    placeholder="Name that voice character",
-                    elem_id = "character-name"
-                )
-                voice_description = gr.Textbox(
-                    label="description",
-                    placeholder="How would you describe that voice ? ",
-                    elem_id = "voice-description"
-                )
-                with gr.Group(elem_id="share-btn-container", visible=False) as share_group:
-                    community_icon = gr.HTML(community_icon_html)
-                    loading_icon = gr.HTML(loading_icon_html)
-                    share_button = gr.Button("Share with Community", elem_id="share-btn")
-        share_button.click(None, [], [], _js=share_js, queue=False)
-        gallery_in.select(
-            update_selection,
-            outputs=[character_name, selected_state],
-            queue=False,
-            show_progress=False,
-        )
         audio_in.change(fn=wipe_npz_file, inputs=[folder_path], queue=False)
         micro_in.clear(fn=wipe_npz_file, inputs=[folder_path], queue=False)
@@ -500,14 +452,12 @@ with gr.Blocks(css=css) as demo:
             inputs = [
                 prompt,
                 audio_in,
-                clean_sample,
                 hidden_audio_numpy
             ],
             outputs = [
                 cloned_out,
                 video_out,
                 npz_file,
-                share_group,
                 folder_path
             ],
             cache_examples = False
@@ -534,14 +484,12 @@ with gr.Blocks(css=css) as demo:
         inputs = [
             prompt,
             audio_in,
-            clean_sample,
             hidden_audio_numpy
         ],
         outputs = [
             cloned_out,
             video_out,
             npz_file,
-            share_group,
             folder_path
         ]
     )
@@ -558,23 +506,8 @@ with gr.Blocks(css=css) as demo:
             cloned_out,
             video_out,
             npz_file,
-            share_group,
             folder_path
         ]
     )
-    c_submit_btn.click(
-        fn = infer_from_c,
-        inputs = [
-            prompt,
-            character_name
-        ],
-        outputs = [
-            cloned_out,
-            video_out,
-            npz_file,
-            share_group
-        ]
-    )
 demo.queue(api_open=False, max_size=10).launch()

     with gr.Column(elem_id="col-container"):
         gr.Markdown("""
+        <h1 style="text-align: center;">Voice Cloning Demo</h1>
         """)
         with gr.Row():
             with gr.Column():
                     source="upload",
                     interactive = False
                 )
                 hidden_audio_numpy = gr.Audio(type="numpy", visible=False)
                 submit_btn = gr.Button("Submit")
                 audio_in.upload(fn=load_hidden, inputs=[audio_in], outputs=[hidden_audio_numpy], queue=False)
                 micro_in.stop_recording(fn=load_hidden_mic, inputs=[micro_in], outputs=[hidden_audio_numpy], queue=False)
             with gr.Column():
                 folder_path = gr.Textbox(visible=False)
         audio_in.change(fn=wipe_npz_file, inputs=[folder_path], queue=False)
         micro_in.clear(fn=wipe_npz_file, inputs=[folder_path], queue=False)
             inputs = [
                 prompt,
                 audio_in,
                 hidden_audio_numpy
             ],
             outputs = [
                 cloned_out,
                 video_out,
                 npz_file,
                 folder_path
             ],
             cache_examples = False
         inputs = [
             prompt,
             audio_in,
             hidden_audio_numpy
         ],
         outputs = [
             cloned_out,
             video_out,
             npz_file,
             folder_path
         ]
     )
             cloned_out,
             video_out,
             npz_file,
             folder_path
         ]
     )
 demo.queue(api_open=False, max_size=10).launch()