Spaces:

Flux9665
/

MassivelyMultilingualTTS

Running on T4

App Files Files

Flux9665 committed on Oct 31, 2024

Commit

3abac7b

verified ·

1 Parent(s): 2889ed0

Update app.py

Browse files

Files changed (1) hide show

app.py +2 -8

app.py CHANGED Viewed

@@ -16,18 +16,12 @@ class TTSWebUI:
                  tts_model_path=None,
                  vocoder_model_path=None,
                  embedding_gan_path=None,
-                 available_artificial_voices=50  # be careful with this, if you want too many, it might lead to an endless loop
                  ):
         path_to_iso_list = hf_hub_download(repo_id="Flux9665/ToucanTTS", filename="iso_to_fullname.json")
         iso_to_name = load_json_from_path(path_to_iso_list)
         text_selection = [f"{iso_to_name[iso_code]} ({iso_code})" for iso_code in iso_to_name]
         # accent_selection = [f"{iso_to_name[iso_code]} Accent ({iso_code})" for iso_code in iso_to_name]
-        if tts_model_path is None:
-            tts_model_path = hf_hub_download(repo_id="Flux9665/ToucanTTS", filename="ToucanTTS.pt")
-        if vocoder_model_path is None:
-            vocoder_model_path = hf_hub_download(repo_id="Flux9665/ToucanTTS", filename="Vocoder.pt")
-        if embedding_gan_path is None:
-            embedding_gan_path = hf_hub_download(repo_id="Flux9665/ToucanTTS", filename="embedding_gan.pt")
         self.controllable_ui = ControllableInterface(gpu_id=gpu_id,
                                                      available_artificial_voices=available_artificial_voices,
@@ -45,7 +39,7 @@ class TTSWebUI:
                                                       label="Select the Language of the Text (type on your keyboard to find it quickly)"),
                                           gr.Slider(minimum=0.0, maximum=0.8, step=0.1, value=0.5, label="Prosody Creativity"),
                                           gr.Slider(minimum=0.7, maximum=1.3, step=0.1, value=1.0, label="Faster - Slower"),
-                                          gr.Slider(minimum=0, maximum=available_artificial_voices, step=1, value=27, label="Random Seed for the artificial Voice"),
                                           gr.Slider(minimum=-10.0, maximum=10.0, step=0.1, value=0.0, label="Gender of artificial Voice"),
                                           gr.Audio(type="filepath", show_label=True, container=True, label="[OPTIONAL] Voice to Clone (if left empty, will use an artificial voice instead)"),
                                           # gr.Slider(minimum=0.5, maximum=1.5, step=0.1, value=1.0, label="Pitch Variance Scale"),

                  tts_model_path=None,
                  vocoder_model_path=None,
                  embedding_gan_path=None,
+                 available_artificial_voices=10  # be careful with this, if you want too many, it might lead to an endless loop
                  ):
         path_to_iso_list = hf_hub_download(repo_id="Flux9665/ToucanTTS", filename="iso_to_fullname.json")
         iso_to_name = load_json_from_path(path_to_iso_list)
         text_selection = [f"{iso_to_name[iso_code]} ({iso_code})" for iso_code in iso_to_name]
         # accent_selection = [f"{iso_to_name[iso_code]} Accent ({iso_code})" for iso_code in iso_to_name]
         self.controllable_ui = ControllableInterface(gpu_id=gpu_id,
                                                      available_artificial_voices=available_artificial_voices,
                                                       label="Select the Language of the Text (type on your keyboard to find it quickly)"),
                                           gr.Slider(minimum=0.0, maximum=0.8, step=0.1, value=0.5, label="Prosody Creativity"),
                                           gr.Slider(minimum=0.7, maximum=1.3, step=0.1, value=1.0, label="Faster - Slower"),
+                                          gr.Slider(minimum=0, maximum=available_artificial_voices, step=1, value=5, label="Random Seed for the artificial Voice"),
                                           gr.Slider(minimum=-10.0, maximum=10.0, step=0.1, value=0.0, label="Gender of artificial Voice"),
                                           gr.Audio(type="filepath", show_label=True, container=True, label="[OPTIONAL] Voice to Clone (if left empty, will use an artificial voice instead)"),
                                           # gr.Slider(minimum=0.5, maximum=1.5, step=0.1, value=1.0, label="Pitch Variance Scale"),