Multi-language_Text-to-Speech

Running

App Files Files Community

Olivier-Truong committed on Sep 21, 2023

Commit

915ef6e

1 Parent(s): b7e7e06

Update app.py

Browse files

Files changed (1) hide show

app.py +6 -33

app.py CHANGED Viewed

@@ -8,28 +8,9 @@ from TTS.api import TTS
 model_names = TTS().list_models()
 m = model_names[0]
-#for model in model_names:
-#    if model.find("/fr/") != -1:
-#        m = model
-#        break
 print(model_names)
-"""
-print(os.listdir("/home/user/.local/lib/python3.10/site-packages/TTS/"))
-print(os.listdir("/home/user/.local/lib/python3.10/site-packages/TTS/utils"))
-old = open("/home/user/.local/lib/python3.10/site-packages/TTS/utils/io.py", "r").read()
-new_one = old.replace("return torch.load(f, map_location=map_location, **kwargs)", "return torch.load(f, map_location=torch.device('cpu'), **kwargs)")
-open("/home/user/.local/lib/python3.10/site-packages/TTS/utils/io.py", "w").write(new_one)
-old = open("/home/user/.local/lib/python3.10/site-packages/TTS/tts/models/xtts.py", "r").read()
-new_one = old.replace("self.load_state_dict(load_fsspec(model_path)[\"model\"], strict=strict)", "self.load_state_dict(load_fsspec(model_path, ** map_location=self.device ** )[\"model\"], strict=strict)")
-open("/home/user/.local/lib/python3.10/site-packages/TTS/tts/models/xtts.py", "w").write(new_one)
-try:
-    print(open("/home/user/.local/lib/python3.10/site-packages/TTS/utils/io.py", "r").read())
-except:
-    print("mauvais fichier")
-"""
-tts = TTS(m, gpu=False).to("cpu")
 #tts.to("cuda") # cuda only
 def predict(prompt, language, audio_file_pth, mic_file_path, use_mic, agree):
@@ -53,7 +34,7 @@ def predict(prompt, language, audio_file_pth, mic_file_path, use_mic, agree):
                     None,
                     None,
                 )
-        if len(prompt)>200:
             gr.Warning("Text length limited to 200 characters for this demo, please try shorter text")
             return (
                     None,
@@ -71,14 +52,6 @@ def predict(prompt, language, audio_file_pth, mic_file_path, use_mic, agree):
                 speaker_wav=speaker_wav,
                 language=language
             )
-            """
-            tts.tts_to_file(
-                text=prompt,
-                file_path="output.wav",
-                speaker_wav=speaker_wav,
-                language=language,
-            )
-            """
         except RuntimeError as e :
             if "device-assert" in str(e):
                 # cannot do anything on a CUDA device-side error; need to restart
@@ -102,7 +75,7 @@ def predict(prompt, language, audio_file_pth, mic_file_path, use_mic, agree):
             )
-title = "Coqui🐸 XTTS"
 description = """
 <a href="https://huggingface.co/coqui/XTTS-v1">XTTS</a> is a Voice generation model that lets you clone voices into different languages by using just a quick 3-second audio clip.
@@ -232,7 +205,7 @@ gr.Interface(
         gr.Textbox(
             label="Text Prompt",
             info="One or two sentences at a time is better",
-            value="Hi there, I'm your new voice clone. Try your best to upload quality audio",
         ),
         gr.Dropdown(
             label="Language",
@@ -253,7 +226,7 @@ gr.Interface(
                 "zh-cn",
             ],
             max_choices=1,
-            value="en",
         ),
         gr.Audio(
             label="Reference Audio",

 model_names = TTS().list_models()
 m = model_names[0]
 print(model_names)
+tts = TTS(m, gpu=False)
+tts.to("cpu") # no GPU or Amd
 #tts.to("cuda") # cuda only
 def predict(prompt, language, audio_file_pth, mic_file_path, use_mic, agree):
                     None,
                     None,
                 )
+        if len(prompt)>10000:
             gr.Warning("Text length limited to 200 characters for this demo, please try shorter text")
             return (
                     None,
                 speaker_wav=speaker_wav,
                 language=language
             )
         except RuntimeError as e :
             if "device-assert" in str(e):
                 # cannot do anything on a CUDA device-side error; need to restart
             )
+title = "Coqui XTTS Glz's remake"
 description = """
 <a href="https://huggingface.co/coqui/XTTS-v1">XTTS</a> is a Voice generation model that lets you clone voices into different languages by using just a quick 3-second audio clip.
         gr.Textbox(
             label="Text Prompt",
             info="One or two sentences at a time is better",
+            value="Hello, World !, here is an example of light voice clonaaning. Try your best to upload quality audio",
         ),
         gr.Dropdown(
             label="Language",
                 "zh-cn",
             ],
             max_choices=1,
+            value="fr",
         ),
         gr.Audio(
             label="Reference Audio",