Spaces:

AlexK-PL
/

vits-v2-8khz-inference

Runtime error

App Files Community

AlexK-PL committed on Jan 18, 2024

Commit

c8797aa

verified ·

1 Parent(s): b0910d2

Update app.py

Browse files

Files changed (1) hide show

app.py +19 -10

app.py CHANGED Viewed

@@ -57,17 +57,17 @@ commonvoice_speakers = [s for s in speakers_list if len(s) > 20]  #
 DEFAULT_SPEAKER_ID = os.environ.get("DEFAULT_SPEAKER_ID", default="pau")
 DEFAULT_CHECKPOINT = os.environ.get("DEFAULT_CHECKPOINT", default=model_files[0])
-model_file = model_files[0]  # change this!!
-model_path = os.path.join(os.getcwd(), model_file)
-config_path = "config.json"
 vocoder_path = None
 vocoder_config_path = None
-synthesizer = Synthesizer(
-    model_path, config_path, speakers_path, None, vocoder_path, vocoder_config_path,
-)
 def get_phonetic_transcription(text: str):
@@ -85,7 +85,16 @@ def get_phonetic_transcription(text: str):
         return None
-def tts_inference(text: str, speaker_idx: str = None):
     # synthesize
     if synthesizer is None:
         raise NameError("model not found")
@@ -113,11 +122,11 @@ description = """
 """
-def submit_input(input_, speaker_id):
     output_audio = None
     output_phonetic = None
     if input_ is not None and len(input_) < MAX_INPUT_TEXT_LEN:
-        output_audio = tts_inference(input_, speaker_id)
         output_phonetic = get_phonetic_transcription(input_)
     else:
         gr.Warning(f"Your text exceeds the {MAX_INPUT_TEXT_LEN}-character limit.")
@@ -196,7 +205,7 @@ with gr.Blocks(**AinaGradioTheme().get_kwargs()) as app:
         input_.change(fn=change_interactive, inputs=[input_], outputs=button)
     # clear_btn.click(fn=clean, inputs=[], outputs=[input_, output_audio, output_phonetic], queue=False)
-    submit_btn.click(fn=submit_input, inputs=[input_, speaker_id], outputs=[output_audio, output_phonetic])
 app.queue(concurrency_count=1, api_open=False)
 app.launch(show_api=False, server_name="0.0.0.0", server_port=7860)

 DEFAULT_SPEAKER_ID = os.environ.get("DEFAULT_SPEAKER_ID", default="pau")
 DEFAULT_CHECKPOINT = os.environ.get("DEFAULT_CHECKPOINT", default=model_files[0])
+# model_file = model_files[0]  # change this!!
+# model_path = os.path.join(os.getcwd(), model_file)
+# config_path = os.path.join(os.getcwd(), "config.json")
 vocoder_path = None
 vocoder_config_path = None
+# synthesizer = Synthesizer(
+#     model_path, config_path, speakers_path, None, vocoder_path, vocoder_config_path,
+# )
 def get_phonetic_transcription(text: str):
         return None
+def tts_inference(text: str, speaker_idx: str = None, model_file: str=None):
+    model_path = os.path.join(os.getcwd(), model_file)
+    speakers_file_path = "speakers.pth"
+    config_path = "config.json"
+    vocoder_path = None
+    vocoder_config_path = None
+    synthesizer = Synthesizer(model_path, config_path, speakers_path, None,
+                              vocoder_path, vocoder_config_path)
     # synthesize
     if synthesizer is None:
         raise NameError("model not found")
 """
+def submit_input(input_, speaker_id, model_chkpt):
     output_audio = None
     output_phonetic = None
     if input_ is not None and len(input_) < MAX_INPUT_TEXT_LEN:
+        output_audio = tts_inference(input_, speaker_id, model_chkpt)
         output_phonetic = get_phonetic_transcription(input_)
     else:
         gr.Warning(f"Your text exceeds the {MAX_INPUT_TEXT_LEN}-character limit.")
         input_.change(fn=change_interactive, inputs=[input_], outputs=button)
     # clear_btn.click(fn=clean, inputs=[], outputs=[input_, output_audio, output_phonetic], queue=False)
+    submit_btn.click(fn=submit_input, inputs=[input_, speaker_id, model_chkpt], outputs=[output_audio, output_phonetic])
 app.queue(concurrency_count=1, api_open=False)
 app.launch(show_api=False, server_name="0.0.0.0", server_port=7860)