TTS-Spaces-Arena

Running

App Files Community

Pendrokar committed 22 days ago

Commit

75485ec

•

1 Parent(s): 2dfe855

F5 TTS API nfe_slider param fix

Browse files

Files changed (2) hide show

app.py +7 -6
test_tts_e2_f5_f5.py +1 -0

app.py CHANGED Viewed

@@ -427,7 +427,8 @@ OVERRIDE_INPUTS = {
 		1: DEFAULT_VOICE_TRANSCRIPT, # transcript of sample (< 15 seconds required)
 		3: False, # cleanup silence
         4: 0.15, #crossfade
-        5: 1, #speed
     },
     # IMS-Toucan
@@ -1135,7 +1136,7 @@ def synthandreturn(text, request: gr.Request):
                         # assume the index is one of the first 9 return params
                         return_audio_index = int(HF_SPACES[model]['return_audio_index'])
                         endpoints = mdl_space.view_api(all_endpoints=True, print_info=False, return_format='dict')
                         api_name = None
                         fn_index = None
                         end_parameters = None
@@ -1143,7 +1144,7 @@ def synthandreturn(text, request: gr.Request):
                         if '/' == HF_SPACES[model]['function'][0]:
                             # audio sync function name
                             api_name = HF_SPACES[model]['function']
                             end_parameters = _get_param_examples(
                                 endpoints['named_endpoints'][api_name]['parameters']
                             )
@@ -1151,7 +1152,7 @@ def synthandreturn(text, request: gr.Request):
                         else:
                             # endpoint index is the first character
                             fn_index = int(HF_SPACES[model]['function'])
                             end_parameters = _get_param_examples(
                                 endpoints['unnamed_endpoints'][str(fn_index)]['parameters']
                             )
@@ -1248,7 +1249,7 @@ def synthandreturn(text, request: gr.Request):
             pass
         return inputs
     def _cache_sample(text, model):
         # skip caching if not hardcoded sentence
         if (text not in sents):
@@ -1310,7 +1311,7 @@ def synthandreturn(text, request: gr.Request):
         # cache the result
         for model in [mdl1k, mdl2k]:
             _cache_sample(text, model)
     #debug
     # print(results)
     # print(list(results.keys())[0])

 		1: DEFAULT_VOICE_TRANSCRIPT, # transcript of sample (< 15 seconds required)
 		3: False, # cleanup silence
         4: 0.15, #crossfade
+        5: 32, #nfe_slider
+        6: 1, #speed
     },
     # IMS-Toucan
                         # assume the index is one of the first 9 return params
                         return_audio_index = int(HF_SPACES[model]['return_audio_index'])
                         endpoints = mdl_space.view_api(all_endpoints=True, print_info=False, return_format='dict')
                         api_name = None
                         fn_index = None
                         end_parameters = None
                         if '/' == HF_SPACES[model]['function'][0]:
                             # audio sync function name
                             api_name = HF_SPACES[model]['function']
                             end_parameters = _get_param_examples(
                                 endpoints['named_endpoints'][api_name]['parameters']
                             )
                         else:
                             # endpoint index is the first character
                             fn_index = int(HF_SPACES[model]['function'])
                             end_parameters = _get_param_examples(
                                 endpoints['unnamed_endpoints'][str(fn_index)]['parameters']
                             )
             pass
         return inputs
     def _cache_sample(text, model):
         # skip caching if not hardcoded sentence
         if (text not in sents):
         # cache the result
         for model in [mdl1k, mdl2k]:
             _cache_sample(text, model)
     #debug
     # print(results)
     # print(list(results.keys())[0])

test_tts_e2_f5_f5.py CHANGED Viewed

@@ -9,6 +9,7 @@ result = client.predict(
 		gen_text_input="Please surprise me and speak in whatever voice you enjoy.",
 		remove_silence=False,
 		cross_fade_duration_slider=0.15,
 		speed_slider=1,
 		api_name="/basic_tts",
 )

 		gen_text_input="Please surprise me and speak in whatever voice you enjoy.",
 		remove_silence=False,
 		cross_fade_duration_slider=0.15,
+		nfe_slider=32,
 		speed_slider=1,
 		api_name="/basic_tts",
 )