Spaces:

Gregniuki
/

Pipertts

Running

App Files Community

Gregniuki committed on Oct 3, 2023

Commit

09b7ce7

1 Parent(s): 34b4e53

Update app.py

Browse files

Files changed (1) hide show

app.py +9 -7

app.py CHANGED Viewed

@@ -91,8 +91,8 @@ def detect_onnx_models(path):
     else:
         return None
-#@app.post("/synthesize")
-@app.post("/synthesize", response_class=FileResponse)
 async def main(
     request: Request,
     text_input: str = Form(...),
@@ -189,10 +189,9 @@ async def main(
         inferencing(model, config, sid, text, rate, noise_scale, noise_scale_w, auto_play)
         # Save the audio as a temporary WAV file
-    temp_audio_path = os.path.join(tempfile.gettempdir(), "generated_audio.wav")
-    sf.write(temp_audio_path, merged_audio, config["audio"]["sample_rate"])
-    return FileResponse(temp_audio_path)
-#    return {"message": f"Text to synthesize: {text_input}, Speed: {speed_slider}, Play: {play}"}
 def load_onnx(model, sess_options, providers = ["CPUExecutionProvider"]):
     _LOGGER.debug("Loading model from %s", model)
@@ -242,6 +241,7 @@ def phonemes_to_ids(config, phonemes: List[str]) -> List[int]:
     ids.extend(id_map[EOS])
     return ids
 def inferencing(model, config, sid, line, length_scale = 1, noise_scale = 0.667, noise_scale_w = 0.8, auto_play=True):
     audios = []
     if config["phoneme_type"] == "PhonemeType.ESPEAK":
@@ -276,7 +276,9 @@ def inferencing(model, config, sid, line, length_scale = 1, noise_scale = 0.667,
         audios.append(audio)
     merged_audio = np.concatenate(audios)
     sample_rate = config["audio"]["sample_rate"]
     # Return the audio file as a FastAPI response
   #  display(Markdown(f"{line}"))
    # display(Audio(merged_audio, rate=sample_rate, autoplay=auto_play))

     else:
         return None
+@app.post("/synthesize")
+#@app.post("/synthesize", response_class=FileResponse)
 async def main(
     request: Request,
     text_input: str = Form(...),
         inferencing(model, config, sid, text, rate, noise_scale, noise_scale_w, auto_play)
         # Save the audio as a temporary WAV file
+    return {"message": "Post request received", "data": data}
+  #  return {"message": f"Text to synthesize: {text_input}, Speed: {speed_slider}, Play: {play}"}
 def load_onnx(model, sess_options, providers = ["CPUExecutionProvider"]):
     _LOGGER.debug("Loading model from %s", model)
     ids.extend(id_map[EOS])
     return ids
+@app.get(generate_audio)
 def inferencing(model, config, sid, line, length_scale = 1, noise_scale = 0.667, noise_scale_w = 0.8, auto_play=True):
     audios = []
     if config["phoneme_type"] == "PhonemeType.ESPEAK":
         audios.append(audio)
     merged_audio = np.concatenate(audios)
     sample_rate = config["audio"]["sample_rate"]
+    temp_audio_path = os.path.join(tempfile.gettempdir(), "generated_audio.wav")
+    sf.write(temp_audio_path, merged_audio, config["audio"]["sample_rate"])
+    return FileResponse(temp_audio_path)
     # Return the audio file as a FastAPI response
   #  display(Markdown(f"{line}"))
    # display(Audio(merged_audio, rate=sample_rate, autoplay=auto_play))