Voice / app.py
TheMaisk's picture
Update app.py
41d76e7 verified
raw
history blame
1.22 kB
import subprocess
import sys
import tempfile

import gradio as gr
import torch
from TTS.api import TTS
# Best-effort run of `setup.py install --user`. A failure is reported on
# stdout and the script keeps going.
try:
    # sys.executable is the interpreter running this script; a bare "python"
    # is resolved through PATH and may be a different interpreter or absent.
    subprocess.run(
        [sys.executable or 'python', 'setup.py', 'install', '--user'],
        check=True,
    )
except (subprocess.CalledProcessError, OSError) as e:
    # CalledProcessError: the command exited with a non-zero status.
    # OSError: the process could not be started at all.
    print(f"Installation failed with error: {e}")
else:
    print("Installation successful.")
# Pick the compute device: "cuda" when torch reports CUDA support, else "cpu".
if torch.cuda.is_available():
    device = "cuda"
else:
    device = "cpu"

# Instantiate TTS with the xtts_v2 model name, then move it to the device.
tts = TTS("tts_models/multilingual/multi-dataset/xtts_v2")
tts = tts.to(device)
def voice_clone(text: str, speaker_wav: str, language: str) -> str:
    """Synthesize ``text`` using ``speaker_wav`` as the voice reference.

    Args:
        text: The text to synthesize.
        speaker_wav: Reference audio, forwarded to ``tts.tts_to_file`` as
            ``speaker_wav``.
        language: Language code, forwarded to ``tts.tts_to_file``.

    Returns:
        Path of the generated ``.wav`` file. Each call writes to its own
        temporary file, so overlapping requests cannot overwrite each
        other's output.

    Raises:
        gr.Error: If the text is blank, or no reference audio or language
            was supplied.
    """
    # Report missing inputs with a clear message before invoking the model.
    if not text or not text.strip():
        raise gr.Error("Please enter the text to synthesize.")
    if not speaker_wav:
        raise gr.Error("Please upload a reference audio file.")
    if not language:
        raise gr.Error("Please select a language.")

    print("Speaker wav:", speaker_wav)

    # Reserve a unique output path. The handle is closed before synthesis so
    # the file can be reopened for writing on every platform; delete=False
    # keeps the file on disk after the handle is closed.
    with tempfile.NamedTemporaryFile(suffix=".wav", delete=False) as handle:
        output_path = handle.name

    tts.tts_to_file(
        text=text,
        speaker_wav=speaker_wav,
        language=language,
        file_path=output_path,
    )
    return output_path
# Input widgets, listed in the same order as voice_clone's parameters.
text_input = gr.Textbox(lines=2, placeholder="Enter the text...", label="Text")
speaker_input = gr.Audio(type="filepath", label="Upload audio file")
language_input = gr.Radio(
    [
        'ru', 'en', 'zh-cn', 'ja', 'de', 'fr', 'it', 'pt',
        'pl', 'tr', 'ko', 'nl', 'cs', 'ar', 'es', 'hu',
    ],
    label="language",
)

# Output widget that receives the file path returned by voice_clone.
audio_output = gr.Audio(type="filepath", label="Generated audio file")

# Wire the widgets to voice_clone and apply the named theme.
iface = gr.Interface(
    fn=voice_clone,
    inputs=[text_input, speaker_input, language_input],
    outputs=audio_output,
    title="Voice Cloning",
    theme="syddharth/gray-minimal",
)

# Start the web UI.
iface.launch()