yuvscherbatov
committed on
Commit
·
665125d
1
Parent(s):
e2334e5
Upload app.py
Browse files
app.py
CHANGED
@@ -23,7 +23,7 @@ translation_pipe = pipeline("translation", model="facebook/wmt19-en-ru")
|
|
23 |
|
24 |
#rus text to rus speech transformation
|
25 |
vits_model = VitsModel.from_pretrained("facebook/mms-tts-rus")
|
26 |
-
|
27 |
|
28 |
def transform_audio_to_speech_en(audio):
|
29 |
outputs = asr_pipe(audio, max_new_tokens=256, generate_kwargs={"task": "translate"})
|
@@ -35,7 +35,7 @@ def translator(text):
|
|
35 |
|
36 |
def synthesise(translated_text):
|
37 |
translated_text = translator(translated_text)
|
38 |
-
inputs =
|
39 |
with torch.no_grad():
|
40 |
speech = vits_model(**inputs).waveform
|
41 |
return speech.cpu()
|
|
|
23 |
|
24 |
#rus text to rus speech transformation
|
25 |
vits_model = VitsModel.from_pretrained("facebook/mms-tts-rus")
|
26 |
+
vits_tokenizer = VitsTokenizer.from_pretrained("facebook/mms-tts-rus")
|
27 |
|
28 |
def transform_audio_to_speech_en(audio):
|
29 |
outputs = asr_pipe(audio, max_new_tokens=256, generate_kwargs={"task": "translate"})
|
|
|
35 |
|
36 |
def synthesise(translated_text):
|
37 |
translated_text = translator(translated_text)
|
38 |
+
inputs = vits_tokenizer(translated_text, return_tensors="pt")
|
39 |
with torch.no_grad():
|
40 |
speech = vits_model(**inputs).waveform
|
41 |
return speech.cpu()
|