yuvscherbatov committed on
Commit
665125d
·
1 Parent(s): e2334e5

Upload app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -23,7 +23,7 @@ translation_pipe = pipeline("translation", model="facebook/wmt19-en-ru")
23
 
24
  #rus text to rus speech transformation
25
  vits_model = VitsModel.from_pretrained("facebook/mms-tts-rus")
26
- vits_tokanizer = tokenizer = VitsTokenizer.from_pretrained("facebook/mms-tts-rus")
27
 
28
  def transform_audio_to_speech_en(audio):
29
  outputs = asr_pipe(audio, max_new_tokens=256, generate_kwargs={"task": "translate"})
@@ -35,7 +35,7 @@ def translator(text):
35
 
36
  def synthesise(translated_text):
37
  translated_text = translator(translated_text)
38
- inputs = vits_tokanizer(translated_text, return_tensors="pt")
39
  with torch.no_grad():
40
  speech = vits_model(**inputs).waveform
41
  return speech.cpu()
 
23
 
24
  #rus text to rus speech transformation
25
  vits_model = VitsModel.from_pretrained("facebook/mms-tts-rus")
26
+ vits_tokenizer = VitsTokenizer.from_pretrained("facebook/mms-tts-rus")
27
 
28
  def transform_audio_to_speech_en(audio):
29
  outputs = asr_pipe(audio, max_new_tokens=256, generate_kwargs={"task": "translate"})
 
35
 
36
  def synthesise(translated_text):
37
  translated_text = translator(translated_text)
38
+ inputs = vits_tokenizer(translated_text, return_tensors="pt")
39
  with torch.no_grad():
40
  speech = vits_model(**inputs).waveform
41
  return speech.cpu()