dkounadis
/

artificial-styletts2

@@ -42,7 +42,7 @@ Beta version of [SHIFT](https://shift-europe.eu/) TTS tool with [AudioGen sounds
 Build virtualenv & run api.py
 </summary>
-Above `demo.py` is a standalone script that loads SHIFT TTS & AudioGen model(s) and synthesizes a txt. We also provide a Flask `api.py` that allows faster inference with
 loading only once the TTS & AudioGen model.
 Clone

 Build virtualenv & run api.py
 </summary>
+The [TTS Demo](https://huggingface.co/dkounadis/artificial-styletts2/blob/main/demo.py) above is a standalone script that loads the SHIFT TTS & AudioGen model(s) and synthesizes a txt file. We also provide a Flask `api.py` that allows faster inference by
 loading the TTS & AudioGen models only once.
 Clone

landscape2soundscape.py CHANGED Viewed

@@ -2,7 +2,7 @@ import numpy as np
 import subprocess
 import cv2
-# with subprocess and an extra argument 'scene' and a 'resized image saved as png' we can call the server
 # yt-dlp is installed in .d4
 # Download Part of Video
 # yt-dlp https://www.youtube.com/watch?v=UZ9uyQI3pF0 --downloader ffmpeg --downloader-args "ffmpeg_i:-ss 997 -to 2512"
@@ -47,7 +47,7 @@ DESCRIPTIONS = [
         '01_Schick_AII840_001.txt',                               # text
         'statue in shire, hill river, vogels.',                  # audiocraft
         'G. Schick, Bildnis der Heinrike Dannecker, 1802', # cv2 puttext title
-        'en_UK/apope_low', #'en_US/m-ailabs_low#judy_bieber', #'en_US/m-ailabs_low#mary_ann',
      ],
     # 2
     [
@@ -69,7 +69,7 @@ DESCRIPTIONS = [
     [
         '04_Friedrich_FV317_001.jpg',
         '04_Friedrich_FV317_001.txt',
-        'Land steppes',
         'C. D. Friedrich, Der Watzmann, 1824',
         'en_US/m-ailabs_low#mary_ann',
     ],
@@ -146,7 +146,7 @@ SILENT_VIDEO = '_silent_video.mp4'
 # SILENT CLIP
-for img, text, scene, title, voice in DESCRIPTIONS[2:4]:
@@ -185,7 +185,7 @@ for img, text, scene, title, voice in DESCRIPTIONS[2:4]:
              "tts.py",
              "--text", PIC_DIR + text,
              '--image', '_tmp_banner.png',
-             '--scene', scene,
              '--voice', voice,
              '--out_file', OUT_FILE,  # save to correct location is handled in client
                 ])

 import subprocess
 import cv2
+# Using subprocess with an extra 'soundscape' argument and a resized image saved as png, we can call the server
 # yt-dlp is installed in .d4
 # Download Part of Video
 # yt-dlp https://www.youtube.com/watch?v=UZ9uyQI3pF0 --downloader ffmpeg --downloader-args "ffmpeg_i:-ss 997 -to 2512"
         '01_Schick_AII840_001.txt',                               # text
         'statue in shire, hill river, vogels.',                  # audiocraft
         'G. Schick, Bildnis der Heinrike Dannecker, 1802', # cv2 puttext title
+        'en_US/vctk_low#p326', #'en_US/m-ailabs_low#judy_bieber', #'en_US/m-ailabs_low#mary_ann',
      ],
     # 2
     [
     [
         '04_Friedrich_FV317_001.jpg',
         '04_Friedrich_FV317_001.txt',
+        'mountain wind',
         'C. D. Friedrich, Der Watzmann, 1824',
         'en_US/m-ailabs_low#mary_ann',
     ],
 # SILENT CLIP
+for img, text, soundscape, title, voice in DESCRIPTIONS[2:4]:
              "tts.py",
              "--text", PIC_DIR + text,
              '--image', '_tmp_banner.png',
+             '--soundscape', soundscape,
              '--voice', voice,
              '--out_file', OUT_FILE,  # save to correct location is handled in client
                 ])