format
Browse files
README.md
CHANGED
@@ -19,9 +19,9 @@ tags:
|
|
19 |
# Affective TTS / SoundScapes
|
20 |
|
21 |
- [SHIFT TTS tool](https://github.com/audeering/shift)
|
22 |
-
- Analysis of emotionality [#1](https://huggingface.co/dkounadis/artificial-styletts2/discussions/2)
|
23 |
-
- Soundscapes `trees, water,
|
24 |
-
- `landscape2soundscape.py`
|
25 |
|
26 |
## Available Voices
|
27 |
|
@@ -29,16 +29,16 @@ tags:
|
|
29 |
|
30 |
## Flask API
|
31 |
|
32 |
-
|
33 |
-
```
|
34 |
-
git clone https://huggingface.co/dkounadis/artificial-styletts2
|
35 |
-
```
|
36 |
-
|
37 |
<details>
|
38 |
<summary>
|
39 |
Create virtualenv
|
40 |
</summary>
|
41 |
|
|
|
|
|
|
|
|
|
|
|
42 |
```
|
43 |
virtualenv --python=python3 ~/.envs/.my_env
|
44 |
source ~/.envs/.my_env/bin/activate
|
@@ -46,7 +46,6 @@ cd artificial-styletts2/
|
|
46 |
pip install -r requirements.txt
|
47 |
```
|
48 |
|
49 |
-
|
50 |
</details>
|
51 |
|
52 |
Start Flask
|
@@ -57,7 +56,7 @@ CUDA_DEVICE_ORDER=PCI_BUS_ID HF_HOME=./hf_home CUDA_VISIBLE_DEVICES=2 python api
|
|
57 |
|
58 |
## Landscape 2 Soundscape
|
59 |
|
60 |
-
The following needs `api.py` to be already running
|
61 |
|
62 |
```python
|
63 |
# TTS & soundscape - overlay to .mp4
|
|
|
19 |
# Affective TTS / SoundScapes
|
20 |
|
21 |
- [SHIFT TTS tool](https://github.com/audeering/shift)
|
22 |
+
- Analysis of TTS emotionality [#1](https://huggingface.co/dkounadis/artificial-styletts2/discussions/2)
|
23 |
+
- Soundscapes `trees, water, ..` via [AudioGen](https://huggingface.co/dkounadis/artificial-styletts2/discussions/3)
|
24 |
+
- `landscape2soundscape.py` - overlays TTS & sound onto a still image and creates a video
|
25 |
|
26 |
## Available Voices
|
27 |
|
|
|
29 |
|
30 |
## Flask API
|
31 |
|
|
|
|
|
|
|
|
|
|
|
32 |
<details>
|
33 |
<summary>
|
34 |
Create virtualenv
|
35 |
</summary>
|
36 |
|
37 |
+
|
38 |
+
```
|
39 |
+
git clone https://huggingface.co/dkounadis/artificial-styletts2
|
40 |
+
```
|
41 |
+
|
42 |
```
|
43 |
virtualenv --python=python3 ~/.envs/.my_env
|
44 |
source ~/.envs/.my_env/bin/activate
|
|
|
46 |
pip install -r requirements.txt
|
47 |
```
|
48 |
|
|
|
49 |
</details>
|
50 |
|
51 |
Start Flask
|
|
|
56 |
|
57 |
## Landscape 2 Soundscape
|
58 |
|
59 |
+
The following needs `api.py` to already be running in a tmux session.
|
60 |
|
61 |
```python
|
62 |
# TTS & soundscape - overlay to .mp4
|
demo.py
CHANGED
@@ -4,7 +4,7 @@ import numpy as np
|
|
4 |
|
5 |
print('\n\n\n\n___________________')
|
6 |
|
7 |
-
txt = '
|
8 |
|
9 |
sound_generator = AudioGen.get_pretrained('facebook/audiogen-medium')
|
10 |
sound_generator.set_generation_params(duration=1) # why is generating so long at 14 seconds
|
@@ -12,4 +12,4 @@ sound_generator.set_generation_params(duration=1) # why is generating so long
|
|
12 |
x = sound_generator.generate([txt])[0].detach().cpu().numpy()[0, :]
|
13 |
x /= np.abs(x).max() + 1e-7
|
14 |
|
15 |
-
audiofile.write('
|
|
|
4 |
|
5 |
print('\n\n\n\n___________________')
|
6 |
|
7 |
+
txt = 'car'
|
8 |
|
9 |
sound_generator = AudioGen.get_pretrained('facebook/audiogen-medium')
|
10 |
sound_generator.set_generation_params(duration=1) # why is generating so long at 14 seconds
|
|
|
12 |
x = sound_generator.generate([txt])[0].detach().cpu().numpy()[0, :]
|
13 |
x /= np.abs(x).max() + 1e-7
|
14 |
|
15 |
+
audiofile.write('_audio1_.wav', x, 16000)
|