yoshipon0520
committed on
Commit
·
6d5b0af
1
Parent(s):
d161ea3
Upload 2 files
Browse files
- config.yaml +101 -0
- version_0/checkpoints/last.ckpt +3 -0
config.yaml
ADDED
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
base_config: ${base_config_path}/train_ddp.yaml
|
2 |
+
|
3 |
+
sr: 16000
|
4 |
+
n_fft: 512
|
5 |
+
hop_length: 160
|
6 |
+
|
7 |
+
n_mic: 8
|
8 |
+
n_src: 6
|
9 |
+
dim_latent: 64
|
10 |
+
|
11 |
+
autocast: True
|
12 |
+
|
13 |
+
trainer:
|
14 |
+
max_epochs: 200
|
15 |
+
gradient_clip_val: 5.0
|
16 |
+
sync_batchnorm: True
|
17 |
+
|
18 |
+
precision: 16-mixed
|
19 |
+
|
20 |
+
benchmark: True
|
21 |
+
use_distributed_sampler: False
|
22 |
+
|
23 |
+
callbacks:
|
24 |
+
- _target_: lightning.pytorch.callbacks.ModelCheckpoint
|
25 |
+
filename: "{epoch:04d}"
|
26 |
+
save_last: True
|
27 |
+
save_top_k: -1
|
28 |
+
|
29 |
+
- _target_: lightning.pytorch.callbacks.RichProgressBar
|
30 |
+
refresh_rate: 5
|
31 |
+
|
32 |
+
- _target_: lightning.pytorch.callbacks.RichModelSummary
|
33 |
+
max_depth: 3
|
34 |
+
|
35 |
+
- _target_: neural_fcasa.callbacks.cyclic_annealer.CyclicAnnealerCallback
|
36 |
+
name: beta
|
37 |
+
cycle: 10
|
38 |
+
max_value: 1.0
|
39 |
+
ini_period: 50
|
40 |
+
ini_max_value: 1.0
|
41 |
+
|
42 |
+
- _target_: neural_fcasa.callbacks.visualizer.VisualizerCallback
|
43 |
+
|
44 |
+
dataset_name: chunk.derev-hop${hop_length}
|
45 |
+
datamodule:
|
46 |
+
_target_: neural_fcasa.datamodules.hdf5_wavact_datamodule.DataModule
|
47 |
+
train_dataset_path: ${working_directory}/../../hdf5/${dataset_name}-tr.hdf5
|
48 |
+
val_dataset_path: ${working_directory}/../../hdf5/${dataset_name}-cv.hdf5
|
49 |
+
batch_size: 2
|
50 |
+
duration: 10
|
51 |
+
sr: ${sr}
|
52 |
+
hop_length: ${hop_length}
|
53 |
+
|
54 |
+
task:
|
55 |
+
_target_: neural_fcasa.tasks.avi_scl_allsort_task.AVITask
|
56 |
+
n_fft: ${n_fft}
|
57 |
+
hop_length: ${hop_length}
|
58 |
+
n_src: ${n_src}
|
59 |
+
beta: 1.0
|
60 |
+
gamma: 1.0
|
61 |
+
|
62 |
+
encoder:
|
63 |
+
_target_: neural_fcasa.encoders.resepformer_encoder.RESepFormerEncoder
|
64 |
+
n_fft: ${n_fft}
|
65 |
+
n_mic: ${n_mic}
|
66 |
+
n_src: ${n_src}
|
67 |
+
dim_latent: ${dim_latent}
|
68 |
+
chunk_size: 100
|
69 |
+
step_size: 100
|
70 |
+
d_model: 256
|
71 |
+
dim_feedforward: 1024
|
72 |
+
n_blocks: 8
|
73 |
+
norm_first: True
|
74 |
+
autocast: ${autocast}
|
75 |
+
|
76 |
+
diagonalizer:
|
77 |
+
_target_: neural_fcasa.diagonalizers.iss_nrmxt_diagonalizer.ISSDiagonalizer
|
78 |
+
eps: 1.e-4
|
79 |
+
n_iter: 2
|
80 |
+
|
81 |
+
spec_aug:
|
82 |
+
_target_: torchaudio.transforms.SpecAugment
|
83 |
+
n_time_masks: 2
|
84 |
+
time_mask_param: 64
|
85 |
+
n_freq_masks: 2
|
86 |
+
freq_mask_param: 20
|
87 |
+
zero_masking: True
|
88 |
+
|
89 |
+
decoder:
|
90 |
+
_target_: neural_fcasa.decoders.res_lin_decoder.Decoder
|
91 |
+
n_fft: ${n_fft}
|
92 |
+
dim_latent: ${dim_latent}
|
93 |
+
dim_latent_noi: 10
|
94 |
+
|
95 |
+
optimizer_config:
|
96 |
+
_target_: aiaccel.torch.lightning.OptimizerConfig
|
97 |
+
optimizer_generator:
|
98 |
+
_partial_: True
|
99 |
+
_target_: torch.optim.AdamW
|
100 |
+
lr: 1.e-4
|
101 |
+
weight_decay: 1.e-5
|
version_0/checkpoints/last.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bd409f8ae01b3b66fc28a4d203ebe280cb2faef0d18aff59c450903f022534c7
|
3 |
+
size 331573975
|