thanks to advimman ❤
Browse files- big-lama-with-discr/config.yaml +159 -0
- big-lama-with-discr/models/best.ckpt +3 -0
- big-lama/config.yaml +157 -0
- big-lama/models/best.ckpt +3 -0
- lama-celeba-hq-pl-abl/lama-no-pl/config.yaml +122 -0
- lama-celeba-hq-pl-abl/lama-no-pl/models/best.ckpt +3 -0
- lama-celeba-hq/ lama-regular/config.yaml +123 -0
- lama-celeba-hq/ lama-regular/models/best.ckpt +3 -0
- lama-celeba-hq/lama-deep/config.yaml +123 -0
- lama-celeba-hq/lama-deep/models/best.ckpt +3 -0
- lama-celeba-hq/lama-dilated/config.yaml +127 -0
- lama-celeba-hq/lama-dilated/models/best.ckpt +3 -0
- lama-celeba-hq/lama-fourier-shallow/config.yaml +134 -0
- lama-celeba-hq/lama-fourier-shallow/models/best.ckpt +3 -0
- lama-celeba-hq/lama-fourier/config.yaml +134 -0
- lama-celeba-hq/lama-fourier/models/best.ckpt +3 -0
- lama-celeba-hq/lama_small_train_masks/config.yaml +123 -0
- lama-celeba-hq/lama_small_train_masks/models/best.ckpt +3 -0
- lama-pl-abl/aashukha_2021-08-16_21-52-12_train_ablv2_work_no_segmpl_csirpl_csirpl03_fixed/config.yaml +130 -0
- lama-pl-abl/aashukha_2021-08-16_21-52-12_train_ablv2_work_no_segmpl_csirpl_csirpl03_fixed/models/best.ckpt +3 -0
- lama-pl-abl/e.logacheva_2021-10-04_00-15-00_train_ablv2_work_no_segmpl_csdilirpl_csdilirpl1_new/config.yaml +130 -0
- lama-pl-abl/e.logacheva_2021-10-04_00-15-00_train_ablv2_work_no_segmpl_csdilirpl_csdilirpl1_new/models/best.ckpt +3 -0
- lama-pl-abl/e.logacheva_2021-10-04_00-15-00_train_ablv2_work_no_segmpl_vgg_l2_vgg003_new/config.yaml +130 -0
- lama-pl-abl/e.logacheva_2021-10-04_00-15-00_train_ablv2_work_no_segmpl_vgg_l2_vgg003_new/models/best.ckpt +3 -0
- lama-places/big-lama-regular/config.yaml +129 -0
- lama-places/big-lama-regular/models/best.ckpt +3 -0
- lama-places/lama-dilated/config.yaml +133 -0
- lama-places/lama-dilated/models/best.ckpt +3 -0
- lama-places/lama-fourier/config.yaml +142 -0
- lama-places/lama-fourier/models/best.ckpt +3 -0
- lama-places/lama-fourier/models/last.ckpt +3 -0
- lama-places/lama-regular/config.yaml +130 -0
- lama-places/lama-regular/models/best.ckpt +3 -0
- lama-places/lama_small_train_masks/config.yaml +130 -0
- lama-places/lama_small_train_masks/models/best.ckpt +3 -0
big-lama-with-discr/config.yaml
ADDED
@@ -0,0 +1,159 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
run_title: b18_ffc075_batch8x15
|
2 |
+
training_model:
|
3 |
+
kind: default
|
4 |
+
visualize_each_iters: 1000
|
5 |
+
concat_mask: true
|
6 |
+
store_discr_outputs_for_vis: true
|
7 |
+
losses:
|
8 |
+
l1:
|
9 |
+
weight_missing: 0
|
10 |
+
weight_known: 10
|
11 |
+
perceptual:
|
12 |
+
weight: 0
|
13 |
+
adversarial:
|
14 |
+
kind: r1
|
15 |
+
weight: 10
|
16 |
+
gp_coef: 0.001
|
17 |
+
mask_as_fake_target: true
|
18 |
+
allow_scale_mask: true
|
19 |
+
feature_matching:
|
20 |
+
weight: 100
|
21 |
+
segm_pl:
|
22 |
+
weight: 30
|
23 |
+
weights_path: ${env:TORCH_HOME}
|
24 |
+
depth_pl:
|
25 |
+
weight: 0
|
26 |
+
use_features: true
|
27 |
+
optimizers:
|
28 |
+
generator:
|
29 |
+
kind: adam
|
30 |
+
lr: 0.001
|
31 |
+
discriminator:
|
32 |
+
kind: adam
|
33 |
+
lr: 0.0001
|
34 |
+
visualizer:
|
35 |
+
key_order:
|
36 |
+
- image
|
37 |
+
- predicted_image
|
38 |
+
- discr_output_fake
|
39 |
+
- discr_output_real
|
40 |
+
- inpainted
|
41 |
+
rescale_keys:
|
42 |
+
- discr_output_fake
|
43 |
+
- discr_output_real
|
44 |
+
kind: directory
|
45 |
+
outdir: /group-volume/User-Driven-Content-Generation/r.suvorov/inpainting/experiments/r.suvorov_2021-04-30_14-41-12_train_simple_pix2pix2_gap_sdpl_novgg_large_b18_ffc075_batch8x15/samples
|
46 |
+
location:
|
47 |
+
data_root_dir: /group-volume/User-Driven-Content-Generation/datasets/inpainting_data_root_large
|
48 |
+
out_root_dir: /group-volume/User-Driven-Content-Generation/${env:USER}/inpainting/experiments
|
49 |
+
tb_dir: /group-volume/User-Driven-Content-Generation/${env:USER}/inpainting/tb_logs
|
50 |
+
data:
|
51 |
+
batch_size: 15
|
52 |
+
val_batch_size: 2
|
53 |
+
num_workers: 3
|
54 |
+
train:
|
55 |
+
indir: ${location.data_root_dir}/train
|
56 |
+
out_size: 256
|
57 |
+
mask_gen_kwargs:
|
58 |
+
irregular_proba: 1
|
59 |
+
irregular_kwargs:
|
60 |
+
max_angle: 4
|
61 |
+
max_len: 200
|
62 |
+
max_width: 100
|
63 |
+
max_times: 5
|
64 |
+
min_times: 1
|
65 |
+
box_proba: 1
|
66 |
+
box_kwargs:
|
67 |
+
margin: 10
|
68 |
+
bbox_min_size: 30
|
69 |
+
bbox_max_size: 150
|
70 |
+
max_times: 3
|
71 |
+
min_times: 1
|
72 |
+
segm_proba: 0
|
73 |
+
segm_kwargs:
|
74 |
+
confidence_threshold: 0.5
|
75 |
+
max_object_area: 0.5
|
76 |
+
min_mask_area: 0.07
|
77 |
+
downsample_levels: 6
|
78 |
+
num_variants_per_mask: 1
|
79 |
+
rigidness_mode: 1
|
80 |
+
max_foreground_coverage: 0.3
|
81 |
+
max_foreground_intersection: 0.7
|
82 |
+
max_mask_intersection: 0.1
|
83 |
+
max_hidden_area: 0.1
|
84 |
+
max_scale_change: 0.25
|
85 |
+
horizontal_flip: true
|
86 |
+
max_vertical_shift: 0.2
|
87 |
+
position_shuffle: true
|
88 |
+
transform_variant: distortions
|
89 |
+
dataloader_kwargs:
|
90 |
+
batch_size: ${data.batch_size}
|
91 |
+
shuffle: true
|
92 |
+
num_workers: ${data.num_workers}
|
93 |
+
val:
|
94 |
+
indir: ${location.data_root_dir}/val
|
95 |
+
img_suffix: .png
|
96 |
+
dataloader_kwargs:
|
97 |
+
batch_size: ${data.val_batch_size}
|
98 |
+
shuffle: false
|
99 |
+
num_workers: ${data.num_workers}
|
100 |
+
visual_test:
|
101 |
+
indir: ${location.data_root_dir}/korean_test
|
102 |
+
img_suffix: _input.png
|
103 |
+
pad_out_to_modulo: 32
|
104 |
+
dataloader_kwargs:
|
105 |
+
batch_size: 1
|
106 |
+
shuffle: false
|
107 |
+
num_workers: ${data.num_workers}
|
108 |
+
generator:
|
109 |
+
kind: ffc_resnet
|
110 |
+
input_nc: 4
|
111 |
+
output_nc: 3
|
112 |
+
ngf: 64
|
113 |
+
n_downsampling: 3
|
114 |
+
n_blocks: 18
|
115 |
+
add_out_act: sigmoid
|
116 |
+
init_conv_kwargs:
|
117 |
+
ratio_gin: 0
|
118 |
+
ratio_gout: 0
|
119 |
+
enable_lfu: false
|
120 |
+
downsample_conv_kwargs:
|
121 |
+
ratio_gin: ${generator.init_conv_kwargs.ratio_gout}
|
122 |
+
ratio_gout: ${generator.downsample_conv_kwargs.ratio_gin}
|
123 |
+
enable_lfu: false
|
124 |
+
resnet_conv_kwargs:
|
125 |
+
ratio_gin: 0.75
|
126 |
+
ratio_gout: ${generator.resnet_conv_kwargs.ratio_gin}
|
127 |
+
enable_lfu: false
|
128 |
+
discriminator:
|
129 |
+
kind: pix2pixhd_nlayer
|
130 |
+
input_nc: 3
|
131 |
+
ndf: 64
|
132 |
+
n_layers: 4
|
133 |
+
evaluator:
|
134 |
+
kind: default
|
135 |
+
inpainted_key: inpainted
|
136 |
+
integral_kind: ssim_fid100_f1
|
137 |
+
trainer:
|
138 |
+
kwargs:
|
139 |
+
gpus: -1
|
140 |
+
accelerator: ddp
|
141 |
+
max_epochs: 200
|
142 |
+
gradient_clip_val: 1
|
143 |
+
log_gpu_memory: None
|
144 |
+
limit_train_batches: 25000
|
145 |
+
val_check_interval: ${trainer.kwargs.limit_train_batches}
|
146 |
+
log_every_n_steps: 1000
|
147 |
+
precision: 32
|
148 |
+
terminate_on_nan: false
|
149 |
+
check_val_every_n_epoch: 1
|
150 |
+
num_sanity_val_steps: 8
|
151 |
+
limit_val_batches: 1000
|
152 |
+
replace_sampler_ddp: false
|
153 |
+
checkpoint_kwargs:
|
154 |
+
verbose: true
|
155 |
+
save_top_k: 5
|
156 |
+
save_last: true
|
157 |
+
period: 1
|
158 |
+
monitor: val_ssim_fid100_f1_total_mean
|
159 |
+
mode: max
|
big-lama-with-discr/models/best.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0806dc98a99c09561f5e45542ded1126a7ea9eeb91858a468d92c63a0054a550
|
3 |
+
size 532770031
|
big-lama/config.yaml
ADDED
@@ -0,0 +1,157 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
run_title: b18_ffc075_batch8x15
|
2 |
+
training_model:
|
3 |
+
kind: default
|
4 |
+
visualize_each_iters: 1000
|
5 |
+
concat_mask: true
|
6 |
+
store_discr_outputs_for_vis: true
|
7 |
+
losses:
|
8 |
+
l1:
|
9 |
+
weight_missing: 0
|
10 |
+
weight_known: 10
|
11 |
+
perceptual:
|
12 |
+
weight: 0
|
13 |
+
adversarial:
|
14 |
+
kind: r1
|
15 |
+
weight: 10
|
16 |
+
gp_coef: 0.001
|
17 |
+
mask_as_fake_target: true
|
18 |
+
allow_scale_mask: true
|
19 |
+
feature_matching:
|
20 |
+
weight: 100
|
21 |
+
resnet_pl:
|
22 |
+
weight: 30
|
23 |
+
weights_path: ${env:TORCH_HOME}
|
24 |
+
|
25 |
+
optimizers:
|
26 |
+
generator:
|
27 |
+
kind: adam
|
28 |
+
lr: 0.001
|
29 |
+
discriminator:
|
30 |
+
kind: adam
|
31 |
+
lr: 0.0001
|
32 |
+
visualizer:
|
33 |
+
key_order:
|
34 |
+
- image
|
35 |
+
- predicted_image
|
36 |
+
- discr_output_fake
|
37 |
+
- discr_output_real
|
38 |
+
- inpainted
|
39 |
+
rescale_keys:
|
40 |
+
- discr_output_fake
|
41 |
+
- discr_output_real
|
42 |
+
kind: directory
|
43 |
+
outdir: /group-volume/User-Driven-Content-Generation/r.suvorov/inpainting/experiments/r.suvorov_2021-04-30_14-41-12_train_simple_pix2pix2_gap_sdpl_novgg_large_b18_ffc075_batch8x15/samples
|
44 |
+
location:
|
45 |
+
data_root_dir: /group-volume/User-Driven-Content-Generation/datasets/inpainting_data_root_large
|
46 |
+
out_root_dir: /group-volume/User-Driven-Content-Generation/${env:USER}/inpainting/experiments
|
47 |
+
tb_dir: /group-volume/User-Driven-Content-Generation/${env:USER}/inpainting/tb_logs
|
48 |
+
data:
|
49 |
+
batch_size: 15
|
50 |
+
val_batch_size: 2
|
51 |
+
num_workers: 3
|
52 |
+
train:
|
53 |
+
indir: ${location.data_root_dir}/train
|
54 |
+
out_size: 256
|
55 |
+
mask_gen_kwargs:
|
56 |
+
irregular_proba: 1
|
57 |
+
irregular_kwargs:
|
58 |
+
max_angle: 4
|
59 |
+
max_len: 200
|
60 |
+
max_width: 100
|
61 |
+
max_times: 5
|
62 |
+
min_times: 1
|
63 |
+
box_proba: 1
|
64 |
+
box_kwargs:
|
65 |
+
margin: 10
|
66 |
+
bbox_min_size: 30
|
67 |
+
bbox_max_size: 150
|
68 |
+
max_times: 3
|
69 |
+
min_times: 1
|
70 |
+
segm_proba: 0
|
71 |
+
segm_kwargs:
|
72 |
+
confidence_threshold: 0.5
|
73 |
+
max_object_area: 0.5
|
74 |
+
min_mask_area: 0.07
|
75 |
+
downsample_levels: 6
|
76 |
+
num_variants_per_mask: 1
|
77 |
+
rigidness_mode: 1
|
78 |
+
max_foreground_coverage: 0.3
|
79 |
+
max_foreground_intersection: 0.7
|
80 |
+
max_mask_intersection: 0.1
|
81 |
+
max_hidden_area: 0.1
|
82 |
+
max_scale_change: 0.25
|
83 |
+
horizontal_flip: true
|
84 |
+
max_vertical_shift: 0.2
|
85 |
+
position_shuffle: true
|
86 |
+
transform_variant: distortions
|
87 |
+
dataloader_kwargs:
|
88 |
+
batch_size: ${data.batch_size}
|
89 |
+
shuffle: true
|
90 |
+
num_workers: ${data.num_workers}
|
91 |
+
val:
|
92 |
+
indir: ${location.data_root_dir}/val
|
93 |
+
img_suffix: .png
|
94 |
+
dataloader_kwargs:
|
95 |
+
batch_size: ${data.val_batch_size}
|
96 |
+
shuffle: false
|
97 |
+
num_workers: ${data.num_workers}
|
98 |
+
visual_test:
|
99 |
+
indir: ${location.data_root_dir}/korean_test
|
100 |
+
img_suffix: _input.png
|
101 |
+
pad_out_to_modulo: 32
|
102 |
+
dataloader_kwargs:
|
103 |
+
batch_size: 1
|
104 |
+
shuffle: false
|
105 |
+
num_workers: ${data.num_workers}
|
106 |
+
generator:
|
107 |
+
kind: ffc_resnet
|
108 |
+
input_nc: 4
|
109 |
+
output_nc: 3
|
110 |
+
ngf: 64
|
111 |
+
n_downsampling: 3
|
112 |
+
n_blocks: 18
|
113 |
+
add_out_act: sigmoid
|
114 |
+
init_conv_kwargs:
|
115 |
+
ratio_gin: 0
|
116 |
+
ratio_gout: 0
|
117 |
+
enable_lfu: false
|
118 |
+
downsample_conv_kwargs:
|
119 |
+
ratio_gin: ${generator.init_conv_kwargs.ratio_gout}
|
120 |
+
ratio_gout: ${generator.downsample_conv_kwargs.ratio_gin}
|
121 |
+
enable_lfu: false
|
122 |
+
resnet_conv_kwargs:
|
123 |
+
ratio_gin: 0.75
|
124 |
+
ratio_gout: ${generator.resnet_conv_kwargs.ratio_gin}
|
125 |
+
enable_lfu: false
|
126 |
+
discriminator:
|
127 |
+
kind: pix2pixhd_nlayer
|
128 |
+
input_nc: 3
|
129 |
+
ndf: 64
|
130 |
+
n_layers: 4
|
131 |
+
evaluator:
|
132 |
+
kind: default
|
133 |
+
inpainted_key: inpainted
|
134 |
+
integral_kind: ssim_fid100_f1
|
135 |
+
trainer:
|
136 |
+
kwargs:
|
137 |
+
gpus: -1
|
138 |
+
accelerator: ddp
|
139 |
+
max_epochs: 200
|
140 |
+
gradient_clip_val: 1
|
141 |
+
log_gpu_memory: None
|
142 |
+
limit_train_batches: 25000
|
143 |
+
val_check_interval: ${trainer.kwargs.limit_train_batches}
|
144 |
+
log_every_n_steps: 1000
|
145 |
+
precision: 32
|
146 |
+
terminate_on_nan: false
|
147 |
+
check_val_every_n_epoch: 1
|
148 |
+
num_sanity_val_steps: 8
|
149 |
+
limit_val_batches: 1000
|
150 |
+
replace_sampler_ddp: false
|
151 |
+
checkpoint_kwargs:
|
152 |
+
verbose: true
|
153 |
+
save_top_k: 5
|
154 |
+
save_last: true
|
155 |
+
period: 1
|
156 |
+
monitor: val_ssim_fid100_f1_total_mean
|
157 |
+
mode: max
|
big-lama/models/best.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fccb7adffd53ec0974ee5503c3731c2c2f1e7e07856fd9228cdcc0b46fd5d423
|
3 |
+
size 410046389
|
lama-celeba-hq-pl-abl/lama-no-pl/config.yaml
ADDED
@@ -0,0 +1,122 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
run_title: swu_celeba_bs30
|
2 |
+
training_model:
|
3 |
+
kind: default
|
4 |
+
visualize_each_iters: 1000
|
5 |
+
concat_mask: true
|
6 |
+
store_discr_outputs_for_vis: true
|
7 |
+
losses:
|
8 |
+
l1:
|
9 |
+
weight_missing: 0
|
10 |
+
weight_known: 10
|
11 |
+
perceptual:
|
12 |
+
weight: 0
|
13 |
+
adversarial:
|
14 |
+
kind: r1
|
15 |
+
weight: 10
|
16 |
+
gp_coef: 0.001
|
17 |
+
mask_as_fake_target: true
|
18 |
+
allow_scale_mask: true
|
19 |
+
feature_matching:
|
20 |
+
weight: 100
|
21 |
+
segm_pl:
|
22 |
+
weight: 0
|
23 |
+
optimizers:
|
24 |
+
generator:
|
25 |
+
kind: adam
|
26 |
+
lr: 0.001
|
27 |
+
discriminator:
|
28 |
+
kind: adam
|
29 |
+
lr: 0.0001
|
30 |
+
visualizer:
|
31 |
+
key_order:
|
32 |
+
- image
|
33 |
+
- predicted_image
|
34 |
+
- discr_output_fake
|
35 |
+
- discr_output_real
|
36 |
+
- inpainted
|
37 |
+
rescale_keys:
|
38 |
+
- discr_output_fake
|
39 |
+
- discr_output_real
|
40 |
+
kind: directory
|
41 |
+
outdir: /group-volume/orc_srr/multimodal/e.logacheva/CelebA-HQ-inpainting/experiments/e.logacheva_2021-03-16_16-02-59_train_ablv2_work_no_segmpl_swu_celeba_bs30/samples
|
42 |
+
location:
|
43 |
+
data_root_dir: ${env:HOME}/CelebA-HQ
|
44 |
+
out_root_dir: /group-volume/orc_srr/multimodal/${env:USER}/CelebA-HQ-inpainting/experiments
|
45 |
+
tb_dir: /group-volume/orc_srr/multimodal/${env:USER}/CelebA-HQ-inpainting/tb_logs
|
46 |
+
pretrained_models: /group-volume/orc_srr/multimodal/pretrained/
|
47 |
+
data:
|
48 |
+
batch_size: 5
|
49 |
+
val_batch_size: 2
|
50 |
+
num_workers: 3
|
51 |
+
train:
|
52 |
+
indir: ${location.data_root_dir}/train_256
|
53 |
+
out_size: 256
|
54 |
+
mask_gen_kwargs:
|
55 |
+
irregular_proba: 1
|
56 |
+
irregular_kwargs:
|
57 |
+
max_angle: 4
|
58 |
+
max_len: 200
|
59 |
+
max_width: 100
|
60 |
+
max_times: 5
|
61 |
+
min_times: 1
|
62 |
+
box_proba: 1
|
63 |
+
box_kwargs:
|
64 |
+
margin: 10
|
65 |
+
bbox_min_size: 30
|
66 |
+
bbox_max_size: 150
|
67 |
+
max_times: 4
|
68 |
+
min_times: 1
|
69 |
+
segm_proba: 0
|
70 |
+
transform_variant: no_augs
|
71 |
+
dataloader_kwargs:
|
72 |
+
batch_size: ${data.batch_size}
|
73 |
+
shuffle: true
|
74 |
+
num_workers: ${data.num_workers}
|
75 |
+
val:
|
76 |
+
indir: ${location.data_root_dir}/val_256
|
77 |
+
img_suffix: .png
|
78 |
+
dataloader_kwargs:
|
79 |
+
batch_size: ${data.val_batch_size}
|
80 |
+
shuffle: false
|
81 |
+
num_workers: ${data.num_workers}
|
82 |
+
visual_test: null
|
83 |
+
generator:
|
84 |
+
kind: pix2pixhd_global
|
85 |
+
input_nc: 4
|
86 |
+
output_nc: 3
|
87 |
+
ngf: 64
|
88 |
+
n_downsampling: 3
|
89 |
+
n_blocks: 9
|
90 |
+
conv_kind: default
|
91 |
+
add_out_act: sigmoid
|
92 |
+
discriminator:
|
93 |
+
kind: pix2pixhd_nlayer
|
94 |
+
input_nc: 3
|
95 |
+
ndf: 64
|
96 |
+
n_layers: 4
|
97 |
+
evaluator:
|
98 |
+
kind: default
|
99 |
+
inpainted_key: inpainted
|
100 |
+
integral_kind: ssim_fid100_f1
|
101 |
+
trainer:
|
102 |
+
kwargs:
|
103 |
+
gpus: -1
|
104 |
+
distributed_backend: ddp
|
105 |
+
max_epochs: 40
|
106 |
+
gradient_clip_val: 1
|
107 |
+
log_gpu_memory: None
|
108 |
+
limit_train_batches: 25000
|
109 |
+
val_check_interval: 2600
|
110 |
+
log_save_interval: 250
|
111 |
+
precision: 32
|
112 |
+
terminate_on_nan: false
|
113 |
+
check_val_every_n_epoch: 1
|
114 |
+
num_sanity_val_steps: 8
|
115 |
+
replace_sampler_ddp: false
|
116 |
+
checkpoint_kwargs:
|
117 |
+
verbose: true
|
118 |
+
save_top_k: 5
|
119 |
+
save_last: true
|
120 |
+
period: 1
|
121 |
+
monitor: val_ssim_fid100_f1_total_mean
|
122 |
+
mode: max
|
lama-celeba-hq-pl-abl/lama-no-pl/models/best.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:66b111ddcbf7253685b16ceeb291210381c5a9f9f3310efd6275b90e95d67cb9
|
3 |
+
size 388001399
|
lama-celeba-hq/ lama-regular/config.yaml
ADDED
@@ -0,0 +1,123 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
run_title: swu_celeba_bs30
|
2 |
+
training_model:
|
3 |
+
kind: default
|
4 |
+
visualize_each_iters: 1000
|
5 |
+
concat_mask: true
|
6 |
+
store_discr_outputs_for_vis: true
|
7 |
+
losses:
|
8 |
+
l1:
|
9 |
+
weight_missing: 0
|
10 |
+
weight_known: 10
|
11 |
+
perceptual:
|
12 |
+
weight: 0
|
13 |
+
adversarial:
|
14 |
+
kind: r1
|
15 |
+
weight: 10
|
16 |
+
gp_coef: 0.001
|
17 |
+
mask_as_fake_target: true
|
18 |
+
allow_scale_mask: true
|
19 |
+
feature_matching:
|
20 |
+
weight: 100
|
21 |
+
segm_pl:
|
22 |
+
weight: 30
|
23 |
+
weights_path: ${env:TORCH_HOME}
|
24 |
+
optimizers:
|
25 |
+
generator:
|
26 |
+
kind: adam
|
27 |
+
lr: 0.001
|
28 |
+
discriminator:
|
29 |
+
kind: adam
|
30 |
+
lr: 0.0001
|
31 |
+
visualizer:
|
32 |
+
key_order:
|
33 |
+
- image
|
34 |
+
- predicted_image
|
35 |
+
- discr_output_fake
|
36 |
+
- discr_output_real
|
37 |
+
- inpainted
|
38 |
+
rescale_keys:
|
39 |
+
- discr_output_fake
|
40 |
+
- discr_output_real
|
41 |
+
kind: directory
|
42 |
+
outdir: /group-volume/orc_srr/multimodal/e.logacheva/CelebA-HQ-inpainting/experiments/e.logacheva_2021-03-16_16-00-45_train_ablv2_work_swu_celeba_bs30/samples
|
43 |
+
location:
|
44 |
+
data_root_dir: ${env:HOME}/CelebA-HQ
|
45 |
+
out_root_dir: /group-volume/orc_srr/multimodal/${env:USER}/CelebA-HQ-inpainting/experiments
|
46 |
+
tb_dir: /group-volume/orc_srr/multimodal/${env:USER}/CelebA-HQ-inpainting/tb_logs
|
47 |
+
pretrained_models: /group-volume/orc_srr/multimodal/pretrained/
|
48 |
+
data:
|
49 |
+
batch_size: 5
|
50 |
+
val_batch_size: 2
|
51 |
+
num_workers: 3
|
52 |
+
train:
|
53 |
+
indir: ${location.data_root_dir}/train_256
|
54 |
+
out_size: 256
|
55 |
+
mask_gen_kwargs:
|
56 |
+
irregular_proba: 1
|
57 |
+
irregular_kwargs:
|
58 |
+
max_angle: 4
|
59 |
+
max_len: 200
|
60 |
+
max_width: 100
|
61 |
+
max_times: 5
|
62 |
+
min_times: 1
|
63 |
+
box_proba: 1
|
64 |
+
box_kwargs:
|
65 |
+
margin: 10
|
66 |
+
bbox_min_size: 30
|
67 |
+
bbox_max_size: 150
|
68 |
+
max_times: 4
|
69 |
+
min_times: 1
|
70 |
+
segm_proba: 0
|
71 |
+
transform_variant: no_augs
|
72 |
+
dataloader_kwargs:
|
73 |
+
batch_size: ${data.batch_size}
|
74 |
+
shuffle: true
|
75 |
+
num_workers: ${data.num_workers}
|
76 |
+
val:
|
77 |
+
indir: ${location.data_root_dir}/val_256
|
78 |
+
img_suffix: .png
|
79 |
+
dataloader_kwargs:
|
80 |
+
batch_size: ${data.val_batch_size}
|
81 |
+
shuffle: false
|
82 |
+
num_workers: ${data.num_workers}
|
83 |
+
visual_test: null
|
84 |
+
generator:
|
85 |
+
kind: pix2pixhd_global
|
86 |
+
input_nc: 4
|
87 |
+
output_nc: 3
|
88 |
+
ngf: 64
|
89 |
+
n_downsampling: 3
|
90 |
+
n_blocks: 9
|
91 |
+
conv_kind: default
|
92 |
+
add_out_act: sigmoid
|
93 |
+
discriminator:
|
94 |
+
kind: pix2pixhd_nlayer
|
95 |
+
input_nc: 3
|
96 |
+
ndf: 64
|
97 |
+
n_layers: 4
|
98 |
+
evaluator:
|
99 |
+
kind: default
|
100 |
+
inpainted_key: inpainted
|
101 |
+
integral_kind: ssim_fid100_f1
|
102 |
+
trainer:
|
103 |
+
kwargs:
|
104 |
+
gpus: -1
|
105 |
+
distributed_backend: ddp
|
106 |
+
max_epochs: 40
|
107 |
+
gradient_clip_val: 1
|
108 |
+
log_gpu_memory: None
|
109 |
+
limit_train_batches: 25000
|
110 |
+
val_check_interval: 2600
|
111 |
+
log_save_interval: 250
|
112 |
+
precision: 32
|
113 |
+
terminate_on_nan: false
|
114 |
+
check_val_every_n_epoch: 1
|
115 |
+
num_sanity_val_steps: 8
|
116 |
+
replace_sampler_ddp: false
|
117 |
+
checkpoint_kwargs:
|
118 |
+
verbose: true
|
119 |
+
save_top_k: 5
|
120 |
+
save_last: true
|
121 |
+
period: 1
|
122 |
+
monitor: val_ssim_fid100_f1_total_mean
|
123 |
+
mode: max
|
lama-celeba-hq/ lama-regular/models/best.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5641c7655a82749e22c0a392c80dd94d7266ae0f63fbaf6b2a96671ac2d0e918
|
3 |
+
size 388009385
|
lama-celeba-hq/lama-deep/config.yaml
ADDED
@@ -0,0 +1,123 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
run_title: swu_celeba_bs30_b15
|
2 |
+
training_model:
|
3 |
+
kind: default
|
4 |
+
visualize_each_iters: 1000
|
5 |
+
concat_mask: true
|
6 |
+
store_discr_outputs_for_vis: true
|
7 |
+
losses:
|
8 |
+
l1:
|
9 |
+
weight_missing: 0
|
10 |
+
weight_known: 10
|
11 |
+
perceptual:
|
12 |
+
weight: 0
|
13 |
+
adversarial:
|
14 |
+
kind: r1
|
15 |
+
weight: 10
|
16 |
+
gp_coef: 0.001
|
17 |
+
mask_as_fake_target: true
|
18 |
+
allow_scale_mask: true
|
19 |
+
feature_matching:
|
20 |
+
weight: 100
|
21 |
+
segm_pl:
|
22 |
+
weight: 30
|
23 |
+
weights_path: ${env:TORCH_HOME}
|
24 |
+
optimizers:
|
25 |
+
generator:
|
26 |
+
kind: adam
|
27 |
+
lr: 0.001
|
28 |
+
discriminator:
|
29 |
+
kind: adam
|
30 |
+
lr: 0.0001
|
31 |
+
visualizer:
|
32 |
+
key_order:
|
33 |
+
- image
|
34 |
+
- predicted_image
|
35 |
+
- discr_output_fake
|
36 |
+
- discr_output_real
|
37 |
+
- inpainted
|
38 |
+
rescale_keys:
|
39 |
+
- discr_output_fake
|
40 |
+
- discr_output_real
|
41 |
+
kind: directory
|
42 |
+
outdir: /group-volume/orc_srr/multimodal/e.logacheva/CelebA-HQ-inpainting/experiments/e.logacheva_2021-06-11_18-11-09_train_ablv2_work_swu_celeba_bs30_b15/samples
|
43 |
+
location:
|
44 |
+
data_root_dir: ${env:HOME}/CelebA-HQ
|
45 |
+
out_root_dir: /group-volume/orc_srr/multimodal/${env:USER}/CelebA-HQ-inpainting/experiments
|
46 |
+
tb_dir: /group-volume/orc_srr/multimodal/${env:USER}/CelebA-HQ-inpainting/tb_logs
|
47 |
+
pretrained_models: /group-volume/orc_srr/multimodal/pretrained/
|
48 |
+
data:
|
49 |
+
batch_size: 5
|
50 |
+
val_batch_size: 2
|
51 |
+
num_workers: 3
|
52 |
+
train:
|
53 |
+
indir: ${location.data_root_dir}/train_256
|
54 |
+
out_size: 256
|
55 |
+
mask_gen_kwargs:
|
56 |
+
irregular_proba: 1
|
57 |
+
irregular_kwargs:
|
58 |
+
max_angle: 4
|
59 |
+
max_len: 200
|
60 |
+
max_width: 100
|
61 |
+
max_times: 5
|
62 |
+
min_times: 1
|
63 |
+
box_proba: 1
|
64 |
+
box_kwargs:
|
65 |
+
margin: 10
|
66 |
+
bbox_min_size: 30
|
67 |
+
bbox_max_size: 150
|
68 |
+
max_times: 4
|
69 |
+
min_times: 1
|
70 |
+
segm_proba: 0
|
71 |
+
transform_variant: no_augs
|
72 |
+
dataloader_kwargs:
|
73 |
+
batch_size: ${data.batch_size}
|
74 |
+
shuffle: true
|
75 |
+
num_workers: ${data.num_workers}
|
76 |
+
val:
|
77 |
+
indir: ${location.data_root_dir}/val_256
|
78 |
+
img_suffix: .png
|
79 |
+
dataloader_kwargs:
|
80 |
+
batch_size: ${data.val_batch_size}
|
81 |
+
shuffle: false
|
82 |
+
num_workers: ${data.num_workers}
|
83 |
+
visual_test: null
|
84 |
+
generator:
|
85 |
+
kind: pix2pixhd_global
|
86 |
+
input_nc: 4
|
87 |
+
output_nc: 3
|
88 |
+
ngf: 64
|
89 |
+
n_downsampling: 3
|
90 |
+
n_blocks: 15
|
91 |
+
conv_kind: default
|
92 |
+
add_out_act: sigmoid
|
93 |
+
discriminator:
|
94 |
+
kind: pix2pixhd_nlayer
|
95 |
+
input_nc: 3
|
96 |
+
ndf: 64
|
97 |
+
n_layers: 4
|
98 |
+
evaluator:
|
99 |
+
kind: default
|
100 |
+
inpainted_key: inpainted
|
101 |
+
integral_kind: ssim_fid100_f1
|
102 |
+
trainer:
|
103 |
+
kwargs:
|
104 |
+
gpus: -1
|
105 |
+
distributed_backend: ddp
|
106 |
+
max_epochs: 40
|
107 |
+
gradient_clip_val: 1
|
108 |
+
log_gpu_memory: None
|
109 |
+
limit_train_batches: 25000
|
110 |
+
val_check_interval: 2600
|
111 |
+
log_save_interval: 250
|
112 |
+
precision: 32
|
113 |
+
terminate_on_nan: false
|
114 |
+
check_val_every_n_epoch: 1
|
115 |
+
num_sanity_val_steps: 8
|
116 |
+
replace_sampler_ddp: false
|
117 |
+
checkpoint_kwargs:
|
118 |
+
verbose: true
|
119 |
+
save_top_k: 5
|
120 |
+
save_last: true
|
121 |
+
period: 1
|
122 |
+
monitor: val_ssim_fid100_f1_total_mean
|
123 |
+
mode: max
|
lama-celeba-hq/lama-deep/models/best.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ec02f080ef3adf6395a111efc061dd2d869ab78fe014c6f4431e61a8a448332e
|
3 |
+
size 501258959
|
lama-celeba-hq/lama-dilated/config.yaml
ADDED
@@ -0,0 +1,127 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
run_title: swu_celeba_bs30
|
2 |
+
training_model:
|
3 |
+
kind: default
|
4 |
+
visualize_each_iters: 1000
|
5 |
+
concat_mask: true
|
6 |
+
store_discr_outputs_for_vis: true
|
7 |
+
losses:
|
8 |
+
l1:
|
9 |
+
weight_missing: 0
|
10 |
+
weight_known: 10
|
11 |
+
perceptual:
|
12 |
+
weight: 0
|
13 |
+
adversarial:
|
14 |
+
kind: r1
|
15 |
+
weight: 10
|
16 |
+
gp_coef: 0.001
|
17 |
+
mask_as_fake_target: true
|
18 |
+
allow_scale_mask: true
|
19 |
+
feature_matching:
|
20 |
+
weight: 100
|
21 |
+
segm_pl:
|
22 |
+
weight: 30
|
23 |
+
weights_path: ${env:TORCH_HOME}
|
24 |
+
optimizers:
|
25 |
+
generator:
|
26 |
+
kind: adam
|
27 |
+
lr: 0.001
|
28 |
+
discriminator:
|
29 |
+
kind: adam
|
30 |
+
lr: 0.0001
|
31 |
+
visualizer:
|
32 |
+
key_order:
|
33 |
+
- image
|
34 |
+
- predicted_image
|
35 |
+
- discr_output_fake
|
36 |
+
- discr_output_real
|
37 |
+
- inpainted
|
38 |
+
rescale_keys:
|
39 |
+
- discr_output_fake
|
40 |
+
- discr_output_real
|
41 |
+
kind: directory
|
42 |
+
outdir: /group-volume/orc_srr/multimodal/e.logacheva/CelebA-HQ-inpainting/experiments/e.logacheva_2021-03-16_00-49-10_train_final_md_swu_celeba_bs30/samples
|
43 |
+
location:
|
44 |
+
data_root_dir: ${env:HOME}/CelebA-HQ
|
45 |
+
out_root_dir: /group-volume/orc_srr/multimodal/${env:USER}/CelebA-HQ-inpainting/experiments
|
46 |
+
tb_dir: /group-volume/orc_srr/multimodal/${env:USER}/CelebA-HQ-inpainting/tb_logs
|
47 |
+
pretrained_models: /group-volume/orc_srr/multimodal/pretrained/
|
48 |
+
data:
|
49 |
+
batch_size: 5
|
50 |
+
val_batch_size: 2
|
51 |
+
num_workers: 3
|
52 |
+
train:
|
53 |
+
indir: ${location.data_root_dir}/train_256
|
54 |
+
out_size: 256
|
55 |
+
mask_gen_kwargs:
|
56 |
+
irregular_proba: 1
|
57 |
+
irregular_kwargs:
|
58 |
+
max_angle: 4
|
59 |
+
max_len: 200
|
60 |
+
max_width: 100
|
61 |
+
max_times: 5
|
62 |
+
min_times: 1
|
63 |
+
box_proba: 1
|
64 |
+
box_kwargs:
|
65 |
+
margin: 10
|
66 |
+
bbox_min_size: 30
|
67 |
+
bbox_max_size: 150
|
68 |
+
max_times: 4
|
69 |
+
min_times: 1
|
70 |
+
segm_proba: 0
|
71 |
+
transform_variant: no_augs
|
72 |
+
dataloader_kwargs:
|
73 |
+
batch_size: ${data.batch_size}
|
74 |
+
shuffle: true
|
75 |
+
num_workers: ${data.num_workers}
|
76 |
+
val:
|
77 |
+
indir: ${location.data_root_dir}/val_256
|
78 |
+
img_suffix: .png
|
79 |
+
dataloader_kwargs:
|
80 |
+
batch_size: ${data.val_batch_size}
|
81 |
+
shuffle: false
|
82 |
+
num_workers: ${data.num_workers}
|
83 |
+
visual_test: null
|
84 |
+
generator:
|
85 |
+
kind: pix2pixhd_multidilated
|
86 |
+
input_nc: 4
|
87 |
+
output_nc: 3
|
88 |
+
ngf: 64
|
89 |
+
n_downsampling: 3
|
90 |
+
n_blocks: 9
|
91 |
+
conv_kind: default
|
92 |
+
add_out_act: sigmoid
|
93 |
+
multidilation_kwargs:
|
94 |
+
comb_mode: cat_in
|
95 |
+
dilation_num: 4
|
96 |
+
discriminator:
|
97 |
+
kind: pix2pixhd_nlayer
|
98 |
+
input_nc: 3
|
99 |
+
ndf: 64
|
100 |
+
n_layers: 4
|
101 |
+
evaluator:
|
102 |
+
kind: default
|
103 |
+
inpainted_key: inpainted
|
104 |
+
integral_kind: ssim_fid100_f1
|
105 |
+
trainer:
|
106 |
+
kwargs:
|
107 |
+
gpus: -1
|
108 |
+
distributed_backend: ddp
|
109 |
+
max_epochs: 40
|
110 |
+
gradient_clip_val: 1
|
111 |
+
log_gpu_memory: None
|
112 |
+
limit_train_batches: 25000
|
113 |
+
val_check_interval: 2600
|
114 |
+
log_save_interval: 250
|
115 |
+
precision: 32
|
116 |
+
terminate_on_nan: false
|
117 |
+
check_val_every_n_epoch: 1
|
118 |
+
num_sanity_val_steps: 8
|
119 |
+
replace_sampler_ddp: false
|
120 |
+
benchmark: true
|
121 |
+
checkpoint_kwargs:
|
122 |
+
verbose: true
|
123 |
+
save_top_k: 5
|
124 |
+
save_last: true
|
125 |
+
period: 1
|
126 |
+
monitor: val_ssim_fid100_f1_total_mean
|
127 |
+
mode: max
|
lama-celeba-hq/lama-dilated/models/best.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c71a0e8195c0944c27b5e2ba785c6e7fe2bef32da68bd1a46ee2b1c36f425476
|
3 |
+
size 388160827
|
lama-celeba-hq/lama-fourier-shallow/config.yaml
ADDED
@@ -0,0 +1,134 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
run_title: swu_celeba_bs30_b6
|
2 |
+
training_model:
|
3 |
+
kind: default
|
4 |
+
visualize_each_iters: 1000
|
5 |
+
concat_mask: true
|
6 |
+
store_discr_outputs_for_vis: true
|
7 |
+
losses:
|
8 |
+
l1:
|
9 |
+
weight_missing: 0
|
10 |
+
weight_known: 10
|
11 |
+
perceptual:
|
12 |
+
weight: 0
|
13 |
+
adversarial:
|
14 |
+
kind: r1
|
15 |
+
weight: 10
|
16 |
+
gp_coef: 0.001
|
17 |
+
mask_as_fake_target: true
|
18 |
+
allow_scale_mask: true
|
19 |
+
feature_matching:
|
20 |
+
weight: 100
|
21 |
+
segm_pl:
|
22 |
+
weight: 30
|
23 |
+
weights_path: ${env:TORCH_HOME}
|
24 |
+
optimizers:
|
25 |
+
generator:
|
26 |
+
kind: adam
|
27 |
+
lr: 0.001
|
28 |
+
discriminator:
|
29 |
+
kind: adam
|
30 |
+
lr: 0.0001
|
31 |
+
visualizer:
|
32 |
+
key_order:
|
33 |
+
- image
|
34 |
+
- predicted_image
|
35 |
+
- discr_output_fake
|
36 |
+
- discr_output_real
|
37 |
+
- inpainted
|
38 |
+
rescale_keys:
|
39 |
+
- discr_output_fake
|
40 |
+
- discr_output_real
|
41 |
+
kind: directory
|
42 |
+
outdir: /group-volume/orc_srr/multimodal/e.logacheva/CelebA-HQ-inpainting/experiments/e.logacheva_2021-06-11_18-21-08_train_ablv2_work_ffc075_swu_celeba_bs30_b6/samples
|
43 |
+
location:
|
44 |
+
data_root_dir: ${env:HOME}/CelebA-HQ
|
45 |
+
out_root_dir: /group-volume/orc_srr/multimodal/${env:USER}/CelebA-HQ-inpainting/experiments
|
46 |
+
tb_dir: /group-volume/orc_srr/multimodal/${env:USER}/CelebA-HQ-inpainting/tb_logs
|
47 |
+
pretrained_models: /group-volume/orc_srr/multimodal/pretrained/
|
48 |
+
data:
|
49 |
+
batch_size: 6
|
50 |
+
val_batch_size: 2
|
51 |
+
num_workers: 3
|
52 |
+
train:
|
53 |
+
indir: ${location.data_root_dir}/train_256
|
54 |
+
out_size: 256
|
55 |
+
mask_gen_kwargs:
|
56 |
+
irregular_proba: 1
|
57 |
+
irregular_kwargs:
|
58 |
+
max_angle: 4
|
59 |
+
max_len: 200
|
60 |
+
max_width: 100
|
61 |
+
max_times: 5
|
62 |
+
min_times: 1
|
63 |
+
box_proba: 1
|
64 |
+
box_kwargs:
|
65 |
+
margin: 10
|
66 |
+
bbox_min_size: 30
|
67 |
+
bbox_max_size: 150
|
68 |
+
max_times: 4
|
69 |
+
min_times: 1
|
70 |
+
segm_proba: 0
|
71 |
+
transform_variant: no_augs
|
72 |
+
dataloader_kwargs:
|
73 |
+
batch_size: ${data.batch_size}
|
74 |
+
shuffle: true
|
75 |
+
num_workers: ${data.num_workers}
|
76 |
+
val:
|
77 |
+
indir: ${location.data_root_dir}/val_256
|
78 |
+
img_suffix: .png
|
79 |
+
dataloader_kwargs:
|
80 |
+
batch_size: ${data.val_batch_size}
|
81 |
+
shuffle: false
|
82 |
+
num_workers: ${data.num_workers}
|
83 |
+
visual_test: null
|
84 |
+
generator:
|
85 |
+
kind: ffc_resnet
|
86 |
+
input_nc: 4
|
87 |
+
output_nc: 3
|
88 |
+
ngf: 64
|
89 |
+
n_downsampling: 3
|
90 |
+
n_blocks: 6
|
91 |
+
add_out_act: sigmoid
|
92 |
+
init_conv_kwargs:
|
93 |
+
ratio_gin: 0
|
94 |
+
ratio_gout: 0
|
95 |
+
enable_lfu: false
|
96 |
+
downsample_conv_kwargs:
|
97 |
+
ratio_gin: ${generator.init_conv_kwargs.ratio_gout}
|
98 |
+
ratio_gout: ${generator.downsample_conv_kwargs.ratio_gin}
|
99 |
+
enable_lfu: false
|
100 |
+
resnet_conv_kwargs:
|
101 |
+
ratio_gin: 0.75
|
102 |
+
ratio_gout: ${generator.resnet_conv_kwargs.ratio_gin}
|
103 |
+
enable_lfu: false
|
104 |
+
discriminator:
|
105 |
+
kind: pix2pixhd_nlayer
|
106 |
+
input_nc: 3
|
107 |
+
ndf: 64
|
108 |
+
n_layers: 4
|
109 |
+
evaluator:
|
110 |
+
kind: default
|
111 |
+
inpainted_key: inpainted
|
112 |
+
integral_kind: ssim_fid100_f1
|
113 |
+
trainer:
|
114 |
+
kwargs:
|
115 |
+
gpus: -1
|
116 |
+
distributed_backend: ddp
|
117 |
+
max_epochs: 40
|
118 |
+
gradient_clip_val: 1
|
119 |
+
log_gpu_memory: None
|
120 |
+
limit_train_batches: 25000
|
121 |
+
val_check_interval: 2600
|
122 |
+
log_save_interval: 250
|
123 |
+
precision: 32
|
124 |
+
terminate_on_nan: false
|
125 |
+
check_val_every_n_epoch: 1
|
126 |
+
num_sanity_val_steps: 8
|
127 |
+
replace_sampler_ddp: false
|
128 |
+
checkpoint_kwargs:
|
129 |
+
verbose: true
|
130 |
+
save_top_k: 5
|
131 |
+
save_last: true
|
132 |
+
period: 1
|
133 |
+
monitor: val_ssim_fid100_f1_total_mean
|
134 |
+
mode: max
|
lama-celeba-hq/lama-fourier-shallow/models/best.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5ba34746ca7e365c56429317e64c6ff964ecb1217b0599c735a76118197cbb06
|
3 |
+
size 281772850
|
lama-celeba-hq/lama-fourier/config.yaml
ADDED
@@ -0,0 +1,134 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
run_title: swu_celeba_bs30
|
2 |
+
training_model:
|
3 |
+
kind: default
|
4 |
+
visualize_each_iters: 1000
|
5 |
+
concat_mask: true
|
6 |
+
store_discr_outputs_for_vis: true
|
7 |
+
losses:
|
8 |
+
l1:
|
9 |
+
weight_missing: 0
|
10 |
+
weight_known: 10
|
11 |
+
perceptual:
|
12 |
+
weight: 0
|
13 |
+
adversarial:
|
14 |
+
kind: r1
|
15 |
+
weight: 10
|
16 |
+
gp_coef: 0.001
|
17 |
+
mask_as_fake_target: true
|
18 |
+
allow_scale_mask: true
|
19 |
+
feature_matching:
|
20 |
+
weight: 100
|
21 |
+
segm_pl:
|
22 |
+
weight: 30
|
23 |
+
weights_path: ${env:TORCH_HOME}
|
24 |
+
optimizers:
|
25 |
+
generator:
|
26 |
+
kind: adam
|
27 |
+
lr: 0.001
|
28 |
+
discriminator:
|
29 |
+
kind: adam
|
30 |
+
lr: 0.0001
|
31 |
+
visualizer:
|
32 |
+
key_order:
|
33 |
+
- image
|
34 |
+
- predicted_image
|
35 |
+
- discr_output_fake
|
36 |
+
- discr_output_real
|
37 |
+
- inpainted
|
38 |
+
rescale_keys:
|
39 |
+
- discr_output_fake
|
40 |
+
- discr_output_real
|
41 |
+
kind: directory
|
42 |
+
outdir: /group-volume/orc_srr/multimodal/e.logacheva/CelebA-HQ-inpainting/experiments/e.logacheva_2021-03-16_00-40-44_train_ablv2_work_ffc075_swu_celeba_bs30/samples
|
43 |
+
location:
|
44 |
+
data_root_dir: ${env:HOME}/CelebA-HQ
|
45 |
+
out_root_dir: /group-volume/orc_srr/multimodal/${env:USER}/CelebA-HQ-inpainting/experiments
|
46 |
+
tb_dir: /group-volume/orc_srr/multimodal/${env:USER}/CelebA-HQ-inpainting/tb_logs
|
47 |
+
pretrained_models: /group-volume/orc_srr/multimodal/pretrained/
|
48 |
+
data:
|
49 |
+
batch_size: 5
|
50 |
+
val_batch_size: 2
|
51 |
+
num_workers: 3
|
52 |
+
train:
|
53 |
+
indir: ${location.data_root_dir}/train_256
|
54 |
+
out_size: 256
|
55 |
+
mask_gen_kwargs:
|
56 |
+
irregular_proba: 1
|
57 |
+
irregular_kwargs:
|
58 |
+
max_angle: 4
|
59 |
+
max_len: 200
|
60 |
+
max_width: 100
|
61 |
+
max_times: 5
|
62 |
+
min_times: 1
|
63 |
+
box_proba: 1
|
64 |
+
box_kwargs:
|
65 |
+
margin: 10
|
66 |
+
bbox_min_size: 30
|
67 |
+
bbox_max_size: 150
|
68 |
+
max_times: 4
|
69 |
+
min_times: 1
|
70 |
+
segm_proba: 0
|
71 |
+
transform_variant: no_augs
|
72 |
+
dataloader_kwargs:
|
73 |
+
batch_size: ${data.batch_size}
|
74 |
+
shuffle: true
|
75 |
+
num_workers: ${data.num_workers}
|
76 |
+
val:
|
77 |
+
indir: ${location.data_root_dir}/val_256
|
78 |
+
img_suffix: .png
|
79 |
+
dataloader_kwargs:
|
80 |
+
batch_size: ${data.val_batch_size}
|
81 |
+
shuffle: false
|
82 |
+
num_workers: ${data.num_workers}
|
83 |
+
visual_test: null
|
84 |
+
generator:
|
85 |
+
kind: ffc_resnet
|
86 |
+
input_nc: 4
|
87 |
+
output_nc: 3
|
88 |
+
ngf: 64
|
89 |
+
n_downsampling: 3
|
90 |
+
n_blocks: 9
|
91 |
+
add_out_act: sigmoid
|
92 |
+
init_conv_kwargs:
|
93 |
+
ratio_gin: 0
|
94 |
+
ratio_gout: 0
|
95 |
+
enable_lfu: false
|
96 |
+
downsample_conv_kwargs:
|
97 |
+
ratio_gin: ${generator.init_conv_kwargs.ratio_gout}
|
98 |
+
ratio_gout: ${generator.downsample_conv_kwargs.ratio_gin}
|
99 |
+
enable_lfu: false
|
100 |
+
resnet_conv_kwargs:
|
101 |
+
ratio_gin: 0.75
|
102 |
+
ratio_gout: ${generator.resnet_conv_kwargs.ratio_gin}
|
103 |
+
enable_lfu: false
|
104 |
+
discriminator:
|
105 |
+
kind: pix2pixhd_nlayer
|
106 |
+
input_nc: 3
|
107 |
+
ndf: 64
|
108 |
+
n_layers: 4
|
109 |
+
evaluator:
|
110 |
+
kind: default
|
111 |
+
inpainted_key: inpainted
|
112 |
+
integral_kind: ssim_fid100_f1
|
113 |
+
trainer:
|
114 |
+
kwargs:
|
115 |
+
gpus: -1
|
116 |
+
distributed_backend: ddp
|
117 |
+
max_epochs: 40
|
118 |
+
gradient_clip_val: 1
|
119 |
+
log_gpu_memory: None
|
120 |
+
limit_train_batches: 25000
|
121 |
+
val_check_interval: 2600
|
122 |
+
log_save_interval: 250
|
123 |
+
precision: 32
|
124 |
+
terminate_on_nan: false
|
125 |
+
check_val_every_n_epoch: 1
|
126 |
+
num_sanity_val_steps: 8
|
127 |
+
replace_sampler_ddp: false
|
128 |
+
checkpoint_kwargs:
|
129 |
+
verbose: true
|
130 |
+
save_top_k: 5
|
131 |
+
save_last: true
|
132 |
+
period: 1
|
133 |
+
monitor: val_ssim_fid100_f1_total_mean
|
134 |
+
mode: max
|
lama-celeba-hq/lama-fourier/models/best.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3060742ea7464288d7d5fa8e83c940ddbd359ba1640f79135759da9c8c81f281
|
3 |
+
size 313953334
|
lama-celeba-hq/lama_small_train_masks/config.yaml
ADDED
@@ -0,0 +1,123 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
run_title: swu_celeba_bs30
|
2 |
+
training_model:
|
3 |
+
kind: default
|
4 |
+
visualize_each_iters: 1000
|
5 |
+
concat_mask: true
|
6 |
+
store_discr_outputs_for_vis: true
|
7 |
+
losses:
|
8 |
+
l1:
|
9 |
+
weight_missing: 0
|
10 |
+
weight_known: 10
|
11 |
+
perceptual:
|
12 |
+
weight: 0
|
13 |
+
adversarial:
|
14 |
+
kind: r1
|
15 |
+
weight: 10
|
16 |
+
gp_coef: 0.001
|
17 |
+
mask_as_fake_target: true
|
18 |
+
allow_scale_mask: true
|
19 |
+
feature_matching:
|
20 |
+
weight: 100
|
21 |
+
segm_pl:
|
22 |
+
weight: 30
|
23 |
+
weights_path: ${env:TORCH_HOME}
|
24 |
+
optimizers:
|
25 |
+
generator:
|
26 |
+
kind: adam
|
27 |
+
lr: 0.001
|
28 |
+
discriminator:
|
29 |
+
kind: adam
|
30 |
+
lr: 0.0001
|
31 |
+
visualizer:
|
32 |
+
key_order:
|
33 |
+
- image
|
34 |
+
- predicted_image
|
35 |
+
- discr_output_fake
|
36 |
+
- discr_output_real
|
37 |
+
- inpainted
|
38 |
+
rescale_keys:
|
39 |
+
- discr_output_fake
|
40 |
+
- discr_output_real
|
41 |
+
kind: directory
|
42 |
+
outdir: /group-volume/orc_srr/multimodal/e.logacheva/CelebA-HQ-inpainting/experiments/e.logacheva_2021-03-16_16-02-59_train_ablv2_work_small_holes_swu_celeba_bs30/samples
|
43 |
+
location:
|
44 |
+
data_root_dir: ${env:HOME}/CelebA-HQ
|
45 |
+
out_root_dir: /group-volume/orc_srr/multimodal/${env:USER}/CelebA-HQ-inpainting/experiments
|
46 |
+
tb_dir: /group-volume/orc_srr/multimodal/${env:USER}/CelebA-HQ-inpainting/tb_logs
|
47 |
+
pretrained_models: /group-volume/orc_srr/multimodal/pretrained/
|
48 |
+
data:
|
49 |
+
batch_size: 5
|
50 |
+
val_batch_size: 2
|
51 |
+
num_workers: 3
|
52 |
+
train:
|
53 |
+
indir: ${location.data_root_dir}/train_256
|
54 |
+
out_size: 256
|
55 |
+
mask_gen_kwargs:
|
56 |
+
irregular_proba: 1
|
57 |
+
irregular_kwargs:
|
58 |
+
max_angle: 4
|
59 |
+
max_len: 200
|
60 |
+
max_width: 100
|
61 |
+
max_times: 5
|
62 |
+
min_times: 1
|
63 |
+
box_proba: 1
|
64 |
+
box_kwargs:
|
65 |
+
margin: 10
|
66 |
+
bbox_min_size: 30
|
67 |
+
bbox_max_size: 150
|
68 |
+
max_times: 4
|
69 |
+
min_times: 1
|
70 |
+
segm_proba: 0
|
71 |
+
transform_variant: no_augs
|
72 |
+
dataloader_kwargs:
|
73 |
+
batch_size: ${data.batch_size}
|
74 |
+
shuffle: true
|
75 |
+
num_workers: ${data.num_workers}
|
76 |
+
val:
|
77 |
+
indir: ${location.data_root_dir}/val_256
|
78 |
+
img_suffix: .png
|
79 |
+
dataloader_kwargs:
|
80 |
+
batch_size: ${data.val_batch_size}
|
81 |
+
shuffle: false
|
82 |
+
num_workers: ${data.num_workers}
|
83 |
+
visual_test: null
|
84 |
+
generator:
|
85 |
+
kind: pix2pixhd_global
|
86 |
+
input_nc: 4
|
87 |
+
output_nc: 3
|
88 |
+
ngf: 64
|
89 |
+
n_downsampling: 3
|
90 |
+
n_blocks: 9
|
91 |
+
conv_kind: default
|
92 |
+
add_out_act: sigmoid
|
93 |
+
discriminator:
|
94 |
+
kind: pix2pixhd_nlayer
|
95 |
+
input_nc: 3
|
96 |
+
ndf: 64
|
97 |
+
n_layers: 4
|
98 |
+
evaluator:
|
99 |
+
kind: default
|
100 |
+
inpainted_key: inpainted
|
101 |
+
integral_kind: ssim_fid100_f1
|
102 |
+
trainer:
|
103 |
+
kwargs:
|
104 |
+
gpus: -1
|
105 |
+
distributed_backend: ddp
|
106 |
+
max_epochs: 40
|
107 |
+
gradient_clip_val: 1
|
108 |
+
log_gpu_memory: None
|
109 |
+
limit_train_batches: 25000
|
110 |
+
val_check_interval: 2600
|
111 |
+
log_save_interval: 250
|
112 |
+
precision: 32
|
113 |
+
terminate_on_nan: false
|
114 |
+
check_val_every_n_epoch: 1
|
115 |
+
num_sanity_val_steps: 8
|
116 |
+
replace_sampler_ddp: false
|
117 |
+
checkpoint_kwargs:
|
118 |
+
verbose: true
|
119 |
+
save_top_k: 5
|
120 |
+
save_last: true
|
121 |
+
period: 1
|
122 |
+
monitor: val_ssim_fid100_f1_total_mean
|
123 |
+
mode: max
|
lama-celeba-hq/lama_small_train_masks/models/best.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e84c94a80cdbd6fb1315dffbf418cd421fb2e4f16ee260bd6d455fa2ff1a1ef6
|
3 |
+
size 388009574
|
lama-pl-abl/aashukha_2021-08-16_21-52-12_train_ablv2_work_no_segmpl_csirpl_csirpl03_fixed/config.yaml
ADDED
@@ -0,0 +1,130 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
location:
|
2 |
+
data_root_dir: /home/${env:USER}/inpainting_data_root_final
|
3 |
+
out_root_dir: /home/${env:USER}/inpainting/experiments
|
4 |
+
tb_dir: /home/${env:USER}/inpainting/tb_logs
|
5 |
+
data:
|
6 |
+
batch_size: 10
|
7 |
+
val_batch_size: 2
|
8 |
+
num_workers: 3
|
9 |
+
train:
|
10 |
+
indir: ${location.data_root_dir}/train
|
11 |
+
out_size: 256
|
12 |
+
mask_gen_kwargs:
|
13 |
+
irregular_proba: 1
|
14 |
+
irregular_kwargs:
|
15 |
+
max_angle: 4
|
16 |
+
max_len: 200
|
17 |
+
max_width: 100
|
18 |
+
max_times: 5
|
19 |
+
min_times: 1
|
20 |
+
box_proba: 1
|
21 |
+
box_kwargs:
|
22 |
+
margin: 10
|
23 |
+
bbox_min_size: 30
|
24 |
+
bbox_max_size: 150
|
25 |
+
max_times: 4
|
26 |
+
min_times: 1
|
27 |
+
segm_proba: 0
|
28 |
+
transform_variant: distortions
|
29 |
+
dataloader_kwargs:
|
30 |
+
batch_size: ${data.batch_size}
|
31 |
+
shuffle: true
|
32 |
+
num_workers: ${data.num_workers}
|
33 |
+
val:
|
34 |
+
indir: ${location.data_root_dir}/val
|
35 |
+
img_suffix: .png
|
36 |
+
dataloader_kwargs:
|
37 |
+
batch_size: ${data.val_batch_size}
|
38 |
+
shuffle: false
|
39 |
+
num_workers: ${data.num_workers}
|
40 |
+
visual_test:
|
41 |
+
indir: ${location.data_root_dir}/korean_test
|
42 |
+
img_suffix: _input.png
|
43 |
+
pad_out_to_modulo: 32
|
44 |
+
dataloader_kwargs:
|
45 |
+
batch_size: 1
|
46 |
+
shuffle: false
|
47 |
+
num_workers: ${data.num_workers}
|
48 |
+
generator:
|
49 |
+
kind: pix2pixhd_global
|
50 |
+
input_nc: 4
|
51 |
+
output_nc: 3
|
52 |
+
ngf: 64
|
53 |
+
n_downsampling: 3
|
54 |
+
n_blocks: 9
|
55 |
+
conv_kind: default
|
56 |
+
add_out_act: sigmoid
|
57 |
+
discriminator:
|
58 |
+
kind: pix2pixhd_nlayer
|
59 |
+
input_nc: 3
|
60 |
+
ndf: 64
|
61 |
+
n_layers: 4
|
62 |
+
visualizer:
|
63 |
+
kind: directory
|
64 |
+
outdir: /home/${env:USER}/inpainting/experiments/aashukha_2021-08-16_21-52-12_train_ablv2_work_no_segmpl_csirpl_csirpl03_fixed/samples
|
65 |
+
key_order:
|
66 |
+
- image
|
67 |
+
- predicted_image
|
68 |
+
- discr_output_fake
|
69 |
+
- discr_output_real
|
70 |
+
- inpainted
|
71 |
+
rescale_keys:
|
72 |
+
- discr_output_fake
|
73 |
+
- discr_output_real
|
74 |
+
evaluator:
|
75 |
+
kind: default
|
76 |
+
inpainted_key: inpainted
|
77 |
+
integral_kind: ssim_fid100_f1
|
78 |
+
trainer:
|
79 |
+
kwargs:
|
80 |
+
gpus: -1
|
81 |
+
accelerator: ddp
|
82 |
+
max_epochs: 40
|
83 |
+
gradient_clip_val: 1
|
84 |
+
log_gpu_memory: None
|
85 |
+
limit_train_batches: 25000
|
86 |
+
val_check_interval: ${trainer.kwargs.limit_train_batches}
|
87 |
+
log_every_n_steps: 250
|
88 |
+
precision: 32
|
89 |
+
terminate_on_nan: false
|
90 |
+
check_val_every_n_epoch: 1
|
91 |
+
num_sanity_val_steps: 8
|
92 |
+
replace_sampler_ddp: false
|
93 |
+
checkpoint_kwargs:
|
94 |
+
verbose: true
|
95 |
+
save_top_k: 5
|
96 |
+
save_last: true
|
97 |
+
period: 1
|
98 |
+
monitor: val_ssim_fid100_f1_total_mean
|
99 |
+
mode: max
|
100 |
+
run_title: csirpl03_fixed
|
101 |
+
training_model:
|
102 |
+
kind: default
|
103 |
+
visualize_each_iters: 1000
|
104 |
+
concat_mask: true
|
105 |
+
store_discr_outputs_for_vis: true
|
106 |
+
losses:
|
107 |
+
l1:
|
108 |
+
weight_missing: 0
|
109 |
+
weight_known: 10
|
110 |
+
perceptual:
|
111 |
+
weight: 0
|
112 |
+
adversarial:
|
113 |
+
kind: r1
|
114 |
+
weight: 10
|
115 |
+
gp_coef: 0.001
|
116 |
+
mask_as_fake_target: true
|
117 |
+
allow_scale_mask: true
|
118 |
+
feature_matching:
|
119 |
+
weight: 100
|
120 |
+
segm_pl:
|
121 |
+
weight: 0.3
|
122 |
+
arch_encoder: resnet50
|
123 |
+
imagenet_weights: true
|
124 |
+
optimizers:
|
125 |
+
generator:
|
126 |
+
kind: adam
|
127 |
+
lr: 0.001
|
128 |
+
discriminator:
|
129 |
+
kind: adam
|
130 |
+
lr: 0.0001
|
lama-pl-abl/aashukha_2021-08-16_21-52-12_train_ablv2_work_no_segmpl_csirpl_csirpl03_fixed/models/best.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d5bcc70055960584b05717e0f4c4aa11fa2e17165f930d38966497a7829144c7
|
3 |
+
size 388032511
|
lama-pl-abl/e.logacheva_2021-10-04_00-15-00_train_ablv2_work_no_segmpl_csdilirpl_csdilirpl1_new/config.yaml
ADDED
@@ -0,0 +1,130 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
location:
|
2 |
+
data_root_dir: /group-volume/User-Driven-Content-Generation/datasets/inpainting_data_root_final
|
3 |
+
out_root_dir: /group-volume/User-Driven-Content-Generation/${env:USER}/inpainting/experiments
|
4 |
+
tb_dir: /group-volume/User-Driven-Content-Generation/${env:USER}/inpainting/tb_logs
|
5 |
+
data:
|
6 |
+
batch_size: 10
|
7 |
+
val_batch_size: 2
|
8 |
+
num_workers: 3
|
9 |
+
train:
|
10 |
+
indir: ${location.data_root_dir}/train
|
11 |
+
out_size: 256
|
12 |
+
mask_gen_kwargs:
|
13 |
+
irregular_proba: 1
|
14 |
+
irregular_kwargs:
|
15 |
+
max_angle: 4
|
16 |
+
max_len: 200
|
17 |
+
max_width: 100
|
18 |
+
max_times: 5
|
19 |
+
min_times: 1
|
20 |
+
box_proba: 1
|
21 |
+
box_kwargs:
|
22 |
+
margin: 10
|
23 |
+
bbox_min_size: 30
|
24 |
+
bbox_max_size: 150
|
25 |
+
max_times: 4
|
26 |
+
min_times: 1
|
27 |
+
segm_proba: 0
|
28 |
+
transform_variant: distortions
|
29 |
+
dataloader_kwargs:
|
30 |
+
batch_size: ${data.batch_size}
|
31 |
+
shuffle: true
|
32 |
+
num_workers: ${data.num_workers}
|
33 |
+
val:
|
34 |
+
indir: ${location.data_root_dir}/val
|
35 |
+
img_suffix: .png
|
36 |
+
dataloader_kwargs:
|
37 |
+
batch_size: ${data.val_batch_size}
|
38 |
+
shuffle: false
|
39 |
+
num_workers: ${data.num_workers}
|
40 |
+
visual_test:
|
41 |
+
indir: ${location.data_root_dir}/korean_test
|
42 |
+
img_suffix: _input.png
|
43 |
+
pad_out_to_modulo: 32
|
44 |
+
dataloader_kwargs:
|
45 |
+
batch_size: 1
|
46 |
+
shuffle: false
|
47 |
+
num_workers: ${data.num_workers}
|
48 |
+
generator:
|
49 |
+
kind: pix2pixhd_global
|
50 |
+
input_nc: 4
|
51 |
+
output_nc: 3
|
52 |
+
ngf: 64
|
53 |
+
n_downsampling: 3
|
54 |
+
n_blocks: 9
|
55 |
+
conv_kind: default
|
56 |
+
add_out_act: sigmoid
|
57 |
+
discriminator:
|
58 |
+
kind: pix2pixhd_nlayer
|
59 |
+
input_nc: 3
|
60 |
+
ndf: 64
|
61 |
+
n_layers: 4
|
62 |
+
visualizer:
|
63 |
+
kind: directory
|
64 |
+
outdir: /group-volume/User-Driven-Content-Generation/e.logacheva/inpainting/experiments/e.logacheva_2021-10-04_00-15-00_train_ablv2_work_no_segmpl_csdilirpl_csdilirpl1_new/samples
|
65 |
+
key_order:
|
66 |
+
- image
|
67 |
+
- predicted_image
|
68 |
+
- discr_output_fake
|
69 |
+
- discr_output_real
|
70 |
+
- inpainted
|
71 |
+
rescale_keys:
|
72 |
+
- discr_output_fake
|
73 |
+
- discr_output_real
|
74 |
+
evaluator:
|
75 |
+
kind: default
|
76 |
+
inpainted_key: inpainted
|
77 |
+
integral_kind: ssim_fid100_f1
|
78 |
+
trainer:
|
79 |
+
kwargs:
|
80 |
+
gpus: -1
|
81 |
+
accelerator: ddp
|
82 |
+
max_epochs: 40
|
83 |
+
gradient_clip_val: 1
|
84 |
+
log_gpu_memory: None
|
85 |
+
limit_train_batches: 25000
|
86 |
+
val_check_interval: ${trainer.kwargs.limit_train_batches}
|
87 |
+
log_every_n_steps: 250
|
88 |
+
precision: 32
|
89 |
+
terminate_on_nan: false
|
90 |
+
check_val_every_n_epoch: 1
|
91 |
+
num_sanity_val_steps: 8
|
92 |
+
replace_sampler_ddp: false
|
93 |
+
benchmark: true
|
94 |
+
checkpoint_kwargs:
|
95 |
+
verbose: true
|
96 |
+
save_top_k: 5
|
97 |
+
save_last: true
|
98 |
+
period: 1
|
99 |
+
monitor: val_ssim_fid100_f1_total_mean
|
100 |
+
mode: max
|
101 |
+
run_title: csdilirpl1_new
|
102 |
+
training_model:
|
103 |
+
kind: default
|
104 |
+
visualize_each_iters: 1000
|
105 |
+
concat_mask: true
|
106 |
+
store_discr_outputs_for_vis: true
|
107 |
+
losses:
|
108 |
+
l1:
|
109 |
+
weight_missing: 0
|
110 |
+
weight_known: 10
|
111 |
+
perceptual:
|
112 |
+
weight: 0
|
113 |
+
adversarial:
|
114 |
+
kind: r1
|
115 |
+
weight: 10
|
116 |
+
gp_coef: 0.001
|
117 |
+
mask_as_fake_target: true
|
118 |
+
allow_scale_mask: true
|
119 |
+
feature_matching:
|
120 |
+
weight: 100
|
121 |
+
segm_pl:
|
122 |
+
weight: 1
|
123 |
+
imagenet_weights: true
|
124 |
+
optimizers:
|
125 |
+
generator:
|
126 |
+
kind: adam
|
127 |
+
lr: 0.001
|
128 |
+
discriminator:
|
129 |
+
kind: adam
|
130 |
+
lr: 0.0001
|
lama-pl-abl/e.logacheva_2021-10-04_00-15-00_train_ablv2_work_no_segmpl_csdilirpl_csdilirpl1_new/models/best.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7e5f5fc644afefa2ecfddb232b1c397d87bd490fd34f1b2d94c8d44b94fad292
|
3 |
+
size 388032365
|
lama-pl-abl/e.logacheva_2021-10-04_00-15-00_train_ablv2_work_no_segmpl_vgg_l2_vgg003_new/config.yaml
ADDED
@@ -0,0 +1,130 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
location:
|
2 |
+
data_root_dir: /group-volume/User-Driven-Content-Generation/datasets/inpainting_data_root_final
|
3 |
+
out_root_dir: /group-volume/User-Driven-Content-Generation/${env:USER}/inpainting/experiments
|
4 |
+
tb_dir: /group-volume/User-Driven-Content-Generation/${env:USER}/inpainting/tb_logs
|
5 |
+
data:
|
6 |
+
batch_size: 10
|
7 |
+
val_batch_size: 2
|
8 |
+
num_workers: 3
|
9 |
+
train:
|
10 |
+
indir: ${location.data_root_dir}/train
|
11 |
+
out_size: 256
|
12 |
+
mask_gen_kwargs:
|
13 |
+
irregular_proba: 1
|
14 |
+
irregular_kwargs:
|
15 |
+
max_angle: 4
|
16 |
+
max_len: 200
|
17 |
+
max_width: 100
|
18 |
+
max_times: 5
|
19 |
+
min_times: 1
|
20 |
+
box_proba: 1
|
21 |
+
box_kwargs:
|
22 |
+
margin: 10
|
23 |
+
bbox_min_size: 30
|
24 |
+
bbox_max_size: 150
|
25 |
+
max_times: 4
|
26 |
+
min_times: 1
|
27 |
+
segm_proba: 0
|
28 |
+
transform_variant: distortions
|
29 |
+
dataloader_kwargs:
|
30 |
+
batch_size: ${data.batch_size}
|
31 |
+
shuffle: true
|
32 |
+
num_workers: ${data.num_workers}
|
33 |
+
val:
|
34 |
+
indir: ${location.data_root_dir}/val
|
35 |
+
img_suffix: .png
|
36 |
+
dataloader_kwargs:
|
37 |
+
batch_size: ${data.val_batch_size}
|
38 |
+
shuffle: false
|
39 |
+
num_workers: ${data.num_workers}
|
40 |
+
visual_test:
|
41 |
+
indir: ${location.data_root_dir}/korean_test
|
42 |
+
img_suffix: _input.png
|
43 |
+
pad_out_to_modulo: 32
|
44 |
+
dataloader_kwargs:
|
45 |
+
batch_size: 1
|
46 |
+
shuffle: false
|
47 |
+
num_workers: ${data.num_workers}
|
48 |
+
generator:
|
49 |
+
kind: pix2pixhd_global
|
50 |
+
input_nc: 4
|
51 |
+
output_nc: 3
|
52 |
+
ngf: 64
|
53 |
+
n_downsampling: 3
|
54 |
+
n_blocks: 9
|
55 |
+
conv_kind: default
|
56 |
+
add_out_act: sigmoid
|
57 |
+
discriminator:
|
58 |
+
kind: pix2pixhd_nlayer
|
59 |
+
input_nc: 3
|
60 |
+
ndf: 64
|
61 |
+
n_layers: 4
|
62 |
+
visualizer:
|
63 |
+
kind: directory
|
64 |
+
outdir: /group-volume/User-Driven-Content-Generation/e.logacheva/inpainting/experiments/e.logacheva_2021-10-04_00-15-00_train_ablv2_work_no_segmpl_vgg_l2_vgg003_new/samples
|
65 |
+
key_order:
|
66 |
+
- image
|
67 |
+
- predicted_image
|
68 |
+
- discr_output_fake
|
69 |
+
- discr_output_real
|
70 |
+
- inpainted
|
71 |
+
rescale_keys:
|
72 |
+
- discr_output_fake
|
73 |
+
- discr_output_real
|
74 |
+
evaluator:
|
75 |
+
kind: default
|
76 |
+
inpainted_key: inpainted
|
77 |
+
integral_kind: ssim_fid100_f1
|
78 |
+
trainer:
|
79 |
+
kwargs:
|
80 |
+
gpus: -1
|
81 |
+
accelerator: ddp
|
82 |
+
max_epochs: 40
|
83 |
+
gradient_clip_val: 1
|
84 |
+
log_gpu_memory: None
|
85 |
+
limit_train_batches: 25000
|
86 |
+
val_check_interval: ${trainer.kwargs.limit_train_batches}
|
87 |
+
log_every_n_steps: 250
|
88 |
+
precision: 32
|
89 |
+
terminate_on_nan: false
|
90 |
+
check_val_every_n_epoch: 1
|
91 |
+
num_sanity_val_steps: 8
|
92 |
+
replace_sampler_ddp: false
|
93 |
+
checkpoint_kwargs:
|
94 |
+
verbose: true
|
95 |
+
save_top_k: 5
|
96 |
+
save_last: true
|
97 |
+
period: 1
|
98 |
+
monitor: val_ssim_fid100_f1_total_mean
|
99 |
+
mode: max
|
100 |
+
run_title: l2_vgg003_new
|
101 |
+
training_model:
|
102 |
+
kind: default
|
103 |
+
visualize_each_iters: 1000
|
104 |
+
concat_mask: true
|
105 |
+
store_discr_outputs_for_vis: true
|
106 |
+
losses:
|
107 |
+
l1:
|
108 |
+
weight_missing: 0
|
109 |
+
weight_known: 10
|
110 |
+
perceptual:
|
111 |
+
weight: 0.03
|
112 |
+
kwargs:
|
113 |
+
metric: l2
|
114 |
+
adversarial:
|
115 |
+
kind: r1
|
116 |
+
weight: 10
|
117 |
+
gp_coef: 0.001
|
118 |
+
mask_as_fake_target: true
|
119 |
+
allow_scale_mask: true
|
120 |
+
feature_matching:
|
121 |
+
weight: 100
|
122 |
+
segm_pl:
|
123 |
+
weight: 0
|
124 |
+
optimizers:
|
125 |
+
generator:
|
126 |
+
kind: adam
|
127 |
+
lr: 0.001
|
128 |
+
discriminator:
|
129 |
+
kind: adam
|
130 |
+
lr: 0.0001
|
lama-pl-abl/e.logacheva_2021-10-04_00-15-00_train_ablv2_work_no_segmpl_vgg_l2_vgg003_new/models/best.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e66fd161b99155ae00b001ba3d727d2b468805529852f6f798ae348f1b2fb9e1
|
3 |
+
size 388025416
|
lama-places/big-lama-regular/config.yaml
ADDED
@@ -0,0 +1,129 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
location:
|
2 |
+
data_root_dir: /group-volume/User-Driven-Content-Generation/datasets/inpainting_data_root_final
|
3 |
+
out_root_dir: /group-volume/User-Driven-Content-Generation/${env:USER}/inpainting/experiments
|
4 |
+
tb_dir: /group-volume/User-Driven-Content-Generation/${env:USER}/inpainting/tb_logs
|
5 |
+
data:
|
6 |
+
batch_size: 5
|
7 |
+
val_batch_size: 2
|
8 |
+
num_workers: 3
|
9 |
+
train:
|
10 |
+
indir: ${location.data_root_dir}/train
|
11 |
+
out_size: 256
|
12 |
+
mask_gen_kwargs:
|
13 |
+
irregular_proba: 1
|
14 |
+
irregular_kwargs:
|
15 |
+
max_angle: 4
|
16 |
+
max_len: 200
|
17 |
+
max_width: 100
|
18 |
+
max_times: 5
|
19 |
+
min_times: 1
|
20 |
+
box_proba: 1
|
21 |
+
box_kwargs:
|
22 |
+
margin: 10
|
23 |
+
bbox_min_size: 30
|
24 |
+
bbox_max_size: 150
|
25 |
+
max_times: 4
|
26 |
+
min_times: 1
|
27 |
+
segm_proba: 0
|
28 |
+
transform_variant: distortions
|
29 |
+
dataloader_kwargs:
|
30 |
+
batch_size: ${data.batch_size}
|
31 |
+
shuffle: true
|
32 |
+
num_workers: ${data.num_workers}
|
33 |
+
val:
|
34 |
+
indir: ${location.data_root_dir}/val
|
35 |
+
img_suffix: .png
|
36 |
+
dataloader_kwargs:
|
37 |
+
batch_size: ${data.val_batch_size}
|
38 |
+
shuffle: false
|
39 |
+
num_workers: ${data.num_workers}
|
40 |
+
visual_test:
|
41 |
+
indir: ${location.data_root_dir}/korean_test
|
42 |
+
img_suffix: _input.png
|
43 |
+
pad_out_to_modulo: 32
|
44 |
+
dataloader_kwargs:
|
45 |
+
batch_size: 1
|
46 |
+
shuffle: false
|
47 |
+
num_workers: ${data.num_workers}
|
48 |
+
generator:
|
49 |
+
kind: pix2pixhd_global
|
50 |
+
input_nc: 4
|
51 |
+
output_nc: 3
|
52 |
+
ngf: 64
|
53 |
+
n_downsampling: 3
|
54 |
+
n_blocks: 15
|
55 |
+
conv_kind: default
|
56 |
+
add_out_act: sigmoid
|
57 |
+
discriminator:
|
58 |
+
kind: pix2pixhd_nlayer
|
59 |
+
input_nc: 3
|
60 |
+
ndf: 64
|
61 |
+
n_layers: 4
|
62 |
+
visualizer:
|
63 |
+
kind: directory
|
64 |
+
outdir: /group-volume/User-Driven-Content-Generation/r.suvorov/inpainting/experiments/r.suvorov_2021-06-11_13-21-15_train_ablv2_work_rebuttal-b15/samples
|
65 |
+
key_order:
|
66 |
+
- image
|
67 |
+
- predicted_image
|
68 |
+
- discr_output_fake
|
69 |
+
- discr_output_real
|
70 |
+
- inpainted
|
71 |
+
rescale_keys:
|
72 |
+
- discr_output_fake
|
73 |
+
- discr_output_real
|
74 |
+
evaluator:
|
75 |
+
kind: default
|
76 |
+
inpainted_key: inpainted
|
77 |
+
integral_kind: ssim_fid100_f1
|
78 |
+
trainer:
|
79 |
+
kwargs:
|
80 |
+
gpus: -1
|
81 |
+
accelerator: ddp
|
82 |
+
max_epochs: 40
|
83 |
+
gradient_clip_val: 1
|
84 |
+
log_gpu_memory: None
|
85 |
+
limit_train_batches: 25000
|
86 |
+
val_check_interval: ${trainer.kwargs.limit_train_batches}
|
87 |
+
log_every_n_steps: 250
|
88 |
+
precision: 32
|
89 |
+
terminate_on_nan: false
|
90 |
+
check_val_every_n_epoch: 1
|
91 |
+
num_sanity_val_steps: 8
|
92 |
+
replace_sampler_ddp: false
|
93 |
+
checkpoint_kwargs:
|
94 |
+
verbose: true
|
95 |
+
save_top_k: 5
|
96 |
+
save_last: true
|
97 |
+
period: 1
|
98 |
+
monitor: val_ssim_fid100_f1_total_mean
|
99 |
+
mode: max
|
100 |
+
run_title: rebuttal-b15
|
101 |
+
training_model:
|
102 |
+
kind: default
|
103 |
+
visualize_each_iters: 1000
|
104 |
+
concat_mask: true
|
105 |
+
store_discr_outputs_for_vis: true
|
106 |
+
losses:
|
107 |
+
l1:
|
108 |
+
weight_missing: 0
|
109 |
+
weight_known: 10
|
110 |
+
perceptual:
|
111 |
+
weight: 0
|
112 |
+
adversarial:
|
113 |
+
kind: r1
|
114 |
+
weight: 10
|
115 |
+
gp_coef: 0.001
|
116 |
+
mask_as_fake_target: true
|
117 |
+
allow_scale_mask: true
|
118 |
+
feature_matching:
|
119 |
+
weight: 100
|
120 |
+
resnet_pl:
|
121 |
+
weight: 30
|
122 |
+
weights_path: ${env:TORCH_HOME}
|
123 |
+
optimizers:
|
124 |
+
generator:
|
125 |
+
kind: adam
|
126 |
+
lr: 0.001
|
127 |
+
discriminator:
|
128 |
+
kind: adam
|
129 |
+
lr: 0.0001
|
lama-places/big-lama-regular/models/best.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:40886923da4741b8c5fa25264371c0fca6ebc1b680e4744ae94714f2c26a8e11
|
3 |
+
size 501445597
|
lama-places/lama-dilated/config.yaml
ADDED
@@ -0,0 +1,133 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
location:
|
2 |
+
data_root_dir: /group-volume/User-Driven-Content-Generation/datasets/inpainting_data_root_final
|
3 |
+
out_root_dir: /group-volume/User-Driven-Content-Generation/${env:USER}/inpainting/experiments
|
4 |
+
tb_dir: /group-volume/User-Driven-Content-Generation/${env:USER}/inpainting/tb_logs
|
5 |
+
data:
|
6 |
+
batch_size: 10
|
7 |
+
val_batch_size: 2
|
8 |
+
num_workers: 3
|
9 |
+
train:
|
10 |
+
indir: ${location.data_root_dir}/train
|
11 |
+
out_size: 256
|
12 |
+
mask_gen_kwargs:
|
13 |
+
irregular_proba: 1
|
14 |
+
irregular_kwargs:
|
15 |
+
max_angle: 4
|
16 |
+
max_len: 200
|
17 |
+
max_width: 100
|
18 |
+
max_times: 5
|
19 |
+
min_times: 1
|
20 |
+
box_proba: 1
|
21 |
+
box_kwargs:
|
22 |
+
margin: 10
|
23 |
+
bbox_min_size: 30
|
24 |
+
bbox_max_size: 150
|
25 |
+
max_times: 4
|
26 |
+
min_times: 1
|
27 |
+
segm_proba: 0
|
28 |
+
transform_variant: distortions
|
29 |
+
dataloader_kwargs:
|
30 |
+
batch_size: ${data.batch_size}
|
31 |
+
shuffle: true
|
32 |
+
num_workers: ${data.num_workers}
|
33 |
+
val:
|
34 |
+
indir: ${location.data_root_dir}/val
|
35 |
+
img_suffix: .png
|
36 |
+
dataloader_kwargs:
|
37 |
+
batch_size: ${data.val_batch_size}
|
38 |
+
shuffle: false
|
39 |
+
num_workers: ${data.num_workers}
|
40 |
+
visual_test:
|
41 |
+
indir: ${location.data_root_dir}/korean_test
|
42 |
+
img_suffix: _input.png
|
43 |
+
pad_out_to_modulo: 32
|
44 |
+
dataloader_kwargs:
|
45 |
+
batch_size: 1
|
46 |
+
shuffle: false
|
47 |
+
num_workers: ${data.num_workers}
|
48 |
+
generator:
|
49 |
+
kind: pix2pixhd_multidilated
|
50 |
+
input_nc: 4
|
51 |
+
output_nc: 3
|
52 |
+
ngf: 64
|
53 |
+
n_downsampling: 3
|
54 |
+
n_blocks: 9
|
55 |
+
conv_kind: default
|
56 |
+
add_out_act: sigmoid
|
57 |
+
multidilation_kwargs:
|
58 |
+
comb_mode: cat_in
|
59 |
+
dilation_num: 4
|
60 |
+
discriminator:
|
61 |
+
kind: pix2pixhd_nlayer
|
62 |
+
input_nc: 3
|
63 |
+
ndf: 64
|
64 |
+
n_layers: 4
|
65 |
+
visualizer:
|
66 |
+
kind: directory
|
67 |
+
outdir: /group-volume/User-Driven-Content-Generation/e.logacheva/inpainting/experiments/e.logacheva_2021-09-23_11-53-00_train_ablv2_work_md_new/samples
|
68 |
+
key_order:
|
69 |
+
- image
|
70 |
+
- predicted_image
|
71 |
+
- discr_output_fake
|
72 |
+
- discr_output_real
|
73 |
+
- inpainted
|
74 |
+
rescale_keys:
|
75 |
+
- discr_output_fake
|
76 |
+
- discr_output_real
|
77 |
+
evaluator:
|
78 |
+
kind: default
|
79 |
+
inpainted_key: inpainted
|
80 |
+
integral_kind: ssim_fid100_f1
|
81 |
+
trainer:
|
82 |
+
kwargs:
|
83 |
+
gpus: -1
|
84 |
+
accelerator: ddp
|
85 |
+
max_epochs: 40
|
86 |
+
gradient_clip_val: 1
|
87 |
+
log_gpu_memory: None
|
88 |
+
limit_train_batches: 25000
|
89 |
+
val_check_interval: ${trainer.kwargs.limit_train_batches}
|
90 |
+
log_every_n_steps: 250
|
91 |
+
precision: 32
|
92 |
+
terminate_on_nan: false
|
93 |
+
check_val_every_n_epoch: 1
|
94 |
+
num_sanity_val_steps: 8
|
95 |
+
replace_sampler_ddp: false
|
96 |
+
benchmark: true
|
97 |
+
checkpoint_kwargs:
|
98 |
+
verbose: true
|
99 |
+
save_top_k: 5
|
100 |
+
save_last: true
|
101 |
+
period: 1
|
102 |
+
monitor: val_ssim_fid100_f1_total_mean
|
103 |
+
mode: max
|
104 |
+
run_title: new
|
105 |
+
training_model:
|
106 |
+
kind: default
|
107 |
+
visualize_each_iters: 1000
|
108 |
+
concat_mask: true
|
109 |
+
store_discr_outputs_for_vis: true
|
110 |
+
losses:
|
111 |
+
l1:
|
112 |
+
weight_missing: 0
|
113 |
+
weight_known: 10
|
114 |
+
perceptual:
|
115 |
+
weight: 0
|
116 |
+
adversarial:
|
117 |
+
kind: r1
|
118 |
+
weight: 10
|
119 |
+
gp_coef: 0.001
|
120 |
+
mask_as_fake_target: true
|
121 |
+
allow_scale_mask: true
|
122 |
+
feature_matching:
|
123 |
+
weight: 100
|
124 |
+
segm_pl:
|
125 |
+
weight: 30
|
126 |
+
weights_path: ${env:TORCH_HOME}
|
127 |
+
optimizers:
|
128 |
+
generator:
|
129 |
+
kind: adam
|
130 |
+
lr: 0.001
|
131 |
+
discriminator:
|
132 |
+
kind: adam
|
133 |
+
lr: 0.0001
|
lama-places/lama-dilated/models/best.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e09dfa9ab3c74149a4ee5db115f23904acc6349f55f16972d11aea903c9496a0
|
3 |
+
size 388184818
|
lama-places/lama-fourier/config.yaml
ADDED
@@ -0,0 +1,142 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
run_title: resume
|
2 |
+
training_model:
|
3 |
+
kind: default
|
4 |
+
visualize_each_iters: 1000
|
5 |
+
concat_mask: true
|
6 |
+
store_discr_outputs_for_vis: true
|
7 |
+
losses:
|
8 |
+
l1:
|
9 |
+
weight_missing: 0
|
10 |
+
weight_known: 10
|
11 |
+
perceptual:
|
12 |
+
weight: 0
|
13 |
+
adversarial:
|
14 |
+
kind: r1
|
15 |
+
weight: 10
|
16 |
+
gp_coef: 0.001
|
17 |
+
mask_as_fake_target: true
|
18 |
+
allow_scale_mask: true
|
19 |
+
feature_matching:
|
20 |
+
weight: 100
|
21 |
+
resnet_pl:
|
22 |
+
weight: 30
|
23 |
+
weights_path: ${env:TORCH_HOME}
|
24 |
+
optimizers:
|
25 |
+
generator:
|
26 |
+
kind: adam
|
27 |
+
lr: 0.001
|
28 |
+
discriminator:
|
29 |
+
kind: adam
|
30 |
+
lr: 0.0001
|
31 |
+
visualizer:
|
32 |
+
key_order:
|
33 |
+
- image
|
34 |
+
- predicted_image
|
35 |
+
- discr_output_fake
|
36 |
+
- discr_output_real
|
37 |
+
- inpainted
|
38 |
+
rescale_keys:
|
39 |
+
- discr_output_fake
|
40 |
+
- discr_output_real
|
41 |
+
kind: directory
|
42 |
+
outdir: dummy_lol
|
43 |
+
|
44 |
+
location:
|
45 |
+
data_root_dir: /group-volume/User-Driven-Content-Generation/datasets/inpainting_data_root_final
|
46 |
+
out_root_dir: /group-volume/User-Driven-Content-Generation/${env:USER}/inpainting/experiments
|
47 |
+
tb_dir: /group-volume/User-Driven-Content-Generation/${env:USER}/inpainting/tb_logs
|
48 |
+
data:
|
49 |
+
batch_size: 10
|
50 |
+
val_batch_size: 2
|
51 |
+
num_workers: 3
|
52 |
+
train:
|
53 |
+
indir: ${location.data_root_dir}/train
|
54 |
+
out_size: 256
|
55 |
+
mask_gen_kwargs:
|
56 |
+
irregular_proba: 1
|
57 |
+
irregular_kwargs:
|
58 |
+
max_angle: 4
|
59 |
+
max_len: 200
|
60 |
+
max_width: 100
|
61 |
+
max_times: 5
|
62 |
+
min_times: 1
|
63 |
+
box_proba: 1
|
64 |
+
box_kwargs:
|
65 |
+
margin: 10
|
66 |
+
bbox_min_size: 30
|
67 |
+
bbox_max_size: 150
|
68 |
+
max_times: 4
|
69 |
+
min_times: 1
|
70 |
+
segm_proba: 0
|
71 |
+
transform_variant: distortions
|
72 |
+
dataloader_kwargs:
|
73 |
+
batch_size: ${data.batch_size}
|
74 |
+
shuffle: true
|
75 |
+
num_workers: ${data.num_workers}
|
76 |
+
val:
|
77 |
+
indir: ${location.data_root_dir}/val
|
78 |
+
img_suffix: .png
|
79 |
+
dataloader_kwargs:
|
80 |
+
batch_size: ${data.val_batch_size}
|
81 |
+
shuffle: false
|
82 |
+
num_workers: ${data.num_workers}
|
83 |
+
visual_test:
|
84 |
+
indir: ${location.data_root_dir}/korean_test
|
85 |
+
img_suffix: _input.png
|
86 |
+
pad_out_to_modulo: 32
|
87 |
+
dataloader_kwargs:
|
88 |
+
batch_size: 1
|
89 |
+
shuffle: false
|
90 |
+
num_workers: ${data.num_workers}
|
91 |
+
generator:
|
92 |
+
kind: ffc_resnet
|
93 |
+
input_nc: 4
|
94 |
+
output_nc: 3
|
95 |
+
ngf: 64
|
96 |
+
n_downsampling: 3
|
97 |
+
n_blocks: 9
|
98 |
+
add_out_act: sigmoid
|
99 |
+
init_conv_kwargs:
|
100 |
+
ratio_gin: 0
|
101 |
+
ratio_gout: 0
|
102 |
+
enable_lfu: false
|
103 |
+
downsample_conv_kwargs:
|
104 |
+
ratio_gin: ${generator.init_conv_kwargs.ratio_gout}
|
105 |
+
ratio_gout: ${generator.downsample_conv_kwargs.ratio_gin}
|
106 |
+
enable_lfu: false
|
107 |
+
resnet_conv_kwargs:
|
108 |
+
ratio_gin: 0.75
|
109 |
+
ratio_gout: ${generator.resnet_conv_kwargs.ratio_gin}
|
110 |
+
enable_lfu: false
|
111 |
+
discriminator:
|
112 |
+
kind: pix2pixhd_nlayer
|
113 |
+
input_nc: 3
|
114 |
+
ndf: 64
|
115 |
+
n_layers: 4
|
116 |
+
evaluator:
|
117 |
+
kind: default
|
118 |
+
inpainted_key: inpainted
|
119 |
+
integral_kind: ssim_fid100_f1
|
120 |
+
trainer:
|
121 |
+
kwargs:
|
122 |
+
gpus: -1
|
123 |
+
distributed_backend: ddp
|
124 |
+
max_epochs: 40
|
125 |
+
gradient_clip_val: 1
|
126 |
+
log_gpu_memory: None
|
127 |
+
limit_train_batches: 25000
|
128 |
+
val_check_interval: ${trainer.kwargs.limit_train_batches}
|
129 |
+
log_save_interval: 250
|
130 |
+
precision: 32
|
131 |
+
terminate_on_nan: false
|
132 |
+
check_val_every_n_epoch: 1
|
133 |
+
num_sanity_val_steps: 8
|
134 |
+
replace_sampler_ddp: false
|
135 |
+
resume_from_checkpoint: /group-volume/User-Driven-Content-Generation/r.suvorov/inpainting/experiments/r.suvorov_2021-03-04_13-48-33_train_ablv2_work_ffc075_/models/last.ckpt
|
136 |
+
checkpoint_kwargs:
|
137 |
+
verbose: true
|
138 |
+
save_top_k: 5
|
139 |
+
save_last: true
|
140 |
+
period: 1
|
141 |
+
monitor: val_ssim_fid100_f1_total_mean
|
142 |
+
mode: max
|
lama-places/lama-fourier/models/best.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b2456284b604786a88a38549432ddf2e73a5911f9868ea692b5122e89a5f1f54
|
3 |
+
size 313967681
|
lama-places/lama-fourier/models/last.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b2456284b604786a88a38549432ddf2e73a5911f9868ea692b5122e89a5f1f54
|
3 |
+
size 313967681
|
lama-places/lama-regular/config.yaml
ADDED
@@ -0,0 +1,130 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
run_title: resume
|
2 |
+
training_model:
|
3 |
+
kind: default
|
4 |
+
visualize_each_iters: 1000
|
5 |
+
concat_mask: true
|
6 |
+
store_discr_outputs_for_vis: true
|
7 |
+
losses:
|
8 |
+
l1:
|
9 |
+
weight_missing: 0
|
10 |
+
weight_known: 10
|
11 |
+
perceptual:
|
12 |
+
weight: 0
|
13 |
+
adversarial:
|
14 |
+
kind: r1
|
15 |
+
weight: 10
|
16 |
+
gp_coef: 0.001
|
17 |
+
mask_as_fake_target: true
|
18 |
+
allow_scale_mask: true
|
19 |
+
feature_matching:
|
20 |
+
weight: 100
|
21 |
+
resnet_pl:
|
22 |
+
weight: 30
|
23 |
+
weights_path: ${env:TORCH_HOME}
|
24 |
+
optimizers:
|
25 |
+
generator:
|
26 |
+
kind: adam
|
27 |
+
lr: 0.001
|
28 |
+
discriminator:
|
29 |
+
kind: adam
|
30 |
+
lr: 0.0001
|
31 |
+
visualizer:
|
32 |
+
key_order:
|
33 |
+
- image
|
34 |
+
- predicted_image
|
35 |
+
- discr_output_fake
|
36 |
+
- discr_output_real
|
37 |
+
- inpainted
|
38 |
+
rescale_keys:
|
39 |
+
- discr_output_fake
|
40 |
+
- discr_output_real
|
41 |
+
kind: directory
|
42 |
+
outdir: /group-volume/User-Driven-Content-Generation/r.suvorov/inpainting/experiments/r.suvorov_2021-03-05_17-08-35_train_ablv2_work_resume/samples
|
43 |
+
location:
|
44 |
+
data_root_dir: /group-volume/User-Driven-Content-Generation/datasets/inpainting_data_root_final
|
45 |
+
out_root_dir: /group-volume/User-Driven-Content-Generation/${env:USER}/inpainting/experiments
|
46 |
+
tb_dir: /group-volume/User-Driven-Content-Generation/${env:USER}/inpainting/tb_logs
|
47 |
+
data:
|
48 |
+
batch_size: 10
|
49 |
+
val_batch_size: 2
|
50 |
+
num_workers: 3
|
51 |
+
train:
|
52 |
+
indir: ${location.data_root_dir}/train
|
53 |
+
out_size: 256
|
54 |
+
mask_gen_kwargs:
|
55 |
+
irregular_proba: 1
|
56 |
+
irregular_kwargs:
|
57 |
+
max_angle: 4
|
58 |
+
max_len: 200
|
59 |
+
max_width: 100
|
60 |
+
max_times: 5
|
61 |
+
min_times: 1
|
62 |
+
box_proba: 1
|
63 |
+
box_kwargs:
|
64 |
+
margin: 10
|
65 |
+
bbox_min_size: 30
|
66 |
+
bbox_max_size: 150
|
67 |
+
max_times: 4
|
68 |
+
min_times: 1
|
69 |
+
segm_proba: 0
|
70 |
+
transform_variant: distortions
|
71 |
+
dataloader_kwargs:
|
72 |
+
batch_size: ${data.batch_size}
|
73 |
+
shuffle: true
|
74 |
+
num_workers: ${data.num_workers}
|
75 |
+
val:
|
76 |
+
indir: ${location.data_root_dir}/val
|
77 |
+
img_suffix: .png
|
78 |
+
dataloader_kwargs:
|
79 |
+
batch_size: ${data.val_batch_size}
|
80 |
+
shuffle: false
|
81 |
+
num_workers: ${data.num_workers}
|
82 |
+
visual_test:
|
83 |
+
indir: ${location.data_root_dir}/korean_test
|
84 |
+
img_suffix: _input.png
|
85 |
+
pad_out_to_modulo: 32
|
86 |
+
dataloader_kwargs:
|
87 |
+
batch_size: 1
|
88 |
+
shuffle: false
|
89 |
+
num_workers: ${data.num_workers}
|
90 |
+
generator:
|
91 |
+
kind: pix2pixhd_global
|
92 |
+
input_nc: 4
|
93 |
+
output_nc: 3
|
94 |
+
ngf: 64
|
95 |
+
n_downsampling: 3
|
96 |
+
n_blocks: 9
|
97 |
+
conv_kind: default
|
98 |
+
add_out_act: sigmoid
|
99 |
+
discriminator:
|
100 |
+
kind: pix2pixhd_nlayer
|
101 |
+
input_nc: 3
|
102 |
+
ndf: 64
|
103 |
+
n_layers: 4
|
104 |
+
evaluator:
|
105 |
+
kind: default
|
106 |
+
inpainted_key: inpainted
|
107 |
+
integral_kind: ssim_fid100_f1
|
108 |
+
trainer:
|
109 |
+
kwargs:
|
110 |
+
gpus: -1
|
111 |
+
distributed_backend: ddp
|
112 |
+
max_epochs: 40
|
113 |
+
gradient_clip_val: 1
|
114 |
+
log_gpu_memory: None
|
115 |
+
limit_train_batches: 25000
|
116 |
+
val_check_interval: ${trainer.kwargs.limit_train_batches}
|
117 |
+
log_save_interval: 250
|
118 |
+
precision: 32
|
119 |
+
terminate_on_nan: false
|
120 |
+
check_val_every_n_epoch: 1
|
121 |
+
num_sanity_val_steps: 8
|
122 |
+
replace_sampler_ddp: false
|
123 |
+
resume_from_checkpoint: /group-volume/User-Driven-Content-Generation/r.suvorov/inpainting/experiments/r.suvorov_2021-03-04_13-44-49_train_ablv2_work_/models/last.ckpt
|
124 |
+
checkpoint_kwargs:
|
125 |
+
verbose: true
|
126 |
+
save_top_k: 5
|
127 |
+
save_last: true
|
128 |
+
period: 1
|
129 |
+
monitor: val_ssim_fid100_f1_total_mean
|
130 |
+
mode: max
|
lama-places/lama-regular/models/best.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:acb3a3693e0c0f363d4ee1a0d22aeb1dd7dcda6c84cb442d8d479131ff0b14b5
|
3 |
+
size 388021609
|
lama-places/lama_small_train_masks/config.yaml
ADDED
@@ -0,0 +1,130 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
run_title: resume
|
2 |
+
training_model:
|
3 |
+
kind: default
|
4 |
+
visualize_each_iters: 1000
|
5 |
+
concat_mask: true
|
6 |
+
store_discr_outputs_for_vis: true
|
7 |
+
losses:
|
8 |
+
l1:
|
9 |
+
weight_missing: 0
|
10 |
+
weight_known: 10
|
11 |
+
perceptual:
|
12 |
+
weight: 0
|
13 |
+
adversarial:
|
14 |
+
kind: r1
|
15 |
+
weight: 10
|
16 |
+
gp_coef: 0.001
|
17 |
+
mask_as_fake_target: true
|
18 |
+
allow_scale_mask: true
|
19 |
+
feature_matching:
|
20 |
+
weight: 100
|
21 |
+
resnet_pl:
|
22 |
+
weight: 30
|
23 |
+
weights_path: ${env:TORCH_HOME}
|
24 |
+
optimizers:
|
25 |
+
generator:
|
26 |
+
kind: adam
|
27 |
+
lr: 0.001
|
28 |
+
discriminator:
|
29 |
+
kind: adam
|
30 |
+
lr: 0.0001
|
31 |
+
visualizer:
|
32 |
+
key_order:
|
33 |
+
- image
|
34 |
+
- predicted_image
|
35 |
+
- discr_output_fake
|
36 |
+
- discr_output_real
|
37 |
+
- inpainted
|
38 |
+
rescale_keys:
|
39 |
+
- discr_output_fake
|
40 |
+
- discr_output_real
|
41 |
+
kind: directory
|
42 |
+
outdir: /group-volume/User-Driven-Content-Generation/r.suvorov/inpainting/experiments/r.suvorov_2021-03-05_17-04-06_train_ablv2_work_small_holes_resume/samples
|
43 |
+
location:
|
44 |
+
data_root_dir: /group-volume/User-Driven-Content-Generation/datasets/inpainting_data_root_final
|
45 |
+
out_root_dir: /group-volume/User-Driven-Content-Generation/${env:USER}/inpainting/experiments
|
46 |
+
tb_dir: /group-volume/User-Driven-Content-Generation/${env:USER}/inpainting/tb_logs
|
47 |
+
data:
|
48 |
+
batch_size: 10
|
49 |
+
val_batch_size: 2
|
50 |
+
num_workers: 3
|
51 |
+
train:
|
52 |
+
indir: ${location.data_root_dir}/train
|
53 |
+
out_size: 256
|
54 |
+
mask_gen_kwargs:
|
55 |
+
irregular_proba: 1
|
56 |
+
irregular_kwargs:
|
57 |
+
max_angle: 4
|
58 |
+
max_len: 80
|
59 |
+
max_width: 40
|
60 |
+
max_times: 12
|
61 |
+
min_times: 4
|
62 |
+
box_proba: 1
|
63 |
+
box_kwargs:
|
64 |
+
margin: 0
|
65 |
+
bbox_min_size: 30
|
66 |
+
bbox_max_size: 128
|
67 |
+
max_times: 1
|
68 |
+
min_times: 1
|
69 |
+
segm_proba: 0
|
70 |
+
transform_variant: default
|
71 |
+
dataloader_kwargs:
|
72 |
+
batch_size: ${data.batch_size}
|
73 |
+
shuffle: true
|
74 |
+
num_workers: ${data.num_workers}
|
75 |
+
val:
|
76 |
+
indir: ${location.data_root_dir}/val
|
77 |
+
img_suffix: .png
|
78 |
+
dataloader_kwargs:
|
79 |
+
batch_size: ${data.val_batch_size}
|
80 |
+
shuffle: false
|
81 |
+
num_workers: ${data.num_workers}
|
82 |
+
visual_test:
|
83 |
+
indir: ${location.data_root_dir}/korean_test
|
84 |
+
img_suffix: _input.png
|
85 |
+
pad_out_to_modulo: 32
|
86 |
+
dataloader_kwargs:
|
87 |
+
batch_size: 1
|
88 |
+
shuffle: false
|
89 |
+
num_workers: ${data.num_workers}
|
90 |
+
generator:
|
91 |
+
kind: pix2pixhd_global
|
92 |
+
input_nc: 4
|
93 |
+
output_nc: 3
|
94 |
+
ngf: 64
|
95 |
+
n_downsampling: 3
|
96 |
+
n_blocks: 9
|
97 |
+
conv_kind: default
|
98 |
+
add_out_act: sigmoid
|
99 |
+
discriminator:
|
100 |
+
kind: pix2pixhd_nlayer
|
101 |
+
input_nc: 3
|
102 |
+
ndf: 64
|
103 |
+
n_layers: 4
|
104 |
+
evaluator:
|
105 |
+
kind: default
|
106 |
+
inpainted_key: inpainted
|
107 |
+
integral_kind: ssim_fid100_f1
|
108 |
+
trainer:
|
109 |
+
kwargs:
|
110 |
+
gpus: -1
|
111 |
+
distributed_backend: ddp
|
112 |
+
max_epochs: 40
|
113 |
+
gradient_clip_val: 1
|
114 |
+
log_gpu_memory: None
|
115 |
+
limit_train_batches: 25000
|
116 |
+
val_check_interval: ${trainer.kwargs.limit_train_batches}
|
117 |
+
log_save_interval: 250
|
118 |
+
precision: 32
|
119 |
+
terminate_on_nan: false
|
120 |
+
check_val_every_n_epoch: 1
|
121 |
+
num_sanity_val_steps: 8
|
122 |
+
replace_sampler_ddp: false
|
123 |
+
resume_from_checkpoint: /group-volume/User-Driven-Content-Generation/r.suvorov/inpainting/experiments/r.suvorov_2021-03-04_15-09-38_train_ablv2_work_small_holes_/models/last.ckpt
|
124 |
+
checkpoint_kwargs:
|
125 |
+
verbose: true
|
126 |
+
save_top_k: 5
|
127 |
+
save_last: true
|
128 |
+
period: 1
|
129 |
+
monitor: val_ssim_fid100_f1_total_mean
|
130 |
+
mode: max
|
lama-places/lama_small_train_masks/models/best.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6423c4d504c5f135557b316ee6574983424a6078d591d332c97d243f46195e20
|
3 |
+
size 388021609
|