# face-inpainting / config.yaml
# Author: givkashi
# Commit: 48997cb (verified) - "Update config.yaml"
# Filesystem locations. Other sections refer to these values through
# ${location.*} interpolations.
location:
  # Root directory under which the train/val image folders are resolved.
  data_root_dir: /group-volume/User-Driven-Content-Generation/datasets/inpainting_data_root_large
  # Per-user output locations; ${env:USER} interpolates an environment
  # variable. NOTE(review): the resolver spelling depends on the OmegaConf
  # version in use - confirm it still resolves.
  out_root_dir: /group-volume/User-Driven-Content-Generation/${env:USER}/inpainting/experiments
  tb_dir: /group-volume/User-Driven-Content-Generation/${env:USER}/inpainting/tb_logs
  # Points at the same directory as data_root_dir.
  pretrained_models: ${location.data_root_dir}
# Dataset and dataloader settings for the training and validation splits.
data:
  # Shared values, referenced below via ${data.*} interpolations.
  batch_size: 25
  val_batch_size: 40
  num_workers: 4
  train:
    indir: ${location.data_root_dir}/train_256
    out_size: 256
    # Mask generation settings: irregular and box masks both have
    # probability 1, segmentation-based masks have probability 0.
    mask_gen_kwargs:
      irregular_proba: 1
      irregular_kwargs:
        max_angle: 4
        max_len: 200
        max_width: 100
        max_times: 5
        min_times: 1
      box_proba: 1
      box_kwargs:
        margin: 10
        bbox_min_size: 30
        bbox_max_size: 150
        max_times: 4
        min_times: 1
      segm_proba: 0
    transform_variant: no_augs
    dataloader_kwargs:
      batch_size: ${data.batch_size}
      shuffle: true
      num_workers: ${data.num_workers}
  val:
    indir: ${location.data_root_dir}/val_256
    img_suffix: .png
    dataloader_kwargs:
      batch_size: ${data.val_batch_size}
      shuffle: false
      num_workers: ${data.num_workers}
  # No separate visual-test dataset is configured.
  visual_test: null
# Generator network selection. Only the architecture kind is set here.
generator:
  kind: Swin_UNET
# Discriminator network selection and its constructor settings.
discriminator:
  kind: pix2pixhd_nlayer
  # NOTE(review): presumably input channels, base filter count and layer
  # count - confirm against the discriminator implementation.
  input_nc: 3
  ndf: 64
  n_layers: 4
# One optimizer per network. The discriminator's learning rate is 10x
# smaller than the generator's.
optimizers:
  generator:
    kind: adam
    lr: 0.001
  discriminator:
    kind: adam
    lr: 0.0001
# Sample visualisation settings.
visualizer:
  kind: directory
  # NOTE(review): samples are written under the dataset root rather than
  # location.out_root_dir - confirm this is intended.
  outdir: ${location.data_root_dir}/samples
  # Batch keys to visualise, in this order.
  key_order:
    - image
    - predicted_image
    - discr_output_fake
    - discr_output_real
    - inpainted
    - eye
    - eye_pred
    - hair
    - hair_pred
    - skin
    - skin_pred
  # Keys flagged for rescaling. Both also appear in key_order.
  rescale_keys:
    - discr_output_fake
    - discr_output_real
# Validation evaluator settings.
evaluator:
  kind: default
  # Uses the same "inpainted" key that is listed in visualizer.key_order.
  inpainted_key: inpainted
  # This name is embedded in trainer.checkpoint_kwargs.monitor.
  integral_kind: ssim_fid100_f1
# Training loop and checkpointing settings.
trainer:
  # NOTE(review): presumably forwarded as keyword arguments to the
  # training framework's Trainer - confirm against the training script.
  kwargs:
    gpus: 1
    accelerator: dp
    max_epochs: 50
    gradient_clip_val: 1
    limit_train_batches: 25000
    log_every_n_steps: 300
    precision: 32
    terminate_on_nan: false
    check_val_every_n_epoch: 5
    num_sanity_val_steps: 0
    replace_sampler_ddp: false
  # Keeps the 5 best checkpoints by the monitored metric (higher is
  # better, per mode: max), plus the last one.
  checkpoint_kwargs:
    verbose: true
    save_top_k: 5
    save_last: true
    monitor: val_ssim_fid100_f1_total_mean
    mode: max
# Free-form label for this run.
# NOTE(review): "aaa" looks like a placeholder - confirm before reuse.
run_title: aaa
# Training-module settings.
training_model:
  kind: default
  # NOTE(review): presumably the interval, in iterations, between
  # visualisations - confirm.
  visualize_each_iters: 100
  concat_mask: true
  # Relates to the discr_output_* keys listed under visualizer.key_order.
  store_discr_outputs_for_vis: true
# Loss terms and their weights. Keys suffixed with a face-region name
# (skin, eye, ear, lip, cloth, hair) are per-region weights.
# NOTE(review): nesting was reconstructed from key order and naming;
# verify against the loss code that reads this section.
losses:
  l1:
    weight_missing: 0
    weight_known: 10
    weight_known_skin: 3
    weight_known_eye: 3
    weight_known_ear: 3
    weight_known_lip: 3
    weight_known_cloth: 3
    weight_known_hair: 3
  # Weight 0: this term contributes nothing as configured.
  perceptual:
    weight: 0
  adversarial_component:
    weight_skin: 0.1
    weight_eye: 0.15
    weight_ear: 0.15
    weight_lip: 0.15
    weight_cloth: 0.1
    weight_hair: 0.1
  adversarial:
    kind: r1
    weight: 10
    gp_coef: 0.001
    mask_as_fake_target: true
    allow_scale_mask: true
  feature_matching:
    weight: 100
    weight_skin: 10
    weight_eye: 15
    weight_ear: 15
    weight_lip: 15
    weight_cloth: 10
    weight_hair: 10
  resnet_pl:
    weight: 30
    # Weights are looked up under the dataset root.
    weights_path: ${location.data_root_dir}/lama-main