# Training configuration.
# NOTE(review): the nesting below was reconstructed from key order after the
# file had been collapsed onto a single line; confirm the hierarchy against
# the code that consumes this config.

# Filesystem roots. Other sections refer to these via ${location.*}.
location:
  data_root_dir: /group-volume/User-Driven-Content-Generation/datasets/inpainting_data_root_large
  # ${env:USER} is an environment-variable interpolation, so output and
  # TensorBoard paths differ per user.
  out_root_dir: /group-volume/User-Driven-Content-Generation/${env:USER}/inpainting/experiments
  tb_dir: /group-volume/User-Driven-Content-Generation/${env:USER}/inpainting/tb_logs
  pretrained_models: ${location.data_root_dir}

# Dataset and dataloader settings.
data:
  # Shared values, referenced by the dataloader_kwargs entries below.
  batch_size: 25
  val_batch_size: 40
  num_workers: 4

  train:
    indir: ${location.data_root_dir}/train_256
    out_size: 256
    # Mask generator settings: one *_proba value per mask type, with
    # matching *_kwargs for the irregular and box types.
    mask_gen_kwargs:
      irregular_proba: 1
      irregular_kwargs:
        max_angle: 4
        max_len: 200
        max_width: 100
        max_times: 5
        min_times: 1
      box_proba: 1
      box_kwargs:
        margin: 10
        bbox_min_size: 30
        bbox_max_size: 150
        max_times: 4
        min_times: 1
      segm_proba: 0
    transform_variant: no_augs
    dataloader_kwargs:
      batch_size: ${data.batch_size}
      shuffle: true
      num_workers: ${data.num_workers}

  val:
    indir: ${location.data_root_dir}/val_256
    img_suffix: .png
    dataloader_kwargs:
      batch_size: ${data.val_batch_size}
      shuffle: false
      num_workers: ${data.num_workers}

  # Explicit null: no visual_test dataset is configured.
  visual_test: null

generator:
  kind: Swin_UNET

discriminator:
  kind: pix2pixhd_nlayer
  input_nc: 3
  ndf: 64
  n_layers: 4

# The generator learning rate is 10x the discriminator learning rate.
optimizers:
  generator:
    kind: adam
    lr: 0.001
  discriminator:
    kind: adam
    lr: 0.0001

visualizer:
  kind: directory
  # NOTE(review): samples are written under the dataset root rather than
  # under location.out_root_dir - confirm this is intended.
  outdir: ${location.data_root_dir}/samples
  key_order:
    - image
    - predicted_image
    - discr_output_fake
    - discr_output_real
    - inpainted
    - eye
    - eye_pred
    - hair
    - hair_pred
    - skin
    - skin_pred
  # Both entries also appear in key_order above.
  rescale_keys:
    - discr_output_fake
    - discr_output_real

evaluator:
  kind: default
  inpainted_key: inpainted
  # trainer.checkpoint_kwargs.monitor embeds this same name.
  integral_kind: ssim_fid100_f1

trainer:
  # NOTE(review): these keys look like PyTorch Lightning Trainer arguments;
  # confirm against the training entry point.
  kwargs:
    gpus: 1
    accelerator: dp
    max_epochs: 50
    gradient_clip_val: 1
    limit_train_batches: 25000
    log_every_n_steps: 300
    precision: 32
    terminate_on_nan: false
    check_val_every_n_epoch: 5
    num_sanity_val_steps: 0
    replace_sampler_ddp: false
  checkpoint_kwargs:
    verbose: true
    save_top_k: 5
    save_last: true
    monitor: val_ssim_fid100_f1_total_mean
    mode: max

run_title: aaa

training_model:
  kind: default
  visualize_each_iters: 100
  concat_mask: true
  store_discr_outputs_for_vis: true
# Loss configuration: one sub-section per loss term.
# NOTE(review): the nesting below was reconstructed from key order after the
# section had been collapsed onto a single line; in particular, confirm that
# the per-part weights (skin, eye, ear, lip, cloth, hair) belong under the
# loss they are listed after.
losses:
  l1:
    weight_missing: 0
    weight_known: 10
    weight_known_skin: 3
    weight_known_eye: 3
    weight_known_ear: 3
    weight_known_lip: 3
    weight_known_cloth: 3
    weight_known_hair: 3

  # A weight of 0 - presumably disables this term; verify in the trainer.
  perceptual:
    weight: 0

  adversarial_component:
    weight_skin: 0.1
    weight_eye: 0.15
    weight_ear: 0.15
    weight_lip: 0.15
    weight_cloth: 0.1
    weight_hair: 0.1

  adversarial:
    kind: r1
    weight: 10
    gp_coef: 0.001
    mask_as_fake_target: true
    allow_scale_mask: true

  feature_matching:
    weight: 100
    weight_skin: 10
    weight_eye: 15
    weight_ear: 15
    weight_lip: 15
    weight_cloth: 10
    weight_hair: 10

  resnet_pl:
    weight: 30
    # Resolved relative to location.data_root_dir.
    weights_path: ${location.data_root_dir}/lama-main