{ "model_params": { "decoder": { "resblock_dilation_sizes": [ [ 1, 3, 5 ], [ 1, 3, 5 ], [ 1, 3, 5 ] ], "resblock_kernel_sizes": [ 3, 7, 11 ], "type": "hifigan", "upsample_initial_channel": 512, "upsample_kernel_sizes": [ 20, 10, 6, 4 ], "upsample_rates": [ 10, 5, 3, 2 ] }, "diffusion": { "dist": { "estimate_sigma_data": true, "mean": -3.0, "sigma_data": 0.2, "std": 1.0 }, "embedding_mask_proba": 0.1, "transformer": { "head_features": 64, "multiplier": 2, "num_heads": 8, "num_layers": 3 } }, "dim_in": 64, "dropout": 0.2, "hidden_dim": 512, "max_conv_dim": 512, "max_dur": 50, "multispeaker": false, "n_layer": 3, "n_mels": 80, "n_token": 178, "slm": { "hidden": 768, "initial_channel": 64, "model": "microsoft/wavlm-base-plus", "nlayers": 13, "sr": 16000 }, "style_dim": 128 }, "training_config": { "epochs": 30, "batch_size": 2, "max_len": 120, "optimizer": { "bert_lr": 1e-05, "ft_lr": 0.0001, "lr": 0.0001 }, "loss_params": { "diff_epoch": 10, "joint_epoch": 110, "lambda_F0": 1.0, "lambda_ce": 20.0, "lambda_diff": 1.0, "lambda_dur": 1.0, "lambda_gen": 1.0, "lambda_mel": 5.0, "lambda_mono": 1.0, "lambda_norm": 1.0, "lambda_s2s": 1.0, "lambda_slm": 1.0, "lambda_sty": 1.0 } }, "preprocess_params": { "spect_params": { "hop_length": 300, "n_fft": 2048, "win_length": 1200 }, "sr": 24000 }, "data_params": { "OOD_data": "Data/OOD_texts.txt", "min_length": 50, "root_path": "Data/wavs", "train_data": "Data/train_list.txt", "val_data": "Data/val_list.txt" }, "model_state": { "epoch": 14, "iterations": 1169, "val_loss": 0.4189014434814453 }, "training_metrics": { "train_loss": [], "val_loss": [ 41.0, 36.0, 31.0, 29.0, 25.0, 34.0, 33.0, 32.0, 31.0, 27.0, 52.0, 59.0, 4.0, 11.0, 17.0, 31.0, 37.0, 42.0 ], "dur_loss": [ 0.448, 0.449, 0.441, 0.488, 0.469, 0.437, 0.461, 0.42, 0.447, 0.436, 0.428, 0.425, 0.444, 0.44, 0.419, 0.423, 0.427, 0.405 ], "F0_loss": [ 1.223, 1.189, 1.208, 1.176, 1.141, 1.102, 1.168, 1.081, 1.119, 1.108, 1.108, 1.153, 1.093, 1.211, 1.102, 1.177, 1.162, 1.11 ], "epochs": [ 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18 ] } }