{
  "experiment": "ota_boun",
  "name": "bert-base-turkish-cased",
  "n_gpu": 1,
  "model": {
    "type": "MultiParser",
    "args": {
      "embeddings_processor": {
        "type": "BertWrapper",
        "args": {
          "model_path": "data/pretrained_embeddings/bert-base-turkish-cased-nonpretrained",
          "fine_tune": true,
          "hidden_dropout": 0.2,
          "attn_dropout": 0.2,
          "output_dropout": 0.5,
          "scalar_mix_layer_dropout": 0.1,
          "token_mask_prob": 0.15
        }
      },
      "outputs": {
        "heads": {
          "type": "ArcScorer",
          "args": {
            "scorer_class": "DeepBiaffineScorer",
            "head_mode": "single_head",
            "hidden_size": 768,
            "dropout": 0.33,
            "vocab": {
              "type": "IntegerVocab"
            }
          }
        },
        "labels": {
          "type": "DependencyClassifier",
          "args": {
            "scorer_class": "DeepBiaffineScorer",
            "hidden_size": 256,
            "dropout": 0.33,
            "vocab": {
              "type": "BasicVocab",
              "args": {
                "vocab_filename": "data/corpora/ota_boun/vocab/basic.vocab"
              }
            }
          }
        }
      },
      "post_processors": [
        {
          "type": "FactorizedMSTPostProcessor",
          "args": {
            "annotation_ids": [
              "heads",
              "labels"
            ]
          }
        }
      ]
    }
  },
  "data_loaders": {
    "type": "BucketedCONLLLoader",
    "args": {
      "annotation_layers": {
        "heads": {
          "type": "TagSequence",
          "source_column": 6,
          "args": {
            "ignore_root": true
          }
        },
        "labels": {
          "type": "DependencyMatrix",
          "source_column": [
            6,
            7
          ],
          "args": {
            "ignore_non_relations": true
          }
        }
      },
      "batch_size": 32,
      "bucket_size": 256,
      "max_tokens_per_batch": 156800,
      "num_workers": 2
    },
    "paths": {
      "train": "data/corpora/ota_boun/ota_boun-ud-train.conllu",
      "dev": "data/corpora/ota_boun/ota_boun-ud-test.conllu",
      "test": "data/corpora/ota_boun/tr_boun-ud-test.conllu"
    }
  },
  "trainer": {
    "min_epochs": 15,
    "max_epochs": 300,
    "early_stop": 15,
    "save_dir": "data/saved_models/",
    "save_period": 20,
    "verbosity": 2,
    "validation_criterion": {
      "metrics": {
        "heads": "fscore",
        "labels": "fscore"
      },
      "weighting": "multiplicative"
    },
    "optimizer": {
      "type": "AdamW",
      "args": {
        "lr": 4e-05,
        "weight_decay": 0.0
      }
    },
    "lr_scheduler": {
      "type": "LambdaLR",
      "args": {
        "lr_lambda": "SqrtSchedule(400)"
      }
    },
    "loss": {
      "type": "CrossEntropyLoss",
      "args": {
        "ignore_index": -1
      }
    }
  }
}