enrico-taxo-v3 / config.json
urchade's picture
better version
ceeae9d verified
raw
history blame contribute delete
654 Bytes
{
"model_name": "microsoft/deberta-v3-base",
"hidden_size": 512,
"ffn_mul": 2,
"span_mode": "markerV0",
"dropout": 0.1,
"max_width": 8,
"max_top_k": 54,
"add_top_k": 10,
"lr_encoder": "1e-5",
"lr_others": "5e-5",
"freeze_token_rep": false,
"num_steps": 55000,
"warmup_ratio": 1000,
"train_batch_size": 12,
"eval_every": 5000,
"max_neg_type_ratio": 3,
"size_sup": -1,
"max_len": 384,
"max_types": 30,
"shuffle_types": true,
"random_drop": false,
"refine_span": false,
"refine_relation": false,
"refine_prompt": true,
"scorer": "dot",
"fine_tune": true,
"subtoken_pooling": "first",
"name": "large"
}