|
{ |
|
"architectures": [ |
|
"ModernBertForTokenClassification" |
|
], |
|
"attention_bias": false, |
|
"attention_dropout": 0.0, |
|
"auto_map": { |
|
"AutoConfig": "configuration_modernbert.ModernBertConfig", |
|
"AutoModel": "modeling_modernbert.ModernBertModel", |
|
"AutoModelForMaskedLM": "modeling_modernbert.ModernBertForMaskedLM", |
|
"AutoModelForSequenceClassification": "modeling_modernbert.ModernBertForSequenceClassification", |
|
"AutoModelForTokenClassification": "modeling_modernbert.ModernBertForTokenClassification" |
|
}, |
|
"bos_token_id": 0, |
|
"classifier_activation": "gelu", |
|
"classifier_bias": false, |
|
"classifier_dropout": 0.0, |
|
"classifier_pooling": "mean", |
|
"cls_token_id": 0, |
|
"custom_pipelines": { |
|
"universal-dependencies": { |
|
"impl": "ud.UniversalDependenciesPipeline", |
|
"pt": "AutoModelForTokenClassification" |
|
} |
|
}, |
|
"decoder_bias": true, |
|
"deterministic_flash_attn": false, |
|
"embedding_dropout": 0.0, |
|
"eos_token_id": 2, |
|
"global_attn_every_n_layers": 3, |
|
"global_rope_theta": 160000.0, |
|
"gradient_checkpointing": false, |
|
"hidden_activation": "gelu", |
|
"hidden_size": 1024, |
|
"id2label": { |
|
"0": "ADJ", |
|
"1": "ADJ.", |
|
"2": "ADJ.|[acl]", |
|
"3": "ADJ.|[advcl]", |
|
"4": "ADJ.|[amod]", |
|
"5": "ADJ.|[ccomp]", |
|
"6": "ADJ.|[csubj:outer]", |
|
"7": "ADJ.|[csubj]", |
|
"8": "ADJ.|[dep]", |
|
"9": "ADJ.|[nmod]", |
|
"10": "ADJ.|[nsubj]", |
|
"11": "ADJ.|[obj]", |
|
"12": "ADJ.|[obl]", |
|
"13": "ADJ.|[root]", |
|
"14": "ADJ|[acl]", |
|
"15": "ADJ|[advcl]", |
|
"16": "ADJ|[amod]", |
|
"17": "ADJ|[ccomp]", |
|
"18": "ADJ|[csubj:outer]", |
|
"19": "ADJ|[csubj]", |
|
"20": "ADJ|[dep]", |
|
"21": "ADJ|[nmod]", |
|
"22": "ADJ|[nsubj]", |
|
"23": "ADJ|[obj]", |
|
"24": "ADJ|[obl]", |
|
"25": "ADJ|[root]", |
|
"26": "ADP", |
|
"27": "ADP.", |
|
"28": "ADP.|[case]", |
|
"29": "ADP.|[fixed]", |
|
"30": "ADP|[case]", |
|
"31": "ADP|[fixed]", |
|
"32": "ADV", |
|
"33": "ADV.", |
|
"34": "ADV.|[advcl]", |
|
"35": "ADV.|[advmod]", |
|
"36": "ADV.|[dep]", |
|
"37": "ADV.|[obj]", |
|
"38": "ADV.|[root]", |
|
"39": "ADV|[advcl]", |
|
"40": "ADV|[advmod]", |
|
"41": "ADV|[dep]", |
|
"42": "ADV|[obj]", |
|
"43": "ADV|[root]", |
|
"44": "AUX", |
|
"45": "AUX.", |
|
"46": "AUX.|Polarity=Neg", |
|
"47": "AUX.|Polarity=Neg|[aux]", |
|
"48": "AUX.|Polarity=Neg|[fixed]", |
|
"49": "AUX.|[aux]", |
|
"50": "AUX.|[cop]", |
|
"51": "AUX.|[fixed]", |
|
"52": "AUX.|[root]", |
|
"53": "AUX|Polarity=Neg", |
|
"54": "AUX|Polarity=Neg|[aux]", |
|
"55": "AUX|Polarity=Neg|[fixed]", |
|
"56": "AUX|[aux]", |
|
"57": "AUX|[cop]", |
|
"58": "AUX|[fixed]", |
|
"59": "AUX|[root]", |
|
"60": "CCONJ", |
|
"61": "CCONJ.", |
|
"62": "CCONJ.|[cc]", |
|
"63": "CCONJ|[cc]", |
|
"64": "DET", |
|
"65": "DET.", |
|
"66": "DET.|[det]", |
|
"67": "DET|[det]", |
|
"68": "INTJ", |
|
"69": "INTJ.", |
|
"70": "INTJ.|[discourse]", |
|
"71": "INTJ.|[root]", |
|
"72": "INTJ|[discourse]", |
|
"73": "INTJ|[root]", |
|
"74": "NOUN", |
|
"75": "NOUN.", |
|
"76": "NOUN.|Polarity=Neg", |
|
"77": "NOUN.|Polarity=Neg|[obl]", |
|
"78": "NOUN.|Polarity=Neg|[root]", |
|
"79": "NOUN.|[acl]", |
|
"80": "NOUN.|[advcl]", |
|
"81": "NOUN.|[ccomp]", |
|
"82": "NOUN.|[compound]", |
|
"83": "NOUN.|[csubj:outer]", |
|
"84": "NOUN.|[csubj]", |
|
"85": "NOUN.|[nmod]", |
|
"86": "NOUN.|[nsubj:outer]", |
|
"87": "NOUN.|[nsubj]", |
|
"88": "NOUN.|[obj]", |
|
"89": "NOUN.|[obl]", |
|
"90": "NOUN.|[root]", |
|
"91": "NOUN|Polarity=Neg", |
|
"92": "NOUN|Polarity=Neg|[obl]", |
|
"93": "NOUN|Polarity=Neg|[root]", |
|
"94": "NOUN|[acl]", |
|
"95": "NOUN|[advcl]", |
|
"96": "NOUN|[ccomp]", |
|
"97": "NOUN|[compound]", |
|
"98": "NOUN|[csubj:outer]", |
|
"99": "NOUN|[csubj]", |
|
"100": "NOUN|[nmod]", |
|
"101": "NOUN|[nsubj:outer]", |
|
"102": "NOUN|[nsubj]", |
|
"103": "NOUN|[obj]", |
|
"104": "NOUN|[obl]", |
|
"105": "NOUN|[root]", |
|
"106": "NUM", |
|
"107": "NUM.", |
|
"108": "NUM.|[advcl]", |
|
"109": "NUM.|[compound]", |
|
"110": "NUM.|[nmod]", |
|
"111": "NUM.|[nsubj:outer]", |
|
"112": "NUM.|[nsubj]", |
|
"113": "NUM.|[nummod]", |
|
"114": "NUM.|[obj]", |
|
"115": "NUM.|[obl]", |
|
"116": "NUM.|[root]", |
|
"117": "NUM|[advcl]", |
|
"118": "NUM|[compound]", |
|
"119": "NUM|[nmod]", |
|
"120": "NUM|[nsubj:outer]", |
|
"121": "NUM|[nsubj]", |
|
"122": "NUM|[nummod]", |
|
"123": "NUM|[obj]", |
|
"124": "NUM|[obl]", |
|
"125": "NUM|[root]", |
|
"126": "PART", |
|
"127": "PART.", |
|
"128": "PART.|[mark]", |
|
"129": "PART|[mark]", |
|
"130": "PRON", |
|
"131": "PRON.", |
|
"132": "PRON.|[acl]", |
|
"133": "PRON.|[advcl]", |
|
"134": "PRON.|[nmod]", |
|
"135": "PRON.|[nsubj:outer]", |
|
"136": "PRON.|[nsubj]", |
|
"137": "PRON.|[obj]", |
|
"138": "PRON.|[obl]", |
|
"139": "PRON.|[root]", |
|
"140": "PRON|[acl]", |
|
"141": "PRON|[advcl]", |
|
"142": "PRON|[nmod]", |
|
"143": "PRON|[nsubj:outer]", |
|
"144": "PRON|[nsubj]", |
|
"145": "PRON|[obj]", |
|
"146": "PRON|[obl]", |
|
"147": "PRON|[root]", |
|
"148": "PROPN", |
|
"149": "PROPN.", |
|
"150": "PROPN.|[acl]", |
|
"151": "PROPN.|[advcl]", |
|
"152": "PROPN.|[compound]", |
|
"153": "PROPN.|[nmod]", |
|
"154": "PROPN.|[nsubj:outer]", |
|
"155": "PROPN.|[nsubj]", |
|
"156": "PROPN.|[obj]", |
|
"157": "PROPN.|[obl]", |
|
"158": "PROPN.|[root]", |
|
"159": "PROPN|[acl]", |
|
"160": "PROPN|[advcl]", |
|
"161": "PROPN|[compound]", |
|
"162": "PROPN|[nmod]", |
|
"163": "PROPN|[nsubj:outer]", |
|
"164": "PROPN|[nsubj]", |
|
"165": "PROPN|[obj]", |
|
"166": "PROPN|[obl]", |
|
"167": "PROPN|[root]", |
|
"168": "PUNCT", |
|
"169": "PUNCT.", |
|
"170": "PUNCT.|[punct]", |
|
"171": "PUNCT|[punct]", |
|
"172": "SCONJ", |
|
"173": "SCONJ.", |
|
"174": "SCONJ.|[dep]", |
|
"175": "SCONJ.|[fixed]", |
|
"176": "SCONJ.|[mark]", |
|
"177": "SCONJ|[dep]", |
|
"178": "SCONJ|[fixed]", |
|
"179": "SCONJ|[mark]", |
|
"180": "SYM", |
|
"181": "SYM.", |
|
"182": "SYM.|[compound]", |
|
"183": "SYM.|[dep]", |
|
"184": "SYM.|[nmod]", |
|
"185": "SYM.|[obl]", |
|
"186": "SYM|[compound]", |
|
"187": "SYM|[dep]", |
|
"188": "SYM|[nmod]", |
|
"189": "SYM|[obl]", |
|
"190": "VERB", |
|
"191": "VERB.", |
|
"192": "VERB.|[acl]", |
|
"193": "VERB.|[advcl]", |
|
"194": "VERB.|[ccomp]", |
|
"195": "VERB.|[compound]", |
|
"196": "VERB.|[csubj:outer]", |
|
"197": "VERB.|[csubj]", |
|
"198": "VERB.|[nmod]", |
|
"199": "VERB.|[obj]", |
|
"200": "VERB.|[obl]", |
|
"201": "VERB.|[root]", |
|
"202": "VERB|[acl]", |
|
"203": "VERB|[advcl]", |
|
"204": "VERB|[ccomp]", |
|
"205": "VERB|[compound]", |
|
"206": "VERB|[csubj:outer]", |
|
"207": "VERB|[csubj]", |
|
"208": "VERB|[nmod]", |
|
"209": "VERB|[obj]", |
|
"210": "VERB|[obl]", |
|
"211": "VERB|[root]", |
|
"212": "X", |
|
"213": "X.", |
|
"214": "X.|[dep]", |
|
"215": "X.|[goeswith]", |
|
"216": "X.|[nmod]", |
|
"217": "X|[dep]", |
|
"218": "X|[nmod]" |
|
}, |
|
"initializer_cutoff_factor": 2.0, |
|
"initializer_range": 0.02, |
|
"intermediate_size": 2624, |
|
"label2id": { |
|
"ADJ": 0, |
|
"ADJ.": 1, |
|
"ADJ.|[acl]": 2, |
|
"ADJ.|[advcl]": 3, |
|
"ADJ.|[amod]": 4, |
|
"ADJ.|[ccomp]": 5, |
|
"ADJ.|[csubj:outer]": 6, |
|
"ADJ.|[csubj]": 7, |
|
"ADJ.|[dep]": 8, |
|
"ADJ.|[nmod]": 9, |
|
"ADJ.|[nsubj]": 10, |
|
"ADJ.|[obj]": 11, |
|
"ADJ.|[obl]": 12, |
|
"ADJ.|[root]": 13, |
|
"ADJ|[acl]": 14, |
|
"ADJ|[advcl]": 15, |
|
"ADJ|[amod]": 16, |
|
"ADJ|[ccomp]": 17, |
|
"ADJ|[csubj:outer]": 18, |
|
"ADJ|[csubj]": 19, |
|
"ADJ|[dep]": 20, |
|
"ADJ|[nmod]": 21, |
|
"ADJ|[nsubj]": 22, |
|
"ADJ|[obj]": 23, |
|
"ADJ|[obl]": 24, |
|
"ADJ|[root]": 25, |
|
"ADP": 26, |
|
"ADP.": 27, |
|
"ADP.|[case]": 28, |
|
"ADP.|[fixed]": 29, |
|
"ADP|[case]": 30, |
|
"ADP|[fixed]": 31, |
|
"ADV": 32, |
|
"ADV.": 33, |
|
"ADV.|[advcl]": 34, |
|
"ADV.|[advmod]": 35, |
|
"ADV.|[dep]": 36, |
|
"ADV.|[obj]": 37, |
|
"ADV.|[root]": 38, |
|
"ADV|[advcl]": 39, |
|
"ADV|[advmod]": 40, |
|
"ADV|[dep]": 41, |
|
"ADV|[obj]": 42, |
|
"ADV|[root]": 43, |
|
"AUX": 44, |
|
"AUX.": 45, |
|
"AUX.|Polarity=Neg": 46, |
|
"AUX.|Polarity=Neg|[aux]": 47, |
|
"AUX.|Polarity=Neg|[fixed]": 48, |
|
"AUX.|[aux]": 49, |
|
"AUX.|[cop]": 50, |
|
"AUX.|[fixed]": 51, |
|
"AUX.|[root]": 52, |
|
"AUX|Polarity=Neg": 53, |
|
"AUX|Polarity=Neg|[aux]": 54, |
|
"AUX|Polarity=Neg|[fixed]": 55, |
|
"AUX|[aux]": 56, |
|
"AUX|[cop]": 57, |
|
"AUX|[fixed]": 58, |
|
"AUX|[root]": 59, |
|
"CCONJ": 60, |
|
"CCONJ.": 61, |
|
"CCONJ.|[cc]": 62, |
|
"CCONJ|[cc]": 63, |
|
"DET": 64, |
|
"DET.": 65, |
|
"DET.|[det]": 66, |
|
"DET|[det]": 67, |
|
"INTJ": 68, |
|
"INTJ.": 69, |
|
"INTJ.|[discourse]": 70, |
|
"INTJ.|[root]": 71, |
|
"INTJ|[discourse]": 72, |
|
"INTJ|[root]": 73, |
|
"NOUN": 74, |
|
"NOUN.": 75, |
|
"NOUN.|Polarity=Neg": 76, |
|
"NOUN.|Polarity=Neg|[obl]": 77, |
|
"NOUN.|Polarity=Neg|[root]": 78, |
|
"NOUN.|[acl]": 79, |
|
"NOUN.|[advcl]": 80, |
|
"NOUN.|[ccomp]": 81, |
|
"NOUN.|[compound]": 82, |
|
"NOUN.|[csubj:outer]": 83, |
|
"NOUN.|[csubj]": 84, |
|
"NOUN.|[nmod]": 85, |
|
"NOUN.|[nsubj:outer]": 86, |
|
"NOUN.|[nsubj]": 87, |
|
"NOUN.|[obj]": 88, |
|
"NOUN.|[obl]": 89, |
|
"NOUN.|[root]": 90, |
|
"NOUN|Polarity=Neg": 91, |
|
"NOUN|Polarity=Neg|[obl]": 92, |
|
"NOUN|Polarity=Neg|[root]": 93, |
|
"NOUN|[acl]": 94, |
|
"NOUN|[advcl]": 95, |
|
"NOUN|[ccomp]": 96, |
|
"NOUN|[compound]": 97, |
|
"NOUN|[csubj:outer]": 98, |
|
"NOUN|[csubj]": 99, |
|
"NOUN|[nmod]": 100, |
|
"NOUN|[nsubj:outer]": 101, |
|
"NOUN|[nsubj]": 102, |
|
"NOUN|[obj]": 103, |
|
"NOUN|[obl]": 104, |
|
"NOUN|[root]": 105, |
|
"NUM": 106, |
|
"NUM.": 107, |
|
"NUM.|[advcl]": 108, |
|
"NUM.|[compound]": 109, |
|
"NUM.|[nmod]": 110, |
|
"NUM.|[nsubj:outer]": 111, |
|
"NUM.|[nsubj]": 112, |
|
"NUM.|[nummod]": 113, |
|
"NUM.|[obj]": 114, |
|
"NUM.|[obl]": 115, |
|
"NUM.|[root]": 116, |
|
"NUM|[advcl]": 117, |
|
"NUM|[compound]": 118, |
|
"NUM|[nmod]": 119, |
|
"NUM|[nsubj:outer]": 120, |
|
"NUM|[nsubj]": 121, |
|
"NUM|[nummod]": 122, |
|
"NUM|[obj]": 123, |
|
"NUM|[obl]": 124, |
|
"NUM|[root]": 125, |
|
"PART": 126, |
|
"PART.": 127, |
|
"PART.|[mark]": 128, |
|
"PART|[mark]": 129, |
|
"PRON": 130, |
|
"PRON.": 131, |
|
"PRON.|[acl]": 132, |
|
"PRON.|[advcl]": 133, |
|
"PRON.|[nmod]": 134, |
|
"PRON.|[nsubj:outer]": 135, |
|
"PRON.|[nsubj]": 136, |
|
"PRON.|[obj]": 137, |
|
"PRON.|[obl]": 138, |
|
"PRON.|[root]": 139, |
|
"PRON|[acl]": 140, |
|
"PRON|[advcl]": 141, |
|
"PRON|[nmod]": 142, |
|
"PRON|[nsubj:outer]": 143, |
|
"PRON|[nsubj]": 144, |
|
"PRON|[obj]": 145, |
|
"PRON|[obl]": 146, |
|
"PRON|[root]": 147, |
|
"PROPN": 148, |
|
"PROPN.": 149, |
|
"PROPN.|[acl]": 150, |
|
"PROPN.|[advcl]": 151, |
|
"PROPN.|[compound]": 152, |
|
"PROPN.|[nmod]": 153, |
|
"PROPN.|[nsubj:outer]": 154, |
|
"PROPN.|[nsubj]": 155, |
|
"PROPN.|[obj]": 156, |
|
"PROPN.|[obl]": 157, |
|
"PROPN.|[root]": 158, |
|
"PROPN|[acl]": 159, |
|
"PROPN|[advcl]": 160, |
|
"PROPN|[compound]": 161, |
|
"PROPN|[nmod]": 162, |
|
"PROPN|[nsubj:outer]": 163, |
|
"PROPN|[nsubj]": 164, |
|
"PROPN|[obj]": 165, |
|
"PROPN|[obl]": 166, |
|
"PROPN|[root]": 167, |
|
"PUNCT": 168, |
|
"PUNCT.": 169, |
|
"PUNCT.|[punct]": 170, |
|
"PUNCT|[punct]": 171, |
|
"SCONJ": 172, |
|
"SCONJ.": 173, |
|
"SCONJ.|[dep]": 174, |
|
"SCONJ.|[fixed]": 175, |
|
"SCONJ.|[mark]": 176, |
|
"SCONJ|[dep]": 177, |
|
"SCONJ|[fixed]": 178, |
|
"SCONJ|[mark]": 179, |
|
"SYM": 180, |
|
"SYM.": 181, |
|
"SYM.|[compound]": 182, |
|
"SYM.|[dep]": 183, |
|
"SYM.|[nmod]": 184, |
|
"SYM.|[obl]": 185, |
|
"SYM|[compound]": 186, |
|
"SYM|[dep]": 187, |
|
"SYM|[nmod]": 188, |
|
"SYM|[obl]": 189, |
|
"VERB": 190, |
|
"VERB.": 191, |
|
"VERB.|[acl]": 192, |
|
"VERB.|[advcl]": 193, |
|
"VERB.|[ccomp]": 194, |
|
"VERB.|[compound]": 195, |
|
"VERB.|[csubj:outer]": 196, |
|
"VERB.|[csubj]": 197, |
|
"VERB.|[nmod]": 198, |
|
"VERB.|[obj]": 199, |
|
"VERB.|[obl]": 200, |
|
"VERB.|[root]": 201, |
|
"VERB|[acl]": 202, |
|
"VERB|[advcl]": 203, |
|
"VERB|[ccomp]": 204, |
|
"VERB|[compound]": 205, |
|
"VERB|[csubj:outer]": 206, |
|
"VERB|[csubj]": 207, |
|
"VERB|[nmod]": 208, |
|
"VERB|[obj]": 209, |
|
"VERB|[obl]": 210, |
|
"VERB|[root]": 211, |
|
"X": 212, |
|
"X.": 213, |
|
"X.|[dep]": 214, |
|
"X.|[goeswith]": 215, |
|
"X.|[nmod]": 216, |
|
"X|[dep]": 217, |
|
"X|[nmod]": 218 |
|
}, |
|
"layer_norm_eps": 1e-05, |
|
"local_attention": 128, |
|
"local_rope_theta": 10000.0, |
|
"max_position_embeddings": 8192, |
|
"mlp_bias": false, |
|
"mlp_dropout": 0.0, |
|
"model_type": "modernbert", |
|
"norm_bias": false, |
|
"norm_eps": 1e-05, |
|
"num_attention_heads": 16, |
|
"num_hidden_layers": 28, |
|
"pad_token_id": 1, |
|
"position_embedding_type": "absolute", |
|
"reference_compile": true, |
|
"sep_token_id": 2, |
|
"sparse_pred_ignore_index": -100, |
|
"sparse_prediction": false, |
|
"tokenizer_class": "DebertaV2TokenizerFast", |
|
"torch_dtype": "float32", |
|
"transformers_version": "4.47.1", |
|
"vocab_size": 65000 |
|
} |
|
|