add dependency parsing model, vocab and misc
Browse files
dp/ko/posbert.base/config.json
ADDED
@@ -0,0 +1,129 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "jinmang2/dooly-hub/dp/ko/posbert.base",
|
3 |
+
"architectures": [
|
4 |
+
"RobertaForDependencyParsing"
|
5 |
+
],
|
6 |
+
"attention_probs_dropout_prob": 0.1,
|
7 |
+
"bos_token_id": 0,
|
8 |
+
"classifier_dropout": null,
|
9 |
+
"classifier_num_attention_heads": 8,
|
10 |
+
"eos_token_id": 2,
|
11 |
+
"hidden_act": "gelu",
|
12 |
+
"hidden_dropout_prob": 0.1,
|
13 |
+
"hidden_size": 768,
|
14 |
+
"id2label": {
|
15 |
+
"0": "LABEL_0",
|
16 |
+
"1": "LABEL_1",
|
17 |
+
"2": "LABEL_2",
|
18 |
+
"3": "LABEL_3",
|
19 |
+
"4": "LABEL_4",
|
20 |
+
"5": "LABEL_5",
|
21 |
+
"6": "LABEL_6",
|
22 |
+
"7": "LABEL_7",
|
23 |
+
"8": "LABEL_8",
|
24 |
+
"9": "LABEL_9",
|
25 |
+
"10": "LABEL_10",
|
26 |
+
"11": "LABEL_11",
|
27 |
+
"12": "LABEL_12",
|
28 |
+
"13": "LABEL_13",
|
29 |
+
"14": "LABEL_14",
|
30 |
+
"15": "LABEL_15",
|
31 |
+
"16": "LABEL_16",
|
32 |
+
"17": "LABEL_17",
|
33 |
+
"18": "LABEL_18",
|
34 |
+
"19": "LABEL_19",
|
35 |
+
"20": "LABEL_20",
|
36 |
+
"21": "LABEL_21",
|
37 |
+
"22": "LABEL_22",
|
38 |
+
"23": "LABEL_23",
|
39 |
+
"24": "LABEL_24",
|
40 |
+
"25": "LABEL_25",
|
41 |
+
"26": "LABEL_26",
|
42 |
+
"27": "LABEL_27",
|
43 |
+
"28": "LABEL_28",
|
44 |
+
"29": "LABEL_29",
|
45 |
+
"30": "LABEL_30",
|
46 |
+
"31": "LABEL_31",
|
47 |
+
"32": "LABEL_32",
|
48 |
+
"33": "LABEL_33",
|
49 |
+
"34": "LABEL_34",
|
50 |
+
"35": "LABEL_35",
|
51 |
+
"36": "LABEL_36",
|
52 |
+
"37": "LABEL_37",
|
53 |
+
"38": "LABEL_38",
|
54 |
+
"39": "LABEL_39",
|
55 |
+
"40": "LABEL_40",
|
56 |
+
"41": "LABEL_41",
|
57 |
+
"42": "LABEL_42",
|
58 |
+
"43": "LABEL_43",
|
59 |
+
"44": "LABEL_44",
|
60 |
+
"45": "LABEL_45",
|
61 |
+
"46": "LABEL_46",
|
62 |
+
"47": "LABEL_47"
|
63 |
+
},
|
64 |
+
"initializer_range": 0.02,
|
65 |
+
"intermediate_size": 3072,
|
66 |
+
"label2id": {
|
67 |
+
"LABEL_0": 0,
|
68 |
+
"LABEL_1": 1,
|
69 |
+
"LABEL_10": 10,
|
70 |
+
"LABEL_11": 11,
|
71 |
+
"LABEL_12": 12,
|
72 |
+
"LABEL_13": 13,
|
73 |
+
"LABEL_14": 14,
|
74 |
+
"LABEL_15": 15,
|
75 |
+
"LABEL_16": 16,
|
76 |
+
"LABEL_17": 17,
|
77 |
+
"LABEL_18": 18,
|
78 |
+
"LABEL_19": 19,
|
79 |
+
"LABEL_2": 2,
|
80 |
+
"LABEL_20": 20,
|
81 |
+
"LABEL_21": 21,
|
82 |
+
"LABEL_22": 22,
|
83 |
+
"LABEL_23": 23,
|
84 |
+
"LABEL_24": 24,
|
85 |
+
"LABEL_25": 25,
|
86 |
+
"LABEL_26": 26,
|
87 |
+
"LABEL_27": 27,
|
88 |
+
"LABEL_28": 28,
|
89 |
+
"LABEL_29": 29,
|
90 |
+
"LABEL_3": 3,
|
91 |
+
"LABEL_30": 30,
|
92 |
+
"LABEL_31": 31,
|
93 |
+
"LABEL_32": 32,
|
94 |
+
"LABEL_33": 33,
|
95 |
+
"LABEL_34": 34,
|
96 |
+
"LABEL_35": 35,
|
97 |
+
"LABEL_36": 36,
|
98 |
+
"LABEL_37": 37,
|
99 |
+
"LABEL_38": 38,
|
100 |
+
"LABEL_39": 39,
|
101 |
+
"LABEL_4": 4,
|
102 |
+
"LABEL_40": 40,
|
103 |
+
"LABEL_41": 41,
|
104 |
+
"LABEL_42": 42,
|
105 |
+
"LABEL_43": 43,
|
106 |
+
"LABEL_44": 44,
|
107 |
+
"LABEL_45": 45,
|
108 |
+
"LABEL_46": 46,
|
109 |
+
"LABEL_47": 47,
|
110 |
+
"LABEL_5": 5,
|
111 |
+
"LABEL_6": 6,
|
112 |
+
"LABEL_7": 7,
|
113 |
+
"LABEL_8": 8,
|
114 |
+
"LABEL_9": 9
|
115 |
+
},
|
116 |
+
"layer_norm_eps": 1e-05,
|
117 |
+
"max_position_embeddings": 514,
|
118 |
+
"model_type": "roberta",
|
119 |
+
"num_attention_heads": 12,
|
120 |
+
"num_hidden_layers": 12,
|
121 |
+
"num_segments": 52,
|
122 |
+
"pad_token_id": 1,
|
123 |
+
"position_embedding_type": "absolute",
|
124 |
+
"torch_dtype": "float32",
|
125 |
+
"transformers_version": "4.17.0",
|
126 |
+
"type_vocab_size": 1,
|
127 |
+
"use_cache": true,
|
128 |
+
"vocab_size": 64000
|
129 |
+
}
|
dp/ko/posbert.base/input0.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
dp/ko/posbert.base/input1.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"NNG": "1895353", "VV": "409964", "NNP": "266798", "SN": "199504", "JKB": "152522", "EC": "142215", "NNB": "138624", "SY": "138390", "JX": "127535", "JKO": "127387", "XX": "120062", "XSV": "113650", "MAG": "107408", "SF": "107387", "JKS": "86794", "EF": "86715", "VX": "85374", "NNBC": "80463", "VA": "76609", "ETM": "69932", "MM": "69735", "SSO": "67194", "XSN": "61054", "JKG": "59393", "VCP": "50555", "SC": "48998", "SSC": "45406", "NP": "35529", "SL": "30076", "JC": "26525", "XSA": "24532", "XR": "23295", "NR": "22214", "EP": "19860", "XPN": "17852", "MAJ": "16432", "ETN": "12085", "JKQ": "7548", "VCN": "7105", "IC": "3656", "SE": "3555", "JKC": "1755", "SH": "1200", "UNKNOWN": "483", "JKV": "106", "NA": "2", "madeupword0000": "0", "madeupword0001": "0", "madeupword0002": "0", "madeupword0003": "0", "madeupword0004": "0", "madeupword0005": "0"}
|
dp/ko/posbert.base/label0.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"<s>": 0, "<pad>": 1, "</s>": 2, "<unk>": 3, "0": 4, "1": 5, "2": 6, "3": 7, "4": 8, "5": 9, "6": 10, "7": 11, "8": 12, "9": 13, "10": 14, "11": 15, "12": 16, "13": 17, "14": 18, "15": 19, "16": 20, "17": 21, "18": 22, "19": 23, "20": 24, "21": 25, "22": 26, "23": 27, "24": 28, "25": 29, "26": 30, "27": 31, "28": 32, "29": 33, "30": 34, "31": 35, "32": 36, "33": 37, "34": 38, "35": 39, "36": 40, "37": 41, "38": 42, "39": 43, "40": 44, "41": 45, "42": 46, "43": 47, "44": 48, "45": 49, "46": 50, "47": 51, "48": 52, "49": 53, "50": 54, "51": 55, "52": 56, "53": 57, "54": 58, "55": 59, "56": 60, "57": 61, "58": 62, "59": 63, "60": 64, "61": 65, "62": 66, "63": 67, "64": 68, "65": 69, "66": 70, "67": 71, "68": 72, "69": 73, "70": 74, "71": 75, "72": 76, "73": 77, "74": 78, "75": 79, "76": 80, "77": 81, "78": 82, "79": 83, "80": 84, "81": 85, "82": 86, "83": 87, "84": 88, "85": 89, "86": 90, "87": 91, "88": 92, "89": 93, "90": 94, "91": 95, "92": 96, "93": 97, "94": 98, "95": 99, "96": 100, "97": 101, "98": 102, "99": 103, "100": 104, "101": 105, "102": 106, "103": 107, "104": 108, "105": 109, "106": 110, "107": 111, "108": 112, "109": 113, "110": 114, "111": 115, "112": 116, "113": 117, "114": 118, "115": 119, "116": 120, "117": 121, "118": 122, "119": 123, "120": 124, "121": 125, "122": 126, "123": 127, "124": 128, "125": 129, "126": 130, "127": 131, "128": 132, "129": 133, "130": 134, "131": 135, "132": 136, "133": 137, "134": 138, "135": 139, "136": 140, "137": 141, "138": 142, "139": 143, "140": 144, "141": 145, "142": 146, "143": 147, "144": 148, "145": 149, "146": 150, "147": 151, "148": 152, "149": 153, "150": 154, "151": 155, "152": 156, "153": 157, "154": 158, "155": 159, "156": 160, "157": 161, "158": 162, "159": 163, "160": 164, "161": 165, "162": 166, "163": 167, "164": 168, "165": 169, "166": 170, "167": 171, "168": 172, "169": 173, "170": 174, "171": 175, "172": 176, "173": 177, "174": 178, "175": 179, "176": 180, "177": 181, "178": 182, "179": 183, "180": 184, "181": 185, "182": 186, "183": 187, "184": 188, "185": 189, "186": 190, "187": 191, "188": 192, "189": 193, "190": 194, "191": 195, "192": 196, "193": 197, "194": 198, "195": 199, "196": 200, "197": 201, "198": 202, "199": 203, "200": 204, "201": 205, "202": 206, "203": 207, "204": 208, "205": 209, "206": 210, "207": 211, "208": 212, "209": 213, "210": 214, "211": 215, "212": 216, "213": 217, "214": 218, "215": 219, "216": 220, "217": 221, "218": 222, "219": 223, "220": 224, "221": 225, "222": 226, "223": 227, "224": 228, "225": 229, "226": 230, "227": 231, "228": 232, "229": 233, "230": 234, "231": 235, "232": 236, "233": 237, "234": 238, "235": 239, "236": 240, "237": 241, "238": 242, "239": 243, "240": 244, "241": 245, "242": 246, "243": 247, "244": 248, "245": 249, "246": 250, "247": 251, "248": 252, "249": 253, "250": 254, "251": 255, "252": 256, "253": 257, "254": 258, "255": 259, "<mask>": 260}
|
dp/ko/posbert.base/label1.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"<s>": 0, "<pad>": 1, "</s>": 2, "<unk>": 3, "XX": 4, "NP": 5, "VP": 6, "NP_AJT": 7, "NP_SBJ": 8, "VP_MOD": 9, "NP_OBJ": 10, "NP_MOD": 11, "AP": 12, "NP_CNJ": 13, "DP": 14, "VNP": 15, "VNP_MOD": 16, "VP_CMP": 17, "VP_AJT": 18, "NP_CMP": 19, "VP_OBJ": 20, "VNP_CMP": 21, "VP_SBJ": 22, "X": 23, "VNP_OBJ": 24, "VP_CNJ": 25, "IP": 26, "VNP_AJT": 27, "VNP_CNJ": 28, "VNP_SBJ": 29, "AP_AJT": 30, "AP_MOD": 31, "R": 32, "L": 33, "X_CNJ": 34, "IP_CMP": 35, "X_MOD": 36, "AP_CNJ": 37, "X_AJT": 38, "AP_SBJ": 39, "DP_MOD": 40, "X_SBJ": 41, "AP_OBJ": 42, "IP_AJT": 43, "L_MOD": 44, "IP_SBJ": 45, "X_CMP": 46, "X_OBJ": 47, "AP_CMP": 48, "DP_AJT": 49, "DP_SBJ": 50, "IP_CNJ": 51, "IP_OBJ": 52, "madeupword0000": 53, "madeupword0001": 54, "madeupword0002": 55, "<mask>": 56}
|
dp/ko/posbert.base/pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c24807b770c28b452f935026165131ca590fde619ad40b450ee95388bd74a55c
|
3 |
+
size 560069467
|
dp/ko/posbert.base/vocab.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|