leafspark committed on
Commit
d730ac2
·
verified ·
1 Parent(s): 3e53702

model: add config and tokenizer

Browse files
Files changed (3) hide show
  1. added_tokens.json +1002 -0
  2. config.json +30 -0
  3. tokenizer.model +3 -0
added_tokens.json ADDED
@@ -0,0 +1,1002 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "<extra_id_0>": 4,
3
+ "<extra_id_1>": 5,
4
+ "<extra_id_2>": 6,
5
+ "<extra_id_3>": 7,
6
+ "<extra_id_4>": 8,
7
+ "<extra_id_5>": 9,
8
+ "<extra_id_6>": 10,
9
+ "<extra_id_7>": 11,
10
+ "<extra_id_8>": 12,
11
+ "<extra_id_9>": 13,
12
+ "<extra_id_10>": 14,
13
+ "<extra_id_11>": 15,
14
+ "<extra_id_12>": 16,
15
+ "<extra_id_13>": 17,
16
+ "<extra_id_14>": 18,
17
+ "<extra_id_15>": 19,
18
+ "<extra_id_16>": 20,
19
+ "<extra_id_17>": 21,
20
+ "<extra_id_18>": 22,
21
+ "<extra_id_19>": 23,
22
+ "<extra_id_20>": 24,
23
+ "<extra_id_21>": 25,
24
+ "<extra_id_22>": 26,
25
+ "<extra_id_23>": 27,
26
+ "<extra_id_24>": 28,
27
+ "<extra_id_25>": 29,
28
+ "<extra_id_26>": 30,
29
+ "<extra_id_27>": 31,
30
+ "<extra_id_28>": 32,
31
+ "<extra_id_29>": 33,
32
+ "<extra_id_30>": 34,
33
+ "<extra_id_31>": 35,
34
+ "<extra_id_32>": 36,
35
+ "<extra_id_33>": 37,
36
+ "<extra_id_34>": 38,
37
+ "<extra_id_35>": 39,
38
+ "<extra_id_36>": 40,
39
+ "<extra_id_37>": 41,
40
+ "<extra_id_38>": 42,
41
+ "<extra_id_39>": 43,
42
+ "<extra_id_40>": 44,
43
+ "<extra_id_41>": 45,
44
+ "<extra_id_42>": 46,
45
+ "<extra_id_43>": 47,
46
+ "<extra_id_44>": 48,
47
+ "<extra_id_45>": 49,
48
+ "<extra_id_46>": 50,
49
+ "<extra_id_47>": 51,
50
+ "<extra_id_48>": 52,
51
+ "<extra_id_49>": 53,
52
+ "<extra_id_50>": 54,
53
+ "<extra_id_51>": 55,
54
+ "<extra_id_52>": 56,
55
+ "<extra_id_53>": 57,
56
+ "<extra_id_54>": 58,
57
+ "<extra_id_55>": 59,
58
+ "<extra_id_56>": 60,
59
+ "<extra_id_57>": 61,
60
+ "<extra_id_58>": 62,
61
+ "<extra_id_59>": 63,
62
+ "<extra_id_60>": 64,
63
+ "<extra_id_61>": 65,
64
+ "<extra_id_62>": 66,
65
+ "<extra_id_63>": 67,
66
+ "<extra_id_64>": 68,
67
+ "<extra_id_65>": 69,
68
+ "<extra_id_66>": 70,
69
+ "<extra_id_67>": 71,
70
+ "<extra_id_68>": 72,
71
+ "<extra_id_69>": 73,
72
+ "<extra_id_70>": 74,
73
+ "<extra_id_71>": 75,
74
+ "<extra_id_72>": 76,
75
+ "<extra_id_73>": 77,
76
+ "<extra_id_74>": 78,
77
+ "<extra_id_75>": 79,
78
+ "<extra_id_76>": 80,
79
+ "<extra_id_77>": 81,
80
+ "<extra_id_78>": 82,
81
+ "<extra_id_79>": 83,
82
+ "<extra_id_80>": 84,
83
+ "<extra_id_81>": 85,
84
+ "<extra_id_82>": 86,
85
+ "<extra_id_83>": 87,
86
+ "<extra_id_84>": 88,
87
+ "<extra_id_85>": 89,
88
+ "<extra_id_86>": 90,
89
+ "<extra_id_87>": 91,
90
+ "<extra_id_88>": 92,
91
+ "<extra_id_89>": 93,
92
+ "<extra_id_90>": 94,
93
+ "<extra_id_91>": 95,
94
+ "<extra_id_92>": 96,
95
+ "<extra_id_93>": 97,
96
+ "<extra_id_94>": 98,
97
+ "<extra_id_95>": 99,
98
+ "<extra_id_96>": 100,
99
+ "<extra_id_97>": 101,
100
+ "<extra_id_98>": 102,
101
+ "<extra_id_99>": 103,
102
+ "<extra_id_100>": 104,
103
+ "<extra_id_101>": 105,
104
+ "<extra_id_102>": 106,
105
+ "<extra_id_103>": 107,
106
+ "<extra_id_104>": 108,
107
+ "<extra_id_105>": 109,
108
+ "<extra_id_106>": 110,
109
+ "<extra_id_107>": 111,
110
+ "<extra_id_108>": 112,
111
+ "<extra_id_109>": 113,
112
+ "<extra_id_110>": 114,
113
+ "<extra_id_111>": 115,
114
+ "<extra_id_112>": 116,
115
+ "<extra_id_113>": 117,
116
+ "<extra_id_114>": 118,
117
+ "<extra_id_115>": 119,
118
+ "<extra_id_116>": 120,
119
+ "<extra_id_117>": 121,
120
+ "<extra_id_118>": 122,
121
+ "<extra_id_119>": 123,
122
+ "<extra_id_120>": 124,
123
+ "<extra_id_121>": 125,
124
+ "<extra_id_122>": 126,
125
+ "<extra_id_123>": 127,
126
+ "<extra_id_124>": 128,
127
+ "<extra_id_125>": 129,
128
+ "<extra_id_126>": 130,
129
+ "<extra_id_127>": 131,
130
+ "<extra_id_128>": 132,
131
+ "<extra_id_129>": 133,
132
+ "<extra_id_130>": 134,
133
+ "<extra_id_131>": 135,
134
+ "<extra_id_132>": 136,
135
+ "<extra_id_133>": 137,
136
+ "<extra_id_134>": 138,
137
+ "<extra_id_135>": 139,
138
+ "<extra_id_136>": 140,
139
+ "<extra_id_137>": 141,
140
+ "<extra_id_138>": 142,
141
+ "<extra_id_139>": 143,
142
+ "<extra_id_140>": 144,
143
+ "<extra_id_141>": 145,
144
+ "<extra_id_142>": 146,
145
+ "<extra_id_143>": 147,
146
+ "<extra_id_144>": 148,
147
+ "<extra_id_145>": 149,
148
+ "<extra_id_146>": 150,
149
+ "<extra_id_147>": 151,
150
+ "<extra_id_148>": 152,
151
+ "<extra_id_149>": 153,
152
+ "<extra_id_150>": 154,
153
+ "<extra_id_151>": 155,
154
+ "<extra_id_152>": 156,
155
+ "<extra_id_153>": 157,
156
+ "<extra_id_154>": 158,
157
+ "<extra_id_155>": 159,
158
+ "<extra_id_156>": 160,
159
+ "<extra_id_157>": 161,
160
+ "<extra_id_158>": 162,
161
+ "<extra_id_159>": 163,
162
+ "<extra_id_160>": 164,
163
+ "<extra_id_161>": 165,
164
+ "<extra_id_162>": 166,
165
+ "<extra_id_163>": 167,
166
+ "<extra_id_164>": 168,
167
+ "<extra_id_165>": 169,
168
+ "<extra_id_166>": 170,
169
+ "<extra_id_167>": 171,
170
+ "<extra_id_168>": 172,
171
+ "<extra_id_169>": 173,
172
+ "<extra_id_170>": 174,
173
+ "<extra_id_171>": 175,
174
+ "<extra_id_172>": 176,
175
+ "<extra_id_173>": 177,
176
+ "<extra_id_174>": 178,
177
+ "<extra_id_175>": 179,
178
+ "<extra_id_176>": 180,
179
+ "<extra_id_177>": 181,
180
+ "<extra_id_178>": 182,
181
+ "<extra_id_179>": 183,
182
+ "<extra_id_180>": 184,
183
+ "<extra_id_181>": 185,
184
+ "<extra_id_182>": 186,
185
+ "<extra_id_183>": 187,
186
+ "<extra_id_184>": 188,
187
+ "<extra_id_185>": 189,
188
+ "<extra_id_186>": 190,
189
+ "<extra_id_187>": 191,
190
+ "<extra_id_188>": 192,
191
+ "<extra_id_189>": 193,
192
+ "<extra_id_190>": 194,
193
+ "<extra_id_191>": 195,
194
+ "<extra_id_192>": 196,
195
+ "<extra_id_193>": 197,
196
+ "<extra_id_194>": 198,
197
+ "<extra_id_195>": 199,
198
+ "<extra_id_196>": 200,
199
+ "<extra_id_197>": 201,
200
+ "<extra_id_198>": 202,
201
+ "<extra_id_199>": 203,
202
+ "<extra_id_200>": 204,
203
+ "<extra_id_201>": 205,
204
+ "<extra_id_202>": 206,
205
+ "<extra_id_203>": 207,
206
+ "<extra_id_204>": 208,
207
+ "<extra_id_205>": 209,
208
+ "<extra_id_206>": 210,
209
+ "<extra_id_207>": 211,
210
+ "<extra_id_208>": 212,
211
+ "<extra_id_209>": 213,
212
+ "<extra_id_210>": 214,
213
+ "<extra_id_211>": 215,
214
+ "<extra_id_212>": 216,
215
+ "<extra_id_213>": 217,
216
+ "<extra_id_214>": 218,
217
+ "<extra_id_215>": 219,
218
+ "<extra_id_216>": 220,
219
+ "<extra_id_217>": 221,
220
+ "<extra_id_218>": 222,
221
+ "<extra_id_219>": 223,
222
+ "<extra_id_220>": 224,
223
+ "<extra_id_221>": 225,
224
+ "<extra_id_222>": 226,
225
+ "<extra_id_223>": 227,
226
+ "<extra_id_224>": 228,
227
+ "<extra_id_225>": 229,
228
+ "<extra_id_226>": 230,
229
+ "<extra_id_227>": 231,
230
+ "<extra_id_228>": 232,
231
+ "<extra_id_229>": 233,
232
+ "<extra_id_230>": 234,
233
+ "<extra_id_231>": 235,
234
+ "<extra_id_232>": 236,
235
+ "<extra_id_233>": 237,
236
+ "<extra_id_234>": 238,
237
+ "<extra_id_235>": 239,
238
+ "<extra_id_236>": 240,
239
+ "<extra_id_237>": 241,
240
+ "<extra_id_238>": 242,
241
+ "<extra_id_239>": 243,
242
+ "<extra_id_240>": 244,
243
+ "<extra_id_241>": 245,
244
+ "<extra_id_242>": 246,
245
+ "<extra_id_243>": 247,
246
+ "<extra_id_244>": 248,
247
+ "<extra_id_245>": 249,
248
+ "<extra_id_246>": 250,
249
+ "<extra_id_247>": 251,
250
+ "<extra_id_248>": 252,
251
+ "<extra_id_249>": 253,
252
+ "<extra_id_250>": 254,
253
+ "<extra_id_251>": 255,
254
+ "<extra_id_252>": 256,
255
+ "<extra_id_253>": 257,
256
+ "<extra_id_254>": 258,
257
+ "<extra_id_255>": 259,
258
+ "<extra_id_256>": 260,
259
+ "<extra_id_257>": 261,
260
+ "<extra_id_258>": 262,
261
+ "<extra_id_259>": 263,
262
+ "<extra_id_260>": 264,
263
+ "<extra_id_261>": 265,
264
+ "<extra_id_262>": 266,
265
+ "<extra_id_263>": 267,
266
+ "<extra_id_264>": 268,
267
+ "<extra_id_265>": 269,
268
+ "<extra_id_266>": 270,
269
+ "<extra_id_267>": 271,
270
+ "<extra_id_268>": 272,
271
+ "<extra_id_269>": 273,
272
+ "<extra_id_270>": 274,
273
+ "<extra_id_271>": 275,
274
+ "<extra_id_272>": 276,
275
+ "<extra_id_273>": 277,
276
+ "<extra_id_274>": 278,
277
+ "<extra_id_275>": 279,
278
+ "<extra_id_276>": 280,
279
+ "<extra_id_277>": 281,
280
+ "<extra_id_278>": 282,
281
+ "<extra_id_279>": 283,
282
+ "<extra_id_280>": 284,
283
+ "<extra_id_281>": 285,
284
+ "<extra_id_282>": 286,
285
+ "<extra_id_283>": 287,
286
+ "<extra_id_284>": 288,
287
+ "<extra_id_285>": 289,
288
+ "<extra_id_286>": 290,
289
+ "<extra_id_287>": 291,
290
+ "<extra_id_288>": 292,
291
+ "<extra_id_289>": 293,
292
+ "<extra_id_290>": 294,
293
+ "<extra_id_291>": 295,
294
+ "<extra_id_292>": 296,
295
+ "<extra_id_293>": 297,
296
+ "<extra_id_294>": 298,
297
+ "<extra_id_295>": 299,
298
+ "<extra_id_296>": 300,
299
+ "<extra_id_297>": 301,
300
+ "<extra_id_298>": 302,
301
+ "<extra_id_299>": 303,
302
+ "<extra_id_300>": 304,
303
+ "<extra_id_301>": 305,
304
+ "<extra_id_302>": 306,
305
+ "<extra_id_303>": 307,
306
+ "<extra_id_304>": 308,
307
+ "<extra_id_305>": 309,
308
+ "<extra_id_306>": 310,
309
+ "<extra_id_307>": 311,
310
+ "<extra_id_308>": 312,
311
+ "<extra_id_309>": 313,
312
+ "<extra_id_310>": 314,
313
+ "<extra_id_311>": 315,
314
+ "<extra_id_312>": 316,
315
+ "<extra_id_313>": 317,
316
+ "<extra_id_314>": 318,
317
+ "<extra_id_315>": 319,
318
+ "<extra_id_316>": 320,
319
+ "<extra_id_317>": 321,
320
+ "<extra_id_318>": 322,
321
+ "<extra_id_319>": 323,
322
+ "<extra_id_320>": 324,
323
+ "<extra_id_321>": 325,
324
+ "<extra_id_322>": 326,
325
+ "<extra_id_323>": 327,
326
+ "<extra_id_324>": 328,
327
+ "<extra_id_325>": 329,
328
+ "<extra_id_326>": 330,
329
+ "<extra_id_327>": 331,
330
+ "<extra_id_328>": 332,
331
+ "<extra_id_329>": 333,
332
+ "<extra_id_330>": 334,
333
+ "<extra_id_331>": 335,
334
+ "<extra_id_332>": 336,
335
+ "<extra_id_333>": 337,
336
+ "<extra_id_334>": 338,
337
+ "<extra_id_335>": 339,
338
+ "<extra_id_336>": 340,
339
+ "<extra_id_337>": 341,
340
+ "<extra_id_338>": 342,
341
+ "<extra_id_339>": 343,
342
+ "<extra_id_340>": 344,
343
+ "<extra_id_341>": 345,
344
+ "<extra_id_342>": 346,
345
+ "<extra_id_343>": 347,
346
+ "<extra_id_344>": 348,
347
+ "<extra_id_345>": 349,
348
+ "<extra_id_346>": 350,
349
+ "<extra_id_347>": 351,
350
+ "<extra_id_348>": 352,
351
+ "<extra_id_349>": 353,
352
+ "<extra_id_350>": 354,
353
+ "<extra_id_351>": 355,
354
+ "<extra_id_352>": 356,
355
+ "<extra_id_353>": 357,
356
+ "<extra_id_354>": 358,
357
+ "<extra_id_355>": 359,
358
+ "<extra_id_356>": 360,
359
+ "<extra_id_357>": 361,
360
+ "<extra_id_358>": 362,
361
+ "<extra_id_359>": 363,
362
+ "<extra_id_360>": 364,
363
+ "<extra_id_361>": 365,
364
+ "<extra_id_362>": 366,
365
+ "<extra_id_363>": 367,
366
+ "<extra_id_364>": 368,
367
+ "<extra_id_365>": 369,
368
+ "<extra_id_366>": 370,
369
+ "<extra_id_367>": 371,
370
+ "<extra_id_368>": 372,
371
+ "<extra_id_369>": 373,
372
+ "<extra_id_370>": 374,
373
+ "<extra_id_371>": 375,
374
+ "<extra_id_372>": 376,
375
+ "<extra_id_373>": 377,
376
+ "<extra_id_374>": 378,
377
+ "<extra_id_375>": 379,
378
+ "<extra_id_376>": 380,
379
+ "<extra_id_377>": 381,
380
+ "<extra_id_378>": 382,
381
+ "<extra_id_379>": 383,
382
+ "<extra_id_380>": 384,
383
+ "<extra_id_381>": 385,
384
+ "<extra_id_382>": 386,
385
+ "<extra_id_383>": 387,
386
+ "<extra_id_384>": 388,
387
+ "<extra_id_385>": 389,
388
+ "<extra_id_386>": 390,
389
+ "<extra_id_387>": 391,
390
+ "<extra_id_388>": 392,
391
+ "<extra_id_389>": 393,
392
+ "<extra_id_390>": 394,
393
+ "<extra_id_391>": 395,
394
+ "<extra_id_392>": 396,
395
+ "<extra_id_393>": 397,
396
+ "<extra_id_394>": 398,
397
+ "<extra_id_395>": 399,
398
+ "<extra_id_396>": 400,
399
+ "<extra_id_397>": 401,
400
+ "<extra_id_398>": 402,
401
+ "<extra_id_399>": 403,
402
+ "<extra_id_400>": 404,
403
+ "<extra_id_401>": 405,
404
+ "<extra_id_402>": 406,
405
+ "<extra_id_403>": 407,
406
+ "<extra_id_404>": 408,
407
+ "<extra_id_405>": 409,
408
+ "<extra_id_406>": 410,
409
+ "<extra_id_407>": 411,
410
+ "<extra_id_408>": 412,
411
+ "<extra_id_409>": 413,
412
+ "<extra_id_410>": 414,
413
+ "<extra_id_411>": 415,
414
+ "<extra_id_412>": 416,
415
+ "<extra_id_413>": 417,
416
+ "<extra_id_414>": 418,
417
+ "<extra_id_415>": 419,
418
+ "<extra_id_416>": 420,
419
+ "<extra_id_417>": 421,
420
+ "<extra_id_418>": 422,
421
+ "<extra_id_419>": 423,
422
+ "<extra_id_420>": 424,
423
+ "<extra_id_421>": 425,
424
+ "<extra_id_422>": 426,
425
+ "<extra_id_423>": 427,
426
+ "<extra_id_424>": 428,
427
+ "<extra_id_425>": 429,
428
+ "<extra_id_426>": 430,
429
+ "<extra_id_427>": 431,
430
+ "<extra_id_428>": 432,
431
+ "<extra_id_429>": 433,
432
+ "<extra_id_430>": 434,
433
+ "<extra_id_431>": 435,
434
+ "<extra_id_432>": 436,
435
+ "<extra_id_433>": 437,
436
+ "<extra_id_434>": 438,
437
+ "<extra_id_435>": 439,
438
+ "<extra_id_436>": 440,
439
+ "<extra_id_437>": 441,
440
+ "<extra_id_438>": 442,
441
+ "<extra_id_439>": 443,
442
+ "<extra_id_440>": 444,
443
+ "<extra_id_441>": 445,
444
+ "<extra_id_442>": 446,
445
+ "<extra_id_443>": 447,
446
+ "<extra_id_444>": 448,
447
+ "<extra_id_445>": 449,
448
+ "<extra_id_446>": 450,
449
+ "<extra_id_447>": 451,
450
+ "<extra_id_448>": 452,
451
+ "<extra_id_449>": 453,
452
+ "<extra_id_450>": 454,
453
+ "<extra_id_451>": 455,
454
+ "<extra_id_452>": 456,
455
+ "<extra_id_453>": 457,
456
+ "<extra_id_454>": 458,
457
+ "<extra_id_455>": 459,
458
+ "<extra_id_456>": 460,
459
+ "<extra_id_457>": 461,
460
+ "<extra_id_458>": 462,
461
+ "<extra_id_459>": 463,
462
+ "<extra_id_460>": 464,
463
+ "<extra_id_461>": 465,
464
+ "<extra_id_462>": 466,
465
+ "<extra_id_463>": 467,
466
+ "<extra_id_464>": 468,
467
+ "<extra_id_465>": 469,
468
+ "<extra_id_466>": 470,
469
+ "<extra_id_467>": 471,
470
+ "<extra_id_468>": 472,
471
+ "<extra_id_469>": 473,
472
+ "<extra_id_470>": 474,
473
+ "<extra_id_471>": 475,
474
+ "<extra_id_472>": 476,
475
+ "<extra_id_473>": 477,
476
+ "<extra_id_474>": 478,
477
+ "<extra_id_475>": 479,
478
+ "<extra_id_476>": 480,
479
+ "<extra_id_477>": 481,
480
+ "<extra_id_478>": 482,
481
+ "<extra_id_479>": 483,
482
+ "<extra_id_480>": 484,
483
+ "<extra_id_481>": 485,
484
+ "<extra_id_482>": 486,
485
+ "<extra_id_483>": 487,
486
+ "<extra_id_484>": 488,
487
+ "<extra_id_485>": 489,
488
+ "<extra_id_486>": 490,
489
+ "<extra_id_487>": 491,
490
+ "<extra_id_488>": 492,
491
+ "<extra_id_489>": 493,
492
+ "<extra_id_490>": 494,
493
+ "<extra_id_491>": 495,
494
+ "<extra_id_492>": 496,
495
+ "<extra_id_493>": 497,
496
+ "<extra_id_494>": 498,
497
+ "<extra_id_495>": 499,
498
+ "<extra_id_496>": 500,
499
+ "<extra_id_497>": 501,
500
+ "<extra_id_498>": 502,
501
+ "<extra_id_499>": 503,
502
+ "<extra_id_500>": 504,
503
+ "<extra_id_501>": 505,
504
+ "<extra_id_502>": 506,
505
+ "<extra_id_503>": 507,
506
+ "<extra_id_504>": 508,
507
+ "<extra_id_505>": 509,
508
+ "<extra_id_506>": 510,
509
+ "<extra_id_507>": 511,
510
+ "<extra_id_508>": 512,
511
+ "<extra_id_509>": 513,
512
+ "<extra_id_510>": 514,
513
+ "<extra_id_511>": 515,
514
+ "<extra_id_512>": 516,
515
+ "<extra_id_513>": 517,
516
+ "<extra_id_514>": 518,
517
+ "<extra_id_515>": 519,
518
+ "<extra_id_516>": 520,
519
+ "<extra_id_517>": 521,
520
+ "<extra_id_518>": 522,
521
+ "<extra_id_519>": 523,
522
+ "<extra_id_520>": 524,
523
+ "<extra_id_521>": 525,
524
+ "<extra_id_522>": 526,
525
+ "<extra_id_523>": 527,
526
+ "<extra_id_524>": 528,
527
+ "<extra_id_525>": 529,
528
+ "<extra_id_526>": 530,
529
+ "<extra_id_527>": 531,
530
+ "<extra_id_528>": 532,
531
+ "<extra_id_529>": 533,
532
+ "<extra_id_530>": 534,
533
+ "<extra_id_531>": 535,
534
+ "<extra_id_532>": 536,
535
+ "<extra_id_533>": 537,
536
+ "<extra_id_534>": 538,
537
+ "<extra_id_535>": 539,
538
+ "<extra_id_536>": 540,
539
+ "<extra_id_537>": 541,
540
+ "<extra_id_538>": 542,
541
+ "<extra_id_539>": 543,
542
+ "<extra_id_540>": 544,
543
+ "<extra_id_541>": 545,
544
+ "<extra_id_542>": 546,
545
+ "<extra_id_543>": 547,
546
+ "<extra_id_544>": 548,
547
+ "<extra_id_545>": 549,
548
+ "<extra_id_546>": 550,
549
+ "<extra_id_547>": 551,
550
+ "<extra_id_548>": 552,
551
+ "<extra_id_549>": 553,
552
+ "<extra_id_550>": 554,
553
+ "<extra_id_551>": 555,
554
+ "<extra_id_552>": 556,
555
+ "<extra_id_553>": 557,
556
+ "<extra_id_554>": 558,
557
+ "<extra_id_555>": 559,
558
+ "<extra_id_556>": 560,
559
+ "<extra_id_557>": 561,
560
+ "<extra_id_558>": 562,
561
+ "<extra_id_559>": 563,
562
+ "<extra_id_560>": 564,
563
+ "<extra_id_561>": 565,
564
+ "<extra_id_562>": 566,
565
+ "<extra_id_563>": 567,
566
+ "<extra_id_564>": 568,
567
+ "<extra_id_565>": 569,
568
+ "<extra_id_566>": 570,
569
+ "<extra_id_567>": 571,
570
+ "<extra_id_568>": 572,
571
+ "<extra_id_569>": 573,
572
+ "<extra_id_570>": 574,
573
+ "<extra_id_571>": 575,
574
+ "<extra_id_572>": 576,
575
+ "<extra_id_573>": 577,
576
+ "<extra_id_574>": 578,
577
+ "<extra_id_575>": 579,
578
+ "<extra_id_576>": 580,
579
+ "<extra_id_577>": 581,
580
+ "<extra_id_578>": 582,
581
+ "<extra_id_579>": 583,
582
+ "<extra_id_580>": 584,
583
+ "<extra_id_581>": 585,
584
+ "<extra_id_582>": 586,
585
+ "<extra_id_583>": 587,
586
+ "<extra_id_584>": 588,
587
+ "<extra_id_585>": 589,
588
+ "<extra_id_586>": 590,
589
+ "<extra_id_587>": 591,
590
+ "<extra_id_588>": 592,
591
+ "<extra_id_589>": 593,
592
+ "<extra_id_590>": 594,
593
+ "<extra_id_591>": 595,
594
+ "<extra_id_592>": 596,
595
+ "<extra_id_593>": 597,
596
+ "<extra_id_594>": 598,
597
+ "<extra_id_595>": 599,
598
+ "<extra_id_596>": 600,
599
+ "<extra_id_597>": 601,
600
+ "<extra_id_598>": 602,
601
+ "<extra_id_599>": 603,
602
+ "<extra_id_600>": 604,
603
+ "<extra_id_601>": 605,
604
+ "<extra_id_602>": 606,
605
+ "<extra_id_603>": 607,
606
+ "<extra_id_604>": 608,
607
+ "<extra_id_605>": 609,
608
+ "<extra_id_606>": 610,
609
+ "<extra_id_607>": 611,
610
+ "<extra_id_608>": 612,
611
+ "<extra_id_609>": 613,
612
+ "<extra_id_610>": 614,
613
+ "<extra_id_611>": 615,
614
+ "<extra_id_612>": 616,
615
+ "<extra_id_613>": 617,
616
+ "<extra_id_614>": 618,
617
+ "<extra_id_615>": 619,
618
+ "<extra_id_616>": 620,
619
+ "<extra_id_617>": 621,
620
+ "<extra_id_618>": 622,
621
+ "<extra_id_619>": 623,
622
+ "<extra_id_620>": 624,
623
+ "<extra_id_621>": 625,
624
+ "<extra_id_622>": 626,
625
+ "<extra_id_623>": 627,
626
+ "<extra_id_624>": 628,
627
+ "<extra_id_625>": 629,
628
+ "<extra_id_626>": 630,
629
+ "<extra_id_627>": 631,
630
+ "<extra_id_628>": 632,
631
+ "<extra_id_629>": 633,
632
+ "<extra_id_630>": 634,
633
+ "<extra_id_631>": 635,
634
+ "<extra_id_632>": 636,
635
+ "<extra_id_633>": 637,
636
+ "<extra_id_634>": 638,
637
+ "<extra_id_635>": 639,
638
+ "<extra_id_636>": 640,
639
+ "<extra_id_637>": 641,
640
+ "<extra_id_638>": 642,
641
+ "<extra_id_639>": 643,
642
+ "<extra_id_640>": 644,
643
+ "<extra_id_641>": 645,
644
+ "<extra_id_642>": 646,
645
+ "<extra_id_643>": 647,
646
+ "<extra_id_644>": 648,
647
+ "<extra_id_645>": 649,
648
+ "<extra_id_646>": 650,
649
+ "<extra_id_647>": 651,
650
+ "<extra_id_648>": 652,
651
+ "<extra_id_649>": 653,
652
+ "<extra_id_650>": 654,
653
+ "<extra_id_651>": 655,
654
+ "<extra_id_652>": 656,
655
+ "<extra_id_653>": 657,
656
+ "<extra_id_654>": 658,
657
+ "<extra_id_655>": 659,
658
+ "<extra_id_656>": 660,
659
+ "<extra_id_657>": 661,
660
+ "<extra_id_658>": 662,
661
+ "<extra_id_659>": 663,
662
+ "<extra_id_660>": 664,
663
+ "<extra_id_661>": 665,
664
+ "<extra_id_662>": 666,
665
+ "<extra_id_663>": 667,
666
+ "<extra_id_664>": 668,
667
+ "<extra_id_665>": 669,
668
+ "<extra_id_666>": 670,
669
+ "<extra_id_667>": 671,
670
+ "<extra_id_668>": 672,
671
+ "<extra_id_669>": 673,
672
+ "<extra_id_670>": 674,
673
+ "<extra_id_671>": 675,
674
+ "<extra_id_672>": 676,
675
+ "<extra_id_673>": 677,
676
+ "<extra_id_674>": 678,
677
+ "<extra_id_675>": 679,
678
+ "<extra_id_676>": 680,
679
+ "<extra_id_677>": 681,
680
+ "<extra_id_678>": 682,
681
+ "<extra_id_679>": 683,
682
+ "<extra_id_680>": 684,
683
+ "<extra_id_681>": 685,
684
+ "<extra_id_682>": 686,
685
+ "<extra_id_683>": 687,
686
+ "<extra_id_684>": 688,
687
+ "<extra_id_685>": 689,
688
+ "<extra_id_686>": 690,
689
+ "<extra_id_687>": 691,
690
+ "<extra_id_688>": 692,
691
+ "<extra_id_689>": 693,
692
+ "<extra_id_690>": 694,
693
+ "<extra_id_691>": 695,
694
+ "<extra_id_692>": 696,
695
+ "<extra_id_693>": 697,
696
+ "<extra_id_694>": 698,
697
+ "<extra_id_695>": 699,
698
+ "<extra_id_696>": 700,
699
+ "<extra_id_697>": 701,
700
+ "<extra_id_698>": 702,
701
+ "<extra_id_699>": 703,
702
+ "<extra_id_700>": 704,
703
+ "<extra_id_701>": 705,
704
+ "<extra_id_702>": 706,
705
+ "<extra_id_703>": 707,
706
+ "<extra_id_704>": 708,
707
+ "<extra_id_705>": 709,
708
+ "<extra_id_706>": 710,
709
+ "<extra_id_707>": 711,
710
+ "<extra_id_708>": 712,
711
+ "<extra_id_709>": 713,
712
+ "<extra_id_710>": 714,
713
+ "<extra_id_711>": 715,
714
+ "<extra_id_712>": 716,
715
+ "<extra_id_713>": 717,
716
+ "<extra_id_714>": 718,
717
+ "<extra_id_715>": 719,
718
+ "<extra_id_716>": 720,
719
+ "<extra_id_717>": 721,
720
+ "<extra_id_718>": 722,
721
+ "<extra_id_719>": 723,
722
+ "<extra_id_720>": 724,
723
+ "<extra_id_721>": 725,
724
+ "<extra_id_722>": 726,
725
+ "<extra_id_723>": 727,
726
+ "<extra_id_724>": 728,
727
+ "<extra_id_725>": 729,
728
+ "<extra_id_726>": 730,
729
+ "<extra_id_727>": 731,
730
+ "<extra_id_728>": 732,
731
+ "<extra_id_729>": 733,
732
+ "<extra_id_730>": 734,
733
+ "<extra_id_731>": 735,
734
+ "<extra_id_732>": 736,
735
+ "<extra_id_733>": 737,
736
+ "<extra_id_734>": 738,
737
+ "<extra_id_735>": 739,
738
+ "<extra_id_736>": 740,
739
+ "<extra_id_737>": 741,
740
+ "<extra_id_738>": 742,
741
+ "<extra_id_739>": 743,
742
+ "<extra_id_740>": 744,
743
+ "<extra_id_741>": 745,
744
+ "<extra_id_742>": 746,
745
+ "<extra_id_743>": 747,
746
+ "<extra_id_744>": 748,
747
+ "<extra_id_745>": 749,
748
+ "<extra_id_746>": 750,
749
+ "<extra_id_747>": 751,
750
+ "<extra_id_748>": 752,
751
+ "<extra_id_749>": 753,
752
+ "<extra_id_750>": 754,
753
+ "<extra_id_751>": 755,
754
+ "<extra_id_752>": 756,
755
+ "<extra_id_753>": 757,
756
+ "<extra_id_754>": 758,
757
+ "<extra_id_755>": 759,
758
+ "<extra_id_756>": 760,
759
+ "<extra_id_757>": 761,
760
+ "<extra_id_758>": 762,
761
+ "<extra_id_759>": 763,
762
+ "<extra_id_760>": 764,
763
+ "<extra_id_761>": 765,
764
+ "<extra_id_762>": 766,
765
+ "<extra_id_763>": 767,
766
+ "<extra_id_764>": 768,
767
+ "<extra_id_765>": 769,
768
+ "<extra_id_766>": 770,
769
+ "<extra_id_767>": 771,
770
+ "<extra_id_768>": 772,
771
+ "<extra_id_769>": 773,
772
+ "<extra_id_770>": 774,
773
+ "<extra_id_771>": 775,
774
+ "<extra_id_772>": 776,
775
+ "<extra_id_773>": 777,
776
+ "<extra_id_774>": 778,
777
+ "<extra_id_775>": 779,
778
+ "<extra_id_776>": 780,
779
+ "<extra_id_777>": 781,
780
+ "<extra_id_778>": 782,
781
+ "<extra_id_779>": 783,
782
+ "<extra_id_780>": 784,
783
+ "<extra_id_781>": 785,
784
+ "<extra_id_782>": 786,
785
+ "<extra_id_783>": 787,
786
+ "<extra_id_784>": 788,
787
+ "<extra_id_785>": 789,
788
+ "<extra_id_786>": 790,
789
+ "<extra_id_787>": 791,
790
+ "<extra_id_788>": 792,
791
+ "<extra_id_789>": 793,
792
+ "<extra_id_790>": 794,
793
+ "<extra_id_791>": 795,
794
+ "<extra_id_792>": 796,
795
+ "<extra_id_793>": 797,
796
+ "<extra_id_794>": 798,
797
+ "<extra_id_795>": 799,
798
+ "<extra_id_796>": 800,
799
+ "<extra_id_797>": 801,
800
+ "<extra_id_798>": 802,
801
+ "<extra_id_799>": 803,
802
+ "<extra_id_800>": 804,
803
+ "<extra_id_801>": 805,
804
+ "<extra_id_802>": 806,
805
+ "<extra_id_803>": 807,
806
+ "<extra_id_804>": 808,
807
+ "<extra_id_805>": 809,
808
+ "<extra_id_806>": 810,
809
+ "<extra_id_807>": 811,
810
+ "<extra_id_808>": 812,
811
+ "<extra_id_809>": 813,
812
+ "<extra_id_810>": 814,
813
+ "<extra_id_811>": 815,
814
+ "<extra_id_812>": 816,
815
+ "<extra_id_813>": 817,
816
+ "<extra_id_814>": 818,
817
+ "<extra_id_815>": 819,
818
+ "<extra_id_816>": 820,
819
+ "<extra_id_817>": 821,
820
+ "<extra_id_818>": 822,
821
+ "<extra_id_819>": 823,
822
+ "<extra_id_820>": 824,
823
+ "<extra_id_821>": 825,
824
+ "<extra_id_822>": 826,
825
+ "<extra_id_823>": 827,
826
+ "<extra_id_824>": 828,
827
+ "<extra_id_825>": 829,
828
+ "<extra_id_826>": 830,
829
+ "<extra_id_827>": 831,
830
+ "<extra_id_828>": 832,
831
+ "<extra_id_829>": 833,
832
+ "<extra_id_830>": 834,
833
+ "<extra_id_831>": 835,
834
+ "<extra_id_832>": 836,
835
+ "<extra_id_833>": 837,
836
+ "<extra_id_834>": 838,
837
+ "<extra_id_835>": 839,
838
+ "<extra_id_836>": 840,
839
+ "<extra_id_837>": 841,
840
+ "<extra_id_838>": 842,
841
+ "<extra_id_839>": 843,
842
+ "<extra_id_840>": 844,
843
+ "<extra_id_841>": 845,
844
+ "<extra_id_842>": 846,
845
+ "<extra_id_843>": 847,
846
+ "<extra_id_844>": 848,
847
+ "<extra_id_845>": 849,
848
+ "<extra_id_846>": 850,
849
+ "<extra_id_847>": 851,
850
+ "<extra_id_848>": 852,
851
+ "<extra_id_849>": 853,
852
+ "<extra_id_850>": 854,
853
+ "<extra_id_851>": 855,
854
+ "<extra_id_852>": 856,
855
+ "<extra_id_853>": 857,
856
+ "<extra_id_854>": 858,
857
+ "<extra_id_855>": 859,
858
+ "<extra_id_856>": 860,
859
+ "<extra_id_857>": 861,
860
+ "<extra_id_858>": 862,
861
+ "<extra_id_859>": 863,
862
+ "<extra_id_860>": 864,
863
+ "<extra_id_861>": 865,
864
+ "<extra_id_862>": 866,
865
+ "<extra_id_863>": 867,
866
+ "<extra_id_864>": 868,
867
+ "<extra_id_865>": 869,
868
+ "<extra_id_866>": 870,
869
+ "<extra_id_867>": 871,
870
+ "<extra_id_868>": 872,
871
+ "<extra_id_869>": 873,
872
+ "<extra_id_870>": 874,
873
+ "<extra_id_871>": 875,
874
+ "<extra_id_872>": 876,
875
+ "<extra_id_873>": 877,
876
+ "<extra_id_874>": 878,
877
+ "<extra_id_875>": 879,
878
+ "<extra_id_876>": 880,
879
+ "<extra_id_877>": 881,
880
+ "<extra_id_878>": 882,
881
+ "<extra_id_879>": 883,
882
+ "<extra_id_880>": 884,
883
+ "<extra_id_881>": 885,
884
+ "<extra_id_882>": 886,
885
+ "<extra_id_883>": 887,
886
+ "<extra_id_884>": 888,
887
+ "<extra_id_885>": 889,
888
+ "<extra_id_886>": 890,
889
+ "<extra_id_887>": 891,
890
+ "<extra_id_888>": 892,
891
+ "<extra_id_889>": 893,
892
+ "<extra_id_890>": 894,
893
+ "<extra_id_891>": 895,
894
+ "<extra_id_892>": 896,
895
+ "<extra_id_893>": 897,
896
+ "<extra_id_894>": 898,
897
+ "<extra_id_895>": 899,
898
+ "<extra_id_896>": 900,
899
+ "<extra_id_897>": 901,
900
+ "<extra_id_898>": 902,
901
+ "<extra_id_899>": 903,
902
+ "<extra_id_900>": 904,
903
+ "<extra_id_901>": 905,
904
+ "<extra_id_902>": 906,
905
+ "<extra_id_903>": 907,
906
+ "<extra_id_904>": 908,
907
+ "<extra_id_905>": 909,
908
+ "<extra_id_906>": 910,
909
+ "<extra_id_907>": 911,
910
+ "<extra_id_908>": 912,
911
+ "<extra_id_909>": 913,
912
+ "<extra_id_910>": 914,
913
+ "<extra_id_911>": 915,
914
+ "<extra_id_912>": 916,
915
+ "<extra_id_913>": 917,
916
+ "<extra_id_914>": 918,
917
+ "<extra_id_915>": 919,
918
+ "<extra_id_916>": 920,
919
+ "<extra_id_917>": 921,
920
+ "<extra_id_918>": 922,
921
+ "<extra_id_919>": 923,
922
+ "<extra_id_920>": 924,
923
+ "<extra_id_921>": 925,
924
+ "<extra_id_922>": 926,
925
+ "<extra_id_923>": 927,
926
+ "<extra_id_924>": 928,
927
+ "<extra_id_925>": 929,
928
+ "<extra_id_926>": 930,
929
+ "<extra_id_927>": 931,
930
+ "<extra_id_928>": 932,
931
+ "<extra_id_929>": 933,
932
+ "<extra_id_930>": 934,
933
+ "<extra_id_931>": 935,
934
+ "<extra_id_932>": 936,
935
+ "<extra_id_933>": 937,
936
+ "<extra_id_934>": 938,
937
+ "<extra_id_935>": 939,
938
+ "<extra_id_936>": 940,
939
+ "<extra_id_937>": 941,
940
+ "<extra_id_938>": 942,
941
+ "<extra_id_939>": 943,
942
+ "<extra_id_940>": 944,
943
+ "<extra_id_941>": 945,
944
+ "<extra_id_942>": 946,
945
+ "<extra_id_943>": 947,
946
+ "<extra_id_944>": 948,
947
+ "<extra_id_945>": 949,
948
+ "<extra_id_946>": 950,
949
+ "<extra_id_947>": 951,
950
+ "<extra_id_948>": 952,
951
+ "<extra_id_949>": 953,
952
+ "<extra_id_950>": 954,
953
+ "<extra_id_951>": 955,
954
+ "<extra_id_952>": 956,
955
+ "<extra_id_953>": 957,
956
+ "<extra_id_954>": 958,
957
+ "<extra_id_955>": 959,
958
+ "<extra_id_956>": 960,
959
+ "<extra_id_957>": 961,
960
+ "<extra_id_958>": 962,
961
+ "<extra_id_959>": 963,
962
+ "<extra_id_960>": 964,
963
+ "<extra_id_961>": 965,
964
+ "<extra_id_962>": 966,
965
+ "<extra_id_963>": 967,
966
+ "<extra_id_964>": 968,
967
+ "<extra_id_965>": 969,
968
+ "<extra_id_966>": 970,
969
+ "<extra_id_967>": 971,
970
+ "<extra_id_968>": 972,
971
+ "<extra_id_969>": 973,
972
+ "<extra_id_970>": 974,
973
+ "<extra_id_971>": 975,
974
+ "<extra_id_972>": 976,
975
+ "<extra_id_973>": 977,
976
+ "<extra_id_974>": 978,
977
+ "<extra_id_975>": 979,
978
+ "<extra_id_976>": 980,
979
+ "<extra_id_977>": 981,
980
+ "<extra_id_978>": 982,
981
+ "<extra_id_979>": 983,
982
+ "<extra_id_980>": 984,
983
+ "<extra_id_981>": 985,
984
+ "<extra_id_982>": 986,
985
+ "<extra_id_983>": 987,
986
+ "<extra_id_984>": 988,
987
+ "<extra_id_985>": 989,
988
+ "<extra_id_986>": 990,
989
+ "<extra_id_987>": 991,
990
+ "<extra_id_988>": 992,
991
+ "<extra_id_989>": 993,
992
+ "<extra_id_990>": 994,
993
+ "<extra_id_991>": 995,
994
+ "<extra_id_992>": 996,
995
+ "<extra_id_993>": 997,
996
+ "<extra_id_994>": 998,
997
+ "<extra_id_995>": 999,
998
+ "<extra_id_996>": 1000,
999
+ "<extra_id_997>": 1001,
1000
+ "<extra_id_998>": 1002,
1001
+ "<extra_id_999>": 1003
1002
+ }
config.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "NemotronForCausalLM"
4
+ ],
5
+ "attention_bias": false,
6
+ "attention_dropout": 0.0,
7
+ "unk_token_id": 1,
8
+ "bos_token_id": 2,
9
+ "eos_token_id": 3,
10
+ "pad_token_id": 0,
11
+ "hidden_act": "relu2",
12
+ "hidden_size": 18432,
13
+ "initializer_range": 0.0063,
14
+ "intermediate_size": 73728,
15
+ "max_position_embeddings": 4096,
16
+ "model_type": "nemotron",
17
+ "num_attention_heads": 96,
18
+ "num_hidden_layers": 96,
19
+ "num_key_value_heads": 8,
20
+ "pretraining_tp": 1,
21
+ "layer_norm_eps": 1e-05,
22
+ "rope_scaling": null,
23
+ "partial_rotary_factor": 0.5,
24
+ "rope_theta": 10000.0,
25
+ "tie_word_embeddings": false,
26
+ "torch_dtype": "bfloat16",
27
+ "transformers_version": "4.40.0.dev0",
28
+ "use_cache": true,
29
+ "vocab_size": 256000
30
+ }
tokenizer.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6dfd8b970f437002fc445214304969fe59e64d4f48500bd0b77ba55340f2d811
3
+ size 4545602