{
  "version": "1.0",
  "truncation": null,
  "padding": null,
  "added_tokens": [
    {
      "id": 112,
      "content": "[UNK]",
      "single_word": false,
      "lstrip": false,
      "rstrip": false,
      "normalized": false,
      "special": true
    },
    {
      "id": 113,
      "content": "[PAD]",
      "single_word": false,
      "lstrip": false,
      "rstrip": false,
      "normalized": false,
      "special": true
    },
    {
      "id": 114,
      "content": "[MASK]",
      "single_word": false,
      "lstrip": false,
      "rstrip": false,
      "normalized": false,
      "special": true
    },
    {
      "id": 115,
      "content": "[SEP]",
      "single_word": false,
      "lstrip": false,
      "rstrip": false,
      "normalized": false,
      "special": true
    },
    {
      "id": 116,
      "content": "[CLS]",
      "single_word": false,
      "lstrip": false,
      "rstrip": false,
      "normalized": false,
      "special": true
    }
  ],
  "normalizer": {
    "type": "Sequence",
    "normalizers": []
  },
  "pre_tokenizer": {
    "type": "WhitespaceSplit"
  },
  "post_processor": null,
  "decoder": {
    "type": "WordPiece",
    "prefix": "##",
    "cleanup": true
  },
  "model": {
    "type": "WordLevel",
    "vocab": {
      "": 0,
      "": 1,
      "": 2,
      "": 3,
      "": 4,
      "": 5,
      "IDX_0": 6,
      "IDX_1": 7,
      "IDX_2": 8,
      "IDX_3": 9,
      "IDX_4": 10,
      "IDX_5": 11,
      "IDX_6": 12,
      "IDX_7": 13,
      "IDX_8": 14,
      "IDX_9": 15,
      "IDX_10": 16,
      "IDX_11": 17,
      "IDX_12": 18,
      "IDX_13": 19,
      "IDX_14": 20,
      "IDX_15": 21,
      "IDX_16": 22,
      "IDX_17": 23,
      "IDX_18": 24,
      "IDX_19": 25,
      "IDX_20": 26,
      "IDX_21": 27,
      "IDX_22": 28,
      "IDX_23": 29,
      "IDX_24": 30,
      "IDX_25": 31,
      "IDX_26": 32,
      "IDX_27": 33,
      "IDX_28": 34,
      "IDX_29": 35,
      "IDX_30": 36,
      "IDX_31": 37,
      "IDX_32": 38,
      "IDX_33": 39,
      "IDX_34": 40,
      "IDX_35": 41,
      "IDX_36": 42,
      "IDX_37": 43,
      "IDX_38": 44,
      "IDX_39": 45,
      "IDX_40": 46,
      "IDX_41": 47,
      "IDX_42": 48,
      "IDX_43": 49,
      "IDX_44": 50,
      "IDX_45": 51,
      "IDX_46": 52,
      "IDX_47": 53,
      "IDX_48": 54,
      "IDX_49": 55,
      "IDX_50": 56,
      "IDX_51": 57,
      "IDX_52": 58,
      "IDX_53": 59,
      "IDX_54": 60,
      "IDX_55": 61,
      "IDX_56": 62,
      "IDX_57": 63,
      "IDX_58": 64,
      "IDX_59": 65,
      "IDX_60": 66,
      "IDX_61": 67,
      "IDX_62": 68,
      "IDX_63": 69,
      "IDX_64": 70,
      "IDX_65": 71,
      "IDX_66": 72,
      "IDX_67": 73,
      "IDX_68": 74,
      "IDX_69": 75,
      "IDX_70": 76,
      "IDX_71": 77,
      "IDX_72": 78,
      "IDX_73": 79,
      "IDX_74": 80,
      "IDX_75": 81,
      "IDX_76": 82,
      "IDX_77": 83,
      "IDX_78": 84,
      "IDX_79": 85,
      "IDX_80": 86,
      "IDX_81": 87,
      "IDX_82": 88,
      "IDX_83": 89,
      "IDX_84": 90,
      "IDX_85": 91,
      "IDX_86": 92,
      "IDX_87": 93,
      "IDX_88": 94,
      "IDX_89": 95,
      "ATOM_C": 96,
      "ATOM_N": 97,
      "ATOM_O": 98,
      "ATOM_F": 99,
      "ATOM_B": 100,
      "ATOM_Br": 101,
      "ATOM_Cl": 102,
      "ATOM_I": 103,
      "ATOM_P": 104,
      "ATOM_S": 105,
      "ATOM_Se": 106,
      "ATOM_Si": 107,
      "BOND_SINGLE": 108,
      "BOND_DOUBLE": 109,
      "BOND_TRIPLE": 110,
      "BOND_AROMATIC": 111,
      "[UNK]": 112,
      "[PAD]": 113,
      "[MASK]": 114,
      "[SEP]": 115,
      "[CLS]": 116
    },
    "unk_token": "[UNK]"
  }
}