kinqsradio committed on
Commit
2e62033
·
verified ·
1 Parent(s): f8f7da7

Update tokenizer_config.json

Browse files
Files changed (1) hide show
  1. tokenizer_config.json +6 -21
tokenizer_config.json CHANGED
@@ -26,36 +26,21 @@
26
  "rstrip": false,
27
  "single_word": false,
28
  "special": true
29
- },
30
- "32000": {
31
- "content": "<|im_end|>",
32
- "lstrip": false,
33
- "normalized": false,
34
- "rstrip": false,
35
- "single_word": false,
36
- "special": true
37
- },
38
- "32001": {
39
- "content": "<|im_start|>",
40
- "lstrip": false,
41
- "normalized": false,
42
- "rstrip": false,
43
- "single_word": false,
44
- "special": false
45
  }
46
  },
47
  "additional_special_tokens": [],
48
  "bos_token": "<s>",
49
- "chat_template": "{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}",
50
  "clean_up_tokenization_spaces": false,
51
- "eos_token": "<|im_end|>",
52
  "legacy": true,
53
  "model_max_length": 1000000000000000019884624838656,
54
- "pad_token": "</s>",
 
55
  "sp_model_kwargs": {},
56
  "spaces_between_special_tokens": false,
 
57
  "tokenizer_class": "LlamaTokenizer",
58
  "unk_token": "<unk>",
59
- "use_default_system_prompt": false,
60
- "use_fast": true
61
  }
 
26
  "rstrip": false,
27
  "single_word": false,
28
  "special": true
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
29
  }
30
  },
31
  "additional_special_tokens": [],
32
  "bos_token": "<s>",
33
+ "chat_template": "{{ bos_token }}{% for message in messages %}{% if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}{{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}{% endif %}{% if message['role'] == 'user' %}{{ '[INST] ' + message['content'] + ' [/INST]' }}{% elif message['role'] == 'assistant' %}{{ message['content'] + eos_token}}{% else %}{{ raise_exception('Only user and assistant roles are supported!') }}{% endif %}{% endfor %}",
34
  "clean_up_tokenization_spaces": false,
35
+ "eos_token": "</s>",
36
  "legacy": true,
37
  "model_max_length": 1000000000000000019884624838656,
38
+ "pad_token": null,
39
+ "padding_side": "left",
40
  "sp_model_kwargs": {},
41
  "spaces_between_special_tokens": false,
42
+ "split_special_tokens": false,
43
  "tokenizer_class": "LlamaTokenizer",
44
  "unk_token": "<unk>",
45
+ "use_default_system_prompt": false
 
46
  }