doberst commited on
Commit
602c611
·
verified ·
1 Parent(s): 85e6a41

Upload 11 files

Browse files
config.json ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "mistralai/Mistral-7B-Instruct-v0.2",
3
+ "architectures": [
4
+ "MistralForCausalLM"
5
+ ],
6
+ "attention_dropout": 0.0,
7
+ "bos_token_id": 1,
8
+ "eos_token_id": 2,
9
+ "head_dim": 128,
10
+ "hidden_act": "silu",
11
+ "hidden_size": 4096,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 14336,
14
+ "max_position_embeddings": 32768,
15
+ "model_type": "mistral",
16
+ "num_attention_heads": 32,
17
+ "num_hidden_layers": 32,
18
+ "num_key_value_heads": 8,
19
+ "rms_norm_eps": 1e-05,
20
+ "rope_theta": 1000000.0,
21
+ "sliding_window": null,
22
+ "tie_word_embeddings": false,
23
+ "torch_dtype": "bfloat16",
24
+ "transformers_version": "4.44.2",
25
+ "use_cache": true,
26
+ "vocab_size": 32000
27
+ }
generation_config.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 1,
4
+ "eos_token_id": 2,
5
+ "transformers_version": "4.44.2"
6
+ }
openvino_detokenizer.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e2e36b822674e05f8500a29c0528b7563dcced4a040e73b5d614126a075940d
3
+ size 332685
openvino_detokenizer.xml ADDED
@@ -0,0 +1,294 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ <?xml version="1.0"?>
2
+ <net name="detokenizer" version="11">
3
+ <layers>
4
+ <layer id="0" name="Parameter_259198" type="Parameter" version="opset1">
5
+ <data shape="?,?" element_type="i64" />
6
+ <output>
7
+ <port id="0" precision="I64" names="Parameter_259198">
8
+ <dim>-1</dim>
9
+ <dim>-1</dim>
10
+ </port>
11
+ </output>
12
+ </layer>
13
+ <layer id="1" name="Convert_259220" type="Convert" version="opset1">
14
+ <data destination_type="i32" />
15
+ <input>
16
+ <port id="0" precision="I64">
17
+ <dim>-1</dim>
18
+ <dim>-1</dim>
19
+ </port>
20
+ </input>
21
+ <output>
22
+ <port id="1" precision="I32">
23
+ <dim>-1</dim>
24
+ <dim>-1</dim>
25
+ </port>
26
+ </output>
27
+ </layer>
28
+ <layer id="2" name="Constant_259168" type="Const" version="opset1">
29
+ <data element_type="u8" shape="332678" offset="0" size="332678" />
30
+ <output>
31
+ <port id="0" precision="U8">
32
+ <dim>332678</dim>
33
+ </port>
34
+ </output>
35
+ </layer>
36
+ <layer id="3" name="StringTensorUnpack_259169" type="StringTensorUnpack" version="extension">
37
+ <data mode="begins_ends" />
38
+ <input>
39
+ <port id="0" precision="U8">
40
+ <dim>332678</dim>
41
+ </port>
42
+ </input>
43
+ <output>
44
+ <port id="1" precision="I32">
45
+ <dim>-1</dim>
46
+ </port>
47
+ <port id="2" precision="I32">
48
+ <dim>-1</dim>
49
+ </port>
50
+ <port id="3" precision="U8">
51
+ <dim>-1</dim>
52
+ </port>
53
+ </output>
54
+ </layer>
55
+ <layer id="4" name="VocabDecoder_259199" type="VocabDecoder" version="extension">
56
+ <data skip_tokens="0, 1, 2" />
57
+ <input>
58
+ <port id="0" precision="I32">
59
+ <dim>-1</dim>
60
+ <dim>-1</dim>
61
+ </port>
62
+ <port id="1" precision="I32">
63
+ <dim>-1</dim>
64
+ </port>
65
+ <port id="2" precision="I32">
66
+ <dim>-1</dim>
67
+ </port>
68
+ <port id="3" precision="U8">
69
+ <dim>-1</dim>
70
+ </port>
71
+ </input>
72
+ <output>
73
+ <port id="4" precision="I32">
74
+ <dim>-1</dim>
75
+ </port>
76
+ <port id="5" precision="I32">
77
+ <dim>-1</dim>
78
+ </port>
79
+ <port id="6" precision="I32">
80
+ <dim>-1</dim>
81
+ </port>
82
+ <port id="7" precision="I32">
83
+ <dim>-1</dim>
84
+ </port>
85
+ <port id="8" precision="U8">
86
+ <dim>-1</dim>
87
+ </port>
88
+ </output>
89
+ </layer>
90
+ <layer id="5" name="Constant_259201" type="Const" version="opset1">
91
+ <data element_type="u8" shape="3" offset="332678" size="3" />
92
+ <output>
93
+ <port id="0" precision="U8">
94
+ <dim>3</dim>
95
+ </port>
96
+ </output>
97
+ </layer>
98
+ <layer id="6" name="Constant_259203" type="Const" version="opset1">
99
+ <data element_type="u8" shape="1" offset="332681" size="1" />
100
+ <output>
101
+ <port id="0" precision="U8">
102
+ <dim>1</dim>
103
+ </port>
104
+ </output>
105
+ </layer>
106
+ <layer id="7" name="RegexNormalization_259204" type="RegexNormalization" version="extension">
107
+ <data global_replace="true" />
108
+ <input>
109
+ <port id="0" precision="I32">
110
+ <dim>-1</dim>
111
+ </port>
112
+ <port id="1" precision="I32">
113
+ <dim>-1</dim>
114
+ </port>
115
+ <port id="2" precision="U8">
116
+ <dim>-1</dim>
117
+ </port>
118
+ <port id="3" precision="U8">
119
+ <dim>3</dim>
120
+ </port>
121
+ <port id="4" precision="U8">
122
+ <dim>1</dim>
123
+ </port>
124
+ </input>
125
+ <output>
126
+ <port id="5" precision="I32">
127
+ <dim>-1</dim>
128
+ </port>
129
+ <port id="6" precision="I32">
130
+ <dim>-1</dim>
131
+ </port>
132
+ <port id="7" precision="U8">
133
+ <dim>-1</dim>
134
+ </port>
135
+ </output>
136
+ </layer>
137
+ <layer id="8" name="ByteFallback_259205" type="ByteFallback" version="extension">
138
+ <input>
139
+ <port id="0" precision="I32">
140
+ <dim>-1</dim>
141
+ </port>
142
+ <port id="1" precision="I32">
143
+ <dim>-1</dim>
144
+ </port>
145
+ <port id="2" precision="U8">
146
+ <dim>-1</dim>
147
+ </port>
148
+ </input>
149
+ <output>
150
+ <port id="3" precision="I32">
151
+ <dim>-1</dim>
152
+ </port>
153
+ <port id="4" precision="I32">
154
+ <dim>-1</dim>
155
+ </port>
156
+ <port id="5" precision="U8">
157
+ <dim>-1</dim>
158
+ </port>
159
+ </output>
160
+ </layer>
161
+ <layer id="9" name="FuzeRagged_259206" type="FuzeRagged" version="extension">
162
+ <input>
163
+ <port id="0" precision="I32">
164
+ <dim>-1</dim>
165
+ </port>
166
+ <port id="1" precision="I32">
167
+ <dim>-1</dim>
168
+ </port>
169
+ <port id="2" precision="I32">
170
+ <dim>-1</dim>
171
+ </port>
172
+ <port id="3" precision="I32">
173
+ <dim>-1</dim>
174
+ </port>
175
+ </input>
176
+ <output>
177
+ <port id="4" precision="I32">
178
+ <dim>-1</dim>
179
+ </port>
180
+ <port id="5" precision="I32">
181
+ <dim>-1</dim>
182
+ </port>
183
+ </output>
184
+ </layer>
185
+ <layer id="10" name="Constant_259208" type="Const" version="opset1">
186
+ <data element_type="u8" shape="2" offset="332682" size="2" />
187
+ <output>
188
+ <port id="0" precision="U8">
189
+ <dim>2</dim>
190
+ </port>
191
+ </output>
192
+ </layer>
193
+ <layer id="11" name="Constant_259210" type="Const" version="opset1">
194
+ <data element_type="u8" shape="0" offset="332684" size="1" />
195
+ <output>
196
+ <port id="0" precision="U8">
197
+ <dim>0</dim>
198
+ </port>
199
+ </output>
200
+ </layer>
201
+ <layer id="12" name="RegexNormalization_259211" type="RegexNormalization" version="extension">
202
+ <data global_replace="true" />
203
+ <input>
204
+ <port id="0" precision="I32">
205
+ <dim>-1</dim>
206
+ </port>
207
+ <port id="1" precision="I32">
208
+ <dim>-1</dim>
209
+ </port>
210
+ <port id="2" precision="U8">
211
+ <dim>-1</dim>
212
+ </port>
213
+ <port id="3" precision="U8">
214
+ <dim>2</dim>
215
+ </port>
216
+ <port id="4" precision="U8">
217
+ <dim>0</dim>
218
+ </port>
219
+ </input>
220
+ <output>
221
+ <port id="5" precision="I32">
222
+ <dim>-1</dim>
223
+ </port>
224
+ <port id="6" precision="I32">
225
+ <dim>-1</dim>
226
+ </port>
227
+ <port id="7" precision="U8">
228
+ <dim>-1</dim>
229
+ </port>
230
+ </output>
231
+ </layer>
232
+ <layer id="13" name="StringTensorPack_259212" type="StringTensorPack" version="extension">
233
+ <data mode="begins_ends" />
234
+ <input>
235
+ <port id="0" precision="I32">
236
+ <dim>-1</dim>
237
+ </port>
238
+ <port id="1" precision="I32">
239
+ <dim>-1</dim>
240
+ </port>
241
+ <port id="2" precision="U8">
242
+ <dim>-1</dim>
243
+ </port>
244
+ </input>
245
+ <output>
246
+ <port id="3" precision="STRING" names="string_output">
247
+ <dim>-1</dim>
248
+ </port>
249
+ </output>
250
+ </layer>
251
+ <layer id="14" name="Result_259213" type="Result" version="opset1">
252
+ <input>
253
+ <port id="0" precision="STRING">
254
+ <dim>-1</dim>
255
+ </port>
256
+ </input>
257
+ </layer>
258
+ </layers>
259
+ <edges>
260
+ <edge from-layer="0" from-port="0" to-layer="1" to-port="0" />
261
+ <edge from-layer="1" from-port="1" to-layer="4" to-port="0" />
262
+ <edge from-layer="2" from-port="0" to-layer="3" to-port="0" />
263
+ <edge from-layer="3" from-port="1" to-layer="4" to-port="1" />
264
+ <edge from-layer="3" from-port="2" to-layer="4" to-port="2" />
265
+ <edge from-layer="3" from-port="3" to-layer="4" to-port="3" />
266
+ <edge from-layer="4" from-port="6" to-layer="7" to-port="0" />
267
+ <edge from-layer="4" from-port="7" to-layer="7" to-port="1" />
268
+ <edge from-layer="4" from-port="8" to-layer="7" to-port="2" />
269
+ <edge from-layer="4" from-port="4" to-layer="9" to-port="0" />
270
+ <edge from-layer="4" from-port="5" to-layer="9" to-port="1" />
271
+ <edge from-layer="5" from-port="0" to-layer="7" to-port="3" />
272
+ <edge from-layer="6" from-port="0" to-layer="7" to-port="4" />
273
+ <edge from-layer="7" from-port="5" to-layer="8" to-port="0" />
274
+ <edge from-layer="7" from-port="6" to-layer="8" to-port="1" />
275
+ <edge from-layer="7" from-port="7" to-layer="8" to-port="2" />
276
+ <edge from-layer="8" from-port="3" to-layer="9" to-port="2" />
277
+ <edge from-layer="8" from-port="4" to-layer="9" to-port="3" />
278
+ <edge from-layer="8" from-port="5" to-layer="12" to-port="2" />
279
+ <edge from-layer="9" from-port="4" to-layer="12" to-port="0" />
280
+ <edge from-layer="9" from-port="5" to-layer="12" to-port="1" />
281
+ <edge from-layer="10" from-port="0" to-layer="12" to-port="3" />
282
+ <edge from-layer="11" from-port="0" to-layer="12" to-port="4" />
283
+ <edge from-layer="12" from-port="5" to-layer="13" to-port="0" />
284
+ <edge from-layer="12" from-port="6" to-layer="13" to-port="1" />
285
+ <edge from-layer="12" from-port="7" to-layer="13" to-port="2" />
286
+ <edge from-layer="13" from-port="3" to-layer="14" to-port="0" />
287
+ </edges>
288
+ <rt_info>
289
+ <bos_token_id value="1" />
290
+ <chat_template value="{%- if messages[0]['role'] == 'system' %}&#10; {%- set system_message = messages[0]['content'] %}&#10; {%- set loop_messages = messages[1:] %}&#10;{%- else %}&#10; {%- set loop_messages = messages %}&#10;{%- endif %}&#10;&#10;{{- bos_token }}&#10;{%- for message in loop_messages %}&#10; {%- if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}&#10; {{- raise_exception('After the optional system message, conversation roles must alternate user/assistant/user/assistant/...') }}&#10; {%- endif %}&#10; {%- if message['role'] == 'user' %}&#10; {%- if loop.first and system_message is defined %}&#10; {{- ' [INST] ' + system_message + '\n\n' + message['content'] + ' [/INST]' }}&#10; {%- else %}&#10; {{- ' [INST] ' + message['content'] + ' [/INST]' }}&#10; {%- endif %}&#10; {%- elif message['role'] == 'assistant' %}&#10; {{- ' ' + message['content'] + eos_token}}&#10; {%- else %}&#10; {{- raise_exception('Only user and assistant roles are supported, with the exception of an initial optional system message!') }}&#10; {%- endif %}&#10;{%- endfor %}&#10;" />
291
+ <eos_token_id value="2" />
292
+ <original_tokenizer_class value="&lt;class 'transformers.models.llama.tokenization_llama_fast.LlamaTokenizerFast'>" />
293
+ </rt_info>
294
+ </net>
openvino_model.xml ADDED
The diff for this file is too large to render. See raw diff
 
openvino_tokenizer.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e84a67e731dc9785f3a0cfadf22ec92b19eaf0c7518f21f7fc22a9d7904d4ff0
3
+ size 1033133
openvino_tokenizer.xml ADDED
@@ -0,0 +1,758 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ <?xml version="1.0"?>
2
+ <net name="tokenizer" version="11">
3
+ <layers>
4
+ <layer id="0" name="Parameter_259078" type="Parameter" version="opset1">
5
+ <data shape="?" element_type="string" />
6
+ <output>
7
+ <port id="0" precision="STRING" names="Parameter_259078">
8
+ <dim>-1</dim>
9
+ </port>
10
+ </output>
11
+ </layer>
12
+ <layer id="1" name="Constant_259182" type="Const" version="opset1">
13
+ <data element_type="i32" shape="" offset="0" size="4" />
14
+ <output>
15
+ <port id="0" precision="I32" />
16
+ </output>
17
+ </layer>
18
+ <layer id="2" name="Constant_259183" type="Const" version="opset1">
19
+ <data element_type="i32" shape="" offset="4" size="4" />
20
+ <output>
21
+ <port id="0" precision="I32" />
22
+ </output>
23
+ </layer>
24
+ <layer id="3" name="Constant_259184" type="Const" version="opset1">
25
+ <data element_type="i32" shape="1" offset="4" size="4" />
26
+ <output>
27
+ <port id="0" precision="I32">
28
+ <dim>1</dim>
29
+ </port>
30
+ </output>
31
+ </layer>
32
+ <layer id="4" name="Constant_259094" type="Const" version="opset1">
33
+ <data element_type="i32" shape="" offset="0" size="4" />
34
+ <output>
35
+ <port id="0" precision="I32" />
36
+ </output>
37
+ </layer>
38
+ <layer id="5" name="StringTensorUnpack_259079" type="StringTensorUnpack" version="extension">
39
+ <data mode="begins_ends" />
40
+ <input>
41
+ <port id="0" precision="STRING">
42
+ <dim>-1</dim>
43
+ </port>
44
+ </input>
45
+ <output>
46
+ <port id="1" precision="I32">
47
+ <dim>-1</dim>
48
+ </port>
49
+ <port id="2" precision="I32">
50
+ <dim>-1</dim>
51
+ </port>
52
+ <port id="3" precision="U8">
53
+ <dim>-1</dim>
54
+ </port>
55
+ </output>
56
+ </layer>
57
+ <layer id="6" name="Constant_259081" type="Const" version="opset1">
58
+ <data element_type="u8" shape="1" offset="8" size="1" />
59
+ <output>
60
+ <port id="0" precision="U8">
61
+ <dim>1</dim>
62
+ </port>
63
+ </output>
64
+ </layer>
65
+ <layer id="7" name="Constant_259083" type="Const" version="opset1">
66
+ <data element_type="u8" shape="3" offset="9" size="3" />
67
+ <output>
68
+ <port id="0" precision="U8">
69
+ <dim>3</dim>
70
+ </port>
71
+ </output>
72
+ </layer>
73
+ <layer id="8" name="RegexNormalization_259084" type="RegexNormalization" version="extension">
74
+ <data global_replace="true" />
75
+ <input>
76
+ <port id="0" precision="I32">
77
+ <dim>-1</dim>
78
+ </port>
79
+ <port id="1" precision="I32">
80
+ <dim>-1</dim>
81
+ </port>
82
+ <port id="2" precision="U8">
83
+ <dim>-1</dim>
84
+ </port>
85
+ <port id="3" precision="U8">
86
+ <dim>1</dim>
87
+ </port>
88
+ <port id="4" precision="U8">
89
+ <dim>3</dim>
90
+ </port>
91
+ </input>
92
+ <output>
93
+ <port id="5" precision="I32">
94
+ <dim>-1</dim>
95
+ </port>
96
+ <port id="6" precision="I32">
97
+ <dim>-1</dim>
98
+ </port>
99
+ <port id="7" precision="U8">
100
+ <dim>-1</dim>
101
+ </port>
102
+ </output>
103
+ </layer>
104
+ <layer id="9" name="Constant_259086" type="Const" version="opset1">
105
+ <data element_type="u8" shape="11" offset="12" size="11" />
106
+ <output>
107
+ <port id="0" precision="U8">
108
+ <dim>11</dim>
109
+ </port>
110
+ </output>
111
+ </layer>
112
+ <layer id="10" name="Constant_259088" type="Const" version="opset1">
113
+ <data element_type="u8" shape="5" offset="23" size="5" />
114
+ <output>
115
+ <port id="0" precision="U8">
116
+ <dim>5</dim>
117
+ </port>
118
+ </output>
119
+ </layer>
120
+ <layer id="11" name="RegexNormalization_259089" type="RegexNormalization" version="extension">
121
+ <data global_replace="true" />
122
+ <input>
123
+ <port id="0" precision="I32">
124
+ <dim>-1</dim>
125
+ </port>
126
+ <port id="1" precision="I32">
127
+ <dim>-1</dim>
128
+ </port>
129
+ <port id="2" precision="U8">
130
+ <dim>-1</dim>
131
+ </port>
132
+ <port id="3" precision="U8">
133
+ <dim>11</dim>
134
+ </port>
135
+ <port id="4" precision="U8">
136
+ <dim>5</dim>
137
+ </port>
138
+ </input>
139
+ <output>
140
+ <port id="5" precision="I32">
141
+ <dim>-1</dim>
142
+ </port>
143
+ <port id="6" precision="I32">
144
+ <dim>-1</dim>
145
+ </port>
146
+ <port id="7" precision="U8">
147
+ <dim>-1</dim>
148
+ </port>
149
+ </output>
150
+ </layer>
151
+ <layer id="12" name="ShapeOf_259090" type="ShapeOf" version="opset3">
152
+ <data output_type="i64" />
153
+ <input>
154
+ <port id="0" precision="I32">
155
+ <dim>-1</dim>
156
+ </port>
157
+ </input>
158
+ <output>
159
+ <port id="1" precision="I64">
160
+ <dim>1</dim>
161
+ </port>
162
+ </output>
163
+ </layer>
164
+ <layer id="13" name="Constant_259091" type="Const" version="opset1">
165
+ <data element_type="i32" shape="" offset="0" size="4" />
166
+ <output>
167
+ <port id="0" precision="I32" />
168
+ </output>
169
+ </layer>
170
+ <layer id="14" name="Constant_259092" type="Const" version="opset1">
171
+ <data element_type="i32" shape="" offset="0" size="4" />
172
+ <output>
173
+ <port id="0" precision="I32" />
174
+ </output>
175
+ </layer>
176
+ <layer id="15" name="Gather_259093" type="Gather" version="opset8">
177
+ <data batch_dims="0" />
178
+ <input>
179
+ <port id="0" precision="I64">
180
+ <dim>1</dim>
181
+ </port>
182
+ <port id="1" precision="I32" />
183
+ <port id="2" precision="I32" />
184
+ </input>
185
+ <output>
186
+ <port id="3" precision="I64" />
187
+ </output>
188
+ </layer>
189
+ <layer id="16" name="Constant_259095" type="Const" version="opset1">
190
+ <data element_type="i32" shape="" offset="4" size="4" />
191
+ <output>
192
+ <port id="0" precision="I32" />
193
+ </output>
194
+ </layer>
195
+ <layer id="17" name="Range_259096" type="Range" version="opset4">
196
+ <data output_type="i32" />
197
+ <input>
198
+ <port id="0" precision="I32" />
199
+ <port id="1" precision="I64" />
200
+ <port id="2" precision="I32" />
201
+ </input>
202
+ <output>
203
+ <port id="3" precision="I32">
204
+ <dim>-1</dim>
205
+ </port>
206
+ </output>
207
+ </layer>
208
+ <layer id="18" name="Constant_259098" type="Const" version="opset1">
209
+ <data element_type="i32" shape="" offset="4" size="4" />
210
+ <output>
211
+ <port id="0" precision="I32" />
212
+ </output>
213
+ </layer>
214
+ <layer id="19" name="Constant_259099" type="Const" version="opset1">
215
+ <data element_type="i64" shape="" offset="28" size="8" />
216
+ <output>
217
+ <port id="0" precision="I64" />
218
+ </output>
219
+ </layer>
220
+ <layer id="20" name="Add_259100" type="Add" version="opset1">
221
+ <data auto_broadcast="numpy" />
222
+ <input>
223
+ <port id="0" precision="I64" />
224
+ <port id="1" precision="I64" />
225
+ </input>
226
+ <output>
227
+ <port id="2" precision="I64" />
228
+ </output>
229
+ </layer>
230
+ <layer id="21" name="Constant_259101" type="Const" version="opset1">
231
+ <data element_type="i32" shape="" offset="4" size="4" />
232
+ <output>
233
+ <port id="0" precision="I32" />
234
+ </output>
235
+ </layer>
236
+ <layer id="22" name="Range_259102" type="Range" version="opset4">
237
+ <data output_type="i32" />
238
+ <input>
239
+ <port id="0" precision="I32" />
240
+ <port id="1" precision="I64" />
241
+ <port id="2" precision="I32" />
242
+ </input>
243
+ <output>
244
+ <port id="3" precision="I32">
245
+ <dim>-1</dim>
246
+ </port>
247
+ </output>
248
+ </layer>
249
+ <layer id="23" name="Constant_259165" type="Const" version="opset1">
250
+ <data element_type="u8" shape="13" offset="36" size="13" />
251
+ <output>
252
+ <port id="0" precision="U8">
253
+ <dim>13</dim>
254
+ </port>
255
+ </output>
256
+ </layer>
257
+ <layer id="24" name="RegexSplit_259166" type="RegexSplit" version="extension">
258
+ <data behaviour="isolate" invert="false" max_splits="-1" />
259
+ <input>
260
+ <port id="0" precision="I32">
261
+ <dim>-1</dim>
262
+ </port>
263
+ <port id="1" precision="I32">
264
+ <dim>-1</dim>
265
+ </port>
266
+ <port id="2" precision="I32">
267
+ <dim>-1</dim>
268
+ </port>
269
+ <port id="3" precision="I32">
270
+ <dim>-1</dim>
271
+ </port>
272
+ <port id="4" precision="U8">
273
+ <dim>-1</dim>
274
+ </port>
275
+ <port id="5" precision="U8">
276
+ <dim>13</dim>
277
+ </port>
278
+ </input>
279
+ <output>
280
+ <port id="6" precision="I32">
281
+ <dim>-1</dim>
282
+ </port>
283
+ <port id="7" precision="I32">
284
+ <dim>-1</dim>
285
+ </port>
286
+ <port id="8" precision="I32">
287
+ <dim>-1</dim>
288
+ </port>
289
+ <port id="9" precision="I32">
290
+ <dim>-1</dim>
291
+ </port>
292
+ <port id="10" precision="U8">
293
+ <dim>-1</dim>
294
+ </port>
295
+ </output>
296
+ </layer>
297
+ <layer id="25" name="Constant_259168" type="Const" version="opset1">
298
+ <data element_type="u8" shape="332678" offset="49" size="332678" />
299
+ <output>
300
+ <port id="0" precision="U8">
301
+ <dim>332678</dim>
302
+ </port>
303
+ </output>
304
+ </layer>
305
+ <layer id="26" name="StringTensorUnpack_259169" type="StringTensorUnpack" version="extension">
306
+ <data mode="begins_ends" />
307
+ <input>
308
+ <port id="0" precision="U8">
309
+ <dim>332678</dim>
310
+ </port>
311
+ </input>
312
+ <output>
313
+ <port id="1" precision="I32">
314
+ <dim>-1</dim>
315
+ </port>
316
+ <port id="2" precision="I32">
317
+ <dim>-1</dim>
318
+ </port>
319
+ <port id="3" precision="U8">
320
+ <dim>-1</dim>
321
+ </port>
322
+ </output>
323
+ </layer>
324
+ <layer id="27" name="Constant_259174" type="Const" version="opset1">
325
+ <data element_type="u8" shape="700363" offset="332727" size="700363" />
326
+ <output>
327
+ <port id="0" precision="U8">
328
+ <dim>700363</dim>
329
+ </port>
330
+ </output>
331
+ </layer>
332
+ <layer id="28" name="StringTensorUnpack_259175" type="StringTensorUnpack" version="extension">
333
+ <data mode="begins_ends" />
334
+ <input>
335
+ <port id="0" precision="U8">
336
+ <dim>700363</dim>
337
+ </port>
338
+ </input>
339
+ <output>
340
+ <port id="1" precision="I32">
341
+ <dim>-1</dim>
342
+ </port>
343
+ <port id="2" precision="I32">
344
+ <dim>-1</dim>
345
+ </port>
346
+ <port id="3" precision="U8">
347
+ <dim>-1</dim>
348
+ </port>
349
+ </output>
350
+ </layer>
351
+ <layer id="29" name="Constant_259171" type="Const" version="opset1">
352
+ <data element_type="u8" shape="23" offset="1033090" size="23" />
353
+ <output>
354
+ <port id="0" precision="U8">
355
+ <dim>23</dim>
356
+ </port>
357
+ </output>
358
+ </layer>
359
+ <layer id="30" name="StringTensorUnpack_259172" type="StringTensorUnpack" version="extension">
360
+ <data mode="begins_ends" />
361
+ <input>
362
+ <port id="0" precision="U8">
363
+ <dim>23</dim>
364
+ </port>
365
+ </input>
366
+ <output>
367
+ <port id="1" precision="I32">
368
+ <dim>-1</dim>
369
+ </port>
370
+ <port id="2" precision="I32">
371
+ <dim>-1</dim>
372
+ </port>
373
+ <port id="3" precision="U8">
374
+ <dim>-1</dim>
375
+ </port>
376
+ </output>
377
+ </layer>
378
+ <layer id="31" name="Constant_259176" type="Const" version="opset1">
379
+ <data element_type="i32" shape="2" offset="1033113" size="8" />
380
+ <output>
381
+ <port id="0" precision="I32">
382
+ <dim>2</dim>
383
+ </port>
384
+ </output>
385
+ </layer>
386
+ <layer id="32" name="BPETokenizer_259177" type="BPETokenizer" version="extension">
387
+ <data unk_token="&lt;unk>" fuse_unk="true" suffix_indicator="" end_suffix="" byte_fallback="true" cache_capacity="20000" />
388
+ <input>
389
+ <port id="0" precision="I32">
390
+ <dim>-1</dim>
391
+ </port>
392
+ <port id="1" precision="I32">
393
+ <dim>-1</dim>
394
+ </port>
395
+ <port id="2" precision="I32">
396
+ <dim>-1</dim>
397
+ </port>
398
+ <port id="3" precision="I32">
399
+ <dim>-1</dim>
400
+ </port>
401
+ <port id="4" precision="U8">
402
+ <dim>-1</dim>
403
+ </port>
404
+ <port id="5" precision="I32">
405
+ <dim>-1</dim>
406
+ </port>
407
+ <port id="6" precision="I32">
408
+ <dim>-1</dim>
409
+ </port>
410
+ <port id="7" precision="U8">
411
+ <dim>-1</dim>
412
+ </port>
413
+ <port id="8" precision="I32">
414
+ <dim>-1</dim>
415
+ </port>
416
+ <port id="9" precision="I32">
417
+ <dim>-1</dim>
418
+ </port>
419
+ <port id="10" precision="U8">
420
+ <dim>-1</dim>
421
+ </port>
422
+ <port id="11" precision="I32">
423
+ <dim>-1</dim>
424
+ </port>
425
+ <port id="12" precision="I32">
426
+ <dim>-1</dim>
427
+ </port>
428
+ <port id="13" precision="U8">
429
+ <dim>-1</dim>
430
+ </port>
431
+ <port id="14" precision="I32">
432
+ <dim>2</dim>
433
+ </port>
434
+ </input>
435
+ <output>
436
+ <port id="15" precision="I32">
437
+ <dim>-1</dim>
438
+ </port>
439
+ <port id="16" precision="I32">
440
+ <dim>-1</dim>
441
+ </port>
442
+ <port id="17" precision="I32">
443
+ <dim>-1</dim>
444
+ </port>
445
+ </output>
446
+ </layer>
447
+ <layer id="33" name="Subtract_259178" type="Subtract" version="opset1">
448
+ <data auto_broadcast="numpy" />
449
+ <input>
450
+ <port id="0" precision="I32">
451
+ <dim>-1</dim>
452
+ </port>
453
+ <port id="1" precision="I32">
454
+ <dim>-1</dim>
455
+ </port>
456
+ </input>
457
+ <output>
458
+ <port id="2" precision="I32">
459
+ <dim>-1</dim>
460
+ </port>
461
+ </output>
462
+ </layer>
463
+ <layer id="34" name="Constant_259179" type="Const" version="opset1">
464
+ <data element_type="i32" shape="" offset="1033121" size="4" />
465
+ <output>
466
+ <port id="0" precision="I32" />
467
+ </output>
468
+ </layer>
469
+ <layer id="35" name="Minimum_259180" type="Minimum" version="opset1">
470
+ <data auto_broadcast="numpy" />
471
+ <input>
472
+ <port id="0" precision="I32">
473
+ <dim>-1</dim>
474
+ </port>
475
+ <port id="1" precision="I32" />
476
+ </input>
477
+ <output>
478
+ <port id="2" precision="I32">
479
+ <dim>-1</dim>
480
+ </port>
481
+ </output>
482
+ </layer>
483
+ <layer id="36" name="Subtract_259181" type="Subtract" version="opset1">
484
+ <data auto_broadcast="numpy" />
485
+ <input>
486
+ <port id="0" precision="I32">
487
+ <dim>-1</dim>
488
+ </port>
489
+ <port id="1" precision="I32">
490
+ <dim>-1</dim>
491
+ </port>
492
+ </input>
493
+ <output>
494
+ <port id="2" precision="I32">
495
+ <dim>-1</dim>
496
+ </port>
497
+ </output>
498
+ </layer>
499
+ <layer id="37" name="Constant_259185" type="Const" version="opset1">
500
+ <data element_type="i32" shape="2" offset="1033125" size="8" />
501
+ <output>
502
+ <port id="0" precision="I32">
503
+ <dim>2</dim>
504
+ </port>
505
+ </output>
506
+ </layer>
507
+ <layer id="38" name="CombineSegments_259186" type="CombineSegments" version="extension">
508
+ <input>
509
+ <port id="0" precision="I32" />
510
+ <port id="1" precision="I32" />
511
+ <port id="2" precision="I32">
512
+ <dim>1</dim>
513
+ </port>
514
+ <port id="3" precision="I32">
515
+ <dim>-1</dim>
516
+ </port>
517
+ <port id="4" precision="I32">
518
+ <dim>-1</dim>
519
+ </port>
520
+ <port id="5" precision="I32">
521
+ <dim>-1</dim>
522
+ </port>
523
+ <port id="6" precision="I32">
524
+ <dim>2</dim>
525
+ </port>
526
+ </input>
527
+ <output>
528
+ <port id="7" precision="I32">
529
+ <dim>-1</dim>
530
+ </port>
531
+ <port id="8" precision="I32">
532
+ <dim>-1</dim>
533
+ </port>
534
+ <port id="9" precision="I32">
535
+ <dim>-1</dim>
536
+ </port>
537
+ <port id="10" precision="I32">
538
+ <dim>-1</dim>
539
+ </port>
540
+ <port id="11" precision="I32">
541
+ <dim>-1</dim>
542
+ </port>
543
+ <port id="12" precision="I32">
544
+ <dim>-1</dim>
545
+ </port>
546
+ </output>
547
+ </layer>
548
+ <layer id="39" name="Subtract_259187" type="Subtract" version="opset1">
549
+ <data auto_broadcast="numpy" />
550
+ <input>
551
+ <port id="0" precision="I32">
552
+ <dim>-1</dim>
553
+ </port>
554
+ <port id="1" precision="I32">
555
+ <dim>-1</dim>
556
+ </port>
557
+ </input>
558
+ <output>
559
+ <port id="2" precision="I32">
560
+ <dim>-1</dim>
561
+ </port>
562
+ </output>
563
+ </layer>
564
+ <layer id="40" name="Constant_259188" type="Const" version="opset1">
565
+ <data element_type="i32" shape="" offset="0" size="4" />
566
+ <output>
567
+ <port id="0" precision="I32" />
568
+ </output>
569
+ </layer>
570
+ <layer id="41" name="ReduceMax_259189" type="ReduceMax" version="opset1">
571
+ <data keep_dims="false" />
572
+ <input>
573
+ <port id="0" precision="I32">
574
+ <dim>-1</dim>
575
+ </port>
576
+ <port id="1" precision="I32" />
577
+ </input>
578
+ <output>
579
+ <port id="2" precision="I32" />
580
+ </output>
581
+ </layer>
582
+ <layer id="42" name="Constant_259190" type="Const" version="opset1">
583
+ <data element_type="i32" shape="" offset="0" size="4" />
584
+ <output>
585
+ <port id="0" precision="I32" />
586
+ </output>
587
+ </layer>
588
+ <layer id="43" name="RaggedToDense_259191" type="RaggedToDense" version="extension">
589
+ <data pad_right="false" />
590
+ <input>
591
+ <port id="0" precision="I32">
592
+ <dim>-1</dim>
593
+ </port>
594
+ <port id="1" precision="I32">
595
+ <dim>-1</dim>
596
+ </port>
597
+ <port id="2" precision="I32">
598
+ <dim>-1</dim>
599
+ </port>
600
+ <port id="3" precision="I32" />
601
+ <port id="4" precision="I32" />
602
+ </input>
603
+ <output>
604
+ <port id="5" precision="I32">
605
+ <dim>-1</dim>
606
+ <dim>-1</dim>
607
+ </port>
608
+ <port id="6" precision="BOOL">
609
+ <dim>-1</dim>
610
+ <dim>-1</dim>
611
+ </port>
612
+ </output>
613
+ </layer>
614
+ <layer id="44" name="Convert_259192" type="Convert" version="opset1">
615
+ <data destination_type="i32" />
616
+ <input>
617
+ <port id="0" precision="BOOL">
618
+ <dim>-1</dim>
619
+ <dim>-1</dim>
620
+ </port>
621
+ </input>
622
+ <output>
623
+ <port id="1" precision="I32">
624
+ <dim>-1</dim>
625
+ <dim>-1</dim>
626
+ </port>
627
+ </output>
628
+ </layer>
629
+ <layer id="45" name="Convert_259192" type="Convert" version="opset1">
630
+ <data destination_type="i64" />
631
+ <input>
632
+ <port id="0" precision="I32">
633
+ <dim>-1</dim>
634
+ <dim>-1</dim>
635
+ </port>
636
+ </input>
637
+ <output>
638
+ <port id="1" precision="I64" names="attention_mask">
639
+ <dim>-1</dim>
640
+ <dim>-1</dim>
641
+ </port>
642
+ </output>
643
+ </layer>
644
+ <layer id="47" name="RaggedToDense_259191.0" type="Convert" version="opset1">
645
+ <data destination_type="i64" />
646
+ <input>
647
+ <port id="0" precision="I32">
648
+ <dim>-1</dim>
649
+ <dim>-1</dim>
650
+ </port>
651
+ </input>
652
+ <output>
653
+ <port id="1" precision="I64" names="input_ids">
654
+ <dim>-1</dim>
655
+ <dim>-1</dim>
656
+ </port>
657
+ </output>
658
+ </layer>
659
+ <layer id="48" name="Result_259195" type="Result" version="opset1">
660
+ <input>
661
+ <port id="0" precision="I64">
662
+ <dim>-1</dim>
663
+ <dim>-1</dim>
664
+ </port>
665
+ </input>
666
+ </layer>
667
+ <layer id="46" name="Result_259197" type="Result" version="opset1">
668
+ <input>
669
+ <port id="0" precision="I64">
670
+ <dim>-1</dim>
671
+ <dim>-1</dim>
672
+ </port>
673
+ </input>
674
+ </layer>
675
+ </layers>
676
+ <edges>
677
+ <edge from-layer="0" from-port="0" to-layer="5" to-port="0" />
678
+ <edge from-layer="1" from-port="0" to-layer="38" to-port="0" />
679
+ <edge from-layer="2" from-port="0" to-layer="38" to-port="1" />
680
+ <edge from-layer="3" from-port="0" to-layer="38" to-port="2" />
681
+ <edge from-layer="4" from-port="0" to-layer="17" to-port="0" />
682
+ <edge from-layer="5" from-port="1" to-layer="8" to-port="0" />
683
+ <edge from-layer="5" from-port="2" to-layer="8" to-port="1" />
684
+ <edge from-layer="5" from-port="3" to-layer="8" to-port="2" />
685
+ <edge from-layer="6" from-port="0" to-layer="8" to-port="3" />
686
+ <edge from-layer="7" from-port="0" to-layer="8" to-port="4" />
687
+ <edge from-layer="8" from-port="5" to-layer="11" to-port="0" />
688
+ <edge from-layer="8" from-port="6" to-layer="11" to-port="1" />
689
+ <edge from-layer="8" from-port="7" to-layer="11" to-port="2" />
690
+ <edge from-layer="9" from-port="0" to-layer="11" to-port="3" />
691
+ <edge from-layer="10" from-port="0" to-layer="11" to-port="4" />
692
+ <edge from-layer="11" from-port="5" to-layer="12" to-port="0" />
693
+ <edge from-layer="11" from-port="5" to-layer="24" to-port="2" />
694
+ <edge from-layer="11" from-port="6" to-layer="24" to-port="3" />
695
+ <edge from-layer="11" from-port="7" to-layer="24" to-port="4" />
696
+ <edge from-layer="12" from-port="1" to-layer="15" to-port="0" />
697
+ <edge from-layer="13" from-port="0" to-layer="15" to-port="1" />
698
+ <edge from-layer="14" from-port="0" to-layer="15" to-port="2" />
699
+ <edge from-layer="15" from-port="3" to-layer="17" to-port="1" />
700
+ <edge from-layer="15" from-port="3" to-layer="20" to-port="0" />
701
+ <edge from-layer="16" from-port="0" to-layer="17" to-port="2" />
702
+ <edge from-layer="17" from-port="3" to-layer="24" to-port="0" />
703
+ <edge from-layer="18" from-port="0" to-layer="22" to-port="0" />
704
+ <edge from-layer="19" from-port="0" to-layer="20" to-port="1" />
705
+ <edge from-layer="20" from-port="2" to-layer="22" to-port="1" />
706
+ <edge from-layer="21" from-port="0" to-layer="22" to-port="2" />
707
+ <edge from-layer="22" from-port="3" to-layer="24" to-port="1" />
708
+ <edge from-layer="23" from-port="0" to-layer="24" to-port="5" />
709
+ <edge from-layer="24" from-port="6" to-layer="32" to-port="0" />
710
+ <edge from-layer="24" from-port="7" to-layer="32" to-port="1" />
711
+ <edge from-layer="24" from-port="8" to-layer="32" to-port="2" />
712
+ <edge from-layer="24" from-port="9" to-layer="32" to-port="3" />
713
+ <edge from-layer="24" from-port="10" to-layer="32" to-port="4" />
714
+ <edge from-layer="25" from-port="0" to-layer="26" to-port="0" />
715
+ <edge from-layer="26" from-port="2" to-layer="32" to-port="6" />
716
+ <edge from-layer="26" from-port="3" to-layer="32" to-port="7" />
717
+ <edge from-layer="26" from-port="1" to-layer="32" to-port="5" />
718
+ <edge from-layer="27" from-port="0" to-layer="28" to-port="0" />
719
+ <edge from-layer="28" from-port="2" to-layer="32" to-port="9" />
720
+ <edge from-layer="28" from-port="3" to-layer="32" to-port="10" />
721
+ <edge from-layer="28" from-port="1" to-layer="32" to-port="8" />
722
+ <edge from-layer="29" from-port="0" to-layer="30" to-port="0" />
723
+ <edge from-layer="30" from-port="1" to-layer="32" to-port="11" />
724
+ <edge from-layer="30" from-port="2" to-layer="32" to-port="12" />
725
+ <edge from-layer="30" from-port="3" to-layer="32" to-port="13" />
726
+ <edge from-layer="31" from-port="0" to-layer="32" to-port="14" />
727
+ <edge from-layer="32" from-port="16" to-layer="33" to-port="0" />
728
+ <edge from-layer="32" from-port="15" to-layer="33" to-port="1" />
729
+ <edge from-layer="32" from-port="16" to-layer="38" to-port="4" />
730
+ <edge from-layer="32" from-port="17" to-layer="38" to-port="5" />
731
+ <edge from-layer="32" from-port="16" to-layer="36" to-port="0" />
732
+ <edge from-layer="33" from-port="2" to-layer="35" to-port="0" />
733
+ <edge from-layer="34" from-port="0" to-layer="35" to-port="1" />
734
+ <edge from-layer="35" from-port="2" to-layer="36" to-port="1" />
735
+ <edge from-layer="36" from-port="2" to-layer="38" to-port="3" />
736
+ <edge from-layer="37" from-port="0" to-layer="38" to-port="6" />
737
+ <edge from-layer="38" from-port="8" to-layer="39" to-port="0" />
738
+ <edge from-layer="38" from-port="7" to-layer="39" to-port="1" />
739
+ <edge from-layer="38" from-port="7" to-layer="43" to-port="0" />
740
+ <edge from-layer="38" from-port="8" to-layer="43" to-port="1" />
741
+ <edge from-layer="38" from-port="9" to-layer="43" to-port="2" />
742
+ <edge from-layer="39" from-port="2" to-layer="41" to-port="0" />
743
+ <edge from-layer="40" from-port="0" to-layer="41" to-port="1" />
744
+ <edge from-layer="41" from-port="2" to-layer="43" to-port="3" />
745
+ <edge from-layer="42" from-port="0" to-layer="43" to-port="4" />
746
+ <edge from-layer="43" from-port="6" to-layer="44" to-port="0" />
747
+ <edge from-layer="43" from-port="5" to-layer="47" to-port="0" />
748
+ <edge from-layer="44" from-port="1" to-layer="45" to-port="0" />
749
+ <edge from-layer="45" from-port="1" to-layer="46" to-port="0" />
750
+ <edge from-layer="47" from-port="1" to-layer="48" to-port="0" />
751
+ </edges>
752
+ <rt_info>
753
+ <bos_token_id value="1" />
754
+ <chat_template value="{%- if messages[0]['role'] == 'system' %}&#10; {%- set system_message = messages[0]['content'] %}&#10; {%- set loop_messages = messages[1:] %}&#10;{%- else %}&#10; {%- set loop_messages = messages %}&#10;{%- endif %}&#10;&#10;{{- bos_token }}&#10;{%- for message in loop_messages %}&#10; {%- if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}&#10; {{- raise_exception('After the optional system message, conversation roles must alternate user/assistant/user/assistant/...') }}&#10; {%- endif %}&#10; {%- if message['role'] == 'user' %}&#10; {%- if loop.first and system_message is defined %}&#10; {{- ' [INST] ' + system_message + '\n\n' + message['content'] + ' [/INST]' }}&#10; {%- else %}&#10; {{- ' [INST] ' + message['content'] + ' [/INST]' }}&#10; {%- endif %}&#10; {%- elif message['role'] == 'assistant' %}&#10; {{- ' ' + message['content'] + eos_token}}&#10; {%- else %}&#10; {{- raise_exception('Only user and assistant roles are supported, with the exception of an initial optional system message!') }}&#10; {%- endif %}&#10;{%- endfor %}&#10;" />
755
+ <eos_token_id value="2" />
756
+ <original_tokenizer_class value="&lt;class 'transformers.models.llama.tokenization_llama_fast.LlamaTokenizerFast'>" />
757
+ </rt_info>
758
+ </net>
special_tokens_map.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<s>",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "eos_token": {
10
+ "content": "</s>",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "unk_token": {
17
+ "content": "<unk>",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ }
23
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dadfd56d766715c61d2ef780a525ab43b8e6da4de6865bda3d95fdef5e134055
3
+ size 493443
tokenizer_config.json ADDED
@@ -0,0 +1,44 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_bos_token": true,
3
+ "add_eos_token": false,
4
+ "add_prefix_space": null,
5
+ "added_tokens_decoder": {
6
+ "0": {
7
+ "content": "<unk>",
8
+ "lstrip": false,
9
+ "normalized": false,
10
+ "rstrip": false,
11
+ "single_word": false,
12
+ "special": true
13
+ },
14
+ "1": {
15
+ "content": "<s>",
16
+ "lstrip": false,
17
+ "normalized": false,
18
+ "rstrip": false,
19
+ "single_word": false,
20
+ "special": true
21
+ },
22
+ "2": {
23
+ "content": "</s>",
24
+ "lstrip": false,
25
+ "normalized": false,
26
+ "rstrip": false,
27
+ "single_word": false,
28
+ "special": true
29
+ }
30
+ },
31
+ "additional_special_tokens": [],
32
+ "bos_token": "<s>",
33
+ "chat_template": "{%- if messages[0]['role'] == 'system' %}\n {%- set system_message = messages[0]['content'] %}\n {%- set loop_messages = messages[1:] %}\n{%- else %}\n {%- set loop_messages = messages %}\n{%- endif %}\n\n{{- bos_token }}\n{%- for message in loop_messages %}\n {%- if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}\n {{- raise_exception('After the optional system message, conversation roles must alternate user/assistant/user/assistant/...') }}\n {%- endif %}\n {%- if message['role'] == 'user' %}\n {%- if loop.first and system_message is defined %}\n {{- ' [INST] ' + system_message + '\\n\\n' + message['content'] + ' [/INST]' }}\n {%- else %}\n {{- ' [INST] ' + message['content'] + ' [/INST]' }}\n {%- endif %}\n {%- elif message['role'] == 'assistant' %}\n {{- ' ' + message['content'] + eos_token}}\n {%- else %}\n {{- raise_exception('Only user and assistant roles are supported, with the exception of an initial optional system message!') }}\n {%- endif %}\n{%- endfor %}\n",
34
+ "clean_up_tokenization_spaces": false,
35
+ "eos_token": "</s>",
36
+ "legacy": false,
37
+ "model_max_length": 1000000000000000019884624838656,
38
+ "pad_token": null,
39
+ "sp_model_kwargs": {},
40
+ "spaces_between_special_tokens": false,
41
+ "tokenizer_class": "LlamaTokenizer",
42
+ "unk_token": "<unk>",
43
+ "use_default_system_prompt": false
44
+ }