openvino-ci
committed on
Commit
•
9dffed2
1
Parent(s):
3edf3f2
Upload folder using huggingface_hub
Browse files
- config.json +2 -1
- generation_config.json +1 -1
- openvino_decoder_model.xml +157 -156
- openvino_detokenizer.bin +1 -1
- openvino_detokenizer.xml +32 -12
- openvino_encoder_model.xml +0 -0
- openvino_tokenizer.xml +80 -60
config.json
CHANGED
@@ -1,4 +1,5 @@
|
|
1 |
{
|
|
|
2 |
"_name_or_path": "distil-whisper/distil-large-v2",
|
3 |
"activation_dropout": 0.0,
|
4 |
"activation_function": "gelu",
|
@@ -53,7 +54,7 @@
|
|
53 |
"num_mel_bins": 80,
|
54 |
"pad_token_id": 50257,
|
55 |
"scale_embedding": false,
|
56 |
-
"transformers_version": "4.
|
57 |
"use_cache": true,
|
58 |
"use_weighted_layer_sum": false,
|
59 |
"vocab_size": 51865
|
|
|
1 |
{
|
2 |
+
"_attn_implementation_autoset": true,
|
3 |
"_name_or_path": "distil-whisper/distil-large-v2",
|
4 |
"activation_dropout": 0.0,
|
5 |
"activation_function": "gelu",
|
|
|
54 |
"num_mel_bins": 80,
|
55 |
"pad_token_id": 50257,
|
56 |
"scale_embedding": false,
|
57 |
+
"transformers_version": "4.46.3",
|
58 |
"use_cache": true,
|
59 |
"use_weighted_layer_sum": false,
|
60 |
"vocab_size": 51865
|
generation_config.json
CHANGED
@@ -222,6 +222,6 @@
|
|
222 |
"transcribe": 50359,
|
223 |
"translate": 50358
|
224 |
},
|
225 |
-
"transformers_version": "4.
|
226 |
"use_scan": false
|
227 |
}
|
|
|
222 |
"transcribe": 50359,
|
223 |
"translate": 50358
|
224 |
},
|
225 |
+
"transformers_version": "4.46.3",
|
226 |
"use_scan": false
|
227 |
}
|
openvino_decoder_model.xml
CHANGED
@@ -10,7 +10,7 @@
|
|
10 |
</port>
|
11 |
</output>
|
12 |
</layer>
|
13 |
-
<layer id="0" name="
|
14 |
<data shape="?,?,?" element_type="f32" />
|
15 |
<output>
|
16 |
<port id="0" precision="FP32" names="encoder_hidden_states">
|
@@ -29,7 +29,7 @@
|
|
29 |
</port>
|
30 |
</output>
|
31 |
</layer>
|
32 |
-
<layer id="3" name="
|
33 |
<data destination_type="f16" />
|
34 |
<input>
|
35 |
<port id="0" precision="U8">
|
@@ -53,7 +53,7 @@
|
|
53 |
</port>
|
54 |
</output>
|
55 |
</layer>
|
56 |
-
<layer id="5" name="
|
57 |
<data destination_type="f16" />
|
58 |
<input>
|
59 |
<port id="0" precision="U8">
|
@@ -130,7 +130,7 @@
|
|
130 |
</port>
|
131 |
</output>
|
132 |
</layer>
|
133 |
-
<layer id="10" name="
|
134 |
<data element_type="i64" shape="2" offset="66542795" size="16" />
|
135 |
<output>
|
136 |
<port id="0" precision="I64">
|
@@ -207,7 +207,7 @@
|
|
207 |
</port>
|
208 |
</output>
|
209 |
</layer>
|
210 |
-
<layer id="16" name="
|
211 |
<data destination_type="f16" />
|
212 |
<input>
|
213 |
<port id="0" precision="U8">
|
@@ -231,7 +231,7 @@
|
|
231 |
</port>
|
232 |
</output>
|
233 |
</layer>
|
234 |
-
<layer id="18" name="
|
235 |
<data destination_type="f16" />
|
236 |
<input>
|
237 |
<port id="0" precision="U8">
|
@@ -314,7 +314,7 @@
|
|
314 |
<port id="0" precision="I64" names="23" />
|
315 |
</output>
|
316 |
</layer>
|
317 |
-
<layer id="24" name="
|
318 |
<data output_type="i64" />
|
319 |
<input>
|
320 |
<port id="0" precision="I64">
|
@@ -328,19 +328,19 @@
|
|
328 |
</port>
|
329 |
</output>
|
330 |
</layer>
|
331 |
-
<layer id="25" name="
|
332 |
<data element_type="i64" shape="" offset="67117607" size="8" />
|
333 |
<output>
|
334 |
<port id="0" precision="I64" />
|
335 |
</output>
|
336 |
</layer>
|
337 |
-
<layer id="26" name="
|
338 |
<data element_type="i64" shape="" offset="67117599" size="8" />
|
339 |
<output>
|
340 |
<port id="0" precision="I64" />
|
341 |
</output>
|
342 |
</layer>
|
343 |
-
<layer id="27" name="
|
344 |
<data batch_dims="0" />
|
345 |
<input>
|
346 |
<port id="0" precision="I64">
|
@@ -401,7 +401,7 @@
|
|
401 |
</port>
|
402 |
</output>
|
403 |
</layer>
|
404 |
-
<layer id="32" name="
|
405 |
<data element_type="i32" shape="" offset="66542811" size="4" />
|
406 |
<output>
|
407 |
<port id="0" precision="I32" />
|
@@ -478,7 +478,7 @@
|
|
478 |
</port>
|
479 |
</output>
|
480 |
</layer>
|
481 |
-
<layer id="37" name="
|
482 |
<data element_type="f32" shape="1, 1, 1280" offset="67117623" size="5120" />
|
483 |
<output>
|
484 |
<port id="0" precision="FP32">
|
@@ -510,7 +510,7 @@
|
|
510 |
</port>
|
511 |
</output>
|
512 |
</layer>
|
513 |
-
<layer id="39" name="
|
514 |
<data element_type="f32" shape="1, 1, 1280" offset="67122743" size="5120" />
|
515 |
<output>
|
516 |
<port id="0" precision="FP32">
|
@@ -542,7 +542,7 @@
|
|
542 |
</port>
|
543 |
</output>
|
544 |
</layer>
|
545 |
-
<layer id="41" name="
|
546 |
<data element_type="u8" shape="1280, 1280" offset="67127863" size="1638400" />
|
547 |
<output>
|
548 |
<port id="0" precision="U8">
|
@@ -551,7 +551,7 @@
|
|
551 |
</port>
|
552 |
</output>
|
553 |
</layer>
|
554 |
-
<layer id="42" name="
|
555 |
<data destination_type="f16" />
|
556 |
<input>
|
557 |
<port id="0" precision="U8">
|
@@ -566,7 +566,7 @@
|
|
566 |
</port>
|
567 |
</output>
|
568 |
</layer>
|
569 |
-
<layer id="43" name="
|
570 |
<data element_type="u8" shape="1280, 1" offset="68766263" size="1280" />
|
571 |
<output>
|
572 |
<port id="0" precision="U8">
|
@@ -575,7 +575,7 @@
|
|
575 |
</port>
|
576 |
</output>
|
577 |
</layer>
|
578 |
-
<layer id="44" name="
|
579 |
<data destination_type="f16" />
|
580 |
<input>
|
581 |
<port id="0" precision="U8">
|
@@ -590,7 +590,7 @@
|
|
590 |
</port>
|
591 |
</output>
|
592 |
</layer>
|
593 |
-
<layer id="45" name="
|
594 |
<data auto_broadcast="numpy" />
|
595 |
<input>
|
596 |
<port id="0" precision="FP16">
|
@@ -609,7 +609,7 @@
|
|
609 |
</port>
|
610 |
</output>
|
611 |
</layer>
|
612 |
-
<layer id="46" name="
|
613 |
<data element_type="f16" shape="1280, 1" offset="68767543" size="2560" />
|
614 |
<output>
|
615 |
<port id="0" precision="FP16">
|
@@ -618,7 +618,7 @@
|
|
618 |
</port>
|
619 |
</output>
|
620 |
</layer>
|
621 |
-
<layer id="47" name="
|
622 |
<data auto_broadcast="numpy" />
|
623 |
<input>
|
624 |
<port id="0" precision="FP16">
|
@@ -637,7 +637,7 @@
|
|
637 |
</port>
|
638 |
</output>
|
639 |
</layer>
|
640 |
-
<layer id="48" name="
|
641 |
<data destination_type="f32" />
|
642 |
<input>
|
643 |
<port id="0" precision="FP16">
|
@@ -652,7 +652,7 @@
|
|
652 |
</port>
|
653 |
</output>
|
654 |
</layer>
|
655 |
-
<layer id="49" name="
|
656 |
<data transpose_a="false" transpose_b="true" />
|
657 |
<input>
|
658 |
<port id="0" precision="FP32">
|
@@ -673,7 +673,7 @@
|
|
673 |
</port>
|
674 |
</output>
|
675 |
</layer>
|
676 |
-
<layer id="50" name="
|
677 |
<data element_type="f32" shape="1, 1, 1280" offset="68770103" size="5120" />
|
678 |
<output>
|
679 |
<port id="0" precision="FP32">
|
@@ -705,7 +705,7 @@
|
|
705 |
</port>
|
706 |
</output>
|
707 |
</layer>
|
708 |
-
<layer id="52" name="
|
709 |
<data element_type="i64" shape="4" offset="68775223" size="32" />
|
710 |
<output>
|
711 |
<port id="0" precision="I64">
|
@@ -772,7 +772,7 @@
|
|
772 |
</port>
|
773 |
</output>
|
774 |
</layer>
|
775 |
-
<layer id="57" name="
|
776 |
<data destination_type="f16" />
|
777 |
<input>
|
778 |
<port id="0" precision="U8">
|
@@ -796,7 +796,7 @@
|
|
796 |
</port>
|
797 |
</output>
|
798 |
</layer>
|
799 |
-
<layer id="59" name="
|
800 |
<data destination_type="f16" />
|
801 |
<input>
|
802 |
<port id="0" precision="U8">
|
@@ -894,7 +894,7 @@
|
|
894 |
</port>
|
895 |
</output>
|
896 |
</layer>
|
897 |
-
<layer id="65" name="
|
898 |
<data element_type="i64" shape="4" offset="68775223" size="32" />
|
899 |
<output>
|
900 |
<port id="0" precision="I64">
|
@@ -983,13 +983,13 @@
|
|
983 |
<port id="0" precision="I32" />
|
984 |
</output>
|
985 |
</layer>
|
986 |
-
<layer id="71" name="
|
987 |
<data element_type="f32" shape="" offset="70417511" size="4" />
|
988 |
<output>
|
989 |
-
<port id="0" precision="FP32" />
|
990 |
</output>
|
991 |
</layer>
|
992 |
-
<layer id="72" name="
|
993 |
<data element_type="i64" shape="1" offset="67117607" size="8" />
|
994 |
<output>
|
995 |
<port id="0" precision="I64">
|
@@ -997,7 +997,7 @@
|
|
997 |
</port>
|
998 |
</output>
|
999 |
</layer>
|
1000 |
-
<layer id="73" name="
|
1001 |
<data special_zero="false" />
|
1002 |
<input>
|
1003 |
<port id="0" precision="I64" />
|
@@ -1027,13 +1027,13 @@
|
|
1027 |
<port id="2" precision="I64" names="62,64" />
|
1028 |
</output>
|
1029 |
</layer>
|
1030 |
-
<layer id="76" name="
|
1031 |
<data element_type="i32" shape="" offset="66542811" size="4" />
|
1032 |
<output>
|
1033 |
<port id="0" precision="I32" />
|
1034 |
</output>
|
1035 |
</layer>
|
1036 |
-
<layer id="77" name="
|
1037 |
<input>
|
1038 |
<port id="0" precision="I64" />
|
1039 |
<port id="1" precision="I32" />
|
@@ -1075,7 +1075,7 @@
|
|
1075 |
</port>
|
1076 |
</output>
|
1077 |
</layer>
|
1078 |
-
<layer id="80" name="
|
1079 |
<data output_type="i32" />
|
1080 |
<input>
|
1081 |
<port id="0" precision="FP32">
|
@@ -1089,19 +1089,19 @@
|
|
1089 |
</port>
|
1090 |
</output>
|
1091 |
</layer>
|
1092 |
-
<layer id="81" name="
|
1093 |
<data element_type="i64" shape="" offset="67117607" size="8" />
|
1094 |
<output>
|
1095 |
<port id="0" precision="I64" />
|
1096 |
</output>
|
1097 |
</layer>
|
1098 |
-
<layer id="82" name="
|
1099 |
<data element_type="i64" shape="" offset="67117599" size="8" />
|
1100 |
<output>
|
1101 |
<port id="0" precision="I64" />
|
1102 |
</output>
|
1103 |
</layer>
|
1104 |
-
<layer id="83" name="
|
1105 |
<data batch_dims="0" />
|
1106 |
<input>
|
1107 |
<port id="0" precision="I32">
|
@@ -1153,7 +1153,7 @@
|
|
1153 |
<port id="0" precision="I32" />
|
1154 |
</output>
|
1155 |
</layer>
|
1156 |
-
<layer id="88" name="
|
1157 |
<data destination_type="i32" />
|
1158 |
<input>
|
1159 |
<port id="0" precision="I64" />
|
@@ -1295,7 +1295,7 @@
|
|
1295 |
</port>
|
1296 |
</output>
|
1297 |
</layer>
|
1298 |
-
<layer id="100" name="
|
1299 |
<data element_type="i64" shape="2" offset="70417515" size="16" />
|
1300 |
<output>
|
1301 |
<port id="0" precision="I64" names="70">
|
@@ -1412,7 +1412,7 @@
|
|
1412 |
</port>
|
1413 |
</output>
|
1414 |
</layer>
|
1415 |
-
<layer id="108" name="
|
1416 |
<data element_type="i64" shape="1" offset="67117599" size="8" />
|
1417 |
<output>
|
1418 |
<port id="0" precision="I64">
|
@@ -1420,13 +1420,13 @@
|
|
1420 |
</port>
|
1421 |
</output>
|
1422 |
</layer>
|
1423 |
-
<layer id="109" name="
|
1424 |
<data element_type="i64" shape="" offset="67117599" size="8" />
|
1425 |
<output>
|
1426 |
<port id="0" precision="I64" />
|
1427 |
</output>
|
1428 |
</layer>
|
1429 |
-
<layer id="110" name="
|
1430 |
<data batch_dims="0" />
|
1431 |
<input>
|
1432 |
<port id="0" precision="I64">
|
@@ -1443,7 +1443,7 @@
|
|
1443 |
</port>
|
1444 |
</output>
|
1445 |
</layer>
|
1446 |
-
<layer id="111" name="
|
1447 |
<data element_type="i64" shape="1" offset="67117607" size="8" />
|
1448 |
<output>
|
1449 |
<port id="0" precision="I64">
|
@@ -1451,7 +1451,7 @@
|
|
1451 |
</port>
|
1452 |
</output>
|
1453 |
</layer>
|
1454 |
-
<layer id="112" name="
|
1455 |
<data element_type="i64" shape="1" offset="67117607" size="8" />
|
1456 |
<output>
|
1457 |
<port id="0" precision="I64">
|
@@ -1459,7 +1459,7 @@
|
|
1459 |
</port>
|
1460 |
</output>
|
1461 |
</layer>
|
1462 |
-
<layer id="113" name="
|
1463 |
<data element_type="i64" shape="1" offset="67117607" size="8" />
|
1464 |
<output>
|
1465 |
<port id="0" precision="I64">
|
@@ -1511,7 +1511,7 @@
|
|
1511 |
</port>
|
1512 |
</output>
|
1513 |
</layer>
|
1514 |
-
<layer id="116" name="
|
1515 |
<data element_type="i64" shape="1" offset="67117599" size="8" />
|
1516 |
<output>
|
1517 |
<port id="0" precision="I64">
|
@@ -1519,7 +1519,7 @@
|
|
1519 |
</port>
|
1520 |
</output>
|
1521 |
</layer>
|
1522 |
-
<layer id="117" name="
|
1523 |
<data output_type="i64" />
|
1524 |
<input>
|
1525 |
<port id="0" precision="FP32">
|
@@ -1534,7 +1534,7 @@
|
|
1534 |
</port>
|
1535 |
</output>
|
1536 |
</layer>
|
1537 |
-
<layer id="118" name="
|
1538 |
<data element_type="i64" shape="1" offset="67117607" size="8" />
|
1539 |
<output>
|
1540 |
<port id="0" precision="I64">
|
@@ -1542,13 +1542,13 @@
|
|
1542 |
</port>
|
1543 |
</output>
|
1544 |
</layer>
|
1545 |
-
<layer id="119" name="
|
1546 |
<data element_type="i64" shape="" offset="67117599" size="8" />
|
1547 |
<output>
|
1548 |
<port id="0" precision="I64" />
|
1549 |
</output>
|
1550 |
</layer>
|
1551 |
-
<layer id="120" name="
|
1552 |
<data batch_dims="0" />
|
1553 |
<input>
|
1554 |
<port id="0" precision="I64">
|
@@ -1565,7 +1565,7 @@
|
|
1565 |
</port>
|
1566 |
</output>
|
1567 |
</layer>
|
1568 |
-
<layer id="121" name="
|
1569 |
<data element_type="i64" shape="1" offset="67117607" size="8" />
|
1570 |
<output>
|
1571 |
<port id="0" precision="I64">
|
@@ -1664,7 +1664,7 @@
|
|
1664 |
</port>
|
1665 |
</output>
|
1666 |
</layer>
|
1667 |
-
<layer id="127" name="
|
1668 |
<data destination_type="f16" />
|
1669 |
<input>
|
1670 |
<port id="0" precision="U8">
|
@@ -1688,7 +1688,7 @@
|
|
1688 |
</port>
|
1689 |
</output>
|
1690 |
</layer>
|
1691 |
-
<layer id="129" name="
|
1692 |
<data destination_type="f16" />
|
1693 |
<input>
|
1694 |
<port id="0" precision="U8">
|
@@ -1786,7 +1786,7 @@
|
|
1786 |
</port>
|
1787 |
</output>
|
1788 |
</layer>
|
1789 |
-
<layer id="135" name="
|
1790 |
<data element_type="f32" shape="1, 1, 1280" offset="72059779" size="5120" />
|
1791 |
<output>
|
1792 |
<port id="0" precision="FP32">
|
@@ -1818,7 +1818,7 @@
|
|
1818 |
</port>
|
1819 |
</output>
|
1820 |
</layer>
|
1821 |
-
<layer id="137" name="
|
1822 |
<data element_type="i64" shape="4" offset="68775223" size="32" />
|
1823 |
<output>
|
1824 |
<port id="0" precision="I64">
|
@@ -1930,7 +1930,7 @@
|
|
1930 |
</port>
|
1931 |
</output>
|
1932 |
</layer>
|
1933 |
-
<layer id="144" name="
|
1934 |
<data element_type="i64" shape="3" offset="72064899" size="24" />
|
1935 |
<output>
|
1936 |
<port id="0" precision="I64">
|
@@ -1968,7 +1968,7 @@
|
|
1968 |
</port>
|
1969 |
</output>
|
1970 |
</layer>
|
1971 |
-
<layer id="147" name="
|
1972 |
<data destination_type="f16" />
|
1973 |
<input>
|
1974 |
<port id="0" precision="U8">
|
@@ -1992,7 +1992,7 @@
|
|
1992 |
</port>
|
1993 |
</output>
|
1994 |
</layer>
|
1995 |
-
<layer id="149" name="
|
1996 |
<data destination_type="f16" />
|
1997 |
<input>
|
1998 |
<port id="0" precision="U8">
|
@@ -2090,7 +2090,7 @@
|
|
2090 |
</port>
|
2091 |
</output>
|
2092 |
</layer>
|
2093 |
-
<layer id="155" name="
|
2094 |
<data element_type="f32" shape="1, 1, 1280" offset="73707163" size="5120" />
|
2095 |
<output>
|
2096 |
<port id="0" precision="FP32">
|
@@ -2172,7 +2172,7 @@
|
|
2172 |
</port>
|
2173 |
</output>
|
2174 |
</layer>
|
2175 |
-
<layer id="160" name="
|
2176 |
<data element_type="f32" shape="1, 1, 1280" offset="73712283" size="5120" />
|
2177 |
<output>
|
2178 |
<port id="0" precision="FP32">
|
@@ -2204,7 +2204,7 @@
|
|
2204 |
</port>
|
2205 |
</output>
|
2206 |
</layer>
|
2207 |
-
<layer id="162" name="
|
2208 |
<data element_type="f32" shape="1, 1, 1280" offset="73717403" size="5120" />
|
2209 |
<output>
|
2210 |
<port id="0" precision="FP32">
|
@@ -2236,7 +2236,7 @@
|
|
2236 |
</port>
|
2237 |
</output>
|
2238 |
</layer>
|
2239 |
-
<layer id="164" name="
|
2240 |
<data element_type="u8" shape="1280, 1280" offset="73722523" size="1638400" />
|
2241 |
<output>
|
2242 |
<port id="0" precision="U8">
|
@@ -2245,7 +2245,7 @@
|
|
2245 |
</port>
|
2246 |
</output>
|
2247 |
</layer>
|
2248 |
-
<layer id="165" name="
|
2249 |
<data destination_type="f16" />
|
2250 |
<input>
|
2251 |
<port id="0" precision="U8">
|
@@ -2260,7 +2260,7 @@
|
|
2260 |
</port>
|
2261 |
</output>
|
2262 |
</layer>
|
2263 |
-
<layer id="166" name="
|
2264 |
<data element_type="u8" shape="1280, 1" offset="75360923" size="1280" />
|
2265 |
<output>
|
2266 |
<port id="0" precision="U8">
|
@@ -2269,7 +2269,7 @@
|
|
2269 |
</port>
|
2270 |
</output>
|
2271 |
</layer>
|
2272 |
-
<layer id="167" name="
|
2273 |
<data destination_type="f16" />
|
2274 |
<input>
|
2275 |
<port id="0" precision="U8">
|
@@ -2284,7 +2284,7 @@
|
|
2284 |
</port>
|
2285 |
</output>
|
2286 |
</layer>
|
2287 |
-
<layer id="168" name="
|
2288 |
<data auto_broadcast="numpy" />
|
2289 |
<input>
|
2290 |
<port id="0" precision="FP16">
|
@@ -2303,7 +2303,7 @@
|
|
2303 |
</port>
|
2304 |
</output>
|
2305 |
</layer>
|
2306 |
-
<layer id="169" name="
|
2307 |
<data element_type="f16" shape="1280, 1" offset="75362203" size="2560" />
|
2308 |
<output>
|
2309 |
<port id="0" precision="FP16">
|
@@ -2312,7 +2312,7 @@
|
|
2312 |
</port>
|
2313 |
</output>
|
2314 |
</layer>
|
2315 |
-
<layer id="170" name="
|
2316 |
<data auto_broadcast="numpy" />
|
2317 |
<input>
|
2318 |
<port id="0" precision="FP16">
|
@@ -2331,7 +2331,7 @@
|
|
2331 |
</port>
|
2332 |
</output>
|
2333 |
</layer>
|
2334 |
-
<layer id="171" name="
|
2335 |
<data destination_type="f32" />
|
2336 |
<input>
|
2337 |
<port id="0" precision="FP16">
|
@@ -2346,7 +2346,7 @@
|
|
2346 |
</port>
|
2347 |
</output>
|
2348 |
</layer>
|
2349 |
-
<layer id="172" name="
|
2350 |
<data transpose_a="false" transpose_b="true" />
|
2351 |
<input>
|
2352 |
<port id="0" precision="FP32">
|
@@ -2367,7 +2367,7 @@
|
|
2367 |
</port>
|
2368 |
</output>
|
2369 |
</layer>
|
2370 |
-
<layer id="173" name="
|
2371 |
<data element_type="f32" shape="1, 1, 1280" offset="75364763" size="5120" />
|
2372 |
<output>
|
2373 |
<port id="0" precision="FP32">
|
@@ -2399,7 +2399,7 @@
|
|
2399 |
</port>
|
2400 |
</output>
|
2401 |
</layer>
|
2402 |
-
<layer id="175" name="
|
2403 |
<data element_type="i64" shape="4" offset="68775223" size="32" />
|
2404 |
<output>
|
2405 |
<port id="0" precision="I64">
|
@@ -2466,7 +2466,7 @@
|
|
2466 |
</port>
|
2467 |
</output>
|
2468 |
</layer>
|
2469 |
-
<layer id="180" name="
|
2470 |
<data destination_type="f16" />
|
2471 |
<input>
|
2472 |
<port id="0" precision="U8">
|
@@ -2490,7 +2490,7 @@
|
|
2490 |
</port>
|
2491 |
</output>
|
2492 |
</layer>
|
2493 |
-
<layer id="182" name="
|
2494 |
<data destination_type="f16" />
|
2495 |
<input>
|
2496 |
<port id="0" precision="U8">
|
@@ -2588,7 +2588,7 @@
|
|
2588 |
</port>
|
2589 |
</output>
|
2590 |
</layer>
|
2591 |
-
<layer id="188" name="
|
2592 |
<data element_type="i64" shape="1" offset="77012123" size="8" />
|
2593 |
<output>
|
2594 |
<port id="0" precision="I64">
|
@@ -2596,7 +2596,7 @@
|
|
2596 |
</port>
|
2597 |
</output>
|
2598 |
</layer>
|
2599 |
-
<layer id="189" name="
|
2600 |
<data element_type="i64" shape="1" offset="77012131" size="8" />
|
2601 |
<output>
|
2602 |
<port id="0" precision="I64">
|
@@ -2604,7 +2604,7 @@
|
|
2604 |
</port>
|
2605 |
</output>
|
2606 |
</layer>
|
2607 |
-
<layer id="190" name="
|
2608 |
<data element_type="i64" shape="1" offset="77012139" size="8" />
|
2609 |
<output>
|
2610 |
<port id="0" precision="I64">
|
@@ -2612,7 +2612,7 @@
|
|
2612 |
</port>
|
2613 |
</output>
|
2614 |
</layer>
|
2615 |
-
<layer id="191" name="__module.model.model.decoder.layers.0.
|
2616 |
<data axis="0" />
|
2617 |
<input>
|
2618 |
<port id="0" precision="I64">
|
@@ -2737,7 +2737,7 @@
|
|
2737 |
</port>
|
2738 |
</output>
|
2739 |
</layer>
|
2740 |
-
<layer id="198" name="
|
2741 |
<data destination_type="f16" />
|
2742 |
<input>
|
2743 |
<port id="0" precision="U8">
|
@@ -2761,7 +2761,7 @@
|
|
2761 |
</port>
|
2762 |
</output>
|
2763 |
</layer>
|
2764 |
-
<layer id="200" name="
|
2765 |
<data destination_type="f16" />
|
2766 |
<input>
|
2767 |
<port id="0" precision="U8">
|
@@ -2859,7 +2859,7 @@
|
|
2859 |
</port>
|
2860 |
</output>
|
2861 |
</layer>
|
2862 |
-
<layer id="206" name="
|
2863 |
<data element_type="f32" shape="1, 1, 1280" offset="78654387" size="5120" />
|
2864 |
<output>
|
2865 |
<port id="0" precision="FP32">
|
@@ -2995,7 +2995,7 @@
|
|
2995 |
</port>
|
2996 |
</output>
|
2997 |
</layer>
|
2998 |
-
<layer id="214" name="
|
2999 |
<data element_type="i64" shape="3" offset="78659507" size="24" />
|
3000 |
<output>
|
3001 |
<port id="0" precision="I64">
|
@@ -3033,7 +3033,7 @@
|
|
3033 |
</port>
|
3034 |
</output>
|
3035 |
</layer>
|
3036 |
-
<layer id="217" name="
|
3037 |
<data destination_type="f16" />
|
3038 |
<input>
|
3039 |
<port id="0" precision="U8">
|
@@ -3057,7 +3057,7 @@
|
|
3057 |
</port>
|
3058 |
</output>
|
3059 |
</layer>
|
3060 |
-
<layer id="219" name="
|
3061 |
<data destination_type="f16" />
|
3062 |
<input>
|
3063 |
<port id="0" precision="U8">
|
@@ -3155,7 +3155,7 @@
|
|
3155 |
</port>
|
3156 |
</output>
|
3157 |
</layer>
|
3158 |
-
<layer id="225" name="
|
3159 |
<data element_type="f32" shape="1, 1, 1280" offset="80301771" size="5120" />
|
3160 |
<output>
|
3161 |
<port id="0" precision="FP32">
|
@@ -3237,7 +3237,7 @@
|
|
3237 |
</port>
|
3238 |
</output>
|
3239 |
</layer>
|
3240 |
-
<layer id="230" name="
|
3241 |
<data element_type="f32" shape="1, 1, 1280" offset="80306891" size="5120" />
|
3242 |
<output>
|
3243 |
<port id="0" precision="FP32">
|
@@ -3269,7 +3269,7 @@
|
|
3269 |
</port>
|
3270 |
</output>
|
3271 |
</layer>
|
3272 |
-
<layer id="232" name="
|
3273 |
<data element_type="f32" shape="1, 1, 1280" offset="80312011" size="5120" />
|
3274 |
<output>
|
3275 |
<port id="0" precision="FP32">
|
@@ -3310,7 +3310,7 @@
|
|
3310 |
</port>
|
3311 |
</output>
|
3312 |
</layer>
|
3313 |
-
<layer id="235" name="
|
3314 |
<data destination_type="f16" />
|
3315 |
<input>
|
3316 |
<port id="0" precision="U8">
|
@@ -3334,7 +3334,7 @@
|
|
3334 |
</port>
|
3335 |
</output>
|
3336 |
</layer>
|
3337 |
-
<layer id="237" name="
|
3338 |
<data destination_type="f16" />
|
3339 |
<input>
|
3340 |
<port id="0" precision="U8">
|
@@ -3432,7 +3432,7 @@
|
|
3432 |
</port>
|
3433 |
</output>
|
3434 |
</layer>
|
3435 |
-
<layer id="243" name="
|
3436 |
<data element_type="f32" shape="1, 1, 5120" offset="86886091" size="20480" />
|
3437 |
<output>
|
3438 |
<port id="0" precision="FP32">
|
@@ -3490,7 +3490,7 @@
|
|
3490 |
</port>
|
3491 |
</output>
|
3492 |
</layer>
|
3493 |
-
<layer id="247" name="
|
3494 |
<data destination_type="f16" />
|
3495 |
<input>
|
3496 |
<port id="0" precision="U8">
|
@@ -3514,7 +3514,7 @@
|
|
3514 |
</port>
|
3515 |
</output>
|
3516 |
</layer>
|
3517 |
-
<layer id="249" name="
|
3518 |
<data destination_type="f16" />
|
3519 |
<input>
|
3520 |
<port id="0" precision="U8">
|
@@ -3612,7 +3612,7 @@
|
|
3612 |
</port>
|
3613 |
</output>
|
3614 |
</layer>
|
3615 |
-
<layer id="255" name="
|
3616 |
<data element_type="f32" shape="1, 1, 1280" offset="93464011" size="5120" />
|
3617 |
<output>
|
3618 |
<port id="0" precision="FP32">
|
@@ -3694,7 +3694,7 @@
|
|
3694 |
</port>
|
3695 |
</output>
|
3696 |
</layer>
|
3697 |
-
<layer id="260" name="
|
3698 |
<data element_type="f32" shape="1, 1, 1280" offset="93469131" size="5120" />
|
3699 |
<output>
|
3700 |
<port id="0" precision="FP32">
|
@@ -3726,7 +3726,7 @@
|
|
3726 |
</port>
|
3727 |
</output>
|
3728 |
</layer>
|
3729 |
-
<layer id="262" name="
|
3730 |
<data element_type="f32" shape="1, 1, 1280" offset="93474251" size="5120" />
|
3731 |
<output>
|
3732 |
<port id="0" precision="FP32">
|
@@ -3758,7 +3758,7 @@
|
|
3758 |
</port>
|
3759 |
</output>
|
3760 |
</layer>
|
3761 |
-
<layer id="264" name="
|
3762 |
<data element_type="u8" shape="1280, 1280" offset="93479371" size="1638400" />
|
3763 |
<output>
|
3764 |
<port id="0" precision="U8">
|
@@ -3767,7 +3767,7 @@
|
|
3767 |
</port>
|
3768 |
</output>
|
3769 |
</layer>
|
3770 |
-
<layer id="265" name="
|
3771 |
<data destination_type="f16" />
|
3772 |
<input>
|
3773 |
<port id="0" precision="U8">
|
@@ -3782,7 +3782,7 @@
|
|
3782 |
</port>
|
3783 |
</output>
|
3784 |
</layer>
|
3785 |
-
<layer id="266" name="
|
3786 |
<data element_type="u8" shape="1280, 1" offset="95117771" size="1280" />
|
3787 |
<output>
|
3788 |
<port id="0" precision="U8">
|
@@ -3791,7 +3791,7 @@
|
|
3791 |
</port>
|
3792 |
</output>
|
3793 |
</layer>
|
3794 |
-
<layer id="267" name="
|
3795 |
<data destination_type="f16" />
|
3796 |
<input>
|
3797 |
<port id="0" precision="U8">
|
@@ -3806,7 +3806,7 @@
|
|
3806 |
</port>
|
3807 |
</output>
|
3808 |
</layer>
|
3809 |
-
<layer id="268" name="
|
3810 |
<data auto_broadcast="numpy" />
|
3811 |
<input>
|
3812 |
<port id="0" precision="FP16">
|
@@ -3825,7 +3825,7 @@
|
|
3825 |
</port>
|
3826 |
</output>
|
3827 |
</layer>
|
3828 |
-
<layer id="269" name="
|
3829 |
<data element_type="f16" shape="1280, 1" offset="95119051" size="2560" />
|
3830 |
<output>
|
3831 |
<port id="0" precision="FP16">
|
@@ -3834,7 +3834,7 @@
|
|
3834 |
</port>
|
3835 |
</output>
|
3836 |
</layer>
|
3837 |
-
<layer id="270" name="
|
3838 |
<data auto_broadcast="numpy" />
|
3839 |
<input>
|
3840 |
<port id="0" precision="FP16">
|
@@ -3853,7 +3853,7 @@
|
|
3853 |
</port>
|
3854 |
</output>
|
3855 |
</layer>
|
3856 |
-
<layer id="271" name="
|
3857 |
<data destination_type="f32" />
|
3858 |
<input>
|
3859 |
<port id="0" precision="FP16">
|
@@ -3868,7 +3868,7 @@
|
|
3868 |
</port>
|
3869 |
</output>
|
3870 |
</layer>
|
3871 |
-
<layer id="272" name="
|
3872 |
<data transpose_a="false" transpose_b="true" />
|
3873 |
<input>
|
3874 |
<port id="0" precision="FP32">
|
@@ -3889,7 +3889,7 @@
|
|
3889 |
</port>
|
3890 |
</output>
|
3891 |
</layer>
|
3892 |
-
<layer id="273" name="
|
3893 |
<data element_type="f32" shape="1, 1, 1280" offset="95121611" size="5120" />
|
3894 |
<output>
|
3895 |
<port id="0" precision="FP32">
|
@@ -3921,7 +3921,7 @@
|
|
3921 |
</port>
|
3922 |
</output>
|
3923 |
</layer>
|
3924 |
-
<layer id="275" name="
|
3925 |
<data element_type="i64" shape="4" offset="68775223" size="32" />
|
3926 |
<output>
|
3927 |
<port id="0" precision="I64">
|
@@ -3988,7 +3988,7 @@
|
|
3988 |
</port>
|
3989 |
</output>
|
3990 |
</layer>
|
3991 |
-
<layer id="280" name="
|
3992 |
<data destination_type="f16" />
|
3993 |
<input>
|
3994 |
<port id="0" precision="U8">
|
@@ -4012,7 +4012,7 @@
|
|
4012 |
</port>
|
4013 |
</output>
|
4014 |
</layer>
|
4015 |
-
<layer id="282" name="
|
4016 |
<data destination_type="f16" />
|
4017 |
<input>
|
4018 |
<port id="0" precision="U8">
|
@@ -4110,7 +4110,7 @@
|
|
4110 |
</port>
|
4111 |
</output>
|
4112 |
</layer>
|
4113 |
-
<layer id="288" name="
|
4114 |
<data element_type="i64" shape="4" offset="68775223" size="32" />
|
4115 |
<output>
|
4116 |
<port id="0" precision="I64">
|
@@ -4246,7 +4246,7 @@
|
|
4246 |
</port>
|
4247 |
</output>
|
4248 |
</layer>
|
4249 |
-
<layer id="296" name="
|
4250 |
<data destination_type="f16" />
|
4251 |
<input>
|
4252 |
<port id="0" precision="U8">
|
@@ -4270,7 +4270,7 @@
|
|
4270 |
</port>
|
4271 |
</output>
|
4272 |
</layer>
|
4273 |
-
<layer id="298" name="
|
4274 |
<data destination_type="f16" />
|
4275 |
<input>
|
4276 |
<port id="0" precision="U8">
|
@@ -4368,7 +4368,7 @@
|
|
4368 |
</port>
|
4369 |
</output>
|
4370 |
</layer>
|
4371 |
-
<layer id="304" name="
|
4372 |
<data element_type="f32" shape="1, 1, 1280" offset="98411211" size="5120" />
|
4373 |
<output>
|
4374 |
<port id="0" precision="FP32">
|
@@ -4400,7 +4400,7 @@
|
|
4400 |
</port>
|
4401 |
</output>
|
4402 |
</layer>
|
4403 |
-
<layer id="306" name="
|
4404 |
<data element_type="i64" shape="4" offset="68775223" size="32" />
|
4405 |
<output>
|
4406 |
<port id="0" precision="I64">
|
@@ -4512,7 +4512,7 @@
|
|
4512 |
</port>
|
4513 |
</output>
|
4514 |
</layer>
|
4515 |
-
<layer id="313" name="
|
4516 |
<data element_type="i64" shape="3" offset="72064899" size="24" />
|
4517 |
<output>
|
4518 |
<port id="0" precision="I64">
|
@@ -4550,7 +4550,7 @@
|
|
4550 |
</port>
|
4551 |
</output>
|
4552 |
</layer>
|
4553 |
-
<layer id="316" name="
|
4554 |
<data destination_type="f16" />
|
4555 |
<input>
|
4556 |
<port id="0" precision="U8">
|
@@ -4574,7 +4574,7 @@
|
|
4574 |
</port>
|
4575 |
</output>
|
4576 |
</layer>
|
4577 |
-
<layer id="318" name="
|
4578 |
<data destination_type="f16" />
|
4579 |
<input>
|
4580 |
<port id="0" precision="U8">
|
@@ -4672,7 +4672,7 @@
|
|
4672 |
</port>
|
4673 |
</output>
|
4674 |
</layer>
|
4675 |
-
<layer id="324" name="
|
4676 |
<data element_type="f32" shape="1, 1, 1280" offset="100058571" size="5120" />
|
4677 |
<output>
|
4678 |
<port id="0" precision="FP32">
|
@@ -4754,7 +4754,7 @@
|
|
4754 |
</port>
|
4755 |
</output>
|
4756 |
</layer>
|
4757 |
-
<layer id="329" name="
|
4758 |
<data element_type="f32" shape="1, 1, 1280" offset="100063691" size="5120" />
|
4759 |
<output>
|
4760 |
<port id="0" precision="FP32">
|
@@ -4786,7 +4786,7 @@
|
|
4786 |
</port>
|
4787 |
</output>
|
4788 |
</layer>
|
4789 |
-
<layer id="331" name="
|
4790 |
<data element_type="f32" shape="1, 1, 1280" offset="100068811" size="5120" />
|
4791 |
<output>
|
4792 |
<port id="0" precision="FP32">
|
@@ -4818,7 +4818,7 @@
|
|
4818 |
</port>
|
4819 |
</output>
|
4820 |
</layer>
|
4821 |
-
<layer id="333" name="
|
4822 |
<data element_type="u8" shape="1280, 1280" offset="100073931" size="1638400" />
|
4823 |
<output>
|
4824 |
<port id="0" precision="U8">
|
@@ -4827,7 +4827,7 @@
|
|
4827 |
</port>
|
4828 |
</output>
|
4829 |
</layer>
|
4830 |
-
<layer id="334" name="
|
4831 |
<data destination_type="f16" />
|
4832 |
<input>
|
4833 |
<port id="0" precision="U8">
|
@@ -4842,7 +4842,7 @@
|
|
4842 |
</port>
|
4843 |
</output>
|
4844 |
</layer>
|
4845 |
-
<layer id="335" name="
|
4846 |
<data element_type="u8" shape="1280, 1" offset="101712331" size="1280" />
|
4847 |
<output>
|
4848 |
<port id="0" precision="U8">
|
@@ -4851,7 +4851,7 @@
|
|
4851 |
</port>
|
4852 |
</output>
|
4853 |
</layer>
|
4854 |
-
<layer id="336" name="
|
4855 |
<data destination_type="f16" />
|
4856 |
<input>
|
4857 |
<port id="0" precision="U8">
|
@@ -4866,7 +4866,7 @@
|
|
4866 |
</port>
|
4867 |
</output>
|
4868 |
</layer>
|
4869 |
-
<layer id="337" name="
|
4870 |
<data auto_broadcast="numpy" />
|
4871 |
<input>
|
4872 |
<port id="0" precision="FP16">
|
@@ -4885,7 +4885,7 @@
|
|
4885 |
</port>
|
4886 |
</output>
|
4887 |
</layer>
|
4888 |
-
<layer id="338" name="
|
4889 |
<data element_type="f16" shape="1280, 1" offset="101713611" size="2560" />
|
4890 |
<output>
|
4891 |
<port id="0" precision="FP16">
|
@@ -4894,7 +4894,7 @@
|
|
4894 |
</port>
|
4895 |
</output>
|
4896 |
</layer>
|
4897 |
-
<layer id="339" name="
|
4898 |
<data auto_broadcast="numpy" />
|
4899 |
<input>
|
4900 |
<port id="0" precision="FP16">
|
@@ -4913,7 +4913,7 @@
|
|
4913 |
</port>
|
4914 |
</output>
|
4915 |
</layer>
|
4916 |
-
<layer id="340" name="
|
4917 |
<data destination_type="f32" />
|
4918 |
<input>
|
4919 |
<port id="0" precision="FP16">
|
@@ -4928,7 +4928,7 @@
|
|
4928 |
</port>
|
4929 |
</output>
|
4930 |
</layer>
|
4931 |
-
<layer id="341" name="
|
4932 |
<data transpose_a="false" transpose_b="true" />
|
4933 |
<input>
|
4934 |
<port id="0" precision="FP32">
|
@@ -4949,7 +4949,7 @@
|
|
4949 |
</port>
|
4950 |
</output>
|
4951 |
</layer>
|
4952 |
-
<layer id="342" name="
|
4953 |
<data element_type="f32" shape="1, 1, 1280" offset="101716171" size="5120" />
|
4954 |
<output>
|
4955 |
<port id="0" precision="FP32">
|
@@ -4981,7 +4981,7 @@
|
|
4981 |
</port>
|
4982 |
</output>
|
4983 |
</layer>
|
4984 |
-
<layer id="344" name="
|
4985 |
<data element_type="i64" shape="4" offset="68775223" size="32" />
|
4986 |
<output>
|
4987 |
<port id="0" precision="I64">
|
@@ -5048,7 +5048,7 @@
|
|
5048 |
</port>
|
5049 |
</output>
|
5050 |
</layer>
|
5051 |
-
<layer id="349" name="
|
5052 |
<data destination_type="f16" />
|
5053 |
<input>
|
5054 |
<port id="0" precision="U8">
|
@@ -5072,7 +5072,7 @@
|
|
5072 |
</port>
|
5073 |
</output>
|
5074 |
</layer>
|
5075 |
-
<layer id="351" name="
|
5076 |
<data destination_type="f16" />
|
5077 |
<input>
|
5078 |
<port id="0" precision="U8">
|
@@ -5273,7 +5273,7 @@
|
|
5273 |
</port>
|
5274 |
</output>
|
5275 |
</layer>
|
5276 |
-
<layer id="363" name="
|
5277 |
<data destination_type="f16" />
|
5278 |
<input>
|
5279 |
<port id="0" precision="U8">
|
@@ -5297,7 +5297,7 @@
|
|
5297 |
</port>
|
5298 |
</output>
|
5299 |
</layer>
|
5300 |
-
<layer id="365" name="
|
5301 |
<data destination_type="f16" />
|
5302 |
<input>
|
5303 |
<port id="0" precision="U8">
|
@@ -5395,7 +5395,7 @@
|
|
5395 |
</port>
|
5396 |
</output>
|
5397 |
</layer>
|
5398 |
-
<layer id="371" name="
|
5399 |
<data element_type="f32" shape="1, 1, 1280" offset="105005771" size="5120" />
|
5400 |
<output>
|
5401 |
<port id="0" precision="FP32">
|
@@ -5531,7 +5531,7 @@
|
|
5531 |
</port>
|
5532 |
</output>
|
5533 |
</layer>
|
5534 |
-
<layer id="379" name="
|
5535 |
<data element_type="i64" shape="3" offset="78659507" size="24" />
|
5536 |
<output>
|
5537 |
<port id="0" precision="I64">
|
@@ -5569,7 +5569,7 @@
|
|
5569 |
</port>
|
5570 |
</output>
|
5571 |
</layer>
|
5572 |
-
<layer id="382" name="
|
5573 |
<data destination_type="f16" />
|
5574 |
<input>
|
5575 |
<port id="0" precision="U8">
|
@@ -5593,7 +5593,7 @@
|
|
5593 |
</port>
|
5594 |
</output>
|
5595 |
</layer>
|
5596 |
-
<layer id="384" name="
|
5597 |
<data destination_type="f16" />
|
5598 |
<input>
|
5599 |
<port id="0" precision="U8">
|
@@ -5691,7 +5691,7 @@
|
|
5691 |
</port>
|
5692 |
</output>
|
5693 |
</layer>
|
5694 |
-
<layer id="390" name="
|
5695 |
<data element_type="f32" shape="1, 1, 1280" offset="106653131" size="5120" />
|
5696 |
<output>
|
5697 |
<port id="0" precision="FP32">
|
@@ -5773,7 +5773,7 @@
|
|
5773 |
</port>
|
5774 |
</output>
|
5775 |
</layer>
|
5776 |
-
<layer id="395" name="
|
5777 |
<data element_type="f32" shape="1, 1, 1280" offset="106658251" size="5120" />
|
5778 |
<output>
|
5779 |
<port id="0" precision="FP32">
|
@@ -5805,7 +5805,7 @@
|
|
5805 |
</port>
|
5806 |
</output>
|
5807 |
</layer>
|
5808 |
-
<layer id="397" name="
|
5809 |
<data element_type="f32" shape="1, 1, 1280" offset="106663371" size="5120" />
|
5810 |
<output>
|
5811 |
<port id="0" precision="FP32">
|
@@ -5846,7 +5846,7 @@
|
|
5846 |
</port>
|
5847 |
</output>
|
5848 |
</layer>
|
5849 |
-
<layer id="400" name="
|
5850 |
<data destination_type="f16" />
|
5851 |
<input>
|
5852 |
<port id="0" precision="U8">
|
@@ -5870,7 +5870,7 @@
|
|
5870 |
</port>
|
5871 |
</output>
|
5872 |
</layer>
|
5873 |
-
<layer id="402" name="
|
5874 |
<data destination_type="f16" />
|
5875 |
<input>
|
5876 |
<port id="0" precision="U8">
|
@@ -5968,7 +5968,7 @@
|
|
5968 |
</port>
|
5969 |
</output>
|
5970 |
</layer>
|
5971 |
-
<layer id="408" name="
|
5972 |
<data element_type="f32" shape="1, 1, 5120" offset="113237451" size="20480" />
|
5973 |
<output>
|
5974 |
<port id="0" precision="FP32">
|
@@ -6026,7 +6026,7 @@
|
|
6026 |
</port>
|
6027 |
</output>
|
6028 |
</layer>
|
6029 |
-
<layer id="412" name="
|
6030 |
<data destination_type="f16" />
|
6031 |
<input>
|
6032 |
<port id="0" precision="U8">
|
@@ -6050,7 +6050,7 @@
|
|
6050 |
</port>
|
6051 |
</output>
|
6052 |
</layer>
|
6053 |
-
<layer id="414" name="
|
6054 |
<data destination_type="f16" />
|
6055 |
<input>
|
6056 |
<port id="0" precision="U8">
|
@@ -6148,7 +6148,7 @@
|
|
6148 |
</port>
|
6149 |
</output>
|
6150 |
</layer>
|
6151 |
-
<layer id="420" name="
|
6152 |
<data element_type="f32" shape="1, 1, 1280" offset="119815371" size="5120" />
|
6153 |
<output>
|
6154 |
<port id="0" precision="FP32">
|
@@ -6230,7 +6230,7 @@
|
|
6230 |
</port>
|
6231 |
</output>
|
6232 |
</layer>
|
6233 |
-
<layer id="425" name="
|
6234 |
<data element_type="f32" shape="1, 1, 1280" offset="119820491" size="5120" />
|
6235 |
<output>
|
6236 |
<port id="0" precision="FP32">
|
@@ -6262,7 +6262,7 @@
|
|
6262 |
</port>
|
6263 |
</output>
|
6264 |
</layer>
|
6265 |
-
<layer id="427" name="
|
6266 |
<data element_type="f32" shape="1, 1, 1280" offset="119825611" size="5120" />
|
6267 |
<output>
|
6268 |
<port id="0" precision="FP32">
|
@@ -6315,7 +6315,7 @@
|
|
6315 |
</port>
|
6316 |
</output>
|
6317 |
</layer>
|
6318 |
-
<layer id="430" name="
|
6319 |
<input>
|
6320 |
<port id="0" precision="FP32">
|
6321 |
<dim>-1</dim>
|
@@ -6792,7 +6792,7 @@
|
|
6792 |
<edge from-layer="429" from-port="2" to-layer="430" to-port="0" />
|
6793 |
</edges>
|
6794 |
<rt_info>
|
6795 |
-
<Runtime_version value="2024.5.0-
|
6796 |
<conversion_parameters>
|
6797 |
<framework value="pytorch" />
|
6798 |
<is_python_object value="True" />
|
@@ -6800,9 +6800,10 @@
|
|
6800 |
<nncf>
|
6801 |
<friendly_names_were_updated value="True" />
|
6802 |
<weight_compression>
|
6803 |
-
<advanced_parameters value="{'awq_params': {'subset_size': 32, 'percent_to_apply': 0.002, 'alpha_min': 0.0, 'alpha_max': 1.0, 'steps': 100}, 'scale_estimation_params': {'subset_size': 64, 'initial_steps': 5, 'scale_steps': 5, 'weight_penalty': -1.0}, 'gptq_params': {'damp_percent': 0.1, 'block_size': 128, 'subset_size': 128}, 'lora_correction_params': {'adapter_rank': 8, 'num_iterations': 3, 'apply_regularization': True, 'subset_size': 128, 'use_int8_adapters': True}}" />
|
6804 |
<all_layers value="False" />
|
6805 |
<awq value="False" />
|
|
|
6806 |
<gptq value="False" />
|
6807 |
<group_size value="-1" />
|
6808 |
<ignored_scope value="[]" />
|
@@ -6814,10 +6815,10 @@
|
|
6814 |
</weight_compression>
|
6815 |
</nncf>
|
6816 |
<optimum>
|
6817 |
-
<optimum_intel_version value="1.
|
6818 |
-
<optimum_version value="1.23.
|
6819 |
-
<pytorch_version value="2.5.
|
6820 |
-
<transformers_version value="4.
|
6821 |
</optimum>
|
6822 |
</rt_info>
|
6823 |
</net>
|
|
|
10 |
</port>
|
11 |
</output>
|
12 |
</layer>
|
13 |
+
<layer id="0" name="Parameter_26207" type="Parameter" version="opset1">
|
14 |
<data shape="?,?,?" element_type="f32" />
|
15 |
<output>
|
16 |
<port id="0" precision="FP32" names="encoder_hidden_states">
|
|
|
29 |
</port>
|
30 |
</output>
|
31 |
</layer>
|
32 |
+
<layer id="3" name="Convert_42617" type="Convert" version="opset1">
|
33 |
<data destination_type="f16" />
|
34 |
<input>
|
35 |
<port id="0" precision="U8">
|
|
|
53 |
</port>
|
54 |
</output>
|
55 |
</layer>
|
56 |
+
<layer id="5" name="Convert_42620" type="Convert" version="opset1">
|
57 |
<data destination_type="f16" />
|
58 |
<input>
|
59 |
<port id="0" precision="U8">
|
|
|
130 |
</port>
|
131 |
</output>
|
132 |
</layer>
|
133 |
+
<layer id="10" name="Constant_31708" type="Const" version="opset1">
|
134 |
<data element_type="i64" shape="2" offset="66542795" size="16" />
|
135 |
<output>
|
136 |
<port id="0" precision="I64">
|
|
|
207 |
</port>
|
208 |
</output>
|
209 |
</layer>
|
210 |
+
<layer id="16" name="Convert_42848" type="Convert" version="opset1">
|
211 |
<data destination_type="f16" />
|
212 |
<input>
|
213 |
<port id="0" precision="U8">
|
|
|
231 |
</port>
|
232 |
</output>
|
233 |
</layer>
|
234 |
+
<layer id="18" name="Convert_42851" type="Convert" version="opset1">
|
235 |
<data destination_type="f16" />
|
236 |
<input>
|
237 |
<port id="0" precision="U8">
|
|
|
314 |
<port id="0" precision="I64" names="23" />
|
315 |
</output>
|
316 |
</layer>
|
317 |
+
<layer id="24" name="ShapeOf_31624" type="ShapeOf" version="opset3">
|
318 |
<data output_type="i64" />
|
319 |
<input>
|
320 |
<port id="0" precision="I64">
|
|
|
328 |
</port>
|
329 |
</output>
|
330 |
</layer>
|
331 |
+
<layer id="25" name="Constant_31625" type="Const" version="opset1">
|
332 |
<data element_type="i64" shape="" offset="67117607" size="8" />
|
333 |
<output>
|
334 |
<port id="0" precision="I64" />
|
335 |
</output>
|
336 |
</layer>
|
337 |
+
<layer id="26" name="Constant_31626" type="Const" version="opset1">
|
338 |
<data element_type="i64" shape="" offset="67117599" size="8" />
|
339 |
<output>
|
340 |
<port id="0" precision="I64" />
|
341 |
</output>
|
342 |
</layer>
|
343 |
+
<layer id="27" name="Gather_31627" type="Gather" version="opset8">
|
344 |
<data batch_dims="0" />
|
345 |
<input>
|
346 |
<port id="0" precision="I64">
|
|
|
401 |
</port>
|
402 |
</output>
|
403 |
</layer>
|
404 |
+
<layer id="32" name="__module.model.model.decoder.embed_positions/aten::index/Constant" type="Const" version="opset1">
|
405 |
<data element_type="i32" shape="" offset="66542811" size="4" />
|
406 |
<output>
|
407 |
<port id="0" precision="I32" />
|
|
|
478 |
</port>
|
479 |
</output>
|
480 |
</layer>
|
481 |
+
<layer id="37" name="Constant_31390" type="Const" version="opset1">
|
482 |
<data element_type="f32" shape="1, 1, 1280" offset="67117623" size="5120" />
|
483 |
<output>
|
484 |
<port id="0" precision="FP32">
|
|
|
510 |
</port>
|
511 |
</output>
|
512 |
</layer>
|
513 |
+
<layer id="39" name="Constant_31391" type="Const" version="opset1">
|
514 |
<data element_type="f32" shape="1, 1, 1280" offset="67122743" size="5120" />
|
515 |
<output>
|
516 |
<port id="0" precision="FP32">
|
|
|
542 |
</port>
|
543 |
</output>
|
544 |
</layer>
|
545 |
+
<layer id="41" name="Constant_31293" type="Const" version="opset1">
|
546 |
<data element_type="u8" shape="1280, 1280" offset="67127863" size="1638400" />
|
547 |
<output>
|
548 |
<port id="0" precision="U8">
|
|
|
551 |
</port>
|
552 |
</output>
|
553 |
</layer>
|
554 |
+
<layer id="42" name="Convert_42738" type="Convert" version="opset1">
|
555 |
<data destination_type="f16" />
|
556 |
<input>
|
557 |
<port id="0" precision="U8">
|
|
|
566 |
</port>
|
567 |
</output>
|
568 |
</layer>
|
569 |
+
<layer id="43" name="Constant_31293/zero_point" type="Const" version="opset1">
|
570 |
<data element_type="u8" shape="1280, 1" offset="68766263" size="1280" />
|
571 |
<output>
|
572 |
<port id="0" precision="U8">
|
|
|
575 |
</port>
|
576 |
</output>
|
577 |
</layer>
|
578 |
+
<layer id="44" name="Convert_42741" type="Convert" version="opset1">
|
579 |
<data destination_type="f16" />
|
580 |
<input>
|
581 |
<port id="0" precision="U8">
|
|
|
590 |
</port>
|
591 |
</output>
|
592 |
</layer>
|
593 |
+
<layer id="45" name="Constant_31293/zero_point/subtract" type="Subtract" version="opset1">
|
594 |
<data auto_broadcast="numpy" />
|
595 |
<input>
|
596 |
<port id="0" precision="FP16">
|
|
|
609 |
</port>
|
610 |
</output>
|
611 |
</layer>
|
612 |
+
<layer id="46" name="Constant_31293/scale" type="Const" version="opset1">
|
613 |
<data element_type="f16" shape="1280, 1" offset="68767543" size="2560" />
|
614 |
<output>
|
615 |
<port id="0" precision="FP16">
|
|
|
618 |
</port>
|
619 |
</output>
|
620 |
</layer>
|
621 |
+
<layer id="47" name="Constant_31293/fq_weights_1" type="Multiply" version="opset1">
|
622 |
<data auto_broadcast="numpy" />
|
623 |
<input>
|
624 |
<port id="0" precision="FP16">
|
|
|
637 |
</port>
|
638 |
</output>
|
639 |
</layer>
|
640 |
+
<layer id="48" name="Constant_31293/fq_weights_1/convert" type="Convert" version="opset1">
|
641 |
<data destination_type="f32" />
|
642 |
<input>
|
643 |
<port id="0" precision="FP16">
|
|
|
652 |
</port>
|
653 |
</output>
|
654 |
</layer>
|
655 |
+
<layer id="49" name="Multiply_31276" type="MatMul" version="opset1">
|
656 |
<data transpose_a="false" transpose_b="true" />
|
657 |
<input>
|
658 |
<port id="0" precision="FP32">
|
|
|
673 |
</port>
|
674 |
</output>
|
675 |
</layer>
|
676 |
+
<layer id="50" name="Constant_31392" type="Const" version="opset1">
|
677 |
<data element_type="f32" shape="1, 1, 1280" offset="68770103" size="5120" />
|
678 |
<output>
|
679 |
<port id="0" precision="FP32">
|
|
|
705 |
</port>
|
706 |
</output>
|
707 |
</layer>
|
708 |
+
<layer id="52" name="Constant_31709" type="Const" version="opset1">
|
709 |
<data element_type="i64" shape="4" offset="68775223" size="32" />
|
710 |
<output>
|
711 |
<port id="0" precision="I64">
|
|
|
772 |
</port>
|
773 |
</output>
|
774 |
</layer>
|
775 |
+
<layer id="57" name="Convert_42727" type="Convert" version="opset1">
|
776 |
<data destination_type="f16" />
|
777 |
<input>
|
778 |
<port id="0" precision="U8">
|
|
|
796 |
</port>
|
797 |
</output>
|
798 |
</layer>
|
799 |
+
<layer id="59" name="Convert_42730" type="Convert" version="opset1">
|
800 |
<data destination_type="f16" />
|
801 |
<input>
|
802 |
<port id="0" precision="U8">
|
|
|
894 |
</port>
|
895 |
</output>
|
896 |
</layer>
|
897 |
+
<layer id="65" name="Constant_31710" type="Const" version="opset1">
|
898 |
<data element_type="i64" shape="4" offset="68775223" size="32" />
|
899 |
<output>
|
900 |
<port id="0" precision="I64">
|
|
|
983 |
<port id="0" precision="I32" />
|
984 |
</output>
|
985 |
</layer>
|
986 |
+
<layer id="71" name="17" type="Const" version="opset1">
|
987 |
<data element_type="f32" shape="" offset="70417511" size="4" />
|
988 |
<output>
|
989 |
+
<port id="0" precision="FP32" names="17" />
|
990 |
</output>
|
991 |
</layer>
|
992 |
+
<layer id="72" name="Constant_31648" type="Const" version="opset1">
|
993 |
<data element_type="i64" shape="1" offset="67117607" size="8" />
|
994 |
<output>
|
995 |
<port id="0" precision="I64">
|
|
|
997 |
</port>
|
998 |
</output>
|
999 |
</layer>
|
1000 |
+
<layer id="73" name="Reshape_31649" type="Reshape" version="opset1">
|
1001 |
<data special_zero="false" />
|
1002 |
<input>
|
1003 |
<port id="0" precision="I64" />
|
|
|
1027 |
<port id="2" precision="I64" names="62,64" />
|
1028 |
</output>
|
1029 |
</layer>
|
1030 |
+
<layer id="76" name="Constant_24084" type="Const" version="opset1">
|
1031 |
<data element_type="i32" shape="" offset="66542811" size="4" />
|
1032 |
<output>
|
1033 |
<port id="0" precision="I32" />
|
1034 |
</output>
|
1035 |
</layer>
|
1036 |
+
<layer id="77" name="Unsqueeze_24085" type="Unsqueeze" version="opset1">
|
1037 |
<input>
|
1038 |
<port id="0" precision="I64" />
|
1039 |
<port id="1" precision="I32" />
|
|
|
1075 |
</port>
|
1076 |
</output>
|
1077 |
</layer>
|
1078 |
+
<layer id="80" name="ShapeOf_31655" type="ShapeOf" version="opset3">
|
1079 |
<data output_type="i32" />
|
1080 |
<input>
|
1081 |
<port id="0" precision="FP32">
|
|
|
1089 |
</port>
|
1090 |
</output>
|
1091 |
</layer>
|
1092 |
+
<layer id="81" name="Constant_31656" type="Const" version="opset1">
|
1093 |
<data element_type="i64" shape="" offset="67117607" size="8" />
|
1094 |
<output>
|
1095 |
<port id="0" precision="I64" />
|
1096 |
</output>
|
1097 |
</layer>
|
1098 |
+
<layer id="82" name="Constant_31657" type="Const" version="opset1">
|
1099 |
<data element_type="i64" shape="" offset="67117599" size="8" />
|
1100 |
<output>
|
1101 |
<port id="0" precision="I64" />
|
1102 |
</output>
|
1103 |
</layer>
|
1104 |
+
<layer id="83" name="Gather_31658" type="Gather" version="opset8">
|
1105 |
<data batch_dims="0" />
|
1106 |
<input>
|
1107 |
<port id="0" precision="I32">
|
|
|
1153 |
<port id="0" precision="I32" />
|
1154 |
</output>
|
1155 |
</layer>
|
1156 |
+
<layer id="88" name="Convert_31661" type="Convert" version="opset1">
|
1157 |
<data destination_type="i32" />
|
1158 |
<input>
|
1159 |
<port id="0" precision="I64" />
|
|
|
1295 |
</port>
|
1296 |
</output>
|
1297 |
</layer>
|
1298 |
+
<layer id="100" name="Constant_24187" type="Const" version="opset1">
|
1299 |
<data element_type="i64" shape="2" offset="70417515" size="16" />
|
1300 |
<output>
|
1301 |
<port id="0" precision="I64" names="70">
|
|
|
1412 |
</port>
|
1413 |
</output>
|
1414 |
</layer>
|
1415 |
+
<layer id="108" name="Constant_31639" type="Const" version="opset1">
|
1416 |
<data element_type="i64" shape="1" offset="67117599" size="8" />
|
1417 |
<output>
|
1418 |
<port id="0" precision="I64">
|
|
|
1420 |
</port>
|
1421 |
</output>
|
1422 |
</layer>
|
1423 |
+
<layer id="109" name="Constant_31640" type="Const" version="opset1">
|
1424 |
<data element_type="i64" shape="" offset="67117599" size="8" />
|
1425 |
<output>
|
1426 |
<port id="0" precision="I64" />
|
1427 |
</output>
|
1428 |
</layer>
|
1429 |
+
<layer id="110" name="Gather_31641" type="Gather" version="opset8">
|
1430 |
<data batch_dims="0" />
|
1431 |
<input>
|
1432 |
<port id="0" precision="I64">
|
|
|
1443 |
</port>
|
1444 |
</output>
|
1445 |
</layer>
|
1446 |
+
<layer id="111" name="Constant_30625" type="Const" version="opset1">
|
1447 |
<data element_type="i64" shape="1" offset="67117607" size="8" />
|
1448 |
<output>
|
1449 |
<port id="0" precision="I64">
|
|
|
1451 |
</port>
|
1452 |
</output>
|
1453 |
</layer>
|
1454 |
+
<layer id="112" name="Constant_30627" type="Const" version="opset1">
|
1455 |
<data element_type="i64" shape="1" offset="67117607" size="8" />
|
1456 |
<output>
|
1457 |
<port id="0" precision="I64">
|
|
|
1459 |
</port>
|
1460 |
</output>
|
1461 |
</layer>
|
1462 |
+
<layer id="113" name="Constant_30629" type="Const" version="opset1">
|
1463 |
<data element_type="i64" shape="1" offset="67117607" size="8" />
|
1464 |
<output>
|
1465 |
<port id="0" precision="I64">
|
|
|
1511 |
</port>
|
1512 |
</output>
|
1513 |
</layer>
|
1514 |
+
<layer id="116" name="Constant_24621" type="Const" version="opset1">
|
1515 |
<data element_type="i64" shape="1" offset="67117599" size="8" />
|
1516 |
<output>
|
1517 |
<port id="0" precision="I64">
|
|
|
1519 |
</port>
|
1520 |
</output>
|
1521 |
</layer>
|
1522 |
+
<layer id="117" name="ShapeOf_31670" type="ShapeOf" version="opset3">
|
1523 |
<data output_type="i64" />
|
1524 |
<input>
|
1525 |
<port id="0" precision="FP32">
|
|
|
1534 |
</port>
|
1535 |
</output>
|
1536 |
</layer>
|
1537 |
+
<layer id="118" name="Constant_31671" type="Const" version="opset1">
|
1538 |
<data element_type="i64" shape="1" offset="67117607" size="8" />
|
1539 |
<output>
|
1540 |
<port id="0" precision="I64">
|
|
|
1542 |
</port>
|
1543 |
</output>
|
1544 |
</layer>
|
1545 |
+
<layer id="119" name="Constant_31672" type="Const" version="opset1">
|
1546 |
<data element_type="i64" shape="" offset="67117599" size="8" />
|
1547 |
<output>
|
1548 |
<port id="0" precision="I64" />
|
1549 |
</output>
|
1550 |
</layer>
|
1551 |
+
<layer id="120" name="Gather_31673" type="Gather" version="opset8">
|
1552 |
<data batch_dims="0" />
|
1553 |
<input>
|
1554 |
<port id="0" precision="I64">
|
|
|
1565 |
</port>
|
1566 |
</output>
|
1567 |
</layer>
|
1568 |
+
<layer id="121" name="Constant_24624" type="Const" version="opset1">
|
1569 |
<data element_type="i64" shape="1" offset="67117607" size="8" />
|
1570 |
<output>
|
1571 |
<port id="0" precision="I64">
|
|
|
1664 |
</port>
|
1665 |
</output>
|
1666 |
</layer>
|
1667 |
+
<layer id="127" name="Convert_42716" type="Convert" version="opset1">
|
1668 |
<data destination_type="f16" />
|
1669 |
<input>
|
1670 |
<port id="0" precision="U8">
|
|
|
1688 |
</port>
|
1689 |
</output>
|
1690 |
</layer>
|
1691 |
+
<layer id="129" name="Convert_42719" type="Convert" version="opset1">
|
1692 |
<data destination_type="f16" />
|
1693 |
<input>
|
1694 |
<port id="0" precision="U8">
|
|
|
1786 |
</port>
|
1787 |
</output>
|
1788 |
</layer>
|
1789 |
+
<layer id="135" name="Constant_31393" type="Const" version="opset1">
|
1790 |
<data element_type="f32" shape="1, 1, 1280" offset="72059779" size="5120" />
|
1791 |
<output>
|
1792 |
<port id="0" precision="FP32">
|
|
|
1818 |
</port>
|
1819 |
</output>
|
1820 |
</layer>
|
1821 |
+
<layer id="137" name="Constant_31711" type="Const" version="opset1">
|
1822 |
<data element_type="i64" shape="4" offset="68775223" size="32" />
|
1823 |
<output>
|
1824 |
<port id="0" precision="I64">
|
|
|
1930 |
</port>
|
1931 |
</output>
|
1932 |
</layer>
|
1933 |
+
<layer id="144" name="Constant_31712" type="Const" version="opset1">
|
1934 |
<data element_type="i64" shape="3" offset="72064899" size="24" />
|
1935 |
<output>
|
1936 |
<port id="0" precision="I64">
|
|
|
1968 |
</port>
|
1969 |
</output>
|
1970 |
</layer>
|
1971 |
+
<layer id="147" name="Convert_42749" type="Convert" version="opset1">
|
1972 |
<data destination_type="f16" />
|
1973 |
<input>
|
1974 |
<port id="0" precision="U8">
|
|
|
1992 |
</port>
|
1993 |
</output>
|
1994 |
</layer>
|
1995 |
+
<layer id="149" name="Convert_42752" type="Convert" version="opset1">
|
1996 |
<data destination_type="f16" />
|
1997 |
<input>
|
1998 |
<port id="0" precision="U8">
|
|
|
2090 |
</port>
|
2091 |
</output>
|
2092 |
</layer>
|
2093 |
+
<layer id="155" name="Constant_31394" type="Const" version="opset1">
|
2094 |
<data element_type="f32" shape="1, 1, 1280" offset="73707163" size="5120" />
|
2095 |
<output>
|
2096 |
<port id="0" precision="FP32">
|
|
|
2172 |
</port>
|
2173 |
</output>
|
2174 |
</layer>
|
2175 |
+
<layer id="160" name="Constant_31395" type="Const" version="opset1">
|
2176 |
<data element_type="f32" shape="1, 1, 1280" offset="73712283" size="5120" />
|
2177 |
<output>
|
2178 |
<port id="0" precision="FP32">
|
|
|
2204 |
</port>
|
2205 |
</output>
|
2206 |
</layer>
|
2207 |
+
<layer id="162" name="Constant_31396" type="Const" version="opset1">
|
2208 |
<data element_type="f32" shape="1, 1, 1280" offset="73717403" size="5120" />
|
2209 |
<output>
|
2210 |
<port id="0" precision="FP32">
|
|
|
2236 |
</port>
|
2237 |
</output>
|
2238 |
</layer>
|
2239 |
+
<layer id="164" name="Constant_31296" type="Const" version="opset1">
|
2240 |
<data element_type="u8" shape="1280, 1280" offset="73722523" size="1638400" />
|
2241 |
<output>
|
2242 |
<port id="0" precision="U8">
|
|
|
2245 |
</port>
|
2246 |
</output>
|
2247 |
</layer>
|
2248 |
+
<layer id="165" name="Convert_42760" type="Convert" version="opset1">
|
2249 |
<data destination_type="f16" />
|
2250 |
<input>
|
2251 |
<port id="0" precision="U8">
|
|
|
2260 |
</port>
|
2261 |
</output>
|
2262 |
</layer>
|
2263 |
+
<layer id="166" name="Constant_31296/zero_point" type="Const" version="opset1">
|
2264 |
<data element_type="u8" shape="1280, 1" offset="75360923" size="1280" />
|
2265 |
<output>
|
2266 |
<port id="0" precision="U8">
|
|
|
2269 |
</port>
|
2270 |
</output>
|
2271 |
</layer>
|
2272 |
+
<layer id="167" name="Convert_42763" type="Convert" version="opset1">
|
2273 |
<data destination_type="f16" />
|
2274 |
<input>
|
2275 |
<port id="0" precision="U8">
|
|
|
2284 |
</port>
|
2285 |
</output>
|
2286 |
</layer>
|
2287 |
+
<layer id="168" name="Constant_31296/zero_point/subtract" type="Subtract" version="opset1">
|
2288 |
<data auto_broadcast="numpy" />
|
2289 |
<input>
|
2290 |
<port id="0" precision="FP16">
|
|
|
2303 |
</port>
|
2304 |
</output>
|
2305 |
</layer>
|
2306 |
+
<layer id="169" name="Constant_31296/scale" type="Const" version="opset1">
|
2307 |
<data element_type="f16" shape="1280, 1" offset="75362203" size="2560" />
|
2308 |
<output>
|
2309 |
<port id="0" precision="FP16">
|
|
|
2312 |
</port>
|
2313 |
</output>
|
2314 |
</layer>
|
2315 |
+
<layer id="170" name="Constant_31296/fq_weights_1" type="Multiply" version="opset1">
|
2316 |
<data auto_broadcast="numpy" />
|
2317 |
<input>
|
2318 |
<port id="0" precision="FP16">
|
|
|
2331 |
</port>
|
2332 |
</output>
|
2333 |
</layer>
|
2334 |
+
<layer id="171" name="Constant_31296/fq_weights_1/convert" type="Convert" version="opset1">
|
2335 |
<data destination_type="f32" />
|
2336 |
<input>
|
2337 |
<port id="0" precision="FP16">
|
|
|
2346 |
</port>
|
2347 |
</output>
|
2348 |
</layer>
|
2349 |
+
<layer id="172" name="Multiply_31280" type="MatMul" version="opset1">
|
2350 |
<data transpose_a="false" transpose_b="true" />
|
2351 |
<input>
|
2352 |
<port id="0" precision="FP32">
|
|
|
2367 |
</port>
|
2368 |
</output>
|
2369 |
</layer>
|
2370 |
+
<layer id="173" name="Constant_31397" type="Const" version="opset1">
|
2371 |
<data element_type="f32" shape="1, 1, 1280" offset="75364763" size="5120" />
|
2372 |
<output>
|
2373 |
<port id="0" precision="FP32">
|
|
|
2399 |
</port>
|
2400 |
</output>
|
2401 |
</layer>
|
2402 |
+
<layer id="175" name="Constant_31713" type="Const" version="opset1">
|
2403 |
<data element_type="i64" shape="4" offset="68775223" size="32" />
|
2404 |
<output>
|
2405 |
<port id="0" precision="I64">
|
|
|
2466 |
</port>
|
2467 |
</output>
|
2468 |
</layer>
|
2469 |
+
<layer id="180" name="Convert_42705" type="Convert" version="opset1">
|
2470 |
<data destination_type="f16" />
|
2471 |
<input>
|
2472 |
<port id="0" precision="U8">
|
|
|
2490 |
</port>
|
2491 |
</output>
|
2492 |
</layer>
|
2493 |
+
<layer id="182" name="Convert_42708" type="Convert" version="opset1">
|
2494 |
<data destination_type="f16" />
|
2495 |
<input>
|
2496 |
<port id="0" precision="U8">
|
|
|
2588 |
</port>
|
2589 |
</output>
|
2590 |
</layer>
|
2591 |
+
<layer id="188" name="Constant_24369" type="Const" version="opset1">
|
2592 |
<data element_type="i64" shape="1" offset="77012123" size="8" />
|
2593 |
<output>
|
2594 |
<port id="0" precision="I64">
|
|
|
2596 |
</port>
|
2597 |
</output>
|
2598 |
</layer>
|
2599 |
+
<layer id="189" name="Constant_24370" type="Const" version="opset1">
|
2600 |
<data element_type="i64" shape="1" offset="77012131" size="8" />
|
2601 |
<output>
|
2602 |
<port id="0" precision="I64">
|
|
|
2604 |
</port>
|
2605 |
</output>
|
2606 |
</layer>
|
2607 |
+
<layer id="190" name="Constant_24371" type="Const" version="opset1">
|
2608 |
<data element_type="i64" shape="1" offset="77012139" size="8" />
|
2609 |
<output>
|
2610 |
<port id="0" precision="I64">
|
|
|
2612 |
</port>
|
2613 |
</output>
|
2614 |
</layer>
|
2615 |
+
<layer id="191" name="__module.model.model.decoder.layers.0.self_attn/prim::ListConstruct_1" type="Concat" version="opset1">
|
2616 |
<data axis="0" />
|
2617 |
<input>
|
2618 |
<port id="0" precision="I64">
|
|
|
2737 |
</port>
|
2738 |
</output>
|
2739 |
</layer>
|
2740 |
+
<layer id="198" name="Convert_42694" type="Convert" version="opset1">
|
2741 |
<data destination_type="f16" />
|
2742 |
<input>
|
2743 |
<port id="0" precision="U8">
|
|
|
2761 |
</port>
|
2762 |
</output>
|
2763 |
</layer>
|
2764 |
+
<layer id="200" name="Convert_42697" type="Convert" version="opset1">
|
2765 |
<data destination_type="f16" />
|
2766 |
<input>
|
2767 |
<port id="0" precision="U8">
|
|
|
2859 |
</port>
|
2860 |
</output>
|
2861 |
</layer>
|
2862 |
+
<layer id="206" name="Constant_31398" type="Const" version="opset1">
|
2863 |
<data element_type="f32" shape="1, 1, 1280" offset="78654387" size="5120" />
|
2864 |
<output>
|
2865 |
<port id="0" precision="FP32">
|
|
|
2995 |
</port>
|
2996 |
</output>
|
2997 |
</layer>
|
2998 |
+
<layer id="214" name="Constant_31714" type="Const" version="opset1">
|
2999 |
<data element_type="i64" shape="3" offset="78659507" size="24" />
|
3000 |
<output>
|
3001 |
<port id="0" precision="I64">
|
|
|
3033 |
</port>
|
3034 |
</output>
|
3035 |
</layer>
|
3036 |
+
<layer id="217" name="Convert_42771" type="Convert" version="opset1">
|
3037 |
<data destination_type="f16" />
|
3038 |
<input>
|
3039 |
<port id="0" precision="U8">
|
|
|
3057 |
</port>
|
3058 |
</output>
|
3059 |
</layer>
|
3060 |
+
<layer id="219" name="Convert_42774" type="Convert" version="opset1">
|
3061 |
<data destination_type="f16" />
|
3062 |
<input>
|
3063 |
<port id="0" precision="U8">
|
|
|
3155 |
</port>
|
3156 |
</output>
|
3157 |
</layer>
|
3158 |
+
<layer id="225" name="Constant_31399" type="Const" version="opset1">
|
3159 |
<data element_type="f32" shape="1, 1, 1280" offset="80301771" size="5120" />
|
3160 |
<output>
|
3161 |
<port id="0" precision="FP32">
|
|
|
3237 |
</port>
|
3238 |
</output>
|
3239 |
</layer>
|
3240 |
+
<layer id="230" name="Constant_31400" type="Const" version="opset1">
|
3241 |
<data element_type="f32" shape="1, 1, 1280" offset="80306891" size="5120" />
|
3242 |
<output>
|
3243 |
<port id="0" precision="FP32">
|
|
|
3269 |
</port>
|
3270 |
</output>
|
3271 |
</layer>
|
3272 |
+
<layer id="232" name="Constant_31401" type="Const" version="opset1">
|
3273 |
<data element_type="f32" shape="1, 1, 1280" offset="80312011" size="5120" />
|
3274 |
<output>
|
3275 |
<port id="0" precision="FP32">
|
|
|
3310 |
</port>
|
3311 |
</output>
|
3312 |
</layer>
|
3313 |
+
<layer id="235" name="Convert_42628" type="Convert" version="opset1">
|
3314 |
<data destination_type="f16" />
|
3315 |
<input>
|
3316 |
<port id="0" precision="U8">
|
|
|
3334 |
</port>
|
3335 |
</output>
|
3336 |
</layer>
|
3337 |
+
<layer id="237" name="Convert_42631" type="Convert" version="opset1">
|
3338 |
<data destination_type="f16" />
|
3339 |
<input>
|
3340 |
<port id="0" precision="U8">
|
|
|
3432 |
</port>
|
3433 |
</output>
|
3434 |
</layer>
|
3435 |
+
<layer id="243" name="Constant_31402" type="Const" version="opset1">
|
3436 |
<data element_type="f32" shape="1, 1, 5120" offset="86886091" size="20480" />
|
3437 |
<output>
|
3438 |
<port id="0" precision="FP32">
|
|
|
3490 |
</port>
|
3491 |
</output>
|
3492 |
</layer>
|
3493 |
+
<layer id="247" name="Convert_42639" type="Convert" version="opset1">
|
3494 |
<data destination_type="f16" />
|
3495 |
<input>
|
3496 |
<port id="0" precision="U8">
|
|
|
3514 |
</port>
|
3515 |
</output>
|
3516 |
</layer>
|
3517 |
+
<layer id="249" name="Convert_42642" type="Convert" version="opset1">
|
3518 |
<data destination_type="f16" />
|
3519 |
<input>
|
3520 |
<port id="0" precision="U8">
|
|
|
3612 |
</port>
|
3613 |
</output>
|
3614 |
</layer>
|
3615 |
+
<layer id="255" name="Constant_31403" type="Const" version="opset1">
|
3616 |
<data element_type="f32" shape="1, 1, 1280" offset="93464011" size="5120" />
|
3617 |
<output>
|
3618 |
<port id="0" precision="FP32">
|
|
|
3694 |
</port>
|
3695 |
</output>
|
3696 |
</layer>
|
3697 |
+
<layer id="260" name="Constant_31404" type="Const" version="opset1">
|
3698 |
<data element_type="f32" shape="1, 1, 1280" offset="93469131" size="5120" />
|
3699 |
<output>
|
3700 |
<port id="0" precision="FP32">
|
|
|
3726 |
</port>
|
3727 |
</output>
|
3728 |
</layer>
|
3729 |
+
<layer id="262" name="Constant_31405" type="Const" version="opset1">
|
3730 |
<data element_type="f32" shape="1, 1, 1280" offset="93474251" size="5120" />
|
3731 |
<output>
|
3732 |
<port id="0" precision="FP32">
|
|
|
3758 |
</port>
|
3759 |
</output>
|
3760 |
</layer>
|
3761 |
+
<layer id="264" name="Constant_31299" type="Const" version="opset1">
|
3762 |
<data element_type="u8" shape="1280, 1280" offset="93479371" size="1638400" />
|
3763 |
<output>
|
3764 |
<port id="0" precision="U8">
|
|
|
3767 |
</port>
|
3768 |
</output>
|
3769 |
</layer>
|
3770 |
+
<layer id="265" name="Convert_42804" type="Convert" version="opset1">
|
3771 |
<data destination_type="f16" />
|
3772 |
<input>
|
3773 |
<port id="0" precision="U8">
|
|
|
3782 |
</port>
|
3783 |
</output>
|
3784 |
</layer>
|
3785 |
+
<layer id="266" name="Constant_31299/zero_point" type="Const" version="opset1">
|
3786 |
<data element_type="u8" shape="1280, 1" offset="95117771" size="1280" />
|
3787 |
<output>
|
3788 |
<port id="0" precision="U8">
|
|
|
3791 |
</port>
|
3792 |
</output>
|
3793 |
</layer>
|
3794 |
+
<layer id="267" name="Convert_42807" type="Convert" version="opset1">
|
3795 |
<data destination_type="f16" />
|
3796 |
<input>
|
3797 |
<port id="0" precision="U8">
|
|
|
3806 |
</port>
|
3807 |
</output>
|
3808 |
</layer>
|
3809 |
+
<layer id="268" name="Constant_31299/zero_point/subtract" type="Subtract" version="opset1">
|
3810 |
<data auto_broadcast="numpy" />
|
3811 |
<input>
|
3812 |
<port id="0" precision="FP16">
|
|
|
3825 |
</port>
|
3826 |
</output>
|
3827 |
</layer>
|
3828 |
+
<layer id="269" name="Constant_31299/scale" type="Const" version="opset1">
|
3829 |
<data element_type="f16" shape="1280, 1" offset="95119051" size="2560" />
|
3830 |
<output>
|
3831 |
<port id="0" precision="FP16">
|
|
|
3834 |
</port>
|
3835 |
</output>
|
3836 |
</layer>
|
3837 |
+
<layer id="270" name="Constant_31299/fq_weights_1" type="Multiply" version="opset1">
|
3838 |
<data auto_broadcast="numpy" />
|
3839 |
<input>
|
3840 |
<port id="0" precision="FP16">
|
|
|
3853 |
</port>
|
3854 |
</output>
|
3855 |
</layer>
|
3856 |
+
<layer id="271" name="Constant_31299/fq_weights_1/convert" type="Convert" version="opset1">
|
3857 |
<data destination_type="f32" />
|
3858 |
<input>
|
3859 |
<port id="0" precision="FP16">
|
|
|
3868 |
</port>
|
3869 |
</output>
|
3870 |
</layer>
|
3871 |
+
<layer id="272" name="Multiply_31284" type="MatMul" version="opset1">
|
3872 |
<data transpose_a="false" transpose_b="true" />
|
3873 |
<input>
|
3874 |
<port id="0" precision="FP32">
|
|
|
3889 |
</port>
|
3890 |
</output>
|
3891 |
</layer>
|
3892 |
+
<layer id="273" name="Constant_31406" type="Const" version="opset1">
|
3893 |
<data element_type="f32" shape="1, 1, 1280" offset="95121611" size="5120" />
|
3894 |
<output>
|
3895 |
<port id="0" precision="FP32">
|
|
|
3921 |
</port>
|
3922 |
</output>
|
3923 |
</layer>
|
3924 |
+
<layer id="275" name="Constant_31715" type="Const" version="opset1">
|
3925 |
<data element_type="i64" shape="4" offset="68775223" size="32" />
|
3926 |
<output>
|
3927 |
<port id="0" precision="I64">
|
|
|
3988 |
</port>
|
3989 |
</output>
|
3990 |
</layer>
|
3991 |
+
<layer id="280" name="Convert_42793" type="Convert" version="opset1">
|
3992 |
<data destination_type="f16" />
|
3993 |
<input>
|
3994 |
<port id="0" precision="U8">
|
|
|
4012 |
</port>
|
4013 |
</output>
|
4014 |
</layer>
|
4015 |
+
<layer id="282" name="Convert_42796" type="Convert" version="opset1">
|
4016 |
<data destination_type="f16" />
|
4017 |
<input>
|
4018 |
<port id="0" precision="U8">
|
|
|
4110 |
</port>
|
4111 |
</output>
|
4112 |
</layer>
|
4113 |
+
<layer id="288" name="Constant_31716" type="Const" version="opset1">
|
4114 |
<data element_type="i64" shape="4" offset="68775223" size="32" />
|
4115 |
<output>
|
4116 |
<port id="0" precision="I64">
|
|
|
4246 |
</port>
|
4247 |
</output>
|
4248 |
</layer>
|
4249 |
+
<layer id="296" name="Convert_42782" type="Convert" version="opset1">
|
4250 |
<data destination_type="f16" />
|
4251 |
<input>
|
4252 |
<port id="0" precision="U8">
|
|
|
4270 |
</port>
|
4271 |
</output>
|
4272 |
</layer>
|
4273 |
+
<layer id="298" name="Convert_42785" type="Convert" version="opset1">
|
4274 |
<data destination_type="f16" />
|
4275 |
<input>
|
4276 |
<port id="0" precision="U8">
|
|
|
4368 |
</port>
|
4369 |
</output>
|
4370 |
</layer>
|
4371 |
+
<layer id="304" name="Constant_31407" type="Const" version="opset1">
|
4372 |
<data element_type="f32" shape="1, 1, 1280" offset="98411211" size="5120" />
|
4373 |
<output>
|
4374 |
<port id="0" precision="FP32">
|
|
|
4400 |
</port>
|
4401 |
</output>
|
4402 |
</layer>
|
4403 |
+
<layer id="306" name="Constant_31717" type="Const" version="opset1">
|
4404 |
<data element_type="i64" shape="4" offset="68775223" size="32" />
|
4405 |
<output>
|
4406 |
<port id="0" precision="I64">
|
|
|
4512 |
</port>
|
4513 |
</output>
|
4514 |
</layer>
|
4515 |
+
<layer id="313" name="Constant_31718" type="Const" version="opset1">
|
4516 |
<data element_type="i64" shape="3" offset="72064899" size="24" />
|
4517 |
<output>
|
4518 |
<port id="0" precision="I64">
|
|
|
4550 |
</port>
|
4551 |
</output>
|
4552 |
</layer>
|
4553 |
+
<layer id="316" name="Convert_42815" type="Convert" version="opset1">
|
4554 |
<data destination_type="f16" />
|
4555 |
<input>
|
4556 |
<port id="0" precision="U8">
|
|
|
4574 |
</port>
|
4575 |
</output>
|
4576 |
</layer>
|
4577 |
+
<layer id="318" name="Convert_42818" type="Convert" version="opset1">
|
4578 |
<data destination_type="f16" />
|
4579 |
<input>
|
4580 |
<port id="0" precision="U8">
|
|
|
4672 |
</port>
|
4673 |
</output>
|
4674 |
</layer>
|
4675 |
+
<layer id="324" name="Constant_31408" type="Const" version="opset1">
|
4676 |
<data element_type="f32" shape="1, 1, 1280" offset="100058571" size="5120" />
|
4677 |
<output>
|
4678 |
<port id="0" precision="FP32">
|
|
|
4754 |
</port>
|
4755 |
</output>
|
4756 |
</layer>
|
4757 |
+
<layer id="329" name="Constant_31409" type="Const" version="opset1">
|
4758 |
<data element_type="f32" shape="1, 1, 1280" offset="100063691" size="5120" />
|
4759 |
<output>
|
4760 |
<port id="0" precision="FP32">
|
|
|
4786 |
</port>
|
4787 |
</output>
|
4788 |
</layer>
|
4789 |
+
<layer id="331" name="Constant_31410" type="Const" version="opset1">
|
4790 |
<data element_type="f32" shape="1, 1, 1280" offset="100068811" size="5120" />
|
4791 |
<output>
|
4792 |
<port id="0" precision="FP32">
|
|
|
4818 |
</port>
|
4819 |
</output>
|
4820 |
</layer>
|
4821 |
+
<layer id="333" name="Constant_31302" type="Const" version="opset1">
|
4822 |
<data element_type="u8" shape="1280, 1280" offset="100073931" size="1638400" />
|
4823 |
<output>
|
4824 |
<port id="0" precision="U8">
|
|
|
4827 |
</port>
|
4828 |
</output>
|
4829 |
</layer>
|
4830 |
+
<layer id="334" name="Convert_42826" type="Convert" version="opset1">
|
4831 |
<data destination_type="f16" />
|
4832 |
<input>
|
4833 |
<port id="0" precision="U8">
|
|
|
4842 |
</port>
|
4843 |
</output>
|
4844 |
</layer>
|
4845 |
+
<layer id="335" name="Constant_31302/zero_point" type="Const" version="opset1">
|
4846 |
<data element_type="u8" shape="1280, 1" offset="101712331" size="1280" />
|
4847 |
<output>
|
4848 |
<port id="0" precision="U8">
|
|
|
4851 |
</port>
|
4852 |
</output>
|
4853 |
</layer>
|
4854 |
+
<layer id="336" name="Convert_42829" type="Convert" version="opset1">
|
4855 |
<data destination_type="f16" />
|
4856 |
<input>
|
4857 |
<port id="0" precision="U8">
|
|
|
4866 |
</port>
|
4867 |
</output>
|
4868 |
</layer>
|
4869 |
+
<layer id="337" name="Constant_31302/zero_point/subtract" type="Subtract" version="opset1">
|
4870 |
<data auto_broadcast="numpy" />
|
4871 |
<input>
|
4872 |
<port id="0" precision="FP16">
|
|
|
4885 |
</port>
|
4886 |
</output>
|
4887 |
</layer>
|
4888 |
+
<layer id="338" name="Constant_31302/scale" type="Const" version="opset1">
|
4889 |
<data element_type="f16" shape="1280, 1" offset="101713611" size="2560" />
|
4890 |
<output>
|
4891 |
<port id="0" precision="FP16">
|
|
|
4894 |
</port>
|
4895 |
</output>
|
4896 |
</layer>
|
4897 |
+
<layer id="339" name="Constant_31302/fq_weights_1" type="Multiply" version="opset1">
|
4898 |
<data auto_broadcast="numpy" />
|
4899 |
<input>
|
4900 |
<port id="0" precision="FP16">
|
|
|
4913 |
</port>
|
4914 |
</output>
|
4915 |
</layer>
|
4916 |
+
<layer id="340" name="Constant_31302/fq_weights_1/convert" type="Convert" version="opset1">
|
4917 |
<data destination_type="f32" />
|
4918 |
<input>
|
4919 |
<port id="0" precision="FP16">
|
|
|
4928 |
</port>
|
4929 |
</output>
|
4930 |
</layer>
|
4931 |
+
<layer id="341" name="Multiply_31288" type="MatMul" version="opset1">
|
4932 |
<data transpose_a="false" transpose_b="true" />
|
4933 |
<input>
|
4934 |
<port id="0" precision="FP32">
|
|
|
4949 |
</port>
|
4950 |
</output>
|
4951 |
</layer>
|
4952 |
+
<layer id="342" name="Constant_31411" type="Const" version="opset1">
|
4953 |
<data element_type="f32" shape="1, 1, 1280" offset="101716171" size="5120" />
|
4954 |
<output>
|
4955 |
<port id="0" precision="FP32">
|
|
|
4981 |
</port>
|
4982 |
</output>
|
4983 |
</layer>
|
4984 |
+
<layer id="344" name="Constant_31719" type="Const" version="opset1">
|
4985 |
<data element_type="i64" shape="4" offset="68775223" size="32" />
|
4986 |
<output>
|
4987 |
<port id="0" precision="I64">
|
|
|
5048 |
</port>
|
5049 |
</output>
|
5050 |
</layer>
|
5051 |
+
<layer id="349" name="Convert_42683" type="Convert" version="opset1">
|
5052 |
<data destination_type="f16" />
|
5053 |
<input>
|
5054 |
<port id="0" precision="U8">
|
|
|
5072 |
</port>
|
5073 |
</output>
|
5074 |
</layer>
|
5075 |
+
<layer id="351" name="Convert_42686" type="Convert" version="opset1">
|
5076 |
<data destination_type="f16" />
|
5077 |
<input>
|
5078 |
<port id="0" precision="U8">
|
|
|
5273 |
</port>
|
5274 |
</output>
|
5275 |
</layer>
|
5276 |
+
<layer id="363" name="Convert_42672" type="Convert" version="opset1">
|
5277 |
<data destination_type="f16" />
|
5278 |
<input>
|
5279 |
<port id="0" precision="U8">
|
|
|
5297 |
</port>
|
5298 |
</output>
|
5299 |
</layer>
|
5300 |
+
<layer id="365" name="Convert_42675" type="Convert" version="opset1">
|
5301 |
<data destination_type="f16" />
|
5302 |
<input>
|
5303 |
<port id="0" precision="U8">
|
|
|
5395 |
</port>
|
5396 |
</output>
|
5397 |
</layer>
|
5398 |
+
<layer id="371" name="Constant_31412" type="Const" version="opset1">
|
5399 |
<data element_type="f32" shape="1, 1, 1280" offset="105005771" size="5120" />
|
5400 |
<output>
|
5401 |
<port id="0" precision="FP32">
|
|
|
5531 |
</port>
|
5532 |
</output>
|
5533 |
</layer>
|
5534 |
+
<layer id="379" name="Constant_31720" type="Const" version="opset1">
|
5535 |
<data element_type="i64" shape="3" offset="78659507" size="24" />
|
5536 |
<output>
|
5537 |
<port id="0" precision="I64">
|
|
|
5569 |
</port>
|
5570 |
</output>
|
5571 |
</layer>
|
5572 |
+
<layer id="382" name="Convert_42837" type="Convert" version="opset1">
|
5573 |
<data destination_type="f16" />
|
5574 |
<input>
|
5575 |
<port id="0" precision="U8">
|
|
|
5593 |
</port>
|
5594 |
</output>
|
5595 |
</layer>
|
5596 |
+
<layer id="384" name="Convert_42840" type="Convert" version="opset1">
|
5597 |
<data destination_type="f16" />
|
5598 |
<input>
|
5599 |
<port id="0" precision="U8">
|
|
|
5691 |
</port>
|
5692 |
</output>
|
5693 |
</layer>
|
5694 |
+
<layer id="390" name="Constant_31413" type="Const" version="opset1">
|
5695 |
<data element_type="f32" shape="1, 1, 1280" offset="106653131" size="5120" />
|
5696 |
<output>
|
5697 |
<port id="0" precision="FP32">
|
|
|
5773 |
</port>
|
5774 |
</output>
|
5775 |
</layer>
|
5776 |
+
<layer id="395" name="Constant_31414" type="Const" version="opset1">
|
5777 |
<data element_type="f32" shape="1, 1, 1280" offset="106658251" size="5120" />
|
5778 |
<output>
|
5779 |
<port id="0" precision="FP32">
|
|
|
5805 |
</port>
|
5806 |
</output>
|
5807 |
</layer>
|
5808 |
+
<layer id="397" name="Constant_31415" type="Const" version="opset1">
|
5809 |
<data element_type="f32" shape="1, 1, 1280" offset="106663371" size="5120" />
|
5810 |
<output>
|
5811 |
<port id="0" precision="FP32">
|
|
|
5846 |
</port>
|
5847 |
</output>
|
5848 |
</layer>
|
5849 |
+
<layer id="400" name="Convert_42650" type="Convert" version="opset1">
|
5850 |
<data destination_type="f16" />
|
5851 |
<input>
|
5852 |
<port id="0" precision="U8">
|
|
|
5870 |
</port>
|
5871 |
</output>
|
5872 |
</layer>
|
5873 |
+
<layer id="402" name="Convert_42653" type="Convert" version="opset1">
|
5874 |
<data destination_type="f16" />
|
5875 |
<input>
|
5876 |
<port id="0" precision="U8">
|
|
|
5968 |
</port>
|
5969 |
</output>
|
5970 |
</layer>
|
5971 |
+
<layer id="408" name="Constant_31416" type="Const" version="opset1">
|
5972 |
<data element_type="f32" shape="1, 1, 5120" offset="113237451" size="20480" />
|
5973 |
<output>
|
5974 |
<port id="0" precision="FP32">
|
|
|
6026 |
</port>
|
6027 |
</output>
|
6028 |
</layer>
|
6029 |
+
<layer id="412" name="Convert_42661" type="Convert" version="opset1">
|
6030 |
<data destination_type="f16" />
|
6031 |
<input>
|
6032 |
<port id="0" precision="U8">
|
|
|
6050 |
</port>
|
6051 |
</output>
|
6052 |
</layer>
|
6053 |
+
<layer id="414" name="Convert_42664" type="Convert" version="opset1">
|
6054 |
<data destination_type="f16" />
|
6055 |
<input>
|
6056 |
<port id="0" precision="U8">
|
|
|
6148 |
</port>
|
6149 |
</output>
|
6150 |
</layer>
|
6151 |
+
<layer id="420" name="Constant_31417" type="Const" version="opset1">
|
6152 |
<data element_type="f32" shape="1, 1, 1280" offset="119815371" size="5120" />
|
6153 |
<output>
|
6154 |
<port id="0" precision="FP32">
|
|
|
6230 |
</port>
|
6231 |
</output>
|
6232 |
</layer>
|
6233 |
+
<layer id="425" name="Constant_31418" type="Const" version="opset1">
|
6234 |
<data element_type="f32" shape="1, 1, 1280" offset="119820491" size="5120" />
|
6235 |
<output>
|
6236 |
<port id="0" precision="FP32">
|
|
|
6262 |
</port>
|
6263 |
</output>
|
6264 |
</layer>
|
6265 |
+
<layer id="427" name="Constant_31419" type="Const" version="opset1">
|
6266 |
<data element_type="f32" shape="1, 1, 1280" offset="119825611" size="5120" />
|
6267 |
<output>
|
6268 |
<port id="0" precision="FP32">
|
|
|
6315 |
</port>
|
6316 |
</output>
|
6317 |
</layer>
|
6318 |
+
<layer id="430" name="Result_26206" type="Result" version="opset1">
|
6319 |
<input>
|
6320 |
<port id="0" precision="FP32">
|
6321 |
<dim>-1</dim>
|
|
|
6792 |
<edge from-layer="429" from-port="2" to-layer="430" to-port="0" />
|
6793 |
</edges>
|
6794 |
<rt_info>
|
6795 |
+
<Runtime_version value="2024.5.0-17285-ea5c1dcfdf9-releases/2024/5" />
|
6796 |
<conversion_parameters>
|
6797 |
<framework value="pytorch" />
|
6798 |
<is_python_object value="True" />
|
|
|
6800 |
<nncf>
|
6801 |
<friendly_names_were_updated value="True" />
|
6802 |
<weight_compression>
|
6803 |
+
<advanced_parameters value="{'statistics_path': None, 'awq_params': {'subset_size': 32, 'percent_to_apply': 0.002, 'alpha_min': 0.0, 'alpha_max': 1.0, 'steps': 100}, 'scale_estimation_params': {'subset_size': 64, 'initial_steps': 5, 'scale_steps': 5, 'weight_penalty': -1.0}, 'gptq_params': {'damp_percent': 0.1, 'block_size': 128, 'subset_size': 128}, 'lora_correction_params': {'adapter_rank': 8, 'num_iterations': 3, 'apply_regularization': True, 'subset_size': 128, 'use_int8_adapters': True}}" />
|
6804 |
<all_layers value="False" />
|
6805 |
<awq value="False" />
|
6806 |
+
<backup_mode value="int8_asym" />
|
6807 |
<gptq value="False" />
|
6808 |
<group_size value="-1" />
|
6809 |
<ignored_scope value="[]" />
|
|
|
6815 |
</weight_compression>
|
6816 |
</nncf>
|
6817 |
<optimum>
|
6818 |
+
<optimum_intel_version value="1.21.0.dev0+d357376" />
|
6819 |
+
<optimum_version value="1.23.3" />
|
6820 |
+
<pytorch_version value="2.5.1" />
|
6821 |
+
<transformers_version value="4.46.3" />
|
6822 |
</optimum>
|
6823 |
</rt_info>
|
6824 |
</net>
|
openvino_detokenizer.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 528297
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:369dbe475202046c9ed61f55e4c32ce00c4f821af815f8a7f70523fba0155491
|
3 |
size 528297
|
openvino_detokenizer.xml
CHANGED
@@ -1,16 +1,16 @@
|
|
1 |
<?xml version="1.0"?>
|
2 |
<net name="detokenizer" version="11">
|
3 |
<layers>
|
4 |
-
<layer id="0" name="
|
5 |
<data shape="?,?" element_type="i64" />
|
6 |
<output>
|
7 |
-
<port id="0" precision="I64" names="
|
8 |
<dim>-1</dim>
|
9 |
<dim>-1</dim>
|
10 |
</port>
|
11 |
</output>
|
12 |
</layer>
|
13 |
-
<layer id="1" name="
|
14 |
<data destination_type="i32" />
|
15 |
<input>
|
16 |
<port id="0" precision="I64">
|
@@ -25,7 +25,7 @@
|
|
25 |
</port>
|
26 |
</output>
|
27 |
</layer>
|
28 |
-
<layer id="2" name="
|
29 |
<data element_type="u8" shape="528248" offset="0" size="528248" />
|
30 |
<output>
|
31 |
<port id="0" precision="U8">
|
@@ -33,7 +33,7 @@
|
|
33 |
</port>
|
34 |
</output>
|
35 |
</layer>
|
36 |
-
<layer id="3" name="
|
37 |
<data mode="begins_ends" />
|
38 |
<input>
|
39 |
<port id="0" precision="U8">
|
@@ -52,7 +52,7 @@
|
|
52 |
</port>
|
53 |
</output>
|
54 |
</layer>
|
55 |
-
<layer id="4" name="
|
56 |
<data skip_tokens="50257, 50258, 50259, 50260, 50261, 50262, 50263, 50264, 50265, 50266, 50267, 50268, 50269, 50270, 50271, 50272, 50273, 50274, 50275, 50276, 50277, 50278, 50279, 50280, 50281, 50282, 50283, 50284, 50285, 50286, 50287, 50288, 50289, 50290, 50291, 50292, 50293, 50294, 50295, 50296, 50297, 50298, 50299, 50300, 50301, 50302, 50303, 50304, 50305, 50306, 50307, 50308, 50309, 50310, 50311, 50312, 50313, 50314, 50315, 50316, 50317, 50318, 50319, 50320, 50321, 50322, 50323, 50324, 50325, 50326, 50327, 50328, 50329, 50330, 50331, 50332, 50333, 50334, 50335, 50336, 50337, 50338, 50339, 50340, 50341, 50342, 50343, 50344, 50345, 50346, 50347, 50348, 50349, 50350, 50351, 50352, 50353, 50354, 50355, 50356, 50357, 50358, 50359, 50360, 50361, 50362, 50363" />
|
57 |
<input>
|
58 |
<port id="0" precision="I32">
|
@@ -87,7 +87,7 @@
|
|
87 |
</port>
|
88 |
</output>
|
89 |
</layer>
|
90 |
-
<layer id="5" name="
|
91 |
<input>
|
92 |
<port id="0" precision="I32">
|
93 |
<dim>-1</dim>
|
@@ -111,7 +111,7 @@
|
|
111 |
</port>
|
112 |
</output>
|
113 |
</layer>
|
114 |
-
<layer id="6" name="
|
115 |
<data element_type="u8" shape="47" offset="528248" size="47" />
|
116 |
<output>
|
117 |
<port id="0" precision="U8">
|
@@ -119,7 +119,7 @@
|
|
119 |
</port>
|
120 |
</output>
|
121 |
</layer>
|
122 |
-
<layer id="7" name="
|
123 |
<data element_type="u8" shape="2" offset="528295" size="2" />
|
124 |
<output>
|
125 |
<port id="0" precision="U8">
|
@@ -127,7 +127,7 @@
|
|
127 |
</port>
|
128 |
</output>
|
129 |
</layer>
|
130 |
-
<layer id="8" name="
|
131 |
<data global_replace="true" />
|
132 |
<input>
|
133 |
<port id="0" precision="I32">
|
@@ -158,7 +158,7 @@
|
|
158 |
</port>
|
159 |
</output>
|
160 |
</layer>
|
161 |
-
<layer id="9" name="
|
162 |
<data mode="begins_ends" />
|
163 |
<input>
|
164 |
<port id="0" precision="I32">
|
@@ -177,7 +177,7 @@
|
|
177 |
</port>
|
178 |
</output>
|
179 |
</layer>
|
180 |
-
<layer id="10" name="
|
181 |
<input>
|
182 |
<port id="0" precision="STRING">
|
183 |
<dim>-1</dim>
|
@@ -207,9 +207,29 @@
|
|
207 |
<edge from-layer="9" from-port="3" to-layer="10" to-port="0" />
|
208 |
</edges>
|
209 |
<rt_info>
|
|
|
|
|
|
|
210 |
<bos_token_id value="50257" />
|
|
|
|
|
211 |
<eos_token_id value="50257" />
|
|
|
|
|
|
|
|
|
212 |
<original_tokenizer_class value="<class 'transformers.models.whisper.tokenization_whisper_fast.WhisperTokenizerFast'>" />
|
213 |
<pad_token_id value="50257" />
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
214 |
</rt_info>
|
215 |
</net>
|
|
|
1 |
<?xml version="1.0"?>
|
2 |
<net name="detokenizer" version="11">
|
3 |
<layers>
|
4 |
+
<layer id="0" name="Parameter_32766" type="Parameter" version="opset1">
|
5 |
<data shape="?,?" element_type="i64" />
|
6 |
<output>
|
7 |
+
<port id="0" precision="I64" names="Parameter_32766">
|
8 |
<dim>-1</dim>
|
9 |
<dim>-1</dim>
|
10 |
</port>
|
11 |
</output>
|
12 |
</layer>
|
13 |
+
<layer id="1" name="Convert_32782" type="Convert" version="opset1">
|
14 |
<data destination_type="i32" />
|
15 |
<input>
|
16 |
<port id="0" precision="I64">
|
|
|
25 |
</port>
|
26 |
</output>
|
27 |
</layer>
|
28 |
+
<layer id="2" name="Constant_32721" type="Const" version="opset1">
|
29 |
<data element_type="u8" shape="528248" offset="0" size="528248" />
|
30 |
<output>
|
31 |
<port id="0" precision="U8">
|
|
|
33 |
</port>
|
34 |
</output>
|
35 |
</layer>
|
36 |
+
<layer id="3" name="StringTensorUnpack_32722" type="StringTensorUnpack" version="extension">
|
37 |
<data mode="begins_ends" />
|
38 |
<input>
|
39 |
<port id="0" precision="U8">
|
|
|
52 |
</port>
|
53 |
</output>
|
54 |
</layer>
|
55 |
+
<layer id="4" name="VocabDecoder_32767" type="VocabDecoder" version="extension">
|
56 |
<data skip_tokens="50257, 50258, 50259, 50260, 50261, 50262, 50263, 50264, 50265, 50266, 50267, 50268, 50269, 50270, 50271, 50272, 50273, 50274, 50275, 50276, 50277, 50278, 50279, 50280, 50281, 50282, 50283, 50284, 50285, 50286, 50287, 50288, 50289, 50290, 50291, 50292, 50293, 50294, 50295, 50296, 50297, 50298, 50299, 50300, 50301, 50302, 50303, 50304, 50305, 50306, 50307, 50308, 50309, 50310, 50311, 50312, 50313, 50314, 50315, 50316, 50317, 50318, 50319, 50320, 50321, 50322, 50323, 50324, 50325, 50326, 50327, 50328, 50329, 50330, 50331, 50332, 50333, 50334, 50335, 50336, 50337, 50338, 50339, 50340, 50341, 50342, 50343, 50344, 50345, 50346, 50347, 50348, 50349, 50350, 50351, 50352, 50353, 50354, 50355, 50356, 50357, 50358, 50359, 50360, 50361, 50362, 50363" />
|
57 |
<input>
|
58 |
<port id="0" precision="I32">
|
|
|
87 |
</port>
|
88 |
</output>
|
89 |
</layer>
|
90 |
+
<layer id="5" name="FuzeRagged_32768" type="FuzeRagged" version="extension">
|
91 |
<input>
|
92 |
<port id="0" precision="I32">
|
93 |
<dim>-1</dim>
|
|
|
111 |
</port>
|
112 |
</output>
|
113 |
</layer>
|
114 |
+
<layer id="6" name="Constant_32770" type="Const" version="opset1">
|
115 |
<data element_type="u8" shape="47" offset="528248" size="47" />
|
116 |
<output>
|
117 |
<port id="0" precision="U8">
|
|
|
119 |
</port>
|
120 |
</output>
|
121 |
</layer>
|
122 |
+
<layer id="7" name="Constant_32772" type="Const" version="opset1">
|
123 |
<data element_type="u8" shape="2" offset="528295" size="2" />
|
124 |
<output>
|
125 |
<port id="0" precision="U8">
|
|
|
127 |
</port>
|
128 |
</output>
|
129 |
</layer>
|
130 |
+
<layer id="8" name="RegexNormalization_32773" type="RegexNormalization" version="extension">
|
131 |
<data global_replace="true" />
|
132 |
<input>
|
133 |
<port id="0" precision="I32">
|
|
|
158 |
</port>
|
159 |
</output>
|
160 |
</layer>
|
161 |
+
<layer id="9" name="StringTensorPack_32774" type="StringTensorPack" version="extension">
|
162 |
<data mode="begins_ends" />
|
163 |
<input>
|
164 |
<port id="0" precision="I32">
|
|
|
177 |
</port>
|
178 |
</output>
|
179 |
</layer>
|
180 |
+
<layer id="10" name="Result_32775" type="Result" version="opset1">
|
181 |
<input>
|
182 |
<port id="0" precision="STRING">
|
183 |
<dim>-1</dim>
|
|
|
207 |
<edge from-layer="9" from-port="3" to-layer="10" to-port="0" />
|
208 |
</edges>
|
209 |
<rt_info>
|
210 |
+
<add_attention_mask value="True" />
|
211 |
+
<add_prefix_space />
|
212 |
+
<add_special_tokens value="True" />
|
213 |
<bos_token_id value="50257" />
|
214 |
+
<clean_up_tokenization_spaces />
|
215 |
+
<detokenizer_input_type value="i64" />
|
216 |
<eos_token_id value="50257" />
|
217 |
+
<handle_special_tokens_with_re />
|
218 |
+
<number_of_inputs value="1" />
|
219 |
+
<openvino_tokenizers_version value="2024.5.0.0" />
|
220 |
+
<openvino_version value="2024.5.0" />
|
221 |
<original_tokenizer_class value="<class 'transformers.models.whisper.tokenization_whisper_fast.WhisperTokenizerFast'>" />
|
222 |
<pad_token_id value="50257" />
|
223 |
+
<sentencepiece_version value="0.2.0" />
|
224 |
+
<skip_special_tokens value="True" />
|
225 |
+
<streaming_detokenizer value="False" />
|
226 |
+
<tiktoken_version value="0.8.0" />
|
227 |
+
<tokenizer_output_type value="i64" />
|
228 |
+
<tokenizers_version value="0.20.3" />
|
229 |
+
<transformers_version value="4.46.3" />
|
230 |
+
<use_max_padding value="False" />
|
231 |
+
<use_sentencepiece_backend value="False" />
|
232 |
+
<utf8_replace_mode />
|
233 |
+
<with_detokenizer value="True" />
|
234 |
</rt_info>
|
235 |
</net>
|
openvino_encoder_model.xml
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
openvino_tokenizer.xml
CHANGED
@@ -1,27 +1,27 @@
|
|
1 |
<?xml version="1.0"?>
|
2 |
<net name="tokenizer" version="11">
|
3 |
<layers>
|
4 |
-
<layer id="0" name="
|
5 |
<data shape="?" element_type="string" />
|
6 |
<output>
|
7 |
-
<port id="0" precision="STRING" names="
|
8 |
<dim>-1</dim>
|
9 |
</port>
|
10 |
</output>
|
11 |
</layer>
|
12 |
-
<layer id="1" name="
|
13 |
<data element_type="i32" shape="" offset="0" size="4" />
|
14 |
<output>
|
15 |
<port id="0" precision="I32" />
|
16 |
</output>
|
17 |
</layer>
|
18 |
-
<layer id="2" name="
|
19 |
<data element_type="i32" shape="" offset="4" size="4" />
|
20 |
<output>
|
21 |
<port id="0" precision="I32" />
|
22 |
</output>
|
23 |
</layer>
|
24 |
-
<layer id="3" name="
|
25 |
<data element_type="i32" shape="1" offset="8" size="4" />
|
26 |
<output>
|
27 |
<port id="0" precision="I32">
|
@@ -29,19 +29,19 @@
|
|
29 |
</port>
|
30 |
</output>
|
31 |
</layer>
|
32 |
-
<layer id="4" name="
|
33 |
<data element_type="i32" shape="" offset="0" size="4" />
|
34 |
<output>
|
35 |
<port id="0" precision="I32" />
|
36 |
</output>
|
37 |
</layer>
|
38 |
-
<layer id="5" name="
|
39 |
<data element_type="i32" shape="" offset="4" size="4" />
|
40 |
<output>
|
41 |
<port id="0" precision="I32" />
|
42 |
</output>
|
43 |
</layer>
|
44 |
-
<layer id="6" name="
|
45 |
<data element_type="i32" shape="1" offset="12" size="4" />
|
46 |
<output>
|
47 |
<port id="0" precision="I32">
|
@@ -49,19 +49,19 @@
|
|
49 |
</port>
|
50 |
</output>
|
51 |
</layer>
|
52 |
-
<layer id="7" name="
|
53 |
<data element_type="i32" shape="" offset="0" size="4" />
|
54 |
<output>
|
55 |
<port id="0" precision="I32" />
|
56 |
</output>
|
57 |
</layer>
|
58 |
-
<layer id="8" name="
|
59 |
<data element_type="i32" shape="" offset="4" size="4" />
|
60 |
<output>
|
61 |
<port id="0" precision="I32" />
|
62 |
</output>
|
63 |
</layer>
|
64 |
-
<layer id="9" name="
|
65 |
<data element_type="i32" shape="1" offset="16" size="4" />
|
66 |
<output>
|
67 |
<port id="0" precision="I32">
|
@@ -69,19 +69,19 @@
|
|
69 |
</port>
|
70 |
</output>
|
71 |
</layer>
|
72 |
-
<layer id="10" name="
|
73 |
<data element_type="i32" shape="" offset="0" size="4" />
|
74 |
<output>
|
75 |
<port id="0" precision="I32" />
|
76 |
</output>
|
77 |
</layer>
|
78 |
-
<layer id="11" name="
|
79 |
<data element_type="i32" shape="" offset="4" size="4" />
|
80 |
<output>
|
81 |
<port id="0" precision="I32" />
|
82 |
</output>
|
83 |
</layer>
|
84 |
-
<layer id="12" name="
|
85 |
<data element_type="i32" shape="1" offset="20" size="4" />
|
86 |
<output>
|
87 |
<port id="0" precision="I32">
|
@@ -89,13 +89,13 @@
|
|
89 |
</port>
|
90 |
</output>
|
91 |
</layer>
|
92 |
-
<layer id="13" name="
|
93 |
<data element_type="i64" shape="" offset="24" size="8" />
|
94 |
<output>
|
95 |
<port id="0" precision="I64" />
|
96 |
</output>
|
97 |
</layer>
|
98 |
-
<layer id="14" name="
|
99 |
<data mode="begins_ends" />
|
100 |
<input>
|
101 |
<port id="0" precision="STRING">
|
@@ -114,7 +114,7 @@
|
|
114 |
</port>
|
115 |
</output>
|
116 |
</layer>
|
117 |
-
<layer id="15" name="
|
118 |
<data output_type="i64" />
|
119 |
<input>
|
120 |
<port id="0" precision="I32">
|
@@ -127,19 +127,19 @@
|
|
127 |
</port>
|
128 |
</output>
|
129 |
</layer>
|
130 |
-
<layer id="16" name="
|
131 |
<data element_type="i64" shape="" offset="24" size="8" />
|
132 |
<output>
|
133 |
<port id="0" precision="I64" />
|
134 |
</output>
|
135 |
</layer>
|
136 |
-
<layer id="17" name="
|
137 |
<data element_type="i64" shape="" offset="24" size="8" />
|
138 |
<output>
|
139 |
<port id="0" precision="I64" />
|
140 |
</output>
|
141 |
</layer>
|
142 |
-
<layer id="18" name="
|
143 |
<data batch_dims="0" />
|
144 |
<input>
|
145 |
<port id="0" precision="I64">
|
@@ -152,13 +152,13 @@
|
|
152 |
<port id="3" precision="I64" />
|
153 |
</output>
|
154 |
</layer>
|
155 |
-
<layer id="19" name="
|
156 |
<data element_type="i64" shape="" offset="32" size="8" />
|
157 |
<output>
|
158 |
<port id="0" precision="I64" />
|
159 |
</output>
|
160 |
</layer>
|
161 |
-
<layer id="20" name="
|
162 |
<data output_type="i32" />
|
163 |
<input>
|
164 |
<port id="0" precision="I64" />
|
@@ -171,19 +171,19 @@
|
|
171 |
</port>
|
172 |
</output>
|
173 |
</layer>
|
174 |
-
<layer id="21" name="
|
175 |
<data element_type="i64" shape="" offset="32" size="8" />
|
176 |
<output>
|
177 |
<port id="0" precision="I64" />
|
178 |
</output>
|
179 |
</layer>
|
180 |
-
<layer id="22" name="
|
181 |
<data element_type="i64" shape="" offset="32" size="8" />
|
182 |
<output>
|
183 |
<port id="0" precision="I64" />
|
184 |
</output>
|
185 |
</layer>
|
186 |
-
<layer id="23" name="
|
187 |
<data auto_broadcast="numpy" />
|
188 |
<input>
|
189 |
<port id="0" precision="I64" />
|
@@ -193,13 +193,13 @@
|
|
193 |
<port id="2" precision="I64" />
|
194 |
</output>
|
195 |
</layer>
|
196 |
-
<layer id="24" name="
|
197 |
<data element_type="i64" shape="" offset="32" size="8" />
|
198 |
<output>
|
199 |
<port id="0" precision="I64" />
|
200 |
</output>
|
201 |
</layer>
|
202 |
-
<layer id="25" name="
|
203 |
<data output_type="i32" />
|
204 |
<input>
|
205 |
<port id="0" precision="I64" />
|
@@ -212,7 +212,7 @@
|
|
212 |
</port>
|
213 |
</output>
|
214 |
</layer>
|
215 |
-
<layer id="26" name="
|
216 |
<data element_type="u8" shape="26479" offset="40" size="26479" />
|
217 |
<output>
|
218 |
<port id="0" precision="U8">
|
@@ -220,7 +220,7 @@
|
|
220 |
</port>
|
221 |
</output>
|
222 |
</layer>
|
223 |
-
<layer id="27" name="
|
224 |
<input>
|
225 |
<port id="0" precision="I32">
|
226 |
<dim>-1</dim>
|
@@ -262,7 +262,7 @@
|
|
262 |
</port>
|
263 |
</output>
|
264 |
</layer>
|
265 |
-
<layer id="28" name="
|
266 |
<data element_type="u8" shape="64" offset="26519" size="64" />
|
267 |
<output>
|
268 |
<port id="0" precision="U8">
|
@@ -270,7 +270,7 @@
|
|
270 |
</port>
|
271 |
</output>
|
272 |
</layer>
|
273 |
-
<layer id="29" name="
|
274 |
<data behaviour="isolate" invert="false" max_splits="-1" />
|
275 |
<input>
|
276 |
<port id="0" precision="I32">
|
@@ -316,7 +316,7 @@
|
|
316 |
</port>
|
317 |
</output>
|
318 |
</layer>
|
319 |
-
<layer id="30" name="
|
320 |
<data element_type="u8" shape="528248" offset="26583" size="528248" />
|
321 |
<output>
|
322 |
<port id="0" precision="U8">
|
@@ -324,7 +324,7 @@
|
|
324 |
</port>
|
325 |
</output>
|
326 |
</layer>
|
327 |
-
<layer id="31" name="
|
328 |
<data mode="begins_ends" />
|
329 |
<input>
|
330 |
<port id="0" precision="U8">
|
@@ -343,7 +343,7 @@
|
|
343 |
</port>
|
344 |
</output>
|
345 |
</layer>
|
346 |
-
<layer id="32" name="
|
347 |
<data element_type="u8" shape="369953" offset="554831" size="369953" />
|
348 |
<output>
|
349 |
<port id="0" precision="U8">
|
@@ -351,7 +351,7 @@
|
|
351 |
</port>
|
352 |
</output>
|
353 |
</layer>
|
354 |
-
<layer id="33" name="
|
355 |
<data mode="begins_ends" />
|
356 |
<input>
|
357 |
<port id="0" precision="U8">
|
@@ -370,7 +370,7 @@
|
|
370 |
</port>
|
371 |
</output>
|
372 |
</layer>
|
373 |
-
<layer id="34" name="
|
374 |
<data element_type="u8" shape="336854" offset="924784" size="336854" />
|
375 |
<output>
|
376 |
<port id="0" precision="U8">
|
@@ -378,7 +378,7 @@
|
|
378 |
</port>
|
379 |
</output>
|
380 |
</layer>
|
381 |
-
<layer id="35" name="
|
382 |
<data mode="begins_ends" />
|
383 |
<input>
|
384 |
<port id="0" precision="U8">
|
@@ -397,7 +397,7 @@
|
|
397 |
</port>
|
398 |
</output>
|
399 |
</layer>
|
400 |
-
<layer id="36" name="
|
401 |
<data element_type="u8" shape="20163" offset="1261638" size="20163" />
|
402 |
<output>
|
403 |
<port id="0" precision="U8">
|
@@ -405,7 +405,7 @@
|
|
405 |
</port>
|
406 |
</output>
|
407 |
</layer>
|
408 |
-
<layer id="37" name="
|
409 |
<data mode="begins_ends" />
|
410 |
<input>
|
411 |
<port id="0" precision="U8">
|
@@ -424,7 +424,7 @@
|
|
424 |
</port>
|
425 |
</output>
|
426 |
</layer>
|
427 |
-
<layer id="38" name="
|
428 |
<data element_type="i32" shape="1608" offset="1281801" size="6432" />
|
429 |
<output>
|
430 |
<port id="0" precision="I32">
|
@@ -432,7 +432,7 @@
|
|
432 |
</port>
|
433 |
</output>
|
434 |
</layer>
|
435 |
-
<layer id="39" name="
|
436 |
<data unk_token="" fuse_unk="false" suffix_indicator="" end_suffix="" byte_fallback="false" cache_capacity="20000" />
|
437 |
<input>
|
438 |
<port id="0" precision="I32">
|
@@ -502,7 +502,7 @@
|
|
502 |
</port>
|
503 |
</output>
|
504 |
</layer>
|
505 |
-
<layer id="40" name="
|
506 |
<data auto_broadcast="numpy" />
|
507 |
<input>
|
508 |
<port id="0" precision="I32">
|
@@ -518,13 +518,13 @@
|
|
518 |
</port>
|
519 |
</output>
|
520 |
</layer>
|
521 |
-
<layer id="41" name="
|
522 |
<data element_type="i32" shape="" offset="1288233" size="4" />
|
523 |
<output>
|
524 |
<port id="0" precision="I32" />
|
525 |
</output>
|
526 |
</layer>
|
527 |
-
<layer id="42" name="
|
528 |
<data auto_broadcast="numpy" />
|
529 |
<input>
|
530 |
<port id="0" precision="I32">
|
@@ -538,7 +538,7 @@
|
|
538 |
</port>
|
539 |
</output>
|
540 |
</layer>
|
541 |
-
<layer id="43" name="
|
542 |
<data auto_broadcast="numpy" />
|
543 |
<input>
|
544 |
<port id="0" precision="I32">
|
@@ -554,19 +554,19 @@
|
|
554 |
</port>
|
555 |
</output>
|
556 |
</layer>
|
557 |
-
<layer id="44" name="
|
558 |
<data element_type="i32" shape="" offset="0" size="4" />
|
559 |
<output>
|
560 |
<port id="0" precision="I32" />
|
561 |
</output>
|
562 |
</layer>
|
563 |
-
<layer id="45" name="
|
564 |
<data element_type="i32" shape="" offset="4" size="4" />
|
565 |
<output>
|
566 |
<port id="0" precision="I32" />
|
567 |
</output>
|
568 |
</layer>
|
569 |
-
<layer id="46" name="
|
570 |
<data element_type="i32" shape="1" offset="1288237" size="4" />
|
571 |
<output>
|
572 |
<port id="0" precision="I32">
|
@@ -574,7 +574,7 @@
|
|
574 |
</port>
|
575 |
</output>
|
576 |
</layer>
|
577 |
-
<layer id="47" name="
|
578 |
<data element_type="i32" shape="6" offset="1288241" size="24" />
|
579 |
<output>
|
580 |
<port id="0" precision="I32">
|
@@ -582,7 +582,7 @@
|
|
582 |
</port>
|
583 |
</output>
|
584 |
</layer>
|
585 |
-
<layer id="48" name="
|
586 |
<input>
|
587 |
<port id="0" precision="I32" />
|
588 |
<port id="1" precision="I32" />
|
@@ -643,7 +643,7 @@
|
|
643 |
</port>
|
644 |
</output>
|
645 |
</layer>
|
646 |
-
<layer id="49" name="
|
647 |
<data auto_broadcast="numpy" />
|
648 |
<input>
|
649 |
<port id="0" precision="I32">
|
@@ -659,13 +659,13 @@
|
|
659 |
</port>
|
660 |
</output>
|
661 |
</layer>
|
662 |
-
<layer id="50" name="
|
663 |
<data element_type="i32" shape="" offset="0" size="4" />
|
664 |
<output>
|
665 |
<port id="0" precision="I32" />
|
666 |
</output>
|
667 |
</layer>
|
668 |
-
<layer id="51" name="
|
669 |
<data keep_dims="false" />
|
670 |
<input>
|
671 |
<port id="0" precision="I32">
|
@@ -677,13 +677,13 @@
|
|
677 |
<port id="2" precision="I32" />
|
678 |
</output>
|
679 |
</layer>
|
680 |
-
<layer id="52" name="
|
681 |
<data element_type="i32" shape="" offset="1288237" size="4" />
|
682 |
<output>
|
683 |
<port id="0" precision="I32" />
|
684 |
</output>
|
685 |
</layer>
|
686 |
-
<layer id="53" name="
|
687 |
<data pad_right="true" />
|
688 |
<input>
|
689 |
<port id="0" precision="I32">
|
@@ -709,7 +709,7 @@
|
|
709 |
</port>
|
710 |
</output>
|
711 |
</layer>
|
712 |
-
<layer id="54" name="
|
713 |
<data destination_type="i32" />
|
714 |
<input>
|
715 |
<port id="0" precision="BOOL">
|
@@ -724,7 +724,7 @@
|
|
724 |
</port>
|
725 |
</output>
|
726 |
</layer>
|
727 |
-
<layer id="55" name="
|
728 |
<data destination_type="i64" />
|
729 |
<input>
|
730 |
<port id="0" precision="I32">
|
@@ -739,7 +739,7 @@
|
|
739 |
</port>
|
740 |
</output>
|
741 |
</layer>
|
742 |
-
<layer id="57" name="
|
743 |
<data destination_type="i64" />
|
744 |
<input>
|
745 |
<port id="0" precision="I32">
|
@@ -754,7 +754,7 @@
|
|
754 |
</port>
|
755 |
</output>
|
756 |
</layer>
|
757 |
-
<layer id="58" name="
|
758 |
<input>
|
759 |
<port id="0" precision="I64">
|
760 |
<dim>-1</dim>
|
@@ -762,7 +762,7 @@
|
|
762 |
</port>
|
763 |
</input>
|
764 |
</layer>
|
765 |
-
<layer id="56" name="
|
766 |
<input>
|
767 |
<port id="0" precision="I64">
|
768 |
<dim>-1</dim>
|
@@ -861,9 +861,29 @@
|
|
861 |
<edge from-layer="57" from-port="1" to-layer="58" to-port="0" />
|
862 |
</edges>
|
863 |
<rt_info>
|
|
|
|
|
|
|
864 |
<bos_token_id value="50257" />
|
|
|
|
|
865 |
<eos_token_id value="50257" />
|
|
|
|
|
|
|
|
|
866 |
<original_tokenizer_class value="<class 'transformers.models.whisper.tokenization_whisper_fast.WhisperTokenizerFast'>" />
|
867 |
<pad_token_id value="50257" />
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
868 |
</rt_info>
|
869 |
</net>
|
|
|
1 |
<?xml version="1.0"?>
|
2 |
<net name="tokenizer" version="11">
|
3 |
<layers>
|
4 |
+
<layer id="0" name="Parameter_32640" type="Parameter" version="opset1">
|
5 |
<data shape="?" element_type="string" />
|
6 |
<output>
|
7 |
+
<port id="0" precision="STRING" names="Parameter_32640">
|
8 |
<dim>-1</dim>
|
9 |
</port>
|
10 |
</output>
|
11 |
</layer>
|
12 |
+
<layer id="1" name="Constant_32738" type="Const" version="opset1">
|
13 |
<data element_type="i32" shape="" offset="0" size="4" />
|
14 |
<output>
|
15 |
<port id="0" precision="I32" />
|
16 |
</output>
|
17 |
</layer>
|
18 |
+
<layer id="2" name="Constant_32739" type="Const" version="opset1">
|
19 |
<data element_type="i32" shape="" offset="4" size="4" />
|
20 |
<output>
|
21 |
<port id="0" precision="I32" />
|
22 |
</output>
|
23 |
</layer>
|
24 |
+
<layer id="3" name="Constant_32740" type="Const" version="opset1">
|
25 |
<data element_type="i32" shape="1" offset="8" size="4" />
|
26 |
<output>
|
27 |
<port id="0" precision="I32">
|
|
|
29 |
</port>
|
30 |
</output>
|
31 |
</layer>
|
32 |
+
<layer id="4" name="Constant_32741" type="Const" version="opset1">
|
33 |
<data element_type="i32" shape="" offset="0" size="4" />
|
34 |
<output>
|
35 |
<port id="0" precision="I32" />
|
36 |
</output>
|
37 |
</layer>
|
38 |
+
<layer id="5" name="Constant_32742" type="Const" version="opset1">
|
39 |
<data element_type="i32" shape="" offset="4" size="4" />
|
40 |
<output>
|
41 |
<port id="0" precision="I32" />
|
42 |
</output>
|
43 |
</layer>
|
44 |
+
<layer id="6" name="Constant_32743" type="Const" version="opset1">
|
45 |
<data element_type="i32" shape="1" offset="12" size="4" />
|
46 |
<output>
|
47 |
<port id="0" precision="I32">
|
|
|
49 |
</port>
|
50 |
</output>
|
51 |
</layer>
|
52 |
+
<layer id="7" name="Constant_32744" type="Const" version="opset1">
|
53 |
<data element_type="i32" shape="" offset="0" size="4" />
|
54 |
<output>
|
55 |
<port id="0" precision="I32" />
|
56 |
</output>
|
57 |
</layer>
|
58 |
+
<layer id="8" name="Constant_32745" type="Const" version="opset1">
|
59 |
<data element_type="i32" shape="" offset="4" size="4" />
|
60 |
<output>
|
61 |
<port id="0" precision="I32" />
|
62 |
</output>
|
63 |
</layer>
|
64 |
+
<layer id="9" name="Constant_32746" type="Const" version="opset1">
|
65 |
<data element_type="i32" shape="1" offset="16" size="4" />
|
66 |
<output>
|
67 |
<port id="0" precision="I32">
|
|
|
69 |
</port>
|
70 |
</output>
|
71 |
</layer>
|
72 |
+
<layer id="10" name="Constant_32747" type="Const" version="opset1">
|
73 |
<data element_type="i32" shape="" offset="0" size="4" />
|
74 |
<output>
|
75 |
<port id="0" precision="I32" />
|
76 |
</output>
|
77 |
</layer>
|
78 |
+
<layer id="11" name="Constant_32748" type="Const" version="opset1">
|
79 |
<data element_type="i32" shape="" offset="4" size="4" />
|
80 |
<output>
|
81 |
<port id="0" precision="I32" />
|
82 |
</output>
|
83 |
</layer>
|
84 |
+
<layer id="12" name="Constant_32749" type="Const" version="opset1">
|
85 |
<data element_type="i32" shape="1" offset="20" size="4" />
|
86 |
<output>
|
87 |
<port id="0" precision="I32">
|
|
|
89 |
</port>
|
90 |
</output>
|
91 |
</layer>
|
92 |
+
<layer id="13" name="Constant_32646" type="Const" version="opset1">
|
93 |
<data element_type="i64" shape="" offset="24" size="8" />
|
94 |
<output>
|
95 |
<port id="0" precision="I64" />
|
96 |
</output>
|
97 |
</layer>
|
98 |
+
<layer id="14" name="StringTensorUnpack_32641" type="StringTensorUnpack" version="extension">
|
99 |
<data mode="begins_ends" />
|
100 |
<input>
|
101 |
<port id="0" precision="STRING">
|
|
|
114 |
</port>
|
115 |
</output>
|
116 |
</layer>
|
117 |
+
<layer id="15" name="ShapeOf_32642" type="ShapeOf" version="opset3">
|
118 |
<data output_type="i64" />
|
119 |
<input>
|
120 |
<port id="0" precision="I32">
|
|
|
127 |
</port>
|
128 |
</output>
|
129 |
</layer>
|
130 |
+
<layer id="16" name="Constant_32643" type="Const" version="opset1">
|
131 |
<data element_type="i64" shape="" offset="24" size="8" />
|
132 |
<output>
|
133 |
<port id="0" precision="I64" />
|
134 |
</output>
|
135 |
</layer>
|
136 |
+
<layer id="17" name="Constant_32644" type="Const" version="opset1">
|
137 |
<data element_type="i64" shape="" offset="24" size="8" />
|
138 |
<output>
|
139 |
<port id="0" precision="I64" />
|
140 |
</output>
|
141 |
</layer>
|
142 |
+
<layer id="18" name="Gather_32645" type="Gather" version="opset8">
|
143 |
<data batch_dims="0" />
|
144 |
<input>
|
145 |
<port id="0" precision="I64">
|
|
|
152 |
<port id="3" precision="I64" />
|
153 |
</output>
|
154 |
</layer>
|
155 |
+
<layer id="19" name="Constant_32647" type="Const" version="opset1">
|
156 |
<data element_type="i64" shape="" offset="32" size="8" />
|
157 |
<output>
|
158 |
<port id="0" precision="I64" />
|
159 |
</output>
|
160 |
</layer>
|
161 |
+
<layer id="20" name="Range_32648" type="Range" version="opset4">
|
162 |
<data output_type="i32" />
|
163 |
<input>
|
164 |
<port id="0" precision="I64" />
|
|
|
171 |
</port>
|
172 |
</output>
|
173 |
</layer>
|
174 |
+
<layer id="21" name="Constant_32649" type="Const" version="opset1">
|
175 |
<data element_type="i64" shape="" offset="32" size="8" />
|
176 |
<output>
|
177 |
<port id="0" precision="I64" />
|
178 |
</output>
|
179 |
</layer>
|
180 |
+
<layer id="22" name="Constant_32650" type="Const" version="opset1">
|
181 |
<data element_type="i64" shape="" offset="32" size="8" />
|
182 |
<output>
|
183 |
<port id="0" precision="I64" />
|
184 |
</output>
|
185 |
</layer>
|
186 |
+
<layer id="23" name="Add_32651" type="Add" version="opset1">
|
187 |
<data auto_broadcast="numpy" />
|
188 |
<input>
|
189 |
<port id="0" precision="I64" />
|
|
|
193 |
<port id="2" precision="I64" />
|
194 |
</output>
|
195 |
</layer>
|
196 |
+
<layer id="24" name="Constant_32652" type="Const" version="opset1">
|
197 |
<data element_type="i64" shape="" offset="32" size="8" />
|
198 |
<output>
|
199 |
<port id="0" precision="I64" />
|
200 |
</output>
|
201 |
</layer>
|
202 |
+
<layer id="25" name="Range_32653" type="Range" version="opset4">
|
203 |
<data output_type="i32" />
|
204 |
<input>
|
205 |
<port id="0" precision="I64" />
|
|
|
212 |
</port>
|
213 |
</output>
|
214 |
</layer>
|
215 |
+
<layer id="26" name="Constant_32715" type="Const" version="opset1">
|
216 |
<data element_type="u8" shape="26479" offset="40" size="26479" />
|
217 |
<output>
|
218 |
<port id="0" precision="U8">
|
|
|
220 |
</port>
|
221 |
</output>
|
222 |
</layer>
|
223 |
+
<layer id="27" name="SpecialTokensSplit_32716" type="SpecialTokensSplit" version="extension">
|
224 |
<input>
|
225 |
<port id="0" precision="I32">
|
226 |
<dim>-1</dim>
|
|
|
262 |
</port>
|
263 |
</output>
|
264 |
</layer>
|
265 |
+
<layer id="28" name="Constant_32718" type="Const" version="opset1">
|
266 |
<data element_type="u8" shape="64" offset="26519" size="64" />
|
267 |
<output>
|
268 |
<port id="0" precision="U8">
|
|
|
270 |
</port>
|
271 |
</output>
|
272 |
</layer>
|
273 |
+
<layer id="29" name="RegexSplit_32719" type="RegexSplit" version="extension">
|
274 |
<data behaviour="isolate" invert="false" max_splits="-1" />
|
275 |
<input>
|
276 |
<port id="0" precision="I32">
|
|
|
316 |
</port>
|
317 |
</output>
|
318 |
</layer>
|
319 |
+
<layer id="30" name="Constant_32721" type="Const" version="opset1">
|
320 |
<data element_type="u8" shape="528248" offset="26583" size="528248" />
|
321 |
<output>
|
322 |
<port id="0" precision="U8">
|
|
|
324 |
</port>
|
325 |
</output>
|
326 |
</layer>
|
327 |
+
<layer id="31" name="StringTensorUnpack_32722" type="StringTensorUnpack" version="extension">
|
328 |
<data mode="begins_ends" />
|
329 |
<input>
|
330 |
<port id="0" precision="U8">
|
|
|
343 |
</port>
|
344 |
</output>
|
345 |
</layer>
|
346 |
+
<layer id="32" name="Constant_32727" type="Const" version="opset1">
|
347 |
<data element_type="u8" shape="369953" offset="554831" size="369953" />
|
348 |
<output>
|
349 |
<port id="0" precision="U8">
|
|
|
351 |
</port>
|
352 |
</output>
|
353 |
</layer>
|
354 |
+
<layer id="33" name="StringTensorUnpack_32728" type="StringTensorUnpack" version="extension">
|
355 |
<data mode="begins_ends" />
|
356 |
<input>
|
357 |
<port id="0" precision="U8">
|
|
|
370 |
</port>
|
371 |
</output>
|
372 |
</layer>
|
373 |
+
<layer id="34" name="Constant_32730" type="Const" version="opset1">
|
374 |
<data element_type="u8" shape="336854" offset="924784" size="336854" />
|
375 |
<output>
|
376 |
<port id="0" precision="U8">
|
|
|
378 |
</port>
|
379 |
</output>
|
380 |
</layer>
|
381 |
+
<layer id="35" name="StringTensorUnpack_32731" type="StringTensorUnpack" version="extension">
|
382 |
<data mode="begins_ends" />
|
383 |
<input>
|
384 |
<port id="0" precision="U8">
|
|
|
397 |
</port>
|
398 |
</output>
|
399 |
</layer>
|
400 |
+
<layer id="36" name="Constant_32724" type="Const" version="opset1">
|
401 |
<data element_type="u8" shape="20163" offset="1261638" size="20163" />
|
402 |
<output>
|
403 |
<port id="0" precision="U8">
|
|
|
405 |
</port>
|
406 |
</output>
|
407 |
</layer>
|
408 |
+
<layer id="37" name="StringTensorUnpack_32725" type="StringTensorUnpack" version="extension">
|
409 |
<data mode="begins_ends" />
|
410 |
<input>
|
411 |
<port id="0" precision="U8">
|
|
|
424 |
</port>
|
425 |
</output>
|
426 |
</layer>
|
427 |
+
<layer id="38" name="Constant_32732" type="Const" version="opset1">
|
428 |
<data element_type="i32" shape="1608" offset="1281801" size="6432" />
|
429 |
<output>
|
430 |
<port id="0" precision="I32">
|
|
|
432 |
</port>
|
433 |
</output>
|
434 |
</layer>
|
435 |
+
<layer id="39" name="BPETokenizer_32733" type="BPETokenizer" version="extension">
|
436 |
<data unk_token="" fuse_unk="false" suffix_indicator="" end_suffix="" byte_fallback="false" cache_capacity="20000" />
|
437 |
<input>
|
438 |
<port id="0" precision="I32">
|
|
|
502 |
</port>
|
503 |
</output>
|
504 |
</layer>
|
505 |
+
<layer id="40" name="Subtract_32734" type="Subtract" version="opset1">
|
506 |
<data auto_broadcast="numpy" />
|
507 |
<input>
|
508 |
<port id="0" precision="I32">
|
|
|
518 |
</port>
|
519 |
</output>
|
520 |
</layer>
|
521 |
+
<layer id="41" name="Constant_32735" type="Const" version="opset1">
|
522 |
<data element_type="i32" shape="" offset="1288233" size="4" />
|
523 |
<output>
|
524 |
<port id="0" precision="I32" />
|
525 |
</output>
|
526 |
</layer>
|
527 |
+
<layer id="42" name="Minimum_32736" type="Minimum" version="opset1">
|
528 |
<data auto_broadcast="numpy" />
|
529 |
<input>
|
530 |
<port id="0" precision="I32">
|
|
|
538 |
</port>
|
539 |
</output>
|
540 |
</layer>
|
541 |
+
<layer id="43" name="Add_32737" type="Add" version="opset1">
|
542 |
<data auto_broadcast="numpy" />
|
543 |
<input>
|
544 |
<port id="0" precision="I32">
|
|
|
554 |
</port>
|
555 |
</output>
|
556 |
</layer>
|
557 |
+
<layer id="44" name="Constant_32750" type="Const" version="opset1">
|
558 |
<data element_type="i32" shape="" offset="0" size="4" />
|
559 |
<output>
|
560 |
<port id="0" precision="I32" />
|
561 |
</output>
|
562 |
</layer>
|
563 |
+
<layer id="45" name="Constant_32751" type="Const" version="opset1">
|
564 |
<data element_type="i32" shape="" offset="4" size="4" />
|
565 |
<output>
|
566 |
<port id="0" precision="I32" />
|
567 |
</output>
|
568 |
</layer>
|
569 |
+
<layer id="46" name="Constant_32752" type="Const" version="opset1">
|
570 |
<data element_type="i32" shape="1" offset="1288237" size="4" />
|
571 |
<output>
|
572 |
<port id="0" precision="I32">
|
|
|
574 |
</port>
|
575 |
</output>
|
576 |
</layer>
|
577 |
+
<layer id="47" name="Constant_32753" type="Const" version="opset1">
|
578 |
<data element_type="i32" shape="6" offset="1288241" size="24" />
|
579 |
<output>
|
580 |
<port id="0" precision="I32">
|
|
|
582 |
</port>
|
583 |
</output>
|
584 |
</layer>
|
585 |
+
<layer id="48" name="CombineSegments_32754" type="CombineSegments" version="extension">
|
586 |
<input>
|
587 |
<port id="0" precision="I32" />
|
588 |
<port id="1" precision="I32" />
|
|
|
643 |
</port>
|
644 |
</output>
|
645 |
</layer>
|
646 |
+
<layer id="49" name="Subtract_32755" type="Subtract" version="opset1">
|
647 |
<data auto_broadcast="numpy" />
|
648 |
<input>
|
649 |
<port id="0" precision="I32">
|
|
|
659 |
</port>
|
660 |
</output>
|
661 |
</layer>
|
662 |
+
<layer id="50" name="Constant_32756" type="Const" version="opset1">
|
663 |
<data element_type="i32" shape="" offset="0" size="4" />
|
664 |
<output>
|
665 |
<port id="0" precision="I32" />
|
666 |
</output>
|
667 |
</layer>
|
668 |
+
<layer id="51" name="ReduceMax_32757" type="ReduceMax" version="opset1">
|
669 |
<data keep_dims="false" />
|
670 |
<input>
|
671 |
<port id="0" precision="I32">
|
|
|
677 |
<port id="2" precision="I32" />
|
678 |
</output>
|
679 |
</layer>
|
680 |
+
<layer id="52" name="Constant_32758" type="Const" version="opset1">
|
681 |
<data element_type="i32" shape="" offset="1288237" size="4" />
|
682 |
<output>
|
683 |
<port id="0" precision="I32" />
|
684 |
</output>
|
685 |
</layer>
|
686 |
+
<layer id="53" name="RaggedToDense_32759" type="RaggedToDense" version="extension">
|
687 |
<data pad_right="true" />
|
688 |
<input>
|
689 |
<port id="0" precision="I32">
|
|
|
709 |
</port>
|
710 |
</output>
|
711 |
</layer>
|
712 |
+
<layer id="54" name="Convert_32760" type="Convert" version="opset1">
|
713 |
<data destination_type="i32" />
|
714 |
<input>
|
715 |
<port id="0" precision="BOOL">
|
|
|
724 |
</port>
|
725 |
</output>
|
726 |
</layer>
|
727 |
+
<layer id="55" name="Convert_32760" type="Convert" version="opset1">
|
728 |
<data destination_type="i64" />
|
729 |
<input>
|
730 |
<port id="0" precision="I32">
|
|
|
739 |
</port>
|
740 |
</output>
|
741 |
</layer>
|
742 |
+
<layer id="57" name="RaggedToDense_32759.0" type="Convert" version="opset1">
|
743 |
<data destination_type="i64" />
|
744 |
<input>
|
745 |
<port id="0" precision="I32">
|
|
|
754 |
</port>
|
755 |
</output>
|
756 |
</layer>
|
757 |
+
<layer id="58" name="Result_32763" type="Result" version="opset1">
|
758 |
<input>
|
759 |
<port id="0" precision="I64">
|
760 |
<dim>-1</dim>
|
|
|
762 |
</port>
|
763 |
</input>
|
764 |
</layer>
|
765 |
+
<layer id="56" name="Result_32765" type="Result" version="opset1">
|
766 |
<input>
|
767 |
<port id="0" precision="I64">
|
768 |
<dim>-1</dim>
|
|
|
861 |
<edge from-layer="57" from-port="1" to-layer="58" to-port="0" />
|
862 |
</edges>
|
863 |
<rt_info>
|
864 |
+
<add_attention_mask value="True" />
|
865 |
+
<add_prefix_space />
|
866 |
+
<add_special_tokens value="True" />
|
867 |
<bos_token_id value="50257" />
|
868 |
+
<clean_up_tokenization_spaces />
|
869 |
+
<detokenizer_input_type value="i64" />
|
870 |
<eos_token_id value="50257" />
|
871 |
+
<handle_special_tokens_with_re />
|
872 |
+
<number_of_inputs value="1" />
|
873 |
+
<openvino_tokenizers_version value="2024.5.0.0" />
|
874 |
+
<openvino_version value="2024.5.0" />
|
875 |
<original_tokenizer_class value="<class 'transformers.models.whisper.tokenization_whisper_fast.WhisperTokenizerFast'>" />
|
876 |
<pad_token_id value="50257" />
|
877 |
+
<sentencepiece_version value="0.2.0" />
|
878 |
+
<skip_special_tokens value="True" />
|
879 |
+
<streaming_detokenizer value="False" />
|
880 |
+
<tiktoken_version value="0.8.0" />
|
881 |
+
<tokenizer_output_type value="i64" />
|
882 |
+
<tokenizers_version value="0.20.3" />
|
883 |
+
<transformers_version value="4.46.3" />
|
884 |
+
<use_max_padding value="False" />
|
885 |
+
<use_sentencepiece_backend value="False" />
|
886 |
+
<utf8_replace_mode />
|
887 |
+
<with_detokenizer value="True" />
|
888 |
</rt_info>
|
889 |
</net>
|