openvino-ci
commited on
Commit
•
43f28c8
1
Parent(s):
566b185
Upload folder using huggingface_hub
Browse files- config.json +2 -1
- generation_config.json +1 -1
- openvino_decoder_model.xml +197 -196
- openvino_detokenizer.bin +1 -1
- openvino_detokenizer.xml +32 -12
- openvino_encoder_model.xml +0 -0
- openvino_tokenizer.xml +74 -54
config.json
CHANGED
@@ -1,4 +1,5 @@
|
|
1 |
{
|
|
|
2 |
"_name_or_path": "distil-whisper/distil-large-v3",
|
3 |
"activation_dropout": 0.0,
|
4 |
"activation_function": "gelu",
|
@@ -39,7 +40,7 @@
|
|
39 |
"num_mel_bins": 128,
|
40 |
"pad_token_id": 50256,
|
41 |
"scale_embedding": false,
|
42 |
-
"transformers_version": "4.
|
43 |
"use_cache": true,
|
44 |
"use_weighted_layer_sum": false,
|
45 |
"vocab_size": 51866
|
|
|
1 |
{
|
2 |
+
"_attn_implementation_autoset": true,
|
3 |
"_name_or_path": "distil-whisper/distil-large-v3",
|
4 |
"activation_dropout": 0.0,
|
5 |
"activation_function": "gelu",
|
|
|
40 |
"num_mel_bins": 128,
|
41 |
"pad_token_id": 50256,
|
42 |
"scale_embedding": false,
|
43 |
+
"transformers_version": "4.46.3",
|
44 |
"use_cache": true,
|
45 |
"use_weighted_layer_sum": false,
|
46 |
"vocab_size": 51866
|
generation_config.json
CHANGED
@@ -303,5 +303,5 @@
|
|
303 |
"transcribe": 50360,
|
304 |
"translate": 50359
|
305 |
},
|
306 |
-
"transformers_version": "4.
|
307 |
}
|
|
|
303 |
"transcribe": 50360,
|
304 |
"translate": 50359
|
305 |
},
|
306 |
+
"transformers_version": "4.46.3"
|
307 |
}
|
openvino_decoder_model.xml
CHANGED
@@ -10,7 +10,7 @@
|
|
10 |
</port>
|
11 |
</output>
|
12 |
</layer>
|
13 |
-
<layer id="0" name="
|
14 |
<data shape="?,?,?" element_type="f32" />
|
15 |
<output>
|
16 |
<port id="0" precision="FP32" names="encoder_hidden_states">
|
@@ -29,7 +29,7 @@
|
|
29 |
</port>
|
30 |
</output>
|
31 |
</layer>
|
32 |
-
<layer id="3" name="
|
33 |
<data destination_type="f16" />
|
34 |
<input>
|
35 |
<port id="0" precision="U8">
|
@@ -53,7 +53,7 @@
|
|
53 |
</port>
|
54 |
</output>
|
55 |
</layer>
|
56 |
-
<layer id="5" name="
|
57 |
<data destination_type="f16" />
|
58 |
<input>
|
59 |
<port id="0" precision="U8">
|
@@ -130,7 +130,7 @@
|
|
130 |
</port>
|
131 |
</output>
|
132 |
</layer>
|
133 |
-
<layer id="10" name="
|
134 |
<data element_type="i64" shape="2" offset="66544078" size="16" />
|
135 |
<output>
|
136 |
<port id="0" precision="I64">
|
@@ -207,7 +207,7 @@
|
|
207 |
</port>
|
208 |
</output>
|
209 |
</layer>
|
210 |
-
<layer id="16" name="
|
211 |
<data destination_type="f16" />
|
212 |
<input>
|
213 |
<port id="0" precision="U8">
|
@@ -231,7 +231,7 @@
|
|
231 |
</port>
|
232 |
</output>
|
233 |
</layer>
|
234 |
-
<layer id="18" name="
|
235 |
<data destination_type="f16" />
|
236 |
<input>
|
237 |
<port id="0" precision="U8">
|
@@ -314,7 +314,7 @@
|
|
314 |
<port id="0" precision="I64" names="23" />
|
315 |
</output>
|
316 |
</layer>
|
317 |
-
<layer id="24" name="
|
318 |
<data output_type="i64" />
|
319 |
<input>
|
320 |
<port id="0" precision="I64">
|
@@ -328,19 +328,19 @@
|
|
328 |
</port>
|
329 |
</output>
|
330 |
</layer>
|
331 |
-
<layer id="25" name="
|
332 |
<data element_type="i64" shape="" offset="67118890" size="8" />
|
333 |
<output>
|
334 |
<port id="0" precision="I64" />
|
335 |
</output>
|
336 |
</layer>
|
337 |
-
<layer id="26" name="
|
338 |
<data element_type="i64" shape="" offset="67118882" size="8" />
|
339 |
<output>
|
340 |
<port id="0" precision="I64" />
|
341 |
</output>
|
342 |
</layer>
|
343 |
-
<layer id="27" name="
|
344 |
<data batch_dims="0" />
|
345 |
<input>
|
346 |
<port id="0" precision="I64">
|
@@ -401,7 +401,7 @@
|
|
401 |
</port>
|
402 |
</output>
|
403 |
</layer>
|
404 |
-
<layer id="32" name="
|
405 |
<data element_type="i32" shape="" offset="66544094" size="4" />
|
406 |
<output>
|
407 |
<port id="0" precision="I32" />
|
@@ -478,7 +478,7 @@
|
|
478 |
</port>
|
479 |
</output>
|
480 |
</layer>
|
481 |
-
<layer id="37" name="
|
482 |
<data element_type="f32" shape="1, 1, 1280" offset="67118906" size="5120" />
|
483 |
<output>
|
484 |
<port id="0" precision="FP32">
|
@@ -510,7 +510,7 @@
|
|
510 |
</port>
|
511 |
</output>
|
512 |
</layer>
|
513 |
-
<layer id="39" name="
|
514 |
<data element_type="f32" shape="1, 1, 1280" offset="67124026" size="5120" />
|
515 |
<output>
|
516 |
<port id="0" precision="FP32">
|
@@ -542,7 +542,7 @@
|
|
542 |
</port>
|
543 |
</output>
|
544 |
</layer>
|
545 |
-
<layer id="41" name="
|
546 |
<data element_type="u4" shape="1280, 10, 128" offset="67129146" size="819200" />
|
547 |
<output>
|
548 |
<port id="0" precision="U4">
|
@@ -552,7 +552,7 @@
|
|
552 |
</port>
|
553 |
</output>
|
554 |
</layer>
|
555 |
-
<layer id="42" name="
|
556 |
<data destination_type="f16" />
|
557 |
<input>
|
558 |
<port id="0" precision="U4">
|
@@ -569,7 +569,7 @@
|
|
569 |
</port>
|
570 |
</output>
|
571 |
</layer>
|
572 |
-
<layer id="43" name="
|
573 |
<data element_type="u4" shape="1280, 10, 1" offset="67948346" size="6400" />
|
574 |
<output>
|
575 |
<port id="0" precision="U4">
|
@@ -579,7 +579,7 @@
|
|
579 |
</port>
|
580 |
</output>
|
581 |
</layer>
|
582 |
-
<layer id="44" name="
|
583 |
<data destination_type="f16" />
|
584 |
<input>
|
585 |
<port id="0" precision="U4">
|
@@ -596,7 +596,7 @@
|
|
596 |
</port>
|
597 |
</output>
|
598 |
</layer>
|
599 |
-
<layer id="45" name="
|
600 |
<data auto_broadcast="numpy" />
|
601 |
<input>
|
602 |
<port id="0" precision="FP16">
|
@@ -618,7 +618,7 @@
|
|
618 |
</port>
|
619 |
</output>
|
620 |
</layer>
|
621 |
-
<layer id="46" name="
|
622 |
<data element_type="f16" shape="1280, 10, 1" offset="67954746" size="25600" />
|
623 |
<output>
|
624 |
<port id="0" precision="FP16">
|
@@ -628,7 +628,7 @@
|
|
628 |
</port>
|
629 |
</output>
|
630 |
</layer>
|
631 |
-
<layer id="47" name="
|
632 |
<data auto_broadcast="numpy" />
|
633 |
<input>
|
634 |
<port id="0" precision="FP16">
|
@@ -650,7 +650,7 @@
|
|
650 |
</port>
|
651 |
</output>
|
652 |
</layer>
|
653 |
-
<layer id="48" name="
|
654 |
<data element_type="i64" shape="2" offset="67980346" size="16" />
|
655 |
<output>
|
656 |
<port id="0" precision="I64">
|
@@ -658,7 +658,7 @@
|
|
658 |
</port>
|
659 |
</output>
|
660 |
</layer>
|
661 |
-
<layer id="49" name="
|
662 |
<data special_zero="false" />
|
663 |
<input>
|
664 |
<port id="0" precision="FP16">
|
@@ -677,7 +677,7 @@
|
|
677 |
</port>
|
678 |
</output>
|
679 |
</layer>
|
680 |
-
<layer id="50" name="
|
681 |
<data destination_type="f32" />
|
682 |
<input>
|
683 |
<port id="0" precision="FP16">
|
@@ -692,7 +692,7 @@
|
|
692 |
</port>
|
693 |
</output>
|
694 |
</layer>
|
695 |
-
<layer id="51" name="
|
696 |
<data transpose_a="false" transpose_b="true" />
|
697 |
<input>
|
698 |
<port id="0" precision="FP32">
|
@@ -713,7 +713,7 @@
|
|
713 |
</port>
|
714 |
</output>
|
715 |
</layer>
|
716 |
-
<layer id="52" name="
|
717 |
<data element_type="f32" shape="1, 1, 1280" offset="67980362" size="5120" />
|
718 |
<output>
|
719 |
<port id="0" precision="FP32">
|
@@ -745,7 +745,7 @@
|
|
745 |
</port>
|
746 |
</output>
|
747 |
</layer>
|
748 |
-
<layer id="54" name="
|
749 |
<data element_type="i64" shape="4" offset="67985482" size="32" />
|
750 |
<output>
|
751 |
<port id="0" precision="I64">
|
@@ -813,7 +813,7 @@
|
|
813 |
</port>
|
814 |
</output>
|
815 |
</layer>
|
816 |
-
<layer id="59" name="
|
817 |
<data destination_type="f16" />
|
818 |
<input>
|
819 |
<port id="0" precision="U4">
|
@@ -840,7 +840,7 @@
|
|
840 |
</port>
|
841 |
</output>
|
842 |
</layer>
|
843 |
-
<layer id="61" name="
|
844 |
<data destination_type="f16" />
|
845 |
<input>
|
846 |
<port id="0" precision="U4">
|
@@ -911,7 +911,7 @@
|
|
911 |
</port>
|
912 |
</output>
|
913 |
</layer>
|
914 |
-
<layer id="65" name="
|
915 |
<data element_type="i64" shape="2" offset="67980346" size="16" />
|
916 |
<output>
|
917 |
<port id="0" precision="I64">
|
@@ -919,7 +919,7 @@
|
|
919 |
</port>
|
920 |
</output>
|
921 |
</layer>
|
922 |
-
<layer id="66" name="
|
923 |
<data special_zero="false" />
|
924 |
<input>
|
925 |
<port id="0" precision="FP16">
|
@@ -974,7 +974,7 @@
|
|
974 |
</port>
|
975 |
</output>
|
976 |
</layer>
|
977 |
-
<layer id="69" name="
|
978 |
<data element_type="i64" shape="4" offset="67985482" size="32" />
|
979 |
<output>
|
980 |
<port id="0" precision="I64">
|
@@ -1063,13 +1063,13 @@
|
|
1063 |
<port id="0" precision="I32" />
|
1064 |
</output>
|
1065 |
</layer>
|
1066 |
-
<layer id="75" name="
|
1067 |
<data element_type="f32" shape="" offset="68836730" size="4" />
|
1068 |
<output>
|
1069 |
-
<port id="0" precision="FP32" />
|
1070 |
</output>
|
1071 |
</layer>
|
1072 |
-
<layer id="76" name="
|
1073 |
<data element_type="i64" shape="1" offset="67118890" size="8" />
|
1074 |
<output>
|
1075 |
<port id="0" precision="I64">
|
@@ -1077,7 +1077,7 @@
|
|
1077 |
</port>
|
1078 |
</output>
|
1079 |
</layer>
|
1080 |
-
<layer id="77" name="
|
1081 |
<data special_zero="false" />
|
1082 |
<input>
|
1083 |
<port id="0" precision="I64" />
|
@@ -1107,13 +1107,13 @@
|
|
1107 |
<port id="2" precision="I64" names="62,64" />
|
1108 |
</output>
|
1109 |
</layer>
|
1110 |
-
<layer id="80" name="
|
1111 |
<data element_type="i32" shape="" offset="66544094" size="4" />
|
1112 |
<output>
|
1113 |
<port id="0" precision="I32" />
|
1114 |
</output>
|
1115 |
</layer>
|
1116 |
-
<layer id="81" name="
|
1117 |
<input>
|
1118 |
<port id="0" precision="I64" />
|
1119 |
<port id="1" precision="I32" />
|
@@ -1155,7 +1155,7 @@
|
|
1155 |
</port>
|
1156 |
</output>
|
1157 |
</layer>
|
1158 |
-
<layer id="84" name="
|
1159 |
<data output_type="i32" />
|
1160 |
<input>
|
1161 |
<port id="0" precision="FP32">
|
@@ -1169,19 +1169,19 @@
|
|
1169 |
</port>
|
1170 |
</output>
|
1171 |
</layer>
|
1172 |
-
<layer id="85" name="
|
1173 |
<data element_type="i64" shape="" offset="67118890" size="8" />
|
1174 |
<output>
|
1175 |
<port id="0" precision="I64" />
|
1176 |
</output>
|
1177 |
</layer>
|
1178 |
-
<layer id="86" name="
|
1179 |
<data element_type="i64" shape="" offset="67118882" size="8" />
|
1180 |
<output>
|
1181 |
<port id="0" precision="I64" />
|
1182 |
</output>
|
1183 |
</layer>
|
1184 |
-
<layer id="87" name="
|
1185 |
<data batch_dims="0" />
|
1186 |
<input>
|
1187 |
<port id="0" precision="I32">
|
@@ -1233,7 +1233,7 @@
|
|
1233 |
<port id="0" precision="I32" />
|
1234 |
</output>
|
1235 |
</layer>
|
1236 |
-
<layer id="92" name="
|
1237 |
<data destination_type="i32" />
|
1238 |
<input>
|
1239 |
<port id="0" precision="I64" />
|
@@ -1375,7 +1375,7 @@
|
|
1375 |
</port>
|
1376 |
</output>
|
1377 |
</layer>
|
1378 |
-
<layer id="104" name="
|
1379 |
<data element_type="i64" shape="2" offset="68836734" size="16" />
|
1380 |
<output>
|
1381 |
<port id="0" precision="I64" names="70">
|
@@ -1492,7 +1492,7 @@
|
|
1492 |
</port>
|
1493 |
</output>
|
1494 |
</layer>
|
1495 |
-
<layer id="112" name="
|
1496 |
<data element_type="i64" shape="1" offset="67118882" size="8" />
|
1497 |
<output>
|
1498 |
<port id="0" precision="I64">
|
@@ -1500,13 +1500,13 @@
|
|
1500 |
</port>
|
1501 |
</output>
|
1502 |
</layer>
|
1503 |
-
<layer id="113" name="
|
1504 |
<data element_type="i64" shape="" offset="67118882" size="8" />
|
1505 |
<output>
|
1506 |
<port id="0" precision="I64" />
|
1507 |
</output>
|
1508 |
</layer>
|
1509 |
-
<layer id="114" name="
|
1510 |
<data batch_dims="0" />
|
1511 |
<input>
|
1512 |
<port id="0" precision="I64">
|
@@ -1523,7 +1523,7 @@
|
|
1523 |
</port>
|
1524 |
</output>
|
1525 |
</layer>
|
1526 |
-
<layer id="115" name="
|
1527 |
<data element_type="i64" shape="1" offset="67118890" size="8" />
|
1528 |
<output>
|
1529 |
<port id="0" precision="I64">
|
@@ -1531,7 +1531,7 @@
|
|
1531 |
</port>
|
1532 |
</output>
|
1533 |
</layer>
|
1534 |
-
<layer id="116" name="
|
1535 |
<data element_type="i64" shape="1" offset="67118890" size="8" />
|
1536 |
<output>
|
1537 |
<port id="0" precision="I64">
|
@@ -1539,7 +1539,7 @@
|
|
1539 |
</port>
|
1540 |
</output>
|
1541 |
</layer>
|
1542 |
-
<layer id="117" name="
|
1543 |
<data element_type="i64" shape="1" offset="67118890" size="8" />
|
1544 |
<output>
|
1545 |
<port id="0" precision="I64">
|
@@ -1591,7 +1591,7 @@
|
|
1591 |
</port>
|
1592 |
</output>
|
1593 |
</layer>
|
1594 |
-
<layer id="120" name="
|
1595 |
<data element_type="i64" shape="1" offset="67118882" size="8" />
|
1596 |
<output>
|
1597 |
<port id="0" precision="I64">
|
@@ -1599,7 +1599,7 @@
|
|
1599 |
</port>
|
1600 |
</output>
|
1601 |
</layer>
|
1602 |
-
<layer id="121" name="
|
1603 |
<data output_type="i64" />
|
1604 |
<input>
|
1605 |
<port id="0" precision="FP32">
|
@@ -1614,7 +1614,7 @@
|
|
1614 |
</port>
|
1615 |
</output>
|
1616 |
</layer>
|
1617 |
-
<layer id="122" name="
|
1618 |
<data element_type="i64" shape="1" offset="67118890" size="8" />
|
1619 |
<output>
|
1620 |
<port id="0" precision="I64">
|
@@ -1622,13 +1622,13 @@
|
|
1622 |
</port>
|
1623 |
</output>
|
1624 |
</layer>
|
1625 |
-
<layer id="123" name="
|
1626 |
<data element_type="i64" shape="" offset="67118882" size="8" />
|
1627 |
<output>
|
1628 |
<port id="0" precision="I64" />
|
1629 |
</output>
|
1630 |
</layer>
|
1631 |
-
<layer id="124" name="
|
1632 |
<data batch_dims="0" />
|
1633 |
<input>
|
1634 |
<port id="0" precision="I64">
|
@@ -1645,7 +1645,7 @@
|
|
1645 |
</port>
|
1646 |
</output>
|
1647 |
</layer>
|
1648 |
-
<layer id="125" name="
|
1649 |
<data element_type="i64" shape="1" offset="67118890" size="8" />
|
1650 |
<output>
|
1651 |
<port id="0" precision="I64">
|
@@ -1745,7 +1745,7 @@
|
|
1745 |
</port>
|
1746 |
</output>
|
1747 |
</layer>
|
1748 |
-
<layer id="131" name="
|
1749 |
<data destination_type="f16" />
|
1750 |
<input>
|
1751 |
<port id="0" precision="U4">
|
@@ -1772,7 +1772,7 @@
|
|
1772 |
</port>
|
1773 |
</output>
|
1774 |
</layer>
|
1775 |
-
<layer id="133" name="
|
1776 |
<data destination_type="f16" />
|
1777 |
<input>
|
1778 |
<port id="0" precision="U4">
|
@@ -1843,7 +1843,7 @@
|
|
1843 |
</port>
|
1844 |
</output>
|
1845 |
</layer>
|
1846 |
-
<layer id="137" name="
|
1847 |
<data element_type="i64" shape="2" offset="67980346" size="16" />
|
1848 |
<output>
|
1849 |
<port id="0" precision="I64">
|
@@ -1851,7 +1851,7 @@
|
|
1851 |
</port>
|
1852 |
</output>
|
1853 |
</layer>
|
1854 |
-
<layer id="138" name="
|
1855 |
<data special_zero="false" />
|
1856 |
<input>
|
1857 |
<port id="0" precision="FP16">
|
@@ -1906,7 +1906,7 @@
|
|
1906 |
</port>
|
1907 |
</output>
|
1908 |
</layer>
|
1909 |
-
<layer id="141" name="
|
1910 |
<data element_type="f32" shape="1, 1, 1280" offset="69687958" size="5120" />
|
1911 |
<output>
|
1912 |
<port id="0" precision="FP32">
|
@@ -1938,7 +1938,7 @@
|
|
1938 |
</port>
|
1939 |
</output>
|
1940 |
</layer>
|
1941 |
-
<layer id="143" name="
|
1942 |
<data element_type="i64" shape="4" offset="67985482" size="32" />
|
1943 |
<output>
|
1944 |
<port id="0" precision="I64">
|
@@ -2050,7 +2050,7 @@
|
|
2050 |
</port>
|
2051 |
</output>
|
2052 |
</layer>
|
2053 |
-
<layer id="150" name="
|
2054 |
<data element_type="i64" shape="3" offset="69693078" size="24" />
|
2055 |
<output>
|
2056 |
<port id="0" precision="I64">
|
@@ -2089,7 +2089,7 @@
|
|
2089 |
</port>
|
2090 |
</output>
|
2091 |
</layer>
|
2092 |
-
<layer id="153" name="
|
2093 |
<data destination_type="f16" />
|
2094 |
<input>
|
2095 |
<port id="0" precision="U4">
|
@@ -2116,7 +2116,7 @@
|
|
2116 |
</port>
|
2117 |
</output>
|
2118 |
</layer>
|
2119 |
-
<layer id="155" name="
|
2120 |
<data destination_type="f16" />
|
2121 |
<input>
|
2122 |
<port id="0" precision="U4">
|
@@ -2187,7 +2187,7 @@
|
|
2187 |
</port>
|
2188 |
</output>
|
2189 |
</layer>
|
2190 |
-
<layer id="159" name="
|
2191 |
<data element_type="i64" shape="2" offset="67980346" size="16" />
|
2192 |
<output>
|
2193 |
<port id="0" precision="I64">
|
@@ -2195,7 +2195,7 @@
|
|
2195 |
</port>
|
2196 |
</output>
|
2197 |
</layer>
|
2198 |
-
<layer id="160" name="
|
2199 |
<data special_zero="false" />
|
2200 |
<input>
|
2201 |
<port id="0" precision="FP16">
|
@@ -2250,7 +2250,7 @@
|
|
2250 |
</port>
|
2251 |
</output>
|
2252 |
</layer>
|
2253 |
-
<layer id="163" name="
|
2254 |
<data element_type="f32" shape="1, 1, 1280" offset="70544302" size="5120" />
|
2255 |
<output>
|
2256 |
<port id="0" precision="FP32">
|
@@ -2332,7 +2332,7 @@
|
|
2332 |
</port>
|
2333 |
</output>
|
2334 |
</layer>
|
2335 |
-
<layer id="168" name="
|
2336 |
<data element_type="f32" shape="1, 1, 1280" offset="70549422" size="5120" />
|
2337 |
<output>
|
2338 |
<port id="0" precision="FP32">
|
@@ -2364,7 +2364,7 @@
|
|
2364 |
</port>
|
2365 |
</output>
|
2366 |
</layer>
|
2367 |
-
<layer id="170" name="
|
2368 |
<data element_type="f32" shape="1, 1, 1280" offset="70554542" size="5120" />
|
2369 |
<output>
|
2370 |
<port id="0" precision="FP32">
|
@@ -2396,7 +2396,7 @@
|
|
2396 |
</port>
|
2397 |
</output>
|
2398 |
</layer>
|
2399 |
-
<layer id="172" name="
|
2400 |
<data element_type="u4" shape="1280, 10, 128" offset="70559662" size="819200" />
|
2401 |
<output>
|
2402 |
<port id="0" precision="U4">
|
@@ -2406,7 +2406,7 @@
|
|
2406 |
</port>
|
2407 |
</output>
|
2408 |
</layer>
|
2409 |
-
<layer id="173" name="
|
2410 |
<data destination_type="f16" />
|
2411 |
<input>
|
2412 |
<port id="0" precision="U4">
|
@@ -2423,7 +2423,7 @@
|
|
2423 |
</port>
|
2424 |
</output>
|
2425 |
</layer>
|
2426 |
-
<layer id="174" name="
|
2427 |
<data element_type="u4" shape="1280, 10, 1" offset="71378862" size="6400" />
|
2428 |
<output>
|
2429 |
<port id="0" precision="U4">
|
@@ -2433,7 +2433,7 @@
|
|
2433 |
</port>
|
2434 |
</output>
|
2435 |
</layer>
|
2436 |
-
<layer id="175" name="
|
2437 |
<data destination_type="f16" />
|
2438 |
<input>
|
2439 |
<port id="0" precision="U4">
|
@@ -2450,7 +2450,7 @@
|
|
2450 |
</port>
|
2451 |
</output>
|
2452 |
</layer>
|
2453 |
-
<layer id="176" name="
|
2454 |
<data auto_broadcast="numpy" />
|
2455 |
<input>
|
2456 |
<port id="0" precision="FP16">
|
@@ -2472,7 +2472,7 @@
|
|
2472 |
</port>
|
2473 |
</output>
|
2474 |
</layer>
|
2475 |
-
<layer id="177" name="
|
2476 |
<data element_type="f16" shape="1280, 10, 1" offset="71385262" size="25600" />
|
2477 |
<output>
|
2478 |
<port id="0" precision="FP16">
|
@@ -2482,7 +2482,7 @@
|
|
2482 |
</port>
|
2483 |
</output>
|
2484 |
</layer>
|
2485 |
-
<layer id="178" name="
|
2486 |
<data auto_broadcast="numpy" />
|
2487 |
<input>
|
2488 |
<port id="0" precision="FP16">
|
@@ -2504,7 +2504,7 @@
|
|
2504 |
</port>
|
2505 |
</output>
|
2506 |
</layer>
|
2507 |
-
<layer id="179" name="
|
2508 |
<data element_type="i64" shape="2" offset="67980346" size="16" />
|
2509 |
<output>
|
2510 |
<port id="0" precision="I64">
|
@@ -2512,7 +2512,7 @@
|
|
2512 |
</port>
|
2513 |
</output>
|
2514 |
</layer>
|
2515 |
-
<layer id="180" name="
|
2516 |
<data special_zero="false" />
|
2517 |
<input>
|
2518 |
<port id="0" precision="FP16">
|
@@ -2531,7 +2531,7 @@
|
|
2531 |
</port>
|
2532 |
</output>
|
2533 |
</layer>
|
2534 |
-
<layer id="181" name="
|
2535 |
<data destination_type="f32" />
|
2536 |
<input>
|
2537 |
<port id="0" precision="FP16">
|
@@ -2546,7 +2546,7 @@
|
|
2546 |
</port>
|
2547 |
</output>
|
2548 |
</layer>
|
2549 |
-
<layer id="182" name="
|
2550 |
<data transpose_a="false" transpose_b="true" />
|
2551 |
<input>
|
2552 |
<port id="0" precision="FP32">
|
@@ -2567,7 +2567,7 @@
|
|
2567 |
</port>
|
2568 |
</output>
|
2569 |
</layer>
|
2570 |
-
<layer id="183" name="
|
2571 |
<data element_type="f32" shape="1, 1, 1280" offset="71410862" size="5120" />
|
2572 |
<output>
|
2573 |
<port id="0" precision="FP32">
|
@@ -2599,7 +2599,7 @@
|
|
2599 |
</port>
|
2600 |
</output>
|
2601 |
</layer>
|
2602 |
-
<layer id="185" name="
|
2603 |
<data element_type="i64" shape="4" offset="67985482" size="32" />
|
2604 |
<output>
|
2605 |
<port id="0" precision="I64">
|
@@ -2667,7 +2667,7 @@
|
|
2667 |
</port>
|
2668 |
</output>
|
2669 |
</layer>
|
2670 |
-
<layer id="190" name="
|
2671 |
<data destination_type="f16" />
|
2672 |
<input>
|
2673 |
<port id="0" precision="U4">
|
@@ -2694,7 +2694,7 @@
|
|
2694 |
</port>
|
2695 |
</output>
|
2696 |
</layer>
|
2697 |
-
<layer id="192" name="
|
2698 |
<data destination_type="f16" />
|
2699 |
<input>
|
2700 |
<port id="0" precision="U4">
|
@@ -2765,7 +2765,7 @@
|
|
2765 |
</port>
|
2766 |
</output>
|
2767 |
</layer>
|
2768 |
-
<layer id="196" name="
|
2769 |
<data element_type="i64" shape="2" offset="67980346" size="16" />
|
2770 |
<output>
|
2771 |
<port id="0" precision="I64">
|
@@ -2773,7 +2773,7 @@
|
|
2773 |
</port>
|
2774 |
</output>
|
2775 |
</layer>
|
2776 |
-
<layer id="197" name="
|
2777 |
<data special_zero="false" />
|
2778 |
<input>
|
2779 |
<port id="0" precision="FP16">
|
@@ -2828,7 +2828,7 @@
|
|
2828 |
</port>
|
2829 |
</output>
|
2830 |
</layer>
|
2831 |
-
<layer id="200" name="
|
2832 |
<data element_type="i64" shape="1" offset="72267182" size="8" />
|
2833 |
<output>
|
2834 |
<port id="0" precision="I64">
|
@@ -2836,7 +2836,7 @@
|
|
2836 |
</port>
|
2837 |
</output>
|
2838 |
</layer>
|
2839 |
-
<layer id="201" name="
|
2840 |
<data element_type="i64" shape="1" offset="72267190" size="8" />
|
2841 |
<output>
|
2842 |
<port id="0" precision="I64">
|
@@ -2844,7 +2844,7 @@
|
|
2844 |
</port>
|
2845 |
</output>
|
2846 |
</layer>
|
2847 |
-
<layer id="202" name="
|
2848 |
<data element_type="i64" shape="1" offset="72267198" size="8" />
|
2849 |
<output>
|
2850 |
<port id="0" precision="I64">
|
@@ -2852,7 +2852,7 @@
|
|
2852 |
</port>
|
2853 |
</output>
|
2854 |
</layer>
|
2855 |
-
<layer id="203" name="__module.model.model.decoder.layers.0.
|
2856 |
<data axis="0" />
|
2857 |
<input>
|
2858 |
<port id="0" precision="I64">
|
@@ -2978,7 +2978,7 @@
|
|
2978 |
</port>
|
2979 |
</output>
|
2980 |
</layer>
|
2981 |
-
<layer id="210" name="
|
2982 |
<data destination_type="f16" />
|
2983 |
<input>
|
2984 |
<port id="0" precision="U4">
|
@@ -3005,7 +3005,7 @@
|
|
3005 |
</port>
|
3006 |
</output>
|
3007 |
</layer>
|
3008 |
-
<layer id="212" name="
|
3009 |
<data destination_type="f16" />
|
3010 |
<input>
|
3011 |
<port id="0" precision="U4">
|
@@ -3076,7 +3076,7 @@
|
|
3076 |
</port>
|
3077 |
</output>
|
3078 |
</layer>
|
3079 |
-
<layer id="216" name="
|
3080 |
<data element_type="i64" shape="2" offset="67980346" size="16" />
|
3081 |
<output>
|
3082 |
<port id="0" precision="I64">
|
@@ -3084,7 +3084,7 @@
|
|
3084 |
</port>
|
3085 |
</output>
|
3086 |
</layer>
|
3087 |
-
<layer id="217" name="
|
3088 |
<data special_zero="false" />
|
3089 |
<input>
|
3090 |
<port id="0" precision="FP16">
|
@@ -3139,7 +3139,7 @@
|
|
3139 |
</port>
|
3140 |
</output>
|
3141 |
</layer>
|
3142 |
-
<layer id="220" name="
|
3143 |
<data element_type="f32" shape="1, 1, 1280" offset="73118406" size="5120" />
|
3144 |
<output>
|
3145 |
<port id="0" precision="FP32">
|
@@ -3275,7 +3275,7 @@
|
|
3275 |
</port>
|
3276 |
</output>
|
3277 |
</layer>
|
3278 |
-
<layer id="228" name="
|
3279 |
<data element_type="i64" shape="3" offset="73123526" size="24" />
|
3280 |
<output>
|
3281 |
<port id="0" precision="I64">
|
@@ -3314,7 +3314,7 @@
|
|
3314 |
</port>
|
3315 |
</output>
|
3316 |
</layer>
|
3317 |
-
<layer id="231" name="
|
3318 |
<data destination_type="f16" />
|
3319 |
<input>
|
3320 |
<port id="0" precision="U4">
|
@@ -3341,7 +3341,7 @@
|
|
3341 |
</port>
|
3342 |
</output>
|
3343 |
</layer>
|
3344 |
-
<layer id="233" name="
|
3345 |
<data destination_type="f16" />
|
3346 |
<input>
|
3347 |
<port id="0" precision="U4">
|
@@ -3412,7 +3412,7 @@
|
|
3412 |
</port>
|
3413 |
</output>
|
3414 |
</layer>
|
3415 |
-
<layer id="237" name="
|
3416 |
<data element_type="i64" shape="2" offset="67980346" size="16" />
|
3417 |
<output>
|
3418 |
<port id="0" precision="I64">
|
@@ -3420,7 +3420,7 @@
|
|
3420 |
</port>
|
3421 |
</output>
|
3422 |
</layer>
|
3423 |
-
<layer id="238" name="
|
3424 |
<data special_zero="false" />
|
3425 |
<input>
|
3426 |
<port id="0" precision="FP16">
|
@@ -3475,7 +3475,7 @@
|
|
3475 |
</port>
|
3476 |
</output>
|
3477 |
</layer>
|
3478 |
-
<layer id="241" name="
|
3479 |
<data element_type="f32" shape="1, 1, 1280" offset="73974750" size="5120" />
|
3480 |
<output>
|
3481 |
<port id="0" precision="FP32">
|
@@ -3557,7 +3557,7 @@
|
|
3557 |
</port>
|
3558 |
</output>
|
3559 |
</layer>
|
3560 |
-
<layer id="246" name="
|
3561 |
<data element_type="f32" shape="1, 1, 1280" offset="73979870" size="5120" />
|
3562 |
<output>
|
3563 |
<port id="0" precision="FP32">
|
@@ -3589,7 +3589,7 @@
|
|
3589 |
</port>
|
3590 |
</output>
|
3591 |
</layer>
|
3592 |
-
<layer id="248" name="
|
3593 |
<data element_type="f32" shape="1, 1, 1280" offset="73984990" size="5120" />
|
3594 |
<output>
|
3595 |
<port id="0" precision="FP32">
|
@@ -3631,7 +3631,7 @@
|
|
3631 |
</port>
|
3632 |
</output>
|
3633 |
</layer>
|
3634 |
-
<layer id="251" name="
|
3635 |
<data destination_type="f16" />
|
3636 |
<input>
|
3637 |
<port id="0" precision="U4">
|
@@ -3658,7 +3658,7 @@
|
|
3658 |
</port>
|
3659 |
</output>
|
3660 |
</layer>
|
3661 |
-
<layer id="253" name="
|
3662 |
<data destination_type="f16" />
|
3663 |
<input>
|
3664 |
<port id="0" precision="U4">
|
@@ -3729,7 +3729,7 @@
|
|
3729 |
</port>
|
3730 |
</output>
|
3731 |
</layer>
|
3732 |
-
<layer id="257" name="
|
3733 |
<data element_type="i64" shape="2" offset="77394910" size="16" />
|
3734 |
<output>
|
3735 |
<port id="0" precision="I64">
|
@@ -3737,7 +3737,7 @@
|
|
3737 |
</port>
|
3738 |
</output>
|
3739 |
</layer>
|
3740 |
-
<layer id="258" name="
|
3741 |
<data special_zero="false" />
|
3742 |
<input>
|
3743 |
<port id="0" precision="FP16">
|
@@ -3792,7 +3792,7 @@
|
|
3792 |
</port>
|
3793 |
</output>
|
3794 |
</layer>
|
3795 |
-
<layer id="261" name="
|
3796 |
<data element_type="f32" shape="1, 1, 5120" offset="77394926" size="20480" />
|
3797 |
<output>
|
3798 |
<port id="0" precision="FP32">
|
@@ -3851,7 +3851,7 @@
|
|
3851 |
</port>
|
3852 |
</output>
|
3853 |
</layer>
|
3854 |
-
<layer id="265" name="
|
3855 |
<data destination_type="f16" />
|
3856 |
<input>
|
3857 |
<port id="0" precision="U4">
|
@@ -3878,7 +3878,7 @@
|
|
3878 |
</port>
|
3879 |
</output>
|
3880 |
</layer>
|
3881 |
-
<layer id="267" name="
|
3882 |
<data destination_type="f16" />
|
3883 |
<input>
|
3884 |
<port id="0" precision="U4">
|
@@ -3949,7 +3949,7 @@
|
|
3949 |
</port>
|
3950 |
</output>
|
3951 |
</layer>
|
3952 |
-
<layer id="271" name="
|
3953 |
<data element_type="i64" shape="2" offset="80820206" size="16" />
|
3954 |
<output>
|
3955 |
<port id="0" precision="I64">
|
@@ -3957,7 +3957,7 @@
|
|
3957 |
</port>
|
3958 |
</output>
|
3959 |
</layer>
|
3960 |
-
<layer id="272" name="
|
3961 |
<data special_zero="false" />
|
3962 |
<input>
|
3963 |
<port id="0" precision="FP16">
|
@@ -4012,7 +4012,7 @@
|
|
4012 |
</port>
|
4013 |
</output>
|
4014 |
</layer>
|
4015 |
-
<layer id="275" name="
|
4016 |
<data element_type="f32" shape="1, 1, 1280" offset="80820222" size="5120" />
|
4017 |
<output>
|
4018 |
<port id="0" precision="FP32">
|
@@ -4094,7 +4094,7 @@
|
|
4094 |
</port>
|
4095 |
</output>
|
4096 |
</layer>
|
4097 |
-
<layer id="280" name="
|
4098 |
<data element_type="f32" shape="1, 1, 1280" offset="80825342" size="5120" />
|
4099 |
<output>
|
4100 |
<port id="0" precision="FP32">
|
@@ -4126,7 +4126,7 @@
|
|
4126 |
</port>
|
4127 |
</output>
|
4128 |
</layer>
|
4129 |
-
<layer id="282" name="
|
4130 |
<data element_type="f32" shape="1, 1, 1280" offset="80830462" size="5120" />
|
4131 |
<output>
|
4132 |
<port id="0" precision="FP32">
|
@@ -4158,7 +4158,7 @@
|
|
4158 |
</port>
|
4159 |
</output>
|
4160 |
</layer>
|
4161 |
-
<layer id="284" name="
|
4162 |
<data element_type="u4" shape="1280, 10, 128" offset="80835582" size="819200" />
|
4163 |
<output>
|
4164 |
<port id="0" precision="U4">
|
@@ -4168,7 +4168,7 @@
|
|
4168 |
</port>
|
4169 |
</output>
|
4170 |
</layer>
|
4171 |
-
<layer id="285" name="
|
4172 |
<data destination_type="f16" />
|
4173 |
<input>
|
4174 |
<port id="0" precision="U4">
|
@@ -4185,7 +4185,7 @@
|
|
4185 |
</port>
|
4186 |
</output>
|
4187 |
</layer>
|
4188 |
-
<layer id="286" name="
|
4189 |
<data element_type="u4" shape="1280, 10, 1" offset="81654782" size="6400" />
|
4190 |
<output>
|
4191 |
<port id="0" precision="U4">
|
@@ -4195,7 +4195,7 @@
|
|
4195 |
</port>
|
4196 |
</output>
|
4197 |
</layer>
|
4198 |
-
<layer id="287" name="
|
4199 |
<data destination_type="f16" />
|
4200 |
<input>
|
4201 |
<port id="0" precision="U4">
|
@@ -4212,7 +4212,7 @@
|
|
4212 |
</port>
|
4213 |
</output>
|
4214 |
</layer>
|
4215 |
-
<layer id="288" name="
|
4216 |
<data auto_broadcast="numpy" />
|
4217 |
<input>
|
4218 |
<port id="0" precision="FP16">
|
@@ -4234,7 +4234,7 @@
|
|
4234 |
</port>
|
4235 |
</output>
|
4236 |
</layer>
|
4237 |
-
<layer id="289" name="
|
4238 |
<data element_type="f16" shape="1280, 10, 1" offset="81661182" size="25600" />
|
4239 |
<output>
|
4240 |
<port id="0" precision="FP16">
|
@@ -4244,7 +4244,7 @@
|
|
4244 |
</port>
|
4245 |
</output>
|
4246 |
</layer>
|
4247 |
-
<layer id="290" name="
|
4248 |
<data auto_broadcast="numpy" />
|
4249 |
<input>
|
4250 |
<port id="0" precision="FP16">
|
@@ -4266,7 +4266,7 @@
|
|
4266 |
</port>
|
4267 |
</output>
|
4268 |
</layer>
|
4269 |
-
<layer id="291" name="
|
4270 |
<data element_type="i64" shape="2" offset="67980346" size="16" />
|
4271 |
<output>
|
4272 |
<port id="0" precision="I64">
|
@@ -4274,7 +4274,7 @@
|
|
4274 |
</port>
|
4275 |
</output>
|
4276 |
</layer>
|
4277 |
-
<layer id="292" name="
|
4278 |
<data special_zero="false" />
|
4279 |
<input>
|
4280 |
<port id="0" precision="FP16">
|
@@ -4293,7 +4293,7 @@
|
|
4293 |
</port>
|
4294 |
</output>
|
4295 |
</layer>
|
4296 |
-
<layer id="293" name="
|
4297 |
<data destination_type="f32" />
|
4298 |
<input>
|
4299 |
<port id="0" precision="FP16">
|
@@ -4308,7 +4308,7 @@
|
|
4308 |
</port>
|
4309 |
</output>
|
4310 |
</layer>
|
4311 |
-
<layer id="294" name="
|
4312 |
<data transpose_a="false" transpose_b="true" />
|
4313 |
<input>
|
4314 |
<port id="0" precision="FP32">
|
@@ -4329,7 +4329,7 @@
|
|
4329 |
</port>
|
4330 |
</output>
|
4331 |
</layer>
|
4332 |
-
<layer id="295" name="
|
4333 |
<data element_type="f32" shape="1, 1, 1280" offset="81686782" size="5120" />
|
4334 |
<output>
|
4335 |
<port id="0" precision="FP32">
|
@@ -4361,7 +4361,7 @@
|
|
4361 |
</port>
|
4362 |
</output>
|
4363 |
</layer>
|
4364 |
-
<layer id="297" name="
|
4365 |
<data element_type="i64" shape="4" offset="67985482" size="32" />
|
4366 |
<output>
|
4367 |
<port id="0" precision="I64">
|
@@ -4429,7 +4429,7 @@
|
|
4429 |
</port>
|
4430 |
</output>
|
4431 |
</layer>
|
4432 |
-
<layer id="302" name="
|
4433 |
<data destination_type="f16" />
|
4434 |
<input>
|
4435 |
<port id="0" precision="U4">
|
@@ -4456,7 +4456,7 @@
|
|
4456 |
</port>
|
4457 |
</output>
|
4458 |
</layer>
|
4459 |
-
<layer id="304" name="
|
4460 |
<data destination_type="f16" />
|
4461 |
<input>
|
4462 |
<port id="0" precision="U4">
|
@@ -4527,7 +4527,7 @@
|
|
4527 |
</port>
|
4528 |
</output>
|
4529 |
</layer>
|
4530 |
-
<layer id="308" name="
|
4531 |
<data element_type="i64" shape="2" offset="67980346" size="16" />
|
4532 |
<output>
|
4533 |
<port id="0" precision="I64">
|
@@ -4535,7 +4535,7 @@
|
|
4535 |
</port>
|
4536 |
</output>
|
4537 |
</layer>
|
4538 |
-
<layer id="309" name="
|
4539 |
<data special_zero="false" />
|
4540 |
<input>
|
4541 |
<port id="0" precision="FP16">
|
@@ -4590,7 +4590,7 @@
|
|
4590 |
</port>
|
4591 |
</output>
|
4592 |
</layer>
|
4593 |
-
<layer id="312" name="
|
4594 |
<data element_type="i64" shape="4" offset="67985482" size="32" />
|
4595 |
<output>
|
4596 |
<port id="0" precision="I64">
|
@@ -4727,7 +4727,7 @@
|
|
4727 |
</port>
|
4728 |
</output>
|
4729 |
</layer>
|
4730 |
-
<layer id="320" name="
|
4731 |
<data destination_type="f16" />
|
4732 |
<input>
|
4733 |
<port id="0" precision="U4">
|
@@ -4754,7 +4754,7 @@
|
|
4754 |
</port>
|
4755 |
</output>
|
4756 |
</layer>
|
4757 |
-
<layer id="322" name="
|
4758 |
<data destination_type="f16" />
|
4759 |
<input>
|
4760 |
<port id="0" precision="U4">
|
@@ -4825,7 +4825,7 @@
|
|
4825 |
</port>
|
4826 |
</output>
|
4827 |
</layer>
|
4828 |
-
<layer id="326" name="
|
4829 |
<data element_type="i64" shape="2" offset="67980346" size="16" />
|
4830 |
<output>
|
4831 |
<port id="0" precision="I64">
|
@@ -4833,7 +4833,7 @@
|
|
4833 |
</port>
|
4834 |
</output>
|
4835 |
</layer>
|
4836 |
-
<layer id="327" name="
|
4837 |
<data special_zero="false" />
|
4838 |
<input>
|
4839 |
<port id="0" precision="FP16">
|
@@ -4888,7 +4888,7 @@
|
|
4888 |
</port>
|
4889 |
</output>
|
4890 |
</layer>
|
4891 |
-
<layer id="330" name="
|
4892 |
<data element_type="f32" shape="1, 1, 1280" offset="83394302" size="5120" />
|
4893 |
<output>
|
4894 |
<port id="0" precision="FP32">
|
@@ -4920,7 +4920,7 @@
|
|
4920 |
</port>
|
4921 |
</output>
|
4922 |
</layer>
|
4923 |
-
<layer id="332" name="
|
4924 |
<data element_type="i64" shape="4" offset="67985482" size="32" />
|
4925 |
<output>
|
4926 |
<port id="0" precision="I64">
|
@@ -5032,7 +5032,7 @@
|
|
5032 |
</port>
|
5033 |
</output>
|
5034 |
</layer>
|
5035 |
-
<layer id="339" name="
|
5036 |
<data element_type="i64" shape="3" offset="69693078" size="24" />
|
5037 |
<output>
|
5038 |
<port id="0" precision="I64">
|
@@ -5071,7 +5071,7 @@
|
|
5071 |
</port>
|
5072 |
</output>
|
5073 |
</layer>
|
5074 |
-
<layer id="342" name="
|
5075 |
<data destination_type="f16" />
|
5076 |
<input>
|
5077 |
<port id="0" precision="U4">
|
@@ -5098,7 +5098,7 @@
|
|
5098 |
</port>
|
5099 |
</output>
|
5100 |
</layer>
|
5101 |
-
<layer id="344" name="
|
5102 |
<data destination_type="f16" />
|
5103 |
<input>
|
5104 |
<port id="0" precision="U4">
|
@@ -5169,7 +5169,7 @@
|
|
5169 |
</port>
|
5170 |
</output>
|
5171 |
</layer>
|
5172 |
-
<layer id="348" name="
|
5173 |
<data element_type="i64" shape="2" offset="67980346" size="16" />
|
5174 |
<output>
|
5175 |
<port id="0" precision="I64">
|
@@ -5177,7 +5177,7 @@
|
|
5177 |
</port>
|
5178 |
</output>
|
5179 |
</layer>
|
5180 |
-
<layer id="349" name="
|
5181 |
<data special_zero="false" />
|
5182 |
<input>
|
5183 |
<port id="0" precision="FP16">
|
@@ -5232,7 +5232,7 @@
|
|
5232 |
</port>
|
5233 |
</output>
|
5234 |
</layer>
|
5235 |
-
<layer id="352" name="
|
5236 |
<data element_type="f32" shape="1, 1, 1280" offset="84250622" size="5120" />
|
5237 |
<output>
|
5238 |
<port id="0" precision="FP32">
|
@@ -5314,7 +5314,7 @@
|
|
5314 |
</port>
|
5315 |
</output>
|
5316 |
</layer>
|
5317 |
-
<layer id="357" name="
|
5318 |
<data element_type="f32" shape="1, 1, 1280" offset="84255742" size="5120" />
|
5319 |
<output>
|
5320 |
<port id="0" precision="FP32">
|
@@ -5346,7 +5346,7 @@
|
|
5346 |
</port>
|
5347 |
</output>
|
5348 |
</layer>
|
5349 |
-
<layer id="359" name="
|
5350 |
<data element_type="f32" shape="1, 1, 1280" offset="84260862" size="5120" />
|
5351 |
<output>
|
5352 |
<port id="0" precision="FP32">
|
@@ -5378,7 +5378,7 @@
|
|
5378 |
</port>
|
5379 |
</output>
|
5380 |
</layer>
|
5381 |
-
<layer id="361" name="
|
5382 |
<data element_type="u4" shape="1280, 10, 128" offset="84265982" size="819200" />
|
5383 |
<output>
|
5384 |
<port id="0" precision="U4">
|
@@ -5388,7 +5388,7 @@
|
|
5388 |
</port>
|
5389 |
</output>
|
5390 |
</layer>
|
5391 |
-
<layer id="362" name="
|
5392 |
<data destination_type="f16" />
|
5393 |
<input>
|
5394 |
<port id="0" precision="U4">
|
@@ -5405,7 +5405,7 @@
|
|
5405 |
</port>
|
5406 |
</output>
|
5407 |
</layer>
|
5408 |
-
<layer id="363" name="
|
5409 |
<data element_type="u4" shape="1280, 10, 1" offset="85085182" size="6400" />
|
5410 |
<output>
|
5411 |
<port id="0" precision="U4">
|
@@ -5415,7 +5415,7 @@
|
|
5415 |
</port>
|
5416 |
</output>
|
5417 |
</layer>
|
5418 |
-
<layer id="364" name="
|
5419 |
<data destination_type="f16" />
|
5420 |
<input>
|
5421 |
<port id="0" precision="U4">
|
@@ -5432,7 +5432,7 @@
|
|
5432 |
</port>
|
5433 |
</output>
|
5434 |
</layer>
|
5435 |
-
<layer id="365" name="
|
5436 |
<data auto_broadcast="numpy" />
|
5437 |
<input>
|
5438 |
<port id="0" precision="FP16">
|
@@ -5454,7 +5454,7 @@
|
|
5454 |
</port>
|
5455 |
</output>
|
5456 |
</layer>
|
5457 |
-
<layer id="366" name="
|
5458 |
<data element_type="f16" shape="1280, 10, 1" offset="85091582" size="25600" />
|
5459 |
<output>
|
5460 |
<port id="0" precision="FP16">
|
@@ -5464,7 +5464,7 @@
|
|
5464 |
</port>
|
5465 |
</output>
|
5466 |
</layer>
|
5467 |
-
<layer id="367" name="
|
5468 |
<data auto_broadcast="numpy" />
|
5469 |
<input>
|
5470 |
<port id="0" precision="FP16">
|
@@ -5486,7 +5486,7 @@
|
|
5486 |
</port>
|
5487 |
</output>
|
5488 |
</layer>
|
5489 |
-
<layer id="368" name="
|
5490 |
<data element_type="i64" shape="2" offset="67980346" size="16" />
|
5491 |
<output>
|
5492 |
<port id="0" precision="I64">
|
@@ -5494,7 +5494,7 @@
|
|
5494 |
</port>
|
5495 |
</output>
|
5496 |
</layer>
|
5497 |
-
<layer id="369" name="
|
5498 |
<data special_zero="false" />
|
5499 |
<input>
|
5500 |
<port id="0" precision="FP16">
|
@@ -5513,7 +5513,7 @@
|
|
5513 |
</port>
|
5514 |
</output>
|
5515 |
</layer>
|
5516 |
-
<layer id="370" name="
|
5517 |
<data destination_type="f32" />
|
5518 |
<input>
|
5519 |
<port id="0" precision="FP16">
|
@@ -5528,7 +5528,7 @@
|
|
5528 |
</port>
|
5529 |
</output>
|
5530 |
</layer>
|
5531 |
-
<layer id="371" name="
|
5532 |
<data transpose_a="false" transpose_b="true" />
|
5533 |
<input>
|
5534 |
<port id="0" precision="FP32">
|
@@ -5549,7 +5549,7 @@
|
|
5549 |
</port>
|
5550 |
</output>
|
5551 |
</layer>
|
5552 |
-
<layer id="372" name="
|
5553 |
<data element_type="f32" shape="1, 1, 1280" offset="85117182" size="5120" />
|
5554 |
<output>
|
5555 |
<port id="0" precision="FP32">
|
@@ -5581,7 +5581,7 @@
|
|
5581 |
</port>
|
5582 |
</output>
|
5583 |
</layer>
|
5584 |
-
<layer id="374" name="
|
5585 |
<data element_type="i64" shape="4" offset="67985482" size="32" />
|
5586 |
<output>
|
5587 |
<port id="0" precision="I64">
|
@@ -5649,7 +5649,7 @@
|
|
5649 |
</port>
|
5650 |
</output>
|
5651 |
</layer>
|
5652 |
-
<layer id="379" name="
|
5653 |
<data destination_type="f16" />
|
5654 |
<input>
|
5655 |
<port id="0" precision="U4">
|
@@ -5676,7 +5676,7 @@
|
|
5676 |
</port>
|
5677 |
</output>
|
5678 |
</layer>
|
5679 |
-
<layer id="381" name="
|
5680 |
<data destination_type="f16" />
|
5681 |
<input>
|
5682 |
<port id="0" precision="U4">
|
@@ -5747,7 +5747,7 @@
|
|
5747 |
</port>
|
5748 |
</output>
|
5749 |
</layer>
|
5750 |
-
<layer id="385" name="
|
5751 |
<data element_type="i64" shape="2" offset="67980346" size="16" />
|
5752 |
<output>
|
5753 |
<port id="0" precision="I64">
|
@@ -5755,7 +5755,7 @@
|
|
5755 |
</port>
|
5756 |
</output>
|
5757 |
</layer>
|
5758 |
-
<layer id="386" name="
|
5759 |
<data special_zero="false" />
|
5760 |
<input>
|
5761 |
<port id="0" precision="FP16">
|
@@ -5914,7 +5914,7 @@
|
|
5914 |
</port>
|
5915 |
</output>
|
5916 |
</layer>
|
5917 |
-
<layer id="395" name="
|
5918 |
<data destination_type="f16" />
|
5919 |
<input>
|
5920 |
<port id="0" precision="U4">
|
@@ -5941,7 +5941,7 @@
|
|
5941 |
</port>
|
5942 |
</output>
|
5943 |
</layer>
|
5944 |
-
<layer id="397" name="
|
5945 |
<data destination_type="f16" />
|
5946 |
<input>
|
5947 |
<port id="0" precision="U4">
|
@@ -6012,7 +6012,7 @@
|
|
6012 |
</port>
|
6013 |
</output>
|
6014 |
</layer>
|
6015 |
-
<layer id="401" name="
|
6016 |
<data element_type="i64" shape="2" offset="67980346" size="16" />
|
6017 |
<output>
|
6018 |
<port id="0" precision="I64">
|
@@ -6020,7 +6020,7 @@
|
|
6020 |
</port>
|
6021 |
</output>
|
6022 |
</layer>
|
6023 |
-
<layer id="402" name="
|
6024 |
<data special_zero="false" />
|
6025 |
<input>
|
6026 |
<port id="0" precision="FP16">
|
@@ -6075,7 +6075,7 @@
|
|
6075 |
</port>
|
6076 |
</output>
|
6077 |
</layer>
|
6078 |
-
<layer id="405" name="
|
6079 |
<data element_type="f32" shape="1, 1, 1280" offset="86824702" size="5120" />
|
6080 |
<output>
|
6081 |
<port id="0" precision="FP32">
|
@@ -6211,7 +6211,7 @@
|
|
6211 |
</port>
|
6212 |
</output>
|
6213 |
</layer>
|
6214 |
-
<layer id="413" name="
|
6215 |
<data element_type="i64" shape="3" offset="73123526" size="24" />
|
6216 |
<output>
|
6217 |
<port id="0" precision="I64">
|
@@ -6250,7 +6250,7 @@
|
|
6250 |
</port>
|
6251 |
</output>
|
6252 |
</layer>
|
6253 |
-
<layer id="416" name="
|
6254 |
<data destination_type="f16" />
|
6255 |
<input>
|
6256 |
<port id="0" precision="U4">
|
@@ -6277,7 +6277,7 @@
|
|
6277 |
</port>
|
6278 |
</output>
|
6279 |
</layer>
|
6280 |
-
<layer id="418" name="
|
6281 |
<data destination_type="f16" />
|
6282 |
<input>
|
6283 |
<port id="0" precision="U4">
|
@@ -6348,7 +6348,7 @@
|
|
6348 |
</port>
|
6349 |
</output>
|
6350 |
</layer>
|
6351 |
-
<layer id="422" name="
|
6352 |
<data element_type="i64" shape="2" offset="67980346" size="16" />
|
6353 |
<output>
|
6354 |
<port id="0" precision="I64">
|
@@ -6356,7 +6356,7 @@
|
|
6356 |
</port>
|
6357 |
</output>
|
6358 |
</layer>
|
6359 |
-
<layer id="423" name="
|
6360 |
<data special_zero="false" />
|
6361 |
<input>
|
6362 |
<port id="0" precision="FP16">
|
@@ -6411,7 +6411,7 @@
|
|
6411 |
</port>
|
6412 |
</output>
|
6413 |
</layer>
|
6414 |
-
<layer id="426" name="
|
6415 |
<data element_type="f32" shape="1, 1, 1280" offset="87681022" size="5120" />
|
6416 |
<output>
|
6417 |
<port id="0" precision="FP32">
|
@@ -6493,7 +6493,7 @@
|
|
6493 |
</port>
|
6494 |
</output>
|
6495 |
</layer>
|
6496 |
-
<layer id="431" name="
|
6497 |
<data element_type="f32" shape="1, 1, 1280" offset="87686142" size="5120" />
|
6498 |
<output>
|
6499 |
<port id="0" precision="FP32">
|
@@ -6525,7 +6525,7 @@
|
|
6525 |
</port>
|
6526 |
</output>
|
6527 |
</layer>
|
6528 |
-
<layer id="433" name="
|
6529 |
<data element_type="f32" shape="1, 1, 1280" offset="87691262" size="5120" />
|
6530 |
<output>
|
6531 |
<port id="0" precision="FP32">
|
@@ -6567,7 +6567,7 @@
|
|
6567 |
</port>
|
6568 |
</output>
|
6569 |
</layer>
|
6570 |
-
<layer id="436" name="
|
6571 |
<data destination_type="f16" />
|
6572 |
<input>
|
6573 |
<port id="0" precision="U4">
|
@@ -6594,7 +6594,7 @@
|
|
6594 |
</port>
|
6595 |
</output>
|
6596 |
</layer>
|
6597 |
-
<layer id="438" name="
|
6598 |
<data destination_type="f16" />
|
6599 |
<input>
|
6600 |
<port id="0" precision="U4">
|
@@ -6665,7 +6665,7 @@
|
|
6665 |
</port>
|
6666 |
</output>
|
6667 |
</layer>
|
6668 |
-
<layer id="442" name="
|
6669 |
<data element_type="i64" shape="2" offset="77394910" size="16" />
|
6670 |
<output>
|
6671 |
<port id="0" precision="I64">
|
@@ -6673,7 +6673,7 @@
|
|
6673 |
</port>
|
6674 |
</output>
|
6675 |
</layer>
|
6676 |
-
<layer id="443" name="
|
6677 |
<data special_zero="false" />
|
6678 |
<input>
|
6679 |
<port id="0" precision="FP16">
|
@@ -6728,7 +6728,7 @@
|
|
6728 |
</port>
|
6729 |
</output>
|
6730 |
</layer>
|
6731 |
-
<layer id="446" name="
|
6732 |
<data element_type="f32" shape="1, 1, 5120" offset="91101182" size="20480" />
|
6733 |
<output>
|
6734 |
<port id="0" precision="FP32">
|
@@ -6787,7 +6787,7 @@
|
|
6787 |
</port>
|
6788 |
</output>
|
6789 |
</layer>
|
6790 |
-
<layer id="450" name="
|
6791 |
<data destination_type="f16" />
|
6792 |
<input>
|
6793 |
<port id="0" precision="U4">
|
@@ -6814,7 +6814,7 @@
|
|
6814 |
</port>
|
6815 |
</output>
|
6816 |
</layer>
|
6817 |
-
<layer id="452" name="
|
6818 |
<data destination_type="f16" />
|
6819 |
<input>
|
6820 |
<port id="0" precision="U4">
|
@@ -6885,7 +6885,7 @@
|
|
6885 |
</port>
|
6886 |
</output>
|
6887 |
</layer>
|
6888 |
-
<layer id="456" name="
|
6889 |
<data element_type="i64" shape="2" offset="80820206" size="16" />
|
6890 |
<output>
|
6891 |
<port id="0" precision="I64">
|
@@ -6893,7 +6893,7 @@
|
|
6893 |
</port>
|
6894 |
</output>
|
6895 |
</layer>
|
6896 |
-
<layer id="457" name="
|
6897 |
<data special_zero="false" />
|
6898 |
<input>
|
6899 |
<port id="0" precision="FP16">
|
@@ -6948,7 +6948,7 @@
|
|
6948 |
</port>
|
6949 |
</output>
|
6950 |
</layer>
|
6951 |
-
<layer id="460" name="
|
6952 |
<data element_type="f32" shape="1, 1, 1280" offset="94526462" size="5120" />
|
6953 |
<output>
|
6954 |
<port id="0" precision="FP32">
|
@@ -7030,7 +7030,7 @@
|
|
7030 |
</port>
|
7031 |
</output>
|
7032 |
</layer>
|
7033 |
-
<layer id="465" name="
|
7034 |
<data element_type="f32" shape="1, 1, 1280" offset="94531582" size="5120" />
|
7035 |
<output>
|
7036 |
<port id="0" precision="FP32">
|
@@ -7062,7 +7062,7 @@
|
|
7062 |
</port>
|
7063 |
</output>
|
7064 |
</layer>
|
7065 |
-
<layer id="467" name="
|
7066 |
<data element_type="f32" shape="1, 1, 1280" offset="94536702" size="5120" />
|
7067 |
<output>
|
7068 |
<port id="0" precision="FP32">
|
@@ -7115,7 +7115,7 @@
|
|
7115 |
</port>
|
7116 |
</output>
|
7117 |
</layer>
|
7118 |
-
<layer id="470" name="
|
7119 |
<input>
|
7120 |
<port id="0" precision="FP32">
|
7121 |
<dim>-1</dim>
|
@@ -7632,7 +7632,7 @@
|
|
7632 |
<edge from-layer="469" from-port="2" to-layer="470" to-port="0" />
|
7633 |
</edges>
|
7634 |
<rt_info>
|
7635 |
-
<Runtime_version value="2024.5.0-
|
7636 |
<conversion_parameters>
|
7637 |
<framework value="pytorch" />
|
7638 |
<is_python_object value="True" />
|
@@ -7640,9 +7640,10 @@
|
|
7640 |
<nncf>
|
7641 |
<friendly_names_were_updated value="True" />
|
7642 |
<weight_compression>
|
7643 |
-
<advanced_parameters value="{'awq_params': {'subset_size': 32, 'percent_to_apply': 0.002, 'alpha_min': 0.0, 'alpha_max': 1.0, 'steps': 100}, 'scale_estimation_params': {'subset_size': 64, 'initial_steps': 5, 'scale_steps': 5, 'weight_penalty': -1.0}, 'gptq_params': {'damp_percent': 0.1, 'block_size': 128, 'subset_size': 128}, 'lora_correction_params': {'adapter_rank': 8, 'num_iterations': 3, 'apply_regularization': True, 'subset_size': 128, 'use_int8_adapters': True}}" />
|
7644 |
<all_layers value="False" />
|
7645 |
<awq value="False" />
|
|
|
7646 |
<gptq value="False" />
|
7647 |
<group_size value="128" />
|
7648 |
<ignored_scope value="[]" />
|
@@ -7654,10 +7655,10 @@
|
|
7654 |
</weight_compression>
|
7655 |
</nncf>
|
7656 |
<optimum>
|
7657 |
-
<optimum_intel_version value="1.
|
7658 |
-
<optimum_version value="1.23.
|
7659 |
-
<pytorch_version value="2.5.
|
7660 |
-
<transformers_version value="4.
|
7661 |
</optimum>
|
7662 |
</rt_info>
|
7663 |
</net>
|
|
|
10 |
</port>
|
11 |
</output>
|
12 |
</layer>
|
13 |
+
<layer id="0" name="Parameter_26207" type="Parameter" version="opset1">
|
14 |
<data shape="?,?,?" element_type="f32" />
|
15 |
<output>
|
16 |
<port id="0" precision="FP32" names="encoder_hidden_states">
|
|
|
29 |
</port>
|
30 |
</output>
|
31 |
</layer>
|
32 |
+
<layer id="3" name="Convert_42987" type="Convert" version="opset1">
|
33 |
<data destination_type="f16" />
|
34 |
<input>
|
35 |
<port id="0" precision="U8">
|
|
|
53 |
</port>
|
54 |
</output>
|
55 |
</layer>
|
56 |
+
<layer id="5" name="Convert_42990" type="Convert" version="opset1">
|
57 |
<data destination_type="f16" />
|
58 |
<input>
|
59 |
<port id="0" precision="U8">
|
|
|
130 |
</port>
|
131 |
</output>
|
132 |
</layer>
|
133 |
+
<layer id="10" name="Constant_31708" type="Const" version="opset1">
|
134 |
<data element_type="i64" shape="2" offset="66544078" size="16" />
|
135 |
<output>
|
136 |
<port id="0" precision="I64">
|
|
|
207 |
</port>
|
208 |
</output>
|
209 |
</layer>
|
210 |
+
<layer id="16" name="Convert_43218" type="Convert" version="opset1">
|
211 |
<data destination_type="f16" />
|
212 |
<input>
|
213 |
<port id="0" precision="U8">
|
|
|
231 |
</port>
|
232 |
</output>
|
233 |
</layer>
|
234 |
+
<layer id="18" name="Convert_43221" type="Convert" version="opset1">
|
235 |
<data destination_type="f16" />
|
236 |
<input>
|
237 |
<port id="0" precision="U8">
|
|
|
314 |
<port id="0" precision="I64" names="23" />
|
315 |
</output>
|
316 |
</layer>
|
317 |
+
<layer id="24" name="ShapeOf_31624" type="ShapeOf" version="opset3">
|
318 |
<data output_type="i64" />
|
319 |
<input>
|
320 |
<port id="0" precision="I64">
|
|
|
328 |
</port>
|
329 |
</output>
|
330 |
</layer>
|
331 |
+
<layer id="25" name="Constant_31625" type="Const" version="opset1">
|
332 |
<data element_type="i64" shape="" offset="67118890" size="8" />
|
333 |
<output>
|
334 |
<port id="0" precision="I64" />
|
335 |
</output>
|
336 |
</layer>
|
337 |
+
<layer id="26" name="Constant_31626" type="Const" version="opset1">
|
338 |
<data element_type="i64" shape="" offset="67118882" size="8" />
|
339 |
<output>
|
340 |
<port id="0" precision="I64" />
|
341 |
</output>
|
342 |
</layer>
|
343 |
+
<layer id="27" name="Gather_31627" type="Gather" version="opset8">
|
344 |
<data batch_dims="0" />
|
345 |
<input>
|
346 |
<port id="0" precision="I64">
|
|
|
401 |
</port>
|
402 |
</output>
|
403 |
</layer>
|
404 |
+
<layer id="32" name="__module.model.model.decoder.embed_positions/aten::index/Constant" type="Const" version="opset1">
|
405 |
<data element_type="i32" shape="" offset="66544094" size="4" />
|
406 |
<output>
|
407 |
<port id="0" precision="I32" />
|
|
|
478 |
</port>
|
479 |
</output>
|
480 |
</layer>
|
481 |
+
<layer id="37" name="Constant_31390" type="Const" version="opset1">
|
482 |
<data element_type="f32" shape="1, 1, 1280" offset="67118906" size="5120" />
|
483 |
<output>
|
484 |
<port id="0" precision="FP32">
|
|
|
510 |
</port>
|
511 |
</output>
|
512 |
</layer>
|
513 |
+
<layer id="39" name="Constant_31391" type="Const" version="opset1">
|
514 |
<data element_type="f32" shape="1, 1, 1280" offset="67124026" size="5120" />
|
515 |
<output>
|
516 |
<port id="0" precision="FP32">
|
|
|
542 |
</port>
|
543 |
</output>
|
544 |
</layer>
|
545 |
+
<layer id="41" name="Constant_31293" type="Const" version="opset1">
|
546 |
<data element_type="u4" shape="1280, 10, 128" offset="67129146" size="819200" />
|
547 |
<output>
|
548 |
<port id="0" precision="U4">
|
|
|
552 |
</port>
|
553 |
</output>
|
554 |
</layer>
|
555 |
+
<layer id="42" name="Convert_43107" type="Convert" version="opset1">
|
556 |
<data destination_type="f16" />
|
557 |
<input>
|
558 |
<port id="0" precision="U4">
|
|
|
569 |
</port>
|
570 |
</output>
|
571 |
</layer>
|
572 |
+
<layer id="43" name="Constant_31293/zero_point" type="Const" version="opset1">
|
573 |
<data element_type="u4" shape="1280, 10, 1" offset="67948346" size="6400" />
|
574 |
<output>
|
575 |
<port id="0" precision="U4">
|
|
|
579 |
</port>
|
580 |
</output>
|
581 |
</layer>
|
582 |
+
<layer id="44" name="Convert_43109" type="Convert" version="opset1">
|
583 |
<data destination_type="f16" />
|
584 |
<input>
|
585 |
<port id="0" precision="U4">
|
|
|
596 |
</port>
|
597 |
</output>
|
598 |
</layer>
|
599 |
+
<layer id="45" name="Constant_31293/zero_point/subtract" type="Subtract" version="opset1">
|
600 |
<data auto_broadcast="numpy" />
|
601 |
<input>
|
602 |
<port id="0" precision="FP16">
|
|
|
618 |
</port>
|
619 |
</output>
|
620 |
</layer>
|
621 |
+
<layer id="46" name="Constant_31293/scale" type="Const" version="opset1">
|
622 |
<data element_type="f16" shape="1280, 10, 1" offset="67954746" size="25600" />
|
623 |
<output>
|
624 |
<port id="0" precision="FP16">
|
|
|
628 |
</port>
|
629 |
</output>
|
630 |
</layer>
|
631 |
+
<layer id="47" name="Constant_31293/fq_weights_1" type="Multiply" version="opset1">
|
632 |
<data auto_broadcast="numpy" />
|
633 |
<input>
|
634 |
<port id="0" precision="FP16">
|
|
|
650 |
</port>
|
651 |
</output>
|
652 |
</layer>
|
653 |
+
<layer id="48" name="Constant_43114" type="Const" version="opset1">
|
654 |
<data element_type="i64" shape="2" offset="67980346" size="16" />
|
655 |
<output>
|
656 |
<port id="0" precision="I64">
|
|
|
658 |
</port>
|
659 |
</output>
|
660 |
</layer>
|
661 |
+
<layer id="49" name="Reshape_43115" type="Reshape" version="opset1">
|
662 |
<data special_zero="false" />
|
663 |
<input>
|
664 |
<port id="0" precision="FP16">
|
|
|
677 |
</port>
|
678 |
</output>
|
679 |
</layer>
|
680 |
+
<layer id="50" name="Constant_31293/fq_weights_1/convert" type="Convert" version="opset1">
|
681 |
<data destination_type="f32" />
|
682 |
<input>
|
683 |
<port id="0" precision="FP16">
|
|
|
692 |
</port>
|
693 |
</output>
|
694 |
</layer>
|
695 |
+
<layer id="51" name="Multiply_31276" type="MatMul" version="opset1">
|
696 |
<data transpose_a="false" transpose_b="true" />
|
697 |
<input>
|
698 |
<port id="0" precision="FP32">
|
|
|
713 |
</port>
|
714 |
</output>
|
715 |
</layer>
|
716 |
+
<layer id="52" name="Constant_31392" type="Const" version="opset1">
|
717 |
<data element_type="f32" shape="1, 1, 1280" offset="67980362" size="5120" />
|
718 |
<output>
|
719 |
<port id="0" precision="FP32">
|
|
|
745 |
</port>
|
746 |
</output>
|
747 |
</layer>
|
748 |
+
<layer id="54" name="Constant_31709" type="Const" version="opset1">
|
749 |
<data element_type="i64" shape="4" offset="67985482" size="32" />
|
750 |
<output>
|
751 |
<port id="0" precision="I64">
|
|
|
813 |
</port>
|
814 |
</output>
|
815 |
</layer>
|
816 |
+
<layer id="59" name="Convert_43096" type="Convert" version="opset1">
|
817 |
<data destination_type="f16" />
|
818 |
<input>
|
819 |
<port id="0" precision="U4">
|
|
|
840 |
</port>
|
841 |
</output>
|
842 |
</layer>
|
843 |
+
<layer id="61" name="Convert_43098" type="Convert" version="opset1">
|
844 |
<data destination_type="f16" />
|
845 |
<input>
|
846 |
<port id="0" precision="U4">
|
|
|
911 |
</port>
|
912 |
</output>
|
913 |
</layer>
|
914 |
+
<layer id="65" name="Constant_43103" type="Const" version="opset1">
|
915 |
<data element_type="i64" shape="2" offset="67980346" size="16" />
|
916 |
<output>
|
917 |
<port id="0" precision="I64">
|
|
|
919 |
</port>
|
920 |
</output>
|
921 |
</layer>
|
922 |
+
<layer id="66" name="Reshape_43104" type="Reshape" version="opset1">
|
923 |
<data special_zero="false" />
|
924 |
<input>
|
925 |
<port id="0" precision="FP16">
|
|
|
974 |
</port>
|
975 |
</output>
|
976 |
</layer>
|
977 |
+
<layer id="69" name="Constant_31710" type="Const" version="opset1">
|
978 |
<data element_type="i64" shape="4" offset="67985482" size="32" />
|
979 |
<output>
|
980 |
<port id="0" precision="I64">
|
|
|
1063 |
<port id="0" precision="I32" />
|
1064 |
</output>
|
1065 |
</layer>
|
1066 |
+
<layer id="75" name="17" type="Const" version="opset1">
|
1067 |
<data element_type="f32" shape="" offset="68836730" size="4" />
|
1068 |
<output>
|
1069 |
+
<port id="0" precision="FP32" names="17" />
|
1070 |
</output>
|
1071 |
</layer>
|
1072 |
+
<layer id="76" name="Constant_31648" type="Const" version="opset1">
|
1073 |
<data element_type="i64" shape="1" offset="67118890" size="8" />
|
1074 |
<output>
|
1075 |
<port id="0" precision="I64">
|
|
|
1077 |
</port>
|
1078 |
</output>
|
1079 |
</layer>
|
1080 |
+
<layer id="77" name="Reshape_31649" type="Reshape" version="opset1">
|
1081 |
<data special_zero="false" />
|
1082 |
<input>
|
1083 |
<port id="0" precision="I64" />
|
|
|
1107 |
<port id="2" precision="I64" names="62,64" />
|
1108 |
</output>
|
1109 |
</layer>
|
1110 |
+
<layer id="80" name="Constant_24084" type="Const" version="opset1">
|
1111 |
<data element_type="i32" shape="" offset="66544094" size="4" />
|
1112 |
<output>
|
1113 |
<port id="0" precision="I32" />
|
1114 |
</output>
|
1115 |
</layer>
|
1116 |
+
<layer id="81" name="Unsqueeze_24085" type="Unsqueeze" version="opset1">
|
1117 |
<input>
|
1118 |
<port id="0" precision="I64" />
|
1119 |
<port id="1" precision="I32" />
|
|
|
1155 |
</port>
|
1156 |
</output>
|
1157 |
</layer>
|
1158 |
+
<layer id="84" name="ShapeOf_31655" type="ShapeOf" version="opset3">
|
1159 |
<data output_type="i32" />
|
1160 |
<input>
|
1161 |
<port id="0" precision="FP32">
|
|
|
1169 |
</port>
|
1170 |
</output>
|
1171 |
</layer>
|
1172 |
+
<layer id="85" name="Constant_31656" type="Const" version="opset1">
|
1173 |
<data element_type="i64" shape="" offset="67118890" size="8" />
|
1174 |
<output>
|
1175 |
<port id="0" precision="I64" />
|
1176 |
</output>
|
1177 |
</layer>
|
1178 |
+
<layer id="86" name="Constant_31657" type="Const" version="opset1">
|
1179 |
<data element_type="i64" shape="" offset="67118882" size="8" />
|
1180 |
<output>
|
1181 |
<port id="0" precision="I64" />
|
1182 |
</output>
|
1183 |
</layer>
|
1184 |
+
<layer id="87" name="Gather_31658" type="Gather" version="opset8">
|
1185 |
<data batch_dims="0" />
|
1186 |
<input>
|
1187 |
<port id="0" precision="I32">
|
|
|
1233 |
<port id="0" precision="I32" />
|
1234 |
</output>
|
1235 |
</layer>
|
1236 |
+
<layer id="92" name="Convert_31661" type="Convert" version="opset1">
|
1237 |
<data destination_type="i32" />
|
1238 |
<input>
|
1239 |
<port id="0" precision="I64" />
|
|
|
1375 |
</port>
|
1376 |
</output>
|
1377 |
</layer>
|
1378 |
+
<layer id="104" name="Constant_24187" type="Const" version="opset1">
|
1379 |
<data element_type="i64" shape="2" offset="68836734" size="16" />
|
1380 |
<output>
|
1381 |
<port id="0" precision="I64" names="70">
|
|
|
1492 |
</port>
|
1493 |
</output>
|
1494 |
</layer>
|
1495 |
+
<layer id="112" name="Constant_31639" type="Const" version="opset1">
|
1496 |
<data element_type="i64" shape="1" offset="67118882" size="8" />
|
1497 |
<output>
|
1498 |
<port id="0" precision="I64">
|
|
|
1500 |
</port>
|
1501 |
</output>
|
1502 |
</layer>
|
1503 |
+
<layer id="113" name="Constant_31640" type="Const" version="opset1">
|
1504 |
<data element_type="i64" shape="" offset="67118882" size="8" />
|
1505 |
<output>
|
1506 |
<port id="0" precision="I64" />
|
1507 |
</output>
|
1508 |
</layer>
|
1509 |
+
<layer id="114" name="Gather_31641" type="Gather" version="opset8">
|
1510 |
<data batch_dims="0" />
|
1511 |
<input>
|
1512 |
<port id="0" precision="I64">
|
|
|
1523 |
</port>
|
1524 |
</output>
|
1525 |
</layer>
|
1526 |
+
<layer id="115" name="Constant_30625" type="Const" version="opset1">
|
1527 |
<data element_type="i64" shape="1" offset="67118890" size="8" />
|
1528 |
<output>
|
1529 |
<port id="0" precision="I64">
|
|
|
1531 |
</port>
|
1532 |
</output>
|
1533 |
</layer>
|
1534 |
+
<layer id="116" name="Constant_30627" type="Const" version="opset1">
|
1535 |
<data element_type="i64" shape="1" offset="67118890" size="8" />
|
1536 |
<output>
|
1537 |
<port id="0" precision="I64">
|
|
|
1539 |
</port>
|
1540 |
</output>
|
1541 |
</layer>
|
1542 |
+
<layer id="117" name="Constant_30629" type="Const" version="opset1">
|
1543 |
<data element_type="i64" shape="1" offset="67118890" size="8" />
|
1544 |
<output>
|
1545 |
<port id="0" precision="I64">
|
|
|
1591 |
</port>
|
1592 |
</output>
|
1593 |
</layer>
|
1594 |
+
<layer id="120" name="Constant_24621" type="Const" version="opset1">
|
1595 |
<data element_type="i64" shape="1" offset="67118882" size="8" />
|
1596 |
<output>
|
1597 |
<port id="0" precision="I64">
|
|
|
1599 |
</port>
|
1600 |
</output>
|
1601 |
</layer>
|
1602 |
+
<layer id="121" name="ShapeOf_31670" type="ShapeOf" version="opset3">
|
1603 |
<data output_type="i64" />
|
1604 |
<input>
|
1605 |
<port id="0" precision="FP32">
|
|
|
1614 |
</port>
|
1615 |
</output>
|
1616 |
</layer>
|
1617 |
+
<layer id="122" name="Constant_31671" type="Const" version="opset1">
|
1618 |
<data element_type="i64" shape="1" offset="67118890" size="8" />
|
1619 |
<output>
|
1620 |
<port id="0" precision="I64">
|
|
|
1622 |
</port>
|
1623 |
</output>
|
1624 |
</layer>
|
1625 |
+
<layer id="123" name="Constant_31672" type="Const" version="opset1">
|
1626 |
<data element_type="i64" shape="" offset="67118882" size="8" />
|
1627 |
<output>
|
1628 |
<port id="0" precision="I64" />
|
1629 |
</output>
|
1630 |
</layer>
|
1631 |
+
<layer id="124" name="Gather_31673" type="Gather" version="opset8">
|
1632 |
<data batch_dims="0" />
|
1633 |
<input>
|
1634 |
<port id="0" precision="I64">
|
|
|
1645 |
</port>
|
1646 |
</output>
|
1647 |
</layer>
|
1648 |
+
<layer id="125" name="Constant_24624" type="Const" version="opset1">
|
1649 |
<data element_type="i64" shape="1" offset="67118890" size="8" />
|
1650 |
<output>
|
1651 |
<port id="0" precision="I64">
|
|
|
1745 |
</port>
|
1746 |
</output>
|
1747 |
</layer>
|
1748 |
+
<layer id="131" name="Convert_43085" type="Convert" version="opset1">
|
1749 |
<data destination_type="f16" />
|
1750 |
<input>
|
1751 |
<port id="0" precision="U4">
|
|
|
1772 |
</port>
|
1773 |
</output>
|
1774 |
</layer>
|
1775 |
+
<layer id="133" name="Convert_43087" type="Convert" version="opset1">
|
1776 |
<data destination_type="f16" />
|
1777 |
<input>
|
1778 |
<port id="0" precision="U4">
|
|
|
1843 |
</port>
|
1844 |
</output>
|
1845 |
</layer>
|
1846 |
+
<layer id="137" name="Constant_43092" type="Const" version="opset1">
|
1847 |
<data element_type="i64" shape="2" offset="67980346" size="16" />
|
1848 |
<output>
|
1849 |
<port id="0" precision="I64">
|
|
|
1851 |
</port>
|
1852 |
</output>
|
1853 |
</layer>
|
1854 |
+
<layer id="138" name="Reshape_43093" type="Reshape" version="opset1">
|
1855 |
<data special_zero="false" />
|
1856 |
<input>
|
1857 |
<port id="0" precision="FP16">
|
|
|
1906 |
</port>
|
1907 |
</output>
|
1908 |
</layer>
|
1909 |
+
<layer id="141" name="Constant_31393" type="Const" version="opset1">
|
1910 |
<data element_type="f32" shape="1, 1, 1280" offset="69687958" size="5120" />
|
1911 |
<output>
|
1912 |
<port id="0" precision="FP32">
|
|
|
1938 |
</port>
|
1939 |
</output>
|
1940 |
</layer>
|
1941 |
+
<layer id="143" name="Constant_31711" type="Const" version="opset1">
|
1942 |
<data element_type="i64" shape="4" offset="67985482" size="32" />
|
1943 |
<output>
|
1944 |
<port id="0" precision="I64">
|
|
|
2050 |
</port>
|
2051 |
</output>
|
2052 |
</layer>
|
2053 |
+
<layer id="150" name="Constant_31712" type="Const" version="opset1">
|
2054 |
<data element_type="i64" shape="3" offset="69693078" size="24" />
|
2055 |
<output>
|
2056 |
<port id="0" precision="I64">
|
|
|
2089 |
</port>
|
2090 |
</output>
|
2091 |
</layer>
|
2092 |
+
<layer id="153" name="Convert_43118" type="Convert" version="opset1">
|
2093 |
<data destination_type="f16" />
|
2094 |
<input>
|
2095 |
<port id="0" precision="U4">
|
|
|
2116 |
</port>
|
2117 |
</output>
|
2118 |
</layer>
|
2119 |
+
<layer id="155" name="Convert_43120" type="Convert" version="opset1">
|
2120 |
<data destination_type="f16" />
|
2121 |
<input>
|
2122 |
<port id="0" precision="U4">
|
|
|
2187 |
</port>
|
2188 |
</output>
|
2189 |
</layer>
|
2190 |
+
<layer id="159" name="Constant_43125" type="Const" version="opset1">
|
2191 |
<data element_type="i64" shape="2" offset="67980346" size="16" />
|
2192 |
<output>
|
2193 |
<port id="0" precision="I64">
|
|
|
2195 |
</port>
|
2196 |
</output>
|
2197 |
</layer>
|
2198 |
+
<layer id="160" name="Reshape_43126" type="Reshape" version="opset1">
|
2199 |
<data special_zero="false" />
|
2200 |
<input>
|
2201 |
<port id="0" precision="FP16">
|
|
|
2250 |
</port>
|
2251 |
</output>
|
2252 |
</layer>
|
2253 |
+
<layer id="163" name="Constant_31394" type="Const" version="opset1">
|
2254 |
<data element_type="f32" shape="1, 1, 1280" offset="70544302" size="5120" />
|
2255 |
<output>
|
2256 |
<port id="0" precision="FP32">
|
|
|
2332 |
</port>
|
2333 |
</output>
|
2334 |
</layer>
|
2335 |
+
<layer id="168" name="Constant_31395" type="Const" version="opset1">
|
2336 |
<data element_type="f32" shape="1, 1, 1280" offset="70549422" size="5120" />
|
2337 |
<output>
|
2338 |
<port id="0" precision="FP32">
|
|
|
2364 |
</port>
|
2365 |
</output>
|
2366 |
</layer>
|
2367 |
+
<layer id="170" name="Constant_31396" type="Const" version="opset1">
|
2368 |
<data element_type="f32" shape="1, 1, 1280" offset="70554542" size="5120" />
|
2369 |
<output>
|
2370 |
<port id="0" precision="FP32">
|
|
|
2396 |
</port>
|
2397 |
</output>
|
2398 |
</layer>
|
2399 |
+
<layer id="172" name="Constant_31296" type="Const" version="opset1">
|
2400 |
<data element_type="u4" shape="1280, 10, 128" offset="70559662" size="819200" />
|
2401 |
<output>
|
2402 |
<port id="0" precision="U4">
|
|
|
2406 |
</port>
|
2407 |
</output>
|
2408 |
</layer>
|
2409 |
+
<layer id="173" name="Convert_43129" type="Convert" version="opset1">
|
2410 |
<data destination_type="f16" />
|
2411 |
<input>
|
2412 |
<port id="0" precision="U4">
|
|
|
2423 |
</port>
|
2424 |
</output>
|
2425 |
</layer>
|
2426 |
+
<layer id="174" name="Constant_31296/zero_point" type="Const" version="opset1">
|
2427 |
<data element_type="u4" shape="1280, 10, 1" offset="71378862" size="6400" />
|
2428 |
<output>
|
2429 |
<port id="0" precision="U4">
|
|
|
2433 |
</port>
|
2434 |
</output>
|
2435 |
</layer>
|
2436 |
+
<layer id="175" name="Convert_43131" type="Convert" version="opset1">
|
2437 |
<data destination_type="f16" />
|
2438 |
<input>
|
2439 |
<port id="0" precision="U4">
|
|
|
2450 |
</port>
|
2451 |
</output>
|
2452 |
</layer>
|
2453 |
+
<layer id="176" name="Constant_31296/zero_point/subtract" type="Subtract" version="opset1">
|
2454 |
<data auto_broadcast="numpy" />
|
2455 |
<input>
|
2456 |
<port id="0" precision="FP16">
|
|
|
2472 |
</port>
|
2473 |
</output>
|
2474 |
</layer>
|
2475 |
+
<layer id="177" name="Constant_31296/scale" type="Const" version="opset1">
|
2476 |
<data element_type="f16" shape="1280, 10, 1" offset="71385262" size="25600" />
|
2477 |
<output>
|
2478 |
<port id="0" precision="FP16">
|
|
|
2482 |
</port>
|
2483 |
</output>
|
2484 |
</layer>
|
2485 |
+
<layer id="178" name="Constant_31296/fq_weights_1" type="Multiply" version="opset1">
|
2486 |
<data auto_broadcast="numpy" />
|
2487 |
<input>
|
2488 |
<port id="0" precision="FP16">
|
|
|
2504 |
</port>
|
2505 |
</output>
|
2506 |
</layer>
|
2507 |
+
<layer id="179" name="Constant_43136" type="Const" version="opset1">
|
2508 |
<data element_type="i64" shape="2" offset="67980346" size="16" />
|
2509 |
<output>
|
2510 |
<port id="0" precision="I64">
|
|
|
2512 |
</port>
|
2513 |
</output>
|
2514 |
</layer>
|
2515 |
+
<layer id="180" name="Reshape_43137" type="Reshape" version="opset1">
|
2516 |
<data special_zero="false" />
|
2517 |
<input>
|
2518 |
<port id="0" precision="FP16">
|
|
|
2531 |
</port>
|
2532 |
</output>
|
2533 |
</layer>
|
2534 |
+
<layer id="181" name="Constant_31296/fq_weights_1/convert" type="Convert" version="opset1">
|
2535 |
<data destination_type="f32" />
|
2536 |
<input>
|
2537 |
<port id="0" precision="FP16">
|
|
|
2546 |
</port>
|
2547 |
</output>
|
2548 |
</layer>
|
2549 |
+
<layer id="182" name="Multiply_31280" type="MatMul" version="opset1">
|
2550 |
<data transpose_a="false" transpose_b="true" />
|
2551 |
<input>
|
2552 |
<port id="0" precision="FP32">
|
|
|
2567 |
</port>
|
2568 |
</output>
|
2569 |
</layer>
|
2570 |
+
<layer id="183" name="Constant_31397" type="Const" version="opset1">
|
2571 |
<data element_type="f32" shape="1, 1, 1280" offset="71410862" size="5120" />
|
2572 |
<output>
|
2573 |
<port id="0" precision="FP32">
|
|
|
2599 |
</port>
|
2600 |
</output>
|
2601 |
</layer>
|
2602 |
+
<layer id="185" name="Constant_31713" type="Const" version="opset1">
|
2603 |
<data element_type="i64" shape="4" offset="67985482" size="32" />
|
2604 |
<output>
|
2605 |
<port id="0" precision="I64">
|
|
|
2667 |
</port>
|
2668 |
</output>
|
2669 |
</layer>
|
2670 |
+
<layer id="190" name="Convert_43074" type="Convert" version="opset1">
|
2671 |
<data destination_type="f16" />
|
2672 |
<input>
|
2673 |
<port id="0" precision="U4">
|
|
|
2694 |
</port>
|
2695 |
</output>
|
2696 |
</layer>
|
2697 |
+
<layer id="192" name="Convert_43076" type="Convert" version="opset1">
|
2698 |
<data destination_type="f16" />
|
2699 |
<input>
|
2700 |
<port id="0" precision="U4">
|
|
|
2765 |
</port>
|
2766 |
</output>
|
2767 |
</layer>
|
2768 |
+
<layer id="196" name="Constant_43081" type="Const" version="opset1">
|
2769 |
<data element_type="i64" shape="2" offset="67980346" size="16" />
|
2770 |
<output>
|
2771 |
<port id="0" precision="I64">
|
|
|
2773 |
</port>
|
2774 |
</output>
|
2775 |
</layer>
|
2776 |
+
<layer id="197" name="Reshape_43082" type="Reshape" version="opset1">
|
2777 |
<data special_zero="false" />
|
2778 |
<input>
|
2779 |
<port id="0" precision="FP16">
|
|
|
2828 |
</port>
|
2829 |
</output>
|
2830 |
</layer>
|
2831 |
+
<layer id="200" name="Constant_24369" type="Const" version="opset1">
|
2832 |
<data element_type="i64" shape="1" offset="72267182" size="8" />
|
2833 |
<output>
|
2834 |
<port id="0" precision="I64">
|
|
|
2836 |
</port>
|
2837 |
</output>
|
2838 |
</layer>
|
2839 |
+
<layer id="201" name="Constant_24370" type="Const" version="opset1">
|
2840 |
<data element_type="i64" shape="1" offset="72267190" size="8" />
|
2841 |
<output>
|
2842 |
<port id="0" precision="I64">
|
|
|
2844 |
</port>
|
2845 |
</output>
|
2846 |
</layer>
|
2847 |
+
<layer id="202" name="Constant_24371" type="Const" version="opset1">
|
2848 |
<data element_type="i64" shape="1" offset="72267198" size="8" />
|
2849 |
<output>
|
2850 |
<port id="0" precision="I64">
|
|
|
2852 |
</port>
|
2853 |
</output>
|
2854 |
</layer>
|
2855 |
+
<layer id="203" name="__module.model.model.decoder.layers.0.self_attn/prim::ListConstruct_1" type="Concat" version="opset1">
|
2856 |
<data axis="0" />
|
2857 |
<input>
|
2858 |
<port id="0" precision="I64">
|
|
|
2978 |
</port>
|
2979 |
</output>
|
2980 |
</layer>
|
2981 |
+
<layer id="210" name="Convert_43063" type="Convert" version="opset1">
|
2982 |
<data destination_type="f16" />
|
2983 |
<input>
|
2984 |
<port id="0" precision="U4">
|
|
|
3005 |
</port>
|
3006 |
</output>
|
3007 |
</layer>
|
3008 |
+
<layer id="212" name="Convert_43065" type="Convert" version="opset1">
|
3009 |
<data destination_type="f16" />
|
3010 |
<input>
|
3011 |
<port id="0" precision="U4">
|
|
|
3076 |
</port>
|
3077 |
</output>
|
3078 |
</layer>
|
3079 |
+
<layer id="216" name="Constant_43070" type="Const" version="opset1">
|
3080 |
<data element_type="i64" shape="2" offset="67980346" size="16" />
|
3081 |
<output>
|
3082 |
<port id="0" precision="I64">
|
|
|
3084 |
</port>
|
3085 |
</output>
|
3086 |
</layer>
|
3087 |
+
<layer id="217" name="Reshape_43071" type="Reshape" version="opset1">
|
3088 |
<data special_zero="false" />
|
3089 |
<input>
|
3090 |
<port id="0" precision="FP16">
|
|
|
3139 |
</port>
|
3140 |
</output>
|
3141 |
</layer>
|
3142 |
+
<layer id="220" name="Constant_31398" type="Const" version="opset1">
|
3143 |
<data element_type="f32" shape="1, 1, 1280" offset="73118406" size="5120" />
|
3144 |
<output>
|
3145 |
<port id="0" precision="FP32">
|
|
|
3275 |
</port>
|
3276 |
</output>
|
3277 |
</layer>
|
3278 |
+
<layer id="228" name="Constant_31714" type="Const" version="opset1">
|
3279 |
<data element_type="i64" shape="3" offset="73123526" size="24" />
|
3280 |
<output>
|
3281 |
<port id="0" precision="I64">
|
|
|
3314 |
</port>
|
3315 |
</output>
|
3316 |
</layer>
|
3317 |
+
<layer id="231" name="Convert_43140" type="Convert" version="opset1">
|
3318 |
<data destination_type="f16" />
|
3319 |
<input>
|
3320 |
<port id="0" precision="U4">
|
|
|
3341 |
</port>
|
3342 |
</output>
|
3343 |
</layer>
|
3344 |
+
<layer id="233" name="Convert_43142" type="Convert" version="opset1">
|
3345 |
<data destination_type="f16" />
|
3346 |
<input>
|
3347 |
<port id="0" precision="U4">
|
|
|
3412 |
</port>
|
3413 |
</output>
|
3414 |
</layer>
|
3415 |
+
<layer id="237" name="Constant_43147" type="Const" version="opset1">
|
3416 |
<data element_type="i64" shape="2" offset="67980346" size="16" />
|
3417 |
<output>
|
3418 |
<port id="0" precision="I64">
|
|
|
3420 |
</port>
|
3421 |
</output>
|
3422 |
</layer>
|
3423 |
+
<layer id="238" name="Reshape_43148" type="Reshape" version="opset1">
|
3424 |
<data special_zero="false" />
|
3425 |
<input>
|
3426 |
<port id="0" precision="FP16">
|
|
|
3475 |
</port>
|
3476 |
</output>
|
3477 |
</layer>
|
3478 |
+
<layer id="241" name="Constant_31399" type="Const" version="opset1">
|
3479 |
<data element_type="f32" shape="1, 1, 1280" offset="73974750" size="5120" />
|
3480 |
<output>
|
3481 |
<port id="0" precision="FP32">
|
|
|
3557 |
</port>
|
3558 |
</output>
|
3559 |
</layer>
|
3560 |
+
<layer id="246" name="Constant_31400" type="Const" version="opset1">
|
3561 |
<data element_type="f32" shape="1, 1, 1280" offset="73979870" size="5120" />
|
3562 |
<output>
|
3563 |
<port id="0" precision="FP32">
|
|
|
3589 |
</port>
|
3590 |
</output>
|
3591 |
</layer>
|
3592 |
+
<layer id="248" name="Constant_31401" type="Const" version="opset1">
|
3593 |
<data element_type="f32" shape="1, 1, 1280" offset="73984990" size="5120" />
|
3594 |
<output>
|
3595 |
<port id="0" precision="FP32">
|
|
|
3631 |
</port>
|
3632 |
</output>
|
3633 |
</layer>
|
3634 |
+
<layer id="251" name="Convert_42997" type="Convert" version="opset1">
|
3635 |
<data destination_type="f16" />
|
3636 |
<input>
|
3637 |
<port id="0" precision="U4">
|
|
|
3658 |
</port>
|
3659 |
</output>
|
3660 |
</layer>
|
3661 |
+
<layer id="253" name="Convert_42999" type="Convert" version="opset1">
|
3662 |
<data destination_type="f16" />
|
3663 |
<input>
|
3664 |
<port id="0" precision="U4">
|
|
|
3729 |
</port>
|
3730 |
</output>
|
3731 |
</layer>
|
3732 |
+
<layer id="257" name="Constant_43004" type="Const" version="opset1">
|
3733 |
<data element_type="i64" shape="2" offset="77394910" size="16" />
|
3734 |
<output>
|
3735 |
<port id="0" precision="I64">
|
|
|
3737 |
</port>
|
3738 |
</output>
|
3739 |
</layer>
|
3740 |
+
<layer id="258" name="Reshape_43005" type="Reshape" version="opset1">
|
3741 |
<data special_zero="false" />
|
3742 |
<input>
|
3743 |
<port id="0" precision="FP16">
|
|
|
3792 |
</port>
|
3793 |
</output>
|
3794 |
</layer>
|
3795 |
+
<layer id="261" name="Constant_31402" type="Const" version="opset1">
|
3796 |
<data element_type="f32" shape="1, 1, 5120" offset="77394926" size="20480" />
|
3797 |
<output>
|
3798 |
<port id="0" precision="FP32">
|
|
|
3851 |
</port>
|
3852 |
</output>
|
3853 |
</layer>
|
3854 |
+
<layer id="265" name="Convert_43008" type="Convert" version="opset1">
|
3855 |
<data destination_type="f16" />
|
3856 |
<input>
|
3857 |
<port id="0" precision="U4">
|
|
|
3878 |
</port>
|
3879 |
</output>
|
3880 |
</layer>
|
3881 |
+
<layer id="267" name="Convert_43010" type="Convert" version="opset1">
|
3882 |
<data destination_type="f16" />
|
3883 |
<input>
|
3884 |
<port id="0" precision="U4">
|
|
|
3949 |
</port>
|
3950 |
</output>
|
3951 |
</layer>
|
3952 |
+
<layer id="271" name="Constant_43015" type="Const" version="opset1">
|
3953 |
<data element_type="i64" shape="2" offset="80820206" size="16" />
|
3954 |
<output>
|
3955 |
<port id="0" precision="I64">
|
|
|
3957 |
</port>
|
3958 |
</output>
|
3959 |
</layer>
|
3960 |
+
<layer id="272" name="Reshape_43016" type="Reshape" version="opset1">
|
3961 |
<data special_zero="false" />
|
3962 |
<input>
|
3963 |
<port id="0" precision="FP16">
|
|
|
4012 |
</port>
|
4013 |
</output>
|
4014 |
</layer>
|
4015 |
+
<layer id="275" name="Constant_31403" type="Const" version="opset1">
|
4016 |
<data element_type="f32" shape="1, 1, 1280" offset="80820222" size="5120" />
|
4017 |
<output>
|
4018 |
<port id="0" precision="FP32">
|
|
|
4094 |
</port>
|
4095 |
</output>
|
4096 |
</layer>
|
4097 |
+
<layer id="280" name="Constant_31404" type="Const" version="opset1">
|
4098 |
<data element_type="f32" shape="1, 1, 1280" offset="80825342" size="5120" />
|
4099 |
<output>
|
4100 |
<port id="0" precision="FP32">
|
|
|
4126 |
</port>
|
4127 |
</output>
|
4128 |
</layer>
|
4129 |
+
<layer id="282" name="Constant_31405" type="Const" version="opset1">
|
4130 |
<data element_type="f32" shape="1, 1, 1280" offset="80830462" size="5120" />
|
4131 |
<output>
|
4132 |
<port id="0" precision="FP32">
|
|
|
4158 |
</port>
|
4159 |
</output>
|
4160 |
</layer>
|
4161 |
+
<layer id="284" name="Constant_31299" type="Const" version="opset1">
|
4162 |
<data element_type="u4" shape="1280, 10, 128" offset="80835582" size="819200" />
|
4163 |
<output>
|
4164 |
<port id="0" precision="U4">
|
|
|
4168 |
</port>
|
4169 |
</output>
|
4170 |
</layer>
|
4171 |
+
<layer id="285" name="Convert_43173" type="Convert" version="opset1">
|
4172 |
<data destination_type="f16" />
|
4173 |
<input>
|
4174 |
<port id="0" precision="U4">
|
|
|
4185 |
</port>
|
4186 |
</output>
|
4187 |
</layer>
|
4188 |
+
<layer id="286" name="Constant_31299/zero_point" type="Const" version="opset1">
|
4189 |
<data element_type="u4" shape="1280, 10, 1" offset="81654782" size="6400" />
|
4190 |
<output>
|
4191 |
<port id="0" precision="U4">
|
|
|
4195 |
</port>
|
4196 |
</output>
|
4197 |
</layer>
|
4198 |
+
<layer id="287" name="Convert_43175" type="Convert" version="opset1">
|
4199 |
<data destination_type="f16" />
|
4200 |
<input>
|
4201 |
<port id="0" precision="U4">
|
|
|
4212 |
</port>
|
4213 |
</output>
|
4214 |
</layer>
|
4215 |
+
<layer id="288" name="Constant_31299/zero_point/subtract" type="Subtract" version="opset1">
|
4216 |
<data auto_broadcast="numpy" />
|
4217 |
<input>
|
4218 |
<port id="0" precision="FP16">
|
|
|
4234 |
</port>
|
4235 |
</output>
|
4236 |
</layer>
|
4237 |
+
<layer id="289" name="Constant_31299/scale" type="Const" version="opset1">
|
4238 |
<data element_type="f16" shape="1280, 10, 1" offset="81661182" size="25600" />
|
4239 |
<output>
|
4240 |
<port id="0" precision="FP16">
|
|
|
4244 |
</port>
|
4245 |
</output>
|
4246 |
</layer>
|
4247 |
+
<layer id="290" name="Constant_31299/fq_weights_1" type="Multiply" version="opset1">
|
4248 |
<data auto_broadcast="numpy" />
|
4249 |
<input>
|
4250 |
<port id="0" precision="FP16">
|
|
|
4266 |
</port>
|
4267 |
</output>
|
4268 |
</layer>
|
4269 |
+
<layer id="291" name="Constant_43180" type="Const" version="opset1">
|
4270 |
<data element_type="i64" shape="2" offset="67980346" size="16" />
|
4271 |
<output>
|
4272 |
<port id="0" precision="I64">
|
|
|
4274 |
</port>
|
4275 |
</output>
|
4276 |
</layer>
|
4277 |
+
<layer id="292" name="Reshape_43181" type="Reshape" version="opset1">
|
4278 |
<data special_zero="false" />
|
4279 |
<input>
|
4280 |
<port id="0" precision="FP16">
|
|
|
4293 |
</port>
|
4294 |
</output>
|
4295 |
</layer>
|
4296 |
+
<layer id="293" name="Constant_31299/fq_weights_1/convert" type="Convert" version="opset1">
|
4297 |
<data destination_type="f32" />
|
4298 |
<input>
|
4299 |
<port id="0" precision="FP16">
|
|
|
4308 |
</port>
|
4309 |
</output>
|
4310 |
</layer>
|
4311 |
+
<layer id="294" name="Multiply_31284" type="MatMul" version="opset1">
|
4312 |
<data transpose_a="false" transpose_b="true" />
|
4313 |
<input>
|
4314 |
<port id="0" precision="FP32">
|
|
|
4329 |
</port>
|
4330 |
</output>
|
4331 |
</layer>
|
4332 |
+
<layer id="295" name="Constant_31406" type="Const" version="opset1">
|
4333 |
<data element_type="f32" shape="1, 1, 1280" offset="81686782" size="5120" />
|
4334 |
<output>
|
4335 |
<port id="0" precision="FP32">
|
|
|
4361 |
</port>
|
4362 |
</output>
|
4363 |
</layer>
|
4364 |
+
<layer id="297" name="Constant_31715" type="Const" version="opset1">
|
4365 |
<data element_type="i64" shape="4" offset="67985482" size="32" />
|
4366 |
<output>
|
4367 |
<port id="0" precision="I64">
|
|
|
4429 |
</port>
|
4430 |
</output>
|
4431 |
</layer>
|
4432 |
+
<layer id="302" name="Convert_43162" type="Convert" version="opset1">
|
4433 |
<data destination_type="f16" />
|
4434 |
<input>
|
4435 |
<port id="0" precision="U4">
|
|
|
4456 |
</port>
|
4457 |
</output>
|
4458 |
</layer>
|
4459 |
+
<layer id="304" name="Convert_43164" type="Convert" version="opset1">
|
4460 |
<data destination_type="f16" />
|
4461 |
<input>
|
4462 |
<port id="0" precision="U4">
|
|
|
4527 |
</port>
|
4528 |
</output>
|
4529 |
</layer>
|
4530 |
+
<layer id="308" name="Constant_43169" type="Const" version="opset1">
|
4531 |
<data element_type="i64" shape="2" offset="67980346" size="16" />
|
4532 |
<output>
|
4533 |
<port id="0" precision="I64">
|
|
|
4535 |
</port>
|
4536 |
</output>
|
4537 |
</layer>
|
4538 |
+
<layer id="309" name="Reshape_43170" type="Reshape" version="opset1">
|
4539 |
<data special_zero="false" />
|
4540 |
<input>
|
4541 |
<port id="0" precision="FP16">
|
|
|
4590 |
</port>
|
4591 |
</output>
|
4592 |
</layer>
|
4593 |
+
<layer id="312" name="Constant_31716" type="Const" version="opset1">
|
4594 |
<data element_type="i64" shape="4" offset="67985482" size="32" />
|
4595 |
<output>
|
4596 |
<port id="0" precision="I64">
|
|
|
4727 |
</port>
|
4728 |
</output>
|
4729 |
</layer>
|
4730 |
+
<layer id="320" name="Convert_43151" type="Convert" version="opset1">
|
4731 |
<data destination_type="f16" />
|
4732 |
<input>
|
4733 |
<port id="0" precision="U4">
|
|
|
4754 |
</port>
|
4755 |
</output>
|
4756 |
</layer>
|
4757 |
+
<layer id="322" name="Convert_43153" type="Convert" version="opset1">
|
4758 |
<data destination_type="f16" />
|
4759 |
<input>
|
4760 |
<port id="0" precision="U4">
|
|
|
4825 |
</port>
|
4826 |
</output>
|
4827 |
</layer>
|
4828 |
+
<layer id="326" name="Constant_43158" type="Const" version="opset1">
|
4829 |
<data element_type="i64" shape="2" offset="67980346" size="16" />
|
4830 |
<output>
|
4831 |
<port id="0" precision="I64">
|
|
|
4833 |
</port>
|
4834 |
</output>
|
4835 |
</layer>
|
4836 |
+
<layer id="327" name="Reshape_43159" type="Reshape" version="opset1">
|
4837 |
<data special_zero="false" />
|
4838 |
<input>
|
4839 |
<port id="0" precision="FP16">
|
|
|
4888 |
</port>
|
4889 |
</output>
|
4890 |
</layer>
|
4891 |
+
<layer id="330" name="Constant_31407" type="Const" version="opset1">
|
4892 |
<data element_type="f32" shape="1, 1, 1280" offset="83394302" size="5120" />
|
4893 |
<output>
|
4894 |
<port id="0" precision="FP32">
|
|
|
4920 |
</port>
|
4921 |
</output>
|
4922 |
</layer>
|
4923 |
+
<layer id="332" name="Constant_31717" type="Const" version="opset1">
|
4924 |
<data element_type="i64" shape="4" offset="67985482" size="32" />
|
4925 |
<output>
|
4926 |
<port id="0" precision="I64">
|
|
|
5032 |
</port>
|
5033 |
</output>
|
5034 |
</layer>
|
5035 |
+
<layer id="339" name="Constant_31718" type="Const" version="opset1">
|
5036 |
<data element_type="i64" shape="3" offset="69693078" size="24" />
|
5037 |
<output>
|
5038 |
<port id="0" precision="I64">
|
|
|
5071 |
</port>
|
5072 |
</output>
|
5073 |
</layer>
|
5074 |
+
<layer id="342" name="Convert_43184" type="Convert" version="opset1">
|
5075 |
<data destination_type="f16" />
|
5076 |
<input>
|
5077 |
<port id="0" precision="U4">
|
|
|
5098 |
</port>
|
5099 |
</output>
|
5100 |
</layer>
|
5101 |
+
<layer id="344" name="Convert_43186" type="Convert" version="opset1">
|
5102 |
<data destination_type="f16" />
|
5103 |
<input>
|
5104 |
<port id="0" precision="U4">
|
|
|
5169 |
</port>
|
5170 |
</output>
|
5171 |
</layer>
|
5172 |
+
<layer id="348" name="Constant_43191" type="Const" version="opset1">
|
5173 |
<data element_type="i64" shape="2" offset="67980346" size="16" />
|
5174 |
<output>
|
5175 |
<port id="0" precision="I64">
|
|
|
5177 |
</port>
|
5178 |
</output>
|
5179 |
</layer>
|
5180 |
+
<layer id="349" name="Reshape_43192" type="Reshape" version="opset1">
|
5181 |
<data special_zero="false" />
|
5182 |
<input>
|
5183 |
<port id="0" precision="FP16">
|
|
|
5232 |
</port>
|
5233 |
</output>
|
5234 |
</layer>
|
5235 |
+
<layer id="352" name="Constant_31408" type="Const" version="opset1">
|
5236 |
<data element_type="f32" shape="1, 1, 1280" offset="84250622" size="5120" />
|
5237 |
<output>
|
5238 |
<port id="0" precision="FP32">
|
|
|
5314 |
</port>
|
5315 |
</output>
|
5316 |
</layer>
|
5317 |
+
<layer id="357" name="Constant_31409" type="Const" version="opset1">
|
5318 |
<data element_type="f32" shape="1, 1, 1280" offset="84255742" size="5120" />
|
5319 |
<output>
|
5320 |
<port id="0" precision="FP32">
|
|
|
5346 |
</port>
|
5347 |
</output>
|
5348 |
</layer>
|
5349 |
+
<layer id="359" name="Constant_31410" type="Const" version="opset1">
|
5350 |
<data element_type="f32" shape="1, 1, 1280" offset="84260862" size="5120" />
|
5351 |
<output>
|
5352 |
<port id="0" precision="FP32">
|
|
|
5378 |
</port>
|
5379 |
</output>
|
5380 |
</layer>
|
5381 |
+
<layer id="361" name="Constant_31302" type="Const" version="opset1">
|
5382 |
<data element_type="u4" shape="1280, 10, 128" offset="84265982" size="819200" />
|
5383 |
<output>
|
5384 |
<port id="0" precision="U4">
|
|
|
5388 |
</port>
|
5389 |
</output>
|
5390 |
</layer>
|
5391 |
+
<layer id="362" name="Convert_43195" type="Convert" version="opset1">
|
5392 |
<data destination_type="f16" />
|
5393 |
<input>
|
5394 |
<port id="0" precision="U4">
|
|
|
5405 |
</port>
|
5406 |
</output>
|
5407 |
</layer>
|
5408 |
+
<layer id="363" name="Constant_31302/zero_point" type="Const" version="opset1">
|
5409 |
<data element_type="u4" shape="1280, 10, 1" offset="85085182" size="6400" />
|
5410 |
<output>
|
5411 |
<port id="0" precision="U4">
|
|
|
5415 |
</port>
|
5416 |
</output>
|
5417 |
</layer>
|
5418 |
+
<layer id="364" name="Convert_43197" type="Convert" version="opset1">
|
5419 |
<data destination_type="f16" />
|
5420 |
<input>
|
5421 |
<port id="0" precision="U4">
|
|
|
5432 |
</port>
|
5433 |
</output>
|
5434 |
</layer>
|
5435 |
+
<layer id="365" name="Constant_31302/zero_point/subtract" type="Subtract" version="opset1">
|
5436 |
<data auto_broadcast="numpy" />
|
5437 |
<input>
|
5438 |
<port id="0" precision="FP16">
|
|
|
5454 |
</port>
|
5455 |
</output>
|
5456 |
</layer>
|
5457 |
+
<layer id="366" name="Constant_31302/scale" type="Const" version="opset1">
|
5458 |
<data element_type="f16" shape="1280, 10, 1" offset="85091582" size="25600" />
|
5459 |
<output>
|
5460 |
<port id="0" precision="FP16">
|
|
|
5464 |
</port>
|
5465 |
</output>
|
5466 |
</layer>
|
5467 |
+
<layer id="367" name="Constant_31302/fq_weights_1" type="Multiply" version="opset1">
|
5468 |
<data auto_broadcast="numpy" />
|
5469 |
<input>
|
5470 |
<port id="0" precision="FP16">
|
|
|
5486 |
</port>
|
5487 |
</output>
|
5488 |
</layer>
|
5489 |
+
<layer id="368" name="Constant_43202" type="Const" version="opset1">
|
5490 |
<data element_type="i64" shape="2" offset="67980346" size="16" />
|
5491 |
<output>
|
5492 |
<port id="0" precision="I64">
|
|
|
5494 |
</port>
|
5495 |
</output>
|
5496 |
</layer>
|
5497 |
+
<layer id="369" name="Reshape_43203" type="Reshape" version="opset1">
|
5498 |
<data special_zero="false" />
|
5499 |
<input>
|
5500 |
<port id="0" precision="FP16">
|
|
|
5513 |
</port>
|
5514 |
</output>
|
5515 |
</layer>
|
5516 |
+
<layer id="370" name="Constant_31302/fq_weights_1/convert" type="Convert" version="opset1">
|
5517 |
<data destination_type="f32" />
|
5518 |
<input>
|
5519 |
<port id="0" precision="FP16">
|
|
|
5528 |
</port>
|
5529 |
</output>
|
5530 |
</layer>
|
5531 |
+
<layer id="371" name="Multiply_31288" type="MatMul" version="opset1">
|
5532 |
<data transpose_a="false" transpose_b="true" />
|
5533 |
<input>
|
5534 |
<port id="0" precision="FP32">
|
|
|
5549 |
</port>
|
5550 |
</output>
|
5551 |
</layer>
|
5552 |
+
<layer id="372" name="Constant_31411" type="Const" version="opset1">
|
5553 |
<data element_type="f32" shape="1, 1, 1280" offset="85117182" size="5120" />
|
5554 |
<output>
|
5555 |
<port id="0" precision="FP32">
|
|
|
5581 |
</port>
|
5582 |
</output>
|
5583 |
</layer>
|
5584 |
+
<layer id="374" name="Constant_31719" type="Const" version="opset1">
|
5585 |
<data element_type="i64" shape="4" offset="67985482" size="32" />
|
5586 |
<output>
|
5587 |
<port id="0" precision="I64">
|
|
|
5649 |
</port>
|
5650 |
</output>
|
5651 |
</layer>
|
5652 |
+
<layer id="379" name="Convert_43052" type="Convert" version="opset1">
|
5653 |
<data destination_type="f16" />
|
5654 |
<input>
|
5655 |
<port id="0" precision="U4">
|
|
|
5676 |
</port>
|
5677 |
</output>
|
5678 |
</layer>
|
5679 |
+
<layer id="381" name="Convert_43054" type="Convert" version="opset1">
|
5680 |
<data destination_type="f16" />
|
5681 |
<input>
|
5682 |
<port id="0" precision="U4">
|
|
|
5747 |
</port>
|
5748 |
</output>
|
5749 |
</layer>
|
5750 |
+
<layer id="385" name="Constant_43059" type="Const" version="opset1">
|
5751 |
<data element_type="i64" shape="2" offset="67980346" size="16" />
|
5752 |
<output>
|
5753 |
<port id="0" precision="I64">
|
|
|
5755 |
</port>
|
5756 |
</output>
|
5757 |
</layer>
|
5758 |
+
<layer id="386" name="Reshape_43060" type="Reshape" version="opset1">
|
5759 |
<data special_zero="false" />
|
5760 |
<input>
|
5761 |
<port id="0" precision="FP16">
|
|
|
5914 |
</port>
|
5915 |
</output>
|
5916 |
</layer>
|
5917 |
+
<layer id="395" name="Convert_43041" type="Convert" version="opset1">
|
5918 |
<data destination_type="f16" />
|
5919 |
<input>
|
5920 |
<port id="0" precision="U4">
|
|
|
5941 |
</port>
|
5942 |
</output>
|
5943 |
</layer>
|
5944 |
+
<layer id="397" name="Convert_43043" type="Convert" version="opset1">
|
5945 |
<data destination_type="f16" />
|
5946 |
<input>
|
5947 |
<port id="0" precision="U4">
|
|
|
6012 |
</port>
|
6013 |
</output>
|
6014 |
</layer>
|
6015 |
+
<layer id="401" name="Constant_43048" type="Const" version="opset1">
|
6016 |
<data element_type="i64" shape="2" offset="67980346" size="16" />
|
6017 |
<output>
|
6018 |
<port id="0" precision="I64">
|
|
|
6020 |
</port>
|
6021 |
</output>
|
6022 |
</layer>
|
6023 |
+
<layer id="402" name="Reshape_43049" type="Reshape" version="opset1">
|
6024 |
<data special_zero="false" />
|
6025 |
<input>
|
6026 |
<port id="0" precision="FP16">
|
|
|
6075 |
</port>
|
6076 |
</output>
|
6077 |
</layer>
|
6078 |
+
<layer id="405" name="Constant_31412" type="Const" version="opset1">
|
6079 |
<data element_type="f32" shape="1, 1, 1280" offset="86824702" size="5120" />
|
6080 |
<output>
|
6081 |
<port id="0" precision="FP32">
|
|
|
6211 |
</port>
|
6212 |
</output>
|
6213 |
</layer>
|
6214 |
+
<layer id="413" name="Constant_31720" type="Const" version="opset1">
|
6215 |
<data element_type="i64" shape="3" offset="73123526" size="24" />
|
6216 |
<output>
|
6217 |
<port id="0" precision="I64">
|
|
|
6250 |
</port>
|
6251 |
</output>
|
6252 |
</layer>
|
6253 |
+
<layer id="416" name="Convert_43206" type="Convert" version="opset1">
|
6254 |
<data destination_type="f16" />
|
6255 |
<input>
|
6256 |
<port id="0" precision="U4">
|
|
|
6277 |
</port>
|
6278 |
</output>
|
6279 |
</layer>
|
6280 |
+
<layer id="418" name="Convert_43208" type="Convert" version="opset1">
|
6281 |
<data destination_type="f16" />
|
6282 |
<input>
|
6283 |
<port id="0" precision="U4">
|
|
|
6348 |
</port>
|
6349 |
</output>
|
6350 |
</layer>
|
6351 |
+
<layer id="422" name="Constant_43213" type="Const" version="opset1">
|
6352 |
<data element_type="i64" shape="2" offset="67980346" size="16" />
|
6353 |
<output>
|
6354 |
<port id="0" precision="I64">
|
|
|
6356 |
</port>
|
6357 |
</output>
|
6358 |
</layer>
|
6359 |
+
<layer id="423" name="Reshape_43214" type="Reshape" version="opset1">
|
6360 |
<data special_zero="false" />
|
6361 |
<input>
|
6362 |
<port id="0" precision="FP16">
|
|
|
6411 |
</port>
|
6412 |
</output>
|
6413 |
</layer>
|
6414 |
+
<layer id="426" name="Constant_31413" type="Const" version="opset1">
|
6415 |
<data element_type="f32" shape="1, 1, 1280" offset="87681022" size="5120" />
|
6416 |
<output>
|
6417 |
<port id="0" precision="FP32">
|
|
|
6493 |
</port>
|
6494 |
</output>
|
6495 |
</layer>
|
6496 |
+
<layer id="431" name="Constant_31414" type="Const" version="opset1">
|
6497 |
<data element_type="f32" shape="1, 1, 1280" offset="87686142" size="5120" />
|
6498 |
<output>
|
6499 |
<port id="0" precision="FP32">
|
|
|
6525 |
</port>
|
6526 |
</output>
|
6527 |
</layer>
|
6528 |
+
<layer id="433" name="Constant_31415" type="Const" version="opset1">
|
6529 |
<data element_type="f32" shape="1, 1, 1280" offset="87691262" size="5120" />
|
6530 |
<output>
|
6531 |
<port id="0" precision="FP32">
|
|
|
6567 |
</port>
|
6568 |
</output>
|
6569 |
</layer>
|
6570 |
+
<layer id="436" name="Convert_43019" type="Convert" version="opset1">
|
6571 |
<data destination_type="f16" />
|
6572 |
<input>
|
6573 |
<port id="0" precision="U4">
|
|
|
6594 |
</port>
|
6595 |
</output>
|
6596 |
</layer>
|
6597 |
+
<layer id="438" name="Convert_43021" type="Convert" version="opset1">
|
6598 |
<data destination_type="f16" />
|
6599 |
<input>
|
6600 |
<port id="0" precision="U4">
|
|
|
6665 |
</port>
|
6666 |
</output>
|
6667 |
</layer>
|
6668 |
+
<layer id="442" name="Constant_43026" type="Const" version="opset1">
|
6669 |
<data element_type="i64" shape="2" offset="77394910" size="16" />
|
6670 |
<output>
|
6671 |
<port id="0" precision="I64">
|
|
|
6673 |
</port>
|
6674 |
</output>
|
6675 |
</layer>
|
6676 |
+
<layer id="443" name="Reshape_43027" type="Reshape" version="opset1">
|
6677 |
<data special_zero="false" />
|
6678 |
<input>
|
6679 |
<port id="0" precision="FP16">
|
|
|
6728 |
</port>
|
6729 |
</output>
|
6730 |
</layer>
|
6731 |
+
<layer id="446" name="Constant_31416" type="Const" version="opset1">
|
6732 |
<data element_type="f32" shape="1, 1, 5120" offset="91101182" size="20480" />
|
6733 |
<output>
|
6734 |
<port id="0" precision="FP32">
|
|
|
6787 |
</port>
|
6788 |
</output>
|
6789 |
</layer>
|
6790 |
+
<layer id="450" name="Convert_43030" type="Convert" version="opset1">
|
6791 |
<data destination_type="f16" />
|
6792 |
<input>
|
6793 |
<port id="0" precision="U4">
|
|
|
6814 |
</port>
|
6815 |
</output>
|
6816 |
</layer>
|
6817 |
+
<layer id="452" name="Convert_43032" type="Convert" version="opset1">
|
6818 |
<data destination_type="f16" />
|
6819 |
<input>
|
6820 |
<port id="0" precision="U4">
|
|
|
6885 |
</port>
|
6886 |
</output>
|
6887 |
</layer>
|
6888 |
+
<layer id="456" name="Constant_43037" type="Const" version="opset1">
|
6889 |
<data element_type="i64" shape="2" offset="80820206" size="16" />
|
6890 |
<output>
|
6891 |
<port id="0" precision="I64">
|
|
|
6893 |
</port>
|
6894 |
</output>
|
6895 |
</layer>
|
6896 |
+
<layer id="457" name="Reshape_43038" type="Reshape" version="opset1">
|
6897 |
<data special_zero="false" />
|
6898 |
<input>
|
6899 |
<port id="0" precision="FP16">
|
|
|
6948 |
</port>
|
6949 |
</output>
|
6950 |
</layer>
|
6951 |
+
<layer id="460" name="Constant_31417" type="Const" version="opset1">
|
6952 |
<data element_type="f32" shape="1, 1, 1280" offset="94526462" size="5120" />
|
6953 |
<output>
|
6954 |
<port id="0" precision="FP32">
|
|
|
7030 |
</port>
|
7031 |
</output>
|
7032 |
</layer>
|
7033 |
+
<layer id="465" name="Constant_31418" type="Const" version="opset1">
|
7034 |
<data element_type="f32" shape="1, 1, 1280" offset="94531582" size="5120" />
|
7035 |
<output>
|
7036 |
<port id="0" precision="FP32">
|
|
|
7062 |
</port>
|
7063 |
</output>
|
7064 |
</layer>
|
7065 |
+
<layer id="467" name="Constant_31419" type="Const" version="opset1">
|
7066 |
<data element_type="f32" shape="1, 1, 1280" offset="94536702" size="5120" />
|
7067 |
<output>
|
7068 |
<port id="0" precision="FP32">
|
|
|
7115 |
</port>
|
7116 |
</output>
|
7117 |
</layer>
|
7118 |
+
<layer id="470" name="Result_26206" type="Result" version="opset1">
|
7119 |
<input>
|
7120 |
<port id="0" precision="FP32">
|
7121 |
<dim>-1</dim>
|
|
|
7632 |
<edge from-layer="469" from-port="2" to-layer="470" to-port="0" />
|
7633 |
</edges>
|
7634 |
<rt_info>
|
7635 |
+
<Runtime_version value="2024.5.0-17285-ea5c1dcfdf9-releases/2024/5" />
|
7636 |
<conversion_parameters>
|
7637 |
<framework value="pytorch" />
|
7638 |
<is_python_object value="True" />
|
|
|
7640 |
<nncf>
|
7641 |
<friendly_names_were_updated value="True" />
|
7642 |
<weight_compression>
|
7643 |
+
<advanced_parameters value="{'statistics_path': None, 'awq_params': {'subset_size': 32, 'percent_to_apply': 0.002, 'alpha_min': 0.0, 'alpha_max': 1.0, 'steps': 100}, 'scale_estimation_params': {'subset_size': 64, 'initial_steps': 5, 'scale_steps': 5, 'weight_penalty': -1.0}, 'gptq_params': {'damp_percent': 0.1, 'block_size': 128, 'subset_size': 128}, 'lora_correction_params': {'adapter_rank': 8, 'num_iterations': 3, 'apply_regularization': True, 'subset_size': 128, 'use_int8_adapters': True}}" />
|
7644 |
<all_layers value="False" />
|
7645 |
<awq value="False" />
|
7646 |
+
<backup_mode value="int8_asym" />
|
7647 |
<gptq value="False" />
|
7648 |
<group_size value="128" />
|
7649 |
<ignored_scope value="[]" />
|
|
|
7655 |
</weight_compression>
|
7656 |
</nncf>
|
7657 |
<optimum>
|
7658 |
+
<optimum_intel_version value="1.21.0.dev0+d357376" />
|
7659 |
+
<optimum_version value="1.23.3" />
|
7660 |
+
<pytorch_version value="2.5.1" />
|
7661 |
+
<transformers_version value="4.46.3" />
|
7662 |
</optimum>
|
7663 |
</rt_info>
|
7664 |
</net>
|
openvino_detokenizer.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 528306
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1c95aa7a4b53ecb3768d2a6608aa9e419059aef1c75b9b99e6b1c56328281c18
|
3 |
size 528306
|
openvino_detokenizer.xml
CHANGED
@@ -1,16 +1,16 @@
|
|
1 |
<?xml version="1.0"?>
|
2 |
<net name="detokenizer" version="11">
|
3 |
<layers>
|
4 |
-
<layer id="0" name="
|
5 |
<data shape="?,?" element_type="i64" />
|
6 |
<output>
|
7 |
-
<port id="0" precision="I64" names="
|
8 |
<dim>-1</dim>
|
9 |
<dim>-1</dim>
|
10 |
</port>
|
11 |
</output>
|
12 |
</layer>
|
13 |
-
<layer id="1" name="
|
14 |
<data destination_type="i32" />
|
15 |
<input>
|
16 |
<port id="0" precision="I64">
|
@@ -25,7 +25,7 @@
|
|
25 |
</port>
|
26 |
</output>
|
27 |
</layer>
|
28 |
-
<layer id="2" name="
|
29 |
<data element_type="u8" shape="528257" offset="0" size="528257" />
|
30 |
<output>
|
31 |
<port id="0" precision="U8">
|
@@ -33,7 +33,7 @@
|
|
33 |
</port>
|
34 |
</output>
|
35 |
</layer>
|
36 |
-
<layer id="3" name="
|
37 |
<data mode="begins_ends" />
|
38 |
<input>
|
39 |
<port id="0" precision="U8">
|
@@ -52,7 +52,7 @@
|
|
52 |
</port>
|
53 |
</output>
|
54 |
</layer>
|
55 |
-
<layer id="4" name="
|
56 |
<data skip_tokens="50257, 50258, 50259, 50260, 50261, 50262, 50263, 50264, 50265, 50266, 50267, 50268, 50269, 50270, 50271, 50272, 50273, 50274, 50275, 50276, 50277, 50278, 50279, 50280, 50281, 50282, 50283, 50284, 50285, 50286, 50287, 50288, 50289, 50290, 50291, 50292, 50293, 50294, 50295, 50296, 50297, 50298, 50299, 50300, 50301, 50302, 50303, 50304, 50305, 50306, 50307, 50308, 50309, 50310, 50311, 50312, 50313, 50314, 50315, 50316, 50317, 50318, 50319, 50320, 50321, 50322, 50323, 50324, 50325, 50326, 50327, 50328, 50329, 50330, 50331, 50332, 50333, 50334, 50335, 50336, 50337, 50338, 50339, 50340, 50341, 50342, 50343, 50344, 50345, 50346, 50347, 50348, 50349, 50350, 50351, 50352, 50353, 50354, 50355, 50356, 50357, 50358, 50359, 50360, 50361, 50362, 50363, 50364" />
|
57 |
<input>
|
58 |
<port id="0" precision="I32">
|
@@ -87,7 +87,7 @@
|
|
87 |
</port>
|
88 |
</output>
|
89 |
</layer>
|
90 |
-
<layer id="5" name="
|
91 |
<input>
|
92 |
<port id="0" precision="I32">
|
93 |
<dim>-1</dim>
|
@@ -111,7 +111,7 @@
|
|
111 |
</port>
|
112 |
</output>
|
113 |
</layer>
|
114 |
-
<layer id="6" name="
|
115 |
<data element_type="u8" shape="47" offset="528257" size="47" />
|
116 |
<output>
|
117 |
<port id="0" precision="U8">
|
@@ -119,7 +119,7 @@
|
|
119 |
</port>
|
120 |
</output>
|
121 |
</layer>
|
122 |
-
<layer id="7" name="
|
123 |
<data element_type="u8" shape="2" offset="528304" size="2" />
|
124 |
<output>
|
125 |
<port id="0" precision="U8">
|
@@ -127,7 +127,7 @@
|
|
127 |
</port>
|
128 |
</output>
|
129 |
</layer>
|
130 |
-
<layer id="8" name="
|
131 |
<data global_replace="true" />
|
132 |
<input>
|
133 |
<port id="0" precision="I32">
|
@@ -158,7 +158,7 @@
|
|
158 |
</port>
|
159 |
</output>
|
160 |
</layer>
|
161 |
-
<layer id="9" name="
|
162 |
<data mode="begins_ends" />
|
163 |
<input>
|
164 |
<port id="0" precision="I32">
|
@@ -177,7 +177,7 @@
|
|
177 |
</port>
|
178 |
</output>
|
179 |
</layer>
|
180 |
-
<layer id="10" name="
|
181 |
<input>
|
182 |
<port id="0" precision="STRING">
|
183 |
<dim>-1</dim>
|
@@ -207,9 +207,29 @@
|
|
207 |
<edge from-layer="9" from-port="3" to-layer="10" to-port="0" />
|
208 |
</edges>
|
209 |
<rt_info>
|
|
|
|
|
|
|
210 |
<bos_token_id value="50257" />
|
|
|
|
|
211 |
<eos_token_id value="50257" />
|
|
|
|
|
|
|
|
|
212 |
<original_tokenizer_class value="<class 'transformers.models.whisper.tokenization_whisper_fast.WhisperTokenizerFast'>" />
|
213 |
<pad_token_id value="50257" />
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
214 |
</rt_info>
|
215 |
</net>
|
|
|
1 |
<?xml version="1.0"?>
|
2 |
<net name="detokenizer" version="11">
|
3 |
<layers>
|
4 |
+
<layer id="0" name="Parameter_32760" type="Parameter" version="opset1">
|
5 |
<data shape="?,?" element_type="i64" />
|
6 |
<output>
|
7 |
+
<port id="0" precision="I64" names="Parameter_32760">
|
8 |
<dim>-1</dim>
|
9 |
<dim>-1</dim>
|
10 |
</port>
|
11 |
</output>
|
12 |
</layer>
|
13 |
+
<layer id="1" name="Convert_32776" type="Convert" version="opset1">
|
14 |
<data destination_type="i32" />
|
15 |
<input>
|
16 |
<port id="0" precision="I64">
|
|
|
25 |
</port>
|
26 |
</output>
|
27 |
</layer>
|
28 |
+
<layer id="2" name="Constant_32721" type="Const" version="opset1">
|
29 |
<data element_type="u8" shape="528257" offset="0" size="528257" />
|
30 |
<output>
|
31 |
<port id="0" precision="U8">
|
|
|
33 |
</port>
|
34 |
</output>
|
35 |
</layer>
|
36 |
+
<layer id="3" name="StringTensorUnpack_32722" type="StringTensorUnpack" version="extension">
|
37 |
<data mode="begins_ends" />
|
38 |
<input>
|
39 |
<port id="0" precision="U8">
|
|
|
52 |
</port>
|
53 |
</output>
|
54 |
</layer>
|
55 |
+
<layer id="4" name="VocabDecoder_32761" type="VocabDecoder" version="extension">
|
56 |
<data skip_tokens="50257, 50258, 50259, 50260, 50261, 50262, 50263, 50264, 50265, 50266, 50267, 50268, 50269, 50270, 50271, 50272, 50273, 50274, 50275, 50276, 50277, 50278, 50279, 50280, 50281, 50282, 50283, 50284, 50285, 50286, 50287, 50288, 50289, 50290, 50291, 50292, 50293, 50294, 50295, 50296, 50297, 50298, 50299, 50300, 50301, 50302, 50303, 50304, 50305, 50306, 50307, 50308, 50309, 50310, 50311, 50312, 50313, 50314, 50315, 50316, 50317, 50318, 50319, 50320, 50321, 50322, 50323, 50324, 50325, 50326, 50327, 50328, 50329, 50330, 50331, 50332, 50333, 50334, 50335, 50336, 50337, 50338, 50339, 50340, 50341, 50342, 50343, 50344, 50345, 50346, 50347, 50348, 50349, 50350, 50351, 50352, 50353, 50354, 50355, 50356, 50357, 50358, 50359, 50360, 50361, 50362, 50363, 50364" />
|
57 |
<input>
|
58 |
<port id="0" precision="I32">
|
|
|
87 |
</port>
|
88 |
</output>
|
89 |
</layer>
|
90 |
+
<layer id="5" name="FuzeRagged_32762" type="FuzeRagged" version="extension">
|
91 |
<input>
|
92 |
<port id="0" precision="I32">
|
93 |
<dim>-1</dim>
|
|
|
111 |
</port>
|
112 |
</output>
|
113 |
</layer>
|
114 |
+
<layer id="6" name="Constant_32764" type="Const" version="opset1">
|
115 |
<data element_type="u8" shape="47" offset="528257" size="47" />
|
116 |
<output>
|
117 |
<port id="0" precision="U8">
|
|
|
119 |
</port>
|
120 |
</output>
|
121 |
</layer>
|
122 |
+
<layer id="7" name="Constant_32766" type="Const" version="opset1">
|
123 |
<data element_type="u8" shape="2" offset="528304" size="2" />
|
124 |
<output>
|
125 |
<port id="0" precision="U8">
|
|
|
127 |
</port>
|
128 |
</output>
|
129 |
</layer>
|
130 |
+
<layer id="8" name="RegexNormalization_32767" type="RegexNormalization" version="extension">
|
131 |
<data global_replace="true" />
|
132 |
<input>
|
133 |
<port id="0" precision="I32">
|
|
|
158 |
</port>
|
159 |
</output>
|
160 |
</layer>
|
161 |
+
<layer id="9" name="StringTensorPack_32768" type="StringTensorPack" version="extension">
|
162 |
<data mode="begins_ends" />
|
163 |
<input>
|
164 |
<port id="0" precision="I32">
|
|
|
177 |
</port>
|
178 |
</output>
|
179 |
</layer>
|
180 |
+
<layer id="10" name="Result_32769" type="Result" version="opset1">
|
181 |
<input>
|
182 |
<port id="0" precision="STRING">
|
183 |
<dim>-1</dim>
|
|
|
207 |
<edge from-layer="9" from-port="3" to-layer="10" to-port="0" />
|
208 |
</edges>
|
209 |
<rt_info>
|
210 |
+
<add_attention_mask value="True" />
|
211 |
+
<add_prefix_space />
|
212 |
+
<add_special_tokens value="True" />
|
213 |
<bos_token_id value="50257" />
|
214 |
+
<clean_up_tokenization_spaces />
|
215 |
+
<detokenizer_input_type value="i64" />
|
216 |
<eos_token_id value="50257" />
|
217 |
+
<handle_special_tokens_with_re />
|
218 |
+
<number_of_inputs value="1" />
|
219 |
+
<openvino_tokenizers_version value="2024.5.0.0" />
|
220 |
+
<openvino_version value="2024.5.0" />
|
221 |
<original_tokenizer_class value="<class 'transformers.models.whisper.tokenization_whisper_fast.WhisperTokenizerFast'>" />
|
222 |
<pad_token_id value="50257" />
|
223 |
+
<sentencepiece_version value="0.2.0" />
|
224 |
+
<skip_special_tokens value="True" />
|
225 |
+
<streaming_detokenizer value="False" />
|
226 |
+
<tiktoken_version value="0.8.0" />
|
227 |
+
<tokenizer_output_type value="i64" />
|
228 |
+
<tokenizers_version value="0.20.3" />
|
229 |
+
<transformers_version value="4.46.3" />
|
230 |
+
<use_max_padding value="False" />
|
231 |
+
<use_sentencepiece_backend value="False" />
|
232 |
+
<utf8_replace_mode />
|
233 |
+
<with_detokenizer value="True" />
|
234 |
</rt_info>
|
235 |
</net>
|
openvino_encoder_model.xml
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
openvino_tokenizer.xml
CHANGED
@@ -1,27 +1,27 @@
|
|
1 |
<?xml version="1.0"?>
|
2 |
<net name="tokenizer" version="11">
|
3 |
<layers>
|
4 |
-
<layer id="0" name="
|
5 |
<data shape="?" element_type="string" />
|
6 |
<output>
|
7 |
-
<port id="0" precision="STRING" names="
|
8 |
<dim>-1</dim>
|
9 |
</port>
|
10 |
</output>
|
11 |
</layer>
|
12 |
-
<layer id="1" name="
|
13 |
<data element_type="i32" shape="" offset="0" size="4" />
|
14 |
<output>
|
15 |
<port id="0" precision="I32" />
|
16 |
</output>
|
17 |
</layer>
|
18 |
-
<layer id="2" name="
|
19 |
<data element_type="i32" shape="" offset="4" size="4" />
|
20 |
<output>
|
21 |
<port id="0" precision="I32" />
|
22 |
</output>
|
23 |
</layer>
|
24 |
-
<layer id="3" name="
|
25 |
<data element_type="i32" shape="1" offset="8" size="4" />
|
26 |
<output>
|
27 |
<port id="0" precision="I32">
|
@@ -29,19 +29,19 @@
|
|
29 |
</port>
|
30 |
</output>
|
31 |
</layer>
|
32 |
-
<layer id="4" name="
|
33 |
<data element_type="i32" shape="" offset="0" size="4" />
|
34 |
<output>
|
35 |
<port id="0" precision="I32" />
|
36 |
</output>
|
37 |
</layer>
|
38 |
-
<layer id="5" name="
|
39 |
<data element_type="i32" shape="" offset="4" size="4" />
|
40 |
<output>
|
41 |
<port id="0" precision="I32" />
|
42 |
</output>
|
43 |
</layer>
|
44 |
-
<layer id="6" name="
|
45 |
<data element_type="i32" shape="1" offset="12" size="4" />
|
46 |
<output>
|
47 |
<port id="0" precision="I32">
|
@@ -49,13 +49,13 @@
|
|
49 |
</port>
|
50 |
</output>
|
51 |
</layer>
|
52 |
-
<layer id="7" name="
|
53 |
<data element_type="i64" shape="" offset="16" size="8" />
|
54 |
<output>
|
55 |
<port id="0" precision="I64" />
|
56 |
</output>
|
57 |
</layer>
|
58 |
-
<layer id="8" name="
|
59 |
<data mode="begins_ends" />
|
60 |
<input>
|
61 |
<port id="0" precision="STRING">
|
@@ -74,7 +74,7 @@
|
|
74 |
</port>
|
75 |
</output>
|
76 |
</layer>
|
77 |
-
<layer id="9" name="
|
78 |
<data output_type="i64" />
|
79 |
<input>
|
80 |
<port id="0" precision="I32">
|
@@ -87,19 +87,19 @@
|
|
87 |
</port>
|
88 |
</output>
|
89 |
</layer>
|
90 |
-
<layer id="10" name="
|
91 |
<data element_type="i64" shape="" offset="16" size="8" />
|
92 |
<output>
|
93 |
<port id="0" precision="I64" />
|
94 |
</output>
|
95 |
</layer>
|
96 |
-
<layer id="11" name="
|
97 |
<data element_type="i64" shape="" offset="16" size="8" />
|
98 |
<output>
|
99 |
<port id="0" precision="I64" />
|
100 |
</output>
|
101 |
</layer>
|
102 |
-
<layer id="12" name="
|
103 |
<data batch_dims="0" />
|
104 |
<input>
|
105 |
<port id="0" precision="I64">
|
@@ -112,13 +112,13 @@
|
|
112 |
<port id="3" precision="I64" />
|
113 |
</output>
|
114 |
</layer>
|
115 |
-
<layer id="13" name="
|
116 |
<data element_type="i64" shape="" offset="24" size="8" />
|
117 |
<output>
|
118 |
<port id="0" precision="I64" />
|
119 |
</output>
|
120 |
</layer>
|
121 |
-
<layer id="14" name="
|
122 |
<data output_type="i32" />
|
123 |
<input>
|
124 |
<port id="0" precision="I64" />
|
@@ -131,19 +131,19 @@
|
|
131 |
</port>
|
132 |
</output>
|
133 |
</layer>
|
134 |
-
<layer id="15" name="
|
135 |
<data element_type="i64" shape="" offset="24" size="8" />
|
136 |
<output>
|
137 |
<port id="0" precision="I64" />
|
138 |
</output>
|
139 |
</layer>
|
140 |
-
<layer id="16" name="
|
141 |
<data element_type="i64" shape="" offset="24" size="8" />
|
142 |
<output>
|
143 |
<port id="0" precision="I64" />
|
144 |
</output>
|
145 |
</layer>
|
146 |
-
<layer id="17" name="
|
147 |
<data auto_broadcast="numpy" />
|
148 |
<input>
|
149 |
<port id="0" precision="I64" />
|
@@ -153,13 +153,13 @@
|
|
153 |
<port id="2" precision="I64" />
|
154 |
</output>
|
155 |
</layer>
|
156 |
-
<layer id="18" name="
|
157 |
<data element_type="i64" shape="" offset="24" size="8" />
|
158 |
<output>
|
159 |
<port id="0" precision="I64" />
|
160 |
</output>
|
161 |
</layer>
|
162 |
-
<layer id="19" name="
|
163 |
<data output_type="i32" />
|
164 |
<input>
|
165 |
<port id="0" precision="I64" />
|
@@ -172,7 +172,7 @@
|
|
172 |
</port>
|
173 |
</output>
|
174 |
</layer>
|
175 |
-
<layer id="20" name="
|
176 |
<data element_type="u8" shape="26491" offset="32" size="26491" />
|
177 |
<output>
|
178 |
<port id="0" precision="U8">
|
@@ -180,7 +180,7 @@
|
|
180 |
</port>
|
181 |
</output>
|
182 |
</layer>
|
183 |
-
<layer id="21" name="
|
184 |
<input>
|
185 |
<port id="0" precision="I32">
|
186 |
<dim>-1</dim>
|
@@ -222,7 +222,7 @@
|
|
222 |
</port>
|
223 |
</output>
|
224 |
</layer>
|
225 |
-
<layer id="22" name="
|
226 |
<data element_type="u8" shape="64" offset="26523" size="64" />
|
227 |
<output>
|
228 |
<port id="0" precision="U8">
|
@@ -230,7 +230,7 @@
|
|
230 |
</port>
|
231 |
</output>
|
232 |
</layer>
|
233 |
-
<layer id="23" name="
|
234 |
<data behaviour="isolate" invert="false" max_splits="-1" />
|
235 |
<input>
|
236 |
<port id="0" precision="I32">
|
@@ -276,7 +276,7 @@
|
|
276 |
</port>
|
277 |
</output>
|
278 |
</layer>
|
279 |
-
<layer id="24" name="
|
280 |
<data element_type="u8" shape="528257" offset="26587" size="528257" />
|
281 |
<output>
|
282 |
<port id="0" precision="U8">
|
@@ -284,7 +284,7 @@
|
|
284 |
</port>
|
285 |
</output>
|
286 |
</layer>
|
287 |
-
<layer id="25" name="
|
288 |
<data mode="begins_ends" />
|
289 |
<input>
|
290 |
<port id="0" precision="U8">
|
@@ -303,7 +303,7 @@
|
|
303 |
</port>
|
304 |
</output>
|
305 |
</layer>
|
306 |
-
<layer id="26" name="
|
307 |
<data element_type="u8" shape="369958" offset="554844" size="369958" />
|
308 |
<output>
|
309 |
<port id="0" precision="U8">
|
@@ -311,7 +311,7 @@
|
|
311 |
</port>
|
312 |
</output>
|
313 |
</layer>
|
314 |
-
<layer id="27" name="
|
315 |
<data mode="begins_ends" />
|
316 |
<input>
|
317 |
<port id="0" precision="U8">
|
@@ -330,7 +330,7 @@
|
|
330 |
</port>
|
331 |
</output>
|
332 |
</layer>
|
333 |
-
<layer id="28" name="
|
334 |
<data element_type="u8" shape="336859" offset="924802" size="336859" />
|
335 |
<output>
|
336 |
<port id="0" precision="U8">
|
@@ -338,7 +338,7 @@
|
|
338 |
</port>
|
339 |
</output>
|
340 |
</layer>
|
341 |
-
<layer id="29" name="
|
342 |
<data mode="begins_ends" />
|
343 |
<input>
|
344 |
<port id="0" precision="U8">
|
@@ -357,7 +357,7 @@
|
|
357 |
</port>
|
358 |
</output>
|
359 |
</layer>
|
360 |
-
<layer id="30" name="
|
361 |
<data element_type="u8" shape="20172" offset="1261661" size="20172" />
|
362 |
<output>
|
363 |
<port id="0" precision="U8">
|
@@ -365,7 +365,7 @@
|
|
365 |
</port>
|
366 |
</output>
|
367 |
</layer>
|
368 |
-
<layer id="31" name="
|
369 |
<data mode="begins_ends" />
|
370 |
<input>
|
371 |
<port id="0" precision="U8">
|
@@ -384,7 +384,7 @@
|
|
384 |
</port>
|
385 |
</output>
|
386 |
</layer>
|
387 |
-
<layer id="32" name="
|
388 |
<data element_type="i32" shape="1609" offset="1281833" size="6436" />
|
389 |
<output>
|
390 |
<port id="0" precision="I32">
|
@@ -392,7 +392,7 @@
|
|
392 |
</port>
|
393 |
</output>
|
394 |
</layer>
|
395 |
-
<layer id="33" name="
|
396 |
<data unk_token="" fuse_unk="false" suffix_indicator="" end_suffix="" byte_fallback="false" cache_capacity="20000" />
|
397 |
<input>
|
398 |
<port id="0" precision="I32">
|
@@ -462,7 +462,7 @@
|
|
462 |
</port>
|
463 |
</output>
|
464 |
</layer>
|
465 |
-
<layer id="34" name="
|
466 |
<data auto_broadcast="numpy" />
|
467 |
<input>
|
468 |
<port id="0" precision="I32">
|
@@ -478,13 +478,13 @@
|
|
478 |
</port>
|
479 |
</output>
|
480 |
</layer>
|
481 |
-
<layer id="35" name="
|
482 |
<data element_type="i32" shape="" offset="1288269" size="4" />
|
483 |
<output>
|
484 |
<port id="0" precision="I32" />
|
485 |
</output>
|
486 |
</layer>
|
487 |
-
<layer id="36" name="
|
488 |
<data auto_broadcast="numpy" />
|
489 |
<input>
|
490 |
<port id="0" precision="I32">
|
@@ -498,7 +498,7 @@
|
|
498 |
</port>
|
499 |
</output>
|
500 |
</layer>
|
501 |
-
<layer id="37" name="
|
502 |
<data auto_broadcast="numpy" />
|
503 |
<input>
|
504 |
<port id="0" precision="I32">
|
@@ -514,19 +514,19 @@
|
|
514 |
</port>
|
515 |
</output>
|
516 |
</layer>
|
517 |
-
<layer id="38" name="
|
518 |
<data element_type="i32" shape="" offset="0" size="4" />
|
519 |
<output>
|
520 |
<port id="0" precision="I32" />
|
521 |
</output>
|
522 |
</layer>
|
523 |
-
<layer id="39" name="
|
524 |
<data element_type="i32" shape="" offset="4" size="4" />
|
525 |
<output>
|
526 |
<port id="0" precision="I32" />
|
527 |
</output>
|
528 |
</layer>
|
529 |
-
<layer id="40" name="
|
530 |
<data element_type="i32" shape="1" offset="1288273" size="4" />
|
531 |
<output>
|
532 |
<port id="0" precision="I32">
|
@@ -534,7 +534,7 @@
|
|
534 |
</port>
|
535 |
</output>
|
536 |
</layer>
|
537 |
-
<layer id="41" name="
|
538 |
<data element_type="i32" shape="4" offset="1288277" size="16" />
|
539 |
<output>
|
540 |
<port id="0" precision="I32">
|
@@ -542,7 +542,7 @@
|
|
542 |
</port>
|
543 |
</output>
|
544 |
</layer>
|
545 |
-
<layer id="42" name="
|
546 |
<input>
|
547 |
<port id="0" precision="I32" />
|
548 |
<port id="1" precision="I32" />
|
@@ -593,7 +593,7 @@
|
|
593 |
</port>
|
594 |
</output>
|
595 |
</layer>
|
596 |
-
<layer id="43" name="
|
597 |
<data auto_broadcast="numpy" />
|
598 |
<input>
|
599 |
<port id="0" precision="I32">
|
@@ -609,13 +609,13 @@
|
|
609 |
</port>
|
610 |
</output>
|
611 |
</layer>
|
612 |
-
<layer id="44" name="
|
613 |
<data element_type="i32" shape="" offset="0" size="4" />
|
614 |
<output>
|
615 |
<port id="0" precision="I32" />
|
616 |
</output>
|
617 |
</layer>
|
618 |
-
<layer id="45" name="
|
619 |
<data keep_dims="false" />
|
620 |
<input>
|
621 |
<port id="0" precision="I32">
|
@@ -627,13 +627,13 @@
|
|
627 |
<port id="2" precision="I32" />
|
628 |
</output>
|
629 |
</layer>
|
630 |
-
<layer id="46" name="
|
631 |
<data element_type="i32" shape="" offset="1288273" size="4" />
|
632 |
<output>
|
633 |
<port id="0" precision="I32" />
|
634 |
</output>
|
635 |
</layer>
|
636 |
-
<layer id="47" name="
|
637 |
<data pad_right="true" />
|
638 |
<input>
|
639 |
<port id="0" precision="I32">
|
@@ -659,7 +659,7 @@
|
|
659 |
</port>
|
660 |
</output>
|
661 |
</layer>
|
662 |
-
<layer id="48" name="
|
663 |
<data destination_type="i32" />
|
664 |
<input>
|
665 |
<port id="0" precision="BOOL">
|
@@ -674,7 +674,7 @@
|
|
674 |
</port>
|
675 |
</output>
|
676 |
</layer>
|
677 |
-
<layer id="49" name="
|
678 |
<data destination_type="i64" />
|
679 |
<input>
|
680 |
<port id="0" precision="I32">
|
@@ -689,7 +689,7 @@
|
|
689 |
</port>
|
690 |
</output>
|
691 |
</layer>
|
692 |
-
<layer id="51" name="
|
693 |
<data destination_type="i64" />
|
694 |
<input>
|
695 |
<port id="0" precision="I32">
|
@@ -704,7 +704,7 @@
|
|
704 |
</port>
|
705 |
</output>
|
706 |
</layer>
|
707 |
-
<layer id="52" name="
|
708 |
<input>
|
709 |
<port id="0" precision="I64">
|
710 |
<dim>-1</dim>
|
@@ -712,7 +712,7 @@
|
|
712 |
</port>
|
713 |
</input>
|
714 |
</layer>
|
715 |
-
<layer id="50" name="
|
716 |
<input>
|
717 |
<port id="0" precision="I64">
|
718 |
<dim>-1</dim>
|
@@ -805,9 +805,29 @@
|
|
805 |
<edge from-layer="51" from-port="1" to-layer="52" to-port="0" />
|
806 |
</edges>
|
807 |
<rt_info>
|
|
|
|
|
|
|
808 |
<bos_token_id value="50257" />
|
|
|
|
|
809 |
<eos_token_id value="50257" />
|
|
|
|
|
|
|
|
|
810 |
<original_tokenizer_class value="<class 'transformers.models.whisper.tokenization_whisper_fast.WhisperTokenizerFast'>" />
|
811 |
<pad_token_id value="50257" />
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
812 |
</rt_info>
|
813 |
</net>
|
|
|
1 |
<?xml version="1.0"?>
|
2 |
<net name="tokenizer" version="11">
|
3 |
<layers>
|
4 |
+
<layer id="0" name="Parameter_32640" type="Parameter" version="opset1">
|
5 |
<data shape="?" element_type="string" />
|
6 |
<output>
|
7 |
+
<port id="0" precision="STRING" names="Parameter_32640">
|
8 |
<dim>-1</dim>
|
9 |
</port>
|
10 |
</output>
|
11 |
</layer>
|
12 |
+
<layer id="1" name="Constant_32738" type="Const" version="opset1">
|
13 |
<data element_type="i32" shape="" offset="0" size="4" />
|
14 |
<output>
|
15 |
<port id="0" precision="I32" />
|
16 |
</output>
|
17 |
</layer>
|
18 |
+
<layer id="2" name="Constant_32739" type="Const" version="opset1">
|
19 |
<data element_type="i32" shape="" offset="4" size="4" />
|
20 |
<output>
|
21 |
<port id="0" precision="I32" />
|
22 |
</output>
|
23 |
</layer>
|
24 |
+
<layer id="3" name="Constant_32740" type="Const" version="opset1">
|
25 |
<data element_type="i32" shape="1" offset="8" size="4" />
|
26 |
<output>
|
27 |
<port id="0" precision="I32">
|
|
|
29 |
</port>
|
30 |
</output>
|
31 |
</layer>
|
32 |
+
<layer id="4" name="Constant_32741" type="Const" version="opset1">
|
33 |
<data element_type="i32" shape="" offset="0" size="4" />
|
34 |
<output>
|
35 |
<port id="0" precision="I32" />
|
36 |
</output>
|
37 |
</layer>
|
38 |
+
<layer id="5" name="Constant_32742" type="Const" version="opset1">
|
39 |
<data element_type="i32" shape="" offset="4" size="4" />
|
40 |
<output>
|
41 |
<port id="0" precision="I32" />
|
42 |
</output>
|
43 |
</layer>
|
44 |
+
<layer id="6" name="Constant_32743" type="Const" version="opset1">
|
45 |
<data element_type="i32" shape="1" offset="12" size="4" />
|
46 |
<output>
|
47 |
<port id="0" precision="I32">
|
|
|
49 |
</port>
|
50 |
</output>
|
51 |
</layer>
|
52 |
+
<layer id="7" name="Constant_32646" type="Const" version="opset1">
|
53 |
<data element_type="i64" shape="" offset="16" size="8" />
|
54 |
<output>
|
55 |
<port id="0" precision="I64" />
|
56 |
</output>
|
57 |
</layer>
|
58 |
+
<layer id="8" name="StringTensorUnpack_32641" type="StringTensorUnpack" version="extension">
|
59 |
<data mode="begins_ends" />
|
60 |
<input>
|
61 |
<port id="0" precision="STRING">
|
|
|
74 |
</port>
|
75 |
</output>
|
76 |
</layer>
|
77 |
+
<layer id="9" name="ShapeOf_32642" type="ShapeOf" version="opset3">
|
78 |
<data output_type="i64" />
|
79 |
<input>
|
80 |
<port id="0" precision="I32">
|
|
|
87 |
</port>
|
88 |
</output>
|
89 |
</layer>
|
90 |
+
<layer id="10" name="Constant_32643" type="Const" version="opset1">
|
91 |
<data element_type="i64" shape="" offset="16" size="8" />
|
92 |
<output>
|
93 |
<port id="0" precision="I64" />
|
94 |
</output>
|
95 |
</layer>
|
96 |
+
<layer id="11" name="Constant_32644" type="Const" version="opset1">
|
97 |
<data element_type="i64" shape="" offset="16" size="8" />
|
98 |
<output>
|
99 |
<port id="0" precision="I64" />
|
100 |
</output>
|
101 |
</layer>
|
102 |
+
<layer id="12" name="Gather_32645" type="Gather" version="opset8">
|
103 |
<data batch_dims="0" />
|
104 |
<input>
|
105 |
<port id="0" precision="I64">
|
|
|
112 |
<port id="3" precision="I64" />
|
113 |
</output>
|
114 |
</layer>
|
115 |
+
<layer id="13" name="Constant_32647" type="Const" version="opset1">
|
116 |
<data element_type="i64" shape="" offset="24" size="8" />
|
117 |
<output>
|
118 |
<port id="0" precision="I64" />
|
119 |
</output>
|
120 |
</layer>
|
121 |
+
<layer id="14" name="Range_32648" type="Range" version="opset4">
|
122 |
<data output_type="i32" />
|
123 |
<input>
|
124 |
<port id="0" precision="I64" />
|
|
|
131 |
</port>
|
132 |
</output>
|
133 |
</layer>
|
134 |
+
<layer id="15" name="Constant_32649" type="Const" version="opset1">
|
135 |
<data element_type="i64" shape="" offset="24" size="8" />
|
136 |
<output>
|
137 |
<port id="0" precision="I64" />
|
138 |
</output>
|
139 |
</layer>
|
140 |
+
<layer id="16" name="Constant_32650" type="Const" version="opset1">
|
141 |
<data element_type="i64" shape="" offset="24" size="8" />
|
142 |
<output>
|
143 |
<port id="0" precision="I64" />
|
144 |
</output>
|
145 |
</layer>
|
146 |
+
<layer id="17" name="Add_32651" type="Add" version="opset1">
|
147 |
<data auto_broadcast="numpy" />
|
148 |
<input>
|
149 |
<port id="0" precision="I64" />
|
|
|
153 |
<port id="2" precision="I64" />
|
154 |
</output>
|
155 |
</layer>
|
156 |
+
<layer id="18" name="Constant_32652" type="Const" version="opset1">
|
157 |
<data element_type="i64" shape="" offset="24" size="8" />
|
158 |
<output>
|
159 |
<port id="0" precision="I64" />
|
160 |
</output>
|
161 |
</layer>
|
162 |
+
<layer id="19" name="Range_32653" type="Range" version="opset4">
|
163 |
<data output_type="i32" />
|
164 |
<input>
|
165 |
<port id="0" precision="I64" />
|
|
|
172 |
</port>
|
173 |
</output>
|
174 |
</layer>
|
175 |
+
<layer id="20" name="Constant_32715" type="Const" version="opset1">
|
176 |
<data element_type="u8" shape="26491" offset="32" size="26491" />
|
177 |
<output>
|
178 |
<port id="0" precision="U8">
|
|
|
180 |
</port>
|
181 |
</output>
|
182 |
</layer>
|
183 |
+
<layer id="21" name="SpecialTokensSplit_32716" type="SpecialTokensSplit" version="extension">
|
184 |
<input>
|
185 |
<port id="0" precision="I32">
|
186 |
<dim>-1</dim>
|
|
|
222 |
</port>
|
223 |
</output>
|
224 |
</layer>
|
225 |
+
<layer id="22" name="Constant_32718" type="Const" version="opset1">
|
226 |
<data element_type="u8" shape="64" offset="26523" size="64" />
|
227 |
<output>
|
228 |
<port id="0" precision="U8">
|
|
|
230 |
</port>
|
231 |
</output>
|
232 |
</layer>
|
233 |
+
<layer id="23" name="RegexSplit_32719" type="RegexSplit" version="extension">
|
234 |
<data behaviour="isolate" invert="false" max_splits="-1" />
|
235 |
<input>
|
236 |
<port id="0" precision="I32">
|
|
|
276 |
</port>
|
277 |
</output>
|
278 |
</layer>
|
279 |
+
<layer id="24" name="Constant_32721" type="Const" version="opset1">
|
280 |
<data element_type="u8" shape="528257" offset="26587" size="528257" />
|
281 |
<output>
|
282 |
<port id="0" precision="U8">
|
|
|
284 |
</port>
|
285 |
</output>
|
286 |
</layer>
|
287 |
+
<layer id="25" name="StringTensorUnpack_32722" type="StringTensorUnpack" version="extension">
|
288 |
<data mode="begins_ends" />
|
289 |
<input>
|
290 |
<port id="0" precision="U8">
|
|
|
303 |
</port>
|
304 |
</output>
|
305 |
</layer>
|
306 |
+
<layer id="26" name="Constant_32727" type="Const" version="opset1">
|
307 |
<data element_type="u8" shape="369958" offset="554844" size="369958" />
|
308 |
<output>
|
309 |
<port id="0" precision="U8">
|
|
|
311 |
</port>
|
312 |
</output>
|
313 |
</layer>
|
314 |
+
<layer id="27" name="StringTensorUnpack_32728" type="StringTensorUnpack" version="extension">
|
315 |
<data mode="begins_ends" />
|
316 |
<input>
|
317 |
<port id="0" precision="U8">
|
|
|
330 |
</port>
|
331 |
</output>
|
332 |
</layer>
|
333 |
+
<layer id="28" name="Constant_32730" type="Const" version="opset1">
|
334 |
<data element_type="u8" shape="336859" offset="924802" size="336859" />
|
335 |
<output>
|
336 |
<port id="0" precision="U8">
|
|
|
338 |
</port>
|
339 |
</output>
|
340 |
</layer>
|
341 |
+
<layer id="29" name="StringTensorUnpack_32731" type="StringTensorUnpack" version="extension">
|
342 |
<data mode="begins_ends" />
|
343 |
<input>
|
344 |
<port id="0" precision="U8">
|
|
|
357 |
</port>
|
358 |
</output>
|
359 |
</layer>
|
360 |
+
<layer id="30" name="Constant_32724" type="Const" version="opset1">
|
361 |
<data element_type="u8" shape="20172" offset="1261661" size="20172" />
|
362 |
<output>
|
363 |
<port id="0" precision="U8">
|
|
|
365 |
</port>
|
366 |
</output>
|
367 |
</layer>
|
368 |
+
<layer id="31" name="StringTensorUnpack_32725" type="StringTensorUnpack" version="extension">
|
369 |
<data mode="begins_ends" />
|
370 |
<input>
|
371 |
<port id="0" precision="U8">
|
|
|
384 |
</port>
|
385 |
</output>
|
386 |
</layer>
|
387 |
+
<layer id="32" name="Constant_32732" type="Const" version="opset1">
|
388 |
<data element_type="i32" shape="1609" offset="1281833" size="6436" />
|
389 |
<output>
|
390 |
<port id="0" precision="I32">
|
|
|
392 |
</port>
|
393 |
</output>
|
394 |
</layer>
|
395 |
+
<layer id="33" name="BPETokenizer_32733" type="BPETokenizer" version="extension">
|
396 |
<data unk_token="" fuse_unk="false" suffix_indicator="" end_suffix="" byte_fallback="false" cache_capacity="20000" />
|
397 |
<input>
|
398 |
<port id="0" precision="I32">
|
|
|
462 |
</port>
|
463 |
</output>
|
464 |
</layer>
|
465 |
+
<layer id="34" name="Subtract_32734" type="Subtract" version="opset1">
|
466 |
<data auto_broadcast="numpy" />
|
467 |
<input>
|
468 |
<port id="0" precision="I32">
|
|
|
478 |
</port>
|
479 |
</output>
|
480 |
</layer>
|
481 |
+
<layer id="35" name="Constant_32735" type="Const" version="opset1">
|
482 |
<data element_type="i32" shape="" offset="1288269" size="4" />
|
483 |
<output>
|
484 |
<port id="0" precision="I32" />
|
485 |
</output>
|
486 |
</layer>
|
487 |
+
<layer id="36" name="Minimum_32736" type="Minimum" version="opset1">
|
488 |
<data auto_broadcast="numpy" />
|
489 |
<input>
|
490 |
<port id="0" precision="I32">
|
|
|
498 |
</port>
|
499 |
</output>
|
500 |
</layer>
|
501 |
+
<layer id="37" name="Add_32737" type="Add" version="opset1">
|
502 |
<data auto_broadcast="numpy" />
|
503 |
<input>
|
504 |
<port id="0" precision="I32">
|
|
|
514 |
</port>
|
515 |
</output>
|
516 |
</layer>
|
517 |
+
<layer id="38" name="Constant_32744" type="Const" version="opset1">
|
518 |
<data element_type="i32" shape="" offset="0" size="4" />
|
519 |
<output>
|
520 |
<port id="0" precision="I32" />
|
521 |
</output>
|
522 |
</layer>
|
523 |
+
<layer id="39" name="Constant_32745" type="Const" version="opset1">
|
524 |
<data element_type="i32" shape="" offset="4" size="4" />
|
525 |
<output>
|
526 |
<port id="0" precision="I32" />
|
527 |
</output>
|
528 |
</layer>
|
529 |
+
<layer id="40" name="Constant_32746" type="Const" version="opset1">
|
530 |
<data element_type="i32" shape="1" offset="1288273" size="4" />
|
531 |
<output>
|
532 |
<port id="0" precision="I32">
|
|
|
534 |
</port>
|
535 |
</output>
|
536 |
</layer>
|
537 |
+
<layer id="41" name="Constant_32747" type="Const" version="opset1">
|
538 |
<data element_type="i32" shape="4" offset="1288277" size="16" />
|
539 |
<output>
|
540 |
<port id="0" precision="I32">
|
|
|
542 |
</port>
|
543 |
</output>
|
544 |
</layer>
|
545 |
+
<layer id="42" name="CombineSegments_32748" type="CombineSegments" version="extension">
|
546 |
<input>
|
547 |
<port id="0" precision="I32" />
|
548 |
<port id="1" precision="I32" />
|
|
|
593 |
</port>
|
594 |
</output>
|
595 |
</layer>
|
596 |
+
<layer id="43" name="Subtract_32749" type="Subtract" version="opset1">
|
597 |
<data auto_broadcast="numpy" />
|
598 |
<input>
|
599 |
<port id="0" precision="I32">
|
|
|
609 |
</port>
|
610 |
</output>
|
611 |
</layer>
|
612 |
+
<layer id="44" name="Constant_32750" type="Const" version="opset1">
|
613 |
<data element_type="i32" shape="" offset="0" size="4" />
|
614 |
<output>
|
615 |
<port id="0" precision="I32" />
|
616 |
</output>
|
617 |
</layer>
|
618 |
+
<layer id="45" name="ReduceMax_32751" type="ReduceMax" version="opset1">
|
619 |
<data keep_dims="false" />
|
620 |
<input>
|
621 |
<port id="0" precision="I32">
|
|
|
627 |
<port id="2" precision="I32" />
|
628 |
</output>
|
629 |
</layer>
|
630 |
+
<layer id="46" name="Constant_32752" type="Const" version="opset1">
|
631 |
<data element_type="i32" shape="" offset="1288273" size="4" />
|
632 |
<output>
|
633 |
<port id="0" precision="I32" />
|
634 |
</output>
|
635 |
</layer>
|
636 |
+
<layer id="47" name="RaggedToDense_32753" type="RaggedToDense" version="extension">
|
637 |
<data pad_right="true" />
|
638 |
<input>
|
639 |
<port id="0" precision="I32">
|
|
|
659 |
</port>
|
660 |
</output>
|
661 |
</layer>
|
662 |
+
<layer id="48" name="Convert_32754" type="Convert" version="opset1">
|
663 |
<data destination_type="i32" />
|
664 |
<input>
|
665 |
<port id="0" precision="BOOL">
|
|
|
674 |
</port>
|
675 |
</output>
|
676 |
</layer>
|
677 |
+
<layer id="49" name="Convert_32754" type="Convert" version="opset1">
|
678 |
<data destination_type="i64" />
|
679 |
<input>
|
680 |
<port id="0" precision="I32">
|
|
|
689 |
</port>
|
690 |
</output>
|
691 |
</layer>
|
692 |
+
<layer id="51" name="RaggedToDense_32753.0" type="Convert" version="opset1">
|
693 |
<data destination_type="i64" />
|
694 |
<input>
|
695 |
<port id="0" precision="I32">
|
|
|
704 |
</port>
|
705 |
</output>
|
706 |
</layer>
|
707 |
+
<layer id="52" name="Result_32757" type="Result" version="opset1">
|
708 |
<input>
|
709 |
<port id="0" precision="I64">
|
710 |
<dim>-1</dim>
|
|
|
712 |
</port>
|
713 |
</input>
|
714 |
</layer>
|
715 |
+
<layer id="50" name="Result_32759" type="Result" version="opset1">
|
716 |
<input>
|
717 |
<port id="0" precision="I64">
|
718 |
<dim>-1</dim>
|
|
|
805 |
<edge from-layer="51" from-port="1" to-layer="52" to-port="0" />
|
806 |
</edges>
|
807 |
<rt_info>
|
808 |
+
<add_attention_mask value="True" />
|
809 |
+
<add_prefix_space />
|
810 |
+
<add_special_tokens value="True" />
|
811 |
<bos_token_id value="50257" />
|
812 |
+
<clean_up_tokenization_spaces />
|
813 |
+
<detokenizer_input_type value="i64" />
|
814 |
<eos_token_id value="50257" />
|
815 |
+
<handle_special_tokens_with_re />
|
816 |
+
<number_of_inputs value="1" />
|
817 |
+
<openvino_tokenizers_version value="2024.5.0.0" />
|
818 |
+
<openvino_version value="2024.5.0" />
|
819 |
<original_tokenizer_class value="<class 'transformers.models.whisper.tokenization_whisper_fast.WhisperTokenizerFast'>" />
|
820 |
<pad_token_id value="50257" />
|
821 |
+
<sentencepiece_version value="0.2.0" />
|
822 |
+
<skip_special_tokens value="True" />
|
823 |
+
<streaming_detokenizer value="False" />
|
824 |
+
<tiktoken_version value="0.8.0" />
|
825 |
+
<tokenizer_output_type value="i64" />
|
826 |
+
<tokenizers_version value="0.20.3" />
|
827 |
+
<transformers_version value="4.46.3" />
|
828 |
+
<use_max_padding value="False" />
|
829 |
+
<use_sentencepiece_backend value="False" />
|
830 |
+
<utf8_replace_mode />
|
831 |
+
<with_detokenizer value="True" />
|
832 |
</rt_info>
|
833 |
</net>
|