openvino-ci
commited on
Commit
•
41e0b7f
1
Parent(s):
aa8b7de
Upload folder using huggingface_hub
Browse files- config.json +2 -1
- generation_config.json +1 -1
- openvino_decoder_model.xml +125 -125
- openvino_detokenizer.bin +1 -1
- openvino_detokenizer.xml +32 -12
- openvino_encoder_model.xml +0 -0
- openvino_tokenizer.xml +74 -54
config.json
CHANGED
@@ -1,4 +1,5 @@
|
|
1 |
{
|
|
|
2 |
"_name_or_path": "distil-whisper/distil-large-v3",
|
3 |
"activation_dropout": 0.0,
|
4 |
"activation_function": "gelu",
|
@@ -39,7 +40,7 @@
|
|
39 |
"num_mel_bins": 128,
|
40 |
"pad_token_id": 50256,
|
41 |
"scale_embedding": false,
|
42 |
-
"transformers_version": "4.
|
43 |
"use_cache": true,
|
44 |
"use_weighted_layer_sum": false,
|
45 |
"vocab_size": 51866
|
|
|
1 |
{
|
2 |
+
"_attn_implementation_autoset": true,
|
3 |
"_name_or_path": "distil-whisper/distil-large-v3",
|
4 |
"activation_dropout": 0.0,
|
5 |
"activation_function": "gelu",
|
|
|
40 |
"num_mel_bins": 128,
|
41 |
"pad_token_id": 50256,
|
42 |
"scale_embedding": false,
|
43 |
+
"transformers_version": "4.46.3",
|
44 |
"use_cache": true,
|
45 |
"use_weighted_layer_sum": false,
|
46 |
"vocab_size": 51866
|
generation_config.json
CHANGED
@@ -303,5 +303,5 @@
|
|
303 |
"transcribe": 50360,
|
304 |
"translate": 50359
|
305 |
},
|
306 |
-
"transformers_version": "4.
|
307 |
}
|
|
|
303 |
"transcribe": 50360,
|
304 |
"translate": 50359
|
305 |
},
|
306 |
+
"transformers_version": "4.46.3"
|
307 |
}
|
openvino_decoder_model.xml
CHANGED
@@ -10,7 +10,7 @@
|
|
10 |
</port>
|
11 |
</output>
|
12 |
</layer>
|
13 |
-
<layer id="0" name="
|
14 |
<data shape="?,?,?" element_type="f32" />
|
15 |
<output>
|
16 |
<port id="0" precision="FP32" names="encoder_hidden_states">
|
@@ -47,7 +47,7 @@
|
|
47 |
</port>
|
48 |
</output>
|
49 |
</layer>
|
50 |
-
<layer id="4" name="
|
51 |
<data element_type="i64" shape="2" offset="132776960" size="16" />
|
52 |
<rt_info>
|
53 |
<attribute name="precise" version="0" />
|
@@ -151,7 +151,7 @@
|
|
151 |
<port id="0" precision="I64" names="23" />
|
152 |
</output>
|
153 |
</layer>
|
154 |
-
<layer id="12" name="
|
155 |
<data output_type="i64" />
|
156 |
<input>
|
157 |
<port id="0" precision="I64">
|
@@ -165,7 +165,7 @@
|
|
165 |
</port>
|
166 |
</output>
|
167 |
</layer>
|
168 |
-
<layer id="13" name="
|
169 |
<data element_type="i64" shape="" offset="133923868" size="8" />
|
170 |
<rt_info>
|
171 |
<attribute name="precise" version="0" />
|
@@ -174,7 +174,7 @@
|
|
174 |
<port id="0" precision="I64" />
|
175 |
</output>
|
176 |
</layer>
|
177 |
-
<layer id="14" name="
|
178 |
<data element_type="i64" shape="" offset="133923860" size="8" />
|
179 |
<rt_info>
|
180 |
<attribute name="precise" version="0" />
|
@@ -183,7 +183,7 @@
|
|
183 |
<port id="0" precision="I64" />
|
184 |
</output>
|
185 |
</layer>
|
186 |
-
<layer id="15" name="
|
187 |
<data batch_dims="0" />
|
188 |
<input>
|
189 |
<port id="0" precision="I64">
|
@@ -244,7 +244,7 @@
|
|
244 |
</port>
|
245 |
</output>
|
246 |
</layer>
|
247 |
-
<layer id="20" name="
|
248 |
<data element_type="i32" shape="" offset="132776976" size="4" />
|
249 |
<output>
|
250 |
<port id="0" precision="I32" />
|
@@ -321,7 +321,7 @@
|
|
321 |
</port>
|
322 |
</output>
|
323 |
</layer>
|
324 |
-
<layer id="25" name="
|
325 |
<data element_type="f16" shape="1, 1, 1280" offset="133923884" size="2560" />
|
326 |
<output>
|
327 |
<port id="0" precision="FP16">
|
@@ -331,7 +331,7 @@
|
|
331 |
</port>
|
332 |
</output>
|
333 |
</layer>
|
334 |
-
<layer id="26" name="
|
335 |
<data destination_type="f32" />
|
336 |
<rt_info>
|
337 |
<attribute name="decompression" version="0" />
|
@@ -373,7 +373,7 @@
|
|
373 |
</port>
|
374 |
</output>
|
375 |
</layer>
|
376 |
-
<layer id="28" name="
|
377 |
<data element_type="f16" shape="1, 1, 1280" offset="133926444" size="2560" />
|
378 |
<output>
|
379 |
<port id="0" precision="FP16">
|
@@ -383,7 +383,7 @@
|
|
383 |
</port>
|
384 |
</output>
|
385 |
</layer>
|
386 |
-
<layer id="29" name="
|
387 |
<data destination_type="f32" />
|
388 |
<rt_info>
|
389 |
<attribute name="decompression" version="0" />
|
@@ -425,7 +425,7 @@
|
|
425 |
</port>
|
426 |
</output>
|
427 |
</layer>
|
428 |
-
<layer id="31" name="
|
429 |
<data element_type="f16" shape="1280, 1280" offset="133929004" size="3276800" />
|
430 |
<output>
|
431 |
<port id="0" precision="FP16">
|
@@ -434,7 +434,7 @@
|
|
434 |
</port>
|
435 |
</output>
|
436 |
</layer>
|
437 |
-
<layer id="32" name="
|
438 |
<data destination_type="f32" />
|
439 |
<rt_info>
|
440 |
<attribute name="decompression" version="0" />
|
@@ -452,7 +452,7 @@
|
|
452 |
</port>
|
453 |
</output>
|
454 |
</layer>
|
455 |
-
<layer id="33" name="
|
456 |
<data transpose_a="false" transpose_b="true" />
|
457 |
<input>
|
458 |
<port id="0" precision="FP32">
|
@@ -473,7 +473,7 @@
|
|
473 |
</port>
|
474 |
</output>
|
475 |
</layer>
|
476 |
-
<layer id="34" name="
|
477 |
<data element_type="f16" shape="1, 1, 1280" offset="137205804" size="2560" />
|
478 |
<output>
|
479 |
<port id="0" precision="FP16">
|
@@ -483,7 +483,7 @@
|
|
483 |
</port>
|
484 |
</output>
|
485 |
</layer>
|
486 |
-
<layer id="35" name="
|
487 |
<data destination_type="f32" />
|
488 |
<rt_info>
|
489 |
<attribute name="decompression" version="0" />
|
@@ -525,7 +525,7 @@
|
|
525 |
</port>
|
526 |
</output>
|
527 |
</layer>
|
528 |
-
<layer id="37" name="
|
529 |
<data element_type="i64" shape="4" offset="137208364" size="32" />
|
530 |
<rt_info>
|
531 |
<attribute name="precise" version="0" />
|
@@ -634,7 +634,7 @@
|
|
634 |
</port>
|
635 |
</output>
|
636 |
</layer>
|
637 |
-
<layer id="44" name="
|
638 |
<data element_type="i64" shape="4" offset="137208364" size="32" />
|
639 |
<rt_info>
|
640 |
<attribute name="precise" version="0" />
|
@@ -726,13 +726,13 @@
|
|
726 |
<port id="0" precision="I32" />
|
727 |
</output>
|
728 |
</layer>
|
729 |
-
<layer id="50" name="
|
730 |
<data element_type="f32" shape="" offset="140485212" size="4" />
|
731 |
<output>
|
732 |
-
<port id="0" precision="FP32" />
|
733 |
</output>
|
734 |
</layer>
|
735 |
-
<layer id="51" name="
|
736 |
<data element_type="i64" shape="1" offset="133923868" size="8" />
|
737 |
<rt_info>
|
738 |
<attribute name="precise" version="0" />
|
@@ -743,7 +743,7 @@
|
|
743 |
</port>
|
744 |
</output>
|
745 |
</layer>
|
746 |
-
<layer id="52" name="
|
747 |
<data special_zero="false" />
|
748 |
<input>
|
749 |
<port id="0" precision="I64" />
|
@@ -776,7 +776,7 @@
|
|
776 |
<port id="2" precision="I64" names="62,64" />
|
777 |
</output>
|
778 |
</layer>
|
779 |
-
<layer id="55" name="
|
780 |
<data element_type="i32" shape="" offset="132776976" size="4" />
|
781 |
<rt_info>
|
782 |
<attribute name="precise" version="0" />
|
@@ -785,7 +785,7 @@
|
|
785 |
<port id="0" precision="I32" />
|
786 |
</output>
|
787 |
</layer>
|
788 |
-
<layer id="56" name="
|
789 |
<input>
|
790 |
<port id="0" precision="I64" />
|
791 |
<port id="1" precision="I32" />
|
@@ -827,7 +827,7 @@
|
|
827 |
</port>
|
828 |
</output>
|
829 |
</layer>
|
830 |
-
<layer id="59" name="
|
831 |
<data output_type="i32" />
|
832 |
<input>
|
833 |
<port id="0" precision="FP32">
|
@@ -841,19 +841,19 @@
|
|
841 |
</port>
|
842 |
</output>
|
843 |
</layer>
|
844 |
-
<layer id="60" name="
|
845 |
<data element_type="i64" shape="" offset="133923868" size="8" />
|
846 |
<output>
|
847 |
<port id="0" precision="I64" />
|
848 |
</output>
|
849 |
</layer>
|
850 |
-
<layer id="61" name="
|
851 |
<data element_type="i64" shape="" offset="133923860" size="8" />
|
852 |
<output>
|
853 |
<port id="0" precision="I64" />
|
854 |
</output>
|
855 |
</layer>
|
856 |
-
<layer id="62" name="
|
857 |
<data batch_dims="0" />
|
858 |
<input>
|
859 |
<port id="0" precision="I32">
|
@@ -905,7 +905,7 @@
|
|
905 |
<port id="0" precision="I32" />
|
906 |
</output>
|
907 |
</layer>
|
908 |
-
<layer id="67" name="
|
909 |
<data destination_type="i32" />
|
910 |
<input>
|
911 |
<port id="0" precision="I64" />
|
@@ -1059,7 +1059,7 @@
|
|
1059 |
</port>
|
1060 |
</output>
|
1061 |
</layer>
|
1062 |
-
<layer id="80" name="
|
1063 |
<data element_type="i64" shape="2" offset="140485218" size="16" />
|
1064 |
<rt_info>
|
1065 |
<attribute name="precise" version="0" />
|
@@ -1179,7 +1179,7 @@
|
|
1179 |
</port>
|
1180 |
</output>
|
1181 |
</layer>
|
1182 |
-
<layer id="88" name="
|
1183 |
<data element_type="i64" shape="1" offset="133923860" size="8" />
|
1184 |
<rt_info>
|
1185 |
<attribute name="precise" version="0" />
|
@@ -1190,7 +1190,7 @@
|
|
1190 |
</port>
|
1191 |
</output>
|
1192 |
</layer>
|
1193 |
-
<layer id="89" name="
|
1194 |
<data element_type="i64" shape="" offset="133923860" size="8" />
|
1195 |
<rt_info>
|
1196 |
<attribute name="precise" version="0" />
|
@@ -1199,7 +1199,7 @@
|
|
1199 |
<port id="0" precision="I64" />
|
1200 |
</output>
|
1201 |
</layer>
|
1202 |
-
<layer id="90" name="
|
1203 |
<data batch_dims="0" />
|
1204 |
<input>
|
1205 |
<port id="0" precision="I64">
|
@@ -1216,7 +1216,7 @@
|
|
1216 |
</port>
|
1217 |
</output>
|
1218 |
</layer>
|
1219 |
-
<layer id="91" name="
|
1220 |
<data element_type="i64" shape="1" offset="133923868" size="8" />
|
1221 |
<rt_info>
|
1222 |
<attribute name="precise" version="0" />
|
@@ -1227,7 +1227,7 @@
|
|
1227 |
</port>
|
1228 |
</output>
|
1229 |
</layer>
|
1230 |
-
<layer id="92" name="
|
1231 |
<data element_type="i64" shape="1" offset="133923868" size="8" />
|
1232 |
<rt_info>
|
1233 |
<attribute name="precise" version="0" />
|
@@ -1238,7 +1238,7 @@
|
|
1238 |
</port>
|
1239 |
</output>
|
1240 |
</layer>
|
1241 |
-
<layer id="93" name="
|
1242 |
<data element_type="i64" shape="1" offset="133923868" size="8" />
|
1243 |
<rt_info>
|
1244 |
<attribute name="precise" version="0" />
|
@@ -1293,7 +1293,7 @@
|
|
1293 |
</port>
|
1294 |
</output>
|
1295 |
</layer>
|
1296 |
-
<layer id="96" name="
|
1297 |
<data element_type="i64" shape="1" offset="133923860" size="8" />
|
1298 |
<output>
|
1299 |
<port id="0" precision="I64">
|
@@ -1301,7 +1301,7 @@
|
|
1301 |
</port>
|
1302 |
</output>
|
1303 |
</layer>
|
1304 |
-
<layer id="97" name="
|
1305 |
<data output_type="i64" />
|
1306 |
<input>
|
1307 |
<port id="0" precision="FP32">
|
@@ -1316,7 +1316,7 @@
|
|
1316 |
</port>
|
1317 |
</output>
|
1318 |
</layer>
|
1319 |
-
<layer id="98" name="
|
1320 |
<data element_type="i64" shape="1" offset="133923868" size="8" />
|
1321 |
<output>
|
1322 |
<port id="0" precision="I64">
|
@@ -1324,13 +1324,13 @@
|
|
1324 |
</port>
|
1325 |
</output>
|
1326 |
</layer>
|
1327 |
-
<layer id="99" name="
|
1328 |
<data element_type="i64" shape="" offset="133923860" size="8" />
|
1329 |
<output>
|
1330 |
<port id="0" precision="I64" />
|
1331 |
</output>
|
1332 |
</layer>
|
1333 |
-
<layer id="100" name="
|
1334 |
<data batch_dims="0" />
|
1335 |
<input>
|
1336 |
<port id="0" precision="I64">
|
@@ -1347,7 +1347,7 @@
|
|
1347 |
</port>
|
1348 |
</output>
|
1349 |
</layer>
|
1350 |
-
<layer id="101" name="
|
1351 |
<data element_type="i64" shape="1" offset="133923868" size="8" />
|
1352 |
<output>
|
1353 |
<port id="0" precision="I64">
|
@@ -1485,7 +1485,7 @@
|
|
1485 |
</port>
|
1486 |
</output>
|
1487 |
</layer>
|
1488 |
-
<layer id="109" name="
|
1489 |
<data element_type="f16" shape="1, 1, 1280" offset="143762042" size="2560" />
|
1490 |
<output>
|
1491 |
<port id="0" precision="FP16">
|
@@ -1495,7 +1495,7 @@
|
|
1495 |
</port>
|
1496 |
</output>
|
1497 |
</layer>
|
1498 |
-
<layer id="110" name="
|
1499 |
<data destination_type="f32" />
|
1500 |
<rt_info>
|
1501 |
<attribute name="decompression" version="0" />
|
@@ -1537,7 +1537,7 @@
|
|
1537 |
</port>
|
1538 |
</output>
|
1539 |
</layer>
|
1540 |
-
<layer id="112" name="
|
1541 |
<data element_type="i64" shape="4" offset="137208364" size="32" />
|
1542 |
<rt_info>
|
1543 |
<attribute name="precise" version="0" />
|
@@ -1652,7 +1652,7 @@
|
|
1652 |
</port>
|
1653 |
</output>
|
1654 |
</layer>
|
1655 |
-
<layer id="119" name="
|
1656 |
<data element_type="i64" shape="3" offset="143764602" size="24" />
|
1657 |
<rt_info>
|
1658 |
<attribute name="precise" version="0" />
|
@@ -1732,7 +1732,7 @@
|
|
1732 |
</port>
|
1733 |
</output>
|
1734 |
</layer>
|
1735 |
-
<layer id="124" name="
|
1736 |
<data element_type="f16" shape="1, 1, 1280" offset="147041426" size="2560" />
|
1737 |
<output>
|
1738 |
<port id="0" precision="FP16">
|
@@ -1742,7 +1742,7 @@
|
|
1742 |
</port>
|
1743 |
</output>
|
1744 |
</layer>
|
1745 |
-
<layer id="125" name="
|
1746 |
<data destination_type="f32" />
|
1747 |
<rt_info>
|
1748 |
<attribute name="decompression" version="0" />
|
@@ -1834,7 +1834,7 @@
|
|
1834 |
</port>
|
1835 |
</output>
|
1836 |
</layer>
|
1837 |
-
<layer id="130" name="
|
1838 |
<data element_type="f16" shape="1, 1, 1280" offset="147043986" size="2560" />
|
1839 |
<output>
|
1840 |
<port id="0" precision="FP16">
|
@@ -1844,7 +1844,7 @@
|
|
1844 |
</port>
|
1845 |
</output>
|
1846 |
</layer>
|
1847 |
-
<layer id="131" name="
|
1848 |
<data destination_type="f32" />
|
1849 |
<rt_info>
|
1850 |
<attribute name="decompression" version="0" />
|
@@ -1886,7 +1886,7 @@
|
|
1886 |
</port>
|
1887 |
</output>
|
1888 |
</layer>
|
1889 |
-
<layer id="133" name="
|
1890 |
<data element_type="f16" shape="1, 1, 1280" offset="147046546" size="2560" />
|
1891 |
<output>
|
1892 |
<port id="0" precision="FP16">
|
@@ -1896,7 +1896,7 @@
|
|
1896 |
</port>
|
1897 |
</output>
|
1898 |
</layer>
|
1899 |
-
<layer id="134" name="
|
1900 |
<data destination_type="f32" />
|
1901 |
<rt_info>
|
1902 |
<attribute name="decompression" version="0" />
|
@@ -1938,7 +1938,7 @@
|
|
1938 |
</port>
|
1939 |
</output>
|
1940 |
</layer>
|
1941 |
-
<layer id="136" name="
|
1942 |
<data element_type="f16" shape="1280, 1280" offset="147049106" size="3276800" />
|
1943 |
<output>
|
1944 |
<port id="0" precision="FP16">
|
@@ -1947,7 +1947,7 @@
|
|
1947 |
</port>
|
1948 |
</output>
|
1949 |
</layer>
|
1950 |
-
<layer id="137" name="
|
1951 |
<data destination_type="f32" />
|
1952 |
<rt_info>
|
1953 |
<attribute name="decompression" version="0" />
|
@@ -1965,7 +1965,7 @@
|
|
1965 |
</port>
|
1966 |
</output>
|
1967 |
</layer>
|
1968 |
-
<layer id="138" name="
|
1969 |
<data transpose_a="false" transpose_b="true" />
|
1970 |
<input>
|
1971 |
<port id="0" precision="FP32">
|
@@ -1986,7 +1986,7 @@
|
|
1986 |
</port>
|
1987 |
</output>
|
1988 |
</layer>
|
1989 |
-
<layer id="139" name="
|
1990 |
<data element_type="f16" shape="1, 1, 1280" offset="150325906" size="2560" />
|
1991 |
<output>
|
1992 |
<port id="0" precision="FP16">
|
@@ -1996,7 +1996,7 @@
|
|
1996 |
</port>
|
1997 |
</output>
|
1998 |
</layer>
|
1999 |
-
<layer id="140" name="
|
2000 |
<data destination_type="f32" />
|
2001 |
<rt_info>
|
2002 |
<attribute name="decompression" version="0" />
|
@@ -2038,7 +2038,7 @@
|
|
2038 |
</port>
|
2039 |
</output>
|
2040 |
</layer>
|
2041 |
-
<layer id="142" name="
|
2042 |
<data element_type="i64" shape="4" offset="137208364" size="32" />
|
2043 |
<rt_info>
|
2044 |
<attribute name="precise" version="0" />
|
@@ -2147,7 +2147,7 @@
|
|
2147 |
</port>
|
2148 |
</output>
|
2149 |
</layer>
|
2150 |
-
<layer id="149" name="
|
2151 |
<data element_type="i64" shape="1" offset="153605266" size="8" />
|
2152 |
<rt_info>
|
2153 |
<attribute name="precise" version="0" />
|
@@ -2158,7 +2158,7 @@
|
|
2158 |
</port>
|
2159 |
</output>
|
2160 |
</layer>
|
2161 |
-
<layer id="150" name="
|
2162 |
<data element_type="i64" shape="1" offset="153605274" size="8" />
|
2163 |
<rt_info>
|
2164 |
<attribute name="precise" version="0" />
|
@@ -2169,7 +2169,7 @@
|
|
2169 |
</port>
|
2170 |
</output>
|
2171 |
</layer>
|
2172 |
-
<layer id="151" name="
|
2173 |
<data element_type="i64" shape="1" offset="153605282" size="8" />
|
2174 |
<rt_info>
|
2175 |
<attribute name="precise" version="0" />
|
@@ -2180,7 +2180,7 @@
|
|
2180 |
</port>
|
2181 |
</output>
|
2182 |
</layer>
|
2183 |
-
<layer id="152" name="__module.model.model.decoder.layers.0.
|
2184 |
<data axis="0" />
|
2185 |
<input>
|
2186 |
<port id="0" precision="I64">
|
@@ -2344,7 +2344,7 @@
|
|
2344 |
</port>
|
2345 |
</output>
|
2346 |
</layer>
|
2347 |
-
<layer id="161" name="
|
2348 |
<data element_type="f16" shape="1, 1, 1280" offset="156882090" size="2560" />
|
2349 |
<output>
|
2350 |
<port id="0" precision="FP16">
|
@@ -2354,7 +2354,7 @@
|
|
2354 |
</port>
|
2355 |
</output>
|
2356 |
</layer>
|
2357 |
-
<layer id="162" name="
|
2358 |
<data destination_type="f32" />
|
2359 |
<rt_info>
|
2360 |
<attribute name="decompression" version="0" />
|
@@ -2500,7 +2500,7 @@
|
|
2500 |
</port>
|
2501 |
</output>
|
2502 |
</layer>
|
2503 |
-
<layer id="170" name="
|
2504 |
<data element_type="i64" shape="3" offset="156884650" size="24" />
|
2505 |
<rt_info>
|
2506 |
<attribute name="precise" version="0" />
|
@@ -2580,7 +2580,7 @@
|
|
2580 |
</port>
|
2581 |
</output>
|
2582 |
</layer>
|
2583 |
-
<layer id="175" name="
|
2584 |
<data element_type="f16" shape="1, 1, 1280" offset="160161474" size="2560" />
|
2585 |
<output>
|
2586 |
<port id="0" precision="FP16">
|
@@ -2590,7 +2590,7 @@
|
|
2590 |
</port>
|
2591 |
</output>
|
2592 |
</layer>
|
2593 |
-
<layer id="176" name="
|
2594 |
<data destination_type="f32" />
|
2595 |
<rt_info>
|
2596 |
<attribute name="decompression" version="0" />
|
@@ -2682,7 +2682,7 @@
|
|
2682 |
</port>
|
2683 |
</output>
|
2684 |
</layer>
|
2685 |
-
<layer id="181" name="
|
2686 |
<data element_type="f16" shape="1, 1, 1280" offset="160164034" size="2560" />
|
2687 |
<output>
|
2688 |
<port id="0" precision="FP16">
|
@@ -2692,7 +2692,7 @@
|
|
2692 |
</port>
|
2693 |
</output>
|
2694 |
</layer>
|
2695 |
-
<layer id="182" name="
|
2696 |
<data destination_type="f32" />
|
2697 |
<rt_info>
|
2698 |
<attribute name="decompression" version="0" />
|
@@ -2734,7 +2734,7 @@
|
|
2734 |
</port>
|
2735 |
</output>
|
2736 |
</layer>
|
2737 |
-
<layer id="184" name="
|
2738 |
<data element_type="f16" shape="1, 1, 1280" offset="160166594" size="2560" />
|
2739 |
<output>
|
2740 |
<port id="0" precision="FP16">
|
@@ -2744,7 +2744,7 @@
|
|
2744 |
</port>
|
2745 |
</output>
|
2746 |
</layer>
|
2747 |
-
<layer id="185" name="
|
2748 |
<data destination_type="f32" />
|
2749 |
<rt_info>
|
2750 |
<attribute name="decompression" version="0" />
|
@@ -2834,7 +2834,7 @@
|
|
2834 |
</port>
|
2835 |
</output>
|
2836 |
</layer>
|
2837 |
-
<layer id="190" name="
|
2838 |
<data element_type="f16" shape="1, 1, 5120" offset="173276354" size="10240" />
|
2839 |
<output>
|
2840 |
<port id="0" precision="FP16">
|
@@ -2844,7 +2844,7 @@
|
|
2844 |
</port>
|
2845 |
</output>
|
2846 |
</layer>
|
2847 |
-
<layer id="191" name="
|
2848 |
<data destination_type="f32" />
|
2849 |
<rt_info>
|
2850 |
<attribute name="decompression" version="0" />
|
@@ -2951,7 +2951,7 @@
|
|
2951 |
</port>
|
2952 |
</output>
|
2953 |
</layer>
|
2954 |
-
<layer id="197" name="
|
2955 |
<data element_type="f16" shape="1, 1, 1280" offset="186393794" size="2560" />
|
2956 |
<output>
|
2957 |
<port id="0" precision="FP16">
|
@@ -2961,7 +2961,7 @@
|
|
2961 |
</port>
|
2962 |
</output>
|
2963 |
</layer>
|
2964 |
-
<layer id="198" name="
|
2965 |
<data destination_type="f32" />
|
2966 |
<rt_info>
|
2967 |
<attribute name="decompression" version="0" />
|
@@ -3053,7 +3053,7 @@
|
|
3053 |
</port>
|
3054 |
</output>
|
3055 |
</layer>
|
3056 |
-
<layer id="203" name="
|
3057 |
<data element_type="f16" shape="1, 1, 1280" offset="186396354" size="2560" />
|
3058 |
<output>
|
3059 |
<port id="0" precision="FP16">
|
@@ -3063,7 +3063,7 @@
|
|
3063 |
</port>
|
3064 |
</output>
|
3065 |
</layer>
|
3066 |
-
<layer id="204" name="
|
3067 |
<data destination_type="f32" />
|
3068 |
<rt_info>
|
3069 |
<attribute name="decompression" version="0" />
|
@@ -3105,7 +3105,7 @@
|
|
3105 |
</port>
|
3106 |
</output>
|
3107 |
</layer>
|
3108 |
-
<layer id="206" name="
|
3109 |
<data element_type="f16" shape="1, 1, 1280" offset="186398914" size="2560" />
|
3110 |
<output>
|
3111 |
<port id="0" precision="FP16">
|
@@ -3115,7 +3115,7 @@
|
|
3115 |
</port>
|
3116 |
</output>
|
3117 |
</layer>
|
3118 |
-
<layer id="207" name="
|
3119 |
<data destination_type="f32" />
|
3120 |
<rt_info>
|
3121 |
<attribute name="decompression" version="0" />
|
@@ -3157,7 +3157,7 @@
|
|
3157 |
</port>
|
3158 |
</output>
|
3159 |
</layer>
|
3160 |
-
<layer id="209" name="
|
3161 |
<data element_type="f16" shape="1280, 1280" offset="186401474" size="3276800" />
|
3162 |
<output>
|
3163 |
<port id="0" precision="FP16">
|
@@ -3166,7 +3166,7 @@
|
|
3166 |
</port>
|
3167 |
</output>
|
3168 |
</layer>
|
3169 |
-
<layer id="210" name="
|
3170 |
<data destination_type="f32" />
|
3171 |
<rt_info>
|
3172 |
<attribute name="decompression" version="0" />
|
@@ -3184,7 +3184,7 @@
|
|
3184 |
</port>
|
3185 |
</output>
|
3186 |
</layer>
|
3187 |
-
<layer id="211" name="
|
3188 |
<data transpose_a="false" transpose_b="true" />
|
3189 |
<input>
|
3190 |
<port id="0" precision="FP32">
|
@@ -3205,7 +3205,7 @@
|
|
3205 |
</port>
|
3206 |
</output>
|
3207 |
</layer>
|
3208 |
-
<layer id="212" name="
|
3209 |
<data element_type="f16" shape="1, 1, 1280" offset="189678274" size="2560" />
|
3210 |
<output>
|
3211 |
<port id="0" precision="FP16">
|
@@ -3215,7 +3215,7 @@
|
|
3215 |
</port>
|
3216 |
</output>
|
3217 |
</layer>
|
3218 |
-
<layer id="213" name="
|
3219 |
<data destination_type="f32" />
|
3220 |
<rt_info>
|
3221 |
<attribute name="decompression" version="0" />
|
@@ -3257,7 +3257,7 @@
|
|
3257 |
</port>
|
3258 |
</output>
|
3259 |
</layer>
|
3260 |
-
<layer id="215" name="
|
3261 |
<data element_type="i64" shape="4" offset="137208364" size="32" />
|
3262 |
<rt_info>
|
3263 |
<attribute name="precise" version="0" />
|
@@ -3366,7 +3366,7 @@
|
|
3366 |
</port>
|
3367 |
</output>
|
3368 |
</layer>
|
3369 |
-
<layer id="222" name="
|
3370 |
<data element_type="i64" shape="4" offset="137208364" size="32" />
|
3371 |
<rt_info>
|
3372 |
<attribute name="precise" version="0" />
|
@@ -3544,7 +3544,7 @@
|
|
3544 |
</port>
|
3545 |
</output>
|
3546 |
</layer>
|
3547 |
-
<layer id="232" name="
|
3548 |
<data element_type="f16" shape="1, 1, 1280" offset="196234434" size="2560" />
|
3549 |
<output>
|
3550 |
<port id="0" precision="FP16">
|
@@ -3554,7 +3554,7 @@
|
|
3554 |
</port>
|
3555 |
</output>
|
3556 |
</layer>
|
3557 |
-
<layer id="233" name="
|
3558 |
<data destination_type="f32" />
|
3559 |
<rt_info>
|
3560 |
<attribute name="decompression" version="0" />
|
@@ -3596,7 +3596,7 @@
|
|
3596 |
</port>
|
3597 |
</output>
|
3598 |
</layer>
|
3599 |
-
<layer id="235" name="
|
3600 |
<data element_type="i64" shape="4" offset="137208364" size="32" />
|
3601 |
<rt_info>
|
3602 |
<attribute name="precise" version="0" />
|
@@ -3711,7 +3711,7 @@
|
|
3711 |
</port>
|
3712 |
</output>
|
3713 |
</layer>
|
3714 |
-
<layer id="242" name="
|
3715 |
<data element_type="i64" shape="3" offset="143764602" size="24" />
|
3716 |
<rt_info>
|
3717 |
<attribute name="precise" version="0" />
|
@@ -3791,7 +3791,7 @@
|
|
3791 |
</port>
|
3792 |
</output>
|
3793 |
</layer>
|
3794 |
-
<layer id="247" name="
|
3795 |
<data element_type="f16" shape="1, 1, 1280" offset="199513794" size="2560" />
|
3796 |
<output>
|
3797 |
<port id="0" precision="FP16">
|
@@ -3801,7 +3801,7 @@
|
|
3801 |
</port>
|
3802 |
</output>
|
3803 |
</layer>
|
3804 |
-
<layer id="248" name="
|
3805 |
<data destination_type="f32" />
|
3806 |
<rt_info>
|
3807 |
<attribute name="decompression" version="0" />
|
@@ -3893,7 +3893,7 @@
|
|
3893 |
</port>
|
3894 |
</output>
|
3895 |
</layer>
|
3896 |
-
<layer id="253" name="
|
3897 |
<data element_type="f16" shape="1, 1, 1280" offset="199516354" size="2560" />
|
3898 |
<output>
|
3899 |
<port id="0" precision="FP16">
|
@@ -3903,7 +3903,7 @@
|
|
3903 |
</port>
|
3904 |
</output>
|
3905 |
</layer>
|
3906 |
-
<layer id="254" name="
|
3907 |
<data destination_type="f32" />
|
3908 |
<rt_info>
|
3909 |
<attribute name="decompression" version="0" />
|
@@ -3945,7 +3945,7 @@
|
|
3945 |
</port>
|
3946 |
</output>
|
3947 |
</layer>
|
3948 |
-
<layer id="256" name="
|
3949 |
<data element_type="f16" shape="1, 1, 1280" offset="199518914" size="2560" />
|
3950 |
<output>
|
3951 |
<port id="0" precision="FP16">
|
@@ -3955,7 +3955,7 @@
|
|
3955 |
</port>
|
3956 |
</output>
|
3957 |
</layer>
|
3958 |
-
<layer id="257" name="
|
3959 |
<data destination_type="f32" />
|
3960 |
<rt_info>
|
3961 |
<attribute name="decompression" version="0" />
|
@@ -3997,7 +3997,7 @@
|
|
3997 |
</port>
|
3998 |
</output>
|
3999 |
</layer>
|
4000 |
-
<layer id="259" name="
|
4001 |
<data element_type="f16" shape="1280, 1280" offset="199521474" size="3276800" />
|
4002 |
<output>
|
4003 |
<port id="0" precision="FP16">
|
@@ -4006,7 +4006,7 @@
|
|
4006 |
</port>
|
4007 |
</output>
|
4008 |
</layer>
|
4009 |
-
<layer id="260" name="
|
4010 |
<data destination_type="f32" />
|
4011 |
<rt_info>
|
4012 |
<attribute name="decompression" version="0" />
|
@@ -4024,7 +4024,7 @@
|
|
4024 |
</port>
|
4025 |
</output>
|
4026 |
</layer>
|
4027 |
-
<layer id="261" name="
|
4028 |
<data transpose_a="false" transpose_b="true" />
|
4029 |
<input>
|
4030 |
<port id="0" precision="FP32">
|
@@ -4045,7 +4045,7 @@
|
|
4045 |
</port>
|
4046 |
</output>
|
4047 |
</layer>
|
4048 |
-
<layer id="262" name="
|
4049 |
<data element_type="f16" shape="1, 1, 1280" offset="202798274" size="2560" />
|
4050 |
<output>
|
4051 |
<port id="0" precision="FP16">
|
@@ -4055,7 +4055,7 @@
|
|
4055 |
</port>
|
4056 |
</output>
|
4057 |
</layer>
|
4058 |
-
<layer id="263" name="
|
4059 |
<data destination_type="f32" />
|
4060 |
<rt_info>
|
4061 |
<attribute name="decompression" version="0" />
|
@@ -4097,7 +4097,7 @@
|
|
4097 |
</port>
|
4098 |
</output>
|
4099 |
</layer>
|
4100 |
-
<layer id="265" name="
|
4101 |
<data element_type="i64" shape="4" offset="137208364" size="32" />
|
4102 |
<rt_info>
|
4103 |
<attribute name="precise" version="0" />
|
@@ -4348,7 +4348,7 @@
|
|
4348 |
</port>
|
4349 |
</output>
|
4350 |
</layer>
|
4351 |
-
<layer id="280" name="
|
4352 |
<data element_type="f16" shape="1, 1, 1280" offset="209354434" size="2560" />
|
4353 |
<output>
|
4354 |
<port id="0" precision="FP16">
|
@@ -4358,7 +4358,7 @@
|
|
4358 |
</port>
|
4359 |
</output>
|
4360 |
</layer>
|
4361 |
-
<layer id="281" name="
|
4362 |
<data destination_type="f32" />
|
4363 |
<rt_info>
|
4364 |
<attribute name="decompression" version="0" />
|
@@ -4504,7 +4504,7 @@
|
|
4504 |
</port>
|
4505 |
</output>
|
4506 |
</layer>
|
4507 |
-
<layer id="289" name="
|
4508 |
<data element_type="i64" shape="3" offset="156884650" size="24" />
|
4509 |
<rt_info>
|
4510 |
<attribute name="precise" version="0" />
|
@@ -4584,7 +4584,7 @@
|
|
4584 |
</port>
|
4585 |
</output>
|
4586 |
</layer>
|
4587 |
-
<layer id="294" name="
|
4588 |
<data element_type="f16" shape="1, 1, 1280" offset="212633794" size="2560" />
|
4589 |
<output>
|
4590 |
<port id="0" precision="FP16">
|
@@ -4594,7 +4594,7 @@
|
|
4594 |
</port>
|
4595 |
</output>
|
4596 |
</layer>
|
4597 |
-
<layer id="295" name="
|
4598 |
<data destination_type="f32" />
|
4599 |
<rt_info>
|
4600 |
<attribute name="decompression" version="0" />
|
@@ -4686,7 +4686,7 @@
|
|
4686 |
</port>
|
4687 |
</output>
|
4688 |
</layer>
|
4689 |
-
<layer id="300" name="
|
4690 |
<data element_type="f16" shape="1, 1, 1280" offset="212636354" size="2560" />
|
4691 |
<output>
|
4692 |
<port id="0" precision="FP16">
|
@@ -4696,7 +4696,7 @@
|
|
4696 |
</port>
|
4697 |
</output>
|
4698 |
</layer>
|
4699 |
-
<layer id="301" name="
|
4700 |
<data destination_type="f32" />
|
4701 |
<rt_info>
|
4702 |
<attribute name="decompression" version="0" />
|
@@ -4738,7 +4738,7 @@
|
|
4738 |
</port>
|
4739 |
</output>
|
4740 |
</layer>
|
4741 |
-
<layer id="303" name="
|
4742 |
<data element_type="f16" shape="1, 1, 1280" offset="212638914" size="2560" />
|
4743 |
<output>
|
4744 |
<port id="0" precision="FP16">
|
@@ -4748,7 +4748,7 @@
|
|
4748 |
</port>
|
4749 |
</output>
|
4750 |
</layer>
|
4751 |
-
<layer id="304" name="
|
4752 |
<data destination_type="f32" />
|
4753 |
<rt_info>
|
4754 |
<attribute name="decompression" version="0" />
|
@@ -4838,7 +4838,7 @@
|
|
4838 |
</port>
|
4839 |
</output>
|
4840 |
</layer>
|
4841 |
-
<layer id="309" name="
|
4842 |
<data element_type="f16" shape="1, 1, 5120" offset="225748674" size="10240" />
|
4843 |
<output>
|
4844 |
<port id="0" precision="FP16">
|
@@ -4848,7 +4848,7 @@
|
|
4848 |
</port>
|
4849 |
</output>
|
4850 |
</layer>
|
4851 |
-
<layer id="310" name="
|
4852 |
<data destination_type="f32" />
|
4853 |
<rt_info>
|
4854 |
<attribute name="decompression" version="0" />
|
@@ -4955,7 +4955,7 @@
|
|
4955 |
</port>
|
4956 |
</output>
|
4957 |
</layer>
|
4958 |
-
<layer id="316" name="
|
4959 |
<data element_type="f16" shape="1, 1, 1280" offset="238866114" size="2560" />
|
4960 |
<output>
|
4961 |
<port id="0" precision="FP16">
|
@@ -4965,7 +4965,7 @@
|
|
4965 |
</port>
|
4966 |
</output>
|
4967 |
</layer>
|
4968 |
-
<layer id="317" name="
|
4969 |
<data destination_type="f32" />
|
4970 |
<rt_info>
|
4971 |
<attribute name="decompression" version="0" />
|
@@ -5057,7 +5057,7 @@
|
|
5057 |
</port>
|
5058 |
</output>
|
5059 |
</layer>
|
5060 |
-
<layer id="322" name="
|
5061 |
<data element_type="f16" shape="1, 1, 1280" offset="238868674" size="2560" />
|
5062 |
<output>
|
5063 |
<port id="0" precision="FP16">
|
@@ -5067,7 +5067,7 @@
|
|
5067 |
</port>
|
5068 |
</output>
|
5069 |
</layer>
|
5070 |
-
<layer id="323" name="
|
5071 |
<data destination_type="f32" />
|
5072 |
<rt_info>
|
5073 |
<attribute name="decompression" version="0" />
|
@@ -5109,7 +5109,7 @@
|
|
5109 |
</port>
|
5110 |
</output>
|
5111 |
</layer>
|
5112 |
-
<layer id="325" name="
|
5113 |
<data element_type="f16" shape="1, 1, 1280" offset="238871234" size="2560" />
|
5114 |
<output>
|
5115 |
<port id="0" precision="FP16">
|
@@ -5119,7 +5119,7 @@
|
|
5119 |
</port>
|
5120 |
</output>
|
5121 |
</layer>
|
5122 |
-
<layer id="326" name="
|
5123 |
<data destination_type="f32" />
|
5124 |
<rt_info>
|
5125 |
<attribute name="decompression" version="0" />
|
@@ -5182,7 +5182,7 @@
|
|
5182 |
</port>
|
5183 |
</output>
|
5184 |
</layer>
|
5185 |
-
<layer id="329" name="
|
5186 |
<input>
|
5187 |
<port id="0" precision="FP32">
|
5188 |
<dim>-1</dim>
|
@@ -5558,16 +5558,16 @@
|
|
5558 |
<edge from-layer="328" from-port="2" to-layer="329" to-port="0" />
|
5559 |
</edges>
|
5560 |
<rt_info>
|
5561 |
-
<Runtime_version value="2024.5.0-
|
5562 |
<conversion_parameters>
|
5563 |
<framework value="pytorch" />
|
5564 |
<is_python_object value="True" />
|
5565 |
</conversion_parameters>
|
5566 |
<optimum>
|
5567 |
-
<optimum_intel_version value="1.
|
5568 |
-
<optimum_version value="1.23.
|
5569 |
-
<pytorch_version value="2.5.
|
5570 |
-
<transformers_version value="4.
|
5571 |
</optimum>
|
5572 |
</rt_info>
|
5573 |
</net>
|
|
|
10 |
</port>
|
11 |
</output>
|
12 |
</layer>
|
13 |
+
<layer id="0" name="Parameter_26704" type="Parameter" version="opset1">
|
14 |
<data shape="?,?,?" element_type="f32" />
|
15 |
<output>
|
16 |
<port id="0" precision="FP32" names="encoder_hidden_states">
|
|
|
47 |
</port>
|
48 |
</output>
|
49 |
</layer>
|
50 |
+
<layer id="4" name="Constant_32205" type="Const" version="opset1">
|
51 |
<data element_type="i64" shape="2" offset="132776960" size="16" />
|
52 |
<rt_info>
|
53 |
<attribute name="precise" version="0" />
|
|
|
151 |
<port id="0" precision="I64" names="23" />
|
152 |
</output>
|
153 |
</layer>
|
154 |
+
<layer id="12" name="ShapeOf_32121" type="ShapeOf" version="opset3">
|
155 |
<data output_type="i64" />
|
156 |
<input>
|
157 |
<port id="0" precision="I64">
|
|
|
165 |
</port>
|
166 |
</output>
|
167 |
</layer>
|
168 |
+
<layer id="13" name="Constant_32122" type="Const" version="opset1">
|
169 |
<data element_type="i64" shape="" offset="133923868" size="8" />
|
170 |
<rt_info>
|
171 |
<attribute name="precise" version="0" />
|
|
|
174 |
<port id="0" precision="I64" />
|
175 |
</output>
|
176 |
</layer>
|
177 |
+
<layer id="14" name="Constant_32123" type="Const" version="opset1">
|
178 |
<data element_type="i64" shape="" offset="133923860" size="8" />
|
179 |
<rt_info>
|
180 |
<attribute name="precise" version="0" />
|
|
|
183 |
<port id="0" precision="I64" />
|
184 |
</output>
|
185 |
</layer>
|
186 |
+
<layer id="15" name="Gather_32124" type="Gather" version="opset8">
|
187 |
<data batch_dims="0" />
|
188 |
<input>
|
189 |
<port id="0" precision="I64">
|
|
|
244 |
</port>
|
245 |
</output>
|
246 |
</layer>
|
247 |
+
<layer id="20" name="__module.model.model.decoder.embed_positions/aten::index/Constant" type="Const" version="opset1">
|
248 |
<data element_type="i32" shape="" offset="132776976" size="4" />
|
249 |
<output>
|
250 |
<port id="0" precision="I32" />
|
|
|
321 |
</port>
|
322 |
</output>
|
323 |
</layer>
|
324 |
+
<layer id="25" name="Constant_31887_compressed" type="Const" version="opset1">
|
325 |
<data element_type="f16" shape="1, 1, 1280" offset="133923884" size="2560" />
|
326 |
<output>
|
327 |
<port id="0" precision="FP16">
|
|
|
331 |
</port>
|
332 |
</output>
|
333 |
</layer>
|
334 |
+
<layer id="26" name="Constant_31887" type="Convert" version="opset1">
|
335 |
<data destination_type="f32" />
|
336 |
<rt_info>
|
337 |
<attribute name="decompression" version="0" />
|
|
|
373 |
</port>
|
374 |
</output>
|
375 |
</layer>
|
376 |
+
<layer id="28" name="Constant_31888_compressed" type="Const" version="opset1">
|
377 |
<data element_type="f16" shape="1, 1, 1280" offset="133926444" size="2560" />
|
378 |
<output>
|
379 |
<port id="0" precision="FP16">
|
|
|
383 |
</port>
|
384 |
</output>
|
385 |
</layer>
|
386 |
+
<layer id="29" name="Constant_31888" type="Convert" version="opset1">
|
387 |
<data destination_type="f32" />
|
388 |
<rt_info>
|
389 |
<attribute name="decompression" version="0" />
|
|
|
425 |
</port>
|
426 |
</output>
|
427 |
</layer>
|
428 |
+
<layer id="31" name="Constant_31790_compressed" type="Const" version="opset1">
|
429 |
<data element_type="f16" shape="1280, 1280" offset="133929004" size="3276800" />
|
430 |
<output>
|
431 |
<port id="0" precision="FP16">
|
|
|
434 |
</port>
|
435 |
</output>
|
436 |
</layer>
|
437 |
+
<layer id="32" name="Constant_31790" type="Convert" version="opset1">
|
438 |
<data destination_type="f32" />
|
439 |
<rt_info>
|
440 |
<attribute name="decompression" version="0" />
|
|
|
452 |
</port>
|
453 |
</output>
|
454 |
</layer>
|
455 |
+
<layer id="33" name="Multiply_31773" type="MatMul" version="opset1">
|
456 |
<data transpose_a="false" transpose_b="true" />
|
457 |
<input>
|
458 |
<port id="0" precision="FP32">
|
|
|
473 |
</port>
|
474 |
</output>
|
475 |
</layer>
|
476 |
+
<layer id="34" name="Constant_31889_compressed" type="Const" version="opset1">
|
477 |
<data element_type="f16" shape="1, 1, 1280" offset="137205804" size="2560" />
|
478 |
<output>
|
479 |
<port id="0" precision="FP16">
|
|
|
483 |
</port>
|
484 |
</output>
|
485 |
</layer>
|
486 |
+
<layer id="35" name="Constant_31889" type="Convert" version="opset1">
|
487 |
<data destination_type="f32" />
|
488 |
<rt_info>
|
489 |
<attribute name="decompression" version="0" />
|
|
|
525 |
</port>
|
526 |
</output>
|
527 |
</layer>
|
528 |
+
<layer id="37" name="Constant_32206" type="Const" version="opset1">
|
529 |
<data element_type="i64" shape="4" offset="137208364" size="32" />
|
530 |
<rt_info>
|
531 |
<attribute name="precise" version="0" />
|
|
|
634 |
</port>
|
635 |
</output>
|
636 |
</layer>
|
637 |
+
<layer id="44" name="Constant_32207" type="Const" version="opset1">
|
638 |
<data element_type="i64" shape="4" offset="137208364" size="32" />
|
639 |
<rt_info>
|
640 |
<attribute name="precise" version="0" />
|
|
|
726 |
<port id="0" precision="I32" />
|
727 |
</output>
|
728 |
</layer>
|
729 |
+
<layer id="50" name="17" type="Const" version="opset1">
|
730 |
<data element_type="f32" shape="" offset="140485212" size="4" />
|
731 |
<output>
|
732 |
+
<port id="0" precision="FP32" names="17" />
|
733 |
</output>
|
734 |
</layer>
|
735 |
+
<layer id="51" name="Constant_32145" type="Const" version="opset1">
|
736 |
<data element_type="i64" shape="1" offset="133923868" size="8" />
|
737 |
<rt_info>
|
738 |
<attribute name="precise" version="0" />
|
|
|
743 |
</port>
|
744 |
</output>
|
745 |
</layer>
|
746 |
+
<layer id="52" name="Reshape_32146" type="Reshape" version="opset1">
|
747 |
<data special_zero="false" />
|
748 |
<input>
|
749 |
<port id="0" precision="I64" />
|
|
|
776 |
<port id="2" precision="I64" names="62,64" />
|
777 |
</output>
|
778 |
</layer>
|
779 |
+
<layer id="55" name="Constant_24581" type="Const" version="opset1">
|
780 |
<data element_type="i32" shape="" offset="132776976" size="4" />
|
781 |
<rt_info>
|
782 |
<attribute name="precise" version="0" />
|
|
|
785 |
<port id="0" precision="I32" />
|
786 |
</output>
|
787 |
</layer>
|
788 |
+
<layer id="56" name="Unsqueeze_24582" type="Unsqueeze" version="opset1">
|
789 |
<input>
|
790 |
<port id="0" precision="I64" />
|
791 |
<port id="1" precision="I32" />
|
|
|
827 |
</port>
|
828 |
</output>
|
829 |
</layer>
|
830 |
+
<layer id="59" name="ShapeOf_32152" type="ShapeOf" version="opset3">
|
831 |
<data output_type="i32" />
|
832 |
<input>
|
833 |
<port id="0" precision="FP32">
|
|
|
841 |
</port>
|
842 |
</output>
|
843 |
</layer>
|
844 |
+
<layer id="60" name="Constant_32153" type="Const" version="opset1">
|
845 |
<data element_type="i64" shape="" offset="133923868" size="8" />
|
846 |
<output>
|
847 |
<port id="0" precision="I64" />
|
848 |
</output>
|
849 |
</layer>
|
850 |
+
<layer id="61" name="Constant_32154" type="Const" version="opset1">
|
851 |
<data element_type="i64" shape="" offset="133923860" size="8" />
|
852 |
<output>
|
853 |
<port id="0" precision="I64" />
|
854 |
</output>
|
855 |
</layer>
|
856 |
+
<layer id="62" name="Gather_32155" type="Gather" version="opset8">
|
857 |
<data batch_dims="0" />
|
858 |
<input>
|
859 |
<port id="0" precision="I32">
|
|
|
905 |
<port id="0" precision="I32" />
|
906 |
</output>
|
907 |
</layer>
|
908 |
+
<layer id="67" name="Convert_32158" type="Convert" version="opset1">
|
909 |
<data destination_type="i32" />
|
910 |
<input>
|
911 |
<port id="0" precision="I64" />
|
|
|
1059 |
</port>
|
1060 |
</output>
|
1061 |
</layer>
|
1062 |
+
<layer id="80" name="Constant_24684" type="Const" version="opset1">
|
1063 |
<data element_type="i64" shape="2" offset="140485218" size="16" />
|
1064 |
<rt_info>
|
1065 |
<attribute name="precise" version="0" />
|
|
|
1179 |
</port>
|
1180 |
</output>
|
1181 |
</layer>
|
1182 |
+
<layer id="88" name="Constant_32136" type="Const" version="opset1">
|
1183 |
<data element_type="i64" shape="1" offset="133923860" size="8" />
|
1184 |
<rt_info>
|
1185 |
<attribute name="precise" version="0" />
|
|
|
1190 |
</port>
|
1191 |
</output>
|
1192 |
</layer>
|
1193 |
+
<layer id="89" name="Constant_32137" type="Const" version="opset1">
|
1194 |
<data element_type="i64" shape="" offset="133923860" size="8" />
|
1195 |
<rt_info>
|
1196 |
<attribute name="precise" version="0" />
|
|
|
1199 |
<port id="0" precision="I64" />
|
1200 |
</output>
|
1201 |
</layer>
|
1202 |
+
<layer id="90" name="Gather_32138" type="Gather" version="opset8">
|
1203 |
<data batch_dims="0" />
|
1204 |
<input>
|
1205 |
<port id="0" precision="I64">
|
|
|
1216 |
</port>
|
1217 |
</output>
|
1218 |
</layer>
|
1219 |
+
<layer id="91" name="Constant_31122" type="Const" version="opset1">
|
1220 |
<data element_type="i64" shape="1" offset="133923868" size="8" />
|
1221 |
<rt_info>
|
1222 |
<attribute name="precise" version="0" />
|
|
|
1227 |
</port>
|
1228 |
</output>
|
1229 |
</layer>
|
1230 |
+
<layer id="92" name="Constant_31124" type="Const" version="opset1">
|
1231 |
<data element_type="i64" shape="1" offset="133923868" size="8" />
|
1232 |
<rt_info>
|
1233 |
<attribute name="precise" version="0" />
|
|
|
1238 |
</port>
|
1239 |
</output>
|
1240 |
</layer>
|
1241 |
+
<layer id="93" name="Constant_31126" type="Const" version="opset1">
|
1242 |
<data element_type="i64" shape="1" offset="133923868" size="8" />
|
1243 |
<rt_info>
|
1244 |
<attribute name="precise" version="0" />
|
|
|
1293 |
</port>
|
1294 |
</output>
|
1295 |
</layer>
|
1296 |
+
<layer id="96" name="Constant_25118" type="Const" version="opset1">
|
1297 |
<data element_type="i64" shape="1" offset="133923860" size="8" />
|
1298 |
<output>
|
1299 |
<port id="0" precision="I64">
|
|
|
1301 |
</port>
|
1302 |
</output>
|
1303 |
</layer>
|
1304 |
+
<layer id="97" name="ShapeOf_32167" type="ShapeOf" version="opset3">
|
1305 |
<data output_type="i64" />
|
1306 |
<input>
|
1307 |
<port id="0" precision="FP32">
|
|
|
1316 |
</port>
|
1317 |
</output>
|
1318 |
</layer>
|
1319 |
+
<layer id="98" name="Constant_32168" type="Const" version="opset1">
|
1320 |
<data element_type="i64" shape="1" offset="133923868" size="8" />
|
1321 |
<output>
|
1322 |
<port id="0" precision="I64">
|
|
|
1324 |
</port>
|
1325 |
</output>
|
1326 |
</layer>
|
1327 |
+
<layer id="99" name="Constant_32169" type="Const" version="opset1">
|
1328 |
<data element_type="i64" shape="" offset="133923860" size="8" />
|
1329 |
<output>
|
1330 |
<port id="0" precision="I64" />
|
1331 |
</output>
|
1332 |
</layer>
|
1333 |
+
<layer id="100" name="Gather_32170" type="Gather" version="opset8">
|
1334 |
<data batch_dims="0" />
|
1335 |
<input>
|
1336 |
<port id="0" precision="I64">
|
|
|
1347 |
</port>
|
1348 |
</output>
|
1349 |
</layer>
|
1350 |
+
<layer id="101" name="Constant_25121" type="Const" version="opset1">
|
1351 |
<data element_type="i64" shape="1" offset="133923868" size="8" />
|
1352 |
<output>
|
1353 |
<port id="0" precision="I64">
|
|
|
1485 |
</port>
|
1486 |
</output>
|
1487 |
</layer>
|
1488 |
+
<layer id="109" name="Constant_31890_compressed" type="Const" version="opset1">
|
1489 |
<data element_type="f16" shape="1, 1, 1280" offset="143762042" size="2560" />
|
1490 |
<output>
|
1491 |
<port id="0" precision="FP16">
|
|
|
1495 |
</port>
|
1496 |
</output>
|
1497 |
</layer>
|
1498 |
+
<layer id="110" name="Constant_31890" type="Convert" version="opset1">
|
1499 |
<data destination_type="f32" />
|
1500 |
<rt_info>
|
1501 |
<attribute name="decompression" version="0" />
|
|
|
1537 |
</port>
|
1538 |
</output>
|
1539 |
</layer>
|
1540 |
+
<layer id="112" name="Constant_32208" type="Const" version="opset1">
|
1541 |
<data element_type="i64" shape="4" offset="137208364" size="32" />
|
1542 |
<rt_info>
|
1543 |
<attribute name="precise" version="0" />
|
|
|
1652 |
</port>
|
1653 |
</output>
|
1654 |
</layer>
|
1655 |
+
<layer id="119" name="Constant_32209" type="Const" version="opset1">
|
1656 |
<data element_type="i64" shape="3" offset="143764602" size="24" />
|
1657 |
<rt_info>
|
1658 |
<attribute name="precise" version="0" />
|
|
|
1732 |
</port>
|
1733 |
</output>
|
1734 |
</layer>
|
1735 |
+
<layer id="124" name="Constant_31891_compressed" type="Const" version="opset1">
|
1736 |
<data element_type="f16" shape="1, 1, 1280" offset="147041426" size="2560" />
|
1737 |
<output>
|
1738 |
<port id="0" precision="FP16">
|
|
|
1742 |
</port>
|
1743 |
</output>
|
1744 |
</layer>
|
1745 |
+
<layer id="125" name="Constant_31891" type="Convert" version="opset1">
|
1746 |
<data destination_type="f32" />
|
1747 |
<rt_info>
|
1748 |
<attribute name="decompression" version="0" />
|
|
|
1834 |
</port>
|
1835 |
</output>
|
1836 |
</layer>
|
1837 |
+
<layer id="130" name="Constant_31892_compressed" type="Const" version="opset1">
|
1838 |
<data element_type="f16" shape="1, 1, 1280" offset="147043986" size="2560" />
|
1839 |
<output>
|
1840 |
<port id="0" precision="FP16">
|
|
|
1844 |
</port>
|
1845 |
</output>
|
1846 |
</layer>
|
1847 |
+
<layer id="131" name="Constant_31892" type="Convert" version="opset1">
|
1848 |
<data destination_type="f32" />
|
1849 |
<rt_info>
|
1850 |
<attribute name="decompression" version="0" />
|
|
|
1886 |
</port>
|
1887 |
</output>
|
1888 |
</layer>
|
1889 |
+
<layer id="133" name="Constant_31893_compressed" type="Const" version="opset1">
|
1890 |
<data element_type="f16" shape="1, 1, 1280" offset="147046546" size="2560" />
|
1891 |
<output>
|
1892 |
<port id="0" precision="FP16">
|
|
|
1896 |
</port>
|
1897 |
</output>
|
1898 |
</layer>
|
1899 |
+
<layer id="134" name="Constant_31893" type="Convert" version="opset1">
|
1900 |
<data destination_type="f32" />
|
1901 |
<rt_info>
|
1902 |
<attribute name="decompression" version="0" />
|
|
|
1938 |
</port>
|
1939 |
</output>
|
1940 |
</layer>
|
1941 |
+
<layer id="136" name="Constant_31793_compressed" type="Const" version="opset1">
|
1942 |
<data element_type="f16" shape="1280, 1280" offset="147049106" size="3276800" />
|
1943 |
<output>
|
1944 |
<port id="0" precision="FP16">
|
|
|
1947 |
</port>
|
1948 |
</output>
|
1949 |
</layer>
|
1950 |
+
<layer id="137" name="Constant_31793" type="Convert" version="opset1">
|
1951 |
<data destination_type="f32" />
|
1952 |
<rt_info>
|
1953 |
<attribute name="decompression" version="0" />
|
|
|
1965 |
</port>
|
1966 |
</output>
|
1967 |
</layer>
|
1968 |
+
<layer id="138" name="Multiply_31777" type="MatMul" version="opset1">
|
1969 |
<data transpose_a="false" transpose_b="true" />
|
1970 |
<input>
|
1971 |
<port id="0" precision="FP32">
|
|
|
1986 |
</port>
|
1987 |
</output>
|
1988 |
</layer>
|
1989 |
+
<layer id="139" name="Constant_31894_compressed" type="Const" version="opset1">
|
1990 |
<data element_type="f16" shape="1, 1, 1280" offset="150325906" size="2560" />
|
1991 |
<output>
|
1992 |
<port id="0" precision="FP16">
|
|
|
1996 |
</port>
|
1997 |
</output>
|
1998 |
</layer>
|
1999 |
+
<layer id="140" name="Constant_31894" type="Convert" version="opset1">
|
2000 |
<data destination_type="f32" />
|
2001 |
<rt_info>
|
2002 |
<attribute name="decompression" version="0" />
|
|
|
2038 |
</port>
|
2039 |
</output>
|
2040 |
</layer>
|
2041 |
+
<layer id="142" name="Constant_32210" type="Const" version="opset1">
|
2042 |
<data element_type="i64" shape="4" offset="137208364" size="32" />
|
2043 |
<rt_info>
|
2044 |
<attribute name="precise" version="0" />
|
|
|
2147 |
</port>
|
2148 |
</output>
|
2149 |
</layer>
|
2150 |
+
<layer id="149" name="Constant_24866" type="Const" version="opset1">
|
2151 |
<data element_type="i64" shape="1" offset="153605266" size="8" />
|
2152 |
<rt_info>
|
2153 |
<attribute name="precise" version="0" />
|
|
|
2158 |
</port>
|
2159 |
</output>
|
2160 |
</layer>
|
2161 |
+
<layer id="150" name="Constant_24867" type="Const" version="opset1">
|
2162 |
<data element_type="i64" shape="1" offset="153605274" size="8" />
|
2163 |
<rt_info>
|
2164 |
<attribute name="precise" version="0" />
|
|
|
2169 |
</port>
|
2170 |
</output>
|
2171 |
</layer>
|
2172 |
+
<layer id="151" name="Constant_24868" type="Const" version="opset1">
|
2173 |
<data element_type="i64" shape="1" offset="153605282" size="8" />
|
2174 |
<rt_info>
|
2175 |
<attribute name="precise" version="0" />
|
|
|
2180 |
</port>
|
2181 |
</output>
|
2182 |
</layer>
|
2183 |
+
<layer id="152" name="__module.model.model.decoder.layers.0.self_attn/prim::ListConstruct_1" type="Concat" version="opset1">
|
2184 |
<data axis="0" />
|
2185 |
<input>
|
2186 |
<port id="0" precision="I64">
|
|
|
2344 |
</port>
|
2345 |
</output>
|
2346 |
</layer>
|
2347 |
+
<layer id="161" name="Constant_31895_compressed" type="Const" version="opset1">
|
2348 |
<data element_type="f16" shape="1, 1, 1280" offset="156882090" size="2560" />
|
2349 |
<output>
|
2350 |
<port id="0" precision="FP16">
|
|
|
2354 |
</port>
|
2355 |
</output>
|
2356 |
</layer>
|
2357 |
+
<layer id="162" name="Constant_31895" type="Convert" version="opset1">
|
2358 |
<data destination_type="f32" />
|
2359 |
<rt_info>
|
2360 |
<attribute name="decompression" version="0" />
|
|
|
2500 |
</port>
|
2501 |
</output>
|
2502 |
</layer>
|
2503 |
+
<layer id="170" name="Constant_32211" type="Const" version="opset1">
|
2504 |
<data element_type="i64" shape="3" offset="156884650" size="24" />
|
2505 |
<rt_info>
|
2506 |
<attribute name="precise" version="0" />
|
|
|
2580 |
</port>
|
2581 |
</output>
|
2582 |
</layer>
|
2583 |
+
<layer id="175" name="Constant_31896_compressed" type="Const" version="opset1">
|
2584 |
<data element_type="f16" shape="1, 1, 1280" offset="160161474" size="2560" />
|
2585 |
<output>
|
2586 |
<port id="0" precision="FP16">
|
|
|
2590 |
</port>
|
2591 |
</output>
|
2592 |
</layer>
|
2593 |
+
<layer id="176" name="Constant_31896" type="Convert" version="opset1">
|
2594 |
<data destination_type="f32" />
|
2595 |
<rt_info>
|
2596 |
<attribute name="decompression" version="0" />
|
|
|
2682 |
</port>
|
2683 |
</output>
|
2684 |
</layer>
|
2685 |
+
<layer id="181" name="Constant_31897_compressed" type="Const" version="opset1">
|
2686 |
<data element_type="f16" shape="1, 1, 1280" offset="160164034" size="2560" />
|
2687 |
<output>
|
2688 |
<port id="0" precision="FP16">
|
|
|
2692 |
</port>
|
2693 |
</output>
|
2694 |
</layer>
|
2695 |
+
<layer id="182" name="Constant_31897" type="Convert" version="opset1">
|
2696 |
<data destination_type="f32" />
|
2697 |
<rt_info>
|
2698 |
<attribute name="decompression" version="0" />
|
|
|
2734 |
</port>
|
2735 |
</output>
|
2736 |
</layer>
|
2737 |
+
<layer id="184" name="Constant_31898_compressed" type="Const" version="opset1">
|
2738 |
<data element_type="f16" shape="1, 1, 1280" offset="160166594" size="2560" />
|
2739 |
<output>
|
2740 |
<port id="0" precision="FP16">
|
|
|
2744 |
</port>
|
2745 |
</output>
|
2746 |
</layer>
|
2747 |
+
<layer id="185" name="Constant_31898" type="Convert" version="opset1">
|
2748 |
<data destination_type="f32" />
|
2749 |
<rt_info>
|
2750 |
<attribute name="decompression" version="0" />
|
|
|
2834 |
</port>
|
2835 |
</output>
|
2836 |
</layer>
|
2837 |
+
<layer id="190" name="Constant_31899_compressed" type="Const" version="opset1">
|
2838 |
<data element_type="f16" shape="1, 1, 5120" offset="173276354" size="10240" />
|
2839 |
<output>
|
2840 |
<port id="0" precision="FP16">
|
|
|
2844 |
</port>
|
2845 |
</output>
|
2846 |
</layer>
|
2847 |
+
<layer id="191" name="Constant_31899" type="Convert" version="opset1">
|
2848 |
<data destination_type="f32" />
|
2849 |
<rt_info>
|
2850 |
<attribute name="decompression" version="0" />
|
|
|
2951 |
</port>
|
2952 |
</output>
|
2953 |
</layer>
|
2954 |
+
<layer id="197" name="Constant_31900_compressed" type="Const" version="opset1">
|
2955 |
<data element_type="f16" shape="1, 1, 1280" offset="186393794" size="2560" />
|
2956 |
<output>
|
2957 |
<port id="0" precision="FP16">
|
|
|
2961 |
</port>
|
2962 |
</output>
|
2963 |
</layer>
|
2964 |
+
<layer id="198" name="Constant_31900" type="Convert" version="opset1">
|
2965 |
<data destination_type="f32" />
|
2966 |
<rt_info>
|
2967 |
<attribute name="decompression" version="0" />
|
|
|
3053 |
</port>
|
3054 |
</output>
|
3055 |
</layer>
|
3056 |
+
<layer id="203" name="Constant_31901_compressed" type="Const" version="opset1">
|
3057 |
<data element_type="f16" shape="1, 1, 1280" offset="186396354" size="2560" />
|
3058 |
<output>
|
3059 |
<port id="0" precision="FP16">
|
|
|
3063 |
</port>
|
3064 |
</output>
|
3065 |
</layer>
|
3066 |
+
<layer id="204" name="Constant_31901" type="Convert" version="opset1">
|
3067 |
<data destination_type="f32" />
|
3068 |
<rt_info>
|
3069 |
<attribute name="decompression" version="0" />
|
|
|
3105 |
</port>
|
3106 |
</output>
|
3107 |
</layer>
|
3108 |
+
<layer id="206" name="Constant_31902_compressed" type="Const" version="opset1">
|
3109 |
<data element_type="f16" shape="1, 1, 1280" offset="186398914" size="2560" />
|
3110 |
<output>
|
3111 |
<port id="0" precision="FP16">
|
|
|
3115 |
</port>
|
3116 |
</output>
|
3117 |
</layer>
|
3118 |
+
<layer id="207" name="Constant_31902" type="Convert" version="opset1">
|
3119 |
<data destination_type="f32" />
|
3120 |
<rt_info>
|
3121 |
<attribute name="decompression" version="0" />
|
|
|
3157 |
</port>
|
3158 |
</output>
|
3159 |
</layer>
|
3160 |
+
<layer id="209" name="Constant_31796_compressed" type="Const" version="opset1">
|
3161 |
<data element_type="f16" shape="1280, 1280" offset="186401474" size="3276800" />
|
3162 |
<output>
|
3163 |
<port id="0" precision="FP16">
|
|
|
3166 |
</port>
|
3167 |
</output>
|
3168 |
</layer>
|
3169 |
+
<layer id="210" name="Constant_31796" type="Convert" version="opset1">
|
3170 |
<data destination_type="f32" />
|
3171 |
<rt_info>
|
3172 |
<attribute name="decompression" version="0" />
|
|
|
3184 |
</port>
|
3185 |
</output>
|
3186 |
</layer>
|
3187 |
+
<layer id="211" name="Multiply_31781" type="MatMul" version="opset1">
|
3188 |
<data transpose_a="false" transpose_b="true" />
|
3189 |
<input>
|
3190 |
<port id="0" precision="FP32">
|
|
|
3205 |
</port>
|
3206 |
</output>
|
3207 |
</layer>
|
3208 |
+
<layer id="212" name="Constant_31903_compressed" type="Const" version="opset1">
|
3209 |
<data element_type="f16" shape="1, 1, 1280" offset="189678274" size="2560" />
|
3210 |
<output>
|
3211 |
<port id="0" precision="FP16">
|
|
|
3215 |
</port>
|
3216 |
</output>
|
3217 |
</layer>
|
3218 |
+
<layer id="213" name="Constant_31903" type="Convert" version="opset1">
|
3219 |
<data destination_type="f32" />
|
3220 |
<rt_info>
|
3221 |
<attribute name="decompression" version="0" />
|
|
|
3257 |
</port>
|
3258 |
</output>
|
3259 |
</layer>
|
3260 |
+
<layer id="215" name="Constant_32212" type="Const" version="opset1">
|
3261 |
<data element_type="i64" shape="4" offset="137208364" size="32" />
|
3262 |
<rt_info>
|
3263 |
<attribute name="precise" version="0" />
|
|
|
3366 |
</port>
|
3367 |
</output>
|
3368 |
</layer>
|
3369 |
+
<layer id="222" name="Constant_32213" type="Const" version="opset1">
|
3370 |
<data element_type="i64" shape="4" offset="137208364" size="32" />
|
3371 |
<rt_info>
|
3372 |
<attribute name="precise" version="0" />
|
|
|
3544 |
</port>
|
3545 |
</output>
|
3546 |
</layer>
|
3547 |
+
<layer id="232" name="Constant_31904_compressed" type="Const" version="opset1">
|
3548 |
<data element_type="f16" shape="1, 1, 1280" offset="196234434" size="2560" />
|
3549 |
<output>
|
3550 |
<port id="0" precision="FP16">
|
|
|
3554 |
</port>
|
3555 |
</output>
|
3556 |
</layer>
|
3557 |
+
<layer id="233" name="Constant_31904" type="Convert" version="opset1">
|
3558 |
<data destination_type="f32" />
|
3559 |
<rt_info>
|
3560 |
<attribute name="decompression" version="0" />
|
|
|
3596 |
</port>
|
3597 |
</output>
|
3598 |
</layer>
|
3599 |
+
<layer id="235" name="Constant_32214" type="Const" version="opset1">
|
3600 |
<data element_type="i64" shape="4" offset="137208364" size="32" />
|
3601 |
<rt_info>
|
3602 |
<attribute name="precise" version="0" />
|
|
|
3711 |
</port>
|
3712 |
</output>
|
3713 |
</layer>
|
3714 |
+
<layer id="242" name="Constant_32215" type="Const" version="opset1">
|
3715 |
<data element_type="i64" shape="3" offset="143764602" size="24" />
|
3716 |
<rt_info>
|
3717 |
<attribute name="precise" version="0" />
|
|
|
3791 |
</port>
|
3792 |
</output>
|
3793 |
</layer>
|
3794 |
+
<layer id="247" name="Constant_31905_compressed" type="Const" version="opset1">
|
3795 |
<data element_type="f16" shape="1, 1, 1280" offset="199513794" size="2560" />
|
3796 |
<output>
|
3797 |
<port id="0" precision="FP16">
|
|
|
3801 |
</port>
|
3802 |
</output>
|
3803 |
</layer>
|
3804 |
+
<layer id="248" name="Constant_31905" type="Convert" version="opset1">
|
3805 |
<data destination_type="f32" />
|
3806 |
<rt_info>
|
3807 |
<attribute name="decompression" version="0" />
|
|
|
3893 |
</port>
|
3894 |
</output>
|
3895 |
</layer>
|
3896 |
+
<layer id="253" name="Constant_31906_compressed" type="Const" version="opset1">
|
3897 |
<data element_type="f16" shape="1, 1, 1280" offset="199516354" size="2560" />
|
3898 |
<output>
|
3899 |
<port id="0" precision="FP16">
|
|
|
3903 |
</port>
|
3904 |
</output>
|
3905 |
</layer>
|
3906 |
+
<layer id="254" name="Constant_31906" type="Convert" version="opset1">
|
3907 |
<data destination_type="f32" />
|
3908 |
<rt_info>
|
3909 |
<attribute name="decompression" version="0" />
|
|
|
3945 |
</port>
|
3946 |
</output>
|
3947 |
</layer>
|
3948 |
+
<layer id="256" name="Constant_31907_compressed" type="Const" version="opset1">
|
3949 |
<data element_type="f16" shape="1, 1, 1280" offset="199518914" size="2560" />
|
3950 |
<output>
|
3951 |
<port id="0" precision="FP16">
|
|
|
3955 |
</port>
|
3956 |
</output>
|
3957 |
</layer>
|
3958 |
+
<layer id="257" name="Constant_31907" type="Convert" version="opset1">
|
3959 |
<data destination_type="f32" />
|
3960 |
<rt_info>
|
3961 |
<attribute name="decompression" version="0" />
|
|
|
3997 |
</port>
|
3998 |
</output>
|
3999 |
</layer>
|
4000 |
+
<layer id="259" name="Constant_31799_compressed" type="Const" version="opset1">
|
4001 |
<data element_type="f16" shape="1280, 1280" offset="199521474" size="3276800" />
|
4002 |
<output>
|
4003 |
<port id="0" precision="FP16">
|
|
|
4006 |
</port>
|
4007 |
</output>
|
4008 |
</layer>
|
4009 |
+
<layer id="260" name="Constant_31799" type="Convert" version="opset1">
|
4010 |
<data destination_type="f32" />
|
4011 |
<rt_info>
|
4012 |
<attribute name="decompression" version="0" />
|
|
|
4024 |
</port>
|
4025 |
</output>
|
4026 |
</layer>
|
4027 |
+
<layer id="261" name="Multiply_31785" type="MatMul" version="opset1">
|
4028 |
<data transpose_a="false" transpose_b="true" />
|
4029 |
<input>
|
4030 |
<port id="0" precision="FP32">
|
|
|
4045 |
</port>
|
4046 |
</output>
|
4047 |
</layer>
|
4048 |
+
<layer id="262" name="Constant_31908_compressed" type="Const" version="opset1">
|
4049 |
<data element_type="f16" shape="1, 1, 1280" offset="202798274" size="2560" />
|
4050 |
<output>
|
4051 |
<port id="0" precision="FP16">
|
|
|
4055 |
</port>
|
4056 |
</output>
|
4057 |
</layer>
|
4058 |
+
<layer id="263" name="Constant_31908" type="Convert" version="opset1">
|
4059 |
<data destination_type="f32" />
|
4060 |
<rt_info>
|
4061 |
<attribute name="decompression" version="0" />
|
|
|
4097 |
</port>
|
4098 |
</output>
|
4099 |
</layer>
|
4100 |
+
<layer id="265" name="Constant_32216" type="Const" version="opset1">
|
4101 |
<data element_type="i64" shape="4" offset="137208364" size="32" />
|
4102 |
<rt_info>
|
4103 |
<attribute name="precise" version="0" />
|
|
|
4348 |
</port>
|
4349 |
</output>
|
4350 |
</layer>
|
4351 |
+
<layer id="280" name="Constant_31909_compressed" type="Const" version="opset1">
|
4352 |
<data element_type="f16" shape="1, 1, 1280" offset="209354434" size="2560" />
|
4353 |
<output>
|
4354 |
<port id="0" precision="FP16">
|
|
|
4358 |
</port>
|
4359 |
</output>
|
4360 |
</layer>
|
4361 |
+
<layer id="281" name="Constant_31909" type="Convert" version="opset1">
|
4362 |
<data destination_type="f32" />
|
4363 |
<rt_info>
|
4364 |
<attribute name="decompression" version="0" />
|
|
|
4504 |
</port>
|
4505 |
</output>
|
4506 |
</layer>
|
4507 |
+
<layer id="289" name="Constant_32217" type="Const" version="opset1">
|
4508 |
<data element_type="i64" shape="3" offset="156884650" size="24" />
|
4509 |
<rt_info>
|
4510 |
<attribute name="precise" version="0" />
|
|
|
4584 |
</port>
|
4585 |
</output>
|
4586 |
</layer>
|
4587 |
+
<layer id="294" name="Constant_31910_compressed" type="Const" version="opset1">
|
4588 |
<data element_type="f16" shape="1, 1, 1280" offset="212633794" size="2560" />
|
4589 |
<output>
|
4590 |
<port id="0" precision="FP16">
|
|
|
4594 |
</port>
|
4595 |
</output>
|
4596 |
</layer>
|
4597 |
+
<layer id="295" name="Constant_31910" type="Convert" version="opset1">
|
4598 |
<data destination_type="f32" />
|
4599 |
<rt_info>
|
4600 |
<attribute name="decompression" version="0" />
|
|
|
4686 |
</port>
|
4687 |
</output>
|
4688 |
</layer>
|
4689 |
+
<layer id="300" name="Constant_31911_compressed" type="Const" version="opset1">
|
4690 |
<data element_type="f16" shape="1, 1, 1280" offset="212636354" size="2560" />
|
4691 |
<output>
|
4692 |
<port id="0" precision="FP16">
|
|
|
4696 |
</port>
|
4697 |
</output>
|
4698 |
</layer>
|
4699 |
+
<layer id="301" name="Constant_31911" type="Convert" version="opset1">
|
4700 |
<data destination_type="f32" />
|
4701 |
<rt_info>
|
4702 |
<attribute name="decompression" version="0" />
|
|
|
4738 |
</port>
|
4739 |
</output>
|
4740 |
</layer>
|
4741 |
+
<layer id="303" name="Constant_31912_compressed" type="Const" version="opset1">
|
4742 |
<data element_type="f16" shape="1, 1, 1280" offset="212638914" size="2560" />
|
4743 |
<output>
|
4744 |
<port id="0" precision="FP16">
|
|
|
4748 |
</port>
|
4749 |
</output>
|
4750 |
</layer>
|
4751 |
+
<layer id="304" name="Constant_31912" type="Convert" version="opset1">
|
4752 |
<data destination_type="f32" />
|
4753 |
<rt_info>
|
4754 |
<attribute name="decompression" version="0" />
|
|
|
4838 |
</port>
|
4839 |
</output>
|
4840 |
</layer>
|
4841 |
+
<layer id="309" name="Constant_31913_compressed" type="Const" version="opset1">
|
4842 |
<data element_type="f16" shape="1, 1, 5120" offset="225748674" size="10240" />
|
4843 |
<output>
|
4844 |
<port id="0" precision="FP16">
|
|
|
4848 |
</port>
|
4849 |
</output>
|
4850 |
</layer>
|
4851 |
+
<layer id="310" name="Constant_31913" type="Convert" version="opset1">
|
4852 |
<data destination_type="f32" />
|
4853 |
<rt_info>
|
4854 |
<attribute name="decompression" version="0" />
|
|
|
4955 |
</port>
|
4956 |
</output>
|
4957 |
</layer>
|
4958 |
+
<layer id="316" name="Constant_31914_compressed" type="Const" version="opset1">
|
4959 |
<data element_type="f16" shape="1, 1, 1280" offset="238866114" size="2560" />
|
4960 |
<output>
|
4961 |
<port id="0" precision="FP16">
|
|
|
4965 |
</port>
|
4966 |
</output>
|
4967 |
</layer>
|
4968 |
+
<layer id="317" name="Constant_31914" type="Convert" version="opset1">
|
4969 |
<data destination_type="f32" />
|
4970 |
<rt_info>
|
4971 |
<attribute name="decompression" version="0" />
|
|
|
5057 |
</port>
|
5058 |
</output>
|
5059 |
</layer>
|
5060 |
+
<layer id="322" name="Constant_31915_compressed" type="Const" version="opset1">
|
5061 |
<data element_type="f16" shape="1, 1, 1280" offset="238868674" size="2560" />
|
5062 |
<output>
|
5063 |
<port id="0" precision="FP16">
|
|
|
5067 |
</port>
|
5068 |
</output>
|
5069 |
</layer>
|
5070 |
+
<layer id="323" name="Constant_31915" type="Convert" version="opset1">
|
5071 |
<data destination_type="f32" />
|
5072 |
<rt_info>
|
5073 |
<attribute name="decompression" version="0" />
|
|
|
5109 |
</port>
|
5110 |
</output>
|
5111 |
</layer>
|
5112 |
+
<layer id="325" name="Constant_31916_compressed" type="Const" version="opset1">
|
5113 |
<data element_type="f16" shape="1, 1, 1280" offset="238871234" size="2560" />
|
5114 |
<output>
|
5115 |
<port id="0" precision="FP16">
|
|
|
5119 |
</port>
|
5120 |
</output>
|
5121 |
</layer>
|
5122 |
+
<layer id="326" name="Constant_31916" type="Convert" version="opset1">
|
5123 |
<data destination_type="f32" />
|
5124 |
<rt_info>
|
5125 |
<attribute name="decompression" version="0" />
|
|
|
5182 |
</port>
|
5183 |
</output>
|
5184 |
</layer>
|
5185 |
+
<layer id="329" name="Result_26703" type="Result" version="opset1">
|
5186 |
<input>
|
5187 |
<port id="0" precision="FP32">
|
5188 |
<dim>-1</dim>
|
|
|
5558 |
<edge from-layer="328" from-port="2" to-layer="329" to-port="0" />
|
5559 |
</edges>
|
5560 |
<rt_info>
|
5561 |
+
<Runtime_version value="2024.5.0-17285-ea5c1dcfdf9-releases/2024/5" />
|
5562 |
<conversion_parameters>
|
5563 |
<framework value="pytorch" />
|
5564 |
<is_python_object value="True" />
|
5565 |
</conversion_parameters>
|
5566 |
<optimum>
|
5567 |
+
<optimum_intel_version value="1.21.0.dev0+d357376" />
|
5568 |
+
<optimum_version value="1.23.3" />
|
5569 |
+
<pytorch_version value="2.5.1" />
|
5570 |
+
<transformers_version value="4.46.3" />
|
5571 |
</optimum>
|
5572 |
</rt_info>
|
5573 |
</net>
|
openvino_detokenizer.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 528306
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1c95aa7a4b53ecb3768d2a6608aa9e419059aef1c75b9b99e6b1c56328281c18
|
3 |
size 528306
|
openvino_detokenizer.xml
CHANGED
@@ -1,16 +1,16 @@
|
|
1 |
<?xml version="1.0"?>
|
2 |
<net name="detokenizer" version="11">
|
3 |
<layers>
|
4 |
-
<layer id="0" name="
|
5 |
<data shape="?,?" element_type="i64" />
|
6 |
<output>
|
7 |
-
<port id="0" precision="I64" names="
|
8 |
<dim>-1</dim>
|
9 |
<dim>-1</dim>
|
10 |
</port>
|
11 |
</output>
|
12 |
</layer>
|
13 |
-
<layer id="1" name="
|
14 |
<data destination_type="i32" />
|
15 |
<input>
|
16 |
<port id="0" precision="I64">
|
@@ -25,7 +25,7 @@
|
|
25 |
</port>
|
26 |
</output>
|
27 |
</layer>
|
28 |
-
<layer id="2" name="
|
29 |
<data element_type="u8" shape="528257" offset="0" size="528257" />
|
30 |
<output>
|
31 |
<port id="0" precision="U8">
|
@@ -33,7 +33,7 @@
|
|
33 |
</port>
|
34 |
</output>
|
35 |
</layer>
|
36 |
-
<layer id="3" name="
|
37 |
<data mode="begins_ends" />
|
38 |
<input>
|
39 |
<port id="0" precision="U8">
|
@@ -52,7 +52,7 @@
|
|
52 |
</port>
|
53 |
</output>
|
54 |
</layer>
|
55 |
-
<layer id="4" name="
|
56 |
<data skip_tokens="50257, 50258, 50259, 50260, 50261, 50262, 50263, 50264, 50265, 50266, 50267, 50268, 50269, 50270, 50271, 50272, 50273, 50274, 50275, 50276, 50277, 50278, 50279, 50280, 50281, 50282, 50283, 50284, 50285, 50286, 50287, 50288, 50289, 50290, 50291, 50292, 50293, 50294, 50295, 50296, 50297, 50298, 50299, 50300, 50301, 50302, 50303, 50304, 50305, 50306, 50307, 50308, 50309, 50310, 50311, 50312, 50313, 50314, 50315, 50316, 50317, 50318, 50319, 50320, 50321, 50322, 50323, 50324, 50325, 50326, 50327, 50328, 50329, 50330, 50331, 50332, 50333, 50334, 50335, 50336, 50337, 50338, 50339, 50340, 50341, 50342, 50343, 50344, 50345, 50346, 50347, 50348, 50349, 50350, 50351, 50352, 50353, 50354, 50355, 50356, 50357, 50358, 50359, 50360, 50361, 50362, 50363, 50364" />
|
57 |
<input>
|
58 |
<port id="0" precision="I32">
|
@@ -87,7 +87,7 @@
|
|
87 |
</port>
|
88 |
</output>
|
89 |
</layer>
|
90 |
-
<layer id="5" name="
|
91 |
<input>
|
92 |
<port id="0" precision="I32">
|
93 |
<dim>-1</dim>
|
@@ -111,7 +111,7 @@
|
|
111 |
</port>
|
112 |
</output>
|
113 |
</layer>
|
114 |
-
<layer id="6" name="
|
115 |
<data element_type="u8" shape="47" offset="528257" size="47" />
|
116 |
<output>
|
117 |
<port id="0" precision="U8">
|
@@ -119,7 +119,7 @@
|
|
119 |
</port>
|
120 |
</output>
|
121 |
</layer>
|
122 |
-
<layer id="7" name="
|
123 |
<data element_type="u8" shape="2" offset="528304" size="2" />
|
124 |
<output>
|
125 |
<port id="0" precision="U8">
|
@@ -127,7 +127,7 @@
|
|
127 |
</port>
|
128 |
</output>
|
129 |
</layer>
|
130 |
-
<layer id="8" name="
|
131 |
<data global_replace="true" />
|
132 |
<input>
|
133 |
<port id="0" precision="I32">
|
@@ -158,7 +158,7 @@
|
|
158 |
</port>
|
159 |
</output>
|
160 |
</layer>
|
161 |
-
<layer id="9" name="
|
162 |
<data mode="begins_ends" />
|
163 |
<input>
|
164 |
<port id="0" precision="I32">
|
@@ -177,7 +177,7 @@
|
|
177 |
</port>
|
178 |
</output>
|
179 |
</layer>
|
180 |
-
<layer id="10" name="
|
181 |
<input>
|
182 |
<port id="0" precision="STRING">
|
183 |
<dim>-1</dim>
|
@@ -207,9 +207,29 @@
|
|
207 |
<edge from-layer="9" from-port="3" to-layer="10" to-port="0" />
|
208 |
</edges>
|
209 |
<rt_info>
|
|
|
|
|
|
|
210 |
<bos_token_id value="50257" />
|
|
|
|
|
211 |
<eos_token_id value="50257" />
|
|
|
|
|
|
|
|
|
212 |
<original_tokenizer_class value="<class 'transformers.models.whisper.tokenization_whisper_fast.WhisperTokenizerFast'>" />
|
213 |
<pad_token_id value="50257" />
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
214 |
</rt_info>
|
215 |
</net>
|
|
|
1 |
<?xml version="1.0"?>
|
2 |
<net name="detokenizer" version="11">
|
3 |
<layers>
|
4 |
+
<layer id="0" name="Parameter_33580" type="Parameter" version="opset1">
|
5 |
<data shape="?,?" element_type="i64" />
|
6 |
<output>
|
7 |
+
<port id="0" precision="I64" names="Parameter_33580">
|
8 |
<dim>-1</dim>
|
9 |
<dim>-1</dim>
|
10 |
</port>
|
11 |
</output>
|
12 |
</layer>
|
13 |
+
<layer id="1" name="Convert_33596" type="Convert" version="opset1">
|
14 |
<data destination_type="i32" />
|
15 |
<input>
|
16 |
<port id="0" precision="I64">
|
|
|
25 |
</port>
|
26 |
</output>
|
27 |
</layer>
|
28 |
+
<layer id="2" name="Constant_33541" type="Const" version="opset1">
|
29 |
<data element_type="u8" shape="528257" offset="0" size="528257" />
|
30 |
<output>
|
31 |
<port id="0" precision="U8">
|
|
|
33 |
</port>
|
34 |
</output>
|
35 |
</layer>
|
36 |
+
<layer id="3" name="StringTensorUnpack_33542" type="StringTensorUnpack" version="extension">
|
37 |
<data mode="begins_ends" />
|
38 |
<input>
|
39 |
<port id="0" precision="U8">
|
|
|
52 |
</port>
|
53 |
</output>
|
54 |
</layer>
|
55 |
+
<layer id="4" name="VocabDecoder_33581" type="VocabDecoder" version="extension">
|
56 |
<data skip_tokens="50257, 50258, 50259, 50260, 50261, 50262, 50263, 50264, 50265, 50266, 50267, 50268, 50269, 50270, 50271, 50272, 50273, 50274, 50275, 50276, 50277, 50278, 50279, 50280, 50281, 50282, 50283, 50284, 50285, 50286, 50287, 50288, 50289, 50290, 50291, 50292, 50293, 50294, 50295, 50296, 50297, 50298, 50299, 50300, 50301, 50302, 50303, 50304, 50305, 50306, 50307, 50308, 50309, 50310, 50311, 50312, 50313, 50314, 50315, 50316, 50317, 50318, 50319, 50320, 50321, 50322, 50323, 50324, 50325, 50326, 50327, 50328, 50329, 50330, 50331, 50332, 50333, 50334, 50335, 50336, 50337, 50338, 50339, 50340, 50341, 50342, 50343, 50344, 50345, 50346, 50347, 50348, 50349, 50350, 50351, 50352, 50353, 50354, 50355, 50356, 50357, 50358, 50359, 50360, 50361, 50362, 50363, 50364" />
|
57 |
<input>
|
58 |
<port id="0" precision="I32">
|
|
|
87 |
</port>
|
88 |
</output>
|
89 |
</layer>
|
90 |
+
<layer id="5" name="FuzeRagged_33582" type="FuzeRagged" version="extension">
|
91 |
<input>
|
92 |
<port id="0" precision="I32">
|
93 |
<dim>-1</dim>
|
|
|
111 |
</port>
|
112 |
</output>
|
113 |
</layer>
|
114 |
+
<layer id="6" name="Constant_33584" type="Const" version="opset1">
|
115 |
<data element_type="u8" shape="47" offset="528257" size="47" />
|
116 |
<output>
|
117 |
<port id="0" precision="U8">
|
|
|
119 |
</port>
|
120 |
</output>
|
121 |
</layer>
|
122 |
+
<layer id="7" name="Constant_33586" type="Const" version="opset1">
|
123 |
<data element_type="u8" shape="2" offset="528304" size="2" />
|
124 |
<output>
|
125 |
<port id="0" precision="U8">
|
|
|
127 |
</port>
|
128 |
</output>
|
129 |
</layer>
|
130 |
+
<layer id="8" name="RegexNormalization_33587" type="RegexNormalization" version="extension">
|
131 |
<data global_replace="true" />
|
132 |
<input>
|
133 |
<port id="0" precision="I32">
|
|
|
158 |
</port>
|
159 |
</output>
|
160 |
</layer>
|
161 |
+
<layer id="9" name="StringTensorPack_33588" type="StringTensorPack" version="extension">
|
162 |
<data mode="begins_ends" />
|
163 |
<input>
|
164 |
<port id="0" precision="I32">
|
|
|
177 |
</port>
|
178 |
</output>
|
179 |
</layer>
|
180 |
+
<layer id="10" name="Result_33589" type="Result" version="opset1">
|
181 |
<input>
|
182 |
<port id="0" precision="STRING">
|
183 |
<dim>-1</dim>
|
|
|
207 |
<edge from-layer="9" from-port="3" to-layer="10" to-port="0" />
|
208 |
</edges>
|
209 |
<rt_info>
|
210 |
+
<add_attention_mask value="True" />
|
211 |
+
<add_prefix_space />
|
212 |
+
<add_special_tokens value="True" />
|
213 |
<bos_token_id value="50257" />
|
214 |
+
<clean_up_tokenization_spaces />
|
215 |
+
<detokenizer_input_type value="i64" />
|
216 |
<eos_token_id value="50257" />
|
217 |
+
<handle_special_tokens_with_re />
|
218 |
+
<number_of_inputs value="1" />
|
219 |
+
<openvino_tokenizers_version value="2024.5.0.0" />
|
220 |
+
<openvino_version value="2024.5.0" />
|
221 |
<original_tokenizer_class value="<class 'transformers.models.whisper.tokenization_whisper_fast.WhisperTokenizerFast'>" />
|
222 |
<pad_token_id value="50257" />
|
223 |
+
<sentencepiece_version value="0.2.0" />
|
224 |
+
<skip_special_tokens value="True" />
|
225 |
+
<streaming_detokenizer value="False" />
|
226 |
+
<tiktoken_version value="0.8.0" />
|
227 |
+
<tokenizer_output_type value="i64" />
|
228 |
+
<tokenizers_version value="0.20.3" />
|
229 |
+
<transformers_version value="4.46.3" />
|
230 |
+
<use_max_padding value="False" />
|
231 |
+
<use_sentencepiece_backend value="False" />
|
232 |
+
<utf8_replace_mode />
|
233 |
+
<with_detokenizer value="True" />
|
234 |
</rt_info>
|
235 |
</net>
|
openvino_encoder_model.xml
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
openvino_tokenizer.xml
CHANGED
@@ -1,27 +1,27 @@
|
|
1 |
<?xml version="1.0"?>
|
2 |
<net name="tokenizer" version="11">
|
3 |
<layers>
|
4 |
-
<layer id="0" name="
|
5 |
<data shape="?" element_type="string" />
|
6 |
<output>
|
7 |
-
<port id="0" precision="STRING" names="
|
8 |
<dim>-1</dim>
|
9 |
</port>
|
10 |
</output>
|
11 |
</layer>
|
12 |
-
<layer id="1" name="
|
13 |
<data element_type="i32" shape="" offset="0" size="4" />
|
14 |
<output>
|
15 |
<port id="0" precision="I32" />
|
16 |
</output>
|
17 |
</layer>
|
18 |
-
<layer id="2" name="
|
19 |
<data element_type="i32" shape="" offset="4" size="4" />
|
20 |
<output>
|
21 |
<port id="0" precision="I32" />
|
22 |
</output>
|
23 |
</layer>
|
24 |
-
<layer id="3" name="
|
25 |
<data element_type="i32" shape="1" offset="8" size="4" />
|
26 |
<output>
|
27 |
<port id="0" precision="I32">
|
@@ -29,19 +29,19 @@
|
|
29 |
</port>
|
30 |
</output>
|
31 |
</layer>
|
32 |
-
<layer id="4" name="
|
33 |
<data element_type="i32" shape="" offset="0" size="4" />
|
34 |
<output>
|
35 |
<port id="0" precision="I32" />
|
36 |
</output>
|
37 |
</layer>
|
38 |
-
<layer id="5" name="
|
39 |
<data element_type="i32" shape="" offset="4" size="4" />
|
40 |
<output>
|
41 |
<port id="0" precision="I32" />
|
42 |
</output>
|
43 |
</layer>
|
44 |
-
<layer id="6" name="
|
45 |
<data element_type="i32" shape="1" offset="12" size="4" />
|
46 |
<output>
|
47 |
<port id="0" precision="I32">
|
@@ -49,13 +49,13 @@
|
|
49 |
</port>
|
50 |
</output>
|
51 |
</layer>
|
52 |
-
<layer id="7" name="
|
53 |
<data element_type="i64" shape="" offset="16" size="8" />
|
54 |
<output>
|
55 |
<port id="0" precision="I64" />
|
56 |
</output>
|
57 |
</layer>
|
58 |
-
<layer id="8" name="
|
59 |
<data mode="begins_ends" />
|
60 |
<input>
|
61 |
<port id="0" precision="STRING">
|
@@ -74,7 +74,7 @@
|
|
74 |
</port>
|
75 |
</output>
|
76 |
</layer>
|
77 |
-
<layer id="9" name="
|
78 |
<data output_type="i64" />
|
79 |
<input>
|
80 |
<port id="0" precision="I32">
|
@@ -87,19 +87,19 @@
|
|
87 |
</port>
|
88 |
</output>
|
89 |
</layer>
|
90 |
-
<layer id="10" name="
|
91 |
<data element_type="i64" shape="" offset="16" size="8" />
|
92 |
<output>
|
93 |
<port id="0" precision="I64" />
|
94 |
</output>
|
95 |
</layer>
|
96 |
-
<layer id="11" name="
|
97 |
<data element_type="i64" shape="" offset="16" size="8" />
|
98 |
<output>
|
99 |
<port id="0" precision="I64" />
|
100 |
</output>
|
101 |
</layer>
|
102 |
-
<layer id="12" name="
|
103 |
<data batch_dims="0" />
|
104 |
<input>
|
105 |
<port id="0" precision="I64">
|
@@ -112,13 +112,13 @@
|
|
112 |
<port id="3" precision="I64" />
|
113 |
</output>
|
114 |
</layer>
|
115 |
-
<layer id="13" name="
|
116 |
<data element_type="i64" shape="" offset="24" size="8" />
|
117 |
<output>
|
118 |
<port id="0" precision="I64" />
|
119 |
</output>
|
120 |
</layer>
|
121 |
-
<layer id="14" name="
|
122 |
<data output_type="i32" />
|
123 |
<input>
|
124 |
<port id="0" precision="I64" />
|
@@ -131,19 +131,19 @@
|
|
131 |
</port>
|
132 |
</output>
|
133 |
</layer>
|
134 |
-
<layer id="15" name="
|
135 |
<data element_type="i64" shape="" offset="24" size="8" />
|
136 |
<output>
|
137 |
<port id="0" precision="I64" />
|
138 |
</output>
|
139 |
</layer>
|
140 |
-
<layer id="16" name="
|
141 |
<data element_type="i64" shape="" offset="24" size="8" />
|
142 |
<output>
|
143 |
<port id="0" precision="I64" />
|
144 |
</output>
|
145 |
</layer>
|
146 |
-
<layer id="17" name="
|
147 |
<data auto_broadcast="numpy" />
|
148 |
<input>
|
149 |
<port id="0" precision="I64" />
|
@@ -153,13 +153,13 @@
|
|
153 |
<port id="2" precision="I64" />
|
154 |
</output>
|
155 |
</layer>
|
156 |
-
<layer id="18" name="
|
157 |
<data element_type="i64" shape="" offset="24" size="8" />
|
158 |
<output>
|
159 |
<port id="0" precision="I64" />
|
160 |
</output>
|
161 |
</layer>
|
162 |
-
<layer id="19" name="
|
163 |
<data output_type="i32" />
|
164 |
<input>
|
165 |
<port id="0" precision="I64" />
|
@@ -172,7 +172,7 @@
|
|
172 |
</port>
|
173 |
</output>
|
174 |
</layer>
|
175 |
-
<layer id="20" name="
|
176 |
<data element_type="u8" shape="26491" offset="32" size="26491" />
|
177 |
<output>
|
178 |
<port id="0" precision="U8">
|
@@ -180,7 +180,7 @@
|
|
180 |
</port>
|
181 |
</output>
|
182 |
</layer>
|
183 |
-
<layer id="21" name="
|
184 |
<input>
|
185 |
<port id="0" precision="I32">
|
186 |
<dim>-1</dim>
|
@@ -222,7 +222,7 @@
|
|
222 |
</port>
|
223 |
</output>
|
224 |
</layer>
|
225 |
-
<layer id="22" name="
|
226 |
<data element_type="u8" shape="64" offset="26523" size="64" />
|
227 |
<output>
|
228 |
<port id="0" precision="U8">
|
@@ -230,7 +230,7 @@
|
|
230 |
</port>
|
231 |
</output>
|
232 |
</layer>
|
233 |
-
<layer id="23" name="
|
234 |
<data behaviour="isolate" invert="false" max_splits="-1" />
|
235 |
<input>
|
236 |
<port id="0" precision="I32">
|
@@ -276,7 +276,7 @@
|
|
276 |
</port>
|
277 |
</output>
|
278 |
</layer>
|
279 |
-
<layer id="24" name="
|
280 |
<data element_type="u8" shape="528257" offset="26587" size="528257" />
|
281 |
<output>
|
282 |
<port id="0" precision="U8">
|
@@ -284,7 +284,7 @@
|
|
284 |
</port>
|
285 |
</output>
|
286 |
</layer>
|
287 |
-
<layer id="25" name="
|
288 |
<data mode="begins_ends" />
|
289 |
<input>
|
290 |
<port id="0" precision="U8">
|
@@ -303,7 +303,7 @@
|
|
303 |
</port>
|
304 |
</output>
|
305 |
</layer>
|
306 |
-
<layer id="26" name="
|
307 |
<data element_type="u8" shape="369958" offset="554844" size="369958" />
|
308 |
<output>
|
309 |
<port id="0" precision="U8">
|
@@ -311,7 +311,7 @@
|
|
311 |
</port>
|
312 |
</output>
|
313 |
</layer>
|
314 |
-
<layer id="27" name="
|
315 |
<data mode="begins_ends" />
|
316 |
<input>
|
317 |
<port id="0" precision="U8">
|
@@ -330,7 +330,7 @@
|
|
330 |
</port>
|
331 |
</output>
|
332 |
</layer>
|
333 |
-
<layer id="28" name="
|
334 |
<data element_type="u8" shape="336859" offset="924802" size="336859" />
|
335 |
<output>
|
336 |
<port id="0" precision="U8">
|
@@ -338,7 +338,7 @@
|
|
338 |
</port>
|
339 |
</output>
|
340 |
</layer>
|
341 |
-
<layer id="29" name="
|
342 |
<data mode="begins_ends" />
|
343 |
<input>
|
344 |
<port id="0" precision="U8">
|
@@ -357,7 +357,7 @@
|
|
357 |
</port>
|
358 |
</output>
|
359 |
</layer>
|
360 |
-
<layer id="30" name="
|
361 |
<data element_type="u8" shape="20172" offset="1261661" size="20172" />
|
362 |
<output>
|
363 |
<port id="0" precision="U8">
|
@@ -365,7 +365,7 @@
|
|
365 |
</port>
|
366 |
</output>
|
367 |
</layer>
|
368 |
-
<layer id="31" name="
|
369 |
<data mode="begins_ends" />
|
370 |
<input>
|
371 |
<port id="0" precision="U8">
|
@@ -384,7 +384,7 @@
|
|
384 |
</port>
|
385 |
</output>
|
386 |
</layer>
|
387 |
-
<layer id="32" name="
|
388 |
<data element_type="i32" shape="1609" offset="1281833" size="6436" />
|
389 |
<output>
|
390 |
<port id="0" precision="I32">
|
@@ -392,7 +392,7 @@
|
|
392 |
</port>
|
393 |
</output>
|
394 |
</layer>
|
395 |
-
<layer id="33" name="
|
396 |
<data unk_token="" fuse_unk="false" suffix_indicator="" end_suffix="" byte_fallback="false" cache_capacity="20000" />
|
397 |
<input>
|
398 |
<port id="0" precision="I32">
|
@@ -462,7 +462,7 @@
|
|
462 |
</port>
|
463 |
</output>
|
464 |
</layer>
|
465 |
-
<layer id="34" name="
|
466 |
<data auto_broadcast="numpy" />
|
467 |
<input>
|
468 |
<port id="0" precision="I32">
|
@@ -478,13 +478,13 @@
|
|
478 |
</port>
|
479 |
</output>
|
480 |
</layer>
|
481 |
-
<layer id="35" name="
|
482 |
<data element_type="i32" shape="" offset="1288269" size="4" />
|
483 |
<output>
|
484 |
<port id="0" precision="I32" />
|
485 |
</output>
|
486 |
</layer>
|
487 |
-
<layer id="36" name="
|
488 |
<data auto_broadcast="numpy" />
|
489 |
<input>
|
490 |
<port id="0" precision="I32">
|
@@ -498,7 +498,7 @@
|
|
498 |
</port>
|
499 |
</output>
|
500 |
</layer>
|
501 |
-
<layer id="37" name="
|
502 |
<data auto_broadcast="numpy" />
|
503 |
<input>
|
504 |
<port id="0" precision="I32">
|
@@ -514,19 +514,19 @@
|
|
514 |
</port>
|
515 |
</output>
|
516 |
</layer>
|
517 |
-
<layer id="38" name="
|
518 |
<data element_type="i32" shape="" offset="0" size="4" />
|
519 |
<output>
|
520 |
<port id="0" precision="I32" />
|
521 |
</output>
|
522 |
</layer>
|
523 |
-
<layer id="39" name="
|
524 |
<data element_type="i32" shape="" offset="4" size="4" />
|
525 |
<output>
|
526 |
<port id="0" precision="I32" />
|
527 |
</output>
|
528 |
</layer>
|
529 |
-
<layer id="40" name="
|
530 |
<data element_type="i32" shape="1" offset="1288273" size="4" />
|
531 |
<output>
|
532 |
<port id="0" precision="I32">
|
@@ -534,7 +534,7 @@
|
|
534 |
</port>
|
535 |
</output>
|
536 |
</layer>
|
537 |
-
<layer id="41" name="
|
538 |
<data element_type="i32" shape="4" offset="1288277" size="16" />
|
539 |
<output>
|
540 |
<port id="0" precision="I32">
|
@@ -542,7 +542,7 @@
|
|
542 |
</port>
|
543 |
</output>
|
544 |
</layer>
|
545 |
-
<layer id="42" name="
|
546 |
<input>
|
547 |
<port id="0" precision="I32" />
|
548 |
<port id="1" precision="I32" />
|
@@ -593,7 +593,7 @@
|
|
593 |
</port>
|
594 |
</output>
|
595 |
</layer>
|
596 |
-
<layer id="43" name="
|
597 |
<data auto_broadcast="numpy" />
|
598 |
<input>
|
599 |
<port id="0" precision="I32">
|
@@ -609,13 +609,13 @@
|
|
609 |
</port>
|
610 |
</output>
|
611 |
</layer>
|
612 |
-
<layer id="44" name="
|
613 |
<data element_type="i32" shape="" offset="0" size="4" />
|
614 |
<output>
|
615 |
<port id="0" precision="I32" />
|
616 |
</output>
|
617 |
</layer>
|
618 |
-
<layer id="45" name="
|
619 |
<data keep_dims="false" />
|
620 |
<input>
|
621 |
<port id="0" precision="I32">
|
@@ -627,13 +627,13 @@
|
|
627 |
<port id="2" precision="I32" />
|
628 |
</output>
|
629 |
</layer>
|
630 |
-
<layer id="46" name="
|
631 |
<data element_type="i32" shape="" offset="1288273" size="4" />
|
632 |
<output>
|
633 |
<port id="0" precision="I32" />
|
634 |
</output>
|
635 |
</layer>
|
636 |
-
<layer id="47" name="
|
637 |
<data pad_right="true" />
|
638 |
<input>
|
639 |
<port id="0" precision="I32">
|
@@ -659,7 +659,7 @@
|
|
659 |
</port>
|
660 |
</output>
|
661 |
</layer>
|
662 |
-
<layer id="48" name="
|
663 |
<data destination_type="i32" />
|
664 |
<input>
|
665 |
<port id="0" precision="BOOL">
|
@@ -674,7 +674,7 @@
|
|
674 |
</port>
|
675 |
</output>
|
676 |
</layer>
|
677 |
-
<layer id="49" name="
|
678 |
<data destination_type="i64" />
|
679 |
<input>
|
680 |
<port id="0" precision="I32">
|
@@ -689,7 +689,7 @@
|
|
689 |
</port>
|
690 |
</output>
|
691 |
</layer>
|
692 |
-
<layer id="51" name="
|
693 |
<data destination_type="i64" />
|
694 |
<input>
|
695 |
<port id="0" precision="I32">
|
@@ -704,7 +704,7 @@
|
|
704 |
</port>
|
705 |
</output>
|
706 |
</layer>
|
707 |
-
<layer id="52" name="
|
708 |
<input>
|
709 |
<port id="0" precision="I64">
|
710 |
<dim>-1</dim>
|
@@ -712,7 +712,7 @@
|
|
712 |
</port>
|
713 |
</input>
|
714 |
</layer>
|
715 |
-
<layer id="50" name="
|
716 |
<input>
|
717 |
<port id="0" precision="I64">
|
718 |
<dim>-1</dim>
|
@@ -805,9 +805,29 @@
|
|
805 |
<edge from-layer="51" from-port="1" to-layer="52" to-port="0" />
|
806 |
</edges>
|
807 |
<rt_info>
|
|
|
|
|
|
|
808 |
<bos_token_id value="50257" />
|
|
|
|
|
809 |
<eos_token_id value="50257" />
|
|
|
|
|
|
|
|
|
810 |
<original_tokenizer_class value="<class 'transformers.models.whisper.tokenization_whisper_fast.WhisperTokenizerFast'>" />
|
811 |
<pad_token_id value="50257" />
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
812 |
</rt_info>
|
813 |
</net>
|
|
|
1 |
<?xml version="1.0"?>
|
2 |
<net name="tokenizer" version="11">
|
3 |
<layers>
|
4 |
+
<layer id="0" name="Parameter_33460" type="Parameter" version="opset1">
|
5 |
<data shape="?" element_type="string" />
|
6 |
<output>
|
7 |
+
<port id="0" precision="STRING" names="Parameter_33460">
|
8 |
<dim>-1</dim>
|
9 |
</port>
|
10 |
</output>
|
11 |
</layer>
|
12 |
+
<layer id="1" name="Constant_33558" type="Const" version="opset1">
|
13 |
<data element_type="i32" shape="" offset="0" size="4" />
|
14 |
<output>
|
15 |
<port id="0" precision="I32" />
|
16 |
</output>
|
17 |
</layer>
|
18 |
+
<layer id="2" name="Constant_33559" type="Const" version="opset1">
|
19 |
<data element_type="i32" shape="" offset="4" size="4" />
|
20 |
<output>
|
21 |
<port id="0" precision="I32" />
|
22 |
</output>
|
23 |
</layer>
|
24 |
+
<layer id="3" name="Constant_33560" type="Const" version="opset1">
|
25 |
<data element_type="i32" shape="1" offset="8" size="4" />
|
26 |
<output>
|
27 |
<port id="0" precision="I32">
|
|
|
29 |
</port>
|
30 |
</output>
|
31 |
</layer>
|
32 |
+
<layer id="4" name="Constant_33561" type="Const" version="opset1">
|
33 |
<data element_type="i32" shape="" offset="0" size="4" />
|
34 |
<output>
|
35 |
<port id="0" precision="I32" />
|
36 |
</output>
|
37 |
</layer>
|
38 |
+
<layer id="5" name="Constant_33562" type="Const" version="opset1">
|
39 |
<data element_type="i32" shape="" offset="4" size="4" />
|
40 |
<output>
|
41 |
<port id="0" precision="I32" />
|
42 |
</output>
|
43 |
</layer>
|
44 |
+
<layer id="6" name="Constant_33563" type="Const" version="opset1">
|
45 |
<data element_type="i32" shape="1" offset="12" size="4" />
|
46 |
<output>
|
47 |
<port id="0" precision="I32">
|
|
|
49 |
</port>
|
50 |
</output>
|
51 |
</layer>
|
52 |
+
<layer id="7" name="Constant_33466" type="Const" version="opset1">
|
53 |
<data element_type="i64" shape="" offset="16" size="8" />
|
54 |
<output>
|
55 |
<port id="0" precision="I64" />
|
56 |
</output>
|
57 |
</layer>
|
58 |
+
<layer id="8" name="StringTensorUnpack_33461" type="StringTensorUnpack" version="extension">
|
59 |
<data mode="begins_ends" />
|
60 |
<input>
|
61 |
<port id="0" precision="STRING">
|
|
|
74 |
</port>
|
75 |
</output>
|
76 |
</layer>
|
77 |
+
<layer id="9" name="ShapeOf_33462" type="ShapeOf" version="opset3">
|
78 |
<data output_type="i64" />
|
79 |
<input>
|
80 |
<port id="0" precision="I32">
|
|
|
87 |
</port>
|
88 |
</output>
|
89 |
</layer>
|
90 |
+
<layer id="10" name="Constant_33463" type="Const" version="opset1">
|
91 |
<data element_type="i64" shape="" offset="16" size="8" />
|
92 |
<output>
|
93 |
<port id="0" precision="I64" />
|
94 |
</output>
|
95 |
</layer>
|
96 |
+
<layer id="11" name="Constant_33464" type="Const" version="opset1">
|
97 |
<data element_type="i64" shape="" offset="16" size="8" />
|
98 |
<output>
|
99 |
<port id="0" precision="I64" />
|
100 |
</output>
|
101 |
</layer>
|
102 |
+
<layer id="12" name="Gather_33465" type="Gather" version="opset8">
|
103 |
<data batch_dims="0" />
|
104 |
<input>
|
105 |
<port id="0" precision="I64">
|
|
|
112 |
<port id="3" precision="I64" />
|
113 |
</output>
|
114 |
</layer>
|
115 |
+
<layer id="13" name="Constant_33467" type="Const" version="opset1">
|
116 |
<data element_type="i64" shape="" offset="24" size="8" />
|
117 |
<output>
|
118 |
<port id="0" precision="I64" />
|
119 |
</output>
|
120 |
</layer>
|
121 |
+
<layer id="14" name="Range_33468" type="Range" version="opset4">
|
122 |
<data output_type="i32" />
|
123 |
<input>
|
124 |
<port id="0" precision="I64" />
|
|
|
131 |
</port>
|
132 |
</output>
|
133 |
</layer>
|
134 |
+
<layer id="15" name="Constant_33469" type="Const" version="opset1">
|
135 |
<data element_type="i64" shape="" offset="24" size="8" />
|
136 |
<output>
|
137 |
<port id="0" precision="I64" />
|
138 |
</output>
|
139 |
</layer>
|
140 |
+
<layer id="16" name="Constant_33470" type="Const" version="opset1">
|
141 |
<data element_type="i64" shape="" offset="24" size="8" />
|
142 |
<output>
|
143 |
<port id="0" precision="I64" />
|
144 |
</output>
|
145 |
</layer>
|
146 |
+
<layer id="17" name="Add_33471" type="Add" version="opset1">
|
147 |
<data auto_broadcast="numpy" />
|
148 |
<input>
|
149 |
<port id="0" precision="I64" />
|
|
|
153 |
<port id="2" precision="I64" />
|
154 |
</output>
|
155 |
</layer>
|
156 |
+
<layer id="18" name="Constant_33472" type="Const" version="opset1">
|
157 |
<data element_type="i64" shape="" offset="24" size="8" />
|
158 |
<output>
|
159 |
<port id="0" precision="I64" />
|
160 |
</output>
|
161 |
</layer>
|
162 |
+
<layer id="19" name="Range_33473" type="Range" version="opset4">
|
163 |
<data output_type="i32" />
|
164 |
<input>
|
165 |
<port id="0" precision="I64" />
|
|
|
172 |
</port>
|
173 |
</output>
|
174 |
</layer>
|
175 |
+
<layer id="20" name="Constant_33535" type="Const" version="opset1">
|
176 |
<data element_type="u8" shape="26491" offset="32" size="26491" />
|
177 |
<output>
|
178 |
<port id="0" precision="U8">
|
|
|
180 |
</port>
|
181 |
</output>
|
182 |
</layer>
|
183 |
+
<layer id="21" name="SpecialTokensSplit_33536" type="SpecialTokensSplit" version="extension">
|
184 |
<input>
|
185 |
<port id="0" precision="I32">
|
186 |
<dim>-1</dim>
|
|
|
222 |
</port>
|
223 |
</output>
|
224 |
</layer>
|
225 |
+
<layer id="22" name="Constant_33538" type="Const" version="opset1">
|
226 |
<data element_type="u8" shape="64" offset="26523" size="64" />
|
227 |
<output>
|
228 |
<port id="0" precision="U8">
|
|
|
230 |
</port>
|
231 |
</output>
|
232 |
</layer>
|
233 |
+
<layer id="23" name="RegexSplit_33539" type="RegexSplit" version="extension">
|
234 |
<data behaviour="isolate" invert="false" max_splits="-1" />
|
235 |
<input>
|
236 |
<port id="0" precision="I32">
|
|
|
276 |
</port>
|
277 |
</output>
|
278 |
</layer>
|
279 |
+
<layer id="24" name="Constant_33541" type="Const" version="opset1">
|
280 |
<data element_type="u8" shape="528257" offset="26587" size="528257" />
|
281 |
<output>
|
282 |
<port id="0" precision="U8">
|
|
|
284 |
</port>
|
285 |
</output>
|
286 |
</layer>
|
287 |
+
<layer id="25" name="StringTensorUnpack_33542" type="StringTensorUnpack" version="extension">
|
288 |
<data mode="begins_ends" />
|
289 |
<input>
|
290 |
<port id="0" precision="U8">
|
|
|
303 |
</port>
|
304 |
</output>
|
305 |
</layer>
|
306 |
+
<layer id="26" name="Constant_33547" type="Const" version="opset1">
|
307 |
<data element_type="u8" shape="369958" offset="554844" size="369958" />
|
308 |
<output>
|
309 |
<port id="0" precision="U8">
|
|
|
311 |
</port>
|
312 |
</output>
|
313 |
</layer>
|
314 |
+
<layer id="27" name="StringTensorUnpack_33548" type="StringTensorUnpack" version="extension">
|
315 |
<data mode="begins_ends" />
|
316 |
<input>
|
317 |
<port id="0" precision="U8">
|
|
|
330 |
</port>
|
331 |
</output>
|
332 |
</layer>
|
333 |
+
<layer id="28" name="Constant_33550" type="Const" version="opset1">
|
334 |
<data element_type="u8" shape="336859" offset="924802" size="336859" />
|
335 |
<output>
|
336 |
<port id="0" precision="U8">
|
|
|
338 |
</port>
|
339 |
</output>
|
340 |
</layer>
|
341 |
+
<layer id="29" name="StringTensorUnpack_33551" type="StringTensorUnpack" version="extension">
|
342 |
<data mode="begins_ends" />
|
343 |
<input>
|
344 |
<port id="0" precision="U8">
|
|
|
357 |
</port>
|
358 |
</output>
|
359 |
</layer>
|
360 |
+
<layer id="30" name="Constant_33544" type="Const" version="opset1">
|
361 |
<data element_type="u8" shape="20172" offset="1261661" size="20172" />
|
362 |
<output>
|
363 |
<port id="0" precision="U8">
|
|
|
365 |
</port>
|
366 |
</output>
|
367 |
</layer>
|
368 |
+
<layer id="31" name="StringTensorUnpack_33545" type="StringTensorUnpack" version="extension">
|
369 |
<data mode="begins_ends" />
|
370 |
<input>
|
371 |
<port id="0" precision="U8">
|
|
|
384 |
</port>
|
385 |
</output>
|
386 |
</layer>
|
387 |
+
<layer id="32" name="Constant_33552" type="Const" version="opset1">
|
388 |
<data element_type="i32" shape="1609" offset="1281833" size="6436" />
|
389 |
<output>
|
390 |
<port id="0" precision="I32">
|
|
|
392 |
</port>
|
393 |
</output>
|
394 |
</layer>
|
395 |
+
<layer id="33" name="BPETokenizer_33553" type="BPETokenizer" version="extension">
|
396 |
<data unk_token="" fuse_unk="false" suffix_indicator="" end_suffix="" byte_fallback="false" cache_capacity="20000" />
|
397 |
<input>
|
398 |
<port id="0" precision="I32">
|
|
|
462 |
</port>
|
463 |
</output>
|
464 |
</layer>
|
465 |
+
<layer id="34" name="Subtract_33554" type="Subtract" version="opset1">
|
466 |
<data auto_broadcast="numpy" />
|
467 |
<input>
|
468 |
<port id="0" precision="I32">
|
|
|
478 |
</port>
|
479 |
</output>
|
480 |
</layer>
|
481 |
+
<layer id="35" name="Constant_33555" type="Const" version="opset1">
|
482 |
<data element_type="i32" shape="" offset="1288269" size="4" />
|
483 |
<output>
|
484 |
<port id="0" precision="I32" />
|
485 |
</output>
|
486 |
</layer>
|
487 |
+
<layer id="36" name="Minimum_33556" type="Minimum" version="opset1">
|
488 |
<data auto_broadcast="numpy" />
|
489 |
<input>
|
490 |
<port id="0" precision="I32">
|
|
|
498 |
</port>
|
499 |
</output>
|
500 |
</layer>
|
501 |
+
<layer id="37" name="Add_33557" type="Add" version="opset1">
|
502 |
<data auto_broadcast="numpy" />
|
503 |
<input>
|
504 |
<port id="0" precision="I32">
|
|
|
514 |
</port>
|
515 |
</output>
|
516 |
</layer>
|
517 |
+
<layer id="38" name="Constant_33564" type="Const" version="opset1">
|
518 |
<data element_type="i32" shape="" offset="0" size="4" />
|
519 |
<output>
|
520 |
<port id="0" precision="I32" />
|
521 |
</output>
|
522 |
</layer>
|
523 |
+
<layer id="39" name="Constant_33565" type="Const" version="opset1">
|
524 |
<data element_type="i32" shape="" offset="4" size="4" />
|
525 |
<output>
|
526 |
<port id="0" precision="I32" />
|
527 |
</output>
|
528 |
</layer>
|
529 |
+
<layer id="40" name="Constant_33566" type="Const" version="opset1">
|
530 |
<data element_type="i32" shape="1" offset="1288273" size="4" />
|
531 |
<output>
|
532 |
<port id="0" precision="I32">
|
|
|
534 |
</port>
|
535 |
</output>
|
536 |
</layer>
|
537 |
+
<layer id="41" name="Constant_33567" type="Const" version="opset1">
|
538 |
<data element_type="i32" shape="4" offset="1288277" size="16" />
|
539 |
<output>
|
540 |
<port id="0" precision="I32">
|
|
|
542 |
</port>
|
543 |
</output>
|
544 |
</layer>
|
545 |
+
<layer id="42" name="CombineSegments_33568" type="CombineSegments" version="extension">
|
546 |
<input>
|
547 |
<port id="0" precision="I32" />
|
548 |
<port id="1" precision="I32" />
|
|
|
593 |
</port>
|
594 |
</output>
|
595 |
</layer>
|
596 |
+
<layer id="43" name="Subtract_33569" type="Subtract" version="opset1">
|
597 |
<data auto_broadcast="numpy" />
|
598 |
<input>
|
599 |
<port id="0" precision="I32">
|
|
|
609 |
</port>
|
610 |
</output>
|
611 |
</layer>
|
612 |
+
<layer id="44" name="Constant_33570" type="Const" version="opset1">
|
613 |
<data element_type="i32" shape="" offset="0" size="4" />
|
614 |
<output>
|
615 |
<port id="0" precision="I32" />
|
616 |
</output>
|
617 |
</layer>
|
618 |
+
<layer id="45" name="ReduceMax_33571" type="ReduceMax" version="opset1">
|
619 |
<data keep_dims="false" />
|
620 |
<input>
|
621 |
<port id="0" precision="I32">
|
|
|
627 |
<port id="2" precision="I32" />
|
628 |
</output>
|
629 |
</layer>
|
630 |
+
<layer id="46" name="Constant_33572" type="Const" version="opset1">
|
631 |
<data element_type="i32" shape="" offset="1288273" size="4" />
|
632 |
<output>
|
633 |
<port id="0" precision="I32" />
|
634 |
</output>
|
635 |
</layer>
|
636 |
+
<layer id="47" name="RaggedToDense_33573" type="RaggedToDense" version="extension">
|
637 |
<data pad_right="true" />
|
638 |
<input>
|
639 |
<port id="0" precision="I32">
|
|
|
659 |
</port>
|
660 |
</output>
|
661 |
</layer>
|
662 |
+
<layer id="48" name="Convert_33574" type="Convert" version="opset1">
|
663 |
<data destination_type="i32" />
|
664 |
<input>
|
665 |
<port id="0" precision="BOOL">
|
|
|
674 |
</port>
|
675 |
</output>
|
676 |
</layer>
|
677 |
+
<layer id="49" name="Convert_33574" type="Convert" version="opset1">
|
678 |
<data destination_type="i64" />
|
679 |
<input>
|
680 |
<port id="0" precision="I32">
|
|
|
689 |
</port>
|
690 |
</output>
|
691 |
</layer>
|
692 |
+
<layer id="51" name="RaggedToDense_33573.0" type="Convert" version="opset1">
|
693 |
<data destination_type="i64" />
|
694 |
<input>
|
695 |
<port id="0" precision="I32">
|
|
|
704 |
</port>
|
705 |
</output>
|
706 |
</layer>
|
707 |
+
<layer id="52" name="Result_33577" type="Result" version="opset1">
|
708 |
<input>
|
709 |
<port id="0" precision="I64">
|
710 |
<dim>-1</dim>
|
|
|
712 |
</port>
|
713 |
</input>
|
714 |
</layer>
|
715 |
+
<layer id="50" name="Result_33579" type="Result" version="opset1">
|
716 |
<input>
|
717 |
<port id="0" precision="I64">
|
718 |
<dim>-1</dim>
|
|
|
805 |
<edge from-layer="51" from-port="1" to-layer="52" to-port="0" />
|
806 |
</edges>
|
807 |
<rt_info>
|
808 |
+
<add_attention_mask value="True" />
|
809 |
+
<add_prefix_space />
|
810 |
+
<add_special_tokens value="True" />
|
811 |
<bos_token_id value="50257" />
|
812 |
+
<clean_up_tokenization_spaces />
|
813 |
+
<detokenizer_input_type value="i64" />
|
814 |
<eos_token_id value="50257" />
|
815 |
+
<handle_special_tokens_with_re />
|
816 |
+
<number_of_inputs value="1" />
|
817 |
+
<openvino_tokenizers_version value="2024.5.0.0" />
|
818 |
+
<openvino_version value="2024.5.0" />
|
819 |
<original_tokenizer_class value="<class 'transformers.models.whisper.tokenization_whisper_fast.WhisperTokenizerFast'>" />
|
820 |
<pad_token_id value="50257" />
|
821 |
+
<sentencepiece_version value="0.2.0" />
|
822 |
+
<skip_special_tokens value="True" />
|
823 |
+
<streaming_detokenizer value="False" />
|
824 |
+
<tiktoken_version value="0.8.0" />
|
825 |
+
<tokenizer_output_type value="i64" />
|
826 |
+
<tokenizers_version value="0.20.3" />
|
827 |
+
<transformers_version value="4.46.3" />
|
828 |
+
<use_max_padding value="False" />
|
829 |
+
<use_sentencepiece_backend value="False" />
|
830 |
+
<utf8_replace_mode />
|
831 |
+
<with_detokenizer value="True" />
|
832 |
</rt_info>
|
833 |
</net>
|