openvino-ci committed on
Commit
41e0b7f
1 Parent(s): aa8b7de

Upload folder using huggingface_hub

Browse files
config.json CHANGED
@@ -1,4 +1,5 @@
1
  {
 
2
  "_name_or_path": "distil-whisper/distil-large-v3",
3
  "activation_dropout": 0.0,
4
  "activation_function": "gelu",
@@ -39,7 +40,7 @@
39
  "num_mel_bins": 128,
40
  "pad_token_id": 50256,
41
  "scale_embedding": false,
42
- "transformers_version": "4.45.2",
43
  "use_cache": true,
44
  "use_weighted_layer_sum": false,
45
  "vocab_size": 51866
 
1
  {
2
+ "_attn_implementation_autoset": true,
3
  "_name_or_path": "distil-whisper/distil-large-v3",
4
  "activation_dropout": 0.0,
5
  "activation_function": "gelu",
 
40
  "num_mel_bins": 128,
41
  "pad_token_id": 50256,
42
  "scale_embedding": false,
43
+ "transformers_version": "4.46.3",
44
  "use_cache": true,
45
  "use_weighted_layer_sum": false,
46
  "vocab_size": 51866
generation_config.json CHANGED
@@ -303,5 +303,5 @@
303
  "transcribe": 50360,
304
  "translate": 50359
305
  },
306
- "transformers_version": "4.45.2"
307
  }
 
303
  "transcribe": 50360,
304
  "translate": 50359
305
  },
306
+ "transformers_version": "4.46.3"
307
  }
openvino_decoder_model.xml CHANGED
@@ -10,7 +10,7 @@
10
  </port>
11
  </output>
12
  </layer>
13
- <layer id="0" name="Parameter_26431" type="Parameter" version="opset1">
14
  <data shape="?,?,?" element_type="f32" />
15
  <output>
16
  <port id="0" precision="FP32" names="encoder_hidden_states">
@@ -47,7 +47,7 @@
47
  </port>
48
  </output>
49
  </layer>
50
- <layer id="4" name="Constant_31865" type="Const" version="opset1">
51
  <data element_type="i64" shape="2" offset="132776960" size="16" />
52
  <rt_info>
53
  <attribute name="precise" version="0" />
@@ -151,7 +151,7 @@
151
  <port id="0" precision="I64" names="23" />
152
  </output>
153
  </layer>
154
- <layer id="12" name="ShapeOf_31838" type="ShapeOf" version="opset3">
155
  <data output_type="i64" />
156
  <input>
157
  <port id="0" precision="I64">
@@ -165,7 +165,7 @@
165
  </port>
166
  </output>
167
  </layer>
168
- <layer id="13" name="Constant_31839" type="Const" version="opset1">
169
  <data element_type="i64" shape="" offset="133923868" size="8" />
170
  <rt_info>
171
  <attribute name="precise" version="0" />
@@ -174,7 +174,7 @@
174
  <port id="0" precision="I64" />
175
  </output>
176
  </layer>
177
- <layer id="14" name="Constant_31840" type="Const" version="opset1">
178
  <data element_type="i64" shape="" offset="133923860" size="8" />
179
  <rt_info>
180
  <attribute name="precise" version="0" />
@@ -183,7 +183,7 @@
183
  <port id="0" precision="I64" />
184
  </output>
185
  </layer>
186
- <layer id="15" name="Gather_31841" type="Gather" version="opset8">
187
  <data batch_dims="0" />
188
  <input>
189
  <port id="0" precision="I64">
@@ -244,7 +244,7 @@
244
  </port>
245
  </output>
246
  </layer>
247
- <layer id="20" name="Constant_26428" type="Const" version="opset1">
248
  <data element_type="i32" shape="" offset="132776976" size="4" />
249
  <output>
250
  <port id="0" precision="I32" />
@@ -321,7 +321,7 @@
321
  </port>
322
  </output>
323
  </layer>
324
- <layer id="25" name="Constant_31606_compressed" type="Const" version="opset1">
325
  <data element_type="f16" shape="1, 1, 1280" offset="133923884" size="2560" />
326
  <output>
327
  <port id="0" precision="FP16">
@@ -331,7 +331,7 @@
331
  </port>
332
  </output>
333
  </layer>
334
- <layer id="26" name="Constant_31606" type="Convert" version="opset1">
335
  <data destination_type="f32" />
336
  <rt_info>
337
  <attribute name="decompression" version="0" />
@@ -373,7 +373,7 @@
373
  </port>
374
  </output>
375
  </layer>
376
- <layer id="28" name="Constant_31607_compressed" type="Const" version="opset1">
377
  <data element_type="f16" shape="1, 1, 1280" offset="133926444" size="2560" />
378
  <output>
379
  <port id="0" precision="FP16">
@@ -383,7 +383,7 @@
383
  </port>
384
  </output>
385
  </layer>
386
- <layer id="29" name="Constant_31607" type="Convert" version="opset1">
387
  <data destination_type="f32" />
388
  <rt_info>
389
  <attribute name="decompression" version="0" />
@@ -425,7 +425,7 @@
425
  </port>
426
  </output>
427
  </layer>
428
- <layer id="31" name="Constant_31509_compressed" type="Const" version="opset1">
429
  <data element_type="f16" shape="1280, 1280" offset="133929004" size="3276800" />
430
  <output>
431
  <port id="0" precision="FP16">
@@ -434,7 +434,7 @@
434
  </port>
435
  </output>
436
  </layer>
437
- <layer id="32" name="Constant_31509" type="Convert" version="opset1">
438
  <data destination_type="f32" />
439
  <rt_info>
440
  <attribute name="decompression" version="0" />
@@ -452,7 +452,7 @@
452
  </port>
453
  </output>
454
  </layer>
455
- <layer id="33" name="Multiply_31492" type="MatMul" version="opset1">
456
  <data transpose_a="false" transpose_b="true" />
457
  <input>
458
  <port id="0" precision="FP32">
@@ -473,7 +473,7 @@
473
  </port>
474
  </output>
475
  </layer>
476
- <layer id="34" name="Constant_31608_compressed" type="Const" version="opset1">
477
  <data element_type="f16" shape="1, 1, 1280" offset="137205804" size="2560" />
478
  <output>
479
  <port id="0" precision="FP16">
@@ -483,7 +483,7 @@
483
  </port>
484
  </output>
485
  </layer>
486
- <layer id="35" name="Constant_31608" type="Convert" version="opset1">
487
  <data destination_type="f32" />
488
  <rt_info>
489
  <attribute name="decompression" version="0" />
@@ -525,7 +525,7 @@
525
  </port>
526
  </output>
527
  </layer>
528
- <layer id="37" name="Constant_31866" type="Const" version="opset1">
529
  <data element_type="i64" shape="4" offset="137208364" size="32" />
530
  <rt_info>
531
  <attribute name="precise" version="0" />
@@ -634,7 +634,7 @@
634
  </port>
635
  </output>
636
  </layer>
637
- <layer id="44" name="Constant_31867" type="Const" version="opset1">
638
  <data element_type="i64" shape="4" offset="137208364" size="32" />
639
  <rt_info>
640
  <attribute name="precise" version="0" />
@@ -726,13 +726,13 @@
726
  <port id="0" precision="I32" />
727
  </output>
728
  </layer>
729
- <layer id="50" name="__module.model.model.decoder/aten::full/Convert" type="Const" version="opset1">
730
  <data element_type="f32" shape="" offset="140485212" size="4" />
731
  <output>
732
- <port id="0" precision="FP32" />
733
  </output>
734
  </layer>
735
- <layer id="51" name="Constant_31848" type="Const" version="opset1">
736
  <data element_type="i64" shape="1" offset="133923868" size="8" />
737
  <rt_info>
738
  <attribute name="precise" version="0" />
@@ -743,7 +743,7 @@
743
  </port>
744
  </output>
745
  </layer>
746
- <layer id="52" name="Reshape_31849" type="Reshape" version="opset1">
747
  <data special_zero="false" />
748
  <input>
749
  <port id="0" precision="I64" />
@@ -776,7 +776,7 @@
776
  <port id="2" precision="I64" names="62,64" />
777
  </output>
778
  </layer>
779
- <layer id="55" name="Constant_24308" type="Const" version="opset1">
780
  <data element_type="i32" shape="" offset="132776976" size="4" />
781
  <rt_info>
782
  <attribute name="precise" version="0" />
@@ -785,7 +785,7 @@
785
  <port id="0" precision="I32" />
786
  </output>
787
  </layer>
788
- <layer id="56" name="Unsqueeze_24309" type="Unsqueeze" version="opset1">
789
  <input>
790
  <port id="0" precision="I64" />
791
  <port id="1" precision="I32" />
@@ -827,7 +827,7 @@
827
  </port>
828
  </output>
829
  </layer>
830
- <layer id="59" name="ShapeOf_31850" type="ShapeOf" version="opset3">
831
  <data output_type="i32" />
832
  <input>
833
  <port id="0" precision="FP32">
@@ -841,19 +841,19 @@
841
  </port>
842
  </output>
843
  </layer>
844
- <layer id="60" name="Constant_31851" type="Const" version="opset1">
845
  <data element_type="i64" shape="" offset="133923868" size="8" />
846
  <output>
847
  <port id="0" precision="I64" />
848
  </output>
849
  </layer>
850
- <layer id="61" name="Constant_31852" type="Const" version="opset1">
851
  <data element_type="i64" shape="" offset="133923860" size="8" />
852
  <output>
853
  <port id="0" precision="I64" />
854
  </output>
855
  </layer>
856
- <layer id="62" name="Gather_31853" type="Gather" version="opset8">
857
  <data batch_dims="0" />
858
  <input>
859
  <port id="0" precision="I32">
@@ -905,7 +905,7 @@
905
  <port id="0" precision="I32" />
906
  </output>
907
  </layer>
908
- <layer id="67" name="Convert_31856" type="Convert" version="opset1">
909
  <data destination_type="i32" />
910
  <input>
911
  <port id="0" precision="I64" />
@@ -1059,7 +1059,7 @@
1059
  </port>
1060
  </output>
1061
  </layer>
1062
- <layer id="80" name="Constant_24411" type="Const" version="opset1">
1063
  <data element_type="i64" shape="2" offset="140485218" size="16" />
1064
  <rt_info>
1065
  <attribute name="precise" version="0" />
@@ -1179,7 +1179,7 @@
1179
  </port>
1180
  </output>
1181
  </layer>
1182
- <layer id="88" name="Constant_31845" type="Const" version="opset1">
1183
  <data element_type="i64" shape="1" offset="133923860" size="8" />
1184
  <rt_info>
1185
  <attribute name="precise" version="0" />
@@ -1190,7 +1190,7 @@
1190
  </port>
1191
  </output>
1192
  </layer>
1193
- <layer id="89" name="Constant_31846" type="Const" version="opset1">
1194
  <data element_type="i64" shape="" offset="133923860" size="8" />
1195
  <rt_info>
1196
  <attribute name="precise" version="0" />
@@ -1199,7 +1199,7 @@
1199
  <port id="0" precision="I64" />
1200
  </output>
1201
  </layer>
1202
- <layer id="90" name="Gather_31847" type="Gather" version="opset8">
1203
  <data batch_dims="0" />
1204
  <input>
1205
  <port id="0" precision="I64">
@@ -1216,7 +1216,7 @@
1216
  </port>
1217
  </output>
1218
  </layer>
1219
- <layer id="91" name="Constant_30837" type="Const" version="opset1">
1220
  <data element_type="i64" shape="1" offset="133923868" size="8" />
1221
  <rt_info>
1222
  <attribute name="precise" version="0" />
@@ -1227,7 +1227,7 @@
1227
  </port>
1228
  </output>
1229
  </layer>
1230
- <layer id="92" name="Constant_30839" type="Const" version="opset1">
1231
  <data element_type="i64" shape="1" offset="133923868" size="8" />
1232
  <rt_info>
1233
  <attribute name="precise" version="0" />
@@ -1238,7 +1238,7 @@
1238
  </port>
1239
  </output>
1240
  </layer>
1241
- <layer id="93" name="Constant_30841" type="Const" version="opset1">
1242
  <data element_type="i64" shape="1" offset="133923868" size="8" />
1243
  <rt_info>
1244
  <attribute name="precise" version="0" />
@@ -1293,7 +1293,7 @@
1293
  </port>
1294
  </output>
1295
  </layer>
1296
- <layer id="96" name="Constant_24845" type="Const" version="opset1">
1297
  <data element_type="i64" shape="1" offset="133923860" size="8" />
1298
  <output>
1299
  <port id="0" precision="I64">
@@ -1301,7 +1301,7 @@
1301
  </port>
1302
  </output>
1303
  </layer>
1304
- <layer id="97" name="ShapeOf_31861" type="ShapeOf" version="opset3">
1305
  <data output_type="i64" />
1306
  <input>
1307
  <port id="0" precision="FP32">
@@ -1316,7 +1316,7 @@
1316
  </port>
1317
  </output>
1318
  </layer>
1319
- <layer id="98" name="Constant_31862" type="Const" version="opset1">
1320
  <data element_type="i64" shape="1" offset="133923868" size="8" />
1321
  <output>
1322
  <port id="0" precision="I64">
@@ -1324,13 +1324,13 @@
1324
  </port>
1325
  </output>
1326
  </layer>
1327
- <layer id="99" name="Constant_31863" type="Const" version="opset1">
1328
  <data element_type="i64" shape="" offset="133923860" size="8" />
1329
  <output>
1330
  <port id="0" precision="I64" />
1331
  </output>
1332
  </layer>
1333
- <layer id="100" name="Gather_31864" type="Gather" version="opset8">
1334
  <data batch_dims="0" />
1335
  <input>
1336
  <port id="0" precision="I64">
@@ -1347,7 +1347,7 @@
1347
  </port>
1348
  </output>
1349
  </layer>
1350
- <layer id="101" name="Constant_24848" type="Const" version="opset1">
1351
  <data element_type="i64" shape="1" offset="133923868" size="8" />
1352
  <output>
1353
  <port id="0" precision="I64">
@@ -1485,7 +1485,7 @@
1485
  </port>
1486
  </output>
1487
  </layer>
1488
- <layer id="109" name="Constant_31609_compressed" type="Const" version="opset1">
1489
  <data element_type="f16" shape="1, 1, 1280" offset="143762042" size="2560" />
1490
  <output>
1491
  <port id="0" precision="FP16">
@@ -1495,7 +1495,7 @@
1495
  </port>
1496
  </output>
1497
  </layer>
1498
- <layer id="110" name="Constant_31609" type="Convert" version="opset1">
1499
  <data destination_type="f32" />
1500
  <rt_info>
1501
  <attribute name="decompression" version="0" />
@@ -1537,7 +1537,7 @@
1537
  </port>
1538
  </output>
1539
  </layer>
1540
- <layer id="112" name="Constant_31868" type="Const" version="opset1">
1541
  <data element_type="i64" shape="4" offset="137208364" size="32" />
1542
  <rt_info>
1543
  <attribute name="precise" version="0" />
@@ -1652,7 +1652,7 @@
1652
  </port>
1653
  </output>
1654
  </layer>
1655
- <layer id="119" name="Constant_31869" type="Const" version="opset1">
1656
  <data element_type="i64" shape="3" offset="143764602" size="24" />
1657
  <rt_info>
1658
  <attribute name="precise" version="0" />
@@ -1732,7 +1732,7 @@
1732
  </port>
1733
  </output>
1734
  </layer>
1735
- <layer id="124" name="Constant_31610_compressed" type="Const" version="opset1">
1736
  <data element_type="f16" shape="1, 1, 1280" offset="147041426" size="2560" />
1737
  <output>
1738
  <port id="0" precision="FP16">
@@ -1742,7 +1742,7 @@
1742
  </port>
1743
  </output>
1744
  </layer>
1745
- <layer id="125" name="Constant_31610" type="Convert" version="opset1">
1746
  <data destination_type="f32" />
1747
  <rt_info>
1748
  <attribute name="decompression" version="0" />
@@ -1834,7 +1834,7 @@
1834
  </port>
1835
  </output>
1836
  </layer>
1837
- <layer id="130" name="Constant_31611_compressed" type="Const" version="opset1">
1838
  <data element_type="f16" shape="1, 1, 1280" offset="147043986" size="2560" />
1839
  <output>
1840
  <port id="0" precision="FP16">
@@ -1844,7 +1844,7 @@
1844
  </port>
1845
  </output>
1846
  </layer>
1847
- <layer id="131" name="Constant_31611" type="Convert" version="opset1">
1848
  <data destination_type="f32" />
1849
  <rt_info>
1850
  <attribute name="decompression" version="0" />
@@ -1886,7 +1886,7 @@
1886
  </port>
1887
  </output>
1888
  </layer>
1889
- <layer id="133" name="Constant_31612_compressed" type="Const" version="opset1">
1890
  <data element_type="f16" shape="1, 1, 1280" offset="147046546" size="2560" />
1891
  <output>
1892
  <port id="0" precision="FP16">
@@ -1896,7 +1896,7 @@
1896
  </port>
1897
  </output>
1898
  </layer>
1899
- <layer id="134" name="Constant_31612" type="Convert" version="opset1">
1900
  <data destination_type="f32" />
1901
  <rt_info>
1902
  <attribute name="decompression" version="0" />
@@ -1938,7 +1938,7 @@
1938
  </port>
1939
  </output>
1940
  </layer>
1941
- <layer id="136" name="Constant_31512_compressed" type="Const" version="opset1">
1942
  <data element_type="f16" shape="1280, 1280" offset="147049106" size="3276800" />
1943
  <output>
1944
  <port id="0" precision="FP16">
@@ -1947,7 +1947,7 @@
1947
  </port>
1948
  </output>
1949
  </layer>
1950
- <layer id="137" name="Constant_31512" type="Convert" version="opset1">
1951
  <data destination_type="f32" />
1952
  <rt_info>
1953
  <attribute name="decompression" version="0" />
@@ -1965,7 +1965,7 @@
1965
  </port>
1966
  </output>
1967
  </layer>
1968
- <layer id="138" name="Multiply_31496" type="MatMul" version="opset1">
1969
  <data transpose_a="false" transpose_b="true" />
1970
  <input>
1971
  <port id="0" precision="FP32">
@@ -1986,7 +1986,7 @@
1986
  </port>
1987
  </output>
1988
  </layer>
1989
- <layer id="139" name="Constant_31613_compressed" type="Const" version="opset1">
1990
  <data element_type="f16" shape="1, 1, 1280" offset="150325906" size="2560" />
1991
  <output>
1992
  <port id="0" precision="FP16">
@@ -1996,7 +1996,7 @@
1996
  </port>
1997
  </output>
1998
  </layer>
1999
- <layer id="140" name="Constant_31613" type="Convert" version="opset1">
2000
  <data destination_type="f32" />
2001
  <rt_info>
2002
  <attribute name="decompression" version="0" />
@@ -2038,7 +2038,7 @@
2038
  </port>
2039
  </output>
2040
  </layer>
2041
- <layer id="142" name="Constant_31870" type="Const" version="opset1">
2042
  <data element_type="i64" shape="4" offset="137208364" size="32" />
2043
  <rt_info>
2044
  <attribute name="precise" version="0" />
@@ -2147,7 +2147,7 @@
2147
  </port>
2148
  </output>
2149
  </layer>
2150
- <layer id="149" name="Constant_25069" type="Const" version="opset1">
2151
  <data element_type="i64" shape="1" offset="153605266" size="8" />
2152
  <rt_info>
2153
  <attribute name="precise" version="0" />
@@ -2158,7 +2158,7 @@
2158
  </port>
2159
  </output>
2160
  </layer>
2161
- <layer id="150" name="Constant_25070" type="Const" version="opset1">
2162
  <data element_type="i64" shape="1" offset="153605274" size="8" />
2163
  <rt_info>
2164
  <attribute name="precise" version="0" />
@@ -2169,7 +2169,7 @@
2169
  </port>
2170
  </output>
2171
  </layer>
2172
- <layer id="151" name="Constant_25071" type="Const" version="opset1">
2173
  <data element_type="i64" shape="1" offset="153605282" size="8" />
2174
  <rt_info>
2175
  <attribute name="precise" version="0" />
@@ -2180,7 +2180,7 @@
2180
  </port>
2181
  </output>
2182
  </layer>
2183
- <layer id="152" name="__module.model.model.decoder.layers.0.encoder_attn/prim::ListConstruct_1" type="Concat" version="opset1">
2184
  <data axis="0" />
2185
  <input>
2186
  <port id="0" precision="I64">
@@ -2344,7 +2344,7 @@
2344
  </port>
2345
  </output>
2346
  </layer>
2347
- <layer id="161" name="Constant_31614_compressed" type="Const" version="opset1">
2348
  <data element_type="f16" shape="1, 1, 1280" offset="156882090" size="2560" />
2349
  <output>
2350
  <port id="0" precision="FP16">
@@ -2354,7 +2354,7 @@
2354
  </port>
2355
  </output>
2356
  </layer>
2357
- <layer id="162" name="Constant_31614" type="Convert" version="opset1">
2358
  <data destination_type="f32" />
2359
  <rt_info>
2360
  <attribute name="decompression" version="0" />
@@ -2500,7 +2500,7 @@
2500
  </port>
2501
  </output>
2502
  </layer>
2503
- <layer id="170" name="Constant_31871" type="Const" version="opset1">
2504
  <data element_type="i64" shape="3" offset="156884650" size="24" />
2505
  <rt_info>
2506
  <attribute name="precise" version="0" />
@@ -2580,7 +2580,7 @@
2580
  </port>
2581
  </output>
2582
  </layer>
2583
- <layer id="175" name="Constant_31615_compressed" type="Const" version="opset1">
2584
  <data element_type="f16" shape="1, 1, 1280" offset="160161474" size="2560" />
2585
  <output>
2586
  <port id="0" precision="FP16">
@@ -2590,7 +2590,7 @@
2590
  </port>
2591
  </output>
2592
  </layer>
2593
- <layer id="176" name="Constant_31615" type="Convert" version="opset1">
2594
  <data destination_type="f32" />
2595
  <rt_info>
2596
  <attribute name="decompression" version="0" />
@@ -2682,7 +2682,7 @@
2682
  </port>
2683
  </output>
2684
  </layer>
2685
- <layer id="181" name="Constant_31616_compressed" type="Const" version="opset1">
2686
  <data element_type="f16" shape="1, 1, 1280" offset="160164034" size="2560" />
2687
  <output>
2688
  <port id="0" precision="FP16">
@@ -2692,7 +2692,7 @@
2692
  </port>
2693
  </output>
2694
  </layer>
2695
- <layer id="182" name="Constant_31616" type="Convert" version="opset1">
2696
  <data destination_type="f32" />
2697
  <rt_info>
2698
  <attribute name="decompression" version="0" />
@@ -2734,7 +2734,7 @@
2734
  </port>
2735
  </output>
2736
  </layer>
2737
- <layer id="184" name="Constant_31617_compressed" type="Const" version="opset1">
2738
  <data element_type="f16" shape="1, 1, 1280" offset="160166594" size="2560" />
2739
  <output>
2740
  <port id="0" precision="FP16">
@@ -2744,7 +2744,7 @@
2744
  </port>
2745
  </output>
2746
  </layer>
2747
- <layer id="185" name="Constant_31617" type="Convert" version="opset1">
2748
  <data destination_type="f32" />
2749
  <rt_info>
2750
  <attribute name="decompression" version="0" />
@@ -2834,7 +2834,7 @@
2834
  </port>
2835
  </output>
2836
  </layer>
2837
- <layer id="190" name="Constant_31618_compressed" type="Const" version="opset1">
2838
  <data element_type="f16" shape="1, 1, 5120" offset="173276354" size="10240" />
2839
  <output>
2840
  <port id="0" precision="FP16">
@@ -2844,7 +2844,7 @@
2844
  </port>
2845
  </output>
2846
  </layer>
2847
- <layer id="191" name="Constant_31618" type="Convert" version="opset1">
2848
  <data destination_type="f32" />
2849
  <rt_info>
2850
  <attribute name="decompression" version="0" />
@@ -2951,7 +2951,7 @@
2951
  </port>
2952
  </output>
2953
  </layer>
2954
- <layer id="197" name="Constant_31619_compressed" type="Const" version="opset1">
2955
  <data element_type="f16" shape="1, 1, 1280" offset="186393794" size="2560" />
2956
  <output>
2957
  <port id="0" precision="FP16">
@@ -2961,7 +2961,7 @@
2961
  </port>
2962
  </output>
2963
  </layer>
2964
- <layer id="198" name="Constant_31619" type="Convert" version="opset1">
2965
  <data destination_type="f32" />
2966
  <rt_info>
2967
  <attribute name="decompression" version="0" />
@@ -3053,7 +3053,7 @@
3053
  </port>
3054
  </output>
3055
  </layer>
3056
- <layer id="203" name="Constant_31620_compressed" type="Const" version="opset1">
3057
  <data element_type="f16" shape="1, 1, 1280" offset="186396354" size="2560" />
3058
  <output>
3059
  <port id="0" precision="FP16">
@@ -3063,7 +3063,7 @@
3063
  </port>
3064
  </output>
3065
  </layer>
3066
- <layer id="204" name="Constant_31620" type="Convert" version="opset1">
3067
  <data destination_type="f32" />
3068
  <rt_info>
3069
  <attribute name="decompression" version="0" />
@@ -3105,7 +3105,7 @@
3105
  </port>
3106
  </output>
3107
  </layer>
3108
- <layer id="206" name="Constant_31621_compressed" type="Const" version="opset1">
3109
  <data element_type="f16" shape="1, 1, 1280" offset="186398914" size="2560" />
3110
  <output>
3111
  <port id="0" precision="FP16">
@@ -3115,7 +3115,7 @@
3115
  </port>
3116
  </output>
3117
  </layer>
3118
- <layer id="207" name="Constant_31621" type="Convert" version="opset1">
3119
  <data destination_type="f32" />
3120
  <rt_info>
3121
  <attribute name="decompression" version="0" />
@@ -3157,7 +3157,7 @@
3157
  </port>
3158
  </output>
3159
  </layer>
3160
- <layer id="209" name="Constant_31515_compressed" type="Const" version="opset1">
3161
  <data element_type="f16" shape="1280, 1280" offset="186401474" size="3276800" />
3162
  <output>
3163
  <port id="0" precision="FP16">
@@ -3166,7 +3166,7 @@
3166
  </port>
3167
  </output>
3168
  </layer>
3169
- <layer id="210" name="Constant_31515" type="Convert" version="opset1">
3170
  <data destination_type="f32" />
3171
  <rt_info>
3172
  <attribute name="decompression" version="0" />
@@ -3184,7 +3184,7 @@
3184
  </port>
3185
  </output>
3186
  </layer>
3187
- <layer id="211" name="Multiply_31500" type="MatMul" version="opset1">
3188
  <data transpose_a="false" transpose_b="true" />
3189
  <input>
3190
  <port id="0" precision="FP32">
@@ -3205,7 +3205,7 @@
3205
  </port>
3206
  </output>
3207
  </layer>
3208
- <layer id="212" name="Constant_31622_compressed" type="Const" version="opset1">
3209
  <data element_type="f16" shape="1, 1, 1280" offset="189678274" size="2560" />
3210
  <output>
3211
  <port id="0" precision="FP16">
@@ -3215,7 +3215,7 @@
3215
  </port>
3216
  </output>
3217
  </layer>
3218
- <layer id="213" name="Constant_31622" type="Convert" version="opset1">
3219
  <data destination_type="f32" />
3220
  <rt_info>
3221
  <attribute name="decompression" version="0" />
@@ -3257,7 +3257,7 @@
3257
  </port>
3258
  </output>
3259
  </layer>
3260
- <layer id="215" name="Constant_31872" type="Const" version="opset1">
3261
  <data element_type="i64" shape="4" offset="137208364" size="32" />
3262
  <rt_info>
3263
  <attribute name="precise" version="0" />
@@ -3366,7 +3366,7 @@
3366
  </port>
3367
  </output>
3368
  </layer>
3369
- <layer id="222" name="Constant_31873" type="Const" version="opset1">
3370
  <data element_type="i64" shape="4" offset="137208364" size="32" />
3371
  <rt_info>
3372
  <attribute name="precise" version="0" />
@@ -3544,7 +3544,7 @@
3544
  </port>
3545
  </output>
3546
  </layer>
3547
- <layer id="232" name="Constant_31623_compressed" type="Const" version="opset1">
3548
  <data element_type="f16" shape="1, 1, 1280" offset="196234434" size="2560" />
3549
  <output>
3550
  <port id="0" precision="FP16">
@@ -3554,7 +3554,7 @@
3554
  </port>
3555
  </output>
3556
  </layer>
3557
- <layer id="233" name="Constant_31623" type="Convert" version="opset1">
3558
  <data destination_type="f32" />
3559
  <rt_info>
3560
  <attribute name="decompression" version="0" />
@@ -3596,7 +3596,7 @@
3596
  </port>
3597
  </output>
3598
  </layer>
3599
- <layer id="235" name="Constant_31874" type="Const" version="opset1">
3600
  <data element_type="i64" shape="4" offset="137208364" size="32" />
3601
  <rt_info>
3602
  <attribute name="precise" version="0" />
@@ -3711,7 +3711,7 @@
3711
  </port>
3712
  </output>
3713
  </layer>
3714
- <layer id="242" name="Constant_31875" type="Const" version="opset1">
3715
  <data element_type="i64" shape="3" offset="143764602" size="24" />
3716
  <rt_info>
3717
  <attribute name="precise" version="0" />
@@ -3791,7 +3791,7 @@
3791
  </port>
3792
  </output>
3793
  </layer>
3794
- <layer id="247" name="Constant_31624_compressed" type="Const" version="opset1">
3795
  <data element_type="f16" shape="1, 1, 1280" offset="199513794" size="2560" />
3796
  <output>
3797
  <port id="0" precision="FP16">
@@ -3801,7 +3801,7 @@
3801
  </port>
3802
  </output>
3803
  </layer>
3804
- <layer id="248" name="Constant_31624" type="Convert" version="opset1">
3805
  <data destination_type="f32" />
3806
  <rt_info>
3807
  <attribute name="decompression" version="0" />
@@ -3893,7 +3893,7 @@
3893
  </port>
3894
  </output>
3895
  </layer>
3896
- <layer id="253" name="Constant_31625_compressed" type="Const" version="opset1">
3897
  <data element_type="f16" shape="1, 1, 1280" offset="199516354" size="2560" />
3898
  <output>
3899
  <port id="0" precision="FP16">
@@ -3903,7 +3903,7 @@
3903
  </port>
3904
  </output>
3905
  </layer>
3906
- <layer id="254" name="Constant_31625" type="Convert" version="opset1">
3907
  <data destination_type="f32" />
3908
  <rt_info>
3909
  <attribute name="decompression" version="0" />
@@ -3945,7 +3945,7 @@
3945
  </port>
3946
  </output>
3947
  </layer>
3948
- <layer id="256" name="Constant_31626_compressed" type="Const" version="opset1">
3949
  <data element_type="f16" shape="1, 1, 1280" offset="199518914" size="2560" />
3950
  <output>
3951
  <port id="0" precision="FP16">
@@ -3955,7 +3955,7 @@
3955
  </port>
3956
  </output>
3957
  </layer>
3958
- <layer id="257" name="Constant_31626" type="Convert" version="opset1">
3959
  <data destination_type="f32" />
3960
  <rt_info>
3961
  <attribute name="decompression" version="0" />
@@ -3997,7 +3997,7 @@
3997
  </port>
3998
  </output>
3999
  </layer>
4000
- <layer id="259" name="Constant_31518_compressed" type="Const" version="opset1">
4001
  <data element_type="f16" shape="1280, 1280" offset="199521474" size="3276800" />
4002
  <output>
4003
  <port id="0" precision="FP16">
@@ -4006,7 +4006,7 @@
4006
  </port>
4007
  </output>
4008
  </layer>
4009
- <layer id="260" name="Constant_31518" type="Convert" version="opset1">
4010
  <data destination_type="f32" />
4011
  <rt_info>
4012
  <attribute name="decompression" version="0" />
@@ -4024,7 +4024,7 @@
4024
  </port>
4025
  </output>
4026
  </layer>
4027
- <layer id="261" name="Multiply_31504" type="MatMul" version="opset1">
4028
  <data transpose_a="false" transpose_b="true" />
4029
  <input>
4030
  <port id="0" precision="FP32">
@@ -4045,7 +4045,7 @@
4045
  </port>
4046
  </output>
4047
  </layer>
4048
- <layer id="262" name="Constant_31627_compressed" type="Const" version="opset1">
4049
  <data element_type="f16" shape="1, 1, 1280" offset="202798274" size="2560" />
4050
  <output>
4051
  <port id="0" precision="FP16">
@@ -4055,7 +4055,7 @@
4055
  </port>
4056
  </output>
4057
  </layer>
4058
- <layer id="263" name="Constant_31627" type="Convert" version="opset1">
4059
  <data destination_type="f32" />
4060
  <rt_info>
4061
  <attribute name="decompression" version="0" />
@@ -4097,7 +4097,7 @@
4097
  </port>
4098
  </output>
4099
  </layer>
4100
- <layer id="265" name="Constant_31876" type="Const" version="opset1">
4101
  <data element_type="i64" shape="4" offset="137208364" size="32" />
4102
  <rt_info>
4103
  <attribute name="precise" version="0" />
@@ -4348,7 +4348,7 @@
4348
  </port>
4349
  </output>
4350
  </layer>
4351
- <layer id="280" name="Constant_31628_compressed" type="Const" version="opset1">
4352
  <data element_type="f16" shape="1, 1, 1280" offset="209354434" size="2560" />
4353
  <output>
4354
  <port id="0" precision="FP16">
@@ -4358,7 +4358,7 @@
4358
  </port>
4359
  </output>
4360
  </layer>
4361
- <layer id="281" name="Constant_31628" type="Convert" version="opset1">
4362
  <data destination_type="f32" />
4363
  <rt_info>
4364
  <attribute name="decompression" version="0" />
@@ -4504,7 +4504,7 @@
4504
  </port>
4505
  </output>
4506
  </layer>
4507
- <layer id="289" name="Constant_31877" type="Const" version="opset1">
4508
  <data element_type="i64" shape="3" offset="156884650" size="24" />
4509
  <rt_info>
4510
  <attribute name="precise" version="0" />
@@ -4584,7 +4584,7 @@
4584
  </port>
4585
  </output>
4586
  </layer>
4587
- <layer id="294" name="Constant_31629_compressed" type="Const" version="opset1">
4588
  <data element_type="f16" shape="1, 1, 1280" offset="212633794" size="2560" />
4589
  <output>
4590
  <port id="0" precision="FP16">
@@ -4594,7 +4594,7 @@
4594
  </port>
4595
  </output>
4596
  </layer>
4597
- <layer id="295" name="Constant_31629" type="Convert" version="opset1">
4598
  <data destination_type="f32" />
4599
  <rt_info>
4600
  <attribute name="decompression" version="0" />
@@ -4686,7 +4686,7 @@
4686
  </port>
4687
  </output>
4688
  </layer>
4689
- <layer id="300" name="Constant_31630_compressed" type="Const" version="opset1">
4690
  <data element_type="f16" shape="1, 1, 1280" offset="212636354" size="2560" />
4691
  <output>
4692
  <port id="0" precision="FP16">
@@ -4696,7 +4696,7 @@
4696
  </port>
4697
  </output>
4698
  </layer>
4699
- <layer id="301" name="Constant_31630" type="Convert" version="opset1">
4700
  <data destination_type="f32" />
4701
  <rt_info>
4702
  <attribute name="decompression" version="0" />
@@ -4738,7 +4738,7 @@
4738
  </port>
4739
  </output>
4740
  </layer>
4741
- <layer id="303" name="Constant_31631_compressed" type="Const" version="opset1">
4742
  <data element_type="f16" shape="1, 1, 1280" offset="212638914" size="2560" />
4743
  <output>
4744
  <port id="0" precision="FP16">
@@ -4748,7 +4748,7 @@
4748
  </port>
4749
  </output>
4750
  </layer>
4751
- <layer id="304" name="Constant_31631" type="Convert" version="opset1">
4752
  <data destination_type="f32" />
4753
  <rt_info>
4754
  <attribute name="decompression" version="0" />
@@ -4838,7 +4838,7 @@
4838
  </port>
4839
  </output>
4840
  </layer>
4841
- <layer id="309" name="Constant_31632_compressed" type="Const" version="opset1">
4842
  <data element_type="f16" shape="1, 1, 5120" offset="225748674" size="10240" />
4843
  <output>
4844
  <port id="0" precision="FP16">
@@ -4848,7 +4848,7 @@
4848
  </port>
4849
  </output>
4850
  </layer>
4851
- <layer id="310" name="Constant_31632" type="Convert" version="opset1">
4852
  <data destination_type="f32" />
4853
  <rt_info>
4854
  <attribute name="decompression" version="0" />
@@ -4955,7 +4955,7 @@
4955
  </port>
4956
  </output>
4957
  </layer>
4958
- <layer id="316" name="Constant_31633_compressed" type="Const" version="opset1">
4959
  <data element_type="f16" shape="1, 1, 1280" offset="238866114" size="2560" />
4960
  <output>
4961
  <port id="0" precision="FP16">
@@ -4965,7 +4965,7 @@
4965
  </port>
4966
  </output>
4967
  </layer>
4968
- <layer id="317" name="Constant_31633" type="Convert" version="opset1">
4969
  <data destination_type="f32" />
4970
  <rt_info>
4971
  <attribute name="decompression" version="0" />
@@ -5057,7 +5057,7 @@
5057
  </port>
5058
  </output>
5059
  </layer>
5060
- <layer id="322" name="Constant_31634_compressed" type="Const" version="opset1">
5061
  <data element_type="f16" shape="1, 1, 1280" offset="238868674" size="2560" />
5062
  <output>
5063
  <port id="0" precision="FP16">
@@ -5067,7 +5067,7 @@
5067
  </port>
5068
  </output>
5069
  </layer>
5070
- <layer id="323" name="Constant_31634" type="Convert" version="opset1">
5071
  <data destination_type="f32" />
5072
  <rt_info>
5073
  <attribute name="decompression" version="0" />
@@ -5109,7 +5109,7 @@
5109
  </port>
5110
  </output>
5111
  </layer>
5112
- <layer id="325" name="Constant_31635_compressed" type="Const" version="opset1">
5113
  <data element_type="f16" shape="1, 1, 1280" offset="238871234" size="2560" />
5114
  <output>
5115
  <port id="0" precision="FP16">
@@ -5119,7 +5119,7 @@
5119
  </port>
5120
  </output>
5121
  </layer>
5122
- <layer id="326" name="Constant_31635" type="Convert" version="opset1">
5123
  <data destination_type="f32" />
5124
  <rt_info>
5125
  <attribute name="decompression" version="0" />
@@ -5182,7 +5182,7 @@
5182
  </port>
5183
  </output>
5184
  </layer>
5185
- <layer id="329" name="Result_26430" type="Result" version="opset1">
5186
  <input>
5187
  <port id="0" precision="FP32">
5188
  <dim>-1</dim>
@@ -5558,16 +5558,16 @@
5558
  <edge from-layer="328" from-port="2" to-layer="329" to-port="0" />
5559
  </edges>
5560
  <rt_info>
5561
- <Runtime_version value="2024.5.0-16901-32aaa2fbd96" />
5562
  <conversion_parameters>
5563
  <framework value="pytorch" />
5564
  <is_python_object value="True" />
5565
  </conversion_parameters>
5566
  <optimum>
5567
- <optimum_intel_version value="1.20.0.dev0+2559620" />
5568
- <optimum_version value="1.23.1" />
5569
- <pytorch_version value="2.5.0" />
5570
- <transformers_version value="4.45.2" />
5571
  </optimum>
5572
  </rt_info>
5573
  </net>
 
10
  </port>
11
  </output>
12
  </layer>
13
+ <layer id="0" name="Parameter_26704" type="Parameter" version="opset1">
14
  <data shape="?,?,?" element_type="f32" />
15
  <output>
16
  <port id="0" precision="FP32" names="encoder_hidden_states">
 
47
  </port>
48
  </output>
49
  </layer>
50
+ <layer id="4" name="Constant_32205" type="Const" version="opset1">
51
  <data element_type="i64" shape="2" offset="132776960" size="16" />
52
  <rt_info>
53
  <attribute name="precise" version="0" />
 
151
  <port id="0" precision="I64" names="23" />
152
  </output>
153
  </layer>
154
+ <layer id="12" name="ShapeOf_32121" type="ShapeOf" version="opset3">
155
  <data output_type="i64" />
156
  <input>
157
  <port id="0" precision="I64">
 
165
  </port>
166
  </output>
167
  </layer>
168
+ <layer id="13" name="Constant_32122" type="Const" version="opset1">
169
  <data element_type="i64" shape="" offset="133923868" size="8" />
170
  <rt_info>
171
  <attribute name="precise" version="0" />
 
174
  <port id="0" precision="I64" />
175
  </output>
176
  </layer>
177
+ <layer id="14" name="Constant_32123" type="Const" version="opset1">
178
  <data element_type="i64" shape="" offset="133923860" size="8" />
179
  <rt_info>
180
  <attribute name="precise" version="0" />
 
183
  <port id="0" precision="I64" />
184
  </output>
185
  </layer>
186
+ <layer id="15" name="Gather_32124" type="Gather" version="opset8">
187
  <data batch_dims="0" />
188
  <input>
189
  <port id="0" precision="I64">
 
244
  </port>
245
  </output>
246
  </layer>
247
+ <layer id="20" name="__module.model.model.decoder.embed_positions/aten::index/Constant" type="Const" version="opset1">
248
  <data element_type="i32" shape="" offset="132776976" size="4" />
249
  <output>
250
  <port id="0" precision="I32" />
 
321
  </port>
322
  </output>
323
  </layer>
324
+ <layer id="25" name="Constant_31887_compressed" type="Const" version="opset1">
325
  <data element_type="f16" shape="1, 1, 1280" offset="133923884" size="2560" />
326
  <output>
327
  <port id="0" precision="FP16">
 
331
  </port>
332
  </output>
333
  </layer>
334
+ <layer id="26" name="Constant_31887" type="Convert" version="opset1">
335
  <data destination_type="f32" />
336
  <rt_info>
337
  <attribute name="decompression" version="0" />
 
373
  </port>
374
  </output>
375
  </layer>
376
+ <layer id="28" name="Constant_31888_compressed" type="Const" version="opset1">
377
  <data element_type="f16" shape="1, 1, 1280" offset="133926444" size="2560" />
378
  <output>
379
  <port id="0" precision="FP16">
 
383
  </port>
384
  </output>
385
  </layer>
386
+ <layer id="29" name="Constant_31888" type="Convert" version="opset1">
387
  <data destination_type="f32" />
388
  <rt_info>
389
  <attribute name="decompression" version="0" />
 
425
  </port>
426
  </output>
427
  </layer>
428
+ <layer id="31" name="Constant_31790_compressed" type="Const" version="opset1">
429
  <data element_type="f16" shape="1280, 1280" offset="133929004" size="3276800" />
430
  <output>
431
  <port id="0" precision="FP16">
 
434
  </port>
435
  </output>
436
  </layer>
437
+ <layer id="32" name="Constant_31790" type="Convert" version="opset1">
438
  <data destination_type="f32" />
439
  <rt_info>
440
  <attribute name="decompression" version="0" />
 
452
  </port>
453
  </output>
454
  </layer>
455
+ <layer id="33" name="Multiply_31773" type="MatMul" version="opset1">
456
  <data transpose_a="false" transpose_b="true" />
457
  <input>
458
  <port id="0" precision="FP32">
 
473
  </port>
474
  </output>
475
  </layer>
476
+ <layer id="34" name="Constant_31889_compressed" type="Const" version="opset1">
477
  <data element_type="f16" shape="1, 1, 1280" offset="137205804" size="2560" />
478
  <output>
479
  <port id="0" precision="FP16">
 
483
  </port>
484
  </output>
485
  </layer>
486
+ <layer id="35" name="Constant_31889" type="Convert" version="opset1">
487
  <data destination_type="f32" />
488
  <rt_info>
489
  <attribute name="decompression" version="0" />
 
525
  </port>
526
  </output>
527
  </layer>
528
+ <layer id="37" name="Constant_32206" type="Const" version="opset1">
529
  <data element_type="i64" shape="4" offset="137208364" size="32" />
530
  <rt_info>
531
  <attribute name="precise" version="0" />
 
634
  </port>
635
  </output>
636
  </layer>
637
+ <layer id="44" name="Constant_32207" type="Const" version="opset1">
638
  <data element_type="i64" shape="4" offset="137208364" size="32" />
639
  <rt_info>
640
  <attribute name="precise" version="0" />
 
726
  <port id="0" precision="I32" />
727
  </output>
728
  </layer>
729
+ <layer id="50" name="17" type="Const" version="opset1">
730
  <data element_type="f32" shape="" offset="140485212" size="4" />
731
  <output>
732
+ <port id="0" precision="FP32" names="17" />
733
  </output>
734
  </layer>
735
+ <layer id="51" name="Constant_32145" type="Const" version="opset1">
736
  <data element_type="i64" shape="1" offset="133923868" size="8" />
737
  <rt_info>
738
  <attribute name="precise" version="0" />
 
743
  </port>
744
  </output>
745
  </layer>
746
+ <layer id="52" name="Reshape_32146" type="Reshape" version="opset1">
747
  <data special_zero="false" />
748
  <input>
749
  <port id="0" precision="I64" />
 
776
  <port id="2" precision="I64" names="62,64" />
777
  </output>
778
  </layer>
779
+ <layer id="55" name="Constant_24581" type="Const" version="opset1">
780
  <data element_type="i32" shape="" offset="132776976" size="4" />
781
  <rt_info>
782
  <attribute name="precise" version="0" />
 
785
  <port id="0" precision="I32" />
786
  </output>
787
  </layer>
788
+ <layer id="56" name="Unsqueeze_24582" type="Unsqueeze" version="opset1">
789
  <input>
790
  <port id="0" precision="I64" />
791
  <port id="1" precision="I32" />
 
827
  </port>
828
  </output>
829
  </layer>
830
+ <layer id="59" name="ShapeOf_32152" type="ShapeOf" version="opset3">
831
  <data output_type="i32" />
832
  <input>
833
  <port id="0" precision="FP32">
 
841
  </port>
842
  </output>
843
  </layer>
844
+ <layer id="60" name="Constant_32153" type="Const" version="opset1">
845
  <data element_type="i64" shape="" offset="133923868" size="8" />
846
  <output>
847
  <port id="0" precision="I64" />
848
  </output>
849
  </layer>
850
+ <layer id="61" name="Constant_32154" type="Const" version="opset1">
851
  <data element_type="i64" shape="" offset="133923860" size="8" />
852
  <output>
853
  <port id="0" precision="I64" />
854
  </output>
855
  </layer>
856
+ <layer id="62" name="Gather_32155" type="Gather" version="opset8">
857
  <data batch_dims="0" />
858
  <input>
859
  <port id="0" precision="I32">
 
905
  <port id="0" precision="I32" />
906
  </output>
907
  </layer>
908
+ <layer id="67" name="Convert_32158" type="Convert" version="opset1">
909
  <data destination_type="i32" />
910
  <input>
911
  <port id="0" precision="I64" />
 
1059
  </port>
1060
  </output>
1061
  </layer>
1062
+ <layer id="80" name="Constant_24684" type="Const" version="opset1">
1063
  <data element_type="i64" shape="2" offset="140485218" size="16" />
1064
  <rt_info>
1065
  <attribute name="precise" version="0" />
 
1179
  </port>
1180
  </output>
1181
  </layer>
1182
+ <layer id="88" name="Constant_32136" type="Const" version="opset1">
1183
  <data element_type="i64" shape="1" offset="133923860" size="8" />
1184
  <rt_info>
1185
  <attribute name="precise" version="0" />
 
1190
  </port>
1191
  </output>
1192
  </layer>
1193
+ <layer id="89" name="Constant_32137" type="Const" version="opset1">
1194
  <data element_type="i64" shape="" offset="133923860" size="8" />
1195
  <rt_info>
1196
  <attribute name="precise" version="0" />
 
1199
  <port id="0" precision="I64" />
1200
  </output>
1201
  </layer>
1202
+ <layer id="90" name="Gather_32138" type="Gather" version="opset8">
1203
  <data batch_dims="0" />
1204
  <input>
1205
  <port id="0" precision="I64">
 
1216
  </port>
1217
  </output>
1218
  </layer>
1219
+ <layer id="91" name="Constant_31122" type="Const" version="opset1">
1220
  <data element_type="i64" shape="1" offset="133923868" size="8" />
1221
  <rt_info>
1222
  <attribute name="precise" version="0" />
 
1227
  </port>
1228
  </output>
1229
  </layer>
1230
+ <layer id="92" name="Constant_31124" type="Const" version="opset1">
1231
  <data element_type="i64" shape="1" offset="133923868" size="8" />
1232
  <rt_info>
1233
  <attribute name="precise" version="0" />
 
1238
  </port>
1239
  </output>
1240
  </layer>
1241
+ <layer id="93" name="Constant_31126" type="Const" version="opset1">
1242
  <data element_type="i64" shape="1" offset="133923868" size="8" />
1243
  <rt_info>
1244
  <attribute name="precise" version="0" />
 
1293
  </port>
1294
  </output>
1295
  </layer>
1296
+ <layer id="96" name="Constant_25118" type="Const" version="opset1">
1297
  <data element_type="i64" shape="1" offset="133923860" size="8" />
1298
  <output>
1299
  <port id="0" precision="I64">
 
1301
  </port>
1302
  </output>
1303
  </layer>
1304
+ <layer id="97" name="ShapeOf_32167" type="ShapeOf" version="opset3">
1305
  <data output_type="i64" />
1306
  <input>
1307
  <port id="0" precision="FP32">
 
1316
  </port>
1317
  </output>
1318
  </layer>
1319
+ <layer id="98" name="Constant_32168" type="Const" version="opset1">
1320
  <data element_type="i64" shape="1" offset="133923868" size="8" />
1321
  <output>
1322
  <port id="0" precision="I64">
 
1324
  </port>
1325
  </output>
1326
  </layer>
1327
+ <layer id="99" name="Constant_32169" type="Const" version="opset1">
1328
  <data element_type="i64" shape="" offset="133923860" size="8" />
1329
  <output>
1330
  <port id="0" precision="I64" />
1331
  </output>
1332
  </layer>
1333
+ <layer id="100" name="Gather_32170" type="Gather" version="opset8">
1334
  <data batch_dims="0" />
1335
  <input>
1336
  <port id="0" precision="I64">
 
1347
  </port>
1348
  </output>
1349
  </layer>
1350
+ <layer id="101" name="Constant_25121" type="Const" version="opset1">
1351
  <data element_type="i64" shape="1" offset="133923868" size="8" />
1352
  <output>
1353
  <port id="0" precision="I64">
 
1485
  </port>
1486
  </output>
1487
  </layer>
1488
+ <layer id="109" name="Constant_31890_compressed" type="Const" version="opset1">
1489
  <data element_type="f16" shape="1, 1, 1280" offset="143762042" size="2560" />
1490
  <output>
1491
  <port id="0" precision="FP16">
 
1495
  </port>
1496
  </output>
1497
  </layer>
1498
+ <layer id="110" name="Constant_31890" type="Convert" version="opset1">
1499
  <data destination_type="f32" />
1500
  <rt_info>
1501
  <attribute name="decompression" version="0" />
 
1537
  </port>
1538
  </output>
1539
  </layer>
1540
+ <layer id="112" name="Constant_32208" type="Const" version="opset1">
1541
  <data element_type="i64" shape="4" offset="137208364" size="32" />
1542
  <rt_info>
1543
  <attribute name="precise" version="0" />
 
1652
  </port>
1653
  </output>
1654
  </layer>
1655
+ <layer id="119" name="Constant_32209" type="Const" version="opset1">
1656
  <data element_type="i64" shape="3" offset="143764602" size="24" />
1657
  <rt_info>
1658
  <attribute name="precise" version="0" />
 
1732
  </port>
1733
  </output>
1734
  </layer>
1735
+ <layer id="124" name="Constant_31891_compressed" type="Const" version="opset1">
1736
  <data element_type="f16" shape="1, 1, 1280" offset="147041426" size="2560" />
1737
  <output>
1738
  <port id="0" precision="FP16">
 
1742
  </port>
1743
  </output>
1744
  </layer>
1745
+ <layer id="125" name="Constant_31891" type="Convert" version="opset1">
1746
  <data destination_type="f32" />
1747
  <rt_info>
1748
  <attribute name="decompression" version="0" />
 
1834
  </port>
1835
  </output>
1836
  </layer>
1837
+ <layer id="130" name="Constant_31892_compressed" type="Const" version="opset1">
1838
  <data element_type="f16" shape="1, 1, 1280" offset="147043986" size="2560" />
1839
  <output>
1840
  <port id="0" precision="FP16">
 
1844
  </port>
1845
  </output>
1846
  </layer>
1847
+ <layer id="131" name="Constant_31892" type="Convert" version="opset1">
1848
  <data destination_type="f32" />
1849
  <rt_info>
1850
  <attribute name="decompression" version="0" />
 
1886
  </port>
1887
  </output>
1888
  </layer>
1889
+ <layer id="133" name="Constant_31893_compressed" type="Const" version="opset1">
1890
  <data element_type="f16" shape="1, 1, 1280" offset="147046546" size="2560" />
1891
  <output>
1892
  <port id="0" precision="FP16">
 
1896
  </port>
1897
  </output>
1898
  </layer>
1899
+ <layer id="134" name="Constant_31893" type="Convert" version="opset1">
1900
  <data destination_type="f32" />
1901
  <rt_info>
1902
  <attribute name="decompression" version="0" />
 
1938
  </port>
1939
  </output>
1940
  </layer>
1941
+ <layer id="136" name="Constant_31793_compressed" type="Const" version="opset1">
1942
  <data element_type="f16" shape="1280, 1280" offset="147049106" size="3276800" />
1943
  <output>
1944
  <port id="0" precision="FP16">
 
1947
  </port>
1948
  </output>
1949
  </layer>
1950
+ <layer id="137" name="Constant_31793" type="Convert" version="opset1">
1951
  <data destination_type="f32" />
1952
  <rt_info>
1953
  <attribute name="decompression" version="0" />
 
1965
  </port>
1966
  </output>
1967
  </layer>
1968
+ <layer id="138" name="Multiply_31777" type="MatMul" version="opset1">
1969
  <data transpose_a="false" transpose_b="true" />
1970
  <input>
1971
  <port id="0" precision="FP32">
 
1986
  </port>
1987
  </output>
1988
  </layer>
1989
+ <layer id="139" name="Constant_31894_compressed" type="Const" version="opset1">
1990
  <data element_type="f16" shape="1, 1, 1280" offset="150325906" size="2560" />
1991
  <output>
1992
  <port id="0" precision="FP16">
 
1996
  </port>
1997
  </output>
1998
  </layer>
1999
+ <layer id="140" name="Constant_31894" type="Convert" version="opset1">
2000
  <data destination_type="f32" />
2001
  <rt_info>
2002
  <attribute name="decompression" version="0" />
 
2038
  </port>
2039
  </output>
2040
  </layer>
2041
+ <layer id="142" name="Constant_32210" type="Const" version="opset1">
2042
  <data element_type="i64" shape="4" offset="137208364" size="32" />
2043
  <rt_info>
2044
  <attribute name="precise" version="0" />
 
2147
  </port>
2148
  </output>
2149
  </layer>
2150
+ <layer id="149" name="Constant_24866" type="Const" version="opset1">
2151
  <data element_type="i64" shape="1" offset="153605266" size="8" />
2152
  <rt_info>
2153
  <attribute name="precise" version="0" />
 
2158
  </port>
2159
  </output>
2160
  </layer>
2161
+ <layer id="150" name="Constant_24867" type="Const" version="opset1">
2162
  <data element_type="i64" shape="1" offset="153605274" size="8" />
2163
  <rt_info>
2164
  <attribute name="precise" version="0" />
 
2169
  </port>
2170
  </output>
2171
  </layer>
2172
+ <layer id="151" name="Constant_24868" type="Const" version="opset1">
2173
  <data element_type="i64" shape="1" offset="153605282" size="8" />
2174
  <rt_info>
2175
  <attribute name="precise" version="0" />
 
2180
  </port>
2181
  </output>
2182
  </layer>
2183
+ <layer id="152" name="__module.model.model.decoder.layers.0.self_attn/prim::ListConstruct_1" type="Concat" version="opset1">
2184
  <data axis="0" />
2185
  <input>
2186
  <port id="0" precision="I64">
 
2344
  </port>
2345
  </output>
2346
  </layer>
2347
+ <layer id="161" name="Constant_31895_compressed" type="Const" version="opset1">
2348
  <data element_type="f16" shape="1, 1, 1280" offset="156882090" size="2560" />
2349
  <output>
2350
  <port id="0" precision="FP16">
 
2354
  </port>
2355
  </output>
2356
  </layer>
2357
+ <layer id="162" name="Constant_31895" type="Convert" version="opset1">
2358
  <data destination_type="f32" />
2359
  <rt_info>
2360
  <attribute name="decompression" version="0" />
 
2500
  </port>
2501
  </output>
2502
  </layer>
2503
+ <layer id="170" name="Constant_32211" type="Const" version="opset1">
2504
  <data element_type="i64" shape="3" offset="156884650" size="24" />
2505
  <rt_info>
2506
  <attribute name="precise" version="0" />
 
2580
  </port>
2581
  </output>
2582
  </layer>
2583
+ <layer id="175" name="Constant_31896_compressed" type="Const" version="opset1">
2584
  <data element_type="f16" shape="1, 1, 1280" offset="160161474" size="2560" />
2585
  <output>
2586
  <port id="0" precision="FP16">
 
2590
  </port>
2591
  </output>
2592
  </layer>
2593
+ <layer id="176" name="Constant_31896" type="Convert" version="opset1">
2594
  <data destination_type="f32" />
2595
  <rt_info>
2596
  <attribute name="decompression" version="0" />
 
2682
  </port>
2683
  </output>
2684
  </layer>
2685
+ <layer id="181" name="Constant_31897_compressed" type="Const" version="opset1">
2686
  <data element_type="f16" shape="1, 1, 1280" offset="160164034" size="2560" />
2687
  <output>
2688
  <port id="0" precision="FP16">
 
2692
  </port>
2693
  </output>
2694
  </layer>
2695
+ <layer id="182" name="Constant_31897" type="Convert" version="opset1">
2696
  <data destination_type="f32" />
2697
  <rt_info>
2698
  <attribute name="decompression" version="0" />
 
2734
  </port>
2735
  </output>
2736
  </layer>
2737
+ <layer id="184" name="Constant_31898_compressed" type="Const" version="opset1">
2738
  <data element_type="f16" shape="1, 1, 1280" offset="160166594" size="2560" />
2739
  <output>
2740
  <port id="0" precision="FP16">
 
2744
  </port>
2745
  </output>
2746
  </layer>
2747
+ <layer id="185" name="Constant_31898" type="Convert" version="opset1">
2748
  <data destination_type="f32" />
2749
  <rt_info>
2750
  <attribute name="decompression" version="0" />
 
2834
  </port>
2835
  </output>
2836
  </layer>
2837
+ <layer id="190" name="Constant_31899_compressed" type="Const" version="opset1">
2838
  <data element_type="f16" shape="1, 1, 5120" offset="173276354" size="10240" />
2839
  <output>
2840
  <port id="0" precision="FP16">
 
2844
  </port>
2845
  </output>
2846
  </layer>
2847
+ <layer id="191" name="Constant_31899" type="Convert" version="opset1">
2848
  <data destination_type="f32" />
2849
  <rt_info>
2850
  <attribute name="decompression" version="0" />
 
2951
  </port>
2952
  </output>
2953
  </layer>
2954
+ <layer id="197" name="Constant_31900_compressed" type="Const" version="opset1">
2955
  <data element_type="f16" shape="1, 1, 1280" offset="186393794" size="2560" />
2956
  <output>
2957
  <port id="0" precision="FP16">
 
2961
  </port>
2962
  </output>
2963
  </layer>
2964
+ <layer id="198" name="Constant_31900" type="Convert" version="opset1">
2965
  <data destination_type="f32" />
2966
  <rt_info>
2967
  <attribute name="decompression" version="0" />
 
3053
  </port>
3054
  </output>
3055
  </layer>
3056
+ <layer id="203" name="Constant_31901_compressed" type="Const" version="opset1">
3057
  <data element_type="f16" shape="1, 1, 1280" offset="186396354" size="2560" />
3058
  <output>
3059
  <port id="0" precision="FP16">
 
3063
  </port>
3064
  </output>
3065
  </layer>
3066
+ <layer id="204" name="Constant_31901" type="Convert" version="opset1">
3067
  <data destination_type="f32" />
3068
  <rt_info>
3069
  <attribute name="decompression" version="0" />
 
3105
  </port>
3106
  </output>
3107
  </layer>
3108
+ <layer id="206" name="Constant_31902_compressed" type="Const" version="opset1">
3109
  <data element_type="f16" shape="1, 1, 1280" offset="186398914" size="2560" />
3110
  <output>
3111
  <port id="0" precision="FP16">
 
3115
  </port>
3116
  </output>
3117
  </layer>
3118
+ <layer id="207" name="Constant_31902" type="Convert" version="opset1">
3119
  <data destination_type="f32" />
3120
  <rt_info>
3121
  <attribute name="decompression" version="0" />
 
3157
  </port>
3158
  </output>
3159
  </layer>
3160
+ <layer id="209" name="Constant_31796_compressed" type="Const" version="opset1">
3161
  <data element_type="f16" shape="1280, 1280" offset="186401474" size="3276800" />
3162
  <output>
3163
  <port id="0" precision="FP16">
 
3166
  </port>
3167
  </output>
3168
  </layer>
3169
+ <layer id="210" name="Constant_31796" type="Convert" version="opset1">
3170
  <data destination_type="f32" />
3171
  <rt_info>
3172
  <attribute name="decompression" version="0" />
 
3184
  </port>
3185
  </output>
3186
  </layer>
3187
+ <layer id="211" name="Multiply_31781" type="MatMul" version="opset1">
3188
  <data transpose_a="false" transpose_b="true" />
3189
  <input>
3190
  <port id="0" precision="FP32">
 
3205
  </port>
3206
  </output>
3207
  </layer>
3208
+ <layer id="212" name="Constant_31903_compressed" type="Const" version="opset1">
3209
  <data element_type="f16" shape="1, 1, 1280" offset="189678274" size="2560" />
3210
  <output>
3211
  <port id="0" precision="FP16">
 
3215
  </port>
3216
  </output>
3217
  </layer>
3218
+ <layer id="213" name="Constant_31903" type="Convert" version="opset1">
3219
  <data destination_type="f32" />
3220
  <rt_info>
3221
  <attribute name="decompression" version="0" />
 
3257
  </port>
3258
  </output>
3259
  </layer>
3260
+ <layer id="215" name="Constant_32212" type="Const" version="opset1">
3261
  <data element_type="i64" shape="4" offset="137208364" size="32" />
3262
  <rt_info>
3263
  <attribute name="precise" version="0" />
 
3366
  </port>
3367
  </output>
3368
  </layer>
3369
+ <layer id="222" name="Constant_32213" type="Const" version="opset1">
3370
  <data element_type="i64" shape="4" offset="137208364" size="32" />
3371
  <rt_info>
3372
  <attribute name="precise" version="0" />
 
3544
  </port>
3545
  </output>
3546
  </layer>
3547
+ <layer id="232" name="Constant_31904_compressed" type="Const" version="opset1">
3548
  <data element_type="f16" shape="1, 1, 1280" offset="196234434" size="2560" />
3549
  <output>
3550
  <port id="0" precision="FP16">
 
3554
  </port>
3555
  </output>
3556
  </layer>
3557
+ <layer id="233" name="Constant_31904" type="Convert" version="opset1">
3558
  <data destination_type="f32" />
3559
  <rt_info>
3560
  <attribute name="decompression" version="0" />
 
3596
  </port>
3597
  </output>
3598
  </layer>
3599
+ <layer id="235" name="Constant_32214" type="Const" version="opset1">
3600
  <data element_type="i64" shape="4" offset="137208364" size="32" />
3601
  <rt_info>
3602
  <attribute name="precise" version="0" />
 
3711
  </port>
3712
  </output>
3713
  </layer>
3714
+ <layer id="242" name="Constant_32215" type="Const" version="opset1">
3715
  <data element_type="i64" shape="3" offset="143764602" size="24" />
3716
  <rt_info>
3717
  <attribute name="precise" version="0" />
 
3791
  </port>
3792
  </output>
3793
  </layer>
3794
+ <layer id="247" name="Constant_31905_compressed" type="Const" version="opset1">
3795
  <data element_type="f16" shape="1, 1, 1280" offset="199513794" size="2560" />
3796
  <output>
3797
  <port id="0" precision="FP16">
 
3801
  </port>
3802
  </output>
3803
  </layer>
3804
+ <layer id="248" name="Constant_31905" type="Convert" version="opset1">
3805
  <data destination_type="f32" />
3806
  <rt_info>
3807
  <attribute name="decompression" version="0" />
 
3893
  </port>
3894
  </output>
3895
  </layer>
3896
+ <layer id="253" name="Constant_31906_compressed" type="Const" version="opset1">
3897
  <data element_type="f16" shape="1, 1, 1280" offset="199516354" size="2560" />
3898
  <output>
3899
  <port id="0" precision="FP16">
 
3903
  </port>
3904
  </output>
3905
  </layer>
3906
+ <layer id="254" name="Constant_31906" type="Convert" version="opset1">
3907
  <data destination_type="f32" />
3908
  <rt_info>
3909
  <attribute name="decompression" version="0" />
 
3945
  </port>
3946
  </output>
3947
  </layer>
3948
+ <layer id="256" name="Constant_31907_compressed" type="Const" version="opset1">
3949
  <data element_type="f16" shape="1, 1, 1280" offset="199518914" size="2560" />
3950
  <output>
3951
  <port id="0" precision="FP16">
 
3955
  </port>
3956
  </output>
3957
  </layer>
3958
+ <layer id="257" name="Constant_31907" type="Convert" version="opset1">
3959
  <data destination_type="f32" />
3960
  <rt_info>
3961
  <attribute name="decompression" version="0" />
 
3997
  </port>
3998
  </output>
3999
  </layer>
4000
+ <layer id="259" name="Constant_31799_compressed" type="Const" version="opset1">
4001
  <data element_type="f16" shape="1280, 1280" offset="199521474" size="3276800" />
4002
  <output>
4003
  <port id="0" precision="FP16">
 
4006
  </port>
4007
  </output>
4008
  </layer>
4009
+ <layer id="260" name="Constant_31799" type="Convert" version="opset1">
4010
  <data destination_type="f32" />
4011
  <rt_info>
4012
  <attribute name="decompression" version="0" />
 
4024
  </port>
4025
  </output>
4026
  </layer>
4027
+ <layer id="261" name="Multiply_31785" type="MatMul" version="opset1">
4028
  <data transpose_a="false" transpose_b="true" />
4029
  <input>
4030
  <port id="0" precision="FP32">
 
4045
  </port>
4046
  </output>
4047
  </layer>
4048
+ <layer id="262" name="Constant_31908_compressed" type="Const" version="opset1">
4049
  <data element_type="f16" shape="1, 1, 1280" offset="202798274" size="2560" />
4050
  <output>
4051
  <port id="0" precision="FP16">
 
4055
  </port>
4056
  </output>
4057
  </layer>
4058
+ <layer id="263" name="Constant_31908" type="Convert" version="opset1">
4059
  <data destination_type="f32" />
4060
  <rt_info>
4061
  <attribute name="decompression" version="0" />
 
4097
  </port>
4098
  </output>
4099
  </layer>
4100
+ <layer id="265" name="Constant_32216" type="Const" version="opset1">
4101
  <data element_type="i64" shape="4" offset="137208364" size="32" />
4102
  <rt_info>
4103
  <attribute name="precise" version="0" />
 
4348
  </port>
4349
  </output>
4350
  </layer>
4351
+ <layer id="280" name="Constant_31909_compressed" type="Const" version="opset1">
4352
  <data element_type="f16" shape="1, 1, 1280" offset="209354434" size="2560" />
4353
  <output>
4354
  <port id="0" precision="FP16">
 
4358
  </port>
4359
  </output>
4360
  </layer>
4361
+ <layer id="281" name="Constant_31909" type="Convert" version="opset1">
4362
  <data destination_type="f32" />
4363
  <rt_info>
4364
  <attribute name="decompression" version="0" />
 
4504
  </port>
4505
  </output>
4506
  </layer>
4507
+ <layer id="289" name="Constant_32217" type="Const" version="opset1">
4508
  <data element_type="i64" shape="3" offset="156884650" size="24" />
4509
  <rt_info>
4510
  <attribute name="precise" version="0" />
 
4584
  </port>
4585
  </output>
4586
  </layer>
4587
+ <layer id="294" name="Constant_31910_compressed" type="Const" version="opset1">
4588
  <data element_type="f16" shape="1, 1, 1280" offset="212633794" size="2560" />
4589
  <output>
4590
  <port id="0" precision="FP16">
 
4594
  </port>
4595
  </output>
4596
  </layer>
4597
+ <layer id="295" name="Constant_31910" type="Convert" version="opset1">
4598
  <data destination_type="f32" />
4599
  <rt_info>
4600
  <attribute name="decompression" version="0" />
 
4686
  </port>
4687
  </output>
4688
  </layer>
4689
+ <layer id="300" name="Constant_31911_compressed" type="Const" version="opset1">
4690
  <data element_type="f16" shape="1, 1, 1280" offset="212636354" size="2560" />
4691
  <output>
4692
  <port id="0" precision="FP16">
 
4696
  </port>
4697
  </output>
4698
  </layer>
4699
+ <layer id="301" name="Constant_31911" type="Convert" version="opset1">
4700
  <data destination_type="f32" />
4701
  <rt_info>
4702
  <attribute name="decompression" version="0" />
 
4738
  </port>
4739
  </output>
4740
  </layer>
4741
+ <layer id="303" name="Constant_31912_compressed" type="Const" version="opset1">
4742
  <data element_type="f16" shape="1, 1, 1280" offset="212638914" size="2560" />
4743
  <output>
4744
  <port id="0" precision="FP16">
 
4748
  </port>
4749
  </output>
4750
  </layer>
4751
+ <layer id="304" name="Constant_31912" type="Convert" version="opset1">
4752
  <data destination_type="f32" />
4753
  <rt_info>
4754
  <attribute name="decompression" version="0" />
 
4838
  </port>
4839
  </output>
4840
  </layer>
4841
+ <layer id="309" name="Constant_31913_compressed" type="Const" version="opset1">
4842
  <data element_type="f16" shape="1, 1, 5120" offset="225748674" size="10240" />
4843
  <output>
4844
  <port id="0" precision="FP16">
 
4848
  </port>
4849
  </output>
4850
  </layer>
4851
+ <layer id="310" name="Constant_31913" type="Convert" version="opset1">
4852
  <data destination_type="f32" />
4853
  <rt_info>
4854
  <attribute name="decompression" version="0" />
 
4955
  </port>
4956
  </output>
4957
  </layer>
4958
+ <layer id="316" name="Constant_31914_compressed" type="Const" version="opset1">
4959
  <data element_type="f16" shape="1, 1, 1280" offset="238866114" size="2560" />
4960
  <output>
4961
  <port id="0" precision="FP16">
 
4965
  </port>
4966
  </output>
4967
  </layer>
4968
+ <layer id="317" name="Constant_31914" type="Convert" version="opset1">
4969
  <data destination_type="f32" />
4970
  <rt_info>
4971
  <attribute name="decompression" version="0" />
 
5057
  </port>
5058
  </output>
5059
  </layer>
5060
+ <layer id="322" name="Constant_31915_compressed" type="Const" version="opset1">
5061
  <data element_type="f16" shape="1, 1, 1280" offset="238868674" size="2560" />
5062
  <output>
5063
  <port id="0" precision="FP16">
 
5067
  </port>
5068
  </output>
5069
  </layer>
5070
+ <layer id="323" name="Constant_31915" type="Convert" version="opset1">
5071
  <data destination_type="f32" />
5072
  <rt_info>
5073
  <attribute name="decompression" version="0" />
 
5109
  </port>
5110
  </output>
5111
  </layer>
5112
+ <layer id="325" name="Constant_31916_compressed" type="Const" version="opset1">
5113
  <data element_type="f16" shape="1, 1, 1280" offset="238871234" size="2560" />
5114
  <output>
5115
  <port id="0" precision="FP16">
 
5119
  </port>
5120
  </output>
5121
  </layer>
5122
+ <layer id="326" name="Constant_31916" type="Convert" version="opset1">
5123
  <data destination_type="f32" />
5124
  <rt_info>
5125
  <attribute name="decompression" version="0" />
 
5182
  </port>
5183
  </output>
5184
  </layer>
5185
+ <layer id="329" name="Result_26703" type="Result" version="opset1">
5186
  <input>
5187
  <port id="0" precision="FP32">
5188
  <dim>-1</dim>
 
5558
  <edge from-layer="328" from-port="2" to-layer="329" to-port="0" />
5559
  </edges>
5560
  <rt_info>
5561
+ <Runtime_version value="2024.5.0-17285-ea5c1dcfdf9-releases/2024/5" />
5562
  <conversion_parameters>
5563
  <framework value="pytorch" />
5564
  <is_python_object value="True" />
5565
  </conversion_parameters>
5566
  <optimum>
5567
+ <optimum_intel_version value="1.21.0.dev0+d357376" />
5568
+ <optimum_version value="1.23.3" />
5569
+ <pytorch_version value="2.5.1" />
5570
+ <transformers_version value="4.46.3" />
5571
  </optimum>
5572
  </rt_info>
5573
  </net>
openvino_detokenizer.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b55ac04e90f19fede391281a9e5a90169fc646e1e302fe1208c782282b51ceaa
3
  size 528306
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c95aa7a4b53ecb3768d2a6608aa9e419059aef1c75b9b99e6b1c56328281c18
3
  size 528306
openvino_detokenizer.xml CHANGED
@@ -1,16 +1,16 @@
1
  <?xml version="1.0"?>
2
  <net name="detokenizer" version="11">
3
  <layers>
4
- <layer id="0" name="Parameter_33240" type="Parameter" version="opset1">
5
  <data shape="?,?" element_type="i64" />
6
  <output>
7
- <port id="0" precision="I64" names="Parameter_33240">
8
  <dim>-1</dim>
9
  <dim>-1</dim>
10
  </port>
11
  </output>
12
  </layer>
13
- <layer id="1" name="Convert_33256" type="Convert" version="opset1">
14
  <data destination_type="i32" />
15
  <input>
16
  <port id="0" precision="I64">
@@ -25,7 +25,7 @@
25
  </port>
26
  </output>
27
  </layer>
28
- <layer id="2" name="Constant_33201" type="Const" version="opset1">
29
  <data element_type="u8" shape="528257" offset="0" size="528257" />
30
  <output>
31
  <port id="0" precision="U8">
@@ -33,7 +33,7 @@
33
  </port>
34
  </output>
35
  </layer>
36
- <layer id="3" name="StringTensorUnpack_33202" type="StringTensorUnpack" version="extension">
37
  <data mode="begins_ends" />
38
  <input>
39
  <port id="0" precision="U8">
@@ -52,7 +52,7 @@
52
  </port>
53
  </output>
54
  </layer>
55
- <layer id="4" name="VocabDecoder_33241" type="VocabDecoder" version="extension">
56
  <data skip_tokens="50257, 50258, 50259, 50260, 50261, 50262, 50263, 50264, 50265, 50266, 50267, 50268, 50269, 50270, 50271, 50272, 50273, 50274, 50275, 50276, 50277, 50278, 50279, 50280, 50281, 50282, 50283, 50284, 50285, 50286, 50287, 50288, 50289, 50290, 50291, 50292, 50293, 50294, 50295, 50296, 50297, 50298, 50299, 50300, 50301, 50302, 50303, 50304, 50305, 50306, 50307, 50308, 50309, 50310, 50311, 50312, 50313, 50314, 50315, 50316, 50317, 50318, 50319, 50320, 50321, 50322, 50323, 50324, 50325, 50326, 50327, 50328, 50329, 50330, 50331, 50332, 50333, 50334, 50335, 50336, 50337, 50338, 50339, 50340, 50341, 50342, 50343, 50344, 50345, 50346, 50347, 50348, 50349, 50350, 50351, 50352, 50353, 50354, 50355, 50356, 50357, 50358, 50359, 50360, 50361, 50362, 50363, 50364" />
57
  <input>
58
  <port id="0" precision="I32">
@@ -87,7 +87,7 @@
87
  </port>
88
  </output>
89
  </layer>
90
- <layer id="5" name="FuzeRagged_33242" type="FuzeRagged" version="extension">
91
  <input>
92
  <port id="0" precision="I32">
93
  <dim>-1</dim>
@@ -111,7 +111,7 @@
111
  </port>
112
  </output>
113
  </layer>
114
- <layer id="6" name="Constant_33244" type="Const" version="opset1">
115
  <data element_type="u8" shape="47" offset="528257" size="47" />
116
  <output>
117
  <port id="0" precision="U8">
@@ -119,7 +119,7 @@
119
  </port>
120
  </output>
121
  </layer>
122
- <layer id="7" name="Constant_33246" type="Const" version="opset1">
123
  <data element_type="u8" shape="2" offset="528304" size="2" />
124
  <output>
125
  <port id="0" precision="U8">
@@ -127,7 +127,7 @@
127
  </port>
128
  </output>
129
  </layer>
130
- <layer id="8" name="RegexNormalization_33247" type="RegexNormalization" version="extension">
131
  <data global_replace="true" />
132
  <input>
133
  <port id="0" precision="I32">
@@ -158,7 +158,7 @@
158
  </port>
159
  </output>
160
  </layer>
161
- <layer id="9" name="StringTensorPack_33248" type="StringTensorPack" version="extension">
162
  <data mode="begins_ends" />
163
  <input>
164
  <port id="0" precision="I32">
@@ -177,7 +177,7 @@
177
  </port>
178
  </output>
179
  </layer>
180
- <layer id="10" name="Result_33249" type="Result" version="opset1">
181
  <input>
182
  <port id="0" precision="STRING">
183
  <dim>-1</dim>
@@ -207,9 +207,29 @@
207
  <edge from-layer="9" from-port="3" to-layer="10" to-port="0" />
208
  </edges>
209
  <rt_info>
 
 
 
210
  <bos_token_id value="50257" />
 
 
211
  <eos_token_id value="50257" />
 
 
 
 
212
  <original_tokenizer_class value="&lt;class 'transformers.models.whisper.tokenization_whisper_fast.WhisperTokenizerFast'>" />
213
  <pad_token_id value="50257" />
 
 
 
 
 
 
 
 
 
 
 
214
  </rt_info>
215
  </net>
 
1
  <?xml version="1.0"?>
2
  <net name="detokenizer" version="11">
3
  <layers>
4
+ <layer id="0" name="Parameter_33580" type="Parameter" version="opset1">
5
  <data shape="?,?" element_type="i64" />
6
  <output>
7
+ <port id="0" precision="I64" names="Parameter_33580">
8
  <dim>-1</dim>
9
  <dim>-1</dim>
10
  </port>
11
  </output>
12
  </layer>
13
+ <layer id="1" name="Convert_33596" type="Convert" version="opset1">
14
  <data destination_type="i32" />
15
  <input>
16
  <port id="0" precision="I64">
 
25
  </port>
26
  </output>
27
  </layer>
28
+ <layer id="2" name="Constant_33541" type="Const" version="opset1">
29
  <data element_type="u8" shape="528257" offset="0" size="528257" />
30
  <output>
31
  <port id="0" precision="U8">
 
33
  </port>
34
  </output>
35
  </layer>
36
+ <layer id="3" name="StringTensorUnpack_33542" type="StringTensorUnpack" version="extension">
37
  <data mode="begins_ends" />
38
  <input>
39
  <port id="0" precision="U8">
 
52
  </port>
53
  </output>
54
  </layer>
55
+ <layer id="4" name="VocabDecoder_33581" type="VocabDecoder" version="extension">
56
  <data skip_tokens="50257, 50258, 50259, 50260, 50261, 50262, 50263, 50264, 50265, 50266, 50267, 50268, 50269, 50270, 50271, 50272, 50273, 50274, 50275, 50276, 50277, 50278, 50279, 50280, 50281, 50282, 50283, 50284, 50285, 50286, 50287, 50288, 50289, 50290, 50291, 50292, 50293, 50294, 50295, 50296, 50297, 50298, 50299, 50300, 50301, 50302, 50303, 50304, 50305, 50306, 50307, 50308, 50309, 50310, 50311, 50312, 50313, 50314, 50315, 50316, 50317, 50318, 50319, 50320, 50321, 50322, 50323, 50324, 50325, 50326, 50327, 50328, 50329, 50330, 50331, 50332, 50333, 50334, 50335, 50336, 50337, 50338, 50339, 50340, 50341, 50342, 50343, 50344, 50345, 50346, 50347, 50348, 50349, 50350, 50351, 50352, 50353, 50354, 50355, 50356, 50357, 50358, 50359, 50360, 50361, 50362, 50363, 50364" />
57
  <input>
58
  <port id="0" precision="I32">
 
87
  </port>
88
  </output>
89
  </layer>
90
+ <layer id="5" name="FuzeRagged_33582" type="FuzeRagged" version="extension">
91
  <input>
92
  <port id="0" precision="I32">
93
  <dim>-1</dim>
 
111
  </port>
112
  </output>
113
  </layer>
114
+ <layer id="6" name="Constant_33584" type="Const" version="opset1">
115
  <data element_type="u8" shape="47" offset="528257" size="47" />
116
  <output>
117
  <port id="0" precision="U8">
 
119
  </port>
120
  </output>
121
  </layer>
122
+ <layer id="7" name="Constant_33586" type="Const" version="opset1">
123
  <data element_type="u8" shape="2" offset="528304" size="2" />
124
  <output>
125
  <port id="0" precision="U8">
 
127
  </port>
128
  </output>
129
  </layer>
130
+ <layer id="8" name="RegexNormalization_33587" type="RegexNormalization" version="extension">
131
  <data global_replace="true" />
132
  <input>
133
  <port id="0" precision="I32">
 
158
  </port>
159
  </output>
160
  </layer>
161
+ <layer id="9" name="StringTensorPack_33588" type="StringTensorPack" version="extension">
162
  <data mode="begins_ends" />
163
  <input>
164
  <port id="0" precision="I32">
 
177
  </port>
178
  </output>
179
  </layer>
180
+ <layer id="10" name="Result_33589" type="Result" version="opset1">
181
  <input>
182
  <port id="0" precision="STRING">
183
  <dim>-1</dim>
 
207
  <edge from-layer="9" from-port="3" to-layer="10" to-port="0" />
208
  </edges>
209
  <rt_info>
210
+ <add_attention_mask value="True" />
211
+ <add_prefix_space />
212
+ <add_special_tokens value="True" />
213
  <bos_token_id value="50257" />
214
+ <clean_up_tokenization_spaces />
215
+ <detokenizer_input_type value="i64" />
216
  <eos_token_id value="50257" />
217
+ <handle_special_tokens_with_re />
218
+ <number_of_inputs value="1" />
219
+ <openvino_tokenizers_version value="2024.5.0.0" />
220
+ <openvino_version value="2024.5.0" />
221
  <original_tokenizer_class value="&lt;class 'transformers.models.whisper.tokenization_whisper_fast.WhisperTokenizerFast'>" />
222
  <pad_token_id value="50257" />
223
+ <sentencepiece_version value="0.2.0" />
224
+ <skip_special_tokens value="True" />
225
+ <streaming_detokenizer value="False" />
226
+ <tiktoken_version value="0.8.0" />
227
+ <tokenizer_output_type value="i64" />
228
+ <tokenizers_version value="0.20.3" />
229
+ <transformers_version value="4.46.3" />
230
+ <use_max_padding value="False" />
231
+ <use_sentencepiece_backend value="False" />
232
+ <utf8_replace_mode />
233
+ <with_detokenizer value="True" />
234
  </rt_info>
235
  </net>
openvino_encoder_model.xml CHANGED
The diff for this file is too large to render. See raw diff
 
openvino_tokenizer.xml CHANGED
@@ -1,27 +1,27 @@
1
  <?xml version="1.0"?>
2
  <net name="tokenizer" version="11">
3
  <layers>
4
- <layer id="0" name="Parameter_33120" type="Parameter" version="opset1">
5
  <data shape="?" element_type="string" />
6
  <output>
7
- <port id="0" precision="STRING" names="Parameter_33120">
8
  <dim>-1</dim>
9
  </port>
10
  </output>
11
  </layer>
12
- <layer id="1" name="Constant_33218" type="Const" version="opset1">
13
  <data element_type="i32" shape="" offset="0" size="4" />
14
  <output>
15
  <port id="0" precision="I32" />
16
  </output>
17
  </layer>
18
- <layer id="2" name="Constant_33219" type="Const" version="opset1">
19
  <data element_type="i32" shape="" offset="4" size="4" />
20
  <output>
21
  <port id="0" precision="I32" />
22
  </output>
23
  </layer>
24
- <layer id="3" name="Constant_33220" type="Const" version="opset1">
25
  <data element_type="i32" shape="1" offset="8" size="4" />
26
  <output>
27
  <port id="0" precision="I32">
@@ -29,19 +29,19 @@
29
  </port>
30
  </output>
31
  </layer>
32
- <layer id="4" name="Constant_33221" type="Const" version="opset1">
33
  <data element_type="i32" shape="" offset="0" size="4" />
34
  <output>
35
  <port id="0" precision="I32" />
36
  </output>
37
  </layer>
38
- <layer id="5" name="Constant_33222" type="Const" version="opset1">
39
  <data element_type="i32" shape="" offset="4" size="4" />
40
  <output>
41
  <port id="0" precision="I32" />
42
  </output>
43
  </layer>
44
- <layer id="6" name="Constant_33223" type="Const" version="opset1">
45
  <data element_type="i32" shape="1" offset="12" size="4" />
46
  <output>
47
  <port id="0" precision="I32">
@@ -49,13 +49,13 @@
49
  </port>
50
  </output>
51
  </layer>
52
- <layer id="7" name="Constant_33126" type="Const" version="opset1">
53
  <data element_type="i64" shape="" offset="16" size="8" />
54
  <output>
55
  <port id="0" precision="I64" />
56
  </output>
57
  </layer>
58
- <layer id="8" name="StringTensorUnpack_33121" type="StringTensorUnpack" version="extension">
59
  <data mode="begins_ends" />
60
  <input>
61
  <port id="0" precision="STRING">
@@ -74,7 +74,7 @@
74
  </port>
75
  </output>
76
  </layer>
77
- <layer id="9" name="ShapeOf_33122" type="ShapeOf" version="opset3">
78
  <data output_type="i64" />
79
  <input>
80
  <port id="0" precision="I32">
@@ -87,19 +87,19 @@
87
  </port>
88
  </output>
89
  </layer>
90
- <layer id="10" name="Constant_33123" type="Const" version="opset1">
91
  <data element_type="i64" shape="" offset="16" size="8" />
92
  <output>
93
  <port id="0" precision="I64" />
94
  </output>
95
  </layer>
96
- <layer id="11" name="Constant_33124" type="Const" version="opset1">
97
  <data element_type="i64" shape="" offset="16" size="8" />
98
  <output>
99
  <port id="0" precision="I64" />
100
  </output>
101
  </layer>
102
- <layer id="12" name="Gather_33125" type="Gather" version="opset8">
103
  <data batch_dims="0" />
104
  <input>
105
  <port id="0" precision="I64">
@@ -112,13 +112,13 @@
112
  <port id="3" precision="I64" />
113
  </output>
114
  </layer>
115
- <layer id="13" name="Constant_33127" type="Const" version="opset1">
116
  <data element_type="i64" shape="" offset="24" size="8" />
117
  <output>
118
  <port id="0" precision="I64" />
119
  </output>
120
  </layer>
121
- <layer id="14" name="Range_33128" type="Range" version="opset4">
122
  <data output_type="i32" />
123
  <input>
124
  <port id="0" precision="I64" />
@@ -131,19 +131,19 @@
131
  </port>
132
  </output>
133
  </layer>
134
- <layer id="15" name="Constant_33129" type="Const" version="opset1">
135
  <data element_type="i64" shape="" offset="24" size="8" />
136
  <output>
137
  <port id="0" precision="I64" />
138
  </output>
139
  </layer>
140
- <layer id="16" name="Constant_33130" type="Const" version="opset1">
141
  <data element_type="i64" shape="" offset="24" size="8" />
142
  <output>
143
  <port id="0" precision="I64" />
144
  </output>
145
  </layer>
146
- <layer id="17" name="Add_33131" type="Add" version="opset1">
147
  <data auto_broadcast="numpy" />
148
  <input>
149
  <port id="0" precision="I64" />
@@ -153,13 +153,13 @@
153
  <port id="2" precision="I64" />
154
  </output>
155
  </layer>
156
- <layer id="18" name="Constant_33132" type="Const" version="opset1">
157
  <data element_type="i64" shape="" offset="24" size="8" />
158
  <output>
159
  <port id="0" precision="I64" />
160
  </output>
161
  </layer>
162
- <layer id="19" name="Range_33133" type="Range" version="opset4">
163
  <data output_type="i32" />
164
  <input>
165
  <port id="0" precision="I64" />
@@ -172,7 +172,7 @@
172
  </port>
173
  </output>
174
  </layer>
175
- <layer id="20" name="Constant_33195" type="Const" version="opset1">
176
  <data element_type="u8" shape="26491" offset="32" size="26491" />
177
  <output>
178
  <port id="0" precision="U8">
@@ -180,7 +180,7 @@
180
  </port>
181
  </output>
182
  </layer>
183
- <layer id="21" name="SpecialTokensSplit_33196" type="SpecialTokensSplit" version="extension">
184
  <input>
185
  <port id="0" precision="I32">
186
  <dim>-1</dim>
@@ -222,7 +222,7 @@
222
  </port>
223
  </output>
224
  </layer>
225
- <layer id="22" name="Constant_33198" type="Const" version="opset1">
226
  <data element_type="u8" shape="64" offset="26523" size="64" />
227
  <output>
228
  <port id="0" precision="U8">
@@ -230,7 +230,7 @@
230
  </port>
231
  </output>
232
  </layer>
233
- <layer id="23" name="RegexSplit_33199" type="RegexSplit" version="extension">
234
  <data behaviour="isolate" invert="false" max_splits="-1" />
235
  <input>
236
  <port id="0" precision="I32">
@@ -276,7 +276,7 @@
276
  </port>
277
  </output>
278
  </layer>
279
- <layer id="24" name="Constant_33201" type="Const" version="opset1">
280
  <data element_type="u8" shape="528257" offset="26587" size="528257" />
281
  <output>
282
  <port id="0" precision="U8">
@@ -284,7 +284,7 @@
284
  </port>
285
  </output>
286
  </layer>
287
- <layer id="25" name="StringTensorUnpack_33202" type="StringTensorUnpack" version="extension">
288
  <data mode="begins_ends" />
289
  <input>
290
  <port id="0" precision="U8">
@@ -303,7 +303,7 @@
303
  </port>
304
  </output>
305
  </layer>
306
- <layer id="26" name="Constant_33207" type="Const" version="opset1">
307
  <data element_type="u8" shape="369958" offset="554844" size="369958" />
308
  <output>
309
  <port id="0" precision="U8">
@@ -311,7 +311,7 @@
311
  </port>
312
  </output>
313
  </layer>
314
- <layer id="27" name="StringTensorUnpack_33208" type="StringTensorUnpack" version="extension">
315
  <data mode="begins_ends" />
316
  <input>
317
  <port id="0" precision="U8">
@@ -330,7 +330,7 @@
330
  </port>
331
  </output>
332
  </layer>
333
- <layer id="28" name="Constant_33210" type="Const" version="opset1">
334
  <data element_type="u8" shape="336859" offset="924802" size="336859" />
335
  <output>
336
  <port id="0" precision="U8">
@@ -338,7 +338,7 @@
338
  </port>
339
  </output>
340
  </layer>
341
- <layer id="29" name="StringTensorUnpack_33211" type="StringTensorUnpack" version="extension">
342
  <data mode="begins_ends" />
343
  <input>
344
  <port id="0" precision="U8">
@@ -357,7 +357,7 @@
357
  </port>
358
  </output>
359
  </layer>
360
- <layer id="30" name="Constant_33204" type="Const" version="opset1">
361
  <data element_type="u8" shape="20172" offset="1261661" size="20172" />
362
  <output>
363
  <port id="0" precision="U8">
@@ -365,7 +365,7 @@
365
  </port>
366
  </output>
367
  </layer>
368
- <layer id="31" name="StringTensorUnpack_33205" type="StringTensorUnpack" version="extension">
369
  <data mode="begins_ends" />
370
  <input>
371
  <port id="0" precision="U8">
@@ -384,7 +384,7 @@
384
  </port>
385
  </output>
386
  </layer>
387
- <layer id="32" name="Constant_33212" type="Const" version="opset1">
388
  <data element_type="i32" shape="1609" offset="1281833" size="6436" />
389
  <output>
390
  <port id="0" precision="I32">
@@ -392,7 +392,7 @@
392
  </port>
393
  </output>
394
  </layer>
395
- <layer id="33" name="BPETokenizer_33213" type="BPETokenizer" version="extension">
396
  <data unk_token="" fuse_unk="false" suffix_indicator="" end_suffix="" byte_fallback="false" cache_capacity="20000" />
397
  <input>
398
  <port id="0" precision="I32">
@@ -462,7 +462,7 @@
462
  </port>
463
  </output>
464
  </layer>
465
- <layer id="34" name="Subtract_33214" type="Subtract" version="opset1">
466
  <data auto_broadcast="numpy" />
467
  <input>
468
  <port id="0" precision="I32">
@@ -478,13 +478,13 @@
478
  </port>
479
  </output>
480
  </layer>
481
- <layer id="35" name="Constant_33215" type="Const" version="opset1">
482
  <data element_type="i32" shape="" offset="1288269" size="4" />
483
  <output>
484
  <port id="0" precision="I32" />
485
  </output>
486
  </layer>
487
- <layer id="36" name="Minimum_33216" type="Minimum" version="opset1">
488
  <data auto_broadcast="numpy" />
489
  <input>
490
  <port id="0" precision="I32">
@@ -498,7 +498,7 @@
498
  </port>
499
  </output>
500
  </layer>
501
- <layer id="37" name="Add_33217" type="Add" version="opset1">
502
  <data auto_broadcast="numpy" />
503
  <input>
504
  <port id="0" precision="I32">
@@ -514,19 +514,19 @@
514
  </port>
515
  </output>
516
  </layer>
517
- <layer id="38" name="Constant_33224" type="Const" version="opset1">
518
  <data element_type="i32" shape="" offset="0" size="4" />
519
  <output>
520
  <port id="0" precision="I32" />
521
  </output>
522
  </layer>
523
- <layer id="39" name="Constant_33225" type="Const" version="opset1">
524
  <data element_type="i32" shape="" offset="4" size="4" />
525
  <output>
526
  <port id="0" precision="I32" />
527
  </output>
528
  </layer>
529
- <layer id="40" name="Constant_33226" type="Const" version="opset1">
530
  <data element_type="i32" shape="1" offset="1288273" size="4" />
531
  <output>
532
  <port id="0" precision="I32">
@@ -534,7 +534,7 @@
534
  </port>
535
  </output>
536
  </layer>
537
- <layer id="41" name="Constant_33227" type="Const" version="opset1">
538
  <data element_type="i32" shape="4" offset="1288277" size="16" />
539
  <output>
540
  <port id="0" precision="I32">
@@ -542,7 +542,7 @@
542
  </port>
543
  </output>
544
  </layer>
545
- <layer id="42" name="CombineSegments_33228" type="CombineSegments" version="extension">
546
  <input>
547
  <port id="0" precision="I32" />
548
  <port id="1" precision="I32" />
@@ -593,7 +593,7 @@
593
  </port>
594
  </output>
595
  </layer>
596
- <layer id="43" name="Subtract_33229" type="Subtract" version="opset1">
597
  <data auto_broadcast="numpy" />
598
  <input>
599
  <port id="0" precision="I32">
@@ -609,13 +609,13 @@
609
  </port>
610
  </output>
611
  </layer>
612
- <layer id="44" name="Constant_33230" type="Const" version="opset1">
613
  <data element_type="i32" shape="" offset="0" size="4" />
614
  <output>
615
  <port id="0" precision="I32" />
616
  </output>
617
  </layer>
618
- <layer id="45" name="ReduceMax_33231" type="ReduceMax" version="opset1">
619
  <data keep_dims="false" />
620
  <input>
621
  <port id="0" precision="I32">
@@ -627,13 +627,13 @@
627
  <port id="2" precision="I32" />
628
  </output>
629
  </layer>
630
- <layer id="46" name="Constant_33232" type="Const" version="opset1">
631
  <data element_type="i32" shape="" offset="1288273" size="4" />
632
  <output>
633
  <port id="0" precision="I32" />
634
  </output>
635
  </layer>
636
- <layer id="47" name="RaggedToDense_33233" type="RaggedToDense" version="extension">
637
  <data pad_right="true" />
638
  <input>
639
  <port id="0" precision="I32">
@@ -659,7 +659,7 @@
659
  </port>
660
  </output>
661
  </layer>
662
- <layer id="48" name="Convert_33234" type="Convert" version="opset1">
663
  <data destination_type="i32" />
664
  <input>
665
  <port id="0" precision="BOOL">
@@ -674,7 +674,7 @@
674
  </port>
675
  </output>
676
  </layer>
677
- <layer id="49" name="Convert_33234" type="Convert" version="opset1">
678
  <data destination_type="i64" />
679
  <input>
680
  <port id="0" precision="I32">
@@ -689,7 +689,7 @@
689
  </port>
690
  </output>
691
  </layer>
692
- <layer id="51" name="RaggedToDense_33233.0" type="Convert" version="opset1">
693
  <data destination_type="i64" />
694
  <input>
695
  <port id="0" precision="I32">
@@ -704,7 +704,7 @@
704
  </port>
705
  </output>
706
  </layer>
707
- <layer id="52" name="Result_33237" type="Result" version="opset1">
708
  <input>
709
  <port id="0" precision="I64">
710
  <dim>-1</dim>
@@ -712,7 +712,7 @@
712
  </port>
713
  </input>
714
  </layer>
715
- <layer id="50" name="Result_33239" type="Result" version="opset1">
716
  <input>
717
  <port id="0" precision="I64">
718
  <dim>-1</dim>
@@ -805,9 +805,29 @@
805
  <edge from-layer="51" from-port="1" to-layer="52" to-port="0" />
806
  </edges>
807
  <rt_info>
 
 
 
808
  <bos_token_id value="50257" />
 
 
809
  <eos_token_id value="50257" />
 
 
 
 
810
  <original_tokenizer_class value="&lt;class 'transformers.models.whisper.tokenization_whisper_fast.WhisperTokenizerFast'>" />
811
  <pad_token_id value="50257" />
 
 
 
 
 
 
 
 
 
 
 
812
  </rt_info>
813
  </net>
 
1
  <?xml version="1.0"?>
2
  <net name="tokenizer" version="11">
3
  <layers>
4
+ <layer id="0" name="Parameter_33460" type="Parameter" version="opset1">
5
  <data shape="?" element_type="string" />
6
  <output>
7
+ <port id="0" precision="STRING" names="Parameter_33460">
8
  <dim>-1</dim>
9
  </port>
10
  </output>
11
  </layer>
12
+ <layer id="1" name="Constant_33558" type="Const" version="opset1">
13
  <data element_type="i32" shape="" offset="0" size="4" />
14
  <output>
15
  <port id="0" precision="I32" />
16
  </output>
17
  </layer>
18
+ <layer id="2" name="Constant_33559" type="Const" version="opset1">
19
  <data element_type="i32" shape="" offset="4" size="4" />
20
  <output>
21
  <port id="0" precision="I32" />
22
  </output>
23
  </layer>
24
+ <layer id="3" name="Constant_33560" type="Const" version="opset1">
25
  <data element_type="i32" shape="1" offset="8" size="4" />
26
  <output>
27
  <port id="0" precision="I32">
 
29
  </port>
30
  </output>
31
  </layer>
32
+ <layer id="4" name="Constant_33561" type="Const" version="opset1">
33
  <data element_type="i32" shape="" offset="0" size="4" />
34
  <output>
35
  <port id="0" precision="I32" />
36
  </output>
37
  </layer>
38
+ <layer id="5" name="Constant_33562" type="Const" version="opset1">
39
  <data element_type="i32" shape="" offset="4" size="4" />
40
  <output>
41
  <port id="0" precision="I32" />
42
  </output>
43
  </layer>
44
+ <layer id="6" name="Constant_33563" type="Const" version="opset1">
45
  <data element_type="i32" shape="1" offset="12" size="4" />
46
  <output>
47
  <port id="0" precision="I32">
 
49
  </port>
50
  </output>
51
  </layer>
52
+ <layer id="7" name="Constant_33466" type="Const" version="opset1">
53
  <data element_type="i64" shape="" offset="16" size="8" />
54
  <output>
55
  <port id="0" precision="I64" />
56
  </output>
57
  </layer>
58
+ <layer id="8" name="StringTensorUnpack_33461" type="StringTensorUnpack" version="extension">
59
  <data mode="begins_ends" />
60
  <input>
61
  <port id="0" precision="STRING">
 
74
  </port>
75
  </output>
76
  </layer>
77
+ <layer id="9" name="ShapeOf_33462" type="ShapeOf" version="opset3">
78
  <data output_type="i64" />
79
  <input>
80
  <port id="0" precision="I32">
 
87
  </port>
88
  </output>
89
  </layer>
90
+ <layer id="10" name="Constant_33463" type="Const" version="opset1">
91
  <data element_type="i64" shape="" offset="16" size="8" />
92
  <output>
93
  <port id="0" precision="I64" />
94
  </output>
95
  </layer>
96
+ <layer id="11" name="Constant_33464" type="Const" version="opset1">
97
  <data element_type="i64" shape="" offset="16" size="8" />
98
  <output>
99
  <port id="0" precision="I64" />
100
  </output>
101
  </layer>
102
+ <layer id="12" name="Gather_33465" type="Gather" version="opset8">
103
  <data batch_dims="0" />
104
  <input>
105
  <port id="0" precision="I64">
 
112
  <port id="3" precision="I64" />
113
  </output>
114
  </layer>
115
+ <layer id="13" name="Constant_33467" type="Const" version="opset1">
116
  <data element_type="i64" shape="" offset="24" size="8" />
117
  <output>
118
  <port id="0" precision="I64" />
119
  </output>
120
  </layer>
121
+ <layer id="14" name="Range_33468" type="Range" version="opset4">
122
  <data output_type="i32" />
123
  <input>
124
  <port id="0" precision="I64" />
 
131
  </port>
132
  </output>
133
  </layer>
134
+ <layer id="15" name="Constant_33469" type="Const" version="opset1">
135
  <data element_type="i64" shape="" offset="24" size="8" />
136
  <output>
137
  <port id="0" precision="I64" />
138
  </output>
139
  </layer>
140
+ <layer id="16" name="Constant_33470" type="Const" version="opset1">
141
  <data element_type="i64" shape="" offset="24" size="8" />
142
  <output>
143
  <port id="0" precision="I64" />
144
  </output>
145
  </layer>
146
+ <layer id="17" name="Add_33471" type="Add" version="opset1">
147
  <data auto_broadcast="numpy" />
148
  <input>
149
  <port id="0" precision="I64" />
 
153
  <port id="2" precision="I64" />
154
  </output>
155
  </layer>
156
+ <layer id="18" name="Constant_33472" type="Const" version="opset1">
157
  <data element_type="i64" shape="" offset="24" size="8" />
158
  <output>
159
  <port id="0" precision="I64" />
160
  </output>
161
  </layer>
162
+ <layer id="19" name="Range_33473" type="Range" version="opset4">
163
  <data output_type="i32" />
164
  <input>
165
  <port id="0" precision="I64" />
 
172
  </port>
173
  </output>
174
  </layer>
175
+ <layer id="20" name="Constant_33535" type="Const" version="opset1">
176
  <data element_type="u8" shape="26491" offset="32" size="26491" />
177
  <output>
178
  <port id="0" precision="U8">
 
180
  </port>
181
  </output>
182
  </layer>
183
+ <layer id="21" name="SpecialTokensSplit_33536" type="SpecialTokensSplit" version="extension">
184
  <input>
185
  <port id="0" precision="I32">
186
  <dim>-1</dim>
 
222
  </port>
223
  </output>
224
  </layer>
225
+ <layer id="22" name="Constant_33538" type="Const" version="opset1">
226
  <data element_type="u8" shape="64" offset="26523" size="64" />
227
  <output>
228
  <port id="0" precision="U8">
 
230
  </port>
231
  </output>
232
  </layer>
233
+ <layer id="23" name="RegexSplit_33539" type="RegexSplit" version="extension">
234
  <data behaviour="isolate" invert="false" max_splits="-1" />
235
  <input>
236
  <port id="0" precision="I32">
 
276
  </port>
277
  </output>
278
  </layer>
279
+ <layer id="24" name="Constant_33541" type="Const" version="opset1">
280
  <data element_type="u8" shape="528257" offset="26587" size="528257" />
281
  <output>
282
  <port id="0" precision="U8">
 
284
  </port>
285
  </output>
286
  </layer>
287
+ <layer id="25" name="StringTensorUnpack_33542" type="StringTensorUnpack" version="extension">
288
  <data mode="begins_ends" />
289
  <input>
290
  <port id="0" precision="U8">
 
303
  </port>
304
  </output>
305
  </layer>
306
+ <layer id="26" name="Constant_33547" type="Const" version="opset1">
307
  <data element_type="u8" shape="369958" offset="554844" size="369958" />
308
  <output>
309
  <port id="0" precision="U8">
 
311
  </port>
312
  </output>
313
  </layer>
314
+ <layer id="27" name="StringTensorUnpack_33548" type="StringTensorUnpack" version="extension">
315
  <data mode="begins_ends" />
316
  <input>
317
  <port id="0" precision="U8">
 
330
  </port>
331
  </output>
332
  </layer>
333
+ <layer id="28" name="Constant_33550" type="Const" version="opset1">
334
  <data element_type="u8" shape="336859" offset="924802" size="336859" />
335
  <output>
336
  <port id="0" precision="U8">
 
338
  </port>
339
  </output>
340
  </layer>
341
+ <layer id="29" name="StringTensorUnpack_33551" type="StringTensorUnpack" version="extension">
342
  <data mode="begins_ends" />
343
  <input>
344
  <port id="0" precision="U8">
 
357
  </port>
358
  </output>
359
  </layer>
360
+ <layer id="30" name="Constant_33544" type="Const" version="opset1">
361
  <data element_type="u8" shape="20172" offset="1261661" size="20172" />
362
  <output>
363
  <port id="0" precision="U8">
 
365
  </port>
366
  </output>
367
  </layer>
368
+ <layer id="31" name="StringTensorUnpack_33545" type="StringTensorUnpack" version="extension">
369
  <data mode="begins_ends" />
370
  <input>
371
  <port id="0" precision="U8">
 
384
  </port>
385
  </output>
386
  </layer>
387
+ <layer id="32" name="Constant_33552" type="Const" version="opset1">
388
  <data element_type="i32" shape="1609" offset="1281833" size="6436" />
389
  <output>
390
  <port id="0" precision="I32">
 
392
  </port>
393
  </output>
394
  </layer>
395
+ <layer id="33" name="BPETokenizer_33553" type="BPETokenizer" version="extension">
396
  <data unk_token="" fuse_unk="false" suffix_indicator="" end_suffix="" byte_fallback="false" cache_capacity="20000" />
397
  <input>
398
  <port id="0" precision="I32">
 
462
  </port>
463
  </output>
464
  </layer>
465
+ <layer id="34" name="Subtract_33554" type="Subtract" version="opset1">
466
  <data auto_broadcast="numpy" />
467
  <input>
468
  <port id="0" precision="I32">
 
478
  </port>
479
  </output>
480
  </layer>
481
+ <layer id="35" name="Constant_33555" type="Const" version="opset1">
482
  <data element_type="i32" shape="" offset="1288269" size="4" />
483
  <output>
484
  <port id="0" precision="I32" />
485
  </output>
486
  </layer>
487
+ <layer id="36" name="Minimum_33556" type="Minimum" version="opset1">
488
  <data auto_broadcast="numpy" />
489
  <input>
490
  <port id="0" precision="I32">
 
498
  </port>
499
  </output>
500
  </layer>
501
+ <layer id="37" name="Add_33557" type="Add" version="opset1">
502
  <data auto_broadcast="numpy" />
503
  <input>
504
  <port id="0" precision="I32">
 
514
  </port>
515
  </output>
516
  </layer>
517
+ <layer id="38" name="Constant_33564" type="Const" version="opset1">
518
  <data element_type="i32" shape="" offset="0" size="4" />
519
  <output>
520
  <port id="0" precision="I32" />
521
  </output>
522
  </layer>
523
+ <layer id="39" name="Constant_33565" type="Const" version="opset1">
524
  <data element_type="i32" shape="" offset="4" size="4" />
525
  <output>
526
  <port id="0" precision="I32" />
527
  </output>
528
  </layer>
529
+ <layer id="40" name="Constant_33566" type="Const" version="opset1">
530
  <data element_type="i32" shape="1" offset="1288273" size="4" />
531
  <output>
532
  <port id="0" precision="I32">
 
534
  </port>
535
  </output>
536
  </layer>
537
+ <layer id="41" name="Constant_33567" type="Const" version="opset1">
538
  <data element_type="i32" shape="4" offset="1288277" size="16" />
539
  <output>
540
  <port id="0" precision="I32">
 
542
  </port>
543
  </output>
544
  </layer>
545
+ <layer id="42" name="CombineSegments_33568" type="CombineSegments" version="extension">
546
  <input>
547
  <port id="0" precision="I32" />
548
  <port id="1" precision="I32" />
 
593
  </port>
594
  </output>
595
  </layer>
596
+ <layer id="43" name="Subtract_33569" type="Subtract" version="opset1">
597
  <data auto_broadcast="numpy" />
598
  <input>
599
  <port id="0" precision="I32">
 
609
  </port>
610
  </output>
611
  </layer>
612
+ <layer id="44" name="Constant_33570" type="Const" version="opset1">
613
  <data element_type="i32" shape="" offset="0" size="4" />
614
  <output>
615
  <port id="0" precision="I32" />
616
  </output>
617
  </layer>
618
+ <layer id="45" name="ReduceMax_33571" type="ReduceMax" version="opset1">
619
  <data keep_dims="false" />
620
  <input>
621
  <port id="0" precision="I32">
 
627
  <port id="2" precision="I32" />
628
  </output>
629
  </layer>
630
+ <layer id="46" name="Constant_33572" type="Const" version="opset1">
631
  <data element_type="i32" shape="" offset="1288273" size="4" />
632
  <output>
633
  <port id="0" precision="I32" />
634
  </output>
635
  </layer>
636
+ <layer id="47" name="RaggedToDense_33573" type="RaggedToDense" version="extension">
637
  <data pad_right="true" />
638
  <input>
639
  <port id="0" precision="I32">
 
659
  </port>
660
  </output>
661
  </layer>
662
+ <layer id="48" name="Convert_33574" type="Convert" version="opset1">
663
  <data destination_type="i32" />
664
  <input>
665
  <port id="0" precision="BOOL">
 
674
  </port>
675
  </output>
676
  </layer>
677
+ <layer id="49" name="Convert_33574" type="Convert" version="opset1">
678
  <data destination_type="i64" />
679
  <input>
680
  <port id="0" precision="I32">
 
689
  </port>
690
  </output>
691
  </layer>
692
+ <layer id="51" name="RaggedToDense_33573.0" type="Convert" version="opset1">
693
  <data destination_type="i64" />
694
  <input>
695
  <port id="0" precision="I32">
 
704
  </port>
705
  </output>
706
  </layer>
707
+ <layer id="52" name="Result_33577" type="Result" version="opset1">
708
  <input>
709
  <port id="0" precision="I64">
710
  <dim>-1</dim>
 
712
  </port>
713
  </input>
714
  </layer>
715
+ <layer id="50" name="Result_33579" type="Result" version="opset1">
716
  <input>
717
  <port id="0" precision="I64">
718
  <dim>-1</dim>
 
805
  <edge from-layer="51" from-port="1" to-layer="52" to-port="0" />
806
  </edges>
807
  <rt_info>
808
+ <add_attention_mask value="True" />
809
+ <add_prefix_space />
810
+ <add_special_tokens value="True" />
811
  <bos_token_id value="50257" />
812
+ <clean_up_tokenization_spaces />
813
+ <detokenizer_input_type value="i64" />
814
  <eos_token_id value="50257" />
815
+ <handle_special_tokens_with_re />
816
+ <number_of_inputs value="1" />
817
+ <openvino_tokenizers_version value="2024.5.0.0" />
818
+ <openvino_version value="2024.5.0" />
819
  <original_tokenizer_class value="&lt;class 'transformers.models.whisper.tokenization_whisper_fast.WhisperTokenizerFast'>" />
820
  <pad_token_id value="50257" />
821
+ <sentencepiece_version value="0.2.0" />
822
+ <skip_special_tokens value="True" />
823
+ <streaming_detokenizer value="False" />
824
+ <tiktoken_version value="0.8.0" />
825
+ <tokenizer_output_type value="i64" />
826
+ <tokenizers_version value="0.20.3" />
827
+ <transformers_version value="4.46.3" />
828
+ <use_max_padding value="False" />
829
+ <use_sentencepiece_backend value="False" />
830
+ <utf8_replace_mode />
831
+ <with_detokenizer value="True" />
832
  </rt_info>
833
  </net>