alexwengg commited on
Commit
cc7b0cd
·
verified ·
1 Parent(s): 21156b2

Upload 16 files

Browse files
G2PDecoder.mlpackage/Data/com.apple.CoreML/model.mlmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:153360a0a799c3e48b56456324f057557b69dedf183ae3d137b45c95df5b15b2
3
- size 17997
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3b2bfc025be6563494c66b3f9c1b62674741e392d14d92d2ecaeb1730643e50c
3
+ size 85095
G2PDecoder.mlpackage/Data/com.apple.CoreML/weights/weight.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cbaeb4e743359f607ab161af0c6d8a817462fdaec622ee788ef8ef952c5f8214
3
- size 828030
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:005b5ffbccabe4fd4074204d16af745b5d8f458a687b0c07e80060f7fe0a08e4
3
+ size 25977088
G2PDecoder.mlpackage/Manifest.json CHANGED
@@ -1,18 +1,18 @@
1
  {
2
  "fileFormatVersion": "1.0.0",
3
  "itemInfoEntries": {
4
- "4AA5D221-1355-4F3F-B188-7F8EF536155C": {
5
- "author": "com.apple.CoreML",
6
- "description": "CoreML Model Specification",
7
- "name": "model.mlmodel",
8
- "path": "com.apple.CoreML/model.mlmodel"
9
- },
10
- "5D000863-3BC2-4F18-AC66-6F1DE5E29001": {
11
  "author": "com.apple.CoreML",
12
  "description": "CoreML Model Weights",
13
  "name": "weights",
14
  "path": "com.apple.CoreML/weights"
 
 
 
 
 
 
15
  }
16
  },
17
- "rootModelIdentifier": "4AA5D221-1355-4F3F-B188-7F8EF536155C"
18
  }
 
1
  {
2
  "fileFormatVersion": "1.0.0",
3
  "itemInfoEntries": {
4
+ "837F74EA-4434-419F-AE52-FD61A69F6E0A": {
 
 
 
 
 
 
5
  "author": "com.apple.CoreML",
6
  "description": "CoreML Model Weights",
7
  "name": "weights",
8
  "path": "com.apple.CoreML/weights"
9
+ },
10
+ "FEF5E4E3-07B4-4F5A-BF3F-C4A2BB7E68E2": {
11
+ "author": "com.apple.CoreML",
12
+ "description": "CoreML Model Specification",
13
+ "name": "model.mlmodel",
14
+ "path": "com.apple.CoreML/model.mlmodel"
15
  }
16
  },
17
+ "rootModelIdentifier": "FEF5E4E3-07B4-4F5A-BF3F-C4A2BB7E68E2"
18
  }
G2PEncoder.mlpackage/Data/com.apple.CoreML/model.mlmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f51555b74730f0446406a50e3ee87dc4e2f0d759d2f095662880ac520a752fec
3
- size 20323
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:338ee3222fb062efddd1f85374d1aa15478b4975b74f90c59264ad961d9879a3
3
+ size 131789
G2PEncoder.mlpackage/Data/com.apple.CoreML/weights/weight.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6926bcd2827d21fec82839487b987e06f85fd8a6a5bb896bc4f6062461d014ec
3
- size 694592
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:11b225e93b6b1fe6fb85c9d4317724e1a033d6123fdc01dc2ad85f3c1f168eb3
3
+ size 57056704
G2PEncoder.mlpackage/Manifest.json CHANGED
@@ -1,18 +1,18 @@
1
  {
2
  "fileFormatVersion": "1.0.0",
3
  "itemInfoEntries": {
4
- "C03F7353-6672-47CD-9842-1F68630789D7": {
5
- "author": "com.apple.CoreML",
6
- "description": "CoreML Model Weights",
7
- "name": "weights",
8
- "path": "com.apple.CoreML/weights"
9
- },
10
- "D40EF921-64C1-4EEC-BF85-D226D10F6B90": {
11
  "author": "com.apple.CoreML",
12
  "description": "CoreML Model Specification",
13
  "name": "model.mlmodel",
14
  "path": "com.apple.CoreML/model.mlmodel"
 
 
 
 
 
 
15
  }
16
  },
17
- "rootModelIdentifier": "D40EF921-64C1-4EEC-BF85-D226D10F6B90"
18
  }
 
1
  {
2
  "fileFormatVersion": "1.0.0",
3
  "itemInfoEntries": {
4
+ "48AE8C97-A0EB-4155-AE9E-D179548FBDD0": {
 
 
 
 
 
 
5
  "author": "com.apple.CoreML",
6
  "description": "CoreML Model Specification",
7
  "name": "model.mlmodel",
8
  "path": "com.apple.CoreML/model.mlmodel"
9
+ },
10
+ "7760FC9D-D7D7-4E6E-8C85-EBF0D242EFC9": {
11
+ "author": "com.apple.CoreML",
12
+ "description": "CoreML Model Weights",
13
+ "name": "weights",
14
+ "path": "com.apple.CoreML/weights"
15
  }
16
  },
17
+ "rootModelIdentifier": "48AE8C97-A0EB-4155-AE9E-D179548FBDD0"
18
  }
MultilingualG2PDecoder.mlmodelc/analytics/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f34464b8c4e85cde3ca62bc7e22d1ab3eb7494c8aa72c220391c99800910856
3
+ size 243
MultilingualG2PDecoder.mlmodelc/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb5b5003066a66bde1b5bff980e3267453910b04f96ca7352c0adc996ae7df8f
3
+ size 507
MultilingualG2PDecoder.mlmodelc/metadata.json ADDED
@@ -0,0 +1,113 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "metadataOutputVersion" : "3.0",
4
+ "storagePrecision" : "Float32",
5
+ "outputSchema" : [
6
+ {
7
+ "hasShapeFlexibility" : "0",
8
+ "isOptional" : "0",
9
+ "dataType" : "Float32",
10
+ "formattedType" : "MultiArray (Float32)",
11
+ "shortDescription" : "",
12
+ "shape" : "[]",
13
+ "name" : "logits",
14
+ "type" : "MultiArray"
15
+ }
16
+ ],
17
+ "modelParameters" : [
18
+
19
+ ],
20
+ "specificationVersion" : 8,
21
+ "mlProgramOperationTypeHistogram" : {
22
+ "Range1d" : 2,
23
+ "Fill" : 2,
24
+ "Ios17.reshape" : 32,
25
+ "Ios16.reduceMean" : 13,
26
+ "Ios16.softmax" : 8,
27
+ "Ios17.matmul" : 16,
28
+ "Ios17.transpose" : 33,
29
+ "Select" : 3,
30
+ "Ios17.expandDims" : 11,
31
+ "Ios17.add" : 38,
32
+ "Tile" : 1,
33
+ "Ios17.lessEqual" : 1,
34
+ "Ios16.fillLike" : 1,
35
+ "Shape" : 4,
36
+ "Ios17.gather" : 6,
37
+ "Ios17.log" : 1,
38
+ "Ios17.cast" : 4,
39
+ "Ios17.sub" : 4,
40
+ "Ios17.pow" : 13,
41
+ "Ios17.less" : 1,
42
+ "Ios16.gelu" : 4,
43
+ "Ios17.linear" : 45,
44
+ "Ios17.concat" : 3,
45
+ "Ios17.greaterEqual" : 2,
46
+ "Ios17.minimum" : 2,
47
+ "Ios17.rsqrt" : 13,
48
+ "Ios17.mul" : 37
49
+ },
50
+ "computePrecision" : "Mixed (Float32, Int32)",
51
+ "isUpdatable" : "0",
52
+ "stateSchema" : [
53
+
54
+ ],
55
+ "availability" : {
56
+ "macOS" : "14.0",
57
+ "tvOS" : "17.0",
58
+ "visionOS" : "1.0",
59
+ "watchOS" : "10.0",
60
+ "iOS" : "17.0",
61
+ "macCatalyst" : "17.0"
62
+ },
63
+ "modelType" : {
64
+ "name" : "MLModelType_mlProgram"
65
+ },
66
+ "userDefinedMetadata" : {
67
+ "com.github.apple.coremltools.conversion_date" : "2026-03-13",
68
+ "com.github.apple.coremltools.source" : "torch==2.7.0",
69
+ "com.github.apple.coremltools.version" : "9.0",
70
+ "com.github.apple.coremltools.source_dialect" : "TorchScript"
71
+ },
72
+ "inputSchema" : [
73
+ {
74
+ "dataType" : "Int32",
75
+ "hasShapeFlexibility" : "1",
76
+ "isOptional" : "0",
77
+ "shapeFlexibility" : "1 × 1...128",
78
+ "shapeRange" : "[[1, 1], [1, 128]]",
79
+ "formattedType" : "MultiArray (Int32 1 × 8)",
80
+ "type" : "MultiArray",
81
+ "shape" : "[1, 8]",
82
+ "name" : "decoder_input_ids",
83
+ "shortDescription" : ""
84
+ },
85
+ {
86
+ "dataType" : "Float32",
87
+ "hasShapeFlexibility" : "1",
88
+ "isOptional" : "0",
89
+ "shapeFlexibility" : "1 × 1...64 × 256",
90
+ "shapeRange" : "[[1, 1], [1, 64], [256, 256]]",
91
+ "formattedType" : "MultiArray (Float32 1 × 16 × 256)",
92
+ "type" : "MultiArray",
93
+ "shape" : "[1, 16, 256]",
94
+ "name" : "encoder_hidden_states",
95
+ "shortDescription" : ""
96
+ },
97
+ {
98
+ "dataType" : "Int32",
99
+ "hasShapeFlexibility" : "1",
100
+ "isOptional" : "0",
101
+ "shapeFlexibility" : "1 × 1...64",
102
+ "shapeRange" : "[[1, 1], [1, 64]]",
103
+ "formattedType" : "MultiArray (Int32 1 × 16)",
104
+ "type" : "MultiArray",
105
+ "shape" : "[1, 16]",
106
+ "name" : "encoder_attention_mask",
107
+ "shortDescription" : ""
108
+ }
109
+ ],
110
+ "generatedClassName" : "G2PDecoder",
111
+ "method" : "predict"
112
+ }
113
+ ]
MultilingualG2PDecoder.mlmodelc/model.mil ADDED
@@ -0,0 +1,603 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ program(1.0)
2
+ [buildInfo = dict<tensor<string, []>, tensor<string, []>>({{"coremlc-component-MIL", "3510.2.1"}, {"coremlc-version", "3500.32.1"}, {"coremltools-component-torch", "2.7.0"}, {"coremltools-source-dialect", "TorchScript"}, {"coremltools-version", "9.0"}})]
3
+ {
4
+ func main<ios17>(tensor<int32, [1, ?]> decoder_input_ids, tensor<int32, [1, ?]> encoder_attention_mask, tensor<fp32, [1, ?, 256]> encoder_hidden_states) [FlexibleShapeInformation = tuple<tuple<tensor<string, []>, dict<tensor<string, []>, tensor<int32, [?]>>>, tuple<tensor<string, []>, dict<tensor<string, []>, list<tensor<int32, [2]>, ?>>>>((("DefaultShapes", {{"decoder_input_ids", [1, 8]}, {"encoder_attention_mask", [1, 16]}, {"encoder_hidden_states", [1, 16, 256]}}), ("RangeDims", {{"decoder_input_ids", [[1, 1], [1, 128]]}, {"encoder_attention_mask", [[1, 1], [1, 64]]}, {"encoder_hidden_states", [[1, 1], [1, 64], [256, 256]]}})))] {
5
+ tensor<fp32, [384, 256]> decoder_embed_tokens_weight = const()[name = tensor<string, []>("decoder_embed_tokens_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(64)))];
6
+ tensor<fp32, [256]> decoder_block_0_layer_0_layer_norm_weight = const()[name = tensor<string, []>("decoder_block_0_layer_0_layer_norm_weight"), val = tensor<fp32, [256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(393344)))];
7
+ tensor<fp32, [384, 256]> decoder_block_0_layer_0_SelfAttention_q_weight = const()[name = tensor<string, []>("decoder_block_0_layer_0_SelfAttention_q_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(394432)))];
8
+ tensor<fp32, [384, 256]> decoder_block_0_layer_0_SelfAttention_k_weight = const()[name = tensor<string, []>("decoder_block_0_layer_0_SelfAttention_k_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(787712)))];
9
+ tensor<fp32, [384, 256]> decoder_block_0_layer_0_SelfAttention_v_weight = const()[name = tensor<string, []>("decoder_block_0_layer_0_SelfAttention_v_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(1180992)))];
10
+ tensor<fp32, [32, 6]> decoder_block_0_layer_0_SelfAttention_relative_attention_bias_weight = const()[name = tensor<string, []>("decoder_block_0_layer_0_SelfAttention_relative_attention_bias_weight"), val = tensor<fp32, [32, 6]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(1574272)))];
11
+ tensor<fp32, [256, 384]> decoder_block_0_layer_0_SelfAttention_o_weight = const()[name = tensor<string, []>("decoder_block_0_layer_0_SelfAttention_o_weight"), val = tensor<fp32, [256, 384]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(1575104)))];
12
+ tensor<fp32, [256]> decoder_block_0_layer_1_layer_norm_weight = const()[name = tensor<string, []>("decoder_block_0_layer_1_layer_norm_weight"), val = tensor<fp32, [256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(1968384)))];
13
+ tensor<fp32, [384, 256]> decoder_block_0_layer_1_EncDecAttention_q_weight = const()[name = tensor<string, []>("decoder_block_0_layer_1_EncDecAttention_q_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(1969472)))];
14
+ tensor<fp32, [384, 256]> decoder_block_0_layer_1_EncDecAttention_k_weight = const()[name = tensor<string, []>("decoder_block_0_layer_1_EncDecAttention_k_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(2362752)))];
15
+ tensor<fp32, [384, 256]> decoder_block_0_layer_1_EncDecAttention_v_weight = const()[name = tensor<string, []>("decoder_block_0_layer_1_EncDecAttention_v_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(2756032)))];
16
+ tensor<fp32, [256, 384]> decoder_block_0_layer_1_EncDecAttention_o_weight = const()[name = tensor<string, []>("decoder_block_0_layer_1_EncDecAttention_o_weight"), val = tensor<fp32, [256, 384]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(3149312)))];
17
+ tensor<fp32, [256]> decoder_block_0_layer_2_layer_norm_weight = const()[name = tensor<string, []>("decoder_block_0_layer_2_layer_norm_weight"), val = tensor<fp32, [256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(3542592)))];
18
+ tensor<fp32, [1024, 256]> decoder_block_0_layer_2_DenseReluDense_wi_0_weight = const()[name = tensor<string, []>("decoder_block_0_layer_2_DenseReluDense_wi_0_weight"), val = tensor<fp32, [1024, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(3543680)))];
19
+ tensor<fp32, [1024, 256]> decoder_block_0_layer_2_DenseReluDense_wi_1_weight = const()[name = tensor<string, []>("decoder_block_0_layer_2_DenseReluDense_wi_1_weight"), val = tensor<fp32, [1024, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(4592320)))];
20
+ tensor<fp32, [256, 1024]> decoder_block_0_layer_2_DenseReluDense_wo_weight = const()[name = tensor<string, []>("decoder_block_0_layer_2_DenseReluDense_wo_weight"), val = tensor<fp32, [256, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(5640960)))];
21
+ tensor<fp32, [256]> decoder_block_1_layer_0_layer_norm_weight = const()[name = tensor<string, []>("decoder_block_1_layer_0_layer_norm_weight"), val = tensor<fp32, [256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(6689600)))];
22
+ tensor<fp32, [384, 256]> decoder_block_1_layer_0_SelfAttention_q_weight = const()[name = tensor<string, []>("decoder_block_1_layer_0_SelfAttention_q_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(6690688)))];
23
+ tensor<fp32, [384, 256]> decoder_block_1_layer_0_SelfAttention_k_weight = const()[name = tensor<string, []>("decoder_block_1_layer_0_SelfAttention_k_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(7083968)))];
24
+ tensor<fp32, [384, 256]> decoder_block_1_layer_0_SelfAttention_v_weight = const()[name = tensor<string, []>("decoder_block_1_layer_0_SelfAttention_v_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(7477248)))];
25
+ tensor<fp32, [256, 384]> decoder_block_1_layer_0_SelfAttention_o_weight = const()[name = tensor<string, []>("decoder_block_1_layer_0_SelfAttention_o_weight"), val = tensor<fp32, [256, 384]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(7870528)))];
26
+ tensor<fp32, [256]> decoder_block_1_layer_1_layer_norm_weight = const()[name = tensor<string, []>("decoder_block_1_layer_1_layer_norm_weight"), val = tensor<fp32, [256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(8263808)))];
27
+ tensor<fp32, [384, 256]> decoder_block_1_layer_1_EncDecAttention_q_weight = const()[name = tensor<string, []>("decoder_block_1_layer_1_EncDecAttention_q_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(8264896)))];
28
+ tensor<fp32, [384, 256]> decoder_block_1_layer_1_EncDecAttention_k_weight = const()[name = tensor<string, []>("decoder_block_1_layer_1_EncDecAttention_k_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(8658176)))];
29
+ tensor<fp32, [384, 256]> decoder_block_1_layer_1_EncDecAttention_v_weight = const()[name = tensor<string, []>("decoder_block_1_layer_1_EncDecAttention_v_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(9051456)))];
30
+ tensor<fp32, [256, 384]> decoder_block_1_layer_1_EncDecAttention_o_weight = const()[name = tensor<string, []>("decoder_block_1_layer_1_EncDecAttention_o_weight"), val = tensor<fp32, [256, 384]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(9444736)))];
31
+ tensor<fp32, [256]> decoder_block_1_layer_2_layer_norm_weight = const()[name = tensor<string, []>("decoder_block_1_layer_2_layer_norm_weight"), val = tensor<fp32, [256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(9838016)))];
32
+ tensor<fp32, [1024, 256]> decoder_block_1_layer_2_DenseReluDense_wi_0_weight = const()[name = tensor<string, []>("decoder_block_1_layer_2_DenseReluDense_wi_0_weight"), val = tensor<fp32, [1024, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(9839104)))];
33
+ tensor<fp32, [1024, 256]> decoder_block_1_layer_2_DenseReluDense_wi_1_weight = const()[name = tensor<string, []>("decoder_block_1_layer_2_DenseReluDense_wi_1_weight"), val = tensor<fp32, [1024, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(10887744)))];
34
+ tensor<fp32, [256, 1024]> decoder_block_1_layer_2_DenseReluDense_wo_weight = const()[name = tensor<string, []>("decoder_block_1_layer_2_DenseReluDense_wo_weight"), val = tensor<fp32, [256, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(11936384)))];
35
+ tensor<fp32, [256]> decoder_block_2_layer_0_layer_norm_weight = const()[name = tensor<string, []>("decoder_block_2_layer_0_layer_norm_weight"), val = tensor<fp32, [256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(12985024)))];
36
+ tensor<fp32, [384, 256]> decoder_block_2_layer_0_SelfAttention_q_weight = const()[name = tensor<string, []>("decoder_block_2_layer_0_SelfAttention_q_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(12986112)))];
37
+ tensor<fp32, [384, 256]> decoder_block_2_layer_0_SelfAttention_k_weight = const()[name = tensor<string, []>("decoder_block_2_layer_0_SelfAttention_k_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(13379392)))];
38
+ tensor<fp32, [384, 256]> decoder_block_2_layer_0_SelfAttention_v_weight = const()[name = tensor<string, []>("decoder_block_2_layer_0_SelfAttention_v_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(13772672)))];
39
+ tensor<fp32, [256, 384]> decoder_block_2_layer_0_SelfAttention_o_weight = const()[name = tensor<string, []>("decoder_block_2_layer_0_SelfAttention_o_weight"), val = tensor<fp32, [256, 384]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(14165952)))];
40
+ tensor<fp32, [256]> decoder_block_2_layer_1_layer_norm_weight = const()[name = tensor<string, []>("decoder_block_2_layer_1_layer_norm_weight"), val = tensor<fp32, [256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(14559232)))];
41
+ tensor<fp32, [384, 256]> decoder_block_2_layer_1_EncDecAttention_q_weight = const()[name = tensor<string, []>("decoder_block_2_layer_1_EncDecAttention_q_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(14560320)))];
42
+ tensor<fp32, [384, 256]> decoder_block_2_layer_1_EncDecAttention_k_weight = const()[name = tensor<string, []>("decoder_block_2_layer_1_EncDecAttention_k_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(14953600)))];
43
+ tensor<fp32, [384, 256]> decoder_block_2_layer_1_EncDecAttention_v_weight = const()[name = tensor<string, []>("decoder_block_2_layer_1_EncDecAttention_v_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(15346880)))];
44
+ tensor<fp32, [256, 384]> decoder_block_2_layer_1_EncDecAttention_o_weight = const()[name = tensor<string, []>("decoder_block_2_layer_1_EncDecAttention_o_weight"), val = tensor<fp32, [256, 384]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(15740160)))];
45
+ tensor<fp32, [256]> decoder_block_2_layer_2_layer_norm_weight = const()[name = tensor<string, []>("decoder_block_2_layer_2_layer_norm_weight"), val = tensor<fp32, [256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(16133440)))];
46
+ tensor<fp32, [1024, 256]> decoder_block_2_layer_2_DenseReluDense_wi_0_weight = const()[name = tensor<string, []>("decoder_block_2_layer_2_DenseReluDense_wi_0_weight"), val = tensor<fp32, [1024, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(16134528)))];
47
+ tensor<fp32, [1024, 256]> decoder_block_2_layer_2_DenseReluDense_wi_1_weight = const()[name = tensor<string, []>("decoder_block_2_layer_2_DenseReluDense_wi_1_weight"), val = tensor<fp32, [1024, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(17183168)))];
48
+ tensor<fp32, [256, 1024]> decoder_block_2_layer_2_DenseReluDense_wo_weight = const()[name = tensor<string, []>("decoder_block_2_layer_2_DenseReluDense_wo_weight"), val = tensor<fp32, [256, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(18231808)))];
49
+ tensor<fp32, [256]> decoder_block_3_layer_0_layer_norm_weight = const()[name = tensor<string, []>("decoder_block_3_layer_0_layer_norm_weight"), val = tensor<fp32, [256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(19280448)))];
50
+ tensor<fp32, [384, 256]> decoder_block_3_layer_0_SelfAttention_q_weight = const()[name = tensor<string, []>("decoder_block_3_layer_0_SelfAttention_q_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(19281536)))];
51
+ tensor<fp32, [384, 256]> decoder_block_3_layer_0_SelfAttention_k_weight = const()[name = tensor<string, []>("decoder_block_3_layer_0_SelfAttention_k_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(19674816)))];
52
+ tensor<fp32, [384, 256]> decoder_block_3_layer_0_SelfAttention_v_weight = const()[name = tensor<string, []>("decoder_block_3_layer_0_SelfAttention_v_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(20068096)))];
53
+ tensor<fp32, [256, 384]> decoder_block_3_layer_0_SelfAttention_o_weight = const()[name = tensor<string, []>("decoder_block_3_layer_0_SelfAttention_o_weight"), val = tensor<fp32, [256, 384]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(20461376)))];
54
+ tensor<fp32, [256]> decoder_block_3_layer_1_layer_norm_weight = const()[name = tensor<string, []>("decoder_block_3_layer_1_layer_norm_weight"), val = tensor<fp32, [256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(20854656)))];
55
+ tensor<fp32, [384, 256]> decoder_block_3_layer_1_EncDecAttention_q_weight = const()[name = tensor<string, []>("decoder_block_3_layer_1_EncDecAttention_q_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(20855744)))];
56
+ tensor<fp32, [384, 256]> decoder_block_3_layer_1_EncDecAttention_k_weight = const()[name = tensor<string, []>("decoder_block_3_layer_1_EncDecAttention_k_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(21249024)))];
57
+ tensor<fp32, [384, 256]> decoder_block_3_layer_1_EncDecAttention_v_weight = const()[name = tensor<string, []>("decoder_block_3_layer_1_EncDecAttention_v_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(21642304)))];
58
+ tensor<fp32, [256, 384]> decoder_block_3_layer_1_EncDecAttention_o_weight = const()[name = tensor<string, []>("decoder_block_3_layer_1_EncDecAttention_o_weight"), val = tensor<fp32, [256, 384]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(22035584)))];
59
+ tensor<fp32, [256]> decoder_block_3_layer_2_layer_norm_weight = const()[name = tensor<string, []>("decoder_block_3_layer_2_layer_norm_weight"), val = tensor<fp32, [256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(22428864)))];
60
+ tensor<fp32, [1024, 256]> decoder_block_3_layer_2_DenseReluDense_wi_0_weight = const()[name = tensor<string, []>("decoder_block_3_layer_2_DenseReluDense_wi_0_weight"), val = tensor<fp32, [1024, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(22429952)))];
61
+ tensor<fp32, [1024, 256]> decoder_block_3_layer_2_DenseReluDense_wi_1_weight = const()[name = tensor<string, []>("decoder_block_3_layer_2_DenseReluDense_wi_1_weight"), val = tensor<fp32, [1024, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(23478592)))];
62
+ tensor<fp32, [256, 1024]> decoder_block_3_layer_2_DenseReluDense_wo_weight = const()[name = tensor<string, []>("decoder_block_3_layer_2_DenseReluDense_wo_weight"), val = tensor<fp32, [256, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(24527232)))];
63
+ tensor<fp32, [256]> decoder_final_layer_norm_weight = const()[name = tensor<string, []>("decoder_final_layer_norm_weight"), val = tensor<fp32, [256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(25575872)))];
64
+ tensor<fp32, [384, 256]> lm_head_weight = const()[name = tensor<string, []>("lm_head_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(25576960)))];
65
+ tensor<int32, []> var_8 = const()[name = tensor<string, []>("op_8"), val = tensor<int32, []>(16)];
66
+ tensor<fp32, []> var_14 = const()[name = tensor<string, []>("op_14"), val = tensor<fp32, []>(0x1p+0)];
67
+ tensor<int32, []> var_16 = const()[name = tensor<string, []>("op_16"), val = tensor<int32, []>(6)];
68
+ tensor<int32, []> var_22 = const()[name = tensor<string, []>("op_22"), val = tensor<int32, []>(-1)];
69
+ tensor<int32, []> var_23 = const()[name = tensor<string, []>("op_23"), val = tensor<int32, []>(1)];
70
+ tensor<int32, [2]> var_35_shape = shape(x = decoder_input_ids)[name = tensor<string, []>("op_35_shape")];
71
+ tensor<int32, []> gather_0 = const()[name = tensor<string, []>("gather_0"), val = tensor<int32, []>(1)];
72
+ tensor<int32, []> gather_1_batch_dims_0 = const()[name = tensor<string, []>("gather_1_batch_dims_0"), val = tensor<int32, []>(0)];
73
+ tensor<bool, []> gather_1_validate_indices_0 = const()[name = tensor<string, []>("gather_1_validate_indices_0"), val = tensor<bool, []>(false)];
74
+ tensor<int32, []> select_0 = const()[name = tensor<string, []>("select_0"), val = tensor<int32, []>(1)];
75
+ tensor<int32, []> gather_1_axis_1 = const()[name = tensor<string, []>("gather_1_axis_1"), val = tensor<int32, []>(0)];
76
+ tensor<int32, []> gather_1 = gather(axis = gather_1_axis_1, batch_dims = gather_1_batch_dims_0, indices = select_0, validate_indices = gather_1_validate_indices_0, x = var_35_shape)[name = tensor<string, []>("gather_1")];
77
+ tensor<int32, []> input_3_batch_dims_0 = const()[name = tensor<string, []>("input_3_batch_dims_0"), val = tensor<int32, []>(0)];
78
+ tensor<bool, []> input_3_validate_indices_0 = const()[name = tensor<string, []>("input_3_validate_indices_0"), val = tensor<bool, []>(false)];
79
+ tensor<int32, []> greater_equal_1_y_0 = const()[name = tensor<string, []>("greater_equal_1_y_0"), val = tensor<int32, []>(0)];
80
+ tensor<bool, [1, ?]> greater_equal_1 = greater_equal(x = decoder_input_ids, y = greater_equal_1_y_0)[name = tensor<string, []>("greater_equal_1")];
81
+ tensor<int32, []> slice_by_index_1 = const()[name = tensor<string, []>("slice_by_index_1"), val = tensor<int32, []>(384)];
82
+ tensor<int32, [1, ?]> add_1 = add(x = decoder_input_ids, y = slice_by_index_1)[name = tensor<string, []>("add_1")];
83
+ tensor<int32, [1, ?]> select_1 = select(a = decoder_input_ids, b = add_1, cond = greater_equal_1)[name = tensor<string, []>("select_1")];
84
+ tensor<int32, []> input_3_axis_1 = const()[name = tensor<string, []>("input_3_axis_1"), val = tensor<int32, []>(0)];
85
+ tensor<fp32, [1, ?, 256]> input_3 = gather(axis = input_3_axis_1, batch_dims = input_3_batch_dims_0, indices = select_1, validate_indices = input_3_validate_indices_0, x = decoder_embed_tokens_weight)[name = tensor<string, []>("input_3")];
86
+ tensor<int32, []> concat_1_axis_0 = const()[name = tensor<string, []>("concat_1_axis_0"), val = tensor<int32, []>(0)];
87
+ tensor<bool, []> concat_1_interleave_0 = const()[name = tensor<string, []>("concat_1_interleave_0"), val = tensor<bool, []>(false)];
88
+ tensor<int32, [2]> concat_1 = concat(axis = concat_1_axis_0, interleave = concat_1_interleave_0, values = (gather_0, gather_1))[name = tensor<string, []>("concat_1")];
89
+ tensor<fp32, []> fill_0_value_0 = const()[name = tensor<string, []>("fill_0_value_0"), val = tensor<fp32, []>(0x1p+0)];
90
+ tensor<fp32, [1, ?]> fill_0 = fill(shape = concat_1, value = fill_0_value_0)[name = tensor<string, []>("fill_0")];
91
+ tensor<int32, []> const_0 = const()[name = tensor<string, []>("const_0"), val = tensor<int32, []>(0)];
92
+ tensor<int32, []> const_1 = const()[name = tensor<string, []>("const_1"), val = tensor<int32, []>(1)];
93
+ tensor<int32, [?]> seq_ids = range_1d(end = gather_1, start = const_0, step = const_1)[name = tensor<string, []>("seq_ids")];
94
+ tensor<int32, [1]> var_44_axes_0 = const()[name = tensor<string, []>("op_44_axes_0"), val = tensor<int32, [1]>([0])];
95
+ tensor<int32, [1, ?]> var_44 = expand_dims(axes = var_44_axes_0, x = seq_ids)[name = tensor<string, []>("op_44")];
96
+ tensor<int32, [1]> var_45_axes_0 = const()[name = tensor<string, []>("op_45_axes_0"), val = tensor<int32, [1]>([1])];
97
+ tensor<int32, [1, 1, ?]> var_45 = expand_dims(axes = var_45_axes_0, x = var_44)[name = tensor<string, []>("op_45")];
98
+ tensor<int32, []> concat_2_axis_0 = const()[name = tensor<string, []>("concat_2_axis_0"), val = tensor<int32, []>(0)];
99
+ tensor<bool, []> concat_2_interleave_0 = const()[name = tensor<string, []>("concat_2_interleave_0"), val = tensor<bool, []>(false)];
100
+ tensor<int32, [3]> concat_2 = concat(axis = concat_2_axis_0, interleave = concat_2_interleave_0, values = (gather_0, gather_1, var_23))[name = tensor<string, []>("concat_2")];
101
+ tensor<int32, [1, ?, ?]> var_48 = tile(reps = concat_2, x = var_45)[name = tensor<string, []>("op_48")];
102
+ tensor<int32, [1]> var_51_axes_0 = const()[name = tensor<string, []>("op_51_axes_0"), val = tensor<int32, [1]>([2])];
103
+ tensor<int32, [1, ?, 1]> var_51 = expand_dims(axes = var_51_axes_0, x = var_44)[name = tensor<string, []>("op_51")];
104
+ tensor<bool, [1, ?, ?]> causal_mask_1 = less_equal(x = var_48, y = var_51)[name = tensor<string, []>("causal_mask_1")];
105
+ tensor<string, []> causal_mask_dtype_0 = const()[name = tensor<string, []>("causal_mask_dtype_0"), val = tensor<string, []>("fp32")];
106
+ tensor<int32, [1]> var_55_axes_0 = const()[name = tensor<string, []>("op_55_axes_0"), val = tensor<int32, [1]>([1])];
107
+ tensor<fp32, [1, ?, ?]> causal_mask = cast(dtype = causal_mask_dtype_0, x = causal_mask_1)[name = tensor<string, []>("cast_42")];
108
+ tensor<fp32, [1, 1, ?, ?]> var_55 = expand_dims(axes = var_55_axes_0, x = causal_mask)[name = tensor<string, []>("op_55")];
109
+ tensor<int32, [1]> var_59_axes_0 = const()[name = tensor<string, []>("op_59_axes_0"), val = tensor<int32, [1]>([1])];
110
+ tensor<fp32, [1, 1, ?]> var_59 = expand_dims(axes = var_59_axes_0, x = fill_0)[name = tensor<string, []>("op_59")];
111
+ tensor<int32, [1]> var_60_axes_0 = const()[name = tensor<string, []>("op_60_axes_0"), val = tensor<int32, [1]>([2])];
112
+ tensor<fp32, [1, 1, 1, ?]> var_60 = expand_dims(axes = var_60_axes_0, x = var_59)[name = tensor<string, []>("op_60")];
113
+ tensor<fp32, [1, 1, ?, ?]> extended_attention_mask = mul(x = var_55, y = var_60)[name = tensor<string, []>("extended_attention_mask")];
114
+ tensor<fp32, [1, 1, ?, ?]> var_64 = sub(x = var_14, y = extended_attention_mask)[name = tensor<string, []>("op_64")];
115
+ tensor<fp32, []> var_65 = const()[name = tensor<string, []>("op_65"), val = tensor<fp32, []>(-0x1.fffffep+127)];
116
+ tensor<fp32, [1, 1, ?, ?]> mask_1 = mul(x = var_64, y = var_65)[name = tensor<string, []>("mask_1")];
117
+ tensor<int32, [1]> var_68_axes_0 = const()[name = tensor<string, []>("op_68_axes_0"), val = tensor<int32, [1]>([1])];
118
+ tensor<int32, [1, 1, ?]> var_68 = expand_dims(axes = var_68_axes_0, x = encoder_attention_mask)[name = tensor<string, []>("op_68")];
119
+ tensor<int32, [1]> var_69_axes_0 = const()[name = tensor<string, []>("op_69_axes_0"), val = tensor<int32, [1]>([2])];
120
+ tensor<int32, [1, 1, 1, ?]> var_69 = expand_dims(axes = var_69_axes_0, x = var_68)[name = tensor<string, []>("op_69")];
121
+ tensor<string, []> var_71_dtype_0 = const()[name = tensor<string, []>("op_71_dtype_0"), val = tensor<string, []>("fp32")];
122
+ tensor<fp32, [1, 1, 1, ?]> var_71 = cast(dtype = var_71_dtype_0, x = var_69)[name = tensor<string, []>("cast_41")];
123
+ tensor<fp32, [1, 1, 1, ?]> var_72 = sub(x = var_14, y = var_71)[name = tensor<string, []>("op_72")];
124
+ tensor<fp32, []> var_73 = const()[name = tensor<string, []>("op_73"), val = tensor<fp32, []>(-0x1.fffffep+127)];
125
+ tensor<fp32, [1, 1, 1, ?]> mask = mul(x = var_72, y = var_73)[name = tensor<string, []>("mask")];
126
+ tensor<fp32, []> var_18_promoted = const()[name = tensor<string, []>("op_18_promoted"), val = tensor<fp32, []>(0x1p+1)];
127
+ tensor<fp32, [1, ?, 256]> var_86 = pow(x = input_3, y = var_18_promoted)[name = tensor<string, []>("op_86")];
128
+ tensor<int32, [1]> variance_1_axes_0 = const()[name = tensor<string, []>("variance_1_axes_0"), val = tensor<int32, [1]>([-1])];
129
+ tensor<bool, []> variance_1_keep_dims_0 = const()[name = tensor<string, []>("variance_1_keep_dims_0"), val = tensor<bool, []>(true)];
130
+ tensor<fp32, [1, ?, 1]> variance_1 = reduce_mean(axes = variance_1_axes_0, keep_dims = variance_1_keep_dims_0, x = var_86)[name = tensor<string, []>("variance_1")];
131
+ tensor<fp32, []> var_89 = const()[name = tensor<string, []>("op_89"), val = tensor<fp32, []>(0x1.0c6f7ap-20)];
132
+ tensor<fp32, [1, ?, 1]> var_90 = add(x = variance_1, y = var_89)[name = tensor<string, []>("op_90")];
133
+ tensor<fp32, []> var_91_epsilon_0 = const()[name = tensor<string, []>("op_91_epsilon_0"), val = tensor<fp32, []>(0x1.197998p-40)];
134
+ tensor<fp32, [1, ?, 1]> var_91 = rsqrt(epsilon = var_91_epsilon_0, x = var_90)[name = tensor<string, []>("op_91")];
135
+ tensor<fp32, [1, ?, 256]> hidden_states_5 = mul(x = input_3, y = var_91)[name = tensor<string, []>("hidden_states_5")];
136
+ tensor<fp32, [1, ?, 256]> hidden_states_7 = mul(x = decoder_block_0_layer_0_layer_norm_weight, y = hidden_states_5)[name = tensor<string, []>("hidden_states_7")];
137
+ tensor<int32, [3]> var_103_shape = shape(x = hidden_states_7)[name = tensor<string, []>("op_103_shape")];
138
+ tensor<int32, []> gather_3_batch_dims_0 = const()[name = tensor<string, []>("gather_3_batch_dims_0"), val = tensor<int32, []>(0)];
139
+ tensor<bool, []> gather_3_validate_indices_0 = const()[name = tensor<string, []>("gather_3_validate_indices_0"), val = tensor<bool, []>(false)];
140
+ tensor<int32, []> select_2 = const()[name = tensor<string, []>("select_2"), val = tensor<int32, []>(1)];
141
+ tensor<int32, []> gather_3_axis_1 = const()[name = tensor<string, []>("gather_3_axis_1"), val = tensor<int32, []>(0)];
142
+ tensor<int32, []> gather_3 = gather(axis = gather_3_axis_1, batch_dims = gather_3_batch_dims_0, indices = select_2, validate_indices = gather_3_validate_indices_0, x = var_103_shape)[name = tensor<string, []>("gather_3")];
143
+ tensor<fp32, [384]> linear_0_bias_0 = const()[name = tensor<string, []>("linear_0_bias_0"), val = tensor<fp32, [384]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(25970240)))];
144
+ tensor<fp32, [1, ?, 384]> states_1 = linear(bias = linear_0_bias_0, weight = decoder_block_0_layer_0_SelfAttention_q_weight, x = hidden_states_7)[name = tensor<string, []>("linear_0")];
145
+ tensor<int32, [4]> var_106 = const()[name = tensor<string, []>("op_106"), val = tensor<int32, [4]>([1, -1, 6, 64])];
146
+ tensor<fp32, [1, ?, 6, 64]> var_107 = reshape(shape = var_106, x = states_1)[name = tensor<string, []>("op_107")];
147
+ tensor<fp32, [1, ?, 384]> states_3 = linear(bias = linear_0_bias_0, weight = decoder_block_0_layer_0_SelfAttention_k_weight, x = hidden_states_7)[name = tensor<string, []>("linear_1")];
148
+ tensor<int32, [4]> var_111 = const()[name = tensor<string, []>("op_111"), val = tensor<int32, [4]>([1, -1, 6, 64])];
149
+ tensor<fp32, [1, ?, 6, 64]> var_112 = reshape(shape = var_111, x = states_3)[name = tensor<string, []>("op_112")];
150
+ tensor<fp32, [1, ?, 384]> states_5 = linear(bias = linear_0_bias_0, weight = decoder_block_0_layer_0_SelfAttention_v_weight, x = hidden_states_7)[name = tensor<string, []>("linear_2")];
151
+ tensor<int32, [4]> var_116 = const()[name = tensor<string, []>("op_116"), val = tensor<int32, [4]>([1, -1, 6, 64])];
152
+ tensor<fp32, [1, ?, 6, 64]> var_117 = reshape(shape = var_116, x = states_5)[name = tensor<string, []>("op_117")];
153
+ tensor<int32, [4]> value_states_1_perm_0 = const()[name = tensor<string, []>("value_states_1_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])];
154
+ tensor<bool, []> scores_1_transpose_x_0 = const()[name = tensor<string, []>("scores_1_transpose_x_0"), val = tensor<bool, []>(false)];
155
+ tensor<bool, []> scores_1_transpose_y_0 = const()[name = tensor<string, []>("scores_1_transpose_y_0"), val = tensor<bool, []>(false)];
156
+ tensor<int32, [4]> transpose_24_perm_0 = const()[name = tensor<string, []>("transpose_24_perm_0"), val = tensor<int32, [4]>([0, 2, -3, -1])];
157
+ tensor<int32, [4]> transpose_25_perm_0 = const()[name = tensor<string, []>("transpose_25_perm_0"), val = tensor<int32, [4]>([0, 2, -1, -3])];
158
+ tensor<fp32, [1, 6, 64, ?]> transpose_25 = transpose(perm = transpose_25_perm_0, x = var_112)[name = tensor<string, []>("transpose_70")];
159
+ tensor<fp32, [1, 6, ?, 64]> transpose_24 = transpose(perm = transpose_24_perm_0, x = var_107)[name = tensor<string, []>("transpose_71")];
160
+ tensor<fp32, [1, 6, ?, ?]> scores_1 = matmul(transpose_x = scores_1_transpose_x_0, transpose_y = scores_1_transpose_y_0, x = transpose_24, y = transpose_25)[name = tensor<string, []>("scores_1")];
161
+ tensor<int32, []> const_2 = const()[name = tensor<string, []>("const_2"), val = tensor<int32, []>(0)];
162
+ tensor<int32, []> const_3 = const()[name = tensor<string, []>("const_3"), val = tensor<int32, []>(1)];
163
+ tensor<int32, [?]> var_121 = range_1d(end = gather_3, start = const_2, step = const_3)[name = tensor<string, []>("op_121")];
164
+ tensor<int32, [1]> context_position_axes_0 = const()[name = tensor<string, []>("context_position_axes_0"), val = tensor<int32, [1]>([1])];
165
+ tensor<int32, [?, 1]> context_position = expand_dims(axes = context_position_axes_0, x = var_121)[name = tensor<string, []>("context_position")];
166
+ tensor<int32, [1]> var_125_axes_0 = const()[name = tensor<string, []>("op_125_axes_0"), val = tensor<int32, [1]>([0])];
167
+ tensor<int32, [1, ?]> var_125 = expand_dims(axes = var_125_axes_0, x = var_121)[name = tensor<string, []>("op_125")];
168
+ tensor<int32, [?, ?]> relative_position_1 = sub(x = var_125, y = context_position)[name = tensor<string, []>("relative_position_1")];
169
+ tensor<int32, [?, ?]> var_128 = sub(x = relative_position_1, y = relative_position_1)[name = tensor<string, []>("sub_0")];
170
+ tensor<int32, [?, ?]> var_129 = minimum(x = relative_position_1, y = var_128)[name = tensor<string, []>("op_129")];
171
+ tensor<int32, []> const_6 = const()[name = tensor<string, []>("const_6"), val = tensor<int32, []>(-1)];
172
+ tensor<int32, [?, ?]> relative_position = mul(x = var_129, y = const_6)[name = tensor<string, []>("relative_position")];
173
+ tensor<bool, [?, ?]> is_small = less(x = relative_position, y = var_8)[name = tensor<string, []>("is_small")];
174
+ tensor<string, []> var_132_dtype_0 = const()[name = tensor<string, []>("op_132_dtype_0"), val = tensor<string, []>("fp32")];
175
+ tensor<fp32, []> _inversed_134_y_0 = const()[name = tensor<string, []>("_inversed_134_y_0"), val = tensor<fp32, []>(0x1p-4)];
176
+ tensor<fp32, [?, ?]> var_132 = cast(dtype = var_132_dtype_0, x = relative_position)[name = tensor<string, []>("cast_40")];
177
+ tensor<fp32, [?, ?]> _inversed_134 = mul(x = var_132, y = _inversed_134_y_0)[name = tensor<string, []>("_inversed_134")];
178
+ tensor<fp32, []> var_135_epsilon_0 = const()[name = tensor<string, []>("op_135_epsilon_0"), val = tensor<fp32, []>(0x1p-149)];
179
+ tensor<fp32, [?, ?]> var_135 = log(epsilon = var_135_epsilon_0, x = _inversed_134)[name = tensor<string, []>("op_135")];
180
+ tensor<fp32, []> _inversed_137_y_0 = const()[name = tensor<string, []>("_inversed_137_y_0"), val = tensor<fp32, []>(0x1.ec709ep-2)];
181
+ tensor<fp32, [?, ?]> _inversed_137 = mul(x = var_135, y = _inversed_137_y_0)[name = tensor<string, []>("_inversed_137")];
182
+ tensor<fp32, []> var_138_promoted = const()[name = tensor<string, []>("op_138_promoted"), val = tensor<fp32, []>(0x1p+4)];
183
+ tensor<fp32, [?, ?]> var_139 = mul(x = _inversed_137, y = var_138_promoted)[name = tensor<string, []>("op_139")];
184
+ tensor<string, []> var_140_dtype_0 = const()[name = tensor<string, []>("op_140_dtype_0"), val = tensor<string, []>("int32")];
185
+ tensor<int32, []> var_141 = const()[name = tensor<string, []>("op_141"), val = tensor<int32, []>(16)];
186
+ tensor<int32, [?, ?]> var_140 = cast(dtype = var_140_dtype_0, x = var_139)[name = tensor<string, []>("cast_39")];
187
+ tensor<int32, [?, ?]> relative_position_if_large_1 = add(x = var_140, y = var_141)[name = tensor<string, []>("relative_position_if_large_1")];
188
+ tensor<int32, []> var_143_value_0 = const()[name = tensor<string, []>("op_143_value_0"), val = tensor<int32, []>(31)];
189
+ tensor<int32, [?, ?]> var_143 = fill_like(ref_tensor = relative_position_if_large_1, value = var_143_value_0)[name = tensor<string, []>("op_143")];
190
+ tensor<int32, [?, ?]> relative_position_if_large = minimum(x = relative_position_if_large_1, y = var_143)[name = tensor<string, []>("relative_position_if_large")];
191
+ tensor<int32, [?, ?]> var_145 = select(a = relative_position, b = relative_position_if_large, cond = is_small)[name = tensor<string, []>("op_145")];
192
+ tensor<int32, []> values_batch_dims_0 = const()[name = tensor<string, []>("values_batch_dims_0"), val = tensor<int32, []>(0)];
193
+ tensor<bool, []> values_validate_indices_0 = const()[name = tensor<string, []>("values_validate_indices_0"), val = tensor<bool, []>(false)];
194
+ tensor<int32, []> greater_equal_3_y_0 = const()[name = tensor<string, []>("greater_equal_3_y_0"), val = tensor<int32, []>(0)];
195
+ tensor<bool, [?, ?]> greater_equal_3 = greater_equal(x = var_145, y = greater_equal_3_y_0)[name = tensor<string, []>("greater_equal_3")];
196
+ tensor<int32, []> slice_by_index_3 = const()[name = tensor<string, []>("slice_by_index_3"), val = tensor<int32, []>(32)];
197
+ tensor<int32, [?, ?]> add_3 = add(x = var_145, y = slice_by_index_3)[name = tensor<string, []>("add_3")];
198
+ tensor<int32, [?, ?]> select_3 = select(a = var_145, b = add_3, cond = greater_equal_3)[name = tensor<string, []>("select_3")];
199
+ tensor<int32, []> values_axis_1 = const()[name = tensor<string, []>("values_axis_1"), val = tensor<int32, []>(0)];
200
+ tensor<fp32, [?, ?, 6]> values = gather(axis = values_axis_1, batch_dims = values_batch_dims_0, indices = select_3, validate_indices = values_validate_indices_0, x = decoder_block_0_layer_0_SelfAttention_relative_attention_bias_weight)[name = tensor<string, []>("values")];
201
+ tensor<int32, [3]> var_150 = const()[name = tensor<string, []>("op_150"), val = tensor<int32, [3]>([2, 0, 1])];
202
+ tensor<int32, [1]> position_bias_1_axes_0 = const()[name = tensor<string, []>("position_bias_1_axes_0"), val = tensor<int32, [1]>([0])];
203
+ tensor<fp32, [6, ?, ?]> var_151 = transpose(perm = var_150, x = values)[name = tensor<string, []>("transpose_69")];
204
+ tensor<fp32, [1, 6, ?, ?]> position_bias_1 = expand_dims(axes = position_bias_1_axes_0, x = var_151)[name = tensor<string, []>("position_bias_1")];
205
+ tensor<fp32, [1, 6, ?, ?]> position_bias_3 = add(x = position_bias_1, y = mask_1)[name = tensor<string, []>("position_bias_3")];
206
+ tensor<fp32, [1, 6, ?, ?]> scores_3 = add(x = scores_1, y = position_bias_3)[name = tensor<string, []>("scores_3")];
207
+ tensor<fp32, [1, 6, ?, ?]> var_156 = softmax(axis = var_22, x = scores_3)[name = tensor<string, []>("op_156")];
208
+ tensor<bool, []> states_7_transpose_x_0 = const()[name = tensor<string, []>("states_7_transpose_x_0"), val = tensor<bool, []>(false)];
209
+ tensor<bool, []> states_7_transpose_y_0 = const()[name = tensor<string, []>("states_7_transpose_y_0"), val = tensor<bool, []>(false)];
210
+ tensor<fp32, [1, 6, ?, 64]> value_states_1 = transpose(perm = value_states_1_perm_0, x = var_117)[name = tensor<string, []>("transpose_72")];
211
+ tensor<fp32, [1, 6, ?, 64]> states_7 = matmul(transpose_x = states_7_transpose_x_0, transpose_y = states_7_transpose_y_0, x = var_156, y = value_states_1)[name = tensor<string, []>("states_7")];
212
+ tensor<int32, [4]> var_160_perm_0 = const()[name = tensor<string, []>("op_160_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])];
213
+ tensor<int32, [3]> var_162 = const()[name = tensor<string, []>("op_162"), val = tensor<int32, [3]>([1, -1, 384])];
214
+ tensor<fp32, [1, ?, 6, 64]> var_160 = transpose(perm = var_160_perm_0, x = states_7)[name = tensor<string, []>("transpose_68")];
215
+ tensor<fp32, [1, ?, 384]> input_11 = reshape(shape = var_162, x = var_160)[name = tensor<string, []>("input_11")];
216
+ tensor<fp32, [256]> linear_3_bias_0 = const()[name = tensor<string, []>("linear_3_bias_0"), val = tensor<fp32, [256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(25971840)))];
217
+ tensor<fp32, [1, ?, 256]> input_13 = linear(bias = linear_3_bias_0, weight = decoder_block_0_layer_0_SelfAttention_o_weight, x = input_11)[name = tensor<string, []>("linear_3")];
218
+ tensor<fp32, [1, ?, 256]> hidden_states_9 = add(x = input_3, y = input_13)[name = tensor<string, []>("hidden_states_9")];
219
+ tensor<fp32, []> var_18_promoted_1 = const()[name = tensor<string, []>("op_18_promoted_1"), val = tensor<fp32, []>(0x1p+1)];
220
+ tensor<fp32, [1, ?, 256]> var_180 = pow(x = hidden_states_9, y = var_18_promoted_1)[name = tensor<string, []>("op_180")];
221
+ tensor<int32, [1]> variance_3_axes_0 = const()[name = tensor<string, []>("variance_3_axes_0"), val = tensor<int32, [1]>([-1])];
222
+ tensor<bool, []> variance_3_keep_dims_0 = const()[name = tensor<string, []>("variance_3_keep_dims_0"), val = tensor<bool, []>(true)];
223
+ tensor<fp32, [1, ?, 1]> variance_3 = reduce_mean(axes = variance_3_axes_0, keep_dims = variance_3_keep_dims_0, x = var_180)[name = tensor<string, []>("variance_3")];
224
+ tensor<fp32, []> var_183 = const()[name = tensor<string, []>("op_183"), val = tensor<fp32, []>(0x1.0c6f7ap-20)];
225
+ tensor<fp32, [1, ?, 1]> var_184 = add(x = variance_3, y = var_183)[name = tensor<string, []>("op_184")];
226
+ tensor<fp32, []> var_185_epsilon_0 = const()[name = tensor<string, []>("op_185_epsilon_0"), val = tensor<fp32, []>(0x1.197998p-40)];
227
+ tensor<fp32, [1, ?, 1]> var_185 = rsqrt(epsilon = var_185_epsilon_0, x = var_184)[name = tensor<string, []>("op_185")];
228
+ tensor<fp32, [1, ?, 256]> hidden_states_13 = mul(x = hidden_states_9, y = var_185)[name = tensor<string, []>("hidden_states_13")];
229
+ tensor<fp32, [1, ?, 256]> hidden_states_15 = mul(x = decoder_block_0_layer_1_layer_norm_weight, y = hidden_states_13)[name = tensor<string, []>("hidden_states_15")];
230
+ tensor<int32, [3]> var_196_shape = shape(x = hidden_states_15)[name = tensor<string, []>("op_196_shape")];
231
+ tensor<int32, []> gather_5_batch_dims_0 = const()[name = tensor<string, []>("gather_5_batch_dims_0"), val = tensor<int32, []>(0)];
232
+ tensor<bool, []> gather_5_validate_indices_0 = const()[name = tensor<string, []>("gather_5_validate_indices_0"), val = tensor<bool, []>(false)];
233
+ tensor<int32, []> select_4 = const()[name = tensor<string, []>("select_4"), val = tensor<int32, []>(1)];
234
+ tensor<int32, []> gather_5_axis_1 = const()[name = tensor<string, []>("gather_5_axis_1"), val = tensor<int32, []>(0)];
235
+ tensor<int32, []> gather_5 = gather(axis = gather_5_axis_1, batch_dims = gather_5_batch_dims_0, indices = select_4, validate_indices = gather_5_validate_indices_0, x = var_196_shape)[name = tensor<string, []>("gather_5")];
236
+ tensor<int32, [3]> var_197_shape = shape(x = encoder_hidden_states)[name = tensor<string, []>("op_197_shape")];
237
+ tensor<int32, []> gather_6_batch_dims_0 = const()[name = tensor<string, []>("gather_6_batch_dims_0"), val = tensor<int32, []>(0)];
238
+ tensor<bool, []> gather_6_validate_indices_0 = const()[name = tensor<string, []>("gather_6_validate_indices_0"), val = tensor<bool, []>(false)];
239
+ tensor<int32, []> select_5 = const()[name = tensor<string, []>("select_5"), val = tensor<int32, []>(1)];
240
+ tensor<int32, []> gather_6_axis_1 = const()[name = tensor<string, []>("gather_6_axis_1"), val = tensor<int32, []>(0)];
241
+ tensor<int32, []> gather_6 = gather(axis = gather_6_axis_1, batch_dims = gather_6_batch_dims_0, indices = select_5, validate_indices = gather_6_validate_indices_0, x = var_197_shape)[name = tensor<string, []>("gather_6")];
242
+ tensor<fp32, [1, ?, 384]> states_9 = linear(bias = linear_0_bias_0, weight = decoder_block_0_layer_1_EncDecAttention_q_weight, x = hidden_states_15)[name = tensor<string, []>("linear_4")];
243
+ tensor<int32, [4]> var_200 = const()[name = tensor<string, []>("op_200"), val = tensor<int32, [4]>([1, -1, 6, 64])];
244
+ tensor<fp32, [1, ?, 6, 64]> var_201 = reshape(shape = var_200, x = states_9)[name = tensor<string, []>("op_201")];
245
+ tensor<fp32, [1, ?, 384]> states_11 = linear(bias = linear_0_bias_0, weight = decoder_block_0_layer_1_EncDecAttention_k_weight, x = encoder_hidden_states)[name = tensor<string, []>("linear_5")];
246
+ tensor<int32, [4]> var_205 = const()[name = tensor<string, []>("op_205"), val = tensor<int32, [4]>([1, -1, 6, 64])];
247
+ tensor<fp32, [1, ?, 6, 64]> var_206 = reshape(shape = var_205, x = states_11)[name = tensor<string, []>("op_206")];
248
+ tensor<fp32, [1, ?, 384]> states_13 = linear(bias = linear_0_bias_0, weight = decoder_block_0_layer_1_EncDecAttention_v_weight, x = encoder_hidden_states)[name = tensor<string, []>("linear_6")];
249
+ tensor<int32, [4]> var_210 = const()[name = tensor<string, []>("op_210"), val = tensor<int32, [4]>([1, -1, 6, 64])];
250
+ tensor<fp32, [1, ?, 6, 64]> var_211 = reshape(shape = var_210, x = states_13)[name = tensor<string, []>("op_211")];
251
+ tensor<int32, [4]> value_states_3_perm_0 = const()[name = tensor<string, []>("value_states_3_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])];
252
+ tensor<bool, []> scores_5_transpose_x_0 = const()[name = tensor<string, []>("scores_5_transpose_x_0"), val = tensor<bool, []>(false)];
253
+ tensor<bool, []> scores_5_transpose_y_0 = const()[name = tensor<string, []>("scores_5_transpose_y_0"), val = tensor<bool, []>(false)];
254
+ tensor<int32, [4]> transpose_26_perm_0 = const()[name = tensor<string, []>("transpose_26_perm_0"), val = tensor<int32, [4]>([0, 2, -3, -1])];
255
+ tensor<int32, [4]> transpose_27_perm_0 = const()[name = tensor<string, []>("transpose_27_perm_0"), val = tensor<int32, [4]>([0, 2, -1, -3])];
256
+ tensor<fp32, [1, 6, 64, ?]> transpose_27 = transpose(perm = transpose_27_perm_0, x = var_206)[name = tensor<string, []>("transpose_65")];
257
+ tensor<fp32, [1, 6, ?, 64]> transpose_26 = transpose(perm = transpose_26_perm_0, x = var_201)[name = tensor<string, []>("transpose_66")];
258
+ tensor<fp32, [1, 6, ?, ?]> scores_5 = matmul(transpose_x = scores_5_transpose_x_0, transpose_y = scores_5_transpose_y_0, x = transpose_26, y = transpose_27)[name = tensor<string, []>("scores_5")];
259
+ tensor<int32, []> concat_3_axis_0 = const()[name = tensor<string, []>("concat_3_axis_0"), val = tensor<int32, []>(0)];
260
+ tensor<bool, []> concat_3_interleave_0 = const()[name = tensor<string, []>("concat_3_interleave_0"), val = tensor<bool, []>(false)];
261
+ tensor<int32, [4]> concat_3 = concat(axis = concat_3_axis_0, interleave = concat_3_interleave_0, values = (var_23, var_16, gather_5, gather_6))[name = tensor<string, []>("concat_3")];
262
+ tensor<fp32, []> position_bias_5_value_0 = const()[name = tensor<string, []>("position_bias_5_value_0"), val = tensor<fp32, []>(0x0p+0)];
263
+ tensor<fp32, [1, 6, ?, ?]> position_bias_5 = fill(shape = concat_3, value = position_bias_5_value_0)[name = tensor<string, []>("position_bias_5")];
264
+ tensor<fp32, [1, 6, ?, ?]> position_bias = add(x = position_bias_5, y = mask)[name = tensor<string, []>("position_bias")];
265
+ tensor<fp32, [1, 6, ?, ?]> scores_7 = add(x = scores_5, y = position_bias)[name = tensor<string, []>("scores_7")];
266
+ tensor<fp32, [1, 6, ?, ?]> var_220 = softmax(axis = var_22, x = scores_7)[name = tensor<string, []>("op_220")];
267
+ tensor<bool, []> states_15_transpose_x_0 = const()[name = tensor<string, []>("states_15_transpose_x_0"), val = tensor<bool, []>(false)];
268
+ tensor<bool, []> states_15_transpose_y_0 = const()[name = tensor<string, []>("states_15_transpose_y_0"), val = tensor<bool, []>(false)];
269
+ tensor<fp32, [1, 6, ?, 64]> value_states_3 = transpose(perm = value_states_3_perm_0, x = var_211)[name = tensor<string, []>("transpose_67")];
270
+ tensor<fp32, [1, 6, ?, 64]> states_15 = matmul(transpose_x = states_15_transpose_x_0, transpose_y = states_15_transpose_y_0, x = var_220, y = value_states_3)[name = tensor<string, []>("states_15")];
271
+ tensor<int32, [4]> var_224_perm_0 = const()[name = tensor<string, []>("op_224_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])];
272
+ tensor<int32, [3]> var_226 = const()[name = tensor<string, []>("op_226"), val = tensor<int32, [3]>([1, -1, 384])];
273
+ tensor<fp32, [1, ?, 6, 64]> var_224 = transpose(perm = var_224_perm_0, x = states_15)[name = tensor<string, []>("transpose_64")];
274
+ tensor<fp32, [1, ?, 384]> input_19 = reshape(shape = var_226, x = var_224)[name = tensor<string, []>("input_19")];
275
+ tensor<fp32, [1, ?, 256]> input_21 = linear(bias = linear_3_bias_0, weight = decoder_block_0_layer_1_EncDecAttention_o_weight, x = input_19)[name = tensor<string, []>("linear_7")];
276
+ tensor<fp32, [1, ?, 256]> hidden_states_17 = add(x = hidden_states_9, y = input_21)[name = tensor<string, []>("hidden_states_17")];
277
+ tensor<fp32, []> var_18_promoted_2 = const()[name = tensor<string, []>("op_18_promoted_2"), val = tensor<fp32, []>(0x1p+1)];
278
+ tensor<fp32, [1, ?, 256]> var_242 = pow(x = hidden_states_17, y = var_18_promoted_2)[name = tensor<string, []>("op_242")];
279
+ tensor<int32, [1]> variance_5_axes_0 = const()[name = tensor<string, []>("variance_5_axes_0"), val = tensor<int32, [1]>([-1])];
280
+ tensor<bool, []> variance_5_keep_dims_0 = const()[name = tensor<string, []>("variance_5_keep_dims_0"), val = tensor<bool, []>(true)];
281
+ tensor<fp32, [1, ?, 1]> variance_5 = reduce_mean(axes = variance_5_axes_0, keep_dims = variance_5_keep_dims_0, x = var_242)[name = tensor<string, []>("variance_5")];
282
+ tensor<fp32, []> var_245 = const()[name = tensor<string, []>("op_245"), val = tensor<fp32, []>(0x1.0c6f7ap-20)];
283
+ tensor<fp32, [1, ?, 1]> var_246 = add(x = variance_5, y = var_245)[name = tensor<string, []>("op_246")];
284
+ tensor<fp32, []> var_247_epsilon_0 = const()[name = tensor<string, []>("op_247_epsilon_0"), val = tensor<fp32, []>(0x1.197998p-40)];
285
+ tensor<fp32, [1, ?, 1]> var_247 = rsqrt(epsilon = var_247_epsilon_0, x = var_246)[name = tensor<string, []>("op_247")];
286
+ tensor<fp32, [1, ?, 256]> hidden_states_21 = mul(x = hidden_states_17, y = var_247)[name = tensor<string, []>("hidden_states_21")];
287
+ tensor<fp32, [1, ?, 256]> input_23 = mul(x = decoder_block_0_layer_2_layer_norm_weight, y = hidden_states_21)[name = tensor<string, []>("input_23")];
288
+ tensor<fp32, [1024]> linear_8_bias_0 = const()[name = tensor<string, []>("linear_8_bias_0"), val = tensor<fp32, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(25972928)))];
289
+ tensor<fp32, [1, ?, 1024]> input_25 = linear(bias = linear_8_bias_0, weight = decoder_block_0_layer_2_DenseReluDense_wi_0_weight, x = input_23)[name = tensor<string, []>("linear_8")];
290
+ tensor<string, []> hidden_gelu_1_mode_0 = const()[name = tensor<string, []>("hidden_gelu_1_mode_0"), val = tensor<string, []>("TANH_APPROXIMATION")];
291
+ tensor<fp32, [1, ?, 1024]> hidden_gelu_1 = gelu(mode = hidden_gelu_1_mode_0, x = input_25)[name = tensor<string, []>("hidden_gelu_1")];
292
+ tensor<fp32, [1, ?, 1024]> hidden_linear_1 = linear(bias = linear_8_bias_0, weight = decoder_block_0_layer_2_DenseReluDense_wi_1_weight, x = input_23)[name = tensor<string, []>("linear_9")];
293
+ tensor<fp32, [1, ?, 1024]> input_27 = mul(x = hidden_gelu_1, y = hidden_linear_1)[name = tensor<string, []>("input_27")];
294
+ tensor<fp32, [1, ?, 256]> input_31 = linear(bias = linear_3_bias_0, weight = decoder_block_0_layer_2_DenseReluDense_wo_weight, x = input_27)[name = tensor<string, []>("linear_10")];
295
+ tensor<fp32, [1, ?, 256]> hidden_states_23 = add(x = hidden_states_17, y = input_31)[name = tensor<string, []>("hidden_states_23")];
296
+ tensor<fp32, []> var_18_promoted_3 = const()[name = tensor<string, []>("op_18_promoted_3"), val = tensor<fp32, []>(0x1p+1)];
297
+ tensor<fp32, [1, ?, 256]> var_292 = pow(x = hidden_states_23, y = var_18_promoted_3)[name = tensor<string, []>("op_292")];
298
+ tensor<int32, [1]> variance_7_axes_0 = const()[name = tensor<string, []>("variance_7_axes_0"), val = tensor<int32, [1]>([-1])];
299
+ tensor<bool, []> variance_7_keep_dims_0 = const()[name = tensor<string, []>("variance_7_keep_dims_0"), val = tensor<bool, []>(true)];
300
+ tensor<fp32, [1, ?, 1]> variance_7 = reduce_mean(axes = variance_7_axes_0, keep_dims = variance_7_keep_dims_0, x = var_292)[name = tensor<string, []>("variance_7")];
301
+ tensor<fp32, []> var_295 = const()[name = tensor<string, []>("op_295"), val = tensor<fp32, []>(0x1.0c6f7ap-20)];
302
+ tensor<fp32, [1, ?, 1]> var_296 = add(x = variance_7, y = var_295)[name = tensor<string, []>("op_296")];
303
+ tensor<fp32, []> var_297_epsilon_0 = const()[name = tensor<string, []>("op_297_epsilon_0"), val = tensor<fp32, []>(0x1.197998p-40)];
304
+ tensor<fp32, [1, ?, 1]> var_297 = rsqrt(epsilon = var_297_epsilon_0, x = var_296)[name = tensor<string, []>("op_297")];
305
+ tensor<fp32, [1, ?, 256]> hidden_states_27 = mul(x = hidden_states_23, y = var_297)[name = tensor<string, []>("hidden_states_27")];
306
+ tensor<fp32, [1, ?, 256]> hidden_states_29 = mul(x = decoder_block_1_layer_0_layer_norm_weight, y = hidden_states_27)[name = tensor<string, []>("hidden_states_29")];
307
+ tensor<fp32, [1, ?, 384]> states_17 = linear(bias = linear_0_bias_0, weight = decoder_block_1_layer_0_SelfAttention_q_weight, x = hidden_states_29)[name = tensor<string, []>("linear_11")];
308
+ tensor<int32, [4]> var_310 = const()[name = tensor<string, []>("op_310"), val = tensor<int32, [4]>([1, -1, 6, 64])];
309
+ tensor<fp32, [1, ?, 6, 64]> var_311 = reshape(shape = var_310, x = states_17)[name = tensor<string, []>("op_311")];
310
+ tensor<fp32, [1, ?, 384]> states_19 = linear(bias = linear_0_bias_0, weight = decoder_block_1_layer_0_SelfAttention_k_weight, x = hidden_states_29)[name = tensor<string, []>("linear_12")];
311
+ tensor<int32, [4]> var_315 = const()[name = tensor<string, []>("op_315"), val = tensor<int32, [4]>([1, -1, 6, 64])];
312
+ tensor<fp32, [1, ?, 6, 64]> var_316 = reshape(shape = var_315, x = states_19)[name = tensor<string, []>("op_316")];
313
+ tensor<fp32, [1, ?, 384]> states_21 = linear(bias = linear_0_bias_0, weight = decoder_block_1_layer_0_SelfAttention_v_weight, x = hidden_states_29)[name = tensor<string, []>("linear_13")];
314
+ tensor<int32, [4]> var_320 = const()[name = tensor<string, []>("op_320"), val = tensor<int32, [4]>([1, -1, 6, 64])];
315
+ tensor<fp32, [1, ?, 6, 64]> var_321 = reshape(shape = var_320, x = states_21)[name = tensor<string, []>("op_321")];
316
+ tensor<int32, [4]> value_states_5_perm_0 = const()[name = tensor<string, []>("value_states_5_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])];
317
+ tensor<bool, []> scores_9_transpose_x_0 = const()[name = tensor<string, []>("scores_9_transpose_x_0"), val = tensor<bool, []>(false)];
318
+ tensor<bool, []> scores_9_transpose_y_0 = const()[name = tensor<string, []>("scores_9_transpose_y_0"), val = tensor<bool, []>(false)];
319
+ tensor<int32, [4]> transpose_28_perm_0 = const()[name = tensor<string, []>("transpose_28_perm_0"), val = tensor<int32, [4]>([0, 2, -3, -1])];
320
+ tensor<int32, [4]> transpose_29_perm_0 = const()[name = tensor<string, []>("transpose_29_perm_0"), val = tensor<int32, [4]>([0, 2, -1, -3])];
321
+ tensor<fp32, [1, 6, 64, ?]> transpose_29 = transpose(perm = transpose_29_perm_0, x = var_316)[name = tensor<string, []>("transpose_61")];
322
+ tensor<fp32, [1, 6, ?, 64]> transpose_28 = transpose(perm = transpose_28_perm_0, x = var_311)[name = tensor<string, []>("transpose_62")];
323
+ tensor<fp32, [1, 6, ?, ?]> scores_9 = matmul(transpose_x = scores_9_transpose_x_0, transpose_y = scores_9_transpose_y_0, x = transpose_28, y = transpose_29)[name = tensor<string, []>("scores_9")];
324
+ tensor<fp32, [1, 6, ?, ?]> scores_11 = add(x = scores_9, y = position_bias_3)[name = tensor<string, []>("scores_11")];
325
+ tensor<fp32, [1, 6, ?, ?]> var_327 = softmax(axis = var_22, x = scores_11)[name = tensor<string, []>("op_327")];
326
+ tensor<bool, []> states_23_transpose_x_0 = const()[name = tensor<string, []>("states_23_transpose_x_0"), val = tensor<bool, []>(false)];
327
+ tensor<bool, []> states_23_transpose_y_0 = const()[name = tensor<string, []>("states_23_transpose_y_0"), val = tensor<bool, []>(false)];
328
+ tensor<fp32, [1, 6, ?, 64]> value_states_5 = transpose(perm = value_states_5_perm_0, x = var_321)[name = tensor<string, []>("transpose_63")];
329
+ tensor<fp32, [1, 6, ?, 64]> states_23 = matmul(transpose_x = states_23_transpose_x_0, transpose_y = states_23_transpose_y_0, x = var_327, y = value_states_5)[name = tensor<string, []>("states_23")];
330
+ tensor<int32, [4]> var_331_perm_0 = const()[name = tensor<string, []>("op_331_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])];
331
+ tensor<int32, [3]> var_333 = const()[name = tensor<string, []>("op_333"), val = tensor<int32, [3]>([1, -1, 384])];
332
+ tensor<fp32, [1, ?, 6, 64]> var_331 = transpose(perm = var_331_perm_0, x = states_23)[name = tensor<string, []>("transpose_60")];
333
+ tensor<fp32, [1, ?, 384]> input_37 = reshape(shape = var_333, x = var_331)[name = tensor<string, []>("input_37")];
334
+ tensor<fp32, [1, ?, 256]> input_39 = linear(bias = linear_3_bias_0, weight = decoder_block_1_layer_0_SelfAttention_o_weight, x = input_37)[name = tensor<string, []>("linear_14")];
335
+ tensor<fp32, [1, ?, 256]> hidden_states_31 = add(x = hidden_states_23, y = input_39)[name = tensor<string, []>("hidden_states_31")];
336
+ tensor<fp32, []> var_18_promoted_4 = const()[name = tensor<string, []>("op_18_promoted_4"), val = tensor<fp32, []>(0x1p+1)];
337
+ tensor<fp32, [1, ?, 256]> var_349 = pow(x = hidden_states_31, y = var_18_promoted_4)[name = tensor<string, []>("op_349")];
338
+ tensor<int32, [1]> variance_9_axes_0 = const()[name = tensor<string, []>("variance_9_axes_0"), val = tensor<int32, [1]>([-1])];
339
+ tensor<bool, []> variance_9_keep_dims_0 = const()[name = tensor<string, []>("variance_9_keep_dims_0"), val = tensor<bool, []>(true)];
340
+ tensor<fp32, [1, ?, 1]> variance_9 = reduce_mean(axes = variance_9_axes_0, keep_dims = variance_9_keep_dims_0, x = var_349)[name = tensor<string, []>("variance_9")];
341
+ tensor<fp32, []> var_352 = const()[name = tensor<string, []>("op_352"), val = tensor<fp32, []>(0x1.0c6f7ap-20)];
342
+ tensor<fp32, [1, ?, 1]> var_353 = add(x = variance_9, y = var_352)[name = tensor<string, []>("op_353")];
343
+ tensor<fp32, []> var_354_epsilon_0 = const()[name = tensor<string, []>("op_354_epsilon_0"), val = tensor<fp32, []>(0x1.197998p-40)];
344
+ tensor<fp32, [1, ?, 1]> var_354 = rsqrt(epsilon = var_354_epsilon_0, x = var_353)[name = tensor<string, []>("op_354")];
345
+ tensor<fp32, [1, ?, 256]> hidden_states_35 = mul(x = hidden_states_31, y = var_354)[name = tensor<string, []>("hidden_states_35")];
346
+ tensor<fp32, [1, ?, 256]> hidden_states_37 = mul(x = decoder_block_1_layer_1_layer_norm_weight, y = hidden_states_35)[name = tensor<string, []>("hidden_states_37")];
347
+ tensor<fp32, [1, ?, 384]> states_25 = linear(bias = linear_0_bias_0, weight = decoder_block_1_layer_1_EncDecAttention_q_weight, x = hidden_states_37)[name = tensor<string, []>("linear_15")];
348
+ tensor<int32, [4]> var_367 = const()[name = tensor<string, []>("op_367"), val = tensor<int32, [4]>([1, -1, 6, 64])];
349
+ tensor<fp32, [1, ?, 6, 64]> var_368 = reshape(shape = var_367, x = states_25)[name = tensor<string, []>("op_368")];
350
+ tensor<fp32, [1, ?, 384]> states_27 = linear(bias = linear_0_bias_0, weight = decoder_block_1_layer_1_EncDecAttention_k_weight, x = encoder_hidden_states)[name = tensor<string, []>("linear_16")];
351
+ tensor<int32, [4]> var_372 = const()[name = tensor<string, []>("op_372"), val = tensor<int32, [4]>([1, -1, 6, 64])];
352
+ tensor<fp32, [1, ?, 6, 64]> var_373 = reshape(shape = var_372, x = states_27)[name = tensor<string, []>("op_373")];
353
+ tensor<fp32, [1, ?, 384]> states_29 = linear(bias = linear_0_bias_0, weight = decoder_block_1_layer_1_EncDecAttention_v_weight, x = encoder_hidden_states)[name = tensor<string, []>("linear_17")];
354
+ tensor<int32, [4]> var_377 = const()[name = tensor<string, []>("op_377"), val = tensor<int32, [4]>([1, -1, 6, 64])];
355
+ tensor<fp32, [1, ?, 6, 64]> var_378 = reshape(shape = var_377, x = states_29)[name = tensor<string, []>("op_378")];
356
+ tensor<int32, [4]> value_states_7_perm_0 = const()[name = tensor<string, []>("value_states_7_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])];
357
+ tensor<bool, []> scores_13_transpose_x_0 = const()[name = tensor<string, []>("scores_13_transpose_x_0"), val = tensor<bool, []>(false)];
358
+ tensor<bool, []> scores_13_transpose_y_0 = const()[name = tensor<string, []>("scores_13_transpose_y_0"), val = tensor<bool, []>(false)];
359
+ tensor<int32, [4]> transpose_30_perm_0 = const()[name = tensor<string, []>("transpose_30_perm_0"), val = tensor<int32, [4]>([0, 2, -3, -1])];
360
+ tensor<int32, [4]> transpose_31_perm_0 = const()[name = tensor<string, []>("transpose_31_perm_0"), val = tensor<int32, [4]>([0, 2, -1, -3])];
361
+ tensor<fp32, [1, 6, 64, ?]> transpose_31 = transpose(perm = transpose_31_perm_0, x = var_373)[name = tensor<string, []>("transpose_57")];
362
+ tensor<fp32, [1, 6, ?, 64]> transpose_30 = transpose(perm = transpose_30_perm_0, x = var_368)[name = tensor<string, []>("transpose_58")];
363
+ tensor<fp32, [1, 6, ?, ?]> scores_13 = matmul(transpose_x = scores_13_transpose_x_0, transpose_y = scores_13_transpose_y_0, x = transpose_30, y = transpose_31)[name = tensor<string, []>("scores_13")];
364
+ tensor<fp32, [1, 6, ?, ?]> scores_15 = add(x = scores_13, y = position_bias)[name = tensor<string, []>("scores_15")];
365
+ tensor<fp32, [1, 6, ?, ?]> var_384 = softmax(axis = var_22, x = scores_15)[name = tensor<string, []>("op_384")];
366
+ tensor<bool, []> states_31_transpose_x_0 = const()[name = tensor<string, []>("states_31_transpose_x_0"), val = tensor<bool, []>(false)];
367
+ tensor<bool, []> states_31_transpose_y_0 = const()[name = tensor<string, []>("states_31_transpose_y_0"), val = tensor<bool, []>(false)];
368
+ tensor<fp32, [1, 6, ?, 64]> value_states_7 = transpose(perm = value_states_7_perm_0, x = var_378)[name = tensor<string, []>("transpose_59")];
369
+ tensor<fp32, [1, 6, ?, 64]> states_31 = matmul(transpose_x = states_31_transpose_x_0, transpose_y = states_31_transpose_y_0, x = var_384, y = value_states_7)[name = tensor<string, []>("states_31")];
370
+ tensor<int32, [4]> var_388_perm_0 = const()[name = tensor<string, []>("op_388_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])];
371
+ tensor<int32, [3]> var_390 = const()[name = tensor<string, []>("op_390"), val = tensor<int32, [3]>([1, -1, 384])];
372
+ tensor<fp32, [1, ?, 6, 64]> var_388 = transpose(perm = var_388_perm_0, x = states_31)[name = tensor<string, []>("transpose_56")];
373
+ tensor<fp32, [1, ?, 384]> input_45 = reshape(shape = var_390, x = var_388)[name = tensor<string, []>("input_45")];
374
+ tensor<fp32, [1, ?, 256]> input_47 = linear(bias = linear_3_bias_0, weight = decoder_block_1_layer_1_EncDecAttention_o_weight, x = input_45)[name = tensor<string, []>("linear_18")];
375
+ tensor<fp32, [1, ?, 256]> hidden_states_39 = add(x = hidden_states_31, y = input_47)[name = tensor<string, []>("hidden_states_39")];
376
+ tensor<fp32, []> var_18_promoted_5 = const()[name = tensor<string, []>("op_18_promoted_5"), val = tensor<fp32, []>(0x1p+1)];
377
+ tensor<fp32, [1, ?, 256]> var_400 = pow(x = hidden_states_39, y = var_18_promoted_5)[name = tensor<string, []>("op_400")];
378
+ tensor<int32, [1]> variance_11_axes_0 = const()[name = tensor<string, []>("variance_11_axes_0"), val = tensor<int32, [1]>([-1])];
379
+ tensor<bool, []> variance_11_keep_dims_0 = const()[name = tensor<string, []>("variance_11_keep_dims_0"), val = tensor<bool, []>(true)];
380
+ tensor<fp32, [1, ?, 1]> variance_11 = reduce_mean(axes = variance_11_axes_0, keep_dims = variance_11_keep_dims_0, x = var_400)[name = tensor<string, []>("variance_11")];
381
+ tensor<fp32, []> var_403 = const()[name = tensor<string, []>("op_403"), val = tensor<fp32, []>(0x1.0c6f7ap-20)];
382
+ tensor<fp32, [1, ?, 1]> var_404 = add(x = variance_11, y = var_403)[name = tensor<string, []>("op_404")];
383
+ tensor<fp32, []> var_405_epsilon_0 = const()[name = tensor<string, []>("op_405_epsilon_0"), val = tensor<fp32, []>(0x1.197998p-40)];
384
+ tensor<fp32, [1, ?, 1]> var_405 = rsqrt(epsilon = var_405_epsilon_0, x = var_404)[name = tensor<string, []>("op_405")];
385
+ tensor<fp32, [1, ?, 256]> hidden_states_43 = mul(x = hidden_states_39, y = var_405)[name = tensor<string, []>("hidden_states_43")];
386
+ tensor<fp32, [1, ?, 256]> input_49 = mul(x = decoder_block_1_layer_2_layer_norm_weight, y = hidden_states_43)[name = tensor<string, []>("input_49")];
387
+ tensor<fp32, [1, ?, 1024]> input_51 = linear(bias = linear_8_bias_0, weight = decoder_block_1_layer_2_DenseReluDense_wi_0_weight, x = input_49)[name = tensor<string, []>("linear_19")];
388
+ tensor<string, []> hidden_gelu_3_mode_0 = const()[name = tensor<string, []>("hidden_gelu_3_mode_0"), val = tensor<string, []>("TANH_APPROXIMATION")];
389
+ tensor<fp32, [1, ?, 1024]> hidden_gelu_3 = gelu(mode = hidden_gelu_3_mode_0, x = input_51)[name = tensor<string, []>("hidden_gelu_3")];
390
+ tensor<fp32, [1, ?, 1024]> hidden_linear_3 = linear(bias = linear_8_bias_0, weight = decoder_block_1_layer_2_DenseReluDense_wi_1_weight, x = input_49)[name = tensor<string, []>("linear_20")];
391
+ tensor<fp32, [1, ?, 1024]> input_53 = mul(x = hidden_gelu_3, y = hidden_linear_3)[name = tensor<string, []>("input_53")];
392
+ tensor<fp32, [1, ?, 256]> input_57 = linear(bias = linear_3_bias_0, weight = decoder_block_1_layer_2_DenseReluDense_wo_weight, x = input_53)[name = tensor<string, []>("linear_21")];
393
+ tensor<fp32, [1, ?, 256]> hidden_states_45 = add(x = hidden_states_39, y = input_57)[name = tensor<string, []>("hidden_states_45")];
394
+ tensor<fp32, []> var_18_promoted_6 = const()[name = tensor<string, []>("op_18_promoted_6"), val = tensor<fp32, []>(0x1p+1)];
395
+ tensor<fp32, [1, ?, 256]> var_446 = pow(x = hidden_states_45, y = var_18_promoted_6)[name = tensor<string, []>("op_446")];
396
+ tensor<int32, [1]> variance_13_axes_0 = const()[name = tensor<string, []>("variance_13_axes_0"), val = tensor<int32, [1]>([-1])];
397
+ tensor<bool, []> variance_13_keep_dims_0 = const()[name = tensor<string, []>("variance_13_keep_dims_0"), val = tensor<bool, []>(true)];
398
+ tensor<fp32, [1, ?, 1]> variance_13 = reduce_mean(axes = variance_13_axes_0, keep_dims = variance_13_keep_dims_0, x = var_446)[name = tensor<string, []>("variance_13")];
399
+ tensor<fp32, []> var_449 = const()[name = tensor<string, []>("op_449"), val = tensor<fp32, []>(0x1.0c6f7ap-20)];
400
+ tensor<fp32, [1, ?, 1]> var_450 = add(x = variance_13, y = var_449)[name = tensor<string, []>("op_450")];
401
+ tensor<fp32, []> var_451_epsilon_0 = const()[name = tensor<string, []>("op_451_epsilon_0"), val = tensor<fp32, []>(0x1.197998p-40)];
402
+ tensor<fp32, [1, ?, 1]> var_451 = rsqrt(epsilon = var_451_epsilon_0, x = var_450)[name = tensor<string, []>("op_451")];
403
+ tensor<fp32, [1, ?, 256]> hidden_states_49 = mul(x = hidden_states_45, y = var_451)[name = tensor<string, []>("hidden_states_49")];
404
+ tensor<fp32, [1, ?, 256]> hidden_states_51 = mul(x = decoder_block_2_layer_0_layer_norm_weight, y = hidden_states_49)[name = tensor<string, []>("hidden_states_51")];
405
+ tensor<fp32, [1, ?, 384]> states_33 = linear(bias = linear_0_bias_0, weight = decoder_block_2_layer_0_SelfAttention_q_weight, x = hidden_states_51)[name = tensor<string, []>("linear_22")];
406
+ tensor<int32, [4]> var_464 = const()[name = tensor<string, []>("op_464"), val = tensor<int32, [4]>([1, -1, 6, 64])];
407
+ tensor<fp32, [1, ?, 6, 64]> var_465 = reshape(shape = var_464, x = states_33)[name = tensor<string, []>("op_465")];
408
+ tensor<fp32, [1, ?, 384]> states_35 = linear(bias = linear_0_bias_0, weight = decoder_block_2_layer_0_SelfAttention_k_weight, x = hidden_states_51)[name = tensor<string, []>("linear_23")];
409
+ tensor<int32, [4]> var_469 = const()[name = tensor<string, []>("op_469"), val = tensor<int32, [4]>([1, -1, 6, 64])];
410
+ tensor<fp32, [1, ?, 6, 64]> var_470 = reshape(shape = var_469, x = states_35)[name = tensor<string, []>("op_470")];
411
+ tensor<fp32, [1, ?, 384]> states_37 = linear(bias = linear_0_bias_0, weight = decoder_block_2_layer_0_SelfAttention_v_weight, x = hidden_states_51)[name = tensor<string, []>("linear_24")];
412
+ tensor<int32, [4]> var_474 = const()[name = tensor<string, []>("op_474"), val = tensor<int32, [4]>([1, -1, 6, 64])];
413
+ tensor<fp32, [1, ?, 6, 64]> var_475 = reshape(shape = var_474, x = states_37)[name = tensor<string, []>("op_475")];
414
+ tensor<int32, [4]> value_states_9_perm_0 = const()[name = tensor<string, []>("value_states_9_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])];
415
+ tensor<bool, []> scores_17_transpose_x_0 = const()[name = tensor<string, []>("scores_17_transpose_x_0"), val = tensor<bool, []>(false)];
416
+ tensor<bool, []> scores_17_transpose_y_0 = const()[name = tensor<string, []>("scores_17_transpose_y_0"), val = tensor<bool, []>(false)];
417
+ tensor<int32, [4]> transpose_32_perm_0 = const()[name = tensor<string, []>("transpose_32_perm_0"), val = tensor<int32, [4]>([0, 2, -3, -1])];
418
+ tensor<int32, [4]> transpose_33_perm_0 = const()[name = tensor<string, []>("transpose_33_perm_0"), val = tensor<int32, [4]>([0, 2, -1, -3])];
419
+ tensor<fp32, [1, 6, 64, ?]> transpose_33 = transpose(perm = transpose_33_perm_0, x = var_470)[name = tensor<string, []>("transpose_53")];
420
+ tensor<fp32, [1, 6, ?, 64]> transpose_32 = transpose(perm = transpose_32_perm_0, x = var_465)[name = tensor<string, []>("transpose_54")];
421
+ tensor<fp32, [1, 6, ?, ?]> scores_17 = matmul(transpose_x = scores_17_transpose_x_0, transpose_y = scores_17_transpose_y_0, x = transpose_32, y = transpose_33)[name = tensor<string, []>("scores_17")];
422
+ tensor<fp32, [1, 6, ?, ?]> scores_19 = add(x = scores_17, y = position_bias_3)[name = tensor<string, []>("scores_19")];
423
+ tensor<fp32, [1, 6, ?, ?]> var_481 = softmax(axis = var_22, x = scores_19)[name = tensor<string, []>("op_481")];
424
+ tensor<bool, []> states_39_transpose_x_0 = const()[name = tensor<string, []>("states_39_transpose_x_0"), val = tensor<bool, []>(false)];
425
+ tensor<bool, []> states_39_transpose_y_0 = const()[name = tensor<string, []>("states_39_transpose_y_0"), val = tensor<bool, []>(false)];
426
+ tensor<fp32, [1, 6, ?, 64]> value_states_9 = transpose(perm = value_states_9_perm_0, x = var_475)[name = tensor<string, []>("transpose_55")];
427
+ tensor<fp32, [1, 6, ?, 64]> states_39 = matmul(transpose_x = states_39_transpose_x_0, transpose_y = states_39_transpose_y_0, x = var_481, y = value_states_9)[name = tensor<string, []>("states_39")];
428
+ tensor<int32, [4]> var_485_perm_0 = const()[name = tensor<string, []>("op_485_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])];
429
+ tensor<int32, [3]> var_487 = const()[name = tensor<string, []>("op_487"), val = tensor<int32, [3]>([1, -1, 384])];
430
+ tensor<fp32, [1, ?, 6, 64]> var_485 = transpose(perm = var_485_perm_0, x = states_39)[name = tensor<string, []>("transpose_52")];
431
+ tensor<fp32, [1, ?, 384]> input_63 = reshape(shape = var_487, x = var_485)[name = tensor<string, []>("input_63")];
432
+ tensor<fp32, [1, ?, 256]> input_65 = linear(bias = linear_3_bias_0, weight = decoder_block_2_layer_0_SelfAttention_o_weight, x = input_63)[name = tensor<string, []>("linear_25")];
433
+ tensor<fp32, [1, ?, 256]> hidden_states_53 = add(x = hidden_states_45, y = input_65)[name = tensor<string, []>("hidden_states_53")];
434
+ tensor<fp32, []> var_18_promoted_7 = const()[name = tensor<string, []>("op_18_promoted_7"), val = tensor<fp32, []>(0x1p+1)];
435
+ tensor<fp32, [1, ?, 256]> var_503 = pow(x = hidden_states_53, y = var_18_promoted_7)[name = tensor<string, []>("op_503")];
436
+ tensor<int32, [1]> variance_15_axes_0 = const()[name = tensor<string, []>("variance_15_axes_0"), val = tensor<int32, [1]>([-1])];
437
+ tensor<bool, []> variance_15_keep_dims_0 = const()[name = tensor<string, []>("variance_15_keep_dims_0"), val = tensor<bool, []>(true)];
438
+ tensor<fp32, [1, ?, 1]> variance_15 = reduce_mean(axes = variance_15_axes_0, keep_dims = variance_15_keep_dims_0, x = var_503)[name = tensor<string, []>("variance_15")];
439
+ tensor<fp32, []> var_506 = const()[name = tensor<string, []>("op_506"), val = tensor<fp32, []>(0x1.0c6f7ap-20)];
440
+ tensor<fp32, [1, ?, 1]> var_507 = add(x = variance_15, y = var_506)[name = tensor<string, []>("op_507")];
441
+ tensor<fp32, []> var_508_epsilon_0 = const()[name = tensor<string, []>("op_508_epsilon_0"), val = tensor<fp32, []>(0x1.197998p-40)];
442
+ tensor<fp32, [1, ?, 1]> var_508 = rsqrt(epsilon = var_508_epsilon_0, x = var_507)[name = tensor<string, []>("op_508")];
443
+ tensor<fp32, [1, ?, 256]> hidden_states_57 = mul(x = hidden_states_53, y = var_508)[name = tensor<string, []>("hidden_states_57")];
444
+ tensor<fp32, [1, ?, 256]> hidden_states_59 = mul(x = decoder_block_2_layer_1_layer_norm_weight, y = hidden_states_57)[name = tensor<string, []>("hidden_states_59")];
445
+ tensor<fp32, [1, ?, 384]> states_41 = linear(bias = linear_0_bias_0, weight = decoder_block_2_layer_1_EncDecAttention_q_weight, x = hidden_states_59)[name = tensor<string, []>("linear_26")];
446
+ tensor<int32, [4]> var_521 = const()[name = tensor<string, []>("op_521"), val = tensor<int32, [4]>([1, -1, 6, 64])];
447
+ tensor<fp32, [1, ?, 6, 64]> var_522 = reshape(shape = var_521, x = states_41)[name = tensor<string, []>("op_522")];
448
+ tensor<fp32, [1, ?, 384]> states_43 = linear(bias = linear_0_bias_0, weight = decoder_block_2_layer_1_EncDecAttention_k_weight, x = encoder_hidden_states)[name = tensor<string, []>("linear_27")];
449
+ tensor<int32, [4]> var_526 = const()[name = tensor<string, []>("op_526"), val = tensor<int32, [4]>([1, -1, 6, 64])];
450
+ tensor<fp32, [1, ?, 6, 64]> var_527 = reshape(shape = var_526, x = states_43)[name = tensor<string, []>("op_527")];
451
+ tensor<fp32, [1, ?, 384]> states_45 = linear(bias = linear_0_bias_0, weight = decoder_block_2_layer_1_EncDecAttention_v_weight, x = encoder_hidden_states)[name = tensor<string, []>("linear_28")];
452
+ tensor<int32, [4]> var_531 = const()[name = tensor<string, []>("op_531"), val = tensor<int32, [4]>([1, -1, 6, 64])];
453
+ tensor<fp32, [1, ?, 6, 64]> var_532 = reshape(shape = var_531, x = states_45)[name = tensor<string, []>("op_532")];
454
+ tensor<int32, [4]> value_states_11_perm_0 = const()[name = tensor<string, []>("value_states_11_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])];
455
+ tensor<bool, []> scores_21_transpose_x_0 = const()[name = tensor<string, []>("scores_21_transpose_x_0"), val = tensor<bool, []>(false)];
456
+ tensor<bool, []> scores_21_transpose_y_0 = const()[name = tensor<string, []>("scores_21_transpose_y_0"), val = tensor<bool, []>(false)];
457
+ tensor<int32, [4]> transpose_34_perm_0 = const()[name = tensor<string, []>("transpose_34_perm_0"), val = tensor<int32, [4]>([0, 2, -3, -1])];
458
+ tensor<int32, [4]> transpose_35_perm_0 = const()[name = tensor<string, []>("transpose_35_perm_0"), val = tensor<int32, [4]>([0, 2, -1, -3])];
459
+ tensor<fp32, [1, 6, 64, ?]> transpose_35 = transpose(perm = transpose_35_perm_0, x = var_527)[name = tensor<string, []>("transpose_49")];
460
+ tensor<fp32, [1, 6, ?, 64]> transpose_34 = transpose(perm = transpose_34_perm_0, x = var_522)[name = tensor<string, []>("transpose_50")];
461
+ tensor<fp32, [1, 6, ?, ?]> scores_21 = matmul(transpose_x = scores_21_transpose_x_0, transpose_y = scores_21_transpose_y_0, x = transpose_34, y = transpose_35)[name = tensor<string, []>("scores_21")];
462
+ tensor<fp32, [1, 6, ?, ?]> scores_23 = add(x = scores_21, y = position_bias)[name = tensor<string, []>("scores_23")];
463
+ tensor<fp32, [1, 6, ?, ?]> var_538 = softmax(axis = var_22, x = scores_23)[name = tensor<string, []>("op_538")];
464
+ tensor<bool, []> states_47_transpose_x_0 = const()[name = tensor<string, []>("states_47_transpose_x_0"), val = tensor<bool, []>(false)];
465
+ tensor<bool, []> states_47_transpose_y_0 = const()[name = tensor<string, []>("states_47_transpose_y_0"), val = tensor<bool, []>(false)];
466
+ tensor<fp32, [1, 6, ?, 64]> value_states_11 = transpose(perm = value_states_11_perm_0, x = var_532)[name = tensor<string, []>("transpose_51")];
467
+ tensor<fp32, [1, 6, ?, 64]> states_47 = matmul(transpose_x = states_47_transpose_x_0, transpose_y = states_47_transpose_y_0, x = var_538, y = value_states_11)[name = tensor<string, []>("states_47")];
468
+ tensor<int32, [4]> var_542_perm_0 = const()[name = tensor<string, []>("op_542_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])];
469
+ tensor<int32, [3]> var_544 = const()[name = tensor<string, []>("op_544"), val = tensor<int32, [3]>([1, -1, 384])];
470
+ tensor<fp32, [1, ?, 6, 64]> var_542 = transpose(perm = var_542_perm_0, x = states_47)[name = tensor<string, []>("transpose_48")];
471
+ tensor<fp32, [1, ?, 384]> input_71 = reshape(shape = var_544, x = var_542)[name = tensor<string, []>("input_71")];
472
+ tensor<fp32, [1, ?, 256]> input_73 = linear(bias = linear_3_bias_0, weight = decoder_block_2_layer_1_EncDecAttention_o_weight, x = input_71)[name = tensor<string, []>("linear_29")];
473
+ tensor<fp32, [1, ?, 256]> hidden_states_61 = add(x = hidden_states_53, y = input_73)[name = tensor<string, []>("hidden_states_61")];
474
+ tensor<fp32, []> var_18_promoted_8 = const()[name = tensor<string, []>("op_18_promoted_8"), val = tensor<fp32, []>(0x1p+1)];
475
+ tensor<fp32, [1, ?, 256]> var_554 = pow(x = hidden_states_61, y = var_18_promoted_8)[name = tensor<string, []>("op_554")];
476
+ tensor<int32, [1]> variance_17_axes_0 = const()[name = tensor<string, []>("variance_17_axes_0"), val = tensor<int32, [1]>([-1])];
477
+ tensor<bool, []> variance_17_keep_dims_0 = const()[name = tensor<string, []>("variance_17_keep_dims_0"), val = tensor<bool, []>(true)];
478
+ tensor<fp32, [1, ?, 1]> variance_17 = reduce_mean(axes = variance_17_axes_0, keep_dims = variance_17_keep_dims_0, x = var_554)[name = tensor<string, []>("variance_17")];
479
+ tensor<fp32, []> var_557 = const()[name = tensor<string, []>("op_557"), val = tensor<fp32, []>(0x1.0c6f7ap-20)];
480
+ tensor<fp32, [1, ?, 1]> var_558 = add(x = variance_17, y = var_557)[name = tensor<string, []>("op_558")];
481
+ tensor<fp32, []> var_559_epsilon_0 = const()[name = tensor<string, []>("op_559_epsilon_0"), val = tensor<fp32, []>(0x1.197998p-40)];
482
+ tensor<fp32, [1, ?, 1]> var_559 = rsqrt(epsilon = var_559_epsilon_0, x = var_558)[name = tensor<string, []>("op_559")];
483
+ tensor<fp32, [1, ?, 256]> hidden_states_65 = mul(x = hidden_states_61, y = var_559)[name = tensor<string, []>("hidden_states_65")];
484
+ tensor<fp32, [1, ?, 256]> input_75 = mul(x = decoder_block_2_layer_2_layer_norm_weight, y = hidden_states_65)[name = tensor<string, []>("input_75")];
485
+ tensor<fp32, [1, ?, 1024]> input_77 = linear(bias = linear_8_bias_0, weight = decoder_block_2_layer_2_DenseReluDense_wi_0_weight, x = input_75)[name = tensor<string, []>("linear_30")];
486
+ tensor<string, []> hidden_gelu_5_mode_0 = const()[name = tensor<string, []>("hidden_gelu_5_mode_0"), val = tensor<string, []>("TANH_APPROXIMATION")];
487
+ tensor<fp32, [1, ?, 1024]> hidden_gelu_5 = gelu(mode = hidden_gelu_5_mode_0, x = input_77)[name = tensor<string, []>("hidden_gelu_5")];
488
+ tensor<fp32, [1, ?, 1024]> hidden_linear_5 = linear(bias = linear_8_bias_0, weight = decoder_block_2_layer_2_DenseReluDense_wi_1_weight, x = input_75)[name = tensor<string, []>("linear_31")];
489
+ tensor<fp32, [1, ?, 1024]> input_79 = mul(x = hidden_gelu_5, y = hidden_linear_5)[name = tensor<string, []>("input_79")];
490
+ tensor<fp32, [1, ?, 256]> input_83 = linear(bias = linear_3_bias_0, weight = decoder_block_2_layer_2_DenseReluDense_wo_weight, x = input_79)[name = tensor<string, []>("linear_32")];
491
+ tensor<fp32, [1, ?, 256]> hidden_states_67 = add(x = hidden_states_61, y = input_83)[name = tensor<string, []>("hidden_states_67")];
492
+ tensor<fp32, []> var_18_promoted_9 = const()[name = tensor<string, []>("op_18_promoted_9"), val = tensor<fp32, []>(0x1p+1)];
493
+ tensor<fp32, [1, ?, 256]> var_600 = pow(x = hidden_states_67, y = var_18_promoted_9)[name = tensor<string, []>("op_600")];
494
+ tensor<int32, [1]> variance_19_axes_0 = const()[name = tensor<string, []>("variance_19_axes_0"), val = tensor<int32, [1]>([-1])];
495
+ tensor<bool, []> variance_19_keep_dims_0 = const()[name = tensor<string, []>("variance_19_keep_dims_0"), val = tensor<bool, []>(true)];
496
+ tensor<fp32, [1, ?, 1]> variance_19 = reduce_mean(axes = variance_19_axes_0, keep_dims = variance_19_keep_dims_0, x = var_600)[name = tensor<string, []>("variance_19")];
497
+ tensor<fp32, []> var_603 = const()[name = tensor<string, []>("op_603"), val = tensor<fp32, []>(0x1.0c6f7ap-20)];
498
+ tensor<fp32, [1, ?, 1]> var_604 = add(x = variance_19, y = var_603)[name = tensor<string, []>("op_604")];
499
+ tensor<fp32, []> var_605_epsilon_0 = const()[name = tensor<string, []>("op_605_epsilon_0"), val = tensor<fp32, []>(0x1.197998p-40)];
500
+ tensor<fp32, [1, ?, 1]> var_605 = rsqrt(epsilon = var_605_epsilon_0, x = var_604)[name = tensor<string, []>("op_605")];
501
+ tensor<fp32, [1, ?, 256]> hidden_states_71 = mul(x = hidden_states_67, y = var_605)[name = tensor<string, []>("hidden_states_71")];
502
+ tensor<fp32, [1, ?, 256]> hidden_states_73 = mul(x = decoder_block_3_layer_0_layer_norm_weight, y = hidden_states_71)[name = tensor<string, []>("hidden_states_73")];
503
+ tensor<fp32, [1, ?, 384]> states_49 = linear(bias = linear_0_bias_0, weight = decoder_block_3_layer_0_SelfAttention_q_weight, x = hidden_states_73)[name = tensor<string, []>("linear_33")];
504
+ tensor<int32, [4]> var_618 = const()[name = tensor<string, []>("op_618"), val = tensor<int32, [4]>([1, -1, 6, 64])];
505
+ tensor<fp32, [1, ?, 6, 64]> var_619 = reshape(shape = var_618, x = states_49)[name = tensor<string, []>("op_619")];
506
+ tensor<fp32, [1, ?, 384]> states_51 = linear(bias = linear_0_bias_0, weight = decoder_block_3_layer_0_SelfAttention_k_weight, x = hidden_states_73)[name = tensor<string, []>("linear_34")];
507
+ tensor<int32, [4]> var_623 = const()[name = tensor<string, []>("op_623"), val = tensor<int32, [4]>([1, -1, 6, 64])];
508
+ tensor<fp32, [1, ?, 6, 64]> var_624 = reshape(shape = var_623, x = states_51)[name = tensor<string, []>("op_624")];
509
+ tensor<fp32, [1, ?, 384]> states_53 = linear(bias = linear_0_bias_0, weight = decoder_block_3_layer_0_SelfAttention_v_weight, x = hidden_states_73)[name = tensor<string, []>("linear_35")];
510
+ tensor<int32, [4]> var_628 = const()[name = tensor<string, []>("op_628"), val = tensor<int32, [4]>([1, -1, 6, 64])];
511
+ tensor<fp32, [1, ?, 6, 64]> var_629 = reshape(shape = var_628, x = states_53)[name = tensor<string, []>("op_629")];
512
+ tensor<int32, [4]> value_states_13_perm_0 = const()[name = tensor<string, []>("value_states_13_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])];
513
+ tensor<bool, []> scores_25_transpose_x_0 = const()[name = tensor<string, []>("scores_25_transpose_x_0"), val = tensor<bool, []>(false)];
514
+ tensor<bool, []> scores_25_transpose_y_0 = const()[name = tensor<string, []>("scores_25_transpose_y_0"), val = tensor<bool, []>(false)];
515
+ tensor<int32, [4]> transpose_36_perm_0 = const()[name = tensor<string, []>("transpose_36_perm_0"), val = tensor<int32, [4]>([0, 2, -3, -1])];
516
+ tensor<int32, [4]> transpose_37_perm_0 = const()[name = tensor<string, []>("transpose_37_perm_0"), val = tensor<int32, [4]>([0, 2, -1, -3])];
517
+ tensor<fp32, [1, 6, 64, ?]> transpose_37 = transpose(perm = transpose_37_perm_0, x = var_624)[name = tensor<string, []>("transpose_45")];
518
+ tensor<fp32, [1, 6, ?, 64]> transpose_36 = transpose(perm = transpose_36_perm_0, x = var_619)[name = tensor<string, []>("transpose_46")];
519
+ tensor<fp32, [1, 6, ?, ?]> scores_25 = matmul(transpose_x = scores_25_transpose_x_0, transpose_y = scores_25_transpose_y_0, x = transpose_36, y = transpose_37)[name = tensor<string, []>("scores_25")];
520
+ tensor<fp32, [1, 6, ?, ?]> scores_27 = add(x = scores_25, y = position_bias_3)[name = tensor<string, []>("scores_27")];
521
+ tensor<fp32, [1, 6, ?, ?]> var_635 = softmax(axis = var_22, x = scores_27)[name = tensor<string, []>("op_635")];
522
+ tensor<bool, []> states_55_transpose_x_0 = const()[name = tensor<string, []>("states_55_transpose_x_0"), val = tensor<bool, []>(false)];
523
+ tensor<bool, []> states_55_transpose_y_0 = const()[name = tensor<string, []>("states_55_transpose_y_0"), val = tensor<bool, []>(false)];
524
+ tensor<fp32, [1, 6, ?, 64]> value_states_13 = transpose(perm = value_states_13_perm_0, x = var_629)[name = tensor<string, []>("transpose_47")];
525
+ tensor<fp32, [1, 6, ?, 64]> states_55 = matmul(transpose_x = states_55_transpose_x_0, transpose_y = states_55_transpose_y_0, x = var_635, y = value_states_13)[name = tensor<string, []>("states_55")];
526
+ tensor<int32, [4]> var_639_perm_0 = const()[name = tensor<string, []>("op_639_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])];
527
+ tensor<int32, [3]> var_641 = const()[name = tensor<string, []>("op_641"), val = tensor<int32, [3]>([1, -1, 384])];
528
+ tensor<fp32, [1, ?, 6, 64]> var_639 = transpose(perm = var_639_perm_0, x = states_55)[name = tensor<string, []>("transpose_44")];
529
+ tensor<fp32, [1, ?, 384]> input_89 = reshape(shape = var_641, x = var_639)[name = tensor<string, []>("input_89")];
530
+ tensor<fp32, [1, ?, 256]> input_91 = linear(bias = linear_3_bias_0, weight = decoder_block_3_layer_0_SelfAttention_o_weight, x = input_89)[name = tensor<string, []>("linear_36")];
531
+ tensor<fp32, [1, ?, 256]> hidden_states_75 = add(x = hidden_states_67, y = input_91)[name = tensor<string, []>("hidden_states_75")];
532
+ tensor<fp32, []> var_18_promoted_10 = const()[name = tensor<string, []>("op_18_promoted_10"), val = tensor<fp32, []>(0x1p+1)];
533
+ tensor<fp32, [1, ?, 256]> var_657 = pow(x = hidden_states_75, y = var_18_promoted_10)[name = tensor<string, []>("op_657")];
534
+ tensor<int32, [1]> variance_21_axes_0 = const()[name = tensor<string, []>("variance_21_axes_0"), val = tensor<int32, [1]>([-1])];
535
+ tensor<bool, []> variance_21_keep_dims_0 = const()[name = tensor<string, []>("variance_21_keep_dims_0"), val = tensor<bool, []>(true)];
536
+ tensor<fp32, [1, ?, 1]> variance_21 = reduce_mean(axes = variance_21_axes_0, keep_dims = variance_21_keep_dims_0, x = var_657)[name = tensor<string, []>("variance_21")];
537
+ tensor<fp32, []> var_660 = const()[name = tensor<string, []>("op_660"), val = tensor<fp32, []>(0x1.0c6f7ap-20)];
538
+ tensor<fp32, [1, ?, 1]> var_661 = add(x = variance_21, y = var_660)[name = tensor<string, []>("op_661")];
539
+ tensor<fp32, []> var_662_epsilon_0 = const()[name = tensor<string, []>("op_662_epsilon_0"), val = tensor<fp32, []>(0x1.197998p-40)];
540
+ tensor<fp32, [1, ?, 1]> var_662 = rsqrt(epsilon = var_662_epsilon_0, x = var_661)[name = tensor<string, []>("op_662")];
541
+ tensor<fp32, [1, ?, 256]> hidden_states_79 = mul(x = hidden_states_75, y = var_662)[name = tensor<string, []>("hidden_states_79")];
542
+ tensor<fp32, [1, ?, 256]> hidden_states_81 = mul(x = decoder_block_3_layer_1_layer_norm_weight, y = hidden_states_79)[name = tensor<string, []>("hidden_states_81")];
543
+ tensor<fp32, [1, ?, 384]> states_57 = linear(bias = linear_0_bias_0, weight = decoder_block_3_layer_1_EncDecAttention_q_weight, x = hidden_states_81)[name = tensor<string, []>("linear_37")];
544
+ tensor<int32, [4]> var_675 = const()[name = tensor<string, []>("op_675"), val = tensor<int32, [4]>([1, -1, 6, 64])];
545
+ tensor<fp32, [1, ?, 6, 64]> var_676 = reshape(shape = var_675, x = states_57)[name = tensor<string, []>("op_676")];
546
+ tensor<fp32, [1, ?, 384]> states_59 = linear(bias = linear_0_bias_0, weight = decoder_block_3_layer_1_EncDecAttention_k_weight, x = encoder_hidden_states)[name = tensor<string, []>("linear_38")];
547
+ tensor<int32, [4]> var_680 = const()[name = tensor<string, []>("op_680"), val = tensor<int32, [4]>([1, -1, 6, 64])];
548
+ tensor<fp32, [1, ?, 6, 64]> var_681 = reshape(shape = var_680, x = states_59)[name = tensor<string, []>("op_681")];
549
+ tensor<fp32, [1, ?, 384]> states_61 = linear(bias = linear_0_bias_0, weight = decoder_block_3_layer_1_EncDecAttention_v_weight, x = encoder_hidden_states)[name = tensor<string, []>("linear_39")];
550
+ tensor<int32, [4]> var_685 = const()[name = tensor<string, []>("op_685"), val = tensor<int32, [4]>([1, -1, 6, 64])];
551
+ tensor<fp32, [1, ?, 6, 64]> var_686 = reshape(shape = var_685, x = states_61)[name = tensor<string, []>("op_686")];
552
+ tensor<int32, [4]> value_states_perm_0 = const()[name = tensor<string, []>("value_states_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])];
553
+ tensor<bool, []> scores_29_transpose_x_0 = const()[name = tensor<string, []>("scores_29_transpose_x_0"), val = tensor<bool, []>(false)];
554
+ tensor<bool, []> scores_29_transpose_y_0 = const()[name = tensor<string, []>("scores_29_transpose_y_0"), val = tensor<bool, []>(false)];
555
+ tensor<int32, [4]> transpose_38_perm_0 = const()[name = tensor<string, []>("transpose_38_perm_0"), val = tensor<int32, [4]>([0, 2, -3, -1])];
556
+ tensor<int32, [4]> transpose_39_perm_0 = const()[name = tensor<string, []>("transpose_39_perm_0"), val = tensor<int32, [4]>([0, 2, -1, -3])];
557
+ tensor<fp32, [1, 6, 64, ?]> transpose_39 = transpose(perm = transpose_39_perm_0, x = var_681)[name = tensor<string, []>("transpose_41")];
558
+ tensor<fp32, [1, 6, ?, 64]> transpose_38 = transpose(perm = transpose_38_perm_0, x = var_676)[name = tensor<string, []>("transpose_42")];
559
+ tensor<fp32, [1, 6, ?, ?]> scores_29 = matmul(transpose_x = scores_29_transpose_x_0, transpose_y = scores_29_transpose_y_0, x = transpose_38, y = transpose_39)[name = tensor<string, []>("scores_29")];
560
+ tensor<fp32, [1, 6, ?, ?]> scores = add(x = scores_29, y = position_bias)[name = tensor<string, []>("scores")];
561
+ tensor<fp32, [1, 6, ?, ?]> var_692 = softmax(axis = var_22, x = scores)[name = tensor<string, []>("op_692")];
562
+ tensor<bool, []> states_transpose_x_0 = const()[name = tensor<string, []>("states_transpose_x_0"), val = tensor<bool, []>(false)];
563
+ tensor<bool, []> states_transpose_y_0 = const()[name = tensor<string, []>("states_transpose_y_0"), val = tensor<bool, []>(false)];
564
+ tensor<fp32, [1, 6, ?, 64]> value_states = transpose(perm = value_states_perm_0, x = var_686)[name = tensor<string, []>("transpose_43")];
565
+ tensor<fp32, [1, 6, ?, 64]> states = matmul(transpose_x = states_transpose_x_0, transpose_y = states_transpose_y_0, x = var_692, y = value_states)[name = tensor<string, []>("states")];
566
+ tensor<int32, [4]> var_696_perm_0 = const()[name = tensor<string, []>("op_696_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])];
567
+ tensor<int32, [3]> var_698 = const()[name = tensor<string, []>("op_698"), val = tensor<int32, [3]>([1, -1, 384])];
568
+ tensor<fp32, [1, ?, 6, 64]> var_696 = transpose(perm = var_696_perm_0, x = states)[name = tensor<string, []>("transpose_40")];
569
+ tensor<fp32, [1, ?, 384]> input_97 = reshape(shape = var_698, x = var_696)[name = tensor<string, []>("input_97")];
570
+ tensor<fp32, [1, ?, 256]> input_99 = linear(bias = linear_3_bias_0, weight = decoder_block_3_layer_1_EncDecAttention_o_weight, x = input_97)[name = tensor<string, []>("linear_40")];
571
+ tensor<fp32, [1, ?, 256]> hidden_states_83 = add(x = hidden_states_75, y = input_99)[name = tensor<string, []>("hidden_states_83")];
572
+ tensor<fp32, []> var_18_promoted_11 = const()[name = tensor<string, []>("op_18_promoted_11"), val = tensor<fp32, []>(0x1p+1)];
573
+ tensor<fp32, [1, ?, 256]> var_708 = pow(x = hidden_states_83, y = var_18_promoted_11)[name = tensor<string, []>("op_708")];
574
+ tensor<int32, [1]> variance_23_axes_0 = const()[name = tensor<string, []>("variance_23_axes_0"), val = tensor<int32, [1]>([-1])];
575
+ tensor<bool, []> variance_23_keep_dims_0 = const()[name = tensor<string, []>("variance_23_keep_dims_0"), val = tensor<bool, []>(true)];
576
+ tensor<fp32, [1, ?, 1]> variance_23 = reduce_mean(axes = variance_23_axes_0, keep_dims = variance_23_keep_dims_0, x = var_708)[name = tensor<string, []>("variance_23")];
577
+ tensor<fp32, []> var_711 = const()[name = tensor<string, []>("op_711"), val = tensor<fp32, []>(0x1.0c6f7ap-20)];
578
+ tensor<fp32, [1, ?, 1]> var_712 = add(x = variance_23, y = var_711)[name = tensor<string, []>("op_712")];
579
+ tensor<fp32, []> var_713_epsilon_0 = const()[name = tensor<string, []>("op_713_epsilon_0"), val = tensor<fp32, []>(0x1.197998p-40)];
580
+ tensor<fp32, [1, ?, 1]> var_713 = rsqrt(epsilon = var_713_epsilon_0, x = var_712)[name = tensor<string, []>("op_713")];
581
+ tensor<fp32, [1, ?, 256]> hidden_states_87 = mul(x = hidden_states_83, y = var_713)[name = tensor<string, []>("hidden_states_87")];
582
+ tensor<fp32, [1, ?, 256]> input_101 = mul(x = decoder_block_3_layer_2_layer_norm_weight, y = hidden_states_87)[name = tensor<string, []>("input_101")];
583
+ tensor<fp32, [1, ?, 1024]> input_103 = linear(bias = linear_8_bias_0, weight = decoder_block_3_layer_2_DenseReluDense_wi_0_weight, x = input_101)[name = tensor<string, []>("linear_41")];
584
+ tensor<string, []> hidden_gelu_mode_0 = const()[name = tensor<string, []>("hidden_gelu_mode_0"), val = tensor<string, []>("TANH_APPROXIMATION")];
585
+ tensor<fp32, [1, ?, 1024]> hidden_gelu = gelu(mode = hidden_gelu_mode_0, x = input_103)[name = tensor<string, []>("hidden_gelu")];
586
+ tensor<fp32, [1, ?, 1024]> hidden_linear = linear(bias = linear_8_bias_0, weight = decoder_block_3_layer_2_DenseReluDense_wi_1_weight, x = input_101)[name = tensor<string, []>("linear_42")];
587
+ tensor<fp32, [1, ?, 1024]> input_105 = mul(x = hidden_gelu, y = hidden_linear)[name = tensor<string, []>("input_105")];
588
+ tensor<fp32, [1, ?, 256]> input_109 = linear(bias = linear_3_bias_0, weight = decoder_block_3_layer_2_DenseReluDense_wo_weight, x = input_105)[name = tensor<string, []>("linear_43")];
589
+ tensor<fp32, [1, ?, 256]> hidden_states_89 = add(x = hidden_states_83, y = input_109)[name = tensor<string, []>("hidden_states_89")];
590
+ tensor<fp32, []> var_18_promoted_12 = const()[name = tensor<string, []>("op_18_promoted_12"), val = tensor<fp32, []>(0x1p+1)];
591
+ tensor<fp32, [1, ?, 256]> var_746 = pow(x = hidden_states_89, y = var_18_promoted_12)[name = tensor<string, []>("op_746")];
592
+ tensor<int32, [1]> variance_axes_0 = const()[name = tensor<string, []>("variance_axes_0"), val = tensor<int32, [1]>([-1])];
593
+ tensor<bool, []> variance_keep_dims_0 = const()[name = tensor<string, []>("variance_keep_dims_0"), val = tensor<bool, []>(true)];
594
+ tensor<fp32, [1, ?, 1]> variance = reduce_mean(axes = variance_axes_0, keep_dims = variance_keep_dims_0, x = var_746)[name = tensor<string, []>("variance")];
595
+ tensor<fp32, []> var_749 = const()[name = tensor<string, []>("op_749"), val = tensor<fp32, []>(0x1.0c6f7ap-20)];
596
+ tensor<fp32, [1, ?, 1]> var_750 = add(x = variance, y = var_749)[name = tensor<string, []>("op_750")];
597
+ tensor<fp32, []> var_751_epsilon_0 = const()[name = tensor<string, []>("op_751_epsilon_0"), val = tensor<fp32, []>(0x1.197998p-40)];
598
+ tensor<fp32, [1, ?, 1]> var_751 = rsqrt(epsilon = var_751_epsilon_0, x = var_750)[name = tensor<string, []>("op_751")];
599
+ tensor<fp32, [1, ?, 256]> hidden_states = mul(x = hidden_states_89, y = var_751)[name = tensor<string, []>("hidden_states")];
600
+ tensor<fp32, [1, ?, 256]> input_111 = mul(x = decoder_final_layer_norm_weight, y = hidden_states)[name = tensor<string, []>("input_111")];
601
+ tensor<fp32, [1, ?, 384]> logits = linear(bias = linear_0_bias_0, weight = lm_head_weight, x = input_111)[name = tensor<string, []>("linear_44")];
602
+ } -> (logits);
603
+ }
MultilingualG2PDecoder.mlmodelc/weights/weight.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:005b5ffbccabe4fd4074204d16af745b5d8f458a687b0c07e80060f7fe0a08e4
3
+ size 25977088
MultilingualG2PEncoder.mlmodelc/analytics/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee8fd1ea46ec79fd7816493973deaa583cd867ce0c7d2dd55124d2368db094bd
3
+ size 243
MultilingualG2PEncoder.mlmodelc/coremldata.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed8bf165b8d5939f995b29490872ee581c9834d5b22d3686fc5c7b300680b058
3
+ size 439
MultilingualG2PEncoder.mlmodelc/metadata.json ADDED
@@ -0,0 +1,99 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "metadataOutputVersion" : "3.0",
4
+ "storagePrecision" : "Float32",
5
+ "outputSchema" : [
6
+ {
7
+ "hasShapeFlexibility" : "0",
8
+ "isOptional" : "0",
9
+ "dataType" : "Float32",
10
+ "formattedType" : "MultiArray (Float32)",
11
+ "shortDescription" : "",
12
+ "shape" : "[]",
13
+ "name" : "last_hidden_state",
14
+ "type" : "MultiArray"
15
+ }
16
+ ],
17
+ "modelParameters" : [
18
+
19
+ ],
20
+ "specificationVersion" : 8,
21
+ "mlProgramOperationTypeHistogram" : {
22
+ "Range1d" : 1,
23
+ "Ios17.reshape" : 48,
24
+ "Ios16.reduceMean" : 25,
25
+ "Ios16.softmax" : 12,
26
+ "Ios17.matmul" : 24,
27
+ "Ios17.transpose" : 49,
28
+ "Select" : 3,
29
+ "Ios17.expandDims" : 5,
30
+ "Ios17.add" : 66,
31
+ "Ios16.fillLike" : 1,
32
+ "Shape" : 1,
33
+ "Ios17.gather" : 3,
34
+ "Ios17.log" : 1,
35
+ "Ios17.less" : 1,
36
+ "Ios17.sub" : 2,
37
+ "Ios17.pow" : 25,
38
+ "Ios17.cast" : 4,
39
+ "Ios16.gelu" : 12,
40
+ "Ios17.linear" : 84,
41
+ "Ios17.abs" : 1,
42
+ "Ios17.greaterEqual" : 2,
43
+ "Ios17.minimum" : 1,
44
+ "Ios17.rsqrt" : 25,
45
+ "Ios17.greater" : 1,
46
+ "Ios17.mul" : 67
47
+ },
48
+ "computePrecision" : "Mixed (Float32, Int32)",
49
+ "isUpdatable" : "0",
50
+ "stateSchema" : [
51
+
52
+ ],
53
+ "availability" : {
54
+ "macOS" : "14.0",
55
+ "tvOS" : "17.0",
56
+ "visionOS" : "1.0",
57
+ "watchOS" : "10.0",
58
+ "iOS" : "17.0",
59
+ "macCatalyst" : "17.0"
60
+ },
61
+ "modelType" : {
62
+ "name" : "MLModelType_mlProgram"
63
+ },
64
+ "userDefinedMetadata" : {
65
+ "com.github.apple.coremltools.conversion_date" : "2026-03-13",
66
+ "com.github.apple.coremltools.source" : "torch==2.7.0",
67
+ "com.github.apple.coremltools.version" : "9.0",
68
+ "com.github.apple.coremltools.source_dialect" : "TorchScript"
69
+ },
70
+ "inputSchema" : [
71
+ {
72
+ "dataType" : "Int32",
73
+ "hasShapeFlexibility" : "1",
74
+ "isOptional" : "0",
75
+ "shapeFlexibility" : "1 × 1...64",
76
+ "shapeRange" : "[[1, 1], [1, 64]]",
77
+ "formattedType" : "MultiArray (Int32 1 × 16)",
78
+ "type" : "MultiArray",
79
+ "shape" : "[1, 16]",
80
+ "name" : "input_ids",
81
+ "shortDescription" : ""
82
+ },
83
+ {
84
+ "dataType" : "Int32",
85
+ "hasShapeFlexibility" : "1",
86
+ "isOptional" : "0",
87
+ "shapeFlexibility" : "1 × 1...64",
88
+ "shapeRange" : "[[1, 1], [1, 64]]",
89
+ "formattedType" : "MultiArray (Int32 1 × 16)",
90
+ "type" : "MultiArray",
91
+ "shape" : "[1, 16]",
92
+ "name" : "attention_mask",
93
+ "shortDescription" : ""
94
+ }
95
+ ],
96
+ "generatedClassName" : "G2PEncoder",
97
+ "method" : "predict"
98
+ }
99
+ ]
MultilingualG2PEncoder.mlmodelc/model.mil ADDED
The diff for this file is too large to render. See raw diff
 
MultilingualG2PEncoder.mlmodelc/weights/weight.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:11b225e93b6b1fe6fb85c9d4317724e1a033d6123fdc01dc2ad85f3c1f168eb3
3
+ size 57056704