Upload 16 files
Browse files- G2PDecoder.mlpackage/Data/com.apple.CoreML/model.mlmodel +2 -2
- G2PDecoder.mlpackage/Data/com.apple.CoreML/weights/weight.bin +2 -2
- G2PDecoder.mlpackage/Manifest.json +8 -8
- G2PEncoder.mlpackage/Data/com.apple.CoreML/model.mlmodel +2 -2
- G2PEncoder.mlpackage/Data/com.apple.CoreML/weights/weight.bin +2 -2
- G2PEncoder.mlpackage/Manifest.json +8 -8
- MultilingualG2PDecoder.mlmodelc/analytics/coremldata.bin +3 -0
- MultilingualG2PDecoder.mlmodelc/coremldata.bin +3 -0
- MultilingualG2PDecoder.mlmodelc/metadata.json +113 -0
- MultilingualG2PDecoder.mlmodelc/model.mil +603 -0
- MultilingualG2PDecoder.mlmodelc/weights/weight.bin +3 -0
- MultilingualG2PEncoder.mlmodelc/analytics/coremldata.bin +3 -0
- MultilingualG2PEncoder.mlmodelc/coremldata.bin +3 -0
- MultilingualG2PEncoder.mlmodelc/metadata.json +99 -0
- MultilingualG2PEncoder.mlmodelc/model.mil +0 -0
- MultilingualG2PEncoder.mlmodelc/weights/weight.bin +3 -0
G2PDecoder.mlpackage/Data/com.apple.CoreML/model.mlmodel
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3b2bfc025be6563494c66b3f9c1b62674741e392d14d92d2ecaeb1730643e50c
|
| 3 |
+
size 85095
|
G2PDecoder.mlpackage/Data/com.apple.CoreML/weights/weight.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:005b5ffbccabe4fd4074204d16af745b5d8f458a687b0c07e80060f7fe0a08e4
|
| 3 |
+
size 25977088
|
G2PDecoder.mlpackage/Manifest.json
CHANGED
|
@@ -1,18 +1,18 @@
|
|
| 1 |
{
|
| 2 |
"fileFormatVersion": "1.0.0",
|
| 3 |
"itemInfoEntries": {
|
| 4 |
-
"
|
| 5 |
-
"author": "com.apple.CoreML",
|
| 6 |
-
"description": "CoreML Model Specification",
|
| 7 |
-
"name": "model.mlmodel",
|
| 8 |
-
"path": "com.apple.CoreML/model.mlmodel"
|
| 9 |
-
},
|
| 10 |
-
"5D000863-3BC2-4F18-AC66-6F1DE5E29001": {
|
| 11 |
"author": "com.apple.CoreML",
|
| 12 |
"description": "CoreML Model Weights",
|
| 13 |
"name": "weights",
|
| 14 |
"path": "com.apple.CoreML/weights"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 15 |
}
|
| 16 |
},
|
| 17 |
-
"rootModelIdentifier": "
|
| 18 |
}
|
|
|
|
| 1 |
{
|
| 2 |
"fileFormatVersion": "1.0.0",
|
| 3 |
"itemInfoEntries": {
|
| 4 |
+
"837F74EA-4434-419F-AE52-FD61A69F6E0A": {
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 5 |
"author": "com.apple.CoreML",
|
| 6 |
"description": "CoreML Model Weights",
|
| 7 |
"name": "weights",
|
| 8 |
"path": "com.apple.CoreML/weights"
|
| 9 |
+
},
|
| 10 |
+
"FEF5E4E3-07B4-4F5A-BF3F-C4A2BB7E68E2": {
|
| 11 |
+
"author": "com.apple.CoreML",
|
| 12 |
+
"description": "CoreML Model Specification",
|
| 13 |
+
"name": "model.mlmodel",
|
| 14 |
+
"path": "com.apple.CoreML/model.mlmodel"
|
| 15 |
}
|
| 16 |
},
|
| 17 |
+
"rootModelIdentifier": "FEF5E4E3-07B4-4F5A-BF3F-C4A2BB7E68E2"
|
| 18 |
}
|
G2PEncoder.mlpackage/Data/com.apple.CoreML/model.mlmodel
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:338ee3222fb062efddd1f85374d1aa15478b4975b74f90c59264ad961d9879a3
|
| 3 |
+
size 131789
|
G2PEncoder.mlpackage/Data/com.apple.CoreML/weights/weight.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:11b225e93b6b1fe6fb85c9d4317724e1a033d6123fdc01dc2ad85f3c1f168eb3
|
| 3 |
+
size 57056704
|
G2PEncoder.mlpackage/Manifest.json
CHANGED
|
@@ -1,18 +1,18 @@
|
|
| 1 |
{
|
| 2 |
"fileFormatVersion": "1.0.0",
|
| 3 |
"itemInfoEntries": {
|
| 4 |
-
"
|
| 5 |
-
"author": "com.apple.CoreML",
|
| 6 |
-
"description": "CoreML Model Weights",
|
| 7 |
-
"name": "weights",
|
| 8 |
-
"path": "com.apple.CoreML/weights"
|
| 9 |
-
},
|
| 10 |
-
"D40EF921-64C1-4EEC-BF85-D226D10F6B90": {
|
| 11 |
"author": "com.apple.CoreML",
|
| 12 |
"description": "CoreML Model Specification",
|
| 13 |
"name": "model.mlmodel",
|
| 14 |
"path": "com.apple.CoreML/model.mlmodel"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 15 |
}
|
| 16 |
},
|
| 17 |
-
"rootModelIdentifier": "
|
| 18 |
}
|
|
|
|
| 1 |
{
|
| 2 |
"fileFormatVersion": "1.0.0",
|
| 3 |
"itemInfoEntries": {
|
| 4 |
+
"48AE8C97-A0EB-4155-AE9E-D179548FBDD0": {
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 5 |
"author": "com.apple.CoreML",
|
| 6 |
"description": "CoreML Model Specification",
|
| 7 |
"name": "model.mlmodel",
|
| 8 |
"path": "com.apple.CoreML/model.mlmodel"
|
| 9 |
+
},
|
| 10 |
+
"7760FC9D-D7D7-4E6E-8C85-EBF0D242EFC9": {
|
| 11 |
+
"author": "com.apple.CoreML",
|
| 12 |
+
"description": "CoreML Model Weights",
|
| 13 |
+
"name": "weights",
|
| 14 |
+
"path": "com.apple.CoreML/weights"
|
| 15 |
}
|
| 16 |
},
|
| 17 |
+
"rootModelIdentifier": "48AE8C97-A0EB-4155-AE9E-D179548FBDD0"
|
| 18 |
}
|
MultilingualG2PDecoder.mlmodelc/analytics/coremldata.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5f34464b8c4e85cde3ca62bc7e22d1ab3eb7494c8aa72c220391c99800910856
|
| 3 |
+
size 243
|
MultilingualG2PDecoder.mlmodelc/coremldata.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fb5b5003066a66bde1b5bff980e3267453910b04f96ca7352c0adc996ae7df8f
|
| 3 |
+
size 507
|
MultilingualG2PDecoder.mlmodelc/metadata.json
ADDED
|
@@ -0,0 +1,113 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"metadataOutputVersion" : "3.0",
|
| 4 |
+
"storagePrecision" : "Float32",
|
| 5 |
+
"outputSchema" : [
|
| 6 |
+
{
|
| 7 |
+
"hasShapeFlexibility" : "0",
|
| 8 |
+
"isOptional" : "0",
|
| 9 |
+
"dataType" : "Float32",
|
| 10 |
+
"formattedType" : "MultiArray (Float32)",
|
| 11 |
+
"shortDescription" : "",
|
| 12 |
+
"shape" : "[]",
|
| 13 |
+
"name" : "logits",
|
| 14 |
+
"type" : "MultiArray"
|
| 15 |
+
}
|
| 16 |
+
],
|
| 17 |
+
"modelParameters" : [
|
| 18 |
+
|
| 19 |
+
],
|
| 20 |
+
"specificationVersion" : 8,
|
| 21 |
+
"mlProgramOperationTypeHistogram" : {
|
| 22 |
+
"Range1d" : 2,
|
| 23 |
+
"Fill" : 2,
|
| 24 |
+
"Ios17.reshape" : 32,
|
| 25 |
+
"Ios16.reduceMean" : 13,
|
| 26 |
+
"Ios16.softmax" : 8,
|
| 27 |
+
"Ios17.matmul" : 16,
|
| 28 |
+
"Ios17.transpose" : 33,
|
| 29 |
+
"Select" : 3,
|
| 30 |
+
"Ios17.expandDims" : 11,
|
| 31 |
+
"Ios17.add" : 38,
|
| 32 |
+
"Tile" : 1,
|
| 33 |
+
"Ios17.lessEqual" : 1,
|
| 34 |
+
"Ios16.fillLike" : 1,
|
| 35 |
+
"Shape" : 4,
|
| 36 |
+
"Ios17.gather" : 6,
|
| 37 |
+
"Ios17.log" : 1,
|
| 38 |
+
"Ios17.cast" : 4,
|
| 39 |
+
"Ios17.sub" : 4,
|
| 40 |
+
"Ios17.pow" : 13,
|
| 41 |
+
"Ios17.less" : 1,
|
| 42 |
+
"Ios16.gelu" : 4,
|
| 43 |
+
"Ios17.linear" : 45,
|
| 44 |
+
"Ios17.concat" : 3,
|
| 45 |
+
"Ios17.greaterEqual" : 2,
|
| 46 |
+
"Ios17.minimum" : 2,
|
| 47 |
+
"Ios17.rsqrt" : 13,
|
| 48 |
+
"Ios17.mul" : 37
|
| 49 |
+
},
|
| 50 |
+
"computePrecision" : "Mixed (Float32, Int32)",
|
| 51 |
+
"isUpdatable" : "0",
|
| 52 |
+
"stateSchema" : [
|
| 53 |
+
|
| 54 |
+
],
|
| 55 |
+
"availability" : {
|
| 56 |
+
"macOS" : "14.0",
|
| 57 |
+
"tvOS" : "17.0",
|
| 58 |
+
"visionOS" : "1.0",
|
| 59 |
+
"watchOS" : "10.0",
|
| 60 |
+
"iOS" : "17.0",
|
| 61 |
+
"macCatalyst" : "17.0"
|
| 62 |
+
},
|
| 63 |
+
"modelType" : {
|
| 64 |
+
"name" : "MLModelType_mlProgram"
|
| 65 |
+
},
|
| 66 |
+
"userDefinedMetadata" : {
|
| 67 |
+
"com.github.apple.coremltools.conversion_date" : "2026-03-13",
|
| 68 |
+
"com.github.apple.coremltools.source" : "torch==2.7.0",
|
| 69 |
+
"com.github.apple.coremltools.version" : "9.0",
|
| 70 |
+
"com.github.apple.coremltools.source_dialect" : "TorchScript"
|
| 71 |
+
},
|
| 72 |
+
"inputSchema" : [
|
| 73 |
+
{
|
| 74 |
+
"dataType" : "Int32",
|
| 75 |
+
"hasShapeFlexibility" : "1",
|
| 76 |
+
"isOptional" : "0",
|
| 77 |
+
"shapeFlexibility" : "1 × 1...128",
|
| 78 |
+
"shapeRange" : "[[1, 1], [1, 128]]",
|
| 79 |
+
"formattedType" : "MultiArray (Int32 1 × 8)",
|
| 80 |
+
"type" : "MultiArray",
|
| 81 |
+
"shape" : "[1, 8]",
|
| 82 |
+
"name" : "decoder_input_ids",
|
| 83 |
+
"shortDescription" : ""
|
| 84 |
+
},
|
| 85 |
+
{
|
| 86 |
+
"dataType" : "Float32",
|
| 87 |
+
"hasShapeFlexibility" : "1",
|
| 88 |
+
"isOptional" : "0",
|
| 89 |
+
"shapeFlexibility" : "1 × 1...64 × 256",
|
| 90 |
+
"shapeRange" : "[[1, 1], [1, 64], [256, 256]]",
|
| 91 |
+
"formattedType" : "MultiArray (Float32 1 × 16 × 256)",
|
| 92 |
+
"type" : "MultiArray",
|
| 93 |
+
"shape" : "[1, 16, 256]",
|
| 94 |
+
"name" : "encoder_hidden_states",
|
| 95 |
+
"shortDescription" : ""
|
| 96 |
+
},
|
| 97 |
+
{
|
| 98 |
+
"dataType" : "Int32",
|
| 99 |
+
"hasShapeFlexibility" : "1",
|
| 100 |
+
"isOptional" : "0",
|
| 101 |
+
"shapeFlexibility" : "1 × 1...64",
|
| 102 |
+
"shapeRange" : "[[1, 1], [1, 64]]",
|
| 103 |
+
"formattedType" : "MultiArray (Int32 1 × 16)",
|
| 104 |
+
"type" : "MultiArray",
|
| 105 |
+
"shape" : "[1, 16]",
|
| 106 |
+
"name" : "encoder_attention_mask",
|
| 107 |
+
"shortDescription" : ""
|
| 108 |
+
}
|
| 109 |
+
],
|
| 110 |
+
"generatedClassName" : "G2PDecoder",
|
| 111 |
+
"method" : "predict"
|
| 112 |
+
}
|
| 113 |
+
]
|
MultilingualG2PDecoder.mlmodelc/model.mil
ADDED
|
@@ -0,0 +1,603 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
program(1.0)
|
| 2 |
+
[buildInfo = dict<tensor<string, []>, tensor<string, []>>({{"coremlc-component-MIL", "3510.2.1"}, {"coremlc-version", "3500.32.1"}, {"coremltools-component-torch", "2.7.0"}, {"coremltools-source-dialect", "TorchScript"}, {"coremltools-version", "9.0"}})]
|
| 3 |
+
{
|
| 4 |
+
func main<ios17>(tensor<int32, [1, ?]> decoder_input_ids, tensor<int32, [1, ?]> encoder_attention_mask, tensor<fp32, [1, ?, 256]> encoder_hidden_states) [FlexibleShapeInformation = tuple<tuple<tensor<string, []>, dict<tensor<string, []>, tensor<int32, [?]>>>, tuple<tensor<string, []>, dict<tensor<string, []>, list<tensor<int32, [2]>, ?>>>>((("DefaultShapes", {{"decoder_input_ids", [1, 8]}, {"encoder_attention_mask", [1, 16]}, {"encoder_hidden_states", [1, 16, 256]}}), ("RangeDims", {{"decoder_input_ids", [[1, 1], [1, 128]]}, {"encoder_attention_mask", [[1, 1], [1, 64]]}, {"encoder_hidden_states", [[1, 1], [1, 64], [256, 256]]}})))] {
|
| 5 |
+
tensor<fp32, [384, 256]> decoder_embed_tokens_weight = const()[name = tensor<string, []>("decoder_embed_tokens_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(64)))];
|
| 6 |
+
tensor<fp32, [256]> decoder_block_0_layer_0_layer_norm_weight = const()[name = tensor<string, []>("decoder_block_0_layer_0_layer_norm_weight"), val = tensor<fp32, [256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(393344)))];
|
| 7 |
+
tensor<fp32, [384, 256]> decoder_block_0_layer_0_SelfAttention_q_weight = const()[name = tensor<string, []>("decoder_block_0_layer_0_SelfAttention_q_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(394432)))];
|
| 8 |
+
tensor<fp32, [384, 256]> decoder_block_0_layer_0_SelfAttention_k_weight = const()[name = tensor<string, []>("decoder_block_0_layer_0_SelfAttention_k_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(787712)))];
|
| 9 |
+
tensor<fp32, [384, 256]> decoder_block_0_layer_0_SelfAttention_v_weight = const()[name = tensor<string, []>("decoder_block_0_layer_0_SelfAttention_v_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(1180992)))];
|
| 10 |
+
tensor<fp32, [32, 6]> decoder_block_0_layer_0_SelfAttention_relative_attention_bias_weight = const()[name = tensor<string, []>("decoder_block_0_layer_0_SelfAttention_relative_attention_bias_weight"), val = tensor<fp32, [32, 6]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(1574272)))];
|
| 11 |
+
tensor<fp32, [256, 384]> decoder_block_0_layer_0_SelfAttention_o_weight = const()[name = tensor<string, []>("decoder_block_0_layer_0_SelfAttention_o_weight"), val = tensor<fp32, [256, 384]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(1575104)))];
|
| 12 |
+
tensor<fp32, [256]> decoder_block_0_layer_1_layer_norm_weight = const()[name = tensor<string, []>("decoder_block_0_layer_1_layer_norm_weight"), val = tensor<fp32, [256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(1968384)))];
|
| 13 |
+
tensor<fp32, [384, 256]> decoder_block_0_layer_1_EncDecAttention_q_weight = const()[name = tensor<string, []>("decoder_block_0_layer_1_EncDecAttention_q_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(1969472)))];
|
| 14 |
+
tensor<fp32, [384, 256]> decoder_block_0_layer_1_EncDecAttention_k_weight = const()[name = tensor<string, []>("decoder_block_0_layer_1_EncDecAttention_k_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(2362752)))];
|
| 15 |
+
tensor<fp32, [384, 256]> decoder_block_0_layer_1_EncDecAttention_v_weight = const()[name = tensor<string, []>("decoder_block_0_layer_1_EncDecAttention_v_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(2756032)))];
|
| 16 |
+
tensor<fp32, [256, 384]> decoder_block_0_layer_1_EncDecAttention_o_weight = const()[name = tensor<string, []>("decoder_block_0_layer_1_EncDecAttention_o_weight"), val = tensor<fp32, [256, 384]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(3149312)))];
|
| 17 |
+
tensor<fp32, [256]> decoder_block_0_layer_2_layer_norm_weight = const()[name = tensor<string, []>("decoder_block_0_layer_2_layer_norm_weight"), val = tensor<fp32, [256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(3542592)))];
|
| 18 |
+
tensor<fp32, [1024, 256]> decoder_block_0_layer_2_DenseReluDense_wi_0_weight = const()[name = tensor<string, []>("decoder_block_0_layer_2_DenseReluDense_wi_0_weight"), val = tensor<fp32, [1024, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(3543680)))];
|
| 19 |
+
tensor<fp32, [1024, 256]> decoder_block_0_layer_2_DenseReluDense_wi_1_weight = const()[name = tensor<string, []>("decoder_block_0_layer_2_DenseReluDense_wi_1_weight"), val = tensor<fp32, [1024, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(4592320)))];
|
| 20 |
+
tensor<fp32, [256, 1024]> decoder_block_0_layer_2_DenseReluDense_wo_weight = const()[name = tensor<string, []>("decoder_block_0_layer_2_DenseReluDense_wo_weight"), val = tensor<fp32, [256, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(5640960)))];
|
| 21 |
+
tensor<fp32, [256]> decoder_block_1_layer_0_layer_norm_weight = const()[name = tensor<string, []>("decoder_block_1_layer_0_layer_norm_weight"), val = tensor<fp32, [256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(6689600)))];
|
| 22 |
+
tensor<fp32, [384, 256]> decoder_block_1_layer_0_SelfAttention_q_weight = const()[name = tensor<string, []>("decoder_block_1_layer_0_SelfAttention_q_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(6690688)))];
|
| 23 |
+
tensor<fp32, [384, 256]> decoder_block_1_layer_0_SelfAttention_k_weight = const()[name = tensor<string, []>("decoder_block_1_layer_0_SelfAttention_k_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(7083968)))];
|
| 24 |
+
tensor<fp32, [384, 256]> decoder_block_1_layer_0_SelfAttention_v_weight = const()[name = tensor<string, []>("decoder_block_1_layer_0_SelfAttention_v_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(7477248)))];
|
| 25 |
+
tensor<fp32, [256, 384]> decoder_block_1_layer_0_SelfAttention_o_weight = const()[name = tensor<string, []>("decoder_block_1_layer_0_SelfAttention_o_weight"), val = tensor<fp32, [256, 384]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(7870528)))];
|
| 26 |
+
tensor<fp32, [256]> decoder_block_1_layer_1_layer_norm_weight = const()[name = tensor<string, []>("decoder_block_1_layer_1_layer_norm_weight"), val = tensor<fp32, [256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(8263808)))];
|
| 27 |
+
tensor<fp32, [384, 256]> decoder_block_1_layer_1_EncDecAttention_q_weight = const()[name = tensor<string, []>("decoder_block_1_layer_1_EncDecAttention_q_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(8264896)))];
|
| 28 |
+
tensor<fp32, [384, 256]> decoder_block_1_layer_1_EncDecAttention_k_weight = const()[name = tensor<string, []>("decoder_block_1_layer_1_EncDecAttention_k_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(8658176)))];
|
| 29 |
+
tensor<fp32, [384, 256]> decoder_block_1_layer_1_EncDecAttention_v_weight = const()[name = tensor<string, []>("decoder_block_1_layer_1_EncDecAttention_v_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(9051456)))];
|
| 30 |
+
tensor<fp32, [256, 384]> decoder_block_1_layer_1_EncDecAttention_o_weight = const()[name = tensor<string, []>("decoder_block_1_layer_1_EncDecAttention_o_weight"), val = tensor<fp32, [256, 384]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(9444736)))];
|
| 31 |
+
tensor<fp32, [256]> decoder_block_1_layer_2_layer_norm_weight = const()[name = tensor<string, []>("decoder_block_1_layer_2_layer_norm_weight"), val = tensor<fp32, [256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(9838016)))];
|
| 32 |
+
tensor<fp32, [1024, 256]> decoder_block_1_layer_2_DenseReluDense_wi_0_weight = const()[name = tensor<string, []>("decoder_block_1_layer_2_DenseReluDense_wi_0_weight"), val = tensor<fp32, [1024, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(9839104)))];
|
| 33 |
+
tensor<fp32, [1024, 256]> decoder_block_1_layer_2_DenseReluDense_wi_1_weight = const()[name = tensor<string, []>("decoder_block_1_layer_2_DenseReluDense_wi_1_weight"), val = tensor<fp32, [1024, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(10887744)))];
|
| 34 |
+
tensor<fp32, [256, 1024]> decoder_block_1_layer_2_DenseReluDense_wo_weight = const()[name = tensor<string, []>("decoder_block_1_layer_2_DenseReluDense_wo_weight"), val = tensor<fp32, [256, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(11936384)))];
|
| 35 |
+
tensor<fp32, [256]> decoder_block_2_layer_0_layer_norm_weight = const()[name = tensor<string, []>("decoder_block_2_layer_0_layer_norm_weight"), val = tensor<fp32, [256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(12985024)))];
|
| 36 |
+
tensor<fp32, [384, 256]> decoder_block_2_layer_0_SelfAttention_q_weight = const()[name = tensor<string, []>("decoder_block_2_layer_0_SelfAttention_q_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(12986112)))];
|
| 37 |
+
tensor<fp32, [384, 256]> decoder_block_2_layer_0_SelfAttention_k_weight = const()[name = tensor<string, []>("decoder_block_2_layer_0_SelfAttention_k_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(13379392)))];
|
| 38 |
+
tensor<fp32, [384, 256]> decoder_block_2_layer_0_SelfAttention_v_weight = const()[name = tensor<string, []>("decoder_block_2_layer_0_SelfAttention_v_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(13772672)))];
|
| 39 |
+
tensor<fp32, [256, 384]> decoder_block_2_layer_0_SelfAttention_o_weight = const()[name = tensor<string, []>("decoder_block_2_layer_0_SelfAttention_o_weight"), val = tensor<fp32, [256, 384]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(14165952)))];
|
| 40 |
+
tensor<fp32, [256]> decoder_block_2_layer_1_layer_norm_weight = const()[name = tensor<string, []>("decoder_block_2_layer_1_layer_norm_weight"), val = tensor<fp32, [256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(14559232)))];
|
| 41 |
+
tensor<fp32, [384, 256]> decoder_block_2_layer_1_EncDecAttention_q_weight = const()[name = tensor<string, []>("decoder_block_2_layer_1_EncDecAttention_q_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(14560320)))];
|
| 42 |
+
tensor<fp32, [384, 256]> decoder_block_2_layer_1_EncDecAttention_k_weight = const()[name = tensor<string, []>("decoder_block_2_layer_1_EncDecAttention_k_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(14953600)))];
|
| 43 |
+
tensor<fp32, [384, 256]> decoder_block_2_layer_1_EncDecAttention_v_weight = const()[name = tensor<string, []>("decoder_block_2_layer_1_EncDecAttention_v_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(15346880)))];
|
| 44 |
+
tensor<fp32, [256, 384]> decoder_block_2_layer_1_EncDecAttention_o_weight = const()[name = tensor<string, []>("decoder_block_2_layer_1_EncDecAttention_o_weight"), val = tensor<fp32, [256, 384]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(15740160)))];
|
| 45 |
+
tensor<fp32, [256]> decoder_block_2_layer_2_layer_norm_weight = const()[name = tensor<string, []>("decoder_block_2_layer_2_layer_norm_weight"), val = tensor<fp32, [256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(16133440)))];
|
| 46 |
+
tensor<fp32, [1024, 256]> decoder_block_2_layer_2_DenseReluDense_wi_0_weight = const()[name = tensor<string, []>("decoder_block_2_layer_2_DenseReluDense_wi_0_weight"), val = tensor<fp32, [1024, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(16134528)))];
|
| 47 |
+
tensor<fp32, [1024, 256]> decoder_block_2_layer_2_DenseReluDense_wi_1_weight = const()[name = tensor<string, []>("decoder_block_2_layer_2_DenseReluDense_wi_1_weight"), val = tensor<fp32, [1024, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(17183168)))];
|
| 48 |
+
tensor<fp32, [256, 1024]> decoder_block_2_layer_2_DenseReluDense_wo_weight = const()[name = tensor<string, []>("decoder_block_2_layer_2_DenseReluDense_wo_weight"), val = tensor<fp32, [256, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(18231808)))];
|
| 49 |
+
tensor<fp32, [256]> decoder_block_3_layer_0_layer_norm_weight = const()[name = tensor<string, []>("decoder_block_3_layer_0_layer_norm_weight"), val = tensor<fp32, [256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(19280448)))];
|
| 50 |
+
tensor<fp32, [384, 256]> decoder_block_3_layer_0_SelfAttention_q_weight = const()[name = tensor<string, []>("decoder_block_3_layer_0_SelfAttention_q_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(19281536)))];
|
| 51 |
+
tensor<fp32, [384, 256]> decoder_block_3_layer_0_SelfAttention_k_weight = const()[name = tensor<string, []>("decoder_block_3_layer_0_SelfAttention_k_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(19674816)))];
|
| 52 |
+
tensor<fp32, [384, 256]> decoder_block_3_layer_0_SelfAttention_v_weight = const()[name = tensor<string, []>("decoder_block_3_layer_0_SelfAttention_v_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(20068096)))];
|
| 53 |
+
tensor<fp32, [256, 384]> decoder_block_3_layer_0_SelfAttention_o_weight = const()[name = tensor<string, []>("decoder_block_3_layer_0_SelfAttention_o_weight"), val = tensor<fp32, [256, 384]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(20461376)))];
|
| 54 |
+
tensor<fp32, [256]> decoder_block_3_layer_1_layer_norm_weight = const()[name = tensor<string, []>("decoder_block_3_layer_1_layer_norm_weight"), val = tensor<fp32, [256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(20854656)))];
|
| 55 |
+
tensor<fp32, [384, 256]> decoder_block_3_layer_1_EncDecAttention_q_weight = const()[name = tensor<string, []>("decoder_block_3_layer_1_EncDecAttention_q_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(20855744)))];
|
| 56 |
+
tensor<fp32, [384, 256]> decoder_block_3_layer_1_EncDecAttention_k_weight = const()[name = tensor<string, []>("decoder_block_3_layer_1_EncDecAttention_k_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(21249024)))];
|
| 57 |
+
tensor<fp32, [384, 256]> decoder_block_3_layer_1_EncDecAttention_v_weight = const()[name = tensor<string, []>("decoder_block_3_layer_1_EncDecAttention_v_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(21642304)))];
|
| 58 |
+
tensor<fp32, [256, 384]> decoder_block_3_layer_1_EncDecAttention_o_weight = const()[name = tensor<string, []>("decoder_block_3_layer_1_EncDecAttention_o_weight"), val = tensor<fp32, [256, 384]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(22035584)))];
|
| 59 |
+
tensor<fp32, [256]> decoder_block_3_layer_2_layer_norm_weight = const()[name = tensor<string, []>("decoder_block_3_layer_2_layer_norm_weight"), val = tensor<fp32, [256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(22428864)))];
|
| 60 |
+
tensor<fp32, [1024, 256]> decoder_block_3_layer_2_DenseReluDense_wi_0_weight = const()[name = tensor<string, []>("decoder_block_3_layer_2_DenseReluDense_wi_0_weight"), val = tensor<fp32, [1024, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(22429952)))];
|
| 61 |
+
tensor<fp32, [1024, 256]> decoder_block_3_layer_2_DenseReluDense_wi_1_weight = const()[name = tensor<string, []>("decoder_block_3_layer_2_DenseReluDense_wi_1_weight"), val = tensor<fp32, [1024, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(23478592)))];
|
| 62 |
+
tensor<fp32, [256, 1024]> decoder_block_3_layer_2_DenseReluDense_wo_weight = const()[name = tensor<string, []>("decoder_block_3_layer_2_DenseReluDense_wo_weight"), val = tensor<fp32, [256, 1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(24527232)))];
|
| 63 |
+
tensor<fp32, [256]> decoder_final_layer_norm_weight = const()[name = tensor<string, []>("decoder_final_layer_norm_weight"), val = tensor<fp32, [256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(25575872)))];
|
| 64 |
+
tensor<fp32, [384, 256]> lm_head_weight = const()[name = tensor<string, []>("lm_head_weight"), val = tensor<fp32, [384, 256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(25576960)))];
|
| 65 |
+
tensor<int32, []> var_8 = const()[name = tensor<string, []>("op_8"), val = tensor<int32, []>(16)];
|
| 66 |
+
tensor<fp32, []> var_14 = const()[name = tensor<string, []>("op_14"), val = tensor<fp32, []>(0x1p+0)];
|
| 67 |
+
tensor<int32, []> var_16 = const()[name = tensor<string, []>("op_16"), val = tensor<int32, []>(6)];
|
| 68 |
+
tensor<int32, []> var_22 = const()[name = tensor<string, []>("op_22"), val = tensor<int32, []>(-1)];
|
| 69 |
+
tensor<int32, []> var_23 = const()[name = tensor<string, []>("op_23"), val = tensor<int32, []>(1)];
|
| 70 |
+
tensor<int32, [2]> var_35_shape = shape(x = decoder_input_ids)[name = tensor<string, []>("op_35_shape")];
|
| 71 |
+
tensor<int32, []> gather_0 = const()[name = tensor<string, []>("gather_0"), val = tensor<int32, []>(1)];
|
| 72 |
+
tensor<int32, []> gather_1_batch_dims_0 = const()[name = tensor<string, []>("gather_1_batch_dims_0"), val = tensor<int32, []>(0)];
|
| 73 |
+
tensor<bool, []> gather_1_validate_indices_0 = const()[name = tensor<string, []>("gather_1_validate_indices_0"), val = tensor<bool, []>(false)];
|
| 74 |
+
tensor<int32, []> select_0 = const()[name = tensor<string, []>("select_0"), val = tensor<int32, []>(1)];
|
| 75 |
+
tensor<int32, []> gather_1_axis_1 = const()[name = tensor<string, []>("gather_1_axis_1"), val = tensor<int32, []>(0)];
|
| 76 |
+
tensor<int32, []> gather_1 = gather(axis = gather_1_axis_1, batch_dims = gather_1_batch_dims_0, indices = select_0, validate_indices = gather_1_validate_indices_0, x = var_35_shape)[name = tensor<string, []>("gather_1")];
|
| 77 |
+
tensor<int32, []> input_3_batch_dims_0 = const()[name = tensor<string, []>("input_3_batch_dims_0"), val = tensor<int32, []>(0)];
|
| 78 |
+
tensor<bool, []> input_3_validate_indices_0 = const()[name = tensor<string, []>("input_3_validate_indices_0"), val = tensor<bool, []>(false)];
|
| 79 |
+
tensor<int32, []> greater_equal_1_y_0 = const()[name = tensor<string, []>("greater_equal_1_y_0"), val = tensor<int32, []>(0)];
|
| 80 |
+
tensor<bool, [1, ?]> greater_equal_1 = greater_equal(x = decoder_input_ids, y = greater_equal_1_y_0)[name = tensor<string, []>("greater_equal_1")];
|
| 81 |
+
tensor<int32, []> slice_by_index_1 = const()[name = tensor<string, []>("slice_by_index_1"), val = tensor<int32, []>(384)];
|
| 82 |
+
tensor<int32, [1, ?]> add_1 = add(x = decoder_input_ids, y = slice_by_index_1)[name = tensor<string, []>("add_1")];
|
| 83 |
+
tensor<int32, [1, ?]> select_1 = select(a = decoder_input_ids, b = add_1, cond = greater_equal_1)[name = tensor<string, []>("select_1")];
|
| 84 |
+
tensor<int32, []> input_3_axis_1 = const()[name = tensor<string, []>("input_3_axis_1"), val = tensor<int32, []>(0)];
|
| 85 |
+
tensor<fp32, [1, ?, 256]> input_3 = gather(axis = input_3_axis_1, batch_dims = input_3_batch_dims_0, indices = select_1, validate_indices = input_3_validate_indices_0, x = decoder_embed_tokens_weight)[name = tensor<string, []>("input_3")];
|
| 86 |
+
tensor<int32, []> concat_1_axis_0 = const()[name = tensor<string, []>("concat_1_axis_0"), val = tensor<int32, []>(0)];
|
| 87 |
+
tensor<bool, []> concat_1_interleave_0 = const()[name = tensor<string, []>("concat_1_interleave_0"), val = tensor<bool, []>(false)];
|
| 88 |
+
tensor<int32, [2]> concat_1 = concat(axis = concat_1_axis_0, interleave = concat_1_interleave_0, values = (gather_0, gather_1))[name = tensor<string, []>("concat_1")];
|
| 89 |
+
tensor<fp32, []> fill_0_value_0 = const()[name = tensor<string, []>("fill_0_value_0"), val = tensor<fp32, []>(0x1p+0)];
|
| 90 |
+
tensor<fp32, [1, ?]> fill_0 = fill(shape = concat_1, value = fill_0_value_0)[name = tensor<string, []>("fill_0")];
|
| 91 |
+
tensor<int32, []> const_0 = const()[name = tensor<string, []>("const_0"), val = tensor<int32, []>(0)];
|
| 92 |
+
tensor<int32, []> const_1 = const()[name = tensor<string, []>("const_1"), val = tensor<int32, []>(1)];
|
| 93 |
+
tensor<int32, [?]> seq_ids = range_1d(end = gather_1, start = const_0, step = const_1)[name = tensor<string, []>("seq_ids")];
|
| 94 |
+
tensor<int32, [1]> var_44_axes_0 = const()[name = tensor<string, []>("op_44_axes_0"), val = tensor<int32, [1]>([0])];
|
| 95 |
+
tensor<int32, [1, ?]> var_44 = expand_dims(axes = var_44_axes_0, x = seq_ids)[name = tensor<string, []>("op_44")];
|
| 96 |
+
tensor<int32, [1]> var_45_axes_0 = const()[name = tensor<string, []>("op_45_axes_0"), val = tensor<int32, [1]>([1])];
|
| 97 |
+
tensor<int32, [1, 1, ?]> var_45 = expand_dims(axes = var_45_axes_0, x = var_44)[name = tensor<string, []>("op_45")];
|
| 98 |
+
tensor<int32, []> concat_2_axis_0 = const()[name = tensor<string, []>("concat_2_axis_0"), val = tensor<int32, []>(0)];
|
| 99 |
+
tensor<bool, []> concat_2_interleave_0 = const()[name = tensor<string, []>("concat_2_interleave_0"), val = tensor<bool, []>(false)];
|
| 100 |
+
tensor<int32, [3]> concat_2 = concat(axis = concat_2_axis_0, interleave = concat_2_interleave_0, values = (gather_0, gather_1, var_23))[name = tensor<string, []>("concat_2")];
|
| 101 |
+
tensor<int32, [1, ?, ?]> var_48 = tile(reps = concat_2, x = var_45)[name = tensor<string, []>("op_48")];
|
| 102 |
+
tensor<int32, [1]> var_51_axes_0 = const()[name = tensor<string, []>("op_51_axes_0"), val = tensor<int32, [1]>([2])];
|
| 103 |
+
tensor<int32, [1, ?, 1]> var_51 = expand_dims(axes = var_51_axes_0, x = var_44)[name = tensor<string, []>("op_51")];
|
| 104 |
+
tensor<bool, [1, ?, ?]> causal_mask_1 = less_equal(x = var_48, y = var_51)[name = tensor<string, []>("causal_mask_1")];
|
| 105 |
+
tensor<string, []> causal_mask_dtype_0 = const()[name = tensor<string, []>("causal_mask_dtype_0"), val = tensor<string, []>("fp32")];
|
| 106 |
+
tensor<int32, [1]> var_55_axes_0 = const()[name = tensor<string, []>("op_55_axes_0"), val = tensor<int32, [1]>([1])];
|
| 107 |
+
tensor<fp32, [1, ?, ?]> causal_mask = cast(dtype = causal_mask_dtype_0, x = causal_mask_1)[name = tensor<string, []>("cast_42")];
|
| 108 |
+
tensor<fp32, [1, 1, ?, ?]> var_55 = expand_dims(axes = var_55_axes_0, x = causal_mask)[name = tensor<string, []>("op_55")];
|
| 109 |
+
tensor<int32, [1]> var_59_axes_0 = const()[name = tensor<string, []>("op_59_axes_0"), val = tensor<int32, [1]>([1])];
|
| 110 |
+
tensor<fp32, [1, 1, ?]> var_59 = expand_dims(axes = var_59_axes_0, x = fill_0)[name = tensor<string, []>("op_59")];
|
| 111 |
+
tensor<int32, [1]> var_60_axes_0 = const()[name = tensor<string, []>("op_60_axes_0"), val = tensor<int32, [1]>([2])];
|
| 112 |
+
tensor<fp32, [1, 1, 1, ?]> var_60 = expand_dims(axes = var_60_axes_0, x = var_59)[name = tensor<string, []>("op_60")];
|
| 113 |
+
tensor<fp32, [1, 1, ?, ?]> extended_attention_mask = mul(x = var_55, y = var_60)[name = tensor<string, []>("extended_attention_mask")];
|
| 114 |
+
tensor<fp32, [1, 1, ?, ?]> var_64 = sub(x = var_14, y = extended_attention_mask)[name = tensor<string, []>("op_64")];
|
| 115 |
+
tensor<fp32, []> var_65 = const()[name = tensor<string, []>("op_65"), val = tensor<fp32, []>(-0x1.fffffep+127)];
|
| 116 |
+
tensor<fp32, [1, 1, ?, ?]> mask_1 = mul(x = var_64, y = var_65)[name = tensor<string, []>("mask_1")];
|
| 117 |
+
tensor<int32, [1]> var_68_axes_0 = const()[name = tensor<string, []>("op_68_axes_0"), val = tensor<int32, [1]>([1])];
|
| 118 |
+
tensor<int32, [1, 1, ?]> var_68 = expand_dims(axes = var_68_axes_0, x = encoder_attention_mask)[name = tensor<string, []>("op_68")];
|
| 119 |
+
tensor<int32, [1]> var_69_axes_0 = const()[name = tensor<string, []>("op_69_axes_0"), val = tensor<int32, [1]>([2])];
|
| 120 |
+
tensor<int32, [1, 1, 1, ?]> var_69 = expand_dims(axes = var_69_axes_0, x = var_68)[name = tensor<string, []>("op_69")];
|
| 121 |
+
tensor<string, []> var_71_dtype_0 = const()[name = tensor<string, []>("op_71_dtype_0"), val = tensor<string, []>("fp32")];
|
| 122 |
+
tensor<fp32, [1, 1, 1, ?]> var_71 = cast(dtype = var_71_dtype_0, x = var_69)[name = tensor<string, []>("cast_41")];
|
| 123 |
+
tensor<fp32, [1, 1, 1, ?]> var_72 = sub(x = var_14, y = var_71)[name = tensor<string, []>("op_72")];
|
| 124 |
+
tensor<fp32, []> var_73 = const()[name = tensor<string, []>("op_73"), val = tensor<fp32, []>(-0x1.fffffep+127)];
|
| 125 |
+
tensor<fp32, [1, 1, 1, ?]> mask = mul(x = var_72, y = var_73)[name = tensor<string, []>("mask")];
|
| 126 |
+
tensor<fp32, []> var_18_promoted = const()[name = tensor<string, []>("op_18_promoted"), val = tensor<fp32, []>(0x1p+1)];
|
| 127 |
+
tensor<fp32, [1, ?, 256]> var_86 = pow(x = input_3, y = var_18_promoted)[name = tensor<string, []>("op_86")];
|
| 128 |
+
tensor<int32, [1]> variance_1_axes_0 = const()[name = tensor<string, []>("variance_1_axes_0"), val = tensor<int32, [1]>([-1])];
|
| 129 |
+
tensor<bool, []> variance_1_keep_dims_0 = const()[name = tensor<string, []>("variance_1_keep_dims_0"), val = tensor<bool, []>(true)];
|
| 130 |
+
tensor<fp32, [1, ?, 1]> variance_1 = reduce_mean(axes = variance_1_axes_0, keep_dims = variance_1_keep_dims_0, x = var_86)[name = tensor<string, []>("variance_1")];
|
| 131 |
+
tensor<fp32, []> var_89 = const()[name = tensor<string, []>("op_89"), val = tensor<fp32, []>(0x1.0c6f7ap-20)];
|
| 132 |
+
tensor<fp32, [1, ?, 1]> var_90 = add(x = variance_1, y = var_89)[name = tensor<string, []>("op_90")];
|
| 133 |
+
tensor<fp32, []> var_91_epsilon_0 = const()[name = tensor<string, []>("op_91_epsilon_0"), val = tensor<fp32, []>(0x1.197998p-40)];
|
| 134 |
+
tensor<fp32, [1, ?, 1]> var_91 = rsqrt(epsilon = var_91_epsilon_0, x = var_90)[name = tensor<string, []>("op_91")];
|
| 135 |
+
tensor<fp32, [1, ?, 256]> hidden_states_5 = mul(x = input_3, y = var_91)[name = tensor<string, []>("hidden_states_5")];
|
| 136 |
+
tensor<fp32, [1, ?, 256]> hidden_states_7 = mul(x = decoder_block_0_layer_0_layer_norm_weight, y = hidden_states_5)[name = tensor<string, []>("hidden_states_7")];
|
| 137 |
+
tensor<int32, [3]> var_103_shape = shape(x = hidden_states_7)[name = tensor<string, []>("op_103_shape")];
|
| 138 |
+
tensor<int32, []> gather_3_batch_dims_0 = const()[name = tensor<string, []>("gather_3_batch_dims_0"), val = tensor<int32, []>(0)];
|
| 139 |
+
tensor<bool, []> gather_3_validate_indices_0 = const()[name = tensor<string, []>("gather_3_validate_indices_0"), val = tensor<bool, []>(false)];
|
| 140 |
+
tensor<int32, []> select_2 = const()[name = tensor<string, []>("select_2"), val = tensor<int32, []>(1)];
|
| 141 |
+
tensor<int32, []> gather_3_axis_1 = const()[name = tensor<string, []>("gather_3_axis_1"), val = tensor<int32, []>(0)];
|
| 142 |
+
tensor<int32, []> gather_3 = gather(axis = gather_3_axis_1, batch_dims = gather_3_batch_dims_0, indices = select_2, validate_indices = gather_3_validate_indices_0, x = var_103_shape)[name = tensor<string, []>("gather_3")];
|
| 143 |
+
tensor<fp32, [384]> linear_0_bias_0 = const()[name = tensor<string, []>("linear_0_bias_0"), val = tensor<fp32, [384]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(25970240)))];
|
| 144 |
+
tensor<fp32, [1, ?, 384]> states_1 = linear(bias = linear_0_bias_0, weight = decoder_block_0_layer_0_SelfAttention_q_weight, x = hidden_states_7)[name = tensor<string, []>("linear_0")];
|
| 145 |
+
tensor<int32, [4]> var_106 = const()[name = tensor<string, []>("op_106"), val = tensor<int32, [4]>([1, -1, 6, 64])];
|
| 146 |
+
tensor<fp32, [1, ?, 6, 64]> var_107 = reshape(shape = var_106, x = states_1)[name = tensor<string, []>("op_107")];
|
| 147 |
+
tensor<fp32, [1, ?, 384]> states_3 = linear(bias = linear_0_bias_0, weight = decoder_block_0_layer_0_SelfAttention_k_weight, x = hidden_states_7)[name = tensor<string, []>("linear_1")];
|
| 148 |
+
tensor<int32, [4]> var_111 = const()[name = tensor<string, []>("op_111"), val = tensor<int32, [4]>([1, -1, 6, 64])];
|
| 149 |
+
tensor<fp32, [1, ?, 6, 64]> var_112 = reshape(shape = var_111, x = states_3)[name = tensor<string, []>("op_112")];
|
| 150 |
+
tensor<fp32, [1, ?, 384]> states_5 = linear(bias = linear_0_bias_0, weight = decoder_block_0_layer_0_SelfAttention_v_weight, x = hidden_states_7)[name = tensor<string, []>("linear_2")];
|
| 151 |
+
tensor<int32, [4]> var_116 = const()[name = tensor<string, []>("op_116"), val = tensor<int32, [4]>([1, -1, 6, 64])];
|
| 152 |
+
tensor<fp32, [1, ?, 6, 64]> var_117 = reshape(shape = var_116, x = states_5)[name = tensor<string, []>("op_117")];
|
| 153 |
+
tensor<int32, [4]> value_states_1_perm_0 = const()[name = tensor<string, []>("value_states_1_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])];
|
| 154 |
+
tensor<bool, []> scores_1_transpose_x_0 = const()[name = tensor<string, []>("scores_1_transpose_x_0"), val = tensor<bool, []>(false)];
|
| 155 |
+
tensor<bool, []> scores_1_transpose_y_0 = const()[name = tensor<string, []>("scores_1_transpose_y_0"), val = tensor<bool, []>(false)];
|
| 156 |
+
tensor<int32, [4]> transpose_24_perm_0 = const()[name = tensor<string, []>("transpose_24_perm_0"), val = tensor<int32, [4]>([0, 2, -3, -1])];
|
| 157 |
+
tensor<int32, [4]> transpose_25_perm_0 = const()[name = tensor<string, []>("transpose_25_perm_0"), val = tensor<int32, [4]>([0, 2, -1, -3])];
|
| 158 |
+
tensor<fp32, [1, 6, 64, ?]> transpose_25 = transpose(perm = transpose_25_perm_0, x = var_112)[name = tensor<string, []>("transpose_70")];
|
| 159 |
+
tensor<fp32, [1, 6, ?, 64]> transpose_24 = transpose(perm = transpose_24_perm_0, x = var_107)[name = tensor<string, []>("transpose_71")];
|
| 160 |
+
tensor<fp32, [1, 6, ?, ?]> scores_1 = matmul(transpose_x = scores_1_transpose_x_0, transpose_y = scores_1_transpose_y_0, x = transpose_24, y = transpose_25)[name = tensor<string, []>("scores_1")];
|
| 161 |
+
tensor<int32, []> const_2 = const()[name = tensor<string, []>("const_2"), val = tensor<int32, []>(0)];
|
| 162 |
+
tensor<int32, []> const_3 = const()[name = tensor<string, []>("const_3"), val = tensor<int32, []>(1)];
|
| 163 |
+
tensor<int32, [?]> var_121 = range_1d(end = gather_3, start = const_2, step = const_3)[name = tensor<string, []>("op_121")];
|
| 164 |
+
tensor<int32, [1]> context_position_axes_0 = const()[name = tensor<string, []>("context_position_axes_0"), val = tensor<int32, [1]>([1])];
|
| 165 |
+
tensor<int32, [?, 1]> context_position = expand_dims(axes = context_position_axes_0, x = var_121)[name = tensor<string, []>("context_position")];
|
| 166 |
+
tensor<int32, [1]> var_125_axes_0 = const()[name = tensor<string, []>("op_125_axes_0"), val = tensor<int32, [1]>([0])];
|
| 167 |
+
tensor<int32, [1, ?]> var_125 = expand_dims(axes = var_125_axes_0, x = var_121)[name = tensor<string, []>("op_125")];
|
| 168 |
+
tensor<int32, [?, ?]> relative_position_1 = sub(x = var_125, y = context_position)[name = tensor<string, []>("relative_position_1")];
|
| 169 |
+
tensor<int32, [?, ?]> var_128 = sub(x = relative_position_1, y = relative_position_1)[name = tensor<string, []>("sub_0")];
|
| 170 |
+
tensor<int32, [?, ?]> var_129 = minimum(x = relative_position_1, y = var_128)[name = tensor<string, []>("op_129")];
|
| 171 |
+
tensor<int32, []> const_6 = const()[name = tensor<string, []>("const_6"), val = tensor<int32, []>(-1)];
|
| 172 |
+
tensor<int32, [?, ?]> relative_position = mul(x = var_129, y = const_6)[name = tensor<string, []>("relative_position")];
|
| 173 |
+
tensor<bool, [?, ?]> is_small = less(x = relative_position, y = var_8)[name = tensor<string, []>("is_small")];
|
| 174 |
+
tensor<string, []> var_132_dtype_0 = const()[name = tensor<string, []>("op_132_dtype_0"), val = tensor<string, []>("fp32")];
|
| 175 |
+
tensor<fp32, []> _inversed_134_y_0 = const()[name = tensor<string, []>("_inversed_134_y_0"), val = tensor<fp32, []>(0x1p-4)];
|
| 176 |
+
tensor<fp32, [?, ?]> var_132 = cast(dtype = var_132_dtype_0, x = relative_position)[name = tensor<string, []>("cast_40")];
|
| 177 |
+
tensor<fp32, [?, ?]> _inversed_134 = mul(x = var_132, y = _inversed_134_y_0)[name = tensor<string, []>("_inversed_134")];
|
| 178 |
+
tensor<fp32, []> var_135_epsilon_0 = const()[name = tensor<string, []>("op_135_epsilon_0"), val = tensor<fp32, []>(0x1p-149)];
|
| 179 |
+
tensor<fp32, [?, ?]> var_135 = log(epsilon = var_135_epsilon_0, x = _inversed_134)[name = tensor<string, []>("op_135")];
|
| 180 |
+
tensor<fp32, []> _inversed_137_y_0 = const()[name = tensor<string, []>("_inversed_137_y_0"), val = tensor<fp32, []>(0x1.ec709ep-2)];
|
| 181 |
+
tensor<fp32, [?, ?]> _inversed_137 = mul(x = var_135, y = _inversed_137_y_0)[name = tensor<string, []>("_inversed_137")];
|
| 182 |
+
tensor<fp32, []> var_138_promoted = const()[name = tensor<string, []>("op_138_promoted"), val = tensor<fp32, []>(0x1p+4)];
|
| 183 |
+
tensor<fp32, [?, ?]> var_139 = mul(x = _inversed_137, y = var_138_promoted)[name = tensor<string, []>("op_139")];
|
| 184 |
+
tensor<string, []> var_140_dtype_0 = const()[name = tensor<string, []>("op_140_dtype_0"), val = tensor<string, []>("int32")];
|
| 185 |
+
tensor<int32, []> var_141 = const()[name = tensor<string, []>("op_141"), val = tensor<int32, []>(16)];
|
| 186 |
+
tensor<int32, [?, ?]> var_140 = cast(dtype = var_140_dtype_0, x = var_139)[name = tensor<string, []>("cast_39")];
|
| 187 |
+
tensor<int32, [?, ?]> relative_position_if_large_1 = add(x = var_140, y = var_141)[name = tensor<string, []>("relative_position_if_large_1")];
|
| 188 |
+
tensor<int32, []> var_143_value_0 = const()[name = tensor<string, []>("op_143_value_0"), val = tensor<int32, []>(31)];
|
| 189 |
+
tensor<int32, [?, ?]> var_143 = fill_like(ref_tensor = relative_position_if_large_1, value = var_143_value_0)[name = tensor<string, []>("op_143")];
|
| 190 |
+
tensor<int32, [?, ?]> relative_position_if_large = minimum(x = relative_position_if_large_1, y = var_143)[name = tensor<string, []>("relative_position_if_large")];
|
| 191 |
+
tensor<int32, [?, ?]> var_145 = select(a = relative_position, b = relative_position_if_large, cond = is_small)[name = tensor<string, []>("op_145")];
|
| 192 |
+
tensor<int32, []> values_batch_dims_0 = const()[name = tensor<string, []>("values_batch_dims_0"), val = tensor<int32, []>(0)];
|
| 193 |
+
tensor<bool, []> values_validate_indices_0 = const()[name = tensor<string, []>("values_validate_indices_0"), val = tensor<bool, []>(false)];
|
| 194 |
+
tensor<int32, []> greater_equal_3_y_0 = const()[name = tensor<string, []>("greater_equal_3_y_0"), val = tensor<int32, []>(0)];
|
| 195 |
+
tensor<bool, [?, ?]> greater_equal_3 = greater_equal(x = var_145, y = greater_equal_3_y_0)[name = tensor<string, []>("greater_equal_3")];
|
| 196 |
+
tensor<int32, []> slice_by_index_3 = const()[name = tensor<string, []>("slice_by_index_3"), val = tensor<int32, []>(32)];
|
| 197 |
+
tensor<int32, [?, ?]> add_3 = add(x = var_145, y = slice_by_index_3)[name = tensor<string, []>("add_3")];
|
| 198 |
+
tensor<int32, [?, ?]> select_3 = select(a = var_145, b = add_3, cond = greater_equal_3)[name = tensor<string, []>("select_3")];
|
| 199 |
+
tensor<int32, []> values_axis_1 = const()[name = tensor<string, []>("values_axis_1"), val = tensor<int32, []>(0)];
|
| 200 |
+
tensor<fp32, [?, ?, 6]> values = gather(axis = values_axis_1, batch_dims = values_batch_dims_0, indices = select_3, validate_indices = values_validate_indices_0, x = decoder_block_0_layer_0_SelfAttention_relative_attention_bias_weight)[name = tensor<string, []>("values")];
|
| 201 |
+
tensor<int32, [3]> var_150 = const()[name = tensor<string, []>("op_150"), val = tensor<int32, [3]>([2, 0, 1])];
|
| 202 |
+
tensor<int32, [1]> position_bias_1_axes_0 = const()[name = tensor<string, []>("position_bias_1_axes_0"), val = tensor<int32, [1]>([0])];
|
| 203 |
+
tensor<fp32, [6, ?, ?]> var_151 = transpose(perm = var_150, x = values)[name = tensor<string, []>("transpose_69")];
|
| 204 |
+
tensor<fp32, [1, 6, ?, ?]> position_bias_1 = expand_dims(axes = position_bias_1_axes_0, x = var_151)[name = tensor<string, []>("position_bias_1")];
|
| 205 |
+
tensor<fp32, [1, 6, ?, ?]> position_bias_3 = add(x = position_bias_1, y = mask_1)[name = tensor<string, []>("position_bias_3")];
|
| 206 |
+
tensor<fp32, [1, 6, ?, ?]> scores_3 = add(x = scores_1, y = position_bias_3)[name = tensor<string, []>("scores_3")];
|
| 207 |
+
tensor<fp32, [1, 6, ?, ?]> var_156 = softmax(axis = var_22, x = scores_3)[name = tensor<string, []>("op_156")];
|
| 208 |
+
tensor<bool, []> states_7_transpose_x_0 = const()[name = tensor<string, []>("states_7_transpose_x_0"), val = tensor<bool, []>(false)];
|
| 209 |
+
tensor<bool, []> states_7_transpose_y_0 = const()[name = tensor<string, []>("states_7_transpose_y_0"), val = tensor<bool, []>(false)];
|
| 210 |
+
tensor<fp32, [1, 6, ?, 64]> value_states_1 = transpose(perm = value_states_1_perm_0, x = var_117)[name = tensor<string, []>("transpose_72")];
|
| 211 |
+
tensor<fp32, [1, 6, ?, 64]> states_7 = matmul(transpose_x = states_7_transpose_x_0, transpose_y = states_7_transpose_y_0, x = var_156, y = value_states_1)[name = tensor<string, []>("states_7")];
|
| 212 |
+
tensor<int32, [4]> var_160_perm_0 = const()[name = tensor<string, []>("op_160_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])];
|
| 213 |
+
tensor<int32, [3]> var_162 = const()[name = tensor<string, []>("op_162"), val = tensor<int32, [3]>([1, -1, 384])];
|
| 214 |
+
tensor<fp32, [1, ?, 6, 64]> var_160 = transpose(perm = var_160_perm_0, x = states_7)[name = tensor<string, []>("transpose_68")];
|
| 215 |
+
tensor<fp32, [1, ?, 384]> input_11 = reshape(shape = var_162, x = var_160)[name = tensor<string, []>("input_11")];
|
| 216 |
+
tensor<fp32, [256]> linear_3_bias_0 = const()[name = tensor<string, []>("linear_3_bias_0"), val = tensor<fp32, [256]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(25971840)))];
|
| 217 |
+
tensor<fp32, [1, ?, 256]> input_13 = linear(bias = linear_3_bias_0, weight = decoder_block_0_layer_0_SelfAttention_o_weight, x = input_11)[name = tensor<string, []>("linear_3")];
|
| 218 |
+
tensor<fp32, [1, ?, 256]> hidden_states_9 = add(x = input_3, y = input_13)[name = tensor<string, []>("hidden_states_9")];
|
| 219 |
+
tensor<fp32, []> var_18_promoted_1 = const()[name = tensor<string, []>("op_18_promoted_1"), val = tensor<fp32, []>(0x1p+1)];
|
| 220 |
+
tensor<fp32, [1, ?, 256]> var_180 = pow(x = hidden_states_9, y = var_18_promoted_1)[name = tensor<string, []>("op_180")];
|
| 221 |
+
tensor<int32, [1]> variance_3_axes_0 = const()[name = tensor<string, []>("variance_3_axes_0"), val = tensor<int32, [1]>([-1])];
|
| 222 |
+
tensor<bool, []> variance_3_keep_dims_0 = const()[name = tensor<string, []>("variance_3_keep_dims_0"), val = tensor<bool, []>(true)];
|
| 223 |
+
tensor<fp32, [1, ?, 1]> variance_3 = reduce_mean(axes = variance_3_axes_0, keep_dims = variance_3_keep_dims_0, x = var_180)[name = tensor<string, []>("variance_3")];
|
| 224 |
+
tensor<fp32, []> var_183 = const()[name = tensor<string, []>("op_183"), val = tensor<fp32, []>(0x1.0c6f7ap-20)];
|
| 225 |
+
tensor<fp32, [1, ?, 1]> var_184 = add(x = variance_3, y = var_183)[name = tensor<string, []>("op_184")];
|
| 226 |
+
tensor<fp32, []> var_185_epsilon_0 = const()[name = tensor<string, []>("op_185_epsilon_0"), val = tensor<fp32, []>(0x1.197998p-40)];
|
| 227 |
+
tensor<fp32, [1, ?, 1]> var_185 = rsqrt(epsilon = var_185_epsilon_0, x = var_184)[name = tensor<string, []>("op_185")];
|
| 228 |
+
tensor<fp32, [1, ?, 256]> hidden_states_13 = mul(x = hidden_states_9, y = var_185)[name = tensor<string, []>("hidden_states_13")];
|
| 229 |
+
tensor<fp32, [1, ?, 256]> hidden_states_15 = mul(x = decoder_block_0_layer_1_layer_norm_weight, y = hidden_states_13)[name = tensor<string, []>("hidden_states_15")];
|
| 230 |
+
tensor<int32, [3]> var_196_shape = shape(x = hidden_states_15)[name = tensor<string, []>("op_196_shape")];
|
| 231 |
+
tensor<int32, []> gather_5_batch_dims_0 = const()[name = tensor<string, []>("gather_5_batch_dims_0"), val = tensor<int32, []>(0)];
|
| 232 |
+
tensor<bool, []> gather_5_validate_indices_0 = const()[name = tensor<string, []>("gather_5_validate_indices_0"), val = tensor<bool, []>(false)];
|
| 233 |
+
tensor<int32, []> select_4 = const()[name = tensor<string, []>("select_4"), val = tensor<int32, []>(1)];
|
| 234 |
+
tensor<int32, []> gather_5_axis_1 = const()[name = tensor<string, []>("gather_5_axis_1"), val = tensor<int32, []>(0)];
|
| 235 |
+
tensor<int32, []> gather_5 = gather(axis = gather_5_axis_1, batch_dims = gather_5_batch_dims_0, indices = select_4, validate_indices = gather_5_validate_indices_0, x = var_196_shape)[name = tensor<string, []>("gather_5")];
|
| 236 |
+
tensor<int32, [3]> var_197_shape = shape(x = encoder_hidden_states)[name = tensor<string, []>("op_197_shape")];
|
| 237 |
+
tensor<int32, []> gather_6_batch_dims_0 = const()[name = tensor<string, []>("gather_6_batch_dims_0"), val = tensor<int32, []>(0)];
|
| 238 |
+
tensor<bool, []> gather_6_validate_indices_0 = const()[name = tensor<string, []>("gather_6_validate_indices_0"), val = tensor<bool, []>(false)];
|
| 239 |
+
tensor<int32, []> select_5 = const()[name = tensor<string, []>("select_5"), val = tensor<int32, []>(1)];
|
| 240 |
+
tensor<int32, []> gather_6_axis_1 = const()[name = tensor<string, []>("gather_6_axis_1"), val = tensor<int32, []>(0)];
|
| 241 |
+
tensor<int32, []> gather_6 = gather(axis = gather_6_axis_1, batch_dims = gather_6_batch_dims_0, indices = select_5, validate_indices = gather_6_validate_indices_0, x = var_197_shape)[name = tensor<string, []>("gather_6")];
|
| 242 |
+
tensor<fp32, [1, ?, 384]> states_9 = linear(bias = linear_0_bias_0, weight = decoder_block_0_layer_1_EncDecAttention_q_weight, x = hidden_states_15)[name = tensor<string, []>("linear_4")];
|
| 243 |
+
tensor<int32, [4]> var_200 = const()[name = tensor<string, []>("op_200"), val = tensor<int32, [4]>([1, -1, 6, 64])];
|
| 244 |
+
tensor<fp32, [1, ?, 6, 64]> var_201 = reshape(shape = var_200, x = states_9)[name = tensor<string, []>("op_201")];
|
| 245 |
+
tensor<fp32, [1, ?, 384]> states_11 = linear(bias = linear_0_bias_0, weight = decoder_block_0_layer_1_EncDecAttention_k_weight, x = encoder_hidden_states)[name = tensor<string, []>("linear_5")];
|
| 246 |
+
tensor<int32, [4]> var_205 = const()[name = tensor<string, []>("op_205"), val = tensor<int32, [4]>([1, -1, 6, 64])];
|
| 247 |
+
tensor<fp32, [1, ?, 6, 64]> var_206 = reshape(shape = var_205, x = states_11)[name = tensor<string, []>("op_206")];
|
| 248 |
+
tensor<fp32, [1, ?, 384]> states_13 = linear(bias = linear_0_bias_0, weight = decoder_block_0_layer_1_EncDecAttention_v_weight, x = encoder_hidden_states)[name = tensor<string, []>("linear_6")];
|
| 249 |
+
tensor<int32, [4]> var_210 = const()[name = tensor<string, []>("op_210"), val = tensor<int32, [4]>([1, -1, 6, 64])];
|
| 250 |
+
tensor<fp32, [1, ?, 6, 64]> var_211 = reshape(shape = var_210, x = states_13)[name = tensor<string, []>("op_211")];
|
| 251 |
+
tensor<int32, [4]> value_states_3_perm_0 = const()[name = tensor<string, []>("value_states_3_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])];
|
| 252 |
+
tensor<bool, []> scores_5_transpose_x_0 = const()[name = tensor<string, []>("scores_5_transpose_x_0"), val = tensor<bool, []>(false)];
|
| 253 |
+
tensor<bool, []> scores_5_transpose_y_0 = const()[name = tensor<string, []>("scores_5_transpose_y_0"), val = tensor<bool, []>(false)];
|
| 254 |
+
tensor<int32, [4]> transpose_26_perm_0 = const()[name = tensor<string, []>("transpose_26_perm_0"), val = tensor<int32, [4]>([0, 2, -3, -1])];
|
| 255 |
+
tensor<int32, [4]> transpose_27_perm_0 = const()[name = tensor<string, []>("transpose_27_perm_0"), val = tensor<int32, [4]>([0, 2, -1, -3])];
|
| 256 |
+
tensor<fp32, [1, 6, 64, ?]> transpose_27 = transpose(perm = transpose_27_perm_0, x = var_206)[name = tensor<string, []>("transpose_65")];
|
| 257 |
+
tensor<fp32, [1, 6, ?, 64]> transpose_26 = transpose(perm = transpose_26_perm_0, x = var_201)[name = tensor<string, []>("transpose_66")];
|
| 258 |
+
tensor<fp32, [1, 6, ?, ?]> scores_5 = matmul(transpose_x = scores_5_transpose_x_0, transpose_y = scores_5_transpose_y_0, x = transpose_26, y = transpose_27)[name = tensor<string, []>("scores_5")];
|
| 259 |
+
tensor<int32, []> concat_3_axis_0 = const()[name = tensor<string, []>("concat_3_axis_0"), val = tensor<int32, []>(0)];
|
| 260 |
+
tensor<bool, []> concat_3_interleave_0 = const()[name = tensor<string, []>("concat_3_interleave_0"), val = tensor<bool, []>(false)];
|
| 261 |
+
tensor<int32, [4]> concat_3 = concat(axis = concat_3_axis_0, interleave = concat_3_interleave_0, values = (var_23, var_16, gather_5, gather_6))[name = tensor<string, []>("concat_3")];
|
| 262 |
+
tensor<fp32, []> position_bias_5_value_0 = const()[name = tensor<string, []>("position_bias_5_value_0"), val = tensor<fp32, []>(0x0p+0)];
|
| 263 |
+
tensor<fp32, [1, 6, ?, ?]> position_bias_5 = fill(shape = concat_3, value = position_bias_5_value_0)[name = tensor<string, []>("position_bias_5")];
|
| 264 |
+
tensor<fp32, [1, 6, ?, ?]> position_bias = add(x = position_bias_5, y = mask)[name = tensor<string, []>("position_bias")];
|
| 265 |
+
tensor<fp32, [1, 6, ?, ?]> scores_7 = add(x = scores_5, y = position_bias)[name = tensor<string, []>("scores_7")];
|
| 266 |
+
tensor<fp32, [1, 6, ?, ?]> var_220 = softmax(axis = var_22, x = scores_7)[name = tensor<string, []>("op_220")];
|
| 267 |
+
tensor<bool, []> states_15_transpose_x_0 = const()[name = tensor<string, []>("states_15_transpose_x_0"), val = tensor<bool, []>(false)];
|
| 268 |
+
tensor<bool, []> states_15_transpose_y_0 = const()[name = tensor<string, []>("states_15_transpose_y_0"), val = tensor<bool, []>(false)];
|
| 269 |
+
tensor<fp32, [1, 6, ?, 64]> value_states_3 = transpose(perm = value_states_3_perm_0, x = var_211)[name = tensor<string, []>("transpose_67")];
|
| 270 |
+
tensor<fp32, [1, 6, ?, 64]> states_15 = matmul(transpose_x = states_15_transpose_x_0, transpose_y = states_15_transpose_y_0, x = var_220, y = value_states_3)[name = tensor<string, []>("states_15")];
|
| 271 |
+
tensor<int32, [4]> var_224_perm_0 = const()[name = tensor<string, []>("op_224_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])];
|
| 272 |
+
tensor<int32, [3]> var_226 = const()[name = tensor<string, []>("op_226"), val = tensor<int32, [3]>([1, -1, 384])];
|
| 273 |
+
tensor<fp32, [1, ?, 6, 64]> var_224 = transpose(perm = var_224_perm_0, x = states_15)[name = tensor<string, []>("transpose_64")];
|
| 274 |
+
tensor<fp32, [1, ?, 384]> input_19 = reshape(shape = var_226, x = var_224)[name = tensor<string, []>("input_19")];
|
| 275 |
+
tensor<fp32, [1, ?, 256]> input_21 = linear(bias = linear_3_bias_0, weight = decoder_block_0_layer_1_EncDecAttention_o_weight, x = input_19)[name = tensor<string, []>("linear_7")];
|
| 276 |
+
tensor<fp32, [1, ?, 256]> hidden_states_17 = add(x = hidden_states_9, y = input_21)[name = tensor<string, []>("hidden_states_17")];
|
| 277 |
+
tensor<fp32, []> var_18_promoted_2 = const()[name = tensor<string, []>("op_18_promoted_2"), val = tensor<fp32, []>(0x1p+1)];
|
| 278 |
+
tensor<fp32, [1, ?, 256]> var_242 = pow(x = hidden_states_17, y = var_18_promoted_2)[name = tensor<string, []>("op_242")];
|
| 279 |
+
tensor<int32, [1]> variance_5_axes_0 = const()[name = tensor<string, []>("variance_5_axes_0"), val = tensor<int32, [1]>([-1])];
|
| 280 |
+
tensor<bool, []> variance_5_keep_dims_0 = const()[name = tensor<string, []>("variance_5_keep_dims_0"), val = tensor<bool, []>(true)];
|
| 281 |
+
tensor<fp32, [1, ?, 1]> variance_5 = reduce_mean(axes = variance_5_axes_0, keep_dims = variance_5_keep_dims_0, x = var_242)[name = tensor<string, []>("variance_5")];
|
| 282 |
+
tensor<fp32, []> var_245 = const()[name = tensor<string, []>("op_245"), val = tensor<fp32, []>(0x1.0c6f7ap-20)];
|
| 283 |
+
tensor<fp32, [1, ?, 1]> var_246 = add(x = variance_5, y = var_245)[name = tensor<string, []>("op_246")];
|
| 284 |
+
tensor<fp32, []> var_247_epsilon_0 = const()[name = tensor<string, []>("op_247_epsilon_0"), val = tensor<fp32, []>(0x1.197998p-40)];
|
| 285 |
+
tensor<fp32, [1, ?, 1]> var_247 = rsqrt(epsilon = var_247_epsilon_0, x = var_246)[name = tensor<string, []>("op_247")];
|
| 286 |
+
tensor<fp32, [1, ?, 256]> hidden_states_21 = mul(x = hidden_states_17, y = var_247)[name = tensor<string, []>("hidden_states_21")];
|
| 287 |
+
tensor<fp32, [1, ?, 256]> input_23 = mul(x = decoder_block_0_layer_2_layer_norm_weight, y = hidden_states_21)[name = tensor<string, []>("input_23")];
|
| 288 |
+
tensor<fp32, [1024]> linear_8_bias_0 = const()[name = tensor<string, []>("linear_8_bias_0"), val = tensor<fp32, [1024]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(25972928)))];
|
| 289 |
+
tensor<fp32, [1, ?, 1024]> input_25 = linear(bias = linear_8_bias_0, weight = decoder_block_0_layer_2_DenseReluDense_wi_0_weight, x = input_23)[name = tensor<string, []>("linear_8")];
|
| 290 |
+
tensor<string, []> hidden_gelu_1_mode_0 = const()[name = tensor<string, []>("hidden_gelu_1_mode_0"), val = tensor<string, []>("TANH_APPROXIMATION")];
|
| 291 |
+
tensor<fp32, [1, ?, 1024]> hidden_gelu_1 = gelu(mode = hidden_gelu_1_mode_0, x = input_25)[name = tensor<string, []>("hidden_gelu_1")];
|
| 292 |
+
tensor<fp32, [1, ?, 1024]> hidden_linear_1 = linear(bias = linear_8_bias_0, weight = decoder_block_0_layer_2_DenseReluDense_wi_1_weight, x = input_23)[name = tensor<string, []>("linear_9")];
|
| 293 |
+
tensor<fp32, [1, ?, 1024]> input_27 = mul(x = hidden_gelu_1, y = hidden_linear_1)[name = tensor<string, []>("input_27")];
|
| 294 |
+
tensor<fp32, [1, ?, 256]> input_31 = linear(bias = linear_3_bias_0, weight = decoder_block_0_layer_2_DenseReluDense_wo_weight, x = input_27)[name = tensor<string, []>("linear_10")];
|
| 295 |
+
tensor<fp32, [1, ?, 256]> hidden_states_23 = add(x = hidden_states_17, y = input_31)[name = tensor<string, []>("hidden_states_23")];
|
| 296 |
+
tensor<fp32, []> var_18_promoted_3 = const()[name = tensor<string, []>("op_18_promoted_3"), val = tensor<fp32, []>(0x1p+1)];
|
| 297 |
+
tensor<fp32, [1, ?, 256]> var_292 = pow(x = hidden_states_23, y = var_18_promoted_3)[name = tensor<string, []>("op_292")];
|
| 298 |
+
tensor<int32, [1]> variance_7_axes_0 = const()[name = tensor<string, []>("variance_7_axes_0"), val = tensor<int32, [1]>([-1])];
|
| 299 |
+
tensor<bool, []> variance_7_keep_dims_0 = const()[name = tensor<string, []>("variance_7_keep_dims_0"), val = tensor<bool, []>(true)];
|
| 300 |
+
tensor<fp32, [1, ?, 1]> variance_7 = reduce_mean(axes = variance_7_axes_0, keep_dims = variance_7_keep_dims_0, x = var_292)[name = tensor<string, []>("variance_7")];
|
| 301 |
+
tensor<fp32, []> var_295 = const()[name = tensor<string, []>("op_295"), val = tensor<fp32, []>(0x1.0c6f7ap-20)];
|
| 302 |
+
tensor<fp32, [1, ?, 1]> var_296 = add(x = variance_7, y = var_295)[name = tensor<string, []>("op_296")];
|
| 303 |
+
tensor<fp32, []> var_297_epsilon_0 = const()[name = tensor<string, []>("op_297_epsilon_0"), val = tensor<fp32, []>(0x1.197998p-40)];
|
| 304 |
+
tensor<fp32, [1, ?, 1]> var_297 = rsqrt(epsilon = var_297_epsilon_0, x = var_296)[name = tensor<string, []>("op_297")];
|
| 305 |
+
tensor<fp32, [1, ?, 256]> hidden_states_27 = mul(x = hidden_states_23, y = var_297)[name = tensor<string, []>("hidden_states_27")];
|
| 306 |
+
tensor<fp32, [1, ?, 256]> hidden_states_29 = mul(x = decoder_block_1_layer_0_layer_norm_weight, y = hidden_states_27)[name = tensor<string, []>("hidden_states_29")];
|
| 307 |
+
tensor<fp32, [1, ?, 384]> states_17 = linear(bias = linear_0_bias_0, weight = decoder_block_1_layer_0_SelfAttention_q_weight, x = hidden_states_29)[name = tensor<string, []>("linear_11")];
|
| 308 |
+
tensor<int32, [4]> var_310 = const()[name = tensor<string, []>("op_310"), val = tensor<int32, [4]>([1, -1, 6, 64])];
|
| 309 |
+
tensor<fp32, [1, ?, 6, 64]> var_311 = reshape(shape = var_310, x = states_17)[name = tensor<string, []>("op_311")];
|
| 310 |
+
tensor<fp32, [1, ?, 384]> states_19 = linear(bias = linear_0_bias_0, weight = decoder_block_1_layer_0_SelfAttention_k_weight, x = hidden_states_29)[name = tensor<string, []>("linear_12")];
|
| 311 |
+
tensor<int32, [4]> var_315 = const()[name = tensor<string, []>("op_315"), val = tensor<int32, [4]>([1, -1, 6, 64])];
|
| 312 |
+
tensor<fp32, [1, ?, 6, 64]> var_316 = reshape(shape = var_315, x = states_19)[name = tensor<string, []>("op_316")];
|
| 313 |
+
tensor<fp32, [1, ?, 384]> states_21 = linear(bias = linear_0_bias_0, weight = decoder_block_1_layer_0_SelfAttention_v_weight, x = hidden_states_29)[name = tensor<string, []>("linear_13")];
|
| 314 |
+
tensor<int32, [4]> var_320 = const()[name = tensor<string, []>("op_320"), val = tensor<int32, [4]>([1, -1, 6, 64])];
|
| 315 |
+
tensor<fp32, [1, ?, 6, 64]> var_321 = reshape(shape = var_320, x = states_21)[name = tensor<string, []>("op_321")];
|
| 316 |
+
tensor<int32, [4]> value_states_5_perm_0 = const()[name = tensor<string, []>("value_states_5_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])];
|
| 317 |
+
tensor<bool, []> scores_9_transpose_x_0 = const()[name = tensor<string, []>("scores_9_transpose_x_0"), val = tensor<bool, []>(false)];
|
| 318 |
+
tensor<bool, []> scores_9_transpose_y_0 = const()[name = tensor<string, []>("scores_9_transpose_y_0"), val = tensor<bool, []>(false)];
|
| 319 |
+
tensor<int32, [4]> transpose_28_perm_0 = const()[name = tensor<string, []>("transpose_28_perm_0"), val = tensor<int32, [4]>([0, 2, -3, -1])];
|
| 320 |
+
tensor<int32, [4]> transpose_29_perm_0 = const()[name = tensor<string, []>("transpose_29_perm_0"), val = tensor<int32, [4]>([0, 2, -1, -3])];
|
| 321 |
+
tensor<fp32, [1, 6, 64, ?]> transpose_29 = transpose(perm = transpose_29_perm_0, x = var_316)[name = tensor<string, []>("transpose_61")];
|
| 322 |
+
tensor<fp32, [1, 6, ?, 64]> transpose_28 = transpose(perm = transpose_28_perm_0, x = var_311)[name = tensor<string, []>("transpose_62")];
|
| 323 |
+
tensor<fp32, [1, 6, ?, ?]> scores_9 = matmul(transpose_x = scores_9_transpose_x_0, transpose_y = scores_9_transpose_y_0, x = transpose_28, y = transpose_29)[name = tensor<string, []>("scores_9")];
|
| 324 |
+
tensor<fp32, [1, 6, ?, ?]> scores_11 = add(x = scores_9, y = position_bias_3)[name = tensor<string, []>("scores_11")];
|
| 325 |
+
tensor<fp32, [1, 6, ?, ?]> var_327 = softmax(axis = var_22, x = scores_11)[name = tensor<string, []>("op_327")];
|
| 326 |
+
tensor<bool, []> states_23_transpose_x_0 = const()[name = tensor<string, []>("states_23_transpose_x_0"), val = tensor<bool, []>(false)];
|
| 327 |
+
tensor<bool, []> states_23_transpose_y_0 = const()[name = tensor<string, []>("states_23_transpose_y_0"), val = tensor<bool, []>(false)];
|
| 328 |
+
tensor<fp32, [1, 6, ?, 64]> value_states_5 = transpose(perm = value_states_5_perm_0, x = var_321)[name = tensor<string, []>("transpose_63")];
|
| 329 |
+
tensor<fp32, [1, 6, ?, 64]> states_23 = matmul(transpose_x = states_23_transpose_x_0, transpose_y = states_23_transpose_y_0, x = var_327, y = value_states_5)[name = tensor<string, []>("states_23")];
|
| 330 |
+
tensor<int32, [4]> var_331_perm_0 = const()[name = tensor<string, []>("op_331_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])];
|
| 331 |
+
tensor<int32, [3]> var_333 = const()[name = tensor<string, []>("op_333"), val = tensor<int32, [3]>([1, -1, 384])];
|
| 332 |
+
tensor<fp32, [1, ?, 6, 64]> var_331 = transpose(perm = var_331_perm_0, x = states_23)[name = tensor<string, []>("transpose_60")];
|
| 333 |
+
tensor<fp32, [1, ?, 384]> input_37 = reshape(shape = var_333, x = var_331)[name = tensor<string, []>("input_37")];
|
| 334 |
+
tensor<fp32, [1, ?, 256]> input_39 = linear(bias = linear_3_bias_0, weight = decoder_block_1_layer_0_SelfAttention_o_weight, x = input_37)[name = tensor<string, []>("linear_14")];
|
| 335 |
+
tensor<fp32, [1, ?, 256]> hidden_states_31 = add(x = hidden_states_23, y = input_39)[name = tensor<string, []>("hidden_states_31")];
|
| 336 |
+
tensor<fp32, []> var_18_promoted_4 = const()[name = tensor<string, []>("op_18_promoted_4"), val = tensor<fp32, []>(0x1p+1)];
|
| 337 |
+
tensor<fp32, [1, ?, 256]> var_349 = pow(x = hidden_states_31, y = var_18_promoted_4)[name = tensor<string, []>("op_349")];
|
| 338 |
+
tensor<int32, [1]> variance_9_axes_0 = const()[name = tensor<string, []>("variance_9_axes_0"), val = tensor<int32, [1]>([-1])];
|
| 339 |
+
tensor<bool, []> variance_9_keep_dims_0 = const()[name = tensor<string, []>("variance_9_keep_dims_0"), val = tensor<bool, []>(true)];
|
| 340 |
+
tensor<fp32, [1, ?, 1]> variance_9 = reduce_mean(axes = variance_9_axes_0, keep_dims = variance_9_keep_dims_0, x = var_349)[name = tensor<string, []>("variance_9")];
|
| 341 |
+
tensor<fp32, []> var_352 = const()[name = tensor<string, []>("op_352"), val = tensor<fp32, []>(0x1.0c6f7ap-20)];
|
| 342 |
+
tensor<fp32, [1, ?, 1]> var_353 = add(x = variance_9, y = var_352)[name = tensor<string, []>("op_353")];
|
| 343 |
+
tensor<fp32, []> var_354_epsilon_0 = const()[name = tensor<string, []>("op_354_epsilon_0"), val = tensor<fp32, []>(0x1.197998p-40)];
|
| 344 |
+
tensor<fp32, [1, ?, 1]> var_354 = rsqrt(epsilon = var_354_epsilon_0, x = var_353)[name = tensor<string, []>("op_354")];
|
| 345 |
+
tensor<fp32, [1, ?, 256]> hidden_states_35 = mul(x = hidden_states_31, y = var_354)[name = tensor<string, []>("hidden_states_35")];
|
| 346 |
+
tensor<fp32, [1, ?, 256]> hidden_states_37 = mul(x = decoder_block_1_layer_1_layer_norm_weight, y = hidden_states_35)[name = tensor<string, []>("hidden_states_37")];
|
| 347 |
+
tensor<fp32, [1, ?, 384]> states_25 = linear(bias = linear_0_bias_0, weight = decoder_block_1_layer_1_EncDecAttention_q_weight, x = hidden_states_37)[name = tensor<string, []>("linear_15")];
|
| 348 |
+
tensor<int32, [4]> var_367 = const()[name = tensor<string, []>("op_367"), val = tensor<int32, [4]>([1, -1, 6, 64])];
|
| 349 |
+
tensor<fp32, [1, ?, 6, 64]> var_368 = reshape(shape = var_367, x = states_25)[name = tensor<string, []>("op_368")];
|
| 350 |
+
tensor<fp32, [1, ?, 384]> states_27 = linear(bias = linear_0_bias_0, weight = decoder_block_1_layer_1_EncDecAttention_k_weight, x = encoder_hidden_states)[name = tensor<string, []>("linear_16")];
|
| 351 |
+
tensor<int32, [4]> var_372 = const()[name = tensor<string, []>("op_372"), val = tensor<int32, [4]>([1, -1, 6, 64])];
|
| 352 |
+
tensor<fp32, [1, ?, 6, 64]> var_373 = reshape(shape = var_372, x = states_27)[name = tensor<string, []>("op_373")];
|
| 353 |
+
tensor<fp32, [1, ?, 384]> states_29 = linear(bias = linear_0_bias_0, weight = decoder_block_1_layer_1_EncDecAttention_v_weight, x = encoder_hidden_states)[name = tensor<string, []>("linear_17")];
|
| 354 |
+
tensor<int32, [4]> var_377 = const()[name = tensor<string, []>("op_377"), val = tensor<int32, [4]>([1, -1, 6, 64])];
|
| 355 |
+
tensor<fp32, [1, ?, 6, 64]> var_378 = reshape(shape = var_377, x = states_29)[name = tensor<string, []>("op_378")];
|
| 356 |
+
tensor<int32, [4]> value_states_7_perm_0 = const()[name = tensor<string, []>("value_states_7_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])];
|
| 357 |
+
tensor<bool, []> scores_13_transpose_x_0 = const()[name = tensor<string, []>("scores_13_transpose_x_0"), val = tensor<bool, []>(false)];
|
| 358 |
+
tensor<bool, []> scores_13_transpose_y_0 = const()[name = tensor<string, []>("scores_13_transpose_y_0"), val = tensor<bool, []>(false)];
|
| 359 |
+
tensor<int32, [4]> transpose_30_perm_0 = const()[name = tensor<string, []>("transpose_30_perm_0"), val = tensor<int32, [4]>([0, 2, -3, -1])];
|
| 360 |
+
tensor<int32, [4]> transpose_31_perm_0 = const()[name = tensor<string, []>("transpose_31_perm_0"), val = tensor<int32, [4]>([0, 2, -1, -3])];
|
| 361 |
+
tensor<fp32, [1, 6, 64, ?]> transpose_31 = transpose(perm = transpose_31_perm_0, x = var_373)[name = tensor<string, []>("transpose_57")];
|
| 362 |
+
tensor<fp32, [1, 6, ?, 64]> transpose_30 = transpose(perm = transpose_30_perm_0, x = var_368)[name = tensor<string, []>("transpose_58")];
|
| 363 |
+
tensor<fp32, [1, 6, ?, ?]> scores_13 = matmul(transpose_x = scores_13_transpose_x_0, transpose_y = scores_13_transpose_y_0, x = transpose_30, y = transpose_31)[name = tensor<string, []>("scores_13")];
|
| 364 |
+
tensor<fp32, [1, 6, ?, ?]> scores_15 = add(x = scores_13, y = position_bias)[name = tensor<string, []>("scores_15")];
|
| 365 |
+
tensor<fp32, [1, 6, ?, ?]> var_384 = softmax(axis = var_22, x = scores_15)[name = tensor<string, []>("op_384")];
|
| 366 |
+
tensor<bool, []> states_31_transpose_x_0 = const()[name = tensor<string, []>("states_31_transpose_x_0"), val = tensor<bool, []>(false)];
|
| 367 |
+
tensor<bool, []> states_31_transpose_y_0 = const()[name = tensor<string, []>("states_31_transpose_y_0"), val = tensor<bool, []>(false)];
|
| 368 |
+
tensor<fp32, [1, 6, ?, 64]> value_states_7 = transpose(perm = value_states_7_perm_0, x = var_378)[name = tensor<string, []>("transpose_59")];
|
| 369 |
+
tensor<fp32, [1, 6, ?, 64]> states_31 = matmul(transpose_x = states_31_transpose_x_0, transpose_y = states_31_transpose_y_0, x = var_384, y = value_states_7)[name = tensor<string, []>("states_31")];
|
| 370 |
+
tensor<int32, [4]> var_388_perm_0 = const()[name = tensor<string, []>("op_388_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])];
|
| 371 |
+
tensor<int32, [3]> var_390 = const()[name = tensor<string, []>("op_390"), val = tensor<int32, [3]>([1, -1, 384])];
|
| 372 |
+
tensor<fp32, [1, ?, 6, 64]> var_388 = transpose(perm = var_388_perm_0, x = states_31)[name = tensor<string, []>("transpose_56")];
|
| 373 |
+
tensor<fp32, [1, ?, 384]> input_45 = reshape(shape = var_390, x = var_388)[name = tensor<string, []>("input_45")];
|
| 374 |
+
tensor<fp32, [1, ?, 256]> input_47 = linear(bias = linear_3_bias_0, weight = decoder_block_1_layer_1_EncDecAttention_o_weight, x = input_45)[name = tensor<string, []>("linear_18")];
|
| 375 |
+
tensor<fp32, [1, ?, 256]> hidden_states_39 = add(x = hidden_states_31, y = input_47)[name = tensor<string, []>("hidden_states_39")];
|
| 376 |
+
tensor<fp32, []> var_18_promoted_5 = const()[name = tensor<string, []>("op_18_promoted_5"), val = tensor<fp32, []>(0x1p+1)];
|
| 377 |
+
tensor<fp32, [1, ?, 256]> var_400 = pow(x = hidden_states_39, y = var_18_promoted_5)[name = tensor<string, []>("op_400")];
|
| 378 |
+
tensor<int32, [1]> variance_11_axes_0 = const()[name = tensor<string, []>("variance_11_axes_0"), val = tensor<int32, [1]>([-1])];
|
| 379 |
+
tensor<bool, []> variance_11_keep_dims_0 = const()[name = tensor<string, []>("variance_11_keep_dims_0"), val = tensor<bool, []>(true)];
|
| 380 |
+
tensor<fp32, [1, ?, 1]> variance_11 = reduce_mean(axes = variance_11_axes_0, keep_dims = variance_11_keep_dims_0, x = var_400)[name = tensor<string, []>("variance_11")];
|
| 381 |
+
tensor<fp32, []> var_403 = const()[name = tensor<string, []>("op_403"), val = tensor<fp32, []>(0x1.0c6f7ap-20)];
|
| 382 |
+
tensor<fp32, [1, ?, 1]> var_404 = add(x = variance_11, y = var_403)[name = tensor<string, []>("op_404")];
|
| 383 |
+
tensor<fp32, []> var_405_epsilon_0 = const()[name = tensor<string, []>("op_405_epsilon_0"), val = tensor<fp32, []>(0x1.197998p-40)];
|
| 384 |
+
tensor<fp32, [1, ?, 1]> var_405 = rsqrt(epsilon = var_405_epsilon_0, x = var_404)[name = tensor<string, []>("op_405")];
|
| 385 |
+
tensor<fp32, [1, ?, 256]> hidden_states_43 = mul(x = hidden_states_39, y = var_405)[name = tensor<string, []>("hidden_states_43")];
|
| 386 |
+
tensor<fp32, [1, ?, 256]> input_49 = mul(x = decoder_block_1_layer_2_layer_norm_weight, y = hidden_states_43)[name = tensor<string, []>("input_49")];
|
| 387 |
+
tensor<fp32, [1, ?, 1024]> input_51 = linear(bias = linear_8_bias_0, weight = decoder_block_1_layer_2_DenseReluDense_wi_0_weight, x = input_49)[name = tensor<string, []>("linear_19")];
|
| 388 |
+
tensor<string, []> hidden_gelu_3_mode_0 = const()[name = tensor<string, []>("hidden_gelu_3_mode_0"), val = tensor<string, []>("TANH_APPROXIMATION")];
|
| 389 |
+
tensor<fp32, [1, ?, 1024]> hidden_gelu_3 = gelu(mode = hidden_gelu_3_mode_0, x = input_51)[name = tensor<string, []>("hidden_gelu_3")];
|
| 390 |
+
tensor<fp32, [1, ?, 1024]> hidden_linear_3 = linear(bias = linear_8_bias_0, weight = decoder_block_1_layer_2_DenseReluDense_wi_1_weight, x = input_49)[name = tensor<string, []>("linear_20")];
|
| 391 |
+
tensor<fp32, [1, ?, 1024]> input_53 = mul(x = hidden_gelu_3, y = hidden_linear_3)[name = tensor<string, []>("input_53")];
|
| 392 |
+
tensor<fp32, [1, ?, 256]> input_57 = linear(bias = linear_3_bias_0, weight = decoder_block_1_layer_2_DenseReluDense_wo_weight, x = input_53)[name = tensor<string, []>("linear_21")];
|
| 393 |
+
tensor<fp32, [1, ?, 256]> hidden_states_45 = add(x = hidden_states_39, y = input_57)[name = tensor<string, []>("hidden_states_45")];
|
| 394 |
+
tensor<fp32, []> var_18_promoted_6 = const()[name = tensor<string, []>("op_18_promoted_6"), val = tensor<fp32, []>(0x1p+1)];
|
| 395 |
+
tensor<fp32, [1, ?, 256]> var_446 = pow(x = hidden_states_45, y = var_18_promoted_6)[name = tensor<string, []>("op_446")];
|
| 396 |
+
tensor<int32, [1]> variance_13_axes_0 = const()[name = tensor<string, []>("variance_13_axes_0"), val = tensor<int32, [1]>([-1])];
|
| 397 |
+
tensor<bool, []> variance_13_keep_dims_0 = const()[name = tensor<string, []>("variance_13_keep_dims_0"), val = tensor<bool, []>(true)];
|
| 398 |
+
tensor<fp32, [1, ?, 1]> variance_13 = reduce_mean(axes = variance_13_axes_0, keep_dims = variance_13_keep_dims_0, x = var_446)[name = tensor<string, []>("variance_13")];
|
| 399 |
+
tensor<fp32, []> var_449 = const()[name = tensor<string, []>("op_449"), val = tensor<fp32, []>(0x1.0c6f7ap-20)];
|
| 400 |
+
tensor<fp32, [1, ?, 1]> var_450 = add(x = variance_13, y = var_449)[name = tensor<string, []>("op_450")];
|
| 401 |
+
tensor<fp32, []> var_451_epsilon_0 = const()[name = tensor<string, []>("op_451_epsilon_0"), val = tensor<fp32, []>(0x1.197998p-40)];
|
| 402 |
+
tensor<fp32, [1, ?, 1]> var_451 = rsqrt(epsilon = var_451_epsilon_0, x = var_450)[name = tensor<string, []>("op_451")];
|
| 403 |
+
tensor<fp32, [1, ?, 256]> hidden_states_49 = mul(x = hidden_states_45, y = var_451)[name = tensor<string, []>("hidden_states_49")];
|
| 404 |
+
tensor<fp32, [1, ?, 256]> hidden_states_51 = mul(x = decoder_block_2_layer_0_layer_norm_weight, y = hidden_states_49)[name = tensor<string, []>("hidden_states_51")];
|
| 405 |
+
tensor<fp32, [1, ?, 384]> states_33 = linear(bias = linear_0_bias_0, weight = decoder_block_2_layer_0_SelfAttention_q_weight, x = hidden_states_51)[name = tensor<string, []>("linear_22")];
|
| 406 |
+
tensor<int32, [4]> var_464 = const()[name = tensor<string, []>("op_464"), val = tensor<int32, [4]>([1, -1, 6, 64])];
|
| 407 |
+
tensor<fp32, [1, ?, 6, 64]> var_465 = reshape(shape = var_464, x = states_33)[name = tensor<string, []>("op_465")];
|
| 408 |
+
tensor<fp32, [1, ?, 384]> states_35 = linear(bias = linear_0_bias_0, weight = decoder_block_2_layer_0_SelfAttention_k_weight, x = hidden_states_51)[name = tensor<string, []>("linear_23")];
|
| 409 |
+
tensor<int32, [4]> var_469 = const()[name = tensor<string, []>("op_469"), val = tensor<int32, [4]>([1, -1, 6, 64])];
|
| 410 |
+
tensor<fp32, [1, ?, 6, 64]> var_470 = reshape(shape = var_469, x = states_35)[name = tensor<string, []>("op_470")];
|
| 411 |
+
tensor<fp32, [1, ?, 384]> states_37 = linear(bias = linear_0_bias_0, weight = decoder_block_2_layer_0_SelfAttention_v_weight, x = hidden_states_51)[name = tensor<string, []>("linear_24")];
|
| 412 |
+
tensor<int32, [4]> var_474 = const()[name = tensor<string, []>("op_474"), val = tensor<int32, [4]>([1, -1, 6, 64])];
|
| 413 |
+
tensor<fp32, [1, ?, 6, 64]> var_475 = reshape(shape = var_474, x = states_37)[name = tensor<string, []>("op_475")];
|
| 414 |
+
tensor<int32, [4]> value_states_9_perm_0 = const()[name = tensor<string, []>("value_states_9_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])];
|
| 415 |
+
tensor<bool, []> scores_17_transpose_x_0 = const()[name = tensor<string, []>("scores_17_transpose_x_0"), val = tensor<bool, []>(false)];
|
| 416 |
+
tensor<bool, []> scores_17_transpose_y_0 = const()[name = tensor<string, []>("scores_17_transpose_y_0"), val = tensor<bool, []>(false)];
|
| 417 |
+
tensor<int32, [4]> transpose_32_perm_0 = const()[name = tensor<string, []>("transpose_32_perm_0"), val = tensor<int32, [4]>([0, 2, -3, -1])];
|
| 418 |
+
tensor<int32, [4]> transpose_33_perm_0 = const()[name = tensor<string, []>("transpose_33_perm_0"), val = tensor<int32, [4]>([0, 2, -1, -3])];
|
| 419 |
+
tensor<fp32, [1, 6, 64, ?]> transpose_33 = transpose(perm = transpose_33_perm_0, x = var_470)[name = tensor<string, []>("transpose_53")];
|
| 420 |
+
tensor<fp32, [1, 6, ?, 64]> transpose_32 = transpose(perm = transpose_32_perm_0, x = var_465)[name = tensor<string, []>("transpose_54")];
|
| 421 |
+
tensor<fp32, [1, 6, ?, ?]> scores_17 = matmul(transpose_x = scores_17_transpose_x_0, transpose_y = scores_17_transpose_y_0, x = transpose_32, y = transpose_33)[name = tensor<string, []>("scores_17")];
|
| 422 |
+
tensor<fp32, [1, 6, ?, ?]> scores_19 = add(x = scores_17, y = position_bias_3)[name = tensor<string, []>("scores_19")];
|
| 423 |
+
tensor<fp32, [1, 6, ?, ?]> var_481 = softmax(axis = var_22, x = scores_19)[name = tensor<string, []>("op_481")];
|
| 424 |
+
tensor<bool, []> states_39_transpose_x_0 = const()[name = tensor<string, []>("states_39_transpose_x_0"), val = tensor<bool, []>(false)];
|
| 425 |
+
tensor<bool, []> states_39_transpose_y_0 = const()[name = tensor<string, []>("states_39_transpose_y_0"), val = tensor<bool, []>(false)];
|
| 426 |
+
tensor<fp32, [1, 6, ?, 64]> value_states_9 = transpose(perm = value_states_9_perm_0, x = var_475)[name = tensor<string, []>("transpose_55")];
|
| 427 |
+
tensor<fp32, [1, 6, ?, 64]> states_39 = matmul(transpose_x = states_39_transpose_x_0, transpose_y = states_39_transpose_y_0, x = var_481, y = value_states_9)[name = tensor<string, []>("states_39")];
|
| 428 |
+
tensor<int32, [4]> var_485_perm_0 = const()[name = tensor<string, []>("op_485_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])];
|
| 429 |
+
tensor<int32, [3]> var_487 = const()[name = tensor<string, []>("op_487"), val = tensor<int32, [3]>([1, -1, 384])];
|
| 430 |
+
tensor<fp32, [1, ?, 6, 64]> var_485 = transpose(perm = var_485_perm_0, x = states_39)[name = tensor<string, []>("transpose_52")];
|
| 431 |
+
tensor<fp32, [1, ?, 384]> input_63 = reshape(shape = var_487, x = var_485)[name = tensor<string, []>("input_63")];
|
| 432 |
+
tensor<fp32, [1, ?, 256]> input_65 = linear(bias = linear_3_bias_0, weight = decoder_block_2_layer_0_SelfAttention_o_weight, x = input_63)[name = tensor<string, []>("linear_25")];
|
| 433 |
+
tensor<fp32, [1, ?, 256]> hidden_states_53 = add(x = hidden_states_45, y = input_65)[name = tensor<string, []>("hidden_states_53")];
|
| 434 |
+
tensor<fp32, []> var_18_promoted_7 = const()[name = tensor<string, []>("op_18_promoted_7"), val = tensor<fp32, []>(0x1p+1)];
|
| 435 |
+
tensor<fp32, [1, ?, 256]> var_503 = pow(x = hidden_states_53, y = var_18_promoted_7)[name = tensor<string, []>("op_503")];
|
| 436 |
+
tensor<int32, [1]> variance_15_axes_0 = const()[name = tensor<string, []>("variance_15_axes_0"), val = tensor<int32, [1]>([-1])];
|
| 437 |
+
tensor<bool, []> variance_15_keep_dims_0 = const()[name = tensor<string, []>("variance_15_keep_dims_0"), val = tensor<bool, []>(true)];
|
| 438 |
+
tensor<fp32, [1, ?, 1]> variance_15 = reduce_mean(axes = variance_15_axes_0, keep_dims = variance_15_keep_dims_0, x = var_503)[name = tensor<string, []>("variance_15")];
|
| 439 |
+
tensor<fp32, []> var_506 = const()[name = tensor<string, []>("op_506"), val = tensor<fp32, []>(0x1.0c6f7ap-20)];
|
| 440 |
+
tensor<fp32, [1, ?, 1]> var_507 = add(x = variance_15, y = var_506)[name = tensor<string, []>("op_507")];
|
| 441 |
+
tensor<fp32, []> var_508_epsilon_0 = const()[name = tensor<string, []>("op_508_epsilon_0"), val = tensor<fp32, []>(0x1.197998p-40)];
|
| 442 |
+
tensor<fp32, [1, ?, 1]> var_508 = rsqrt(epsilon = var_508_epsilon_0, x = var_507)[name = tensor<string, []>("op_508")];
|
| 443 |
+
tensor<fp32, [1, ?, 256]> hidden_states_57 = mul(x = hidden_states_53, y = var_508)[name = tensor<string, []>("hidden_states_57")];
|
| 444 |
+
tensor<fp32, [1, ?, 256]> hidden_states_59 = mul(x = decoder_block_2_layer_1_layer_norm_weight, y = hidden_states_57)[name = tensor<string, []>("hidden_states_59")];
|
| 445 |
+
tensor<fp32, [1, ?, 384]> states_41 = linear(bias = linear_0_bias_0, weight = decoder_block_2_layer_1_EncDecAttention_q_weight, x = hidden_states_59)[name = tensor<string, []>("linear_26")];
|
| 446 |
+
tensor<int32, [4]> var_521 = const()[name = tensor<string, []>("op_521"), val = tensor<int32, [4]>([1, -1, 6, 64])];
|
| 447 |
+
tensor<fp32, [1, ?, 6, 64]> var_522 = reshape(shape = var_521, x = states_41)[name = tensor<string, []>("op_522")];
|
| 448 |
+
tensor<fp32, [1, ?, 384]> states_43 = linear(bias = linear_0_bias_0, weight = decoder_block_2_layer_1_EncDecAttention_k_weight, x = encoder_hidden_states)[name = tensor<string, []>("linear_27")];
|
| 449 |
+
tensor<int32, [4]> var_526 = const()[name = tensor<string, []>("op_526"), val = tensor<int32, [4]>([1, -1, 6, 64])];
|
| 450 |
+
tensor<fp32, [1, ?, 6, 64]> var_527 = reshape(shape = var_526, x = states_43)[name = tensor<string, []>("op_527")];
|
| 451 |
+
tensor<fp32, [1, ?, 384]> states_45 = linear(bias = linear_0_bias_0, weight = decoder_block_2_layer_1_EncDecAttention_v_weight, x = encoder_hidden_states)[name = tensor<string, []>("linear_28")];
|
| 452 |
+
tensor<int32, [4]> var_531 = const()[name = tensor<string, []>("op_531"), val = tensor<int32, [4]>([1, -1, 6, 64])];
|
| 453 |
+
tensor<fp32, [1, ?, 6, 64]> var_532 = reshape(shape = var_531, x = states_45)[name = tensor<string, []>("op_532")];
|
| 454 |
+
tensor<int32, [4]> value_states_11_perm_0 = const()[name = tensor<string, []>("value_states_11_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])];
|
| 455 |
+
tensor<bool, []> scores_21_transpose_x_0 = const()[name = tensor<string, []>("scores_21_transpose_x_0"), val = tensor<bool, []>(false)];
|
| 456 |
+
tensor<bool, []> scores_21_transpose_y_0 = const()[name = tensor<string, []>("scores_21_transpose_y_0"), val = tensor<bool, []>(false)];
|
| 457 |
+
tensor<int32, [4]> transpose_34_perm_0 = const()[name = tensor<string, []>("transpose_34_perm_0"), val = tensor<int32, [4]>([0, 2, -3, -1])];
|
| 458 |
+
tensor<int32, [4]> transpose_35_perm_0 = const()[name = tensor<string, []>("transpose_35_perm_0"), val = tensor<int32, [4]>([0, 2, -1, -3])];
|
| 459 |
+
tensor<fp32, [1, 6, 64, ?]> transpose_35 = transpose(perm = transpose_35_perm_0, x = var_527)[name = tensor<string, []>("transpose_49")];
|
| 460 |
+
tensor<fp32, [1, 6, ?, 64]> transpose_34 = transpose(perm = transpose_34_perm_0, x = var_522)[name = tensor<string, []>("transpose_50")];
|
| 461 |
+
tensor<fp32, [1, 6, ?, ?]> scores_21 = matmul(transpose_x = scores_21_transpose_x_0, transpose_y = scores_21_transpose_y_0, x = transpose_34, y = transpose_35)[name = tensor<string, []>("scores_21")];
|
| 462 |
+
tensor<fp32, [1, 6, ?, ?]> scores_23 = add(x = scores_21, y = position_bias)[name = tensor<string, []>("scores_23")];
|
| 463 |
+
tensor<fp32, [1, 6, ?, ?]> var_538 = softmax(axis = var_22, x = scores_23)[name = tensor<string, []>("op_538")];
|
| 464 |
+
tensor<bool, []> states_47_transpose_x_0 = const()[name = tensor<string, []>("states_47_transpose_x_0"), val = tensor<bool, []>(false)];
|
| 465 |
+
tensor<bool, []> states_47_transpose_y_0 = const()[name = tensor<string, []>("states_47_transpose_y_0"), val = tensor<bool, []>(false)];
|
| 466 |
+
tensor<fp32, [1, 6, ?, 64]> value_states_11 = transpose(perm = value_states_11_perm_0, x = var_532)[name = tensor<string, []>("transpose_51")];
|
| 467 |
+
tensor<fp32, [1, 6, ?, 64]> states_47 = matmul(transpose_x = states_47_transpose_x_0, transpose_y = states_47_transpose_y_0, x = var_538, y = value_states_11)[name = tensor<string, []>("states_47")];
|
| 468 |
+
tensor<int32, [4]> var_542_perm_0 = const()[name = tensor<string, []>("op_542_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])];
|
| 469 |
+
tensor<int32, [3]> var_544 = const()[name = tensor<string, []>("op_544"), val = tensor<int32, [3]>([1, -1, 384])];
|
| 470 |
+
tensor<fp32, [1, ?, 6, 64]> var_542 = transpose(perm = var_542_perm_0, x = states_47)[name = tensor<string, []>("transpose_48")];
|
| 471 |
+
tensor<fp32, [1, ?, 384]> input_71 = reshape(shape = var_544, x = var_542)[name = tensor<string, []>("input_71")];
|
| 472 |
+
tensor<fp32, [1, ?, 256]> input_73 = linear(bias = linear_3_bias_0, weight = decoder_block_2_layer_1_EncDecAttention_o_weight, x = input_71)[name = tensor<string, []>("linear_29")];
|
| 473 |
+
tensor<fp32, [1, ?, 256]> hidden_states_61 = add(x = hidden_states_53, y = input_73)[name = tensor<string, []>("hidden_states_61")];
|
| 474 |
+
tensor<fp32, []> var_18_promoted_8 = const()[name = tensor<string, []>("op_18_promoted_8"), val = tensor<fp32, []>(0x1p+1)];
|
| 475 |
+
tensor<fp32, [1, ?, 256]> var_554 = pow(x = hidden_states_61, y = var_18_promoted_8)[name = tensor<string, []>("op_554")];
|
| 476 |
+
tensor<int32, [1]> variance_17_axes_0 = const()[name = tensor<string, []>("variance_17_axes_0"), val = tensor<int32, [1]>([-1])];
|
| 477 |
+
tensor<bool, []> variance_17_keep_dims_0 = const()[name = tensor<string, []>("variance_17_keep_dims_0"), val = tensor<bool, []>(true)];
|
| 478 |
+
tensor<fp32, [1, ?, 1]> variance_17 = reduce_mean(axes = variance_17_axes_0, keep_dims = variance_17_keep_dims_0, x = var_554)[name = tensor<string, []>("variance_17")];
|
| 479 |
+
tensor<fp32, []> var_557 = const()[name = tensor<string, []>("op_557"), val = tensor<fp32, []>(0x1.0c6f7ap-20)];
|
| 480 |
+
tensor<fp32, [1, ?, 1]> var_558 = add(x = variance_17, y = var_557)[name = tensor<string, []>("op_558")];
|
| 481 |
+
tensor<fp32, []> var_559_epsilon_0 = const()[name = tensor<string, []>("op_559_epsilon_0"), val = tensor<fp32, []>(0x1.197998p-40)];
|
| 482 |
+
tensor<fp32, [1, ?, 1]> var_559 = rsqrt(epsilon = var_559_epsilon_0, x = var_558)[name = tensor<string, []>("op_559")];
|
| 483 |
+
tensor<fp32, [1, ?, 256]> hidden_states_65 = mul(x = hidden_states_61, y = var_559)[name = tensor<string, []>("hidden_states_65")];
|
| 484 |
+
tensor<fp32, [1, ?, 256]> input_75 = mul(x = decoder_block_2_layer_2_layer_norm_weight, y = hidden_states_65)[name = tensor<string, []>("input_75")];
|
| 485 |
+
tensor<fp32, [1, ?, 1024]> input_77 = linear(bias = linear_8_bias_0, weight = decoder_block_2_layer_2_DenseReluDense_wi_0_weight, x = input_75)[name = tensor<string, []>("linear_30")];
|
| 486 |
+
tensor<string, []> hidden_gelu_5_mode_0 = const()[name = tensor<string, []>("hidden_gelu_5_mode_0"), val = tensor<string, []>("TANH_APPROXIMATION")];
|
| 487 |
+
tensor<fp32, [1, ?, 1024]> hidden_gelu_5 = gelu(mode = hidden_gelu_5_mode_0, x = input_77)[name = tensor<string, []>("hidden_gelu_5")];
|
| 488 |
+
tensor<fp32, [1, ?, 1024]> hidden_linear_5 = linear(bias = linear_8_bias_0, weight = decoder_block_2_layer_2_DenseReluDense_wi_1_weight, x = input_75)[name = tensor<string, []>("linear_31")];
|
| 489 |
+
tensor<fp32, [1, ?, 1024]> input_79 = mul(x = hidden_gelu_5, y = hidden_linear_5)[name = tensor<string, []>("input_79")];
|
| 490 |
+
tensor<fp32, [1, ?, 256]> input_83 = linear(bias = linear_3_bias_0, weight = decoder_block_2_layer_2_DenseReluDense_wo_weight, x = input_79)[name = tensor<string, []>("linear_32")];
|
| 491 |
+
tensor<fp32, [1, ?, 256]> hidden_states_67 = add(x = hidden_states_61, y = input_83)[name = tensor<string, []>("hidden_states_67")];
|
| 492 |
+
tensor<fp32, []> var_18_promoted_9 = const()[name = tensor<string, []>("op_18_promoted_9"), val = tensor<fp32, []>(0x1p+1)];
|
| 493 |
+
tensor<fp32, [1, ?, 256]> var_600 = pow(x = hidden_states_67, y = var_18_promoted_9)[name = tensor<string, []>("op_600")];
|
| 494 |
+
tensor<int32, [1]> variance_19_axes_0 = const()[name = tensor<string, []>("variance_19_axes_0"), val = tensor<int32, [1]>([-1])];
|
| 495 |
+
tensor<bool, []> variance_19_keep_dims_0 = const()[name = tensor<string, []>("variance_19_keep_dims_0"), val = tensor<bool, []>(true)];
|
| 496 |
+
tensor<fp32, [1, ?, 1]> variance_19 = reduce_mean(axes = variance_19_axes_0, keep_dims = variance_19_keep_dims_0, x = var_600)[name = tensor<string, []>("variance_19")];
|
| 497 |
+
tensor<fp32, []> var_603 = const()[name = tensor<string, []>("op_603"), val = tensor<fp32, []>(0x1.0c6f7ap-20)];
|
| 498 |
+
tensor<fp32, [1, ?, 1]> var_604 = add(x = variance_19, y = var_603)[name = tensor<string, []>("op_604")];
|
| 499 |
+
tensor<fp32, []> var_605_epsilon_0 = const()[name = tensor<string, []>("op_605_epsilon_0"), val = tensor<fp32, []>(0x1.197998p-40)];
|
| 500 |
+
tensor<fp32, [1, ?, 1]> var_605 = rsqrt(epsilon = var_605_epsilon_0, x = var_604)[name = tensor<string, []>("op_605")];
|
| 501 |
+
tensor<fp32, [1, ?, 256]> hidden_states_71 = mul(x = hidden_states_67, y = var_605)[name = tensor<string, []>("hidden_states_71")];
|
| 502 |
+
tensor<fp32, [1, ?, 256]> hidden_states_73 = mul(x = decoder_block_3_layer_0_layer_norm_weight, y = hidden_states_71)[name = tensor<string, []>("hidden_states_73")];
|
| 503 |
+
tensor<fp32, [1, ?, 384]> states_49 = linear(bias = linear_0_bias_0, weight = decoder_block_3_layer_0_SelfAttention_q_weight, x = hidden_states_73)[name = tensor<string, []>("linear_33")];
|
| 504 |
+
tensor<int32, [4]> var_618 = const()[name = tensor<string, []>("op_618"), val = tensor<int32, [4]>([1, -1, 6, 64])];
|
| 505 |
+
tensor<fp32, [1, ?, 6, 64]> var_619 = reshape(shape = var_618, x = states_49)[name = tensor<string, []>("op_619")];
|
| 506 |
+
tensor<fp32, [1, ?, 384]> states_51 = linear(bias = linear_0_bias_0, weight = decoder_block_3_layer_0_SelfAttention_k_weight, x = hidden_states_73)[name = tensor<string, []>("linear_34")];
|
| 507 |
+
tensor<int32, [4]> var_623 = const()[name = tensor<string, []>("op_623"), val = tensor<int32, [4]>([1, -1, 6, 64])];
|
| 508 |
+
tensor<fp32, [1, ?, 6, 64]> var_624 = reshape(shape = var_623, x = states_51)[name = tensor<string, []>("op_624")];
|
| 509 |
+
tensor<fp32, [1, ?, 384]> states_53 = linear(bias = linear_0_bias_0, weight = decoder_block_3_layer_0_SelfAttention_v_weight, x = hidden_states_73)[name = tensor<string, []>("linear_35")];
|
| 510 |
+
tensor<int32, [4]> var_628 = const()[name = tensor<string, []>("op_628"), val = tensor<int32, [4]>([1, -1, 6, 64])];
|
| 511 |
+
tensor<fp32, [1, ?, 6, 64]> var_629 = reshape(shape = var_628, x = states_53)[name = tensor<string, []>("op_629")];
|
| 512 |
+
tensor<int32, [4]> value_states_13_perm_0 = const()[name = tensor<string, []>("value_states_13_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])];
|
| 513 |
+
tensor<bool, []> scores_25_transpose_x_0 = const()[name = tensor<string, []>("scores_25_transpose_x_0"), val = tensor<bool, []>(false)];
|
| 514 |
+
tensor<bool, []> scores_25_transpose_y_0 = const()[name = tensor<string, []>("scores_25_transpose_y_0"), val = tensor<bool, []>(false)];
|
| 515 |
+
tensor<int32, [4]> transpose_36_perm_0 = const()[name = tensor<string, []>("transpose_36_perm_0"), val = tensor<int32, [4]>([0, 2, -3, -1])];
|
| 516 |
+
tensor<int32, [4]> transpose_37_perm_0 = const()[name = tensor<string, []>("transpose_37_perm_0"), val = tensor<int32, [4]>([0, 2, -1, -3])];
|
| 517 |
+
tensor<fp32, [1, 6, 64, ?]> transpose_37 = transpose(perm = transpose_37_perm_0, x = var_624)[name = tensor<string, []>("transpose_45")];
|
| 518 |
+
tensor<fp32, [1, 6, ?, 64]> transpose_36 = transpose(perm = transpose_36_perm_0, x = var_619)[name = tensor<string, []>("transpose_46")];
|
| 519 |
+
tensor<fp32, [1, 6, ?, ?]> scores_25 = matmul(transpose_x = scores_25_transpose_x_0, transpose_y = scores_25_transpose_y_0, x = transpose_36, y = transpose_37)[name = tensor<string, []>("scores_25")];
|
| 520 |
+
tensor<fp32, [1, 6, ?, ?]> scores_27 = add(x = scores_25, y = position_bias_3)[name = tensor<string, []>("scores_27")];
|
| 521 |
+
tensor<fp32, [1, 6, ?, ?]> var_635 = softmax(axis = var_22, x = scores_27)[name = tensor<string, []>("op_635")];
|
| 522 |
+
tensor<bool, []> states_55_transpose_x_0 = const()[name = tensor<string, []>("states_55_transpose_x_0"), val = tensor<bool, []>(false)];
|
| 523 |
+
tensor<bool, []> states_55_transpose_y_0 = const()[name = tensor<string, []>("states_55_transpose_y_0"), val = tensor<bool, []>(false)];
|
| 524 |
+
tensor<fp32, [1, 6, ?, 64]> value_states_13 = transpose(perm = value_states_13_perm_0, x = var_629)[name = tensor<string, []>("transpose_47")];
|
| 525 |
+
tensor<fp32, [1, 6, ?, 64]> states_55 = matmul(transpose_x = states_55_transpose_x_0, transpose_y = states_55_transpose_y_0, x = var_635, y = value_states_13)[name = tensor<string, []>("states_55")];
|
| 526 |
+
tensor<int32, [4]> var_639_perm_0 = const()[name = tensor<string, []>("op_639_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])];
|
| 527 |
+
tensor<int32, [3]> var_641 = const()[name = tensor<string, []>("op_641"), val = tensor<int32, [3]>([1, -1, 384])];
|
| 528 |
+
tensor<fp32, [1, ?, 6, 64]> var_639 = transpose(perm = var_639_perm_0, x = states_55)[name = tensor<string, []>("transpose_44")];
|
| 529 |
+
tensor<fp32, [1, ?, 384]> input_89 = reshape(shape = var_641, x = var_639)[name = tensor<string, []>("input_89")];
|
| 530 |
+
tensor<fp32, [1, ?, 256]> input_91 = linear(bias = linear_3_bias_0, weight = decoder_block_3_layer_0_SelfAttention_o_weight, x = input_89)[name = tensor<string, []>("linear_36")];
|
| 531 |
+
tensor<fp32, [1, ?, 256]> hidden_states_75 = add(x = hidden_states_67, y = input_91)[name = tensor<string, []>("hidden_states_75")];
|
| 532 |
+
tensor<fp32, []> var_18_promoted_10 = const()[name = tensor<string, []>("op_18_promoted_10"), val = tensor<fp32, []>(0x1p+1)];
|
| 533 |
+
tensor<fp32, [1, ?, 256]> var_657 = pow(x = hidden_states_75, y = var_18_promoted_10)[name = tensor<string, []>("op_657")];
|
| 534 |
+
tensor<int32, [1]> variance_21_axes_0 = const()[name = tensor<string, []>("variance_21_axes_0"), val = tensor<int32, [1]>([-1])];
|
| 535 |
+
tensor<bool, []> variance_21_keep_dims_0 = const()[name = tensor<string, []>("variance_21_keep_dims_0"), val = tensor<bool, []>(true)];
|
| 536 |
+
tensor<fp32, [1, ?, 1]> variance_21 = reduce_mean(axes = variance_21_axes_0, keep_dims = variance_21_keep_dims_0, x = var_657)[name = tensor<string, []>("variance_21")];
|
| 537 |
+
tensor<fp32, []> var_660 = const()[name = tensor<string, []>("op_660"), val = tensor<fp32, []>(0x1.0c6f7ap-20)];
|
| 538 |
+
tensor<fp32, [1, ?, 1]> var_661 = add(x = variance_21, y = var_660)[name = tensor<string, []>("op_661")];
|
| 539 |
+
tensor<fp32, []> var_662_epsilon_0 = const()[name = tensor<string, []>("op_662_epsilon_0"), val = tensor<fp32, []>(0x1.197998p-40)];
|
| 540 |
+
tensor<fp32, [1, ?, 1]> var_662 = rsqrt(epsilon = var_662_epsilon_0, x = var_661)[name = tensor<string, []>("op_662")];
|
| 541 |
+
tensor<fp32, [1, ?, 256]> hidden_states_79 = mul(x = hidden_states_75, y = var_662)[name = tensor<string, []>("hidden_states_79")];
|
| 542 |
+
tensor<fp32, [1, ?, 256]> hidden_states_81 = mul(x = decoder_block_3_layer_1_layer_norm_weight, y = hidden_states_79)[name = tensor<string, []>("hidden_states_81")];
|
| 543 |
+
tensor<fp32, [1, ?, 384]> states_57 = linear(bias = linear_0_bias_0, weight = decoder_block_3_layer_1_EncDecAttention_q_weight, x = hidden_states_81)[name = tensor<string, []>("linear_37")];
|
| 544 |
+
tensor<int32, [4]> var_675 = const()[name = tensor<string, []>("op_675"), val = tensor<int32, [4]>([1, -1, 6, 64])];
|
| 545 |
+
tensor<fp32, [1, ?, 6, 64]> var_676 = reshape(shape = var_675, x = states_57)[name = tensor<string, []>("op_676")];
|
| 546 |
+
tensor<fp32, [1, ?, 384]> states_59 = linear(bias = linear_0_bias_0, weight = decoder_block_3_layer_1_EncDecAttention_k_weight, x = encoder_hidden_states)[name = tensor<string, []>("linear_38")];
|
| 547 |
+
tensor<int32, [4]> var_680 = const()[name = tensor<string, []>("op_680"), val = tensor<int32, [4]>([1, -1, 6, 64])];
|
| 548 |
+
tensor<fp32, [1, ?, 6, 64]> var_681 = reshape(shape = var_680, x = states_59)[name = tensor<string, []>("op_681")];
|
| 549 |
+
tensor<fp32, [1, ?, 384]> states_61 = linear(bias = linear_0_bias_0, weight = decoder_block_3_layer_1_EncDecAttention_v_weight, x = encoder_hidden_states)[name = tensor<string, []>("linear_39")];
|
| 550 |
+
tensor<int32, [4]> var_685 = const()[name = tensor<string, []>("op_685"), val = tensor<int32, [4]>([1, -1, 6, 64])];
|
| 551 |
+
tensor<fp32, [1, ?, 6, 64]> var_686 = reshape(shape = var_685, x = states_61)[name = tensor<string, []>("op_686")];
|
| 552 |
+
tensor<int32, [4]> value_states_perm_0 = const()[name = tensor<string, []>("value_states_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])];
|
| 553 |
+
tensor<bool, []> scores_29_transpose_x_0 = const()[name = tensor<string, []>("scores_29_transpose_x_0"), val = tensor<bool, []>(false)];
|
| 554 |
+
tensor<bool, []> scores_29_transpose_y_0 = const()[name = tensor<string, []>("scores_29_transpose_y_0"), val = tensor<bool, []>(false)];
|
| 555 |
+
tensor<int32, [4]> transpose_38_perm_0 = const()[name = tensor<string, []>("transpose_38_perm_0"), val = tensor<int32, [4]>([0, 2, -3, -1])];
|
| 556 |
+
tensor<int32, [4]> transpose_39_perm_0 = const()[name = tensor<string, []>("transpose_39_perm_0"), val = tensor<int32, [4]>([0, 2, -1, -3])];
|
| 557 |
+
tensor<fp32, [1, 6, 64, ?]> transpose_39 = transpose(perm = transpose_39_perm_0, x = var_681)[name = tensor<string, []>("transpose_41")];
|
| 558 |
+
tensor<fp32, [1, 6, ?, 64]> transpose_38 = transpose(perm = transpose_38_perm_0, x = var_676)[name = tensor<string, []>("transpose_42")];
|
| 559 |
+
tensor<fp32, [1, 6, ?, ?]> scores_29 = matmul(transpose_x = scores_29_transpose_x_0, transpose_y = scores_29_transpose_y_0, x = transpose_38, y = transpose_39)[name = tensor<string, []>("scores_29")];
|
| 560 |
+
tensor<fp32, [1, 6, ?, ?]> scores = add(x = scores_29, y = position_bias)[name = tensor<string, []>("scores")];
|
| 561 |
+
tensor<fp32, [1, 6, ?, ?]> var_692 = softmax(axis = var_22, x = scores)[name = tensor<string, []>("op_692")];
|
| 562 |
+
tensor<bool, []> states_transpose_x_0 = const()[name = tensor<string, []>("states_transpose_x_0"), val = tensor<bool, []>(false)];
|
| 563 |
+
tensor<bool, []> states_transpose_y_0 = const()[name = tensor<string, []>("states_transpose_y_0"), val = tensor<bool, []>(false)];
|
| 564 |
+
tensor<fp32, [1, 6, ?, 64]> value_states = transpose(perm = value_states_perm_0, x = var_686)[name = tensor<string, []>("transpose_43")];
|
| 565 |
+
tensor<fp32, [1, 6, ?, 64]> states = matmul(transpose_x = states_transpose_x_0, transpose_y = states_transpose_y_0, x = var_692, y = value_states)[name = tensor<string, []>("states")];
|
| 566 |
+
tensor<int32, [4]> var_696_perm_0 = const()[name = tensor<string, []>("op_696_perm_0"), val = tensor<int32, [4]>([0, 2, 1, 3])];
|
| 567 |
+
tensor<int32, [3]> var_698 = const()[name = tensor<string, []>("op_698"), val = tensor<int32, [3]>([1, -1, 384])];
|
| 568 |
+
tensor<fp32, [1, ?, 6, 64]> var_696 = transpose(perm = var_696_perm_0, x = states)[name = tensor<string, []>("transpose_40")];
|
| 569 |
+
tensor<fp32, [1, ?, 384]> input_97 = reshape(shape = var_698, x = var_696)[name = tensor<string, []>("input_97")];
|
| 570 |
+
tensor<fp32, [1, ?, 256]> input_99 = linear(bias = linear_3_bias_0, weight = decoder_block_3_layer_1_EncDecAttention_o_weight, x = input_97)[name = tensor<string, []>("linear_40")];
|
| 571 |
+
tensor<fp32, [1, ?, 256]> hidden_states_83 = add(x = hidden_states_75, y = input_99)[name = tensor<string, []>("hidden_states_83")];
|
| 572 |
+
tensor<fp32, []> var_18_promoted_11 = const()[name = tensor<string, []>("op_18_promoted_11"), val = tensor<fp32, []>(0x1p+1)];
|
| 573 |
+
tensor<fp32, [1, ?, 256]> var_708 = pow(x = hidden_states_83, y = var_18_promoted_11)[name = tensor<string, []>("op_708")];
|
| 574 |
+
tensor<int32, [1]> variance_23_axes_0 = const()[name = tensor<string, []>("variance_23_axes_0"), val = tensor<int32, [1]>([-1])];
|
| 575 |
+
tensor<bool, []> variance_23_keep_dims_0 = const()[name = tensor<string, []>("variance_23_keep_dims_0"), val = tensor<bool, []>(true)];
|
| 576 |
+
tensor<fp32, [1, ?, 1]> variance_23 = reduce_mean(axes = variance_23_axes_0, keep_dims = variance_23_keep_dims_0, x = var_708)[name = tensor<string, []>("variance_23")];
|
| 577 |
+
tensor<fp32, []> var_711 = const()[name = tensor<string, []>("op_711"), val = tensor<fp32, []>(0x1.0c6f7ap-20)];
|
| 578 |
+
tensor<fp32, [1, ?, 1]> var_712 = add(x = variance_23, y = var_711)[name = tensor<string, []>("op_712")];
|
| 579 |
+
tensor<fp32, []> var_713_epsilon_0 = const()[name = tensor<string, []>("op_713_epsilon_0"), val = tensor<fp32, []>(0x1.197998p-40)];
|
| 580 |
+
tensor<fp32, [1, ?, 1]> var_713 = rsqrt(epsilon = var_713_epsilon_0, x = var_712)[name = tensor<string, []>("op_713")];
|
| 581 |
+
tensor<fp32, [1, ?, 256]> hidden_states_87 = mul(x = hidden_states_83, y = var_713)[name = tensor<string, []>("hidden_states_87")];
|
| 582 |
+
tensor<fp32, [1, ?, 256]> input_101 = mul(x = decoder_block_3_layer_2_layer_norm_weight, y = hidden_states_87)[name = tensor<string, []>("input_101")];
|
| 583 |
+
tensor<fp32, [1, ?, 1024]> input_103 = linear(bias = linear_8_bias_0, weight = decoder_block_3_layer_2_DenseReluDense_wi_0_weight, x = input_101)[name = tensor<string, []>("linear_41")];
|
| 584 |
+
tensor<string, []> hidden_gelu_mode_0 = const()[name = tensor<string, []>("hidden_gelu_mode_0"), val = tensor<string, []>("TANH_APPROXIMATION")];
|
| 585 |
+
tensor<fp32, [1, ?, 1024]> hidden_gelu = gelu(mode = hidden_gelu_mode_0, x = input_103)[name = tensor<string, []>("hidden_gelu")];
|
| 586 |
+
tensor<fp32, [1, ?, 1024]> hidden_linear = linear(bias = linear_8_bias_0, weight = decoder_block_3_layer_2_DenseReluDense_wi_1_weight, x = input_101)[name = tensor<string, []>("linear_42")];
|
| 587 |
+
tensor<fp32, [1, ?, 1024]> input_105 = mul(x = hidden_gelu, y = hidden_linear)[name = tensor<string, []>("input_105")];
|
| 588 |
+
tensor<fp32, [1, ?, 256]> input_109 = linear(bias = linear_3_bias_0, weight = decoder_block_3_layer_2_DenseReluDense_wo_weight, x = input_105)[name = tensor<string, []>("linear_43")];
|
| 589 |
+
tensor<fp32, [1, ?, 256]> hidden_states_89 = add(x = hidden_states_83, y = input_109)[name = tensor<string, []>("hidden_states_89")];
|
| 590 |
+
tensor<fp32, []> var_18_promoted_12 = const()[name = tensor<string, []>("op_18_promoted_12"), val = tensor<fp32, []>(0x1p+1)];
|
| 591 |
+
tensor<fp32, [1, ?, 256]> var_746 = pow(x = hidden_states_89, y = var_18_promoted_12)[name = tensor<string, []>("op_746")];
|
| 592 |
+
tensor<int32, [1]> variance_axes_0 = const()[name = tensor<string, []>("variance_axes_0"), val = tensor<int32, [1]>([-1])];
|
| 593 |
+
tensor<bool, []> variance_keep_dims_0 = const()[name = tensor<string, []>("variance_keep_dims_0"), val = tensor<bool, []>(true)];
|
| 594 |
+
tensor<fp32, [1, ?, 1]> variance = reduce_mean(axes = variance_axes_0, keep_dims = variance_keep_dims_0, x = var_746)[name = tensor<string, []>("variance")];
|
| 595 |
+
tensor<fp32, []> var_749 = const()[name = tensor<string, []>("op_749"), val = tensor<fp32, []>(0x1.0c6f7ap-20)];
|
| 596 |
+
tensor<fp32, [1, ?, 1]> var_750 = add(x = variance, y = var_749)[name = tensor<string, []>("op_750")];
|
| 597 |
+
tensor<fp32, []> var_751_epsilon_0 = const()[name = tensor<string, []>("op_751_epsilon_0"), val = tensor<fp32, []>(0x1.197998p-40)];
|
| 598 |
+
tensor<fp32, [1, ?, 1]> var_751 = rsqrt(epsilon = var_751_epsilon_0, x = var_750)[name = tensor<string, []>("op_751")];
|
| 599 |
+
tensor<fp32, [1, ?, 256]> hidden_states = mul(x = hidden_states_89, y = var_751)[name = tensor<string, []>("hidden_states")];
|
| 600 |
+
tensor<fp32, [1, ?, 256]> input_111 = mul(x = decoder_final_layer_norm_weight, y = hidden_states)[name = tensor<string, []>("input_111")];
|
| 601 |
+
tensor<fp32, [1, ?, 384]> logits = linear(bias = linear_0_bias_0, weight = lm_head_weight, x = input_111)[name = tensor<string, []>("linear_44")];
|
| 602 |
+
} -> (logits);
|
| 603 |
+
}
|
MultilingualG2PDecoder.mlmodelc/weights/weight.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:005b5ffbccabe4fd4074204d16af745b5d8f458a687b0c07e80060f7fe0a08e4
|
| 3 |
+
size 25977088
|
MultilingualG2PEncoder.mlmodelc/analytics/coremldata.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ee8fd1ea46ec79fd7816493973deaa583cd867ce0c7d2dd55124d2368db094bd
|
| 3 |
+
size 243
|
MultilingualG2PEncoder.mlmodelc/coremldata.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ed8bf165b8d5939f995b29490872ee581c9834d5b22d3686fc5c7b300680b058
|
| 3 |
+
size 439
|
MultilingualG2PEncoder.mlmodelc/metadata.json
ADDED
|
@@ -0,0 +1,99 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"metadataOutputVersion" : "3.0",
|
| 4 |
+
"storagePrecision" : "Float32",
|
| 5 |
+
"outputSchema" : [
|
| 6 |
+
{
|
| 7 |
+
"hasShapeFlexibility" : "0",
|
| 8 |
+
"isOptional" : "0",
|
| 9 |
+
"dataType" : "Float32",
|
| 10 |
+
"formattedType" : "MultiArray (Float32)",
|
| 11 |
+
"shortDescription" : "",
|
| 12 |
+
"shape" : "[]",
|
| 13 |
+
"name" : "last_hidden_state",
|
| 14 |
+
"type" : "MultiArray"
|
| 15 |
+
}
|
| 16 |
+
],
|
| 17 |
+
"modelParameters" : [
|
| 18 |
+
|
| 19 |
+
],
|
| 20 |
+
"specificationVersion" : 8,
|
| 21 |
+
"mlProgramOperationTypeHistogram" : {
|
| 22 |
+
"Range1d" : 1,
|
| 23 |
+
"Ios17.reshape" : 48,
|
| 24 |
+
"Ios16.reduceMean" : 25,
|
| 25 |
+
"Ios16.softmax" : 12,
|
| 26 |
+
"Ios17.matmul" : 24,
|
| 27 |
+
"Ios17.transpose" : 49,
|
| 28 |
+
"Select" : 3,
|
| 29 |
+
"Ios17.expandDims" : 5,
|
| 30 |
+
"Ios17.add" : 66,
|
| 31 |
+
"Ios16.fillLike" : 1,
|
| 32 |
+
"Shape" : 1,
|
| 33 |
+
"Ios17.gather" : 3,
|
| 34 |
+
"Ios17.log" : 1,
|
| 35 |
+
"Ios17.less" : 1,
|
| 36 |
+
"Ios17.sub" : 2,
|
| 37 |
+
"Ios17.pow" : 25,
|
| 38 |
+
"Ios17.cast" : 4,
|
| 39 |
+
"Ios16.gelu" : 12,
|
| 40 |
+
"Ios17.linear" : 84,
|
| 41 |
+
"Ios17.abs" : 1,
|
| 42 |
+
"Ios17.greaterEqual" : 2,
|
| 43 |
+
"Ios17.minimum" : 1,
|
| 44 |
+
"Ios17.rsqrt" : 25,
|
| 45 |
+
"Ios17.greater" : 1,
|
| 46 |
+
"Ios17.mul" : 67
|
| 47 |
+
},
|
| 48 |
+
"computePrecision" : "Mixed (Float32, Int32)",
|
| 49 |
+
"isUpdatable" : "0",
|
| 50 |
+
"stateSchema" : [
|
| 51 |
+
|
| 52 |
+
],
|
| 53 |
+
"availability" : {
|
| 54 |
+
"macOS" : "14.0",
|
| 55 |
+
"tvOS" : "17.0",
|
| 56 |
+
"visionOS" : "1.0",
|
| 57 |
+
"watchOS" : "10.0",
|
| 58 |
+
"iOS" : "17.0",
|
| 59 |
+
"macCatalyst" : "17.0"
|
| 60 |
+
},
|
| 61 |
+
"modelType" : {
|
| 62 |
+
"name" : "MLModelType_mlProgram"
|
| 63 |
+
},
|
| 64 |
+
"userDefinedMetadata" : {
|
| 65 |
+
"com.github.apple.coremltools.conversion_date" : "2026-03-13",
|
| 66 |
+
"com.github.apple.coremltools.source" : "torch==2.7.0",
|
| 67 |
+
"com.github.apple.coremltools.version" : "9.0",
|
| 68 |
+
"com.github.apple.coremltools.source_dialect" : "TorchScript"
|
| 69 |
+
},
|
| 70 |
+
"inputSchema" : [
|
| 71 |
+
{
|
| 72 |
+
"dataType" : "Int32",
|
| 73 |
+
"hasShapeFlexibility" : "1",
|
| 74 |
+
"isOptional" : "0",
|
| 75 |
+
"shapeFlexibility" : "1 × 1...64",
|
| 76 |
+
"shapeRange" : "[[1, 1], [1, 64]]",
|
| 77 |
+
"formattedType" : "MultiArray (Int32 1 × 16)",
|
| 78 |
+
"type" : "MultiArray",
|
| 79 |
+
"shape" : "[1, 16]",
|
| 80 |
+
"name" : "input_ids",
|
| 81 |
+
"shortDescription" : ""
|
| 82 |
+
},
|
| 83 |
+
{
|
| 84 |
+
"dataType" : "Int32",
|
| 85 |
+
"hasShapeFlexibility" : "1",
|
| 86 |
+
"isOptional" : "0",
|
| 87 |
+
"shapeFlexibility" : "1 × 1...64",
|
| 88 |
+
"shapeRange" : "[[1, 1], [1, 64]]",
|
| 89 |
+
"formattedType" : "MultiArray (Int32 1 × 16)",
|
| 90 |
+
"type" : "MultiArray",
|
| 91 |
+
"shape" : "[1, 16]",
|
| 92 |
+
"name" : "attention_mask",
|
| 93 |
+
"shortDescription" : ""
|
| 94 |
+
}
|
| 95 |
+
],
|
| 96 |
+
"generatedClassName" : "G2PEncoder",
|
| 97 |
+
"method" : "predict"
|
| 98 |
+
}
|
| 99 |
+
]
|
MultilingualG2PEncoder.mlmodelc/model.mil
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
MultilingualG2PEncoder.mlmodelc/weights/weight.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:11b225e93b6b1fe6fb85c9d4317724e1a033d6123fdc01dc2ad85f3c1f168eb3
|
| 3 |
+
size 57056704
|