7767517 2888 3632 MemoryData 0 0 1 tensor_197913 0=2048 21=0 MemoryData 1 0 1 tensor_197916 0=2048 21=0 MemoryData 2 0 1 tensor_197919 0=2048 21=0 MemoryData 3 0 1 tensor_197922 0=2048 21=0 MemoryData 4 0 1 tensor_197925 0=2048 21=0 MemoryData 5 0 1 tensor_197928 0=2048 21=0 MemoryData 6 0 1 tensor_197931 0=2048 21=0 MemoryData 7 0 1 tensor_197934 0=2048 21=0 MemoryData 8 0 1 tensor_197937 0=2048 21=0 MemoryData 9 0 1 tensor_197940 0=2048 21=0 MemoryData 10 0 1 tensor_197943 0=2048 21=0 MemoryData 11 0 1 tensor_197946 0=2048 21=0 MemoryData 12 0 1 tensor_197949 0=2048 21=0 MemoryData 13 0 1 tensor_197952 0=2048 21=0 MemoryData 14 0 1 tensor_197955 0=2048 21=0 MemoryData 15 0 1 tensor_197958 0=2048 21=0 MemoryData 16 0 1 tensor_197961 0=2048 21=0 MemoryData 17 0 1 tensor_197964 0=2048 21=0 MemoryData 18 0 1 tensor_197967 0=2048 21=0 MemoryData 19 0 1 tensor_197970 0=2048 21=0 MemoryData 20 0 1 tensor_197973 0=2048 21=0 MemoryData 21 0 1 tensor_197976 0=2048 21=0 MemoryData 22 0 1 tensor_197979 0=2048 21=0 MemoryData 23 0 1 tensor_197982 0=2048 21=0 MemoryData 24 0 1 tensor_197985 0=2048 21=0 MemoryData 25 0 1 tensor_197988 0=2048 21=0 MemoryData 26 0 1 tensor_197991 0=2048 21=0 MemoryData 27 0 1 tensor_197994 0=2048 21=0 MemoryData 28 0 1 tensor_197997 0=2048 21=0 MemoryData 29 0 1 tensor_198000 0=2048 21=0 MemoryData 30 0 1 tensor_198003 0=2048 21=0 MemoryData 31 0 1 tensor_198006 0=2048 21=0 MemoryData 32 0 1 tensor_198009 0=2048 21=0 MemoryData 33 0 1 tensor_198012 0=2048 21=0 MemoryData 34 0 1 tensor_198015 0=2048 21=0 MemoryData 35 0 1 tensor_198018 0=2048 21=0 MemoryData 36 0 1 tensor_198021 0=2048 21=0 MemoryData 37 0 1 tensor_198024 0=2048 21=0 MemoryData 38 0 1 tensor_198027 0=2048 21=0 MemoryData 39 0 1 tensor_198030 0=2048 21=0 MemoryData 40 0 1 tensor_198033 0=2048 21=0 MemoryData 41 0 1 tensor_198036 0=2048 21=0 MemoryData 42 0 1 tensor_198039 0=2048 21=0 MemoryData 43 0 1 tensor_198042 0=2048 21=0 MemoryData 44 0 1 tensor_198045 0=2048 21=0 MemoryData 45 0 1 tensor_198048 0=2048 21=0 MemoryData 46 0 1 tensor_198051 0=2048 21=0 MemoryData 47 0 1 tensor_198054 0=2048 21=0 MemoryData 48 0 1 tensor_198057 0=2048 21=0 MemoryData 49 0 1 tensor_198060 0=2048 21=0 MemoryData 50 0 1 tensor_198063 0=2048 21=0 MemoryData 51 0 1 tensor_198066 0=2048 21=0 MemoryData 52 0 1 tensor_198069 0=2048 21=0 MemoryData 53 0 1 tensor_198072 0=2048 21=0 MemoryData 54 0 1 tensor_198075 0=2048 21=0 MemoryData 55 0 1 tensor_198078 0=2048 21=0 MemoryData 56 0 1 tensor_198081 0=2048 21=0 MemoryData 57 0 1 tensor_198084 0=2048 21=0 MemoryData 58 0 1 tensor_198087 0=2048 21=0 MemoryData 59 0 1 tensor_198090 0=2048 21=0 MemoryData 60 0 1 tensor_198093 0=2048 21=0 MemoryData 61 0 1 tensor_198096 0=2048 21=0 MemoryData 62 0 1 tensor_198099 0=2048 21=0 MemoryData 63 0 1 tensor_198102 0=2048 21=0 MemoryData 64 0 1 tensor_198105 0=2048 21=0 MemoryData 65 0 1 tensor_198108 0=2048 21=0 MemoryData 66 0 1 tensor_198111 0=2048 21=0 MemoryData 67 0 1 tensor_198114 0=2048 21=0 MemoryData 68 0 1 tensor_198117 0=2048 21=0 MemoryData 69 0 1 tensor_198120 0=2048 21=0 MemoryData 70 0 1 tensor_198123 0=2048 21=0 MemoryData 71 0 1 tensor_198126 0=2048 21=0 MemoryData 72 0 1 tensor_198129 0=2048 21=0 MemoryData 73 0 1 tensor_198132 0=2048 21=0 MemoryData 74 0 1 tensor_198135 0=2048 21=0 MemoryData 75 0 1 tensor_198138 0=2048 21=0 MemoryData 76 0 1 tensor_198141 0=2048 21=0 MemoryData 77 0 1 tensor_198144 0=2048 21=0 MemoryData 78 0 1 tensor_198147 0=2048 21=0 MemoryData 79 0 1 tensor_198150 0=2048 21=0 MemoryData 80 0 1 tensor_198153 0=2048 21=0 MemoryData 81 0 1 tensor_198156 0=2048 21=0 MemoryData 82 0 1 tensor_198159 0=2048 21=0 MemoryData 83 0 1 tensor_198162 0=2048 21=0 MemoryData 84 0 1 tensor_198165 0=2048 21=0 MemoryData 85 0 1 tensor_198168 0=2048 21=0 MemoryData 86 0 1 tensor_198171 0=2048 21=0 MemoryData 87 0 1 tensor_198174 0=2048 21=0 MemoryData 88 0 1 tensor_198177 0=2048 21=0 MemoryData 89 0 1 tensor_198180 0=2048 21=0 MemoryData 90 0 1 tensor_198183 0=2048 21=0 MemoryData 91 0 1 tensor_198186 0=2048 21=0 MemoryData 92 0 1 tensor_198189 0=2048 21=0 MemoryData 93 0 1 tensor_198192 0=2048 21=0 MemoryData 94 0 1 tensor_198195 0=2048 21=0 MemoryData 95 0 1 tensor_198198 0=2048 21=0 MemoryData 96 0 1 tensor_198201 0=2048 21=0 MemoryData 97 0 1 tensor_198204 0=2048 21=0 MemoryData 98 0 1 tensor_198207 0=2048 21=0 MemoryData 99 0 1 tensor_198210 0=2048 21=0 MemoryData 100 0 1 tensor_198213 0=2048 21=0 MemoryData 101 0 1 tensor_198216 0=2048 21=0 MemoryData 102 0 1 tensor_198219 0=2048 21=0 MemoryData 103 0 1 tensor_198222 0=2048 21=0 MemoryData 104 0 1 tensor_198225 0=2048 21=0 MemoryData 105 0 1 tensor_198228 0=2048 21=0 MemoryData 106 0 1 tensor_198231 0=2048 21=0 MemoryData 107 0 1 tensor_198234 0=2048 21=0 MemoryData 108 0 1 tensor_198237 0=2048 21=0 MemoryData 109 0 1 tensor_198240 0=2048 21=0 MemoryData 110 0 1 tensor_198243 0=2048 21=0 MemoryData 111 0 1 tensor_198246 0=2048 21=0 MemoryData 112 0 1 tensor_198249 0=2048 21=0 MemoryData 113 0 1 tensor_198252 0=2048 21=0 MemoryData 114 0 1 tensor_198255 0=2048 21=0 MemoryData 115 0 1 tensor_198258 0=2048 21=0 MemoryData 116 0 1 tensor_198261 0=2048 21=0 MemoryData 117 0 1 tensor_198264 0=2048 21=0 MemoryData 118 0 1 tensor_198267 0=2048 21=0 MemoryData 119 0 1 tensor_198270 0=2048 21=0 Input 120 0 1 input_id 0=1 Input 121 0 1 state_0_0 0=2048 Input 122 0 1 state_0_1 0=2048 Input 123 0 1 state_0_2 0=2048 Input 124 0 1 state_0_3 0=2048 Input 125 0 1 state_0_4 0=2048 Input 126 0 1 state_1_0 0=2048 Input 127 0 1 state_1_1 0=2048 Input 128 0 1 state_1_2 0=2048 Input 129 0 1 state_1_3 0=2048 Input 130 0 1 state_1_4 0=2048 Input 131 0 1 state_2_0 0=2048 Input 132 0 1 state_2_1 0=2048 Input 133 0 1 state_2_2 0=2048 Input 134 0 1 state_2_3 0=2048 Input 135 0 1 state_2_4 0=2048 Input 136 0 1 state_3_0 0=2048 Input 137 0 1 state_3_1 0=2048 Input 138 0 1 state_3_2 0=2048 Input 139 0 1 state_3_3 0=2048 Input 140 0 1 state_3_4 0=2048 Input 141 0 1 state_4_0 0=2048 Input 142 0 1 state_4_1 0=2048 Input 143 0 1 state_4_2 0=2048 Input 144 0 1 state_4_3 0=2048 Input 145 0 1 state_4_4 0=2048 Input 146 0 1 state_5_0 0=2048 Input 147 0 1 state_5_1 0=2048 Input 148 0 1 state_5_2 0=2048 Input 149 0 1 state_5_3 0=2048 Input 150 0 1 state_5_4 0=2048 Input 151 0 1 state_6_0 0=2048 Input 152 0 1 state_6_1 0=2048 Input 153 0 1 state_6_2 0=2048 Input 154 0 1 state_6_3 0=2048 Input 155 0 1 state_6_4 0=2048 Input 156 0 1 state_7_0 0=2048 Input 157 0 1 state_7_1 0=2048 Input 158 0 1 state_7_2 0=2048 Input 159 0 1 state_7_3 0=2048 Input 160 0 1 state_7_4 0=2048 Input 161 0 1 state_8_0 0=2048 Input 162 0 1 state_8_1 0=2048 Input 163 0 1 state_8_2 0=2048 Input 164 0 1 state_8_3 0=2048 Input 165 0 1 state_8_4 0=2048 Input 166 0 1 state_9_0 0=2048 Input 167 0 1 state_9_1 0=2048 Input 168 0 1 state_9_2 0=2048 Input 169 0 1 state_9_3 0=2048 Input 170 0 1 state_9_4 0=2048 Input 171 0 1 state_10_0 0=2048 Input 172 0 1 state_10_1 0=2048 Input 173 0 1 state_10_2 0=2048 Input 174 0 1 state_10_3 0=2048 Input 175 0 1 state_10_4 0=2048 Input 176 0 1 state_11_0 0=2048 Input 177 0 1 state_11_1 0=2048 Input 178 0 1 state_11_2 0=2048 Input 179 0 1 state_11_3 0=2048 Input 180 0 1 state_11_4 0=2048 Input 181 0 1 state_12_0 0=2048 Input 182 0 1 state_12_1 0=2048 Input 183 0 1 state_12_2 0=2048 Input 184 0 1 state_12_3 0=2048 Input 185 0 1 state_12_4 0=2048 Input 186 0 1 state_13_0 0=2048 Input 187 0 1 state_13_1 0=2048 Input 188 0 1 state_13_2 0=2048 Input 189 0 1 state_13_3 0=2048 Input 190 0 1 state_13_4 0=2048 Input 191 0 1 state_14_0 0=2048 Input 192 0 1 state_14_1 0=2048 Input 193 0 1 state_14_2 0=2048 Input 194 0 1 state_14_3 0=2048 Input 195 0 1 state_14_4 0=2048 Input 196 0 1 state_15_0 0=2048 Input 197 0 1 state_15_1 0=2048 Input 198 0 1 state_15_2 0=2048 Input 199 0 1 state_15_3 0=2048 Input 200 0 1 state_15_4 0=2048 Input 201 0 1 state_16_0 0=2048 Input 202 0 1 state_16_1 0=2048 Input 203 0 1 state_16_2 0=2048 Input 204 0 1 state_16_3 0=2048 Input 205 0 1 state_16_4 0=2048 Input 206 0 1 state_17_0 0=2048 Input 207 0 1 state_17_1 0=2048 Input 208 0 1 state_17_2 0=2048 Input 209 0 1 state_17_3 0=2048 Input 210 0 1 state_17_4 0=2048 Input 211 0 1 state_18_0 0=2048 Input 212 0 1 state_18_1 0=2048 Input 213 0 1 state_18_2 0=2048 Input 214 0 1 state_18_3 0=2048 Input 215 0 1 state_18_4 0=2048 Input 216 0 1 state_19_0 0=2048 Input 217 0 1 state_19_1 0=2048 Input 218 0 1 state_19_2 0=2048 Input 219 0 1 state_19_3 0=2048 Input 220 0 1 state_19_4 0=2048 Input 221 0 1 state_20_0 0=2048 Input 222 0 1 state_20_1 0=2048 Input 223 0 1 state_20_2 0=2048 Input 224 0 1 state_20_3 0=2048 Input 225 0 1 state_20_4 0=2048 Input 226 0 1 state_21_0 0=2048 Input 227 0 1 state_21_1 0=2048 Input 228 0 1 state_21_2 0=2048 Input 229 0 1 state_21_3 0=2048 Input 230 0 1 state_21_4 0=2048 Input 231 0 1 state_22_0 0=2048 Input 232 0 1 state_22_1 0=2048 Input 233 0 1 state_22_2 0=2048 Input 234 0 1 state_22_3 0=2048 Input 235 0 1 state_22_4 0=2048 Input 236 0 1 state_23_0 0=2048 Input 237 0 1 state_23_1 0=2048 Input 238 0 1 state_23_2 0=2048 Input 239 0 1 state_23_3 0=2048 Input 240 0 1 state_23_4 0=2048 Embed 241 1 1 input_id tensor_198395 0=2048 1=65536 3=134217728 4=64 Reshape 242 1 1 tensor_198395 tensor_198398 0=2048 Split 243 1 2 tensor_198398 tensor_198399 tensor_198400 LayerNorm 244 1 1 tensor_198399 tensor_198401 0=2048 1=1.000000e-05 2=1 Split 245 1 4 tensor_198401 tensor_198402 tensor_198403 tensor_198404 tensor_198405 Split 246 1 3 state_0_0 tensor_198406 tensor_198407 tensor_198408 MemoryData 247 0 1 blocks.0.att.time_mix_k 0=2048 21=0 Split 248 1 2 blocks.0.att.time_mix_k tensor_198410 tensor_198411 MemoryData 249 0 1 blocks.0.att.time_mix_v 0=2048 21=0 Split 250 1 2 blocks.0.att.time_mix_v tensor_198413 tensor_198414 MemoryData 251 0 1 blocks.0.att.time_mix_r 0=2048 21=0 Split 252 1 2 blocks.0.att.time_mix_r tensor_198416 tensor_198417 BinaryOp 253 1 1 tensor_198411 tensor_198418 0=7 1=1 2=1.000000e+00 BinaryOp 254 2 1 tensor_198406 tensor_198418 tensor_198419 0=2 BinaryOp 255 2 1 tensor_198402 tensor_198410 tensor_198420 0=2 BinaryOp 256 2 1 tensor_198420 tensor_198419 tensor_198421 0=0 BinaryOp 257 1 1 tensor_198414 tensor_198422 0=7 1=1 2=1.000000e+00 BinaryOp 258 2 1 tensor_198407 tensor_198422 tensor_198423 0=2 BinaryOp 259 2 1 tensor_198403 tensor_198413 tensor_198424 0=2 BinaryOp 260 2 1 tensor_198424 tensor_198423 tensor_198425 0=0 BinaryOp 261 1 1 tensor_198417 tensor_198426 0=7 1=1 2=1.000000e+00 BinaryOp 262 2 1 tensor_198408 tensor_198426 tensor_198427 0=2 BinaryOp 263 2 1 tensor_198404 tensor_198416 tensor_198428 0=2 BinaryOp 264 2 1 tensor_198428 tensor_198427 tensor_198429 0=0 Reshape 265 1 1 tensor_198429 tensor_198430 0=0 1=1 Gemm 266 1 1 tensor_198430 tensor_198432 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 267 1 1 tensor_198432 tensor_198433 0=-1 Sigmoid 268 1 1 tensor_198433 tensor_198434 Reshape 269 1 1 tensor_198421 tensor_198435 0=0 1=1 Gemm 270 1 1 tensor_198435 tensor_198437 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 271 1 1 tensor_198437 tensor_198438 0=-1 Split 272 1 3 tensor_198438 tensor_198439 tensor_198440 tensor_198441 Reshape 273 1 1 tensor_198425 tensor_198442 0=0 1=1 Gemm 274 1 1 tensor_198442 tensor_198444 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 275 1 1 tensor_198444 tensor_198445 0=-1 Split 276 1 2 tensor_198445 tensor_198446 tensor_198447 MemoryData 277 0 1 blocks.0.att.time_first 0=2048 21=0 BinaryOp 278 2 1 blocks.0.att.time_first tensor_198439 tensor_198449 0=0 Split 279 1 2 tensor_198449 tensor_198450 tensor_198451 Split 280 1 3 state_0_3 tensor_198452 tensor_198453 tensor_198454 BinaryOp 281 2 1 tensor_198452 tensor_198450 tensor_198455 0=4 Split 282 1 2 tensor_198455 tensor_198456 tensor_198457 BinaryOp 283 2 1 tensor_198453 tensor_198456 tensor_198458 0=1 Exp 284 1 1 tensor_198458 tensor_198459 Split 285 1 2 tensor_198459 tensor_198460 tensor_198461 BinaryOp 286 2 1 tensor_198451 tensor_198457 tensor_198462 0=1 Exp 287 1 1 tensor_198462 tensor_198463 Split 288 1 2 tensor_198463 tensor_198464 tensor_198465 Split 289 1 2 state_0_1 tensor_198466 tensor_198467 Split 290 1 2 state_0_2 tensor_198468 tensor_198469 BinaryOp 291 2 1 tensor_198461 tensor_198468 tensor_198470 0=2 BinaryOp 292 2 1 tensor_198470 tensor_198465 tensor_198471 0=0 BinaryOp 293 2 1 tensor_198464 tensor_198446 tensor_198472 0=2 BinaryOp 294 2 1 tensor_198460 tensor_198466 tensor_198473 0=2 BinaryOp 295 2 1 tensor_198473 tensor_198472 tensor_198474 0=0 BinaryOp 296 2 1 tensor_198474 tensor_198471 tensor_198475 0=3 MemoryData 297 0 1 blocks.0.att.time_decay 0=2048 21=0 BinaryOp 298 2 1 blocks.0.att.time_decay tensor_198454 tensor_198477 0=0 Split 299 1 2 tensor_198477 tensor_198478 tensor_198479 BinaryOp 300 2 1 tensor_198478 tensor_198440 tensor_198480 0=4 Split 301 1 3 tensor_198480 tensor_198481 tensor_198482 tensor_198483 BinaryOp 302 2 1 tensor_198479 tensor_198481 tensor_198484 0=1 Exp 303 1 1 tensor_198484 tensor_198485 Split 304 1 2 tensor_198485 tensor_198486 tensor_198487 BinaryOp 305 2 1 tensor_198441 tensor_198482 tensor_198488 0=1 Exp 306 1 1 tensor_198488 tensor_198489 Split 307 1 2 tensor_198489 tensor_198490 tensor_198491 BinaryOp 308 2 1 tensor_198434 tensor_198475 tensor_198492 0=2 Reshape 309 1 1 tensor_198492 tensor_198493 0=0 1=1 Gemm 310 1 1 tensor_198493 tensor_198495 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 311 1 1 tensor_198495 tensor_198496 0=-1 BinaryOp 312 2 1 tensor_198400 tensor_198496 tensor_198497 0=0 BinaryOp 313 2 1 tensor_198490 tensor_198447 tensor_198498 0=2 BinaryOp 314 2 1 tensor_198486 tensor_198467 tensor_198499 0=2 BinaryOp 315 2 1 tensor_198499 tensor_198498 tensor_198500 0=0 BinaryOp 316 2 1 tensor_198487 tensor_198469 tensor_198501 0=2 BinaryOp 317 2 1 tensor_198501 tensor_198491 tensor_198502 0=0 Split 318 1 1 tensor_198405 output_state_0_0 Split 319 1 1 tensor_198500 output_state_0_1 Split 320 1 1 tensor_198502 output_state_0_2 Split 321 1 1 tensor_198483 output_state_0_3 Split 322 1 2 tensor_198497 tensor_198507 tensor_198508 LayerNorm 323 1 1 tensor_198507 tensor_198509 0=2048 1=1.000000e-05 2=1 Split 324 1 3 tensor_198509 tensor_198510 tensor_198511 tensor_198512 Split 325 1 2 state_0_4 tensor_198513 tensor_198514 MemoryData 326 0 1 blocks.0.ffn.time_mix_k 0=2048 21=0 Split 327 1 2 blocks.0.ffn.time_mix_k tensor_198516 tensor_198517 MemoryData 328 0 1 blocks.0.ffn.time_mix_r 0=2048 21=0 Split 329 1 2 blocks.0.ffn.time_mix_r tensor_198519 tensor_198520 BinaryOp 330 1 1 tensor_198517 tensor_198521 0=7 1=1 2=1.000000e+00 BinaryOp 331 2 1 tensor_198513 tensor_198521 tensor_198522 0=2 BinaryOp 332 2 1 tensor_198510 tensor_198516 tensor_198523 0=2 BinaryOp 333 2 1 tensor_198523 tensor_198522 tensor_198524 0=0 BinaryOp 334 1 1 tensor_198520 tensor_198525 0=7 1=1 2=1.000000e+00 BinaryOp 335 2 1 tensor_198514 tensor_198525 tensor_198526 0=2 BinaryOp 336 2 1 tensor_198511 tensor_198519 tensor_198527 0=2 BinaryOp 337 2 1 tensor_198527 tensor_198526 tensor_198528 0=0 Reshape 338 1 1 tensor_198528 tensor_198529 0=0 1=1 Gemm 339 1 1 tensor_198529 tensor_198531 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 340 1 1 tensor_198531 tensor_198532 0=-1 Sigmoid 341 1 1 tensor_198532 tensor_198533 Reshape 342 1 1 tensor_198524 tensor_198534 0=0 1=1 Gemm 343 1 1 tensor_198534 tensor_198536 4=0 5=1 6=1 7=0 8=8192 9=2048 10=-1 Reshape 344 1 1 tensor_198536 tensor_198537 0=-1 ReLU 345 1 1 tensor_198537 tensor_198538 BinaryOp 346 2 1 tensor_198538 tensor_198538 tensor_198539 0=2 Reshape 347 1 1 tensor_198539 tensor_198540 0=0 1=1 Gemm 348 1 1 tensor_198540 tensor_198542 4=0 5=1 6=1 7=0 8=2048 9=8192 10=-1 Reshape 349 1 1 tensor_198542 tensor_198543 0=-1 BinaryOp 350 2 1 tensor_198533 tensor_198543 tensor_198544 0=2 BinaryOp 351 2 1 tensor_198508 tensor_198544 tensor_198545 0=0 Split 352 1 1 tensor_198512 output_state_0_4 Split 353 1 2 tensor_198545 tensor_198547 tensor_198548 LayerNorm 354 1 1 tensor_198547 tensor_198549 0=2048 1=1.000000e-05 2=1 Split 355 1 4 tensor_198549 tensor_198550 tensor_198551 tensor_198552 tensor_198553 Split 356 1 3 state_1_0 tensor_198554 tensor_198555 tensor_198556 MemoryData 357 0 1 blocks.1.att.time_mix_k 0=2048 21=0 Split 358 1 2 blocks.1.att.time_mix_k tensor_198558 tensor_198559 MemoryData 359 0 1 blocks.1.att.time_mix_v 0=2048 21=0 Split 360 1 2 blocks.1.att.time_mix_v tensor_198561 tensor_198562 MemoryData 361 0 1 blocks.1.att.time_mix_r 0=2048 21=0 Split 362 1 2 blocks.1.att.time_mix_r tensor_198564 tensor_198565 BinaryOp 363 1 1 tensor_198559 tensor_198566 0=7 1=1 2=1.000000e+00 BinaryOp 364 2 1 tensor_198554 tensor_198566 tensor_198567 0=2 BinaryOp 365 2 1 tensor_198550 tensor_198558 tensor_198568 0=2 BinaryOp 366 2 1 tensor_198568 tensor_198567 tensor_198569 0=0 BinaryOp 367 1 1 tensor_198562 tensor_198570 0=7 1=1 2=1.000000e+00 BinaryOp 368 2 1 tensor_198555 tensor_198570 tensor_198571 0=2 BinaryOp 369 2 1 tensor_198551 tensor_198561 tensor_198572 0=2 BinaryOp 370 2 1 tensor_198572 tensor_198571 tensor_198573 0=0 BinaryOp 371 1 1 tensor_198565 tensor_198574 0=7 1=1 2=1.000000e+00 BinaryOp 372 2 1 tensor_198556 tensor_198574 tensor_198575 0=2 BinaryOp 373 2 1 tensor_198552 tensor_198564 tensor_198576 0=2 BinaryOp 374 2 1 tensor_198576 tensor_198575 tensor_198577 0=0 Reshape 375 1 1 tensor_198577 tensor_198578 0=0 1=1 Gemm 376 1 1 tensor_198578 tensor_198580 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 377 1 1 tensor_198580 tensor_198581 0=-1 Sigmoid 378 1 1 tensor_198581 tensor_198582 Reshape 379 1 1 tensor_198569 tensor_198583 0=0 1=1 Gemm 380 1 1 tensor_198583 tensor_198585 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 381 1 1 tensor_198585 tensor_198586 0=-1 Split 382 1 3 tensor_198586 tensor_198587 tensor_198588 tensor_198589 Reshape 383 1 1 tensor_198573 tensor_198590 0=0 1=1 Gemm 384 1 1 tensor_198590 tensor_198592 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 385 1 1 tensor_198592 tensor_198593 0=-1 Split 386 1 2 tensor_198593 tensor_198594 tensor_198595 MemoryData 387 0 1 blocks.1.att.time_first 0=2048 21=0 BinaryOp 388 2 1 blocks.1.att.time_first tensor_198587 tensor_198597 0=0 Split 389 1 2 tensor_198597 tensor_198598 tensor_198599 Split 390 1 3 state_1_3 tensor_198600 tensor_198601 tensor_198602 BinaryOp 391 2 1 tensor_198600 tensor_198598 tensor_198603 0=4 Split 392 1 2 tensor_198603 tensor_198604 tensor_198605 BinaryOp 393 2 1 tensor_198601 tensor_198604 tensor_198606 0=1 Exp 394 1 1 tensor_198606 tensor_198607 Split 395 1 2 tensor_198607 tensor_198608 tensor_198609 BinaryOp 396 2 1 tensor_198599 tensor_198605 tensor_198610 0=1 Exp 397 1 1 tensor_198610 tensor_198611 Split 398 1 2 tensor_198611 tensor_198612 tensor_198613 Split 399 1 2 state_1_1 tensor_198614 tensor_198615 Split 400 1 2 state_1_2 tensor_198616 tensor_198617 BinaryOp 401 2 1 tensor_198609 tensor_198616 tensor_198618 0=2 BinaryOp 402 2 1 tensor_198618 tensor_198613 tensor_198619 0=0 BinaryOp 403 2 1 tensor_198612 tensor_198594 tensor_198620 0=2 BinaryOp 404 2 1 tensor_198608 tensor_198614 tensor_198621 0=2 BinaryOp 405 2 1 tensor_198621 tensor_198620 tensor_198622 0=0 BinaryOp 406 2 1 tensor_198622 tensor_198619 tensor_198623 0=3 MemoryData 407 0 1 blocks.1.att.time_decay 0=2048 21=0 BinaryOp 408 2 1 blocks.1.att.time_decay tensor_198602 tensor_198625 0=0 Split 409 1 2 tensor_198625 tensor_198626 tensor_198627 BinaryOp 410 2 1 tensor_198626 tensor_198588 tensor_198628 0=4 Split 411 1 3 tensor_198628 tensor_198629 tensor_198630 tensor_198631 BinaryOp 412 2 1 tensor_198627 tensor_198629 tensor_198632 0=1 Exp 413 1 1 tensor_198632 tensor_198633 Split 414 1 2 tensor_198633 tensor_198634 tensor_198635 BinaryOp 415 2 1 tensor_198589 tensor_198630 tensor_198636 0=1 Exp 416 1 1 tensor_198636 tensor_198637 Split 417 1 2 tensor_198637 tensor_198638 tensor_198639 BinaryOp 418 2 1 tensor_198582 tensor_198623 tensor_198640 0=2 Reshape 419 1 1 tensor_198640 tensor_198641 0=0 1=1 Gemm 420 1 1 tensor_198641 tensor_198643 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 421 1 1 tensor_198643 tensor_198644 0=-1 BinaryOp 422 2 1 tensor_198548 tensor_198644 tensor_198645 0=0 BinaryOp 423 2 1 tensor_198638 tensor_198595 tensor_198646 0=2 BinaryOp 424 2 1 tensor_198634 tensor_198615 tensor_198647 0=2 BinaryOp 425 2 1 tensor_198647 tensor_198646 tensor_198648 0=0 BinaryOp 426 2 1 tensor_198635 tensor_198617 tensor_198649 0=2 BinaryOp 427 2 1 tensor_198649 tensor_198639 tensor_198650 0=0 Split 428 1 1 tensor_198553 output_state_1_0 Split 429 1 1 tensor_198648 output_state_1_1 Split 430 1 1 tensor_198650 output_state_1_2 Split 431 1 1 tensor_198631 output_state_1_3 Split 432 1 2 tensor_198645 tensor_198655 tensor_198656 LayerNorm 433 1 1 tensor_198655 tensor_198657 0=2048 1=1.000000e-05 2=1 Split 434 1 3 tensor_198657 tensor_198658 tensor_198659 tensor_198660 Split 435 1 2 state_1_4 tensor_198661 tensor_198662 MemoryData 436 0 1 blocks.1.ffn.time_mix_k 0=2048 21=0 Split 437 1 2 blocks.1.ffn.time_mix_k tensor_198664 tensor_198665 MemoryData 438 0 1 blocks.1.ffn.time_mix_r 0=2048 21=0 Split 439 1 2 blocks.1.ffn.time_mix_r tensor_198667 tensor_198668 BinaryOp 440 1 1 tensor_198665 tensor_198669 0=7 1=1 2=1.000000e+00 BinaryOp 441 2 1 tensor_198661 tensor_198669 tensor_198670 0=2 BinaryOp 442 2 1 tensor_198658 tensor_198664 tensor_198671 0=2 BinaryOp 443 2 1 tensor_198671 tensor_198670 tensor_198672 0=0 BinaryOp 444 1 1 tensor_198668 tensor_198673 0=7 1=1 2=1.000000e+00 BinaryOp 445 2 1 tensor_198662 tensor_198673 tensor_198674 0=2 BinaryOp 446 2 1 tensor_198659 tensor_198667 tensor_198675 0=2 BinaryOp 447 2 1 tensor_198675 tensor_198674 tensor_198676 0=0 Reshape 448 1 1 tensor_198676 tensor_198677 0=0 1=1 Gemm 449 1 1 tensor_198677 tensor_198679 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 450 1 1 tensor_198679 tensor_198680 0=-1 Sigmoid 451 1 1 tensor_198680 tensor_198681 Reshape 452 1 1 tensor_198672 tensor_198682 0=0 1=1 Gemm 453 1 1 tensor_198682 tensor_198684 4=0 5=1 6=1 7=0 8=8192 9=2048 10=-1 Reshape 454 1 1 tensor_198684 tensor_198685 0=-1 ReLU 455 1 1 tensor_198685 tensor_198686 BinaryOp 456 2 1 tensor_198686 tensor_198686 tensor_198687 0=2 Reshape 457 1 1 tensor_198687 tensor_198688 0=0 1=1 Gemm 458 1 1 tensor_198688 tensor_198690 4=0 5=1 6=1 7=0 8=2048 9=8192 10=-1 Reshape 459 1 1 tensor_198690 tensor_198691 0=-1 BinaryOp 460 2 1 tensor_198681 tensor_198691 tensor_198692 0=2 BinaryOp 461 2 1 tensor_198656 tensor_198692 tensor_198693 0=0 Split 462 1 1 tensor_198660 output_state_1_4 Split 463 1 2 tensor_198693 tensor_198695 tensor_198696 LayerNorm 464 1 1 tensor_198695 tensor_198697 0=2048 1=1.000000e-05 2=1 Split 465 1 4 tensor_198697 tensor_198698 tensor_198699 tensor_198700 tensor_198701 Split 466 1 3 state_2_0 tensor_198702 tensor_198703 tensor_198704 MemoryData 467 0 1 blocks.2.att.time_mix_k 0=2048 21=0 Split 468 1 2 blocks.2.att.time_mix_k tensor_198706 tensor_198707 MemoryData 469 0 1 blocks.2.att.time_mix_v 0=2048 21=0 Split 470 1 2 blocks.2.att.time_mix_v tensor_198709 tensor_198710 MemoryData 471 0 1 blocks.2.att.time_mix_r 0=2048 21=0 Split 472 1 2 blocks.2.att.time_mix_r tensor_198712 tensor_198713 BinaryOp 473 1 1 tensor_198707 tensor_198714 0=7 1=1 2=1.000000e+00 BinaryOp 474 2 1 tensor_198702 tensor_198714 tensor_198715 0=2 BinaryOp 475 2 1 tensor_198698 tensor_198706 tensor_198716 0=2 BinaryOp 476 2 1 tensor_198716 tensor_198715 tensor_198717 0=0 BinaryOp 477 1 1 tensor_198710 tensor_198718 0=7 1=1 2=1.000000e+00 BinaryOp 478 2 1 tensor_198703 tensor_198718 tensor_198719 0=2 BinaryOp 479 2 1 tensor_198699 tensor_198709 tensor_198720 0=2 BinaryOp 480 2 1 tensor_198720 tensor_198719 tensor_198721 0=0 BinaryOp 481 1 1 tensor_198713 tensor_198722 0=7 1=1 2=1.000000e+00 BinaryOp 482 2 1 tensor_198704 tensor_198722 tensor_198723 0=2 BinaryOp 483 2 1 tensor_198700 tensor_198712 tensor_198724 0=2 BinaryOp 484 2 1 tensor_198724 tensor_198723 tensor_198725 0=0 Reshape 485 1 1 tensor_198725 tensor_198726 0=0 1=1 Gemm 486 1 1 tensor_198726 tensor_198728 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 487 1 1 tensor_198728 tensor_198729 0=-1 Sigmoid 488 1 1 tensor_198729 tensor_198730 Reshape 489 1 1 tensor_198717 tensor_198731 0=0 1=1 Gemm 490 1 1 tensor_198731 tensor_198733 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 491 1 1 tensor_198733 tensor_198734 0=-1 Split 492 1 3 tensor_198734 tensor_198735 tensor_198736 tensor_198737 Reshape 493 1 1 tensor_198721 tensor_198738 0=0 1=1 Gemm 494 1 1 tensor_198738 tensor_198740 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 495 1 1 tensor_198740 tensor_198741 0=-1 Split 496 1 2 tensor_198741 tensor_198742 tensor_198743 MemoryData 497 0 1 blocks.2.att.time_first 0=2048 21=0 BinaryOp 498 2 1 blocks.2.att.time_first tensor_198735 tensor_198745 0=0 Split 499 1 2 tensor_198745 tensor_198746 tensor_198747 Split 500 1 3 state_2_3 tensor_198748 tensor_198749 tensor_198750 BinaryOp 501 2 1 tensor_198748 tensor_198746 tensor_198751 0=4 Split 502 1 2 tensor_198751 tensor_198752 tensor_198753 BinaryOp 503 2 1 tensor_198749 tensor_198752 tensor_198754 0=1 Exp 504 1 1 tensor_198754 tensor_198755 Split 505 1 2 tensor_198755 tensor_198756 tensor_198757 BinaryOp 506 2 1 tensor_198747 tensor_198753 tensor_198758 0=1 Exp 507 1 1 tensor_198758 tensor_198759 Split 508 1 2 tensor_198759 tensor_198760 tensor_198761 Split 509 1 2 state_2_1 tensor_198762 tensor_198763 Split 510 1 2 state_2_2 tensor_198764 tensor_198765 BinaryOp 511 2 1 tensor_198757 tensor_198764 tensor_198766 0=2 BinaryOp 512 2 1 tensor_198766 tensor_198761 tensor_198767 0=0 BinaryOp 513 2 1 tensor_198760 tensor_198742 tensor_198768 0=2 BinaryOp 514 2 1 tensor_198756 tensor_198762 tensor_198769 0=2 BinaryOp 515 2 1 tensor_198769 tensor_198768 tensor_198770 0=0 BinaryOp 516 2 1 tensor_198770 tensor_198767 tensor_198771 0=3 MemoryData 517 0 1 blocks.2.att.time_decay 0=2048 21=0 BinaryOp 518 2 1 blocks.2.att.time_decay tensor_198750 tensor_198773 0=0 Split 519 1 2 tensor_198773 tensor_198774 tensor_198775 BinaryOp 520 2 1 tensor_198774 tensor_198736 tensor_198776 0=4 Split 521 1 3 tensor_198776 tensor_198777 tensor_198778 tensor_198779 BinaryOp 522 2 1 tensor_198775 tensor_198777 tensor_198780 0=1 Exp 523 1 1 tensor_198780 tensor_198781 Split 524 1 2 tensor_198781 tensor_198782 tensor_198783 BinaryOp 525 2 1 tensor_198737 tensor_198778 tensor_198784 0=1 Exp 526 1 1 tensor_198784 tensor_198785 Split 527 1 2 tensor_198785 tensor_198786 tensor_198787 BinaryOp 528 2 1 tensor_198730 tensor_198771 tensor_198788 0=2 Reshape 529 1 1 tensor_198788 tensor_198789 0=0 1=1 Gemm 530 1 1 tensor_198789 tensor_198791 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 531 1 1 tensor_198791 tensor_198792 0=-1 BinaryOp 532 2 1 tensor_198696 tensor_198792 tensor_198793 0=0 BinaryOp 533 2 1 tensor_198786 tensor_198743 tensor_198794 0=2 BinaryOp 534 2 1 tensor_198782 tensor_198763 tensor_198795 0=2 BinaryOp 535 2 1 tensor_198795 tensor_198794 tensor_198796 0=0 BinaryOp 536 2 1 tensor_198783 tensor_198765 tensor_198797 0=2 BinaryOp 537 2 1 tensor_198797 tensor_198787 tensor_198798 0=0 Split 538 1 1 tensor_198701 output_state_2_0 Split 539 1 1 tensor_198796 output_state_2_1 Split 540 1 1 tensor_198798 output_state_2_2 Split 541 1 1 tensor_198779 output_state_2_3 Split 542 1 2 tensor_198793 tensor_198803 tensor_198804 LayerNorm 543 1 1 tensor_198803 tensor_198805 0=2048 1=1.000000e-05 2=1 Split 544 1 3 tensor_198805 tensor_198806 tensor_198807 tensor_198808 Split 545 1 2 state_2_4 tensor_198809 tensor_198810 MemoryData 546 0 1 blocks.2.ffn.time_mix_k 0=2048 21=0 Split 547 1 2 blocks.2.ffn.time_mix_k tensor_198812 tensor_198813 MemoryData 548 0 1 blocks.2.ffn.time_mix_r 0=2048 21=0 Split 549 1 2 blocks.2.ffn.time_mix_r tensor_198815 tensor_198816 BinaryOp 550 1 1 tensor_198813 tensor_198817 0=7 1=1 2=1.000000e+00 BinaryOp 551 2 1 tensor_198809 tensor_198817 tensor_198818 0=2 BinaryOp 552 2 1 tensor_198806 tensor_198812 tensor_198819 0=2 BinaryOp 553 2 1 tensor_198819 tensor_198818 tensor_198820 0=0 BinaryOp 554 1 1 tensor_198816 tensor_198821 0=7 1=1 2=1.000000e+00 BinaryOp 555 2 1 tensor_198810 tensor_198821 tensor_198822 0=2 BinaryOp 556 2 1 tensor_198807 tensor_198815 tensor_198823 0=2 BinaryOp 557 2 1 tensor_198823 tensor_198822 tensor_198824 0=0 Reshape 558 1 1 tensor_198824 tensor_198825 0=0 1=1 Gemm 559 1 1 tensor_198825 tensor_198827 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 560 1 1 tensor_198827 tensor_198828 0=-1 Sigmoid 561 1 1 tensor_198828 tensor_198829 Reshape 562 1 1 tensor_198820 tensor_198830 0=0 1=1 Gemm 563 1 1 tensor_198830 tensor_198832 4=0 5=1 6=1 7=0 8=8192 9=2048 10=-1 Reshape 564 1 1 tensor_198832 tensor_198833 0=-1 ReLU 565 1 1 tensor_198833 tensor_198834 BinaryOp 566 2 1 tensor_198834 tensor_198834 tensor_198835 0=2 Reshape 567 1 1 tensor_198835 tensor_198836 0=0 1=1 Gemm 568 1 1 tensor_198836 tensor_198838 4=0 5=1 6=1 7=0 8=2048 9=8192 10=-1 Reshape 569 1 1 tensor_198838 tensor_198839 0=-1 BinaryOp 570 2 1 tensor_198829 tensor_198839 tensor_198840 0=2 BinaryOp 571 2 1 tensor_198804 tensor_198840 tensor_198841 0=0 Split 572 1 1 tensor_198808 output_state_2_4 Split 573 1 2 tensor_198841 tensor_198843 tensor_198844 LayerNorm 574 1 1 tensor_198843 tensor_198845 0=2048 1=1.000000e-05 2=1 Split 575 1 4 tensor_198845 tensor_198846 tensor_198847 tensor_198848 tensor_198849 Split 576 1 3 state_3_0 tensor_198850 tensor_198851 tensor_198852 MemoryData 577 0 1 blocks.3.att.time_mix_k 0=2048 21=0 Split 578 1 2 blocks.3.att.time_mix_k tensor_198854 tensor_198855 MemoryData 579 0 1 blocks.3.att.time_mix_v 0=2048 21=0 Split 580 1 2 blocks.3.att.time_mix_v tensor_198857 tensor_198858 MemoryData 581 0 1 blocks.3.att.time_mix_r 0=2048 21=0 Split 582 1 2 blocks.3.att.time_mix_r tensor_198860 tensor_198861 BinaryOp 583 1 1 tensor_198855 tensor_198862 0=7 1=1 2=1.000000e+00 BinaryOp 584 2 1 tensor_198850 tensor_198862 tensor_198863 0=2 BinaryOp 585 2 1 tensor_198846 tensor_198854 tensor_198864 0=2 BinaryOp 586 2 1 tensor_198864 tensor_198863 tensor_198865 0=0 BinaryOp 587 1 1 tensor_198858 tensor_198866 0=7 1=1 2=1.000000e+00 BinaryOp 588 2 1 tensor_198851 tensor_198866 tensor_198867 0=2 BinaryOp 589 2 1 tensor_198847 tensor_198857 tensor_198868 0=2 BinaryOp 590 2 1 tensor_198868 tensor_198867 tensor_198869 0=0 BinaryOp 591 1 1 tensor_198861 tensor_198870 0=7 1=1 2=1.000000e+00 BinaryOp 592 2 1 tensor_198852 tensor_198870 tensor_198871 0=2 BinaryOp 593 2 1 tensor_198848 tensor_198860 tensor_198872 0=2 BinaryOp 594 2 1 tensor_198872 tensor_198871 tensor_198873 0=0 Reshape 595 1 1 tensor_198873 tensor_198874 0=0 1=1 Gemm 596 1 1 tensor_198874 tensor_198876 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 597 1 1 tensor_198876 tensor_198877 0=-1 Sigmoid 598 1 1 tensor_198877 tensor_198878 Reshape 599 1 1 tensor_198865 tensor_198879 0=0 1=1 Gemm 600 1 1 tensor_198879 tensor_198881 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 601 1 1 tensor_198881 tensor_198882 0=-1 Split 602 1 3 tensor_198882 tensor_198883 tensor_198884 tensor_198885 Reshape 603 1 1 tensor_198869 tensor_198886 0=0 1=1 Gemm 604 1 1 tensor_198886 tensor_198888 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 605 1 1 tensor_198888 tensor_198889 0=-1 Split 606 1 2 tensor_198889 tensor_198890 tensor_198891 MemoryData 607 0 1 blocks.3.att.time_first 0=2048 21=0 BinaryOp 608 2 1 blocks.3.att.time_first tensor_198883 tensor_198893 0=0 Split 609 1 2 tensor_198893 tensor_198894 tensor_198895 Split 610 1 3 state_3_3 tensor_198896 tensor_198897 tensor_198898 BinaryOp 611 2 1 tensor_198896 tensor_198894 tensor_198899 0=4 Split 612 1 2 tensor_198899 tensor_198900 tensor_198901 BinaryOp 613 2 1 tensor_198897 tensor_198900 tensor_198902 0=1 Exp 614 1 1 tensor_198902 tensor_198903 Split 615 1 2 tensor_198903 tensor_198904 tensor_198905 BinaryOp 616 2 1 tensor_198895 tensor_198901 tensor_198906 0=1 Exp 617 1 1 tensor_198906 tensor_198907 Split 618 1 2 tensor_198907 tensor_198908 tensor_198909 Split 619 1 2 state_3_1 tensor_198910 tensor_198911 Split 620 1 2 state_3_2 tensor_198912 tensor_198913 BinaryOp 621 2 1 tensor_198905 tensor_198912 tensor_198914 0=2 BinaryOp 622 2 1 tensor_198914 tensor_198909 tensor_198915 0=0 BinaryOp 623 2 1 tensor_198908 tensor_198890 tensor_198916 0=2 BinaryOp 624 2 1 tensor_198904 tensor_198910 tensor_198917 0=2 BinaryOp 625 2 1 tensor_198917 tensor_198916 tensor_198918 0=0 BinaryOp 626 2 1 tensor_198918 tensor_198915 tensor_198919 0=3 MemoryData 627 0 1 blocks.3.att.time_decay 0=2048 21=0 BinaryOp 628 2 1 blocks.3.att.time_decay tensor_198898 tensor_198921 0=0 Split 629 1 2 tensor_198921 tensor_198922 tensor_198923 BinaryOp 630 2 1 tensor_198922 tensor_198884 tensor_198924 0=4 Split 631 1 3 tensor_198924 tensor_198925 tensor_198926 tensor_198927 BinaryOp 632 2 1 tensor_198923 tensor_198925 tensor_198928 0=1 Exp 633 1 1 tensor_198928 tensor_198929 Split 634 1 2 tensor_198929 tensor_198930 tensor_198931 BinaryOp 635 2 1 tensor_198885 tensor_198926 tensor_198932 0=1 Exp 636 1 1 tensor_198932 tensor_198933 Split 637 1 2 tensor_198933 tensor_198934 tensor_198935 BinaryOp 638 2 1 tensor_198878 tensor_198919 tensor_198936 0=2 Reshape 639 1 1 tensor_198936 tensor_198937 0=0 1=1 Gemm 640 1 1 tensor_198937 tensor_198939 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 641 1 1 tensor_198939 tensor_198940 0=-1 BinaryOp 642 2 1 tensor_198844 tensor_198940 tensor_198941 0=0 BinaryOp 643 2 1 tensor_198934 tensor_198891 tensor_198942 0=2 BinaryOp 644 2 1 tensor_198930 tensor_198911 tensor_198943 0=2 BinaryOp 645 2 1 tensor_198943 tensor_198942 tensor_198944 0=0 BinaryOp 646 2 1 tensor_198931 tensor_198913 tensor_198945 0=2 BinaryOp 647 2 1 tensor_198945 tensor_198935 tensor_198946 0=0 Split 648 1 1 tensor_198849 output_state_3_0 Split 649 1 1 tensor_198944 output_state_3_1 Split 650 1 1 tensor_198946 output_state_3_2 Split 651 1 1 tensor_198927 output_state_3_3 Split 652 1 2 tensor_198941 tensor_198951 tensor_198952 LayerNorm 653 1 1 tensor_198951 tensor_198953 0=2048 1=1.000000e-05 2=1 Split 654 1 3 tensor_198953 tensor_198954 tensor_198955 tensor_198956 Split 655 1 2 state_3_4 tensor_198957 tensor_198958 MemoryData 656 0 1 blocks.3.ffn.time_mix_k 0=2048 21=0 Split 657 1 2 blocks.3.ffn.time_mix_k tensor_198960 tensor_198961 MemoryData 658 0 1 blocks.3.ffn.time_mix_r 0=2048 21=0 Split 659 1 2 blocks.3.ffn.time_mix_r tensor_198963 tensor_198964 BinaryOp 660 1 1 tensor_198961 tensor_198965 0=7 1=1 2=1.000000e+00 BinaryOp 661 2 1 tensor_198957 tensor_198965 tensor_198966 0=2 BinaryOp 662 2 1 tensor_198954 tensor_198960 tensor_198967 0=2 BinaryOp 663 2 1 tensor_198967 tensor_198966 tensor_198968 0=0 BinaryOp 664 1 1 tensor_198964 tensor_198969 0=7 1=1 2=1.000000e+00 BinaryOp 665 2 1 tensor_198958 tensor_198969 tensor_198970 0=2 BinaryOp 666 2 1 tensor_198955 tensor_198963 tensor_198971 0=2 BinaryOp 667 2 1 tensor_198971 tensor_198970 tensor_198972 0=0 Reshape 668 1 1 tensor_198972 tensor_198973 0=0 1=1 Gemm 669 1 1 tensor_198973 tensor_198975 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 670 1 1 tensor_198975 tensor_198976 0=-1 Sigmoid 671 1 1 tensor_198976 tensor_198977 Reshape 672 1 1 tensor_198968 tensor_198978 0=0 1=1 Gemm 673 1 1 tensor_198978 tensor_198980 4=0 5=1 6=1 7=0 8=8192 9=2048 10=-1 Reshape 674 1 1 tensor_198980 tensor_198981 0=-1 ReLU 675 1 1 tensor_198981 tensor_198982 BinaryOp 676 2 1 tensor_198982 tensor_198982 tensor_198983 0=2 Reshape 677 1 1 tensor_198983 tensor_198984 0=0 1=1 Gemm 678 1 1 tensor_198984 tensor_198986 4=0 5=1 6=1 7=0 8=2048 9=8192 10=-1 Reshape 679 1 1 tensor_198986 tensor_198987 0=-1 BinaryOp 680 2 1 tensor_198977 tensor_198987 tensor_198988 0=2 BinaryOp 681 2 1 tensor_198952 tensor_198988 tensor_198989 0=0 Split 682 1 1 tensor_198956 output_state_3_4 Split 683 1 2 tensor_198989 tensor_198991 tensor_198992 LayerNorm 684 1 1 tensor_198991 tensor_198993 0=2048 1=1.000000e-05 2=1 Split 685 1 4 tensor_198993 tensor_198994 tensor_198995 tensor_198996 tensor_198997 Split 686 1 3 state_4_0 tensor_198998 tensor_198999 tensor_199000 MemoryData 687 0 1 blocks.4.att.time_mix_k 0=2048 21=0 Split 688 1 2 blocks.4.att.time_mix_k tensor_199002 tensor_199003 MemoryData 689 0 1 blocks.4.att.time_mix_v 0=2048 21=0 Split 690 1 2 blocks.4.att.time_mix_v tensor_199005 tensor_199006 MemoryData 691 0 1 blocks.4.att.time_mix_r 0=2048 21=0 Split 692 1 2 blocks.4.att.time_mix_r tensor_199008 tensor_199009 BinaryOp 693 1 1 tensor_199003 tensor_199010 0=7 1=1 2=1.000000e+00 BinaryOp 694 2 1 tensor_198998 tensor_199010 tensor_199011 0=2 BinaryOp 695 2 1 tensor_198994 tensor_199002 tensor_199012 0=2 BinaryOp 696 2 1 tensor_199012 tensor_199011 tensor_199013 0=0 BinaryOp 697 1 1 tensor_199006 tensor_199014 0=7 1=1 2=1.000000e+00 BinaryOp 698 2 1 tensor_198999 tensor_199014 tensor_199015 0=2 BinaryOp 699 2 1 tensor_198995 tensor_199005 tensor_199016 0=2 BinaryOp 700 2 1 tensor_199016 tensor_199015 tensor_199017 0=0 BinaryOp 701 1 1 tensor_199009 tensor_199018 0=7 1=1 2=1.000000e+00 BinaryOp 702 2 1 tensor_199000 tensor_199018 tensor_199019 0=2 BinaryOp 703 2 1 tensor_198996 tensor_199008 tensor_199020 0=2 BinaryOp 704 2 1 tensor_199020 tensor_199019 tensor_199021 0=0 Reshape 705 1 1 tensor_199021 tensor_199022 0=0 1=1 Gemm 706 1 1 tensor_199022 tensor_199024 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 707 1 1 tensor_199024 tensor_199025 0=-1 Sigmoid 708 1 1 tensor_199025 tensor_199026 Reshape 709 1 1 tensor_199013 tensor_199027 0=0 1=1 Gemm 710 1 1 tensor_199027 tensor_199029 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 711 1 1 tensor_199029 tensor_199030 0=-1 Split 712 1 3 tensor_199030 tensor_199031 tensor_199032 tensor_199033 Reshape 713 1 1 tensor_199017 tensor_199034 0=0 1=1 Gemm 714 1 1 tensor_199034 tensor_199036 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 715 1 1 tensor_199036 tensor_199037 0=-1 Split 716 1 2 tensor_199037 tensor_199038 tensor_199039 MemoryData 717 0 1 blocks.4.att.time_first 0=2048 21=0 BinaryOp 718 2 1 blocks.4.att.time_first tensor_199031 tensor_199041 0=0 Split 719 1 2 tensor_199041 tensor_199042 tensor_199043 Split 720 1 3 state_4_3 tensor_199044 tensor_199045 tensor_199046 BinaryOp 721 2 1 tensor_199044 tensor_199042 tensor_199047 0=4 Split 722 1 2 tensor_199047 tensor_199048 tensor_199049 BinaryOp 723 2 1 tensor_199045 tensor_199048 tensor_199050 0=1 Exp 724 1 1 tensor_199050 tensor_199051 Split 725 1 2 tensor_199051 tensor_199052 tensor_199053 BinaryOp 726 2 1 tensor_199043 tensor_199049 tensor_199054 0=1 Exp 727 1 1 tensor_199054 tensor_199055 Split 728 1 2 tensor_199055 tensor_199056 tensor_199057 Split 729 1 2 state_4_1 tensor_199058 tensor_199059 Split 730 1 2 state_4_2 tensor_199060 tensor_199061 BinaryOp 731 2 1 tensor_199053 tensor_199060 tensor_199062 0=2 BinaryOp 732 2 1 tensor_199062 tensor_199057 tensor_199063 0=0 BinaryOp 733 2 1 tensor_199056 tensor_199038 tensor_199064 0=2 BinaryOp 734 2 1 tensor_199052 tensor_199058 tensor_199065 0=2 BinaryOp 735 2 1 tensor_199065 tensor_199064 tensor_199066 0=0 BinaryOp 736 2 1 tensor_199066 tensor_199063 tensor_199067 0=3 MemoryData 737 0 1 blocks.4.att.time_decay 0=2048 21=0 BinaryOp 738 2 1 blocks.4.att.time_decay tensor_199046 tensor_199069 0=0 Split 739 1 2 tensor_199069 tensor_199070 tensor_199071 BinaryOp 740 2 1 tensor_199070 tensor_199032 tensor_199072 0=4 Split 741 1 3 tensor_199072 tensor_199073 tensor_199074 tensor_199075 BinaryOp 742 2 1 tensor_199071 tensor_199073 tensor_199076 0=1 Exp 743 1 1 tensor_199076 tensor_199077 Split 744 1 2 tensor_199077 tensor_199078 tensor_199079 BinaryOp 745 2 1 tensor_199033 tensor_199074 tensor_199080 0=1 Exp 746 1 1 tensor_199080 tensor_199081 Split 747 1 2 tensor_199081 tensor_199082 tensor_199083 BinaryOp 748 2 1 tensor_199026 tensor_199067 tensor_199084 0=2 Reshape 749 1 1 tensor_199084 tensor_199085 0=0 1=1 Gemm 750 1 1 tensor_199085 tensor_199087 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 751 1 1 tensor_199087 tensor_199088 0=-1 BinaryOp 752 2 1 tensor_198992 tensor_199088 tensor_199089 0=0 BinaryOp 753 2 1 tensor_199082 tensor_199039 tensor_199090 0=2 BinaryOp 754 2 1 tensor_199078 tensor_199059 tensor_199091 0=2 BinaryOp 755 2 1 tensor_199091 tensor_199090 tensor_199092 0=0 BinaryOp 756 2 1 tensor_199079 tensor_199061 tensor_199093 0=2 BinaryOp 757 2 1 tensor_199093 tensor_199083 tensor_199094 0=0 Split 758 1 1 tensor_198997 output_state_4_0 Split 759 1 1 tensor_199092 output_state_4_1 Split 760 1 1 tensor_199094 output_state_4_2 Split 761 1 1 tensor_199075 output_state_4_3 Split 762 1 2 tensor_199089 tensor_199099 tensor_199100 LayerNorm 763 1 1 tensor_199099 tensor_199101 0=2048 1=1.000000e-05 2=1 Split 764 1 3 tensor_199101 tensor_199102 tensor_199103 tensor_199104 Split 765 1 2 state_4_4 tensor_199105 tensor_199106 MemoryData 766 0 1 blocks.4.ffn.time_mix_k 0=2048 21=0 Split 767 1 2 blocks.4.ffn.time_mix_k tensor_199108 tensor_199109 MemoryData 768 0 1 blocks.4.ffn.time_mix_r 0=2048 21=0 Split 769 1 2 blocks.4.ffn.time_mix_r tensor_199111 tensor_199112 BinaryOp 770 1 1 tensor_199109 tensor_199113 0=7 1=1 2=1.000000e+00 BinaryOp 771 2 1 tensor_199105 tensor_199113 tensor_199114 0=2 BinaryOp 772 2 1 tensor_199102 tensor_199108 tensor_199115 0=2 BinaryOp 773 2 1 tensor_199115 tensor_199114 tensor_199116 0=0 BinaryOp 774 1 1 tensor_199112 tensor_199117 0=7 1=1 2=1.000000e+00 BinaryOp 775 2 1 tensor_199106 tensor_199117 tensor_199118 0=2 BinaryOp 776 2 1 tensor_199103 tensor_199111 tensor_199119 0=2 BinaryOp 777 2 1 tensor_199119 tensor_199118 tensor_199120 0=0 Reshape 778 1 1 tensor_199120 tensor_199121 0=0 1=1 Gemm 779 1 1 tensor_199121 tensor_199123 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 780 1 1 tensor_199123 tensor_199124 0=-1 Sigmoid 781 1 1 tensor_199124 tensor_199125 Reshape 782 1 1 tensor_199116 tensor_199126 0=0 1=1 Gemm 783 1 1 tensor_199126 tensor_199128 4=0 5=1 6=1 7=0 8=8192 9=2048 10=-1 Reshape 784 1 1 tensor_199128 tensor_199129 0=-1 ReLU 785 1 1 tensor_199129 tensor_199130 BinaryOp 786 2 1 tensor_199130 tensor_199130 tensor_199131 0=2 Reshape 787 1 1 tensor_199131 tensor_199132 0=0 1=1 Gemm 788 1 1 tensor_199132 tensor_199134 4=0 5=1 6=1 7=0 8=2048 9=8192 10=-1 Reshape 789 1 1 tensor_199134 tensor_199135 0=-1 BinaryOp 790 2 1 tensor_199125 tensor_199135 tensor_199136 0=2 BinaryOp 791 2 1 tensor_199100 tensor_199136 tensor_199137 0=0 Split 792 1 1 tensor_199104 output_state_4_4 Split 793 1 2 tensor_199137 tensor_199139 tensor_199140 LayerNorm 794 1 1 tensor_199139 tensor_199141 0=2048 1=1.000000e-05 2=1 Split 795 1 4 tensor_199141 tensor_199142 tensor_199143 tensor_199144 tensor_199145 Split 796 1 3 state_5_0 tensor_199146 tensor_199147 tensor_199148 MemoryData 797 0 1 blocks.5.att.time_mix_k 0=2048 21=0 Split 798 1 2 blocks.5.att.time_mix_k tensor_199150 tensor_199151 MemoryData 799 0 1 blocks.5.att.time_mix_v 0=2048 21=0 Split 800 1 2 blocks.5.att.time_mix_v tensor_199153 tensor_199154 MemoryData 801 0 1 blocks.5.att.time_mix_r 0=2048 21=0 Split 802 1 2 blocks.5.att.time_mix_r tensor_199156 tensor_199157 BinaryOp 803 1 1 tensor_199151 tensor_199158 0=7 1=1 2=1.000000e+00 BinaryOp 804 2 1 tensor_199146 tensor_199158 tensor_199159 0=2 BinaryOp 805 2 1 tensor_199142 tensor_199150 tensor_199160 0=2 BinaryOp 806 2 1 tensor_199160 tensor_199159 tensor_199161 0=0 BinaryOp 807 1 1 tensor_199154 tensor_199162 0=7 1=1 2=1.000000e+00 BinaryOp 808 2 1 tensor_199147 tensor_199162 tensor_199163 0=2 BinaryOp 809 2 1 tensor_199143 tensor_199153 tensor_199164 0=2 BinaryOp 810 2 1 tensor_199164 tensor_199163 tensor_199165 0=0 BinaryOp 811 1 1 tensor_199157 tensor_199166 0=7 1=1 2=1.000000e+00 BinaryOp 812 2 1 tensor_199148 tensor_199166 tensor_199167 0=2 BinaryOp 813 2 1 tensor_199144 tensor_199156 tensor_199168 0=2 BinaryOp 814 2 1 tensor_199168 tensor_199167 tensor_199169 0=0 Reshape 815 1 1 tensor_199169 tensor_199170 0=0 1=1 Gemm 816 1 1 tensor_199170 tensor_199172 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 817 1 1 tensor_199172 tensor_199173 0=-1 Sigmoid 818 1 1 tensor_199173 tensor_199174 Reshape 819 1 1 tensor_199161 tensor_199175 0=0 1=1 Gemm 820 1 1 tensor_199175 tensor_199177 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 821 1 1 tensor_199177 tensor_199178 0=-1 Split 822 1 3 tensor_199178 tensor_199179 tensor_199180 tensor_199181 Reshape 823 1 1 tensor_199165 tensor_199182 0=0 1=1 Gemm 824 1 1 tensor_199182 tensor_199184 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 825 1 1 tensor_199184 tensor_199185 0=-1 Split 826 1 2 tensor_199185 tensor_199186 tensor_199187 MemoryData 827 0 1 blocks.5.att.time_first 0=2048 21=0 BinaryOp 828 2 1 blocks.5.att.time_first tensor_199179 tensor_199189 0=0 Split 829 1 2 tensor_199189 tensor_199190 tensor_199191 Split 830 1 3 state_5_3 tensor_199192 tensor_199193 tensor_199194 BinaryOp 831 2 1 tensor_199192 tensor_199190 tensor_199195 0=4 Split 832 1 2 tensor_199195 tensor_199196 tensor_199197 BinaryOp 833 2 1 tensor_199193 tensor_199196 tensor_199198 0=1 Exp 834 1 1 tensor_199198 tensor_199199 Split 835 1 2 tensor_199199 tensor_199200 tensor_199201 BinaryOp 836 2 1 tensor_199191 tensor_199197 tensor_199202 0=1 Exp 837 1 1 tensor_199202 tensor_199203 Split 838 1 2 tensor_199203 tensor_199204 tensor_199205 Split 839 1 2 state_5_1 tensor_199206 tensor_199207 Split 840 1 2 state_5_2 tensor_199208 tensor_199209 BinaryOp 841 2 1 tensor_199201 tensor_199208 tensor_199210 0=2 BinaryOp 842 2 1 tensor_199210 tensor_199205 tensor_199211 0=0 BinaryOp 843 2 1 tensor_199204 tensor_199186 tensor_199212 0=2 BinaryOp 844 2 1 tensor_199200 tensor_199206 tensor_199213 0=2 BinaryOp 845 2 1 tensor_199213 tensor_199212 tensor_199214 0=0 BinaryOp 846 2 1 tensor_199214 tensor_199211 tensor_199215 0=3 MemoryData 847 0 1 blocks.5.att.time_decay 0=2048 21=0 BinaryOp 848 2 1 blocks.5.att.time_decay tensor_199194 tensor_199217 0=0 Split 849 1 2 tensor_199217 tensor_199218 tensor_199219 BinaryOp 850 2 1 tensor_199218 tensor_199180 tensor_199220 0=4 Split 851 1 3 tensor_199220 tensor_199221 tensor_199222 tensor_199223 BinaryOp 852 2 1 tensor_199219 tensor_199221 tensor_199224 0=1 Exp 853 1 1 tensor_199224 tensor_199225 Split 854 1 2 tensor_199225 tensor_199226 tensor_199227 BinaryOp 855 2 1 tensor_199181 tensor_199222 tensor_199228 0=1 Exp 856 1 1 tensor_199228 tensor_199229 Split 857 1 2 tensor_199229 tensor_199230 tensor_199231 BinaryOp 858 2 1 tensor_199174 tensor_199215 tensor_199232 0=2 Reshape 859 1 1 tensor_199232 tensor_199233 0=0 1=1 Gemm 860 1 1 tensor_199233 tensor_199235 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 861 1 1 tensor_199235 tensor_199236 0=-1 BinaryOp 862 2 1 tensor_199140 tensor_199236 tensor_199237 0=0 BinaryOp 863 2 1 tensor_199230 tensor_199187 tensor_199238 0=2 BinaryOp 864 2 1 tensor_199226 tensor_199207 tensor_199239 0=2 BinaryOp 865 2 1 tensor_199239 tensor_199238 tensor_199240 0=0 BinaryOp 866 2 1 tensor_199227 tensor_199209 tensor_199241 0=2 BinaryOp 867 2 1 tensor_199241 tensor_199231 tensor_199242 0=0 Split 868 1 1 tensor_199145 output_state_5_0 Split 869 1 1 tensor_199240 output_state_5_1 Split 870 1 1 tensor_199242 output_state_5_2 Split 871 1 1 tensor_199223 output_state_5_3 Split 872 1 2 tensor_199237 tensor_199247 tensor_199248 LayerNorm 873 1 1 tensor_199247 tensor_199249 0=2048 1=1.000000e-05 2=1 Split 874 1 3 tensor_199249 tensor_199250 tensor_199251 tensor_199252 Split 875 1 2 state_5_4 tensor_199253 tensor_199254 MemoryData 876 0 1 blocks.5.ffn.time_mix_k 0=2048 21=0 Split 877 1 2 blocks.5.ffn.time_mix_k tensor_199256 tensor_199257 MemoryData 878 0 1 blocks.5.ffn.time_mix_r 0=2048 21=0 Split 879 1 2 blocks.5.ffn.time_mix_r tensor_199259 tensor_199260 BinaryOp 880 1 1 tensor_199257 tensor_199261 0=7 1=1 2=1.000000e+00 BinaryOp 881 2 1 tensor_199253 tensor_199261 tensor_199262 0=2 BinaryOp 882 2 1 tensor_199250 tensor_199256 tensor_199263 0=2 BinaryOp 883 2 1 tensor_199263 tensor_199262 tensor_199264 0=0 BinaryOp 884 1 1 tensor_199260 tensor_199265 0=7 1=1 2=1.000000e+00 BinaryOp 885 2 1 tensor_199254 tensor_199265 tensor_199266 0=2 BinaryOp 886 2 1 tensor_199251 tensor_199259 tensor_199267 0=2 BinaryOp 887 2 1 tensor_199267 tensor_199266 tensor_199268 0=0 Reshape 888 1 1 tensor_199268 tensor_199269 0=0 1=1 Gemm 889 1 1 tensor_199269 tensor_199271 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 890 1 1 tensor_199271 tensor_199272 0=-1 Sigmoid 891 1 1 tensor_199272 tensor_199273 Reshape 892 1 1 tensor_199264 tensor_199274 0=0 1=1 Gemm 893 1 1 tensor_199274 tensor_199276 4=0 5=1 6=1 7=0 8=8192 9=2048 10=-1 Reshape 894 1 1 tensor_199276 tensor_199277 0=-1 ReLU 895 1 1 tensor_199277 tensor_199278 BinaryOp 896 2 1 tensor_199278 tensor_199278 tensor_199279 0=2 Reshape 897 1 1 tensor_199279 tensor_199280 0=0 1=1 Gemm 898 1 1 tensor_199280 tensor_199282 4=0 5=1 6=1 7=0 8=2048 9=8192 10=-1 Reshape 899 1 1 tensor_199282 tensor_199283 0=-1 BinaryOp 900 2 1 tensor_199273 tensor_199283 tensor_199284 0=2 BinaryOp 901 2 1 tensor_199248 tensor_199284 tensor_199285 0=0 Split 902 1 1 tensor_199252 output_state_5_4 Split 903 1 2 tensor_199285 tensor_199287 tensor_199288 LayerNorm 904 1 1 tensor_199287 tensor_199289 0=2048 1=1.000000e-05 2=1 Split 905 1 4 tensor_199289 tensor_199290 tensor_199291 tensor_199292 tensor_199293 Split 906 1 3 state_6_0 tensor_199294 tensor_199295 tensor_199296 MemoryData 907 0 1 blocks.6.att.time_mix_k 0=2048 21=0 Split 908 1 2 blocks.6.att.time_mix_k tensor_199298 tensor_199299 MemoryData 909 0 1 blocks.6.att.time_mix_v 0=2048 21=0 Split 910 1 2 blocks.6.att.time_mix_v tensor_199301 tensor_199302 MemoryData 911 0 1 blocks.6.att.time_mix_r 0=2048 21=0 Split 912 1 2 blocks.6.att.time_mix_r tensor_199304 tensor_199305 BinaryOp 913 1 1 tensor_199299 tensor_199306 0=7 1=1 2=1.000000e+00 BinaryOp 914 2 1 tensor_199294 tensor_199306 tensor_199307 0=2 BinaryOp 915 2 1 tensor_199290 tensor_199298 tensor_199308 0=2 BinaryOp 916 2 1 tensor_199308 tensor_199307 tensor_199309 0=0 BinaryOp 917 1 1 tensor_199302 tensor_199310 0=7 1=1 2=1.000000e+00 BinaryOp 918 2 1 tensor_199295 tensor_199310 tensor_199311 0=2 BinaryOp 919 2 1 tensor_199291 tensor_199301 tensor_199312 0=2 BinaryOp 920 2 1 tensor_199312 tensor_199311 tensor_199313 0=0 BinaryOp 921 1 1 tensor_199305 tensor_199314 0=7 1=1 2=1.000000e+00 BinaryOp 922 2 1 tensor_199296 tensor_199314 tensor_199315 0=2 BinaryOp 923 2 1 tensor_199292 tensor_199304 tensor_199316 0=2 BinaryOp 924 2 1 tensor_199316 tensor_199315 tensor_199317 0=0 Reshape 925 1 1 tensor_199317 tensor_199318 0=0 1=1 Gemm 926 1 1 tensor_199318 tensor_199320 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 927 1 1 tensor_199320 tensor_199321 0=-1 Sigmoid 928 1 1 tensor_199321 tensor_199322 Reshape 929 1 1 tensor_199309 tensor_199323 0=0 1=1 Gemm 930 1 1 tensor_199323 tensor_199325 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 931 1 1 tensor_199325 tensor_199326 0=-1 Split 932 1 3 tensor_199326 tensor_199327 tensor_199328 tensor_199329 Reshape 933 1 1 tensor_199313 tensor_199330 0=0 1=1 Gemm 934 1 1 tensor_199330 tensor_199332 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 935 1 1 tensor_199332 tensor_199333 0=-1 Split 936 1 2 tensor_199333 tensor_199334 tensor_199335 MemoryData 937 0 1 blocks.6.att.time_first 0=2048 21=0 BinaryOp 938 2 1 blocks.6.att.time_first tensor_199327 tensor_199337 0=0 Split 939 1 2 tensor_199337 tensor_199338 tensor_199339 Split 940 1 3 state_6_3 tensor_199340 tensor_199341 tensor_199342 BinaryOp 941 2 1 tensor_199340 tensor_199338 tensor_199343 0=4 Split 942 1 2 tensor_199343 tensor_199344 tensor_199345 BinaryOp 943 2 1 tensor_199341 tensor_199344 tensor_199346 0=1 Exp 944 1 1 tensor_199346 tensor_199347 Split 945 1 2 tensor_199347 tensor_199348 tensor_199349 BinaryOp 946 2 1 tensor_199339 tensor_199345 tensor_199350 0=1 Exp 947 1 1 tensor_199350 tensor_199351 Split 948 1 2 tensor_199351 tensor_199352 tensor_199353 Split 949 1 2 state_6_1 tensor_199354 tensor_199355 Split 950 1 2 state_6_2 tensor_199356 tensor_199357 BinaryOp 951 2 1 tensor_199349 tensor_199356 tensor_199358 0=2 BinaryOp 952 2 1 tensor_199358 tensor_199353 tensor_199359 0=0 BinaryOp 953 2 1 tensor_199352 tensor_199334 tensor_199360 0=2 BinaryOp 954 2 1 tensor_199348 tensor_199354 tensor_199361 0=2 BinaryOp 955 2 1 tensor_199361 tensor_199360 tensor_199362 0=0 BinaryOp 956 2 1 tensor_199362 tensor_199359 tensor_199363 0=3 MemoryData 957 0 1 blocks.6.att.time_decay 0=2048 21=0 BinaryOp 958 2 1 blocks.6.att.time_decay tensor_199342 tensor_199365 0=0 Split 959 1 2 tensor_199365 tensor_199366 tensor_199367 BinaryOp 960 2 1 tensor_199366 tensor_199328 tensor_199368 0=4 Split 961 1 3 tensor_199368 tensor_199369 tensor_199370 tensor_199371 BinaryOp 962 2 1 tensor_199367 tensor_199369 tensor_199372 0=1 Exp 963 1 1 tensor_199372 tensor_199373 Split 964 1 2 tensor_199373 tensor_199374 tensor_199375 BinaryOp 965 2 1 tensor_199329 tensor_199370 tensor_199376 0=1 Exp 966 1 1 tensor_199376 tensor_199377 Split 967 1 2 tensor_199377 tensor_199378 tensor_199379 BinaryOp 968 2 1 tensor_199322 tensor_199363 tensor_199380 0=2 Reshape 969 1 1 tensor_199380 tensor_199381 0=0 1=1 Gemm 970 1 1 tensor_199381 tensor_199383 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 971 1 1 tensor_199383 tensor_199384 0=-1 BinaryOp 972 2 1 tensor_199288 tensor_199384 tensor_199385 0=0 BinaryOp 973 2 1 tensor_199378 tensor_199335 tensor_199386 0=2 BinaryOp 974 2 1 tensor_199374 tensor_199355 tensor_199387 0=2 BinaryOp 975 2 1 tensor_199387 tensor_199386 tensor_199388 0=0 BinaryOp 976 2 1 tensor_199375 tensor_199357 tensor_199389 0=2 BinaryOp 977 2 1 tensor_199389 tensor_199379 tensor_199390 0=0 Split 978 1 1 tensor_199293 output_state_6_0 Split 979 1 1 tensor_199388 output_state_6_1 Split 980 1 1 tensor_199390 output_state_6_2 Split 981 1 1 tensor_199371 output_state_6_3 Split 982 1 2 tensor_199385 tensor_199395 tensor_199396 LayerNorm 983 1 1 tensor_199395 tensor_199397 0=2048 1=1.000000e-05 2=1 Split 984 1 3 tensor_199397 tensor_199398 tensor_199399 tensor_199400 Split 985 1 2 state_6_4 tensor_199401 tensor_199402 MemoryData 986 0 1 blocks.6.ffn.time_mix_k 0=2048 21=0 Split 987 1 2 blocks.6.ffn.time_mix_k tensor_199404 tensor_199405 MemoryData 988 0 1 blocks.6.ffn.time_mix_r 0=2048 21=0 Split 989 1 2 blocks.6.ffn.time_mix_r tensor_199407 tensor_199408 BinaryOp 990 1 1 tensor_199405 tensor_199409 0=7 1=1 2=1.000000e+00 BinaryOp 991 2 1 tensor_199401 tensor_199409 tensor_199410 0=2 BinaryOp 992 2 1 tensor_199398 tensor_199404 tensor_199411 0=2 BinaryOp 993 2 1 tensor_199411 tensor_199410 tensor_199412 0=0 BinaryOp 994 1 1 tensor_199408 tensor_199413 0=7 1=1 2=1.000000e+00 BinaryOp 995 2 1 tensor_199402 tensor_199413 tensor_199414 0=2 BinaryOp 996 2 1 tensor_199399 tensor_199407 tensor_199415 0=2 BinaryOp 997 2 1 tensor_199415 tensor_199414 tensor_199416 0=0 Reshape 998 1 1 tensor_199416 tensor_199417 0=0 1=1 Gemm 999 1 1 tensor_199417 tensor_199419 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1000 1 1 tensor_199419 tensor_199420 0=-1 Sigmoid 1001 1 1 tensor_199420 tensor_199421 Reshape 1002 1 1 tensor_199412 tensor_199422 0=0 1=1 Gemm 1003 1 1 tensor_199422 tensor_199424 4=0 5=1 6=1 7=0 8=8192 9=2048 10=-1 Reshape 1004 1 1 tensor_199424 tensor_199425 0=-1 ReLU 1005 1 1 tensor_199425 tensor_199426 BinaryOp 1006 2 1 tensor_199426 tensor_199426 tensor_199427 0=2 Reshape 1007 1 1 tensor_199427 tensor_199428 0=0 1=1 Gemm 1008 1 1 tensor_199428 tensor_199430 4=0 5=1 6=1 7=0 8=2048 9=8192 10=-1 Reshape 1009 1 1 tensor_199430 tensor_199431 0=-1 BinaryOp 1010 2 1 tensor_199421 tensor_199431 tensor_199432 0=2 BinaryOp 1011 2 1 tensor_199396 tensor_199432 tensor_199433 0=0 Split 1012 1 1 tensor_199400 output_state_6_4 Split 1013 1 2 tensor_199433 tensor_199435 tensor_199436 LayerNorm 1014 1 1 tensor_199435 tensor_199437 0=2048 1=1.000000e-05 2=1 Split 1015 1 4 tensor_199437 tensor_199438 tensor_199439 tensor_199440 tensor_199441 Split 1016 1 3 state_7_0 tensor_199442 tensor_199443 tensor_199444 MemoryData 1017 0 1 blocks.7.att.time_mix_k 0=2048 21=0 Split 1018 1 2 blocks.7.att.time_mix_k tensor_199446 tensor_199447 MemoryData 1019 0 1 blocks.7.att.time_mix_v 0=2048 21=0 Split 1020 1 2 blocks.7.att.time_mix_v tensor_199449 tensor_199450 MemoryData 1021 0 1 blocks.7.att.time_mix_r 0=2048 21=0 Split 1022 1 2 blocks.7.att.time_mix_r tensor_199452 tensor_199453 BinaryOp 1023 1 1 tensor_199447 tensor_199454 0=7 1=1 2=1.000000e+00 BinaryOp 1024 2 1 tensor_199442 tensor_199454 tensor_199455 0=2 BinaryOp 1025 2 1 tensor_199438 tensor_199446 tensor_199456 0=2 BinaryOp 1026 2 1 tensor_199456 tensor_199455 tensor_199457 0=0 BinaryOp 1027 1 1 tensor_199450 tensor_199458 0=7 1=1 2=1.000000e+00 BinaryOp 1028 2 1 tensor_199443 tensor_199458 tensor_199459 0=2 BinaryOp 1029 2 1 tensor_199439 tensor_199449 tensor_199460 0=2 BinaryOp 1030 2 1 tensor_199460 tensor_199459 tensor_199461 0=0 BinaryOp 1031 1 1 tensor_199453 tensor_199462 0=7 1=1 2=1.000000e+00 BinaryOp 1032 2 1 tensor_199444 tensor_199462 tensor_199463 0=2 BinaryOp 1033 2 1 tensor_199440 tensor_199452 tensor_199464 0=2 BinaryOp 1034 2 1 tensor_199464 tensor_199463 tensor_199465 0=0 Reshape 1035 1 1 tensor_199465 tensor_199466 0=0 1=1 Gemm 1036 1 1 tensor_199466 tensor_199468 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1037 1 1 tensor_199468 tensor_199469 0=-1 Sigmoid 1038 1 1 tensor_199469 tensor_199470 Reshape 1039 1 1 tensor_199457 tensor_199471 0=0 1=1 Gemm 1040 1 1 tensor_199471 tensor_199473 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1041 1 1 tensor_199473 tensor_199474 0=-1 Split 1042 1 3 tensor_199474 tensor_199475 tensor_199476 tensor_199477 Reshape 1043 1 1 tensor_199461 tensor_199478 0=0 1=1 Gemm 1044 1 1 tensor_199478 tensor_199480 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1045 1 1 tensor_199480 tensor_199481 0=-1 Split 1046 1 2 tensor_199481 tensor_199482 tensor_199483 MemoryData 1047 0 1 blocks.7.att.time_first 0=2048 21=0 BinaryOp 1048 2 1 blocks.7.att.time_first tensor_199475 tensor_199485 0=0 Split 1049 1 2 tensor_199485 tensor_199486 tensor_199487 Split 1050 1 3 state_7_3 tensor_199488 tensor_199489 tensor_199490 BinaryOp 1051 2 1 tensor_199488 tensor_199486 tensor_199491 0=4 Split 1052 1 2 tensor_199491 tensor_199492 tensor_199493 BinaryOp 1053 2 1 tensor_199489 tensor_199492 tensor_199494 0=1 Exp 1054 1 1 tensor_199494 tensor_199495 Split 1055 1 2 tensor_199495 tensor_199496 tensor_199497 BinaryOp 1056 2 1 tensor_199487 tensor_199493 tensor_199498 0=1 Exp 1057 1 1 tensor_199498 tensor_199499 Split 1058 1 2 tensor_199499 tensor_199500 tensor_199501 Split 1059 1 2 state_7_1 tensor_199502 tensor_199503 Split 1060 1 2 state_7_2 tensor_199504 tensor_199505 BinaryOp 1061 2 1 tensor_199497 tensor_199504 tensor_199506 0=2 BinaryOp 1062 2 1 tensor_199506 tensor_199501 tensor_199507 0=0 BinaryOp 1063 2 1 tensor_199500 tensor_199482 tensor_199508 0=2 BinaryOp 1064 2 1 tensor_199496 tensor_199502 tensor_199509 0=2 BinaryOp 1065 2 1 tensor_199509 tensor_199508 tensor_199510 0=0 BinaryOp 1066 2 1 tensor_199510 tensor_199507 tensor_199511 0=3 MemoryData 1067 0 1 blocks.7.att.time_decay 0=2048 21=0 BinaryOp 1068 2 1 blocks.7.att.time_decay tensor_199490 tensor_199513 0=0 Split 1069 1 2 tensor_199513 tensor_199514 tensor_199515 BinaryOp 1070 2 1 tensor_199514 tensor_199476 tensor_199516 0=4 Split 1071 1 3 tensor_199516 tensor_199517 tensor_199518 tensor_199519 BinaryOp 1072 2 1 tensor_199515 tensor_199517 tensor_199520 0=1 Exp 1073 1 1 tensor_199520 tensor_199521 Split 1074 1 2 tensor_199521 tensor_199522 tensor_199523 BinaryOp 1075 2 1 tensor_199477 tensor_199518 tensor_199524 0=1 Exp 1076 1 1 tensor_199524 tensor_199525 Split 1077 1 2 tensor_199525 tensor_199526 tensor_199527 BinaryOp 1078 2 1 tensor_199470 tensor_199511 tensor_199528 0=2 Reshape 1079 1 1 tensor_199528 tensor_199529 0=0 1=1 Gemm 1080 1 1 tensor_199529 tensor_199531 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1081 1 1 tensor_199531 tensor_199532 0=-1 BinaryOp 1082 2 1 tensor_199436 tensor_199532 tensor_199533 0=0 BinaryOp 1083 2 1 tensor_199526 tensor_199483 tensor_199534 0=2 BinaryOp 1084 2 1 tensor_199522 tensor_199503 tensor_199535 0=2 BinaryOp 1085 2 1 tensor_199535 tensor_199534 tensor_199536 0=0 BinaryOp 1086 2 1 tensor_199523 tensor_199505 tensor_199537 0=2 BinaryOp 1087 2 1 tensor_199537 tensor_199527 tensor_199538 0=0 Split 1088 1 1 tensor_199441 output_state_7_0 Split 1089 1 1 tensor_199536 output_state_7_1 Split 1090 1 1 tensor_199538 output_state_7_2 Split 1091 1 1 tensor_199519 output_state_7_3 Split 1092 1 2 tensor_199533 tensor_199543 tensor_199544 LayerNorm 1093 1 1 tensor_199543 tensor_199545 0=2048 1=1.000000e-05 2=1 Split 1094 1 3 tensor_199545 tensor_199546 tensor_199547 tensor_199548 Split 1095 1 2 state_7_4 tensor_199549 tensor_199550 MemoryData 1096 0 1 blocks.7.ffn.time_mix_k 0=2048 21=0 Split 1097 1 2 blocks.7.ffn.time_mix_k tensor_199552 tensor_199553 MemoryData 1098 0 1 blocks.7.ffn.time_mix_r 0=2048 21=0 Split 1099 1 2 blocks.7.ffn.time_mix_r tensor_199555 tensor_199556 BinaryOp 1100 1 1 tensor_199553 tensor_199557 0=7 1=1 2=1.000000e+00 BinaryOp 1101 2 1 tensor_199549 tensor_199557 tensor_199558 0=2 BinaryOp 1102 2 1 tensor_199546 tensor_199552 tensor_199559 0=2 BinaryOp 1103 2 1 tensor_199559 tensor_199558 tensor_199560 0=0 BinaryOp 1104 1 1 tensor_199556 tensor_199561 0=7 1=1 2=1.000000e+00 BinaryOp 1105 2 1 tensor_199550 tensor_199561 tensor_199562 0=2 BinaryOp 1106 2 1 tensor_199547 tensor_199555 tensor_199563 0=2 BinaryOp 1107 2 1 tensor_199563 tensor_199562 tensor_199564 0=0 Reshape 1108 1 1 tensor_199564 tensor_199565 0=0 1=1 Gemm 1109 1 1 tensor_199565 tensor_199567 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1110 1 1 tensor_199567 tensor_199568 0=-1 Sigmoid 1111 1 1 tensor_199568 tensor_199569 Reshape 1112 1 1 tensor_199560 tensor_199570 0=0 1=1 Gemm 1113 1 1 tensor_199570 tensor_199572 4=0 5=1 6=1 7=0 8=8192 9=2048 10=-1 Reshape 1114 1 1 tensor_199572 tensor_199573 0=-1 ReLU 1115 1 1 tensor_199573 tensor_199574 BinaryOp 1116 2 1 tensor_199574 tensor_199574 tensor_199575 0=2 Reshape 1117 1 1 tensor_199575 tensor_199576 0=0 1=1 Gemm 1118 1 1 tensor_199576 tensor_199578 4=0 5=1 6=1 7=0 8=2048 9=8192 10=-1 Reshape 1119 1 1 tensor_199578 tensor_199579 0=-1 BinaryOp 1120 2 1 tensor_199569 tensor_199579 tensor_199580 0=2 BinaryOp 1121 2 1 tensor_199544 tensor_199580 tensor_199581 0=0 Split 1122 1 1 tensor_199548 output_state_7_4 Split 1123 1 2 tensor_199581 tensor_199583 tensor_199584 LayerNorm 1124 1 1 tensor_199583 tensor_199585 0=2048 1=1.000000e-05 2=1 Split 1125 1 4 tensor_199585 tensor_199586 tensor_199587 tensor_199588 tensor_199589 Split 1126 1 3 state_8_0 tensor_199590 tensor_199591 tensor_199592 MemoryData 1127 0 1 blocks.8.att.time_mix_k 0=2048 21=0 Split 1128 1 2 blocks.8.att.time_mix_k tensor_199594 tensor_199595 MemoryData 1129 0 1 blocks.8.att.time_mix_v 0=2048 21=0 Split 1130 1 2 blocks.8.att.time_mix_v tensor_199597 tensor_199598 MemoryData 1131 0 1 blocks.8.att.time_mix_r 0=2048 21=0 Split 1132 1 2 blocks.8.att.time_mix_r tensor_199600 tensor_199601 BinaryOp 1133 1 1 tensor_199595 tensor_199602 0=7 1=1 2=1.000000e+00 BinaryOp 1134 2 1 tensor_199590 tensor_199602 tensor_199603 0=2 BinaryOp 1135 2 1 tensor_199586 tensor_199594 tensor_199604 0=2 BinaryOp 1136 2 1 tensor_199604 tensor_199603 tensor_199605 0=0 BinaryOp 1137 1 1 tensor_199598 tensor_199606 0=7 1=1 2=1.000000e+00 BinaryOp 1138 2 1 tensor_199591 tensor_199606 tensor_199607 0=2 BinaryOp 1139 2 1 tensor_199587 tensor_199597 tensor_199608 0=2 BinaryOp 1140 2 1 tensor_199608 tensor_199607 tensor_199609 0=0 BinaryOp 1141 1 1 tensor_199601 tensor_199610 0=7 1=1 2=1.000000e+00 BinaryOp 1142 2 1 tensor_199592 tensor_199610 tensor_199611 0=2 BinaryOp 1143 2 1 tensor_199588 tensor_199600 tensor_199612 0=2 BinaryOp 1144 2 1 tensor_199612 tensor_199611 tensor_199613 0=0 Reshape 1145 1 1 tensor_199613 tensor_199614 0=0 1=1 Gemm 1146 1 1 tensor_199614 tensor_199616 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1147 1 1 tensor_199616 tensor_199617 0=-1 Sigmoid 1148 1 1 tensor_199617 tensor_199618 Reshape 1149 1 1 tensor_199605 tensor_199619 0=0 1=1 Gemm 1150 1 1 tensor_199619 tensor_199621 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1151 1 1 tensor_199621 tensor_199622 0=-1 Split 1152 1 3 tensor_199622 tensor_199623 tensor_199624 tensor_199625 Reshape 1153 1 1 tensor_199609 tensor_199626 0=0 1=1 Gemm 1154 1 1 tensor_199626 tensor_199628 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1155 1 1 tensor_199628 tensor_199629 0=-1 Split 1156 1 2 tensor_199629 tensor_199630 tensor_199631 MemoryData 1157 0 1 blocks.8.att.time_first 0=2048 21=0 BinaryOp 1158 2 1 blocks.8.att.time_first tensor_199623 tensor_199633 0=0 Split 1159 1 2 tensor_199633 tensor_199634 tensor_199635 Split 1160 1 3 state_8_3 tensor_199636 tensor_199637 tensor_199638 BinaryOp 1161 2 1 tensor_199636 tensor_199634 tensor_199639 0=4 Split 1162 1 2 tensor_199639 tensor_199640 tensor_199641 BinaryOp 1163 2 1 tensor_199637 tensor_199640 tensor_199642 0=1 Exp 1164 1 1 tensor_199642 tensor_199643 Split 1165 1 2 tensor_199643 tensor_199644 tensor_199645 BinaryOp 1166 2 1 tensor_199635 tensor_199641 tensor_199646 0=1 Exp 1167 1 1 tensor_199646 tensor_199647 Split 1168 1 2 tensor_199647 tensor_199648 tensor_199649 Split 1169 1 2 state_8_1 tensor_199650 tensor_199651 Split 1170 1 2 state_8_2 tensor_199652 tensor_199653 BinaryOp 1171 2 1 tensor_199645 tensor_199652 tensor_199654 0=2 BinaryOp 1172 2 1 tensor_199654 tensor_199649 tensor_199655 0=0 BinaryOp 1173 2 1 tensor_199648 tensor_199630 tensor_199656 0=2 BinaryOp 1174 2 1 tensor_199644 tensor_199650 tensor_199657 0=2 BinaryOp 1175 2 1 tensor_199657 tensor_199656 tensor_199658 0=0 BinaryOp 1176 2 1 tensor_199658 tensor_199655 tensor_199659 0=3 MemoryData 1177 0 1 blocks.8.att.time_decay 0=2048 21=0 BinaryOp 1178 2 1 blocks.8.att.time_decay tensor_199638 tensor_199661 0=0 Split 1179 1 2 tensor_199661 tensor_199662 tensor_199663 BinaryOp 1180 2 1 tensor_199662 tensor_199624 tensor_199664 0=4 Split 1181 1 3 tensor_199664 tensor_199665 tensor_199666 tensor_199667 BinaryOp 1182 2 1 tensor_199663 tensor_199665 tensor_199668 0=1 Exp 1183 1 1 tensor_199668 tensor_199669 Split 1184 1 2 tensor_199669 tensor_199670 tensor_199671 BinaryOp 1185 2 1 tensor_199625 tensor_199666 tensor_199672 0=1 Exp 1186 1 1 tensor_199672 tensor_199673 Split 1187 1 2 tensor_199673 tensor_199674 tensor_199675 BinaryOp 1188 2 1 tensor_199618 tensor_199659 tensor_199676 0=2 Reshape 1189 1 1 tensor_199676 tensor_199677 0=0 1=1 Gemm 1190 1 1 tensor_199677 tensor_199679 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1191 1 1 tensor_199679 tensor_199680 0=-1 BinaryOp 1192 2 1 tensor_199584 tensor_199680 tensor_199681 0=0 BinaryOp 1193 2 1 tensor_199674 tensor_199631 tensor_199682 0=2 BinaryOp 1194 2 1 tensor_199670 tensor_199651 tensor_199683 0=2 BinaryOp 1195 2 1 tensor_199683 tensor_199682 tensor_199684 0=0 BinaryOp 1196 2 1 tensor_199671 tensor_199653 tensor_199685 0=2 BinaryOp 1197 2 1 tensor_199685 tensor_199675 tensor_199686 0=0 Split 1198 1 1 tensor_199589 output_state_8_0 Split 1199 1 1 tensor_199684 output_state_8_1 Split 1200 1 1 tensor_199686 output_state_8_2 Split 1201 1 1 tensor_199667 output_state_8_3 Split 1202 1 2 tensor_199681 tensor_199691 tensor_199692 LayerNorm 1203 1 1 tensor_199691 tensor_199693 0=2048 1=1.000000e-05 2=1 Split 1204 1 3 tensor_199693 tensor_199694 tensor_199695 tensor_199696 Split 1205 1 2 state_8_4 tensor_199697 tensor_199698 MemoryData 1206 0 1 blocks.8.ffn.time_mix_k 0=2048 21=0 Split 1207 1 2 blocks.8.ffn.time_mix_k tensor_199700 tensor_199701 MemoryData 1208 0 1 blocks.8.ffn.time_mix_r 0=2048 21=0 Split 1209 1 2 blocks.8.ffn.time_mix_r tensor_199703 tensor_199704 BinaryOp 1210 1 1 tensor_199701 tensor_199705 0=7 1=1 2=1.000000e+00 BinaryOp 1211 2 1 tensor_199697 tensor_199705 tensor_199706 0=2 BinaryOp 1212 2 1 tensor_199694 tensor_199700 tensor_199707 0=2 BinaryOp 1213 2 1 tensor_199707 tensor_199706 tensor_199708 0=0 BinaryOp 1214 1 1 tensor_199704 tensor_199709 0=7 1=1 2=1.000000e+00 BinaryOp 1215 2 1 tensor_199698 tensor_199709 tensor_199710 0=2 BinaryOp 1216 2 1 tensor_199695 tensor_199703 tensor_199711 0=2 BinaryOp 1217 2 1 tensor_199711 tensor_199710 tensor_199712 0=0 Reshape 1218 1 1 tensor_199712 tensor_199713 0=0 1=1 Gemm 1219 1 1 tensor_199713 tensor_199715 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1220 1 1 tensor_199715 tensor_199716 0=-1 Sigmoid 1221 1 1 tensor_199716 tensor_199717 Reshape 1222 1 1 tensor_199708 tensor_199718 0=0 1=1 Gemm 1223 1 1 tensor_199718 tensor_199720 4=0 5=1 6=1 7=0 8=8192 9=2048 10=-1 Reshape 1224 1 1 tensor_199720 tensor_199721 0=-1 ReLU 1225 1 1 tensor_199721 tensor_199722 BinaryOp 1226 2 1 tensor_199722 tensor_199722 tensor_199723 0=2 Reshape 1227 1 1 tensor_199723 tensor_199724 0=0 1=1 Gemm 1228 1 1 tensor_199724 tensor_199726 4=0 5=1 6=1 7=0 8=2048 9=8192 10=-1 Reshape 1229 1 1 tensor_199726 tensor_199727 0=-1 BinaryOp 1230 2 1 tensor_199717 tensor_199727 tensor_199728 0=2 BinaryOp 1231 2 1 tensor_199692 tensor_199728 tensor_199729 0=0 Split 1232 1 1 tensor_199696 output_state_8_4 Split 1233 1 2 tensor_199729 tensor_199731 tensor_199732 LayerNorm 1234 1 1 tensor_199731 tensor_199733 0=2048 1=1.000000e-05 2=1 Split 1235 1 4 tensor_199733 tensor_199734 tensor_199735 tensor_199736 tensor_199737 Split 1236 1 3 state_9_0 tensor_199738 tensor_199739 tensor_199740 MemoryData 1237 0 1 blocks.9.att.time_mix_k 0=2048 21=0 Split 1238 1 2 blocks.9.att.time_mix_k tensor_199742 tensor_199743 MemoryData 1239 0 1 blocks.9.att.time_mix_v 0=2048 21=0 Split 1240 1 2 blocks.9.att.time_mix_v tensor_199745 tensor_199746 MemoryData 1241 0 1 blocks.9.att.time_mix_r 0=2048 21=0 Split 1242 1 2 blocks.9.att.time_mix_r tensor_199748 tensor_199749 BinaryOp 1243 1 1 tensor_199743 tensor_199750 0=7 1=1 2=1.000000e+00 BinaryOp 1244 2 1 tensor_199738 tensor_199750 tensor_199751 0=2 BinaryOp 1245 2 1 tensor_199734 tensor_199742 tensor_199752 0=2 BinaryOp 1246 2 1 tensor_199752 tensor_199751 tensor_199753 0=0 BinaryOp 1247 1 1 tensor_199746 tensor_199754 0=7 1=1 2=1.000000e+00 BinaryOp 1248 2 1 tensor_199739 tensor_199754 tensor_199755 0=2 BinaryOp 1249 2 1 tensor_199735 tensor_199745 tensor_199756 0=2 BinaryOp 1250 2 1 tensor_199756 tensor_199755 tensor_199757 0=0 BinaryOp 1251 1 1 tensor_199749 tensor_199758 0=7 1=1 2=1.000000e+00 BinaryOp 1252 2 1 tensor_199740 tensor_199758 tensor_199759 0=2 BinaryOp 1253 2 1 tensor_199736 tensor_199748 tensor_199760 0=2 BinaryOp 1254 2 1 tensor_199760 tensor_199759 tensor_199761 0=0 Reshape 1255 1 1 tensor_199761 tensor_199762 0=0 1=1 Gemm 1256 1 1 tensor_199762 tensor_199764 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1257 1 1 tensor_199764 tensor_199765 0=-1 Sigmoid 1258 1 1 tensor_199765 tensor_199766 Reshape 1259 1 1 tensor_199753 tensor_199767 0=0 1=1 Gemm 1260 1 1 tensor_199767 tensor_199769 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1261 1 1 tensor_199769 tensor_199770 0=-1 Split 1262 1 3 tensor_199770 tensor_199771 tensor_199772 tensor_199773 Reshape 1263 1 1 tensor_199757 tensor_199774 0=0 1=1 Gemm 1264 1 1 tensor_199774 tensor_199776 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1265 1 1 tensor_199776 tensor_199777 0=-1 Split 1266 1 2 tensor_199777 tensor_199778 tensor_199779 MemoryData 1267 0 1 blocks.9.att.time_first 0=2048 21=0 BinaryOp 1268 2 1 blocks.9.att.time_first tensor_199771 tensor_199781 0=0 Split 1269 1 2 tensor_199781 tensor_199782 tensor_199783 Split 1270 1 3 state_9_3 tensor_199784 tensor_199785 tensor_199786 BinaryOp 1271 2 1 tensor_199784 tensor_199782 tensor_199787 0=4 Split 1272 1 2 tensor_199787 tensor_199788 tensor_199789 BinaryOp 1273 2 1 tensor_199785 tensor_199788 tensor_199790 0=1 Exp 1274 1 1 tensor_199790 tensor_199791 Split 1275 1 2 tensor_199791 tensor_199792 tensor_199793 BinaryOp 1276 2 1 tensor_199783 tensor_199789 tensor_199794 0=1 Exp 1277 1 1 tensor_199794 tensor_199795 Split 1278 1 2 tensor_199795 tensor_199796 tensor_199797 Split 1279 1 2 state_9_1 tensor_199798 tensor_199799 Split 1280 1 2 state_9_2 tensor_199800 tensor_199801 BinaryOp 1281 2 1 tensor_199793 tensor_199800 tensor_199802 0=2 BinaryOp 1282 2 1 tensor_199802 tensor_199797 tensor_199803 0=0 BinaryOp 1283 2 1 tensor_199796 tensor_199778 tensor_199804 0=2 BinaryOp 1284 2 1 tensor_199792 tensor_199798 tensor_199805 0=2 BinaryOp 1285 2 1 tensor_199805 tensor_199804 tensor_199806 0=0 BinaryOp 1286 2 1 tensor_199806 tensor_199803 tensor_199807 0=3 MemoryData 1287 0 1 blocks.9.att.time_decay 0=2048 21=0 BinaryOp 1288 2 1 blocks.9.att.time_decay tensor_199786 tensor_199809 0=0 Split 1289 1 2 tensor_199809 tensor_199810 tensor_199811 BinaryOp 1290 2 1 tensor_199810 tensor_199772 tensor_199812 0=4 Split 1291 1 3 tensor_199812 tensor_199813 tensor_199814 tensor_199815 BinaryOp 1292 2 1 tensor_199811 tensor_199813 tensor_199816 0=1 Exp 1293 1 1 tensor_199816 tensor_199817 Split 1294 1 2 tensor_199817 tensor_199818 tensor_199819 BinaryOp 1295 2 1 tensor_199773 tensor_199814 tensor_199820 0=1 Exp 1296 1 1 tensor_199820 tensor_199821 Split 1297 1 2 tensor_199821 tensor_199822 tensor_199823 BinaryOp 1298 2 1 tensor_199766 tensor_199807 tensor_199824 0=2 Reshape 1299 1 1 tensor_199824 tensor_199825 0=0 1=1 Gemm 1300 1 1 tensor_199825 tensor_199827 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1301 1 1 tensor_199827 tensor_199828 0=-1 BinaryOp 1302 2 1 tensor_199732 tensor_199828 tensor_199829 0=0 BinaryOp 1303 2 1 tensor_199822 tensor_199779 tensor_199830 0=2 BinaryOp 1304 2 1 tensor_199818 tensor_199799 tensor_199831 0=2 BinaryOp 1305 2 1 tensor_199831 tensor_199830 tensor_199832 0=0 BinaryOp 1306 2 1 tensor_199819 tensor_199801 tensor_199833 0=2 BinaryOp 1307 2 1 tensor_199833 tensor_199823 tensor_199834 0=0 Split 1308 1 1 tensor_199737 output_state_9_0 Split 1309 1 1 tensor_199832 output_state_9_1 Split 1310 1 1 tensor_199834 output_state_9_2 Split 1311 1 1 tensor_199815 output_state_9_3 Split 1312 1 2 tensor_199829 tensor_199839 tensor_199840 LayerNorm 1313 1 1 tensor_199839 tensor_199841 0=2048 1=1.000000e-05 2=1 Split 1314 1 3 tensor_199841 tensor_199842 tensor_199843 tensor_199844 Split 1315 1 2 state_9_4 tensor_199845 tensor_199846 MemoryData 1316 0 1 blocks.9.ffn.time_mix_k 0=2048 21=0 Split 1317 1 2 blocks.9.ffn.time_mix_k tensor_199848 tensor_199849 MemoryData 1318 0 1 blocks.9.ffn.time_mix_r 0=2048 21=0 Split 1319 1 2 blocks.9.ffn.time_mix_r tensor_199851 tensor_199852 BinaryOp 1320 1 1 tensor_199849 tensor_199853 0=7 1=1 2=1.000000e+00 BinaryOp 1321 2 1 tensor_199845 tensor_199853 tensor_199854 0=2 BinaryOp 1322 2 1 tensor_199842 tensor_199848 tensor_199855 0=2 BinaryOp 1323 2 1 tensor_199855 tensor_199854 tensor_199856 0=0 BinaryOp 1324 1 1 tensor_199852 tensor_199857 0=7 1=1 2=1.000000e+00 BinaryOp 1325 2 1 tensor_199846 tensor_199857 tensor_199858 0=2 BinaryOp 1326 2 1 tensor_199843 tensor_199851 tensor_199859 0=2 BinaryOp 1327 2 1 tensor_199859 tensor_199858 tensor_199860 0=0 Reshape 1328 1 1 tensor_199860 tensor_199861 0=0 1=1 Gemm 1329 1 1 tensor_199861 tensor_199863 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1330 1 1 tensor_199863 tensor_199864 0=-1 Sigmoid 1331 1 1 tensor_199864 tensor_199865 Reshape 1332 1 1 tensor_199856 tensor_199866 0=0 1=1 Gemm 1333 1 1 tensor_199866 tensor_199868 4=0 5=1 6=1 7=0 8=8192 9=2048 10=-1 Reshape 1334 1 1 tensor_199868 tensor_199869 0=-1 ReLU 1335 1 1 tensor_199869 tensor_199870 BinaryOp 1336 2 1 tensor_199870 tensor_199870 tensor_199871 0=2 Reshape 1337 1 1 tensor_199871 tensor_199872 0=0 1=1 Gemm 1338 1 1 tensor_199872 tensor_199874 4=0 5=1 6=1 7=0 8=2048 9=8192 10=-1 Reshape 1339 1 1 tensor_199874 tensor_199875 0=-1 BinaryOp 1340 2 1 tensor_199865 tensor_199875 tensor_199876 0=2 BinaryOp 1341 2 1 tensor_199840 tensor_199876 tensor_199877 0=0 Split 1342 1 1 tensor_199844 output_state_9_4 Split 1343 1 2 tensor_199877 tensor_199879 tensor_199880 LayerNorm 1344 1 1 tensor_199879 tensor_199881 0=2048 1=1.000000e-05 2=1 Split 1345 1 4 tensor_199881 tensor_199882 tensor_199883 tensor_199884 tensor_199885 Split 1346 1 3 state_10_0 tensor_199886 tensor_199887 tensor_199888 MemoryData 1347 0 1 blocks.10.att.time_mix_k 0=2048 21=0 Split 1348 1 2 blocks.10.att.time_mix_k tensor_199890 tensor_199891 MemoryData 1349 0 1 blocks.10.att.time_mix_v 0=2048 21=0 Split 1350 1 2 blocks.10.att.time_mix_v tensor_199893 tensor_199894 MemoryData 1351 0 1 blocks.10.att.time_mix_r 0=2048 21=0 Split 1352 1 2 blocks.10.att.time_mix_r tensor_199896 tensor_199897 BinaryOp 1353 1 1 tensor_199891 tensor_199898 0=7 1=1 2=1.000000e+00 BinaryOp 1354 2 1 tensor_199886 tensor_199898 tensor_199899 0=2 BinaryOp 1355 2 1 tensor_199882 tensor_199890 tensor_199900 0=2 BinaryOp 1356 2 1 tensor_199900 tensor_199899 tensor_199901 0=0 BinaryOp 1357 1 1 tensor_199894 tensor_199902 0=7 1=1 2=1.000000e+00 BinaryOp 1358 2 1 tensor_199887 tensor_199902 tensor_199903 0=2 BinaryOp 1359 2 1 tensor_199883 tensor_199893 tensor_199904 0=2 BinaryOp 1360 2 1 tensor_199904 tensor_199903 tensor_199905 0=0 BinaryOp 1361 1 1 tensor_199897 tensor_199906 0=7 1=1 2=1.000000e+00 BinaryOp 1362 2 1 tensor_199888 tensor_199906 tensor_199907 0=2 BinaryOp 1363 2 1 tensor_199884 tensor_199896 tensor_199908 0=2 BinaryOp 1364 2 1 tensor_199908 tensor_199907 tensor_199909 0=0 Reshape 1365 1 1 tensor_199909 tensor_199910 0=0 1=1 Gemm 1366 1 1 tensor_199910 tensor_199912 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1367 1 1 tensor_199912 tensor_199913 0=-1 Sigmoid 1368 1 1 tensor_199913 tensor_199914 Reshape 1369 1 1 tensor_199901 tensor_199915 0=0 1=1 Gemm 1370 1 1 tensor_199915 tensor_199917 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1371 1 1 tensor_199917 tensor_199918 0=-1 Split 1372 1 3 tensor_199918 tensor_199919 tensor_199920 tensor_199921 Reshape 1373 1 1 tensor_199905 tensor_199922 0=0 1=1 Gemm 1374 1 1 tensor_199922 tensor_199924 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1375 1 1 tensor_199924 tensor_199925 0=-1 Split 1376 1 2 tensor_199925 tensor_199926 tensor_199927 MemoryData 1377 0 1 blocks.10.att.time_first 0=2048 21=0 BinaryOp 1378 2 1 blocks.10.att.time_first tensor_199919 tensor_199929 0=0 Split 1379 1 2 tensor_199929 tensor_199930 tensor_199931 Split 1380 1 3 state_10_3 tensor_199932 tensor_199933 tensor_199934 BinaryOp 1381 2 1 tensor_199932 tensor_199930 tensor_199935 0=4 Split 1382 1 2 tensor_199935 tensor_199936 tensor_199937 BinaryOp 1383 2 1 tensor_199933 tensor_199936 tensor_199938 0=1 Exp 1384 1 1 tensor_199938 tensor_199939 Split 1385 1 2 tensor_199939 tensor_199940 tensor_199941 BinaryOp 1386 2 1 tensor_199931 tensor_199937 tensor_199942 0=1 Exp 1387 1 1 tensor_199942 tensor_199943 Split 1388 1 2 tensor_199943 tensor_199944 tensor_199945 Split 1389 1 2 state_10_1 tensor_199946 tensor_199947 Split 1390 1 2 state_10_2 tensor_199948 tensor_199949 BinaryOp 1391 2 1 tensor_199941 tensor_199948 tensor_199950 0=2 BinaryOp 1392 2 1 tensor_199950 tensor_199945 tensor_199951 0=0 BinaryOp 1393 2 1 tensor_199944 tensor_199926 tensor_199952 0=2 BinaryOp 1394 2 1 tensor_199940 tensor_199946 tensor_199953 0=2 BinaryOp 1395 2 1 tensor_199953 tensor_199952 tensor_199954 0=0 BinaryOp 1396 2 1 tensor_199954 tensor_199951 tensor_199955 0=3 MemoryData 1397 0 1 blocks.10.att.time_decay 0=2048 21=0 BinaryOp 1398 2 1 blocks.10.att.time_decay tensor_199934 tensor_199957 0=0 Split 1399 1 2 tensor_199957 tensor_199958 tensor_199959 BinaryOp 1400 2 1 tensor_199958 tensor_199920 tensor_199960 0=4 Split 1401 1 3 tensor_199960 tensor_199961 tensor_199962 tensor_199963 BinaryOp 1402 2 1 tensor_199959 tensor_199961 tensor_199964 0=1 Exp 1403 1 1 tensor_199964 tensor_199965 Split 1404 1 2 tensor_199965 tensor_199966 tensor_199967 BinaryOp 1405 2 1 tensor_199921 tensor_199962 tensor_199968 0=1 Exp 1406 1 1 tensor_199968 tensor_199969 Split 1407 1 2 tensor_199969 tensor_199970 tensor_199971 BinaryOp 1408 2 1 tensor_199914 tensor_199955 tensor_199972 0=2 Reshape 1409 1 1 tensor_199972 tensor_199973 0=0 1=1 Gemm 1410 1 1 tensor_199973 tensor_199975 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1411 1 1 tensor_199975 tensor_199976 0=-1 BinaryOp 1412 2 1 tensor_199880 tensor_199976 tensor_199977 0=0 BinaryOp 1413 2 1 tensor_199970 tensor_199927 tensor_199978 0=2 BinaryOp 1414 2 1 tensor_199966 tensor_199947 tensor_199979 0=2 BinaryOp 1415 2 1 tensor_199979 tensor_199978 tensor_199980 0=0 BinaryOp 1416 2 1 tensor_199967 tensor_199949 tensor_199981 0=2 BinaryOp 1417 2 1 tensor_199981 tensor_199971 tensor_199982 0=0 Split 1418 1 1 tensor_199885 output_state_10_0 Split 1419 1 1 tensor_199980 output_state_10_1 Split 1420 1 1 tensor_199982 output_state_10_2 Split 1421 1 1 tensor_199963 output_state_10_3 Split 1422 1 2 tensor_199977 tensor_199987 tensor_199988 LayerNorm 1423 1 1 tensor_199987 tensor_199989 0=2048 1=1.000000e-05 2=1 Split 1424 1 3 tensor_199989 tensor_199990 tensor_199991 tensor_199992 Split 1425 1 2 state_10_4 tensor_199993 tensor_199994 MemoryData 1426 0 1 blocks.10.ffn.time_mix_k 0=2048 21=0 Split 1427 1 2 blocks.10.ffn.time_mix_k tensor_199996 tensor_199997 MemoryData 1428 0 1 blocks.10.ffn.time_mix_r 0=2048 21=0 Split 1429 1 2 blocks.10.ffn.time_mix_r tensor_199999 tensor_200000 BinaryOp 1430 1 1 tensor_199997 tensor_200001 0=7 1=1 2=1.000000e+00 BinaryOp 1431 2 1 tensor_199993 tensor_200001 tensor_200002 0=2 BinaryOp 1432 2 1 tensor_199990 tensor_199996 tensor_200003 0=2 BinaryOp 1433 2 1 tensor_200003 tensor_200002 tensor_200004 0=0 BinaryOp 1434 1 1 tensor_200000 tensor_200005 0=7 1=1 2=1.000000e+00 BinaryOp 1435 2 1 tensor_199994 tensor_200005 tensor_200006 0=2 BinaryOp 1436 2 1 tensor_199991 tensor_199999 tensor_200007 0=2 BinaryOp 1437 2 1 tensor_200007 tensor_200006 tensor_200008 0=0 Reshape 1438 1 1 tensor_200008 tensor_200009 0=0 1=1 Gemm 1439 1 1 tensor_200009 tensor_200011 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1440 1 1 tensor_200011 tensor_200012 0=-1 Sigmoid 1441 1 1 tensor_200012 tensor_200013 Reshape 1442 1 1 tensor_200004 tensor_200014 0=0 1=1 Gemm 1443 1 1 tensor_200014 tensor_200016 4=0 5=1 6=1 7=0 8=8192 9=2048 10=-1 Reshape 1444 1 1 tensor_200016 tensor_200017 0=-1 ReLU 1445 1 1 tensor_200017 tensor_200018 BinaryOp 1446 2 1 tensor_200018 tensor_200018 tensor_200019 0=2 Reshape 1447 1 1 tensor_200019 tensor_200020 0=0 1=1 Gemm 1448 1 1 tensor_200020 tensor_200022 4=0 5=1 6=1 7=0 8=2048 9=8192 10=-1 Reshape 1449 1 1 tensor_200022 tensor_200023 0=-1 BinaryOp 1450 2 1 tensor_200013 tensor_200023 tensor_200024 0=2 BinaryOp 1451 2 1 tensor_199988 tensor_200024 tensor_200025 0=0 Split 1452 1 1 tensor_199992 output_state_10_4 Split 1453 1 2 tensor_200025 tensor_200027 tensor_200028 LayerNorm 1454 1 1 tensor_200027 tensor_200029 0=2048 1=1.000000e-05 2=1 Split 1455 1 4 tensor_200029 tensor_200030 tensor_200031 tensor_200032 tensor_200033 Split 1456 1 3 state_11_0 tensor_200034 tensor_200035 tensor_200036 MemoryData 1457 0 1 blocks.11.att.time_mix_k 0=2048 21=0 Split 1458 1 2 blocks.11.att.time_mix_k tensor_200038 tensor_200039 MemoryData 1459 0 1 blocks.11.att.time_mix_v 0=2048 21=0 Split 1460 1 2 blocks.11.att.time_mix_v tensor_200041 tensor_200042 MemoryData 1461 0 1 blocks.11.att.time_mix_r 0=2048 21=0 Split 1462 1 2 blocks.11.att.time_mix_r tensor_200044 tensor_200045 BinaryOp 1463 1 1 tensor_200039 tensor_200046 0=7 1=1 2=1.000000e+00 BinaryOp 1464 2 1 tensor_200034 tensor_200046 tensor_200047 0=2 BinaryOp 1465 2 1 tensor_200030 tensor_200038 tensor_200048 0=2 BinaryOp 1466 2 1 tensor_200048 tensor_200047 tensor_200049 0=0 BinaryOp 1467 1 1 tensor_200042 tensor_200050 0=7 1=1 2=1.000000e+00 BinaryOp 1468 2 1 tensor_200035 tensor_200050 tensor_200051 0=2 BinaryOp 1469 2 1 tensor_200031 tensor_200041 tensor_200052 0=2 BinaryOp 1470 2 1 tensor_200052 tensor_200051 tensor_200053 0=0 BinaryOp 1471 1 1 tensor_200045 tensor_200054 0=7 1=1 2=1.000000e+00 BinaryOp 1472 2 1 tensor_200036 tensor_200054 tensor_200055 0=2 BinaryOp 1473 2 1 tensor_200032 tensor_200044 tensor_200056 0=2 BinaryOp 1474 2 1 tensor_200056 tensor_200055 tensor_200057 0=0 Reshape 1475 1 1 tensor_200057 tensor_200058 0=0 1=1 Gemm 1476 1 1 tensor_200058 tensor_200060 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1477 1 1 tensor_200060 tensor_200061 0=-1 Sigmoid 1478 1 1 tensor_200061 tensor_200062 Reshape 1479 1 1 tensor_200049 tensor_200063 0=0 1=1 Gemm 1480 1 1 tensor_200063 tensor_200065 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1481 1 1 tensor_200065 tensor_200066 0=-1 Split 1482 1 3 tensor_200066 tensor_200067 tensor_200068 tensor_200069 Reshape 1483 1 1 tensor_200053 tensor_200070 0=0 1=1 Gemm 1484 1 1 tensor_200070 tensor_200072 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1485 1 1 tensor_200072 tensor_200073 0=-1 Split 1486 1 2 tensor_200073 tensor_200074 tensor_200075 MemoryData 1487 0 1 blocks.11.att.time_first 0=2048 21=0 BinaryOp 1488 2 1 blocks.11.att.time_first tensor_200067 tensor_200077 0=0 Split 1489 1 2 tensor_200077 tensor_200078 tensor_200079 Split 1490 1 3 state_11_3 tensor_200080 tensor_200081 tensor_200082 BinaryOp 1491 2 1 tensor_200080 tensor_200078 tensor_200083 0=4 Split 1492 1 2 tensor_200083 tensor_200084 tensor_200085 BinaryOp 1493 2 1 tensor_200081 tensor_200084 tensor_200086 0=1 Exp 1494 1 1 tensor_200086 tensor_200087 Split 1495 1 2 tensor_200087 tensor_200088 tensor_200089 BinaryOp 1496 2 1 tensor_200079 tensor_200085 tensor_200090 0=1 Exp 1497 1 1 tensor_200090 tensor_200091 Split 1498 1 2 tensor_200091 tensor_200092 tensor_200093 Split 1499 1 2 state_11_1 tensor_200094 tensor_200095 Split 1500 1 2 state_11_2 tensor_200096 tensor_200097 BinaryOp 1501 2 1 tensor_200089 tensor_200096 tensor_200098 0=2 BinaryOp 1502 2 1 tensor_200098 tensor_200093 tensor_200099 0=0 BinaryOp 1503 2 1 tensor_200092 tensor_200074 tensor_200100 0=2 BinaryOp 1504 2 1 tensor_200088 tensor_200094 tensor_200101 0=2 BinaryOp 1505 2 1 tensor_200101 tensor_200100 tensor_200102 0=0 BinaryOp 1506 2 1 tensor_200102 tensor_200099 tensor_200103 0=3 MemoryData 1507 0 1 blocks.11.att.time_decay 0=2048 21=0 BinaryOp 1508 2 1 blocks.11.att.time_decay tensor_200082 tensor_200105 0=0 Split 1509 1 2 tensor_200105 tensor_200106 tensor_200107 BinaryOp 1510 2 1 tensor_200106 tensor_200068 tensor_200108 0=4 Split 1511 1 3 tensor_200108 tensor_200109 tensor_200110 tensor_200111 BinaryOp 1512 2 1 tensor_200107 tensor_200109 tensor_200112 0=1 Exp 1513 1 1 tensor_200112 tensor_200113 Split 1514 1 2 tensor_200113 tensor_200114 tensor_200115 BinaryOp 1515 2 1 tensor_200069 tensor_200110 tensor_200116 0=1 Exp 1516 1 1 tensor_200116 tensor_200117 Split 1517 1 2 tensor_200117 tensor_200118 tensor_200119 BinaryOp 1518 2 1 tensor_200062 tensor_200103 tensor_200120 0=2 Reshape 1519 1 1 tensor_200120 tensor_200121 0=0 1=1 Gemm 1520 1 1 tensor_200121 tensor_200123 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1521 1 1 tensor_200123 tensor_200124 0=-1 BinaryOp 1522 2 1 tensor_200028 tensor_200124 tensor_200125 0=0 BinaryOp 1523 2 1 tensor_200118 tensor_200075 tensor_200126 0=2 BinaryOp 1524 2 1 tensor_200114 tensor_200095 tensor_200127 0=2 BinaryOp 1525 2 1 tensor_200127 tensor_200126 tensor_200128 0=0 BinaryOp 1526 2 1 tensor_200115 tensor_200097 tensor_200129 0=2 BinaryOp 1527 2 1 tensor_200129 tensor_200119 tensor_200130 0=0 Split 1528 1 1 tensor_200033 output_state_11_0 Split 1529 1 1 tensor_200128 output_state_11_1 Split 1530 1 1 tensor_200130 output_state_11_2 Split 1531 1 1 tensor_200111 output_state_11_3 Split 1532 1 2 tensor_200125 tensor_200135 tensor_200136 LayerNorm 1533 1 1 tensor_200135 tensor_200137 0=2048 1=1.000000e-05 2=1 Split 1534 1 3 tensor_200137 tensor_200138 tensor_200139 tensor_200140 Split 1535 1 2 state_11_4 tensor_200141 tensor_200142 MemoryData 1536 0 1 blocks.11.ffn.time_mix_k 0=2048 21=0 Split 1537 1 2 blocks.11.ffn.time_mix_k tensor_200144 tensor_200145 MemoryData 1538 0 1 blocks.11.ffn.time_mix_r 0=2048 21=0 Split 1539 1 2 blocks.11.ffn.time_mix_r tensor_200147 tensor_200148 BinaryOp 1540 1 1 tensor_200145 tensor_200149 0=7 1=1 2=1.000000e+00 BinaryOp 1541 2 1 tensor_200141 tensor_200149 tensor_200150 0=2 BinaryOp 1542 2 1 tensor_200138 tensor_200144 tensor_200151 0=2 BinaryOp 1543 2 1 tensor_200151 tensor_200150 tensor_200152 0=0 BinaryOp 1544 1 1 tensor_200148 tensor_200153 0=7 1=1 2=1.000000e+00 BinaryOp 1545 2 1 tensor_200142 tensor_200153 tensor_200154 0=2 BinaryOp 1546 2 1 tensor_200139 tensor_200147 tensor_200155 0=2 BinaryOp 1547 2 1 tensor_200155 tensor_200154 tensor_200156 0=0 Reshape 1548 1 1 tensor_200156 tensor_200157 0=0 1=1 Gemm 1549 1 1 tensor_200157 tensor_200159 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1550 1 1 tensor_200159 tensor_200160 0=-1 Sigmoid 1551 1 1 tensor_200160 tensor_200161 Reshape 1552 1 1 tensor_200152 tensor_200162 0=0 1=1 Gemm 1553 1 1 tensor_200162 tensor_200164 4=0 5=1 6=1 7=0 8=8192 9=2048 10=-1 Reshape 1554 1 1 tensor_200164 tensor_200165 0=-1 ReLU 1555 1 1 tensor_200165 tensor_200166 BinaryOp 1556 2 1 tensor_200166 tensor_200166 tensor_200167 0=2 Reshape 1557 1 1 tensor_200167 tensor_200168 0=0 1=1 Gemm 1558 1 1 tensor_200168 tensor_200170 4=0 5=1 6=1 7=0 8=2048 9=8192 10=-1 Reshape 1559 1 1 tensor_200170 tensor_200171 0=-1 BinaryOp 1560 2 1 tensor_200161 tensor_200171 tensor_200172 0=2 BinaryOp 1561 2 1 tensor_200136 tensor_200172 tensor_200173 0=0 Split 1562 1 1 tensor_200140 output_state_11_4 Split 1563 1 2 tensor_200173 tensor_200175 tensor_200176 LayerNorm 1564 1 1 tensor_200175 tensor_200177 0=2048 1=1.000000e-05 2=1 Split 1565 1 4 tensor_200177 tensor_200178 tensor_200179 tensor_200180 tensor_200181 Split 1566 1 3 state_12_0 tensor_200182 tensor_200183 tensor_200184 MemoryData 1567 0 1 blocks.12.att.time_mix_k 0=2048 21=0 Split 1568 1 2 blocks.12.att.time_mix_k tensor_200186 tensor_200187 MemoryData 1569 0 1 blocks.12.att.time_mix_v 0=2048 21=0 Split 1570 1 2 blocks.12.att.time_mix_v tensor_200189 tensor_200190 MemoryData 1571 0 1 blocks.12.att.time_mix_r 0=2048 21=0 Split 1572 1 2 blocks.12.att.time_mix_r tensor_200192 tensor_200193 BinaryOp 1573 1 1 tensor_200187 tensor_200194 0=7 1=1 2=1.000000e+00 BinaryOp 1574 2 1 tensor_200182 tensor_200194 tensor_200195 0=2 BinaryOp 1575 2 1 tensor_200178 tensor_200186 tensor_200196 0=2 BinaryOp 1576 2 1 tensor_200196 tensor_200195 tensor_200197 0=0 BinaryOp 1577 1 1 tensor_200190 tensor_200198 0=7 1=1 2=1.000000e+00 BinaryOp 1578 2 1 tensor_200183 tensor_200198 tensor_200199 0=2 BinaryOp 1579 2 1 tensor_200179 tensor_200189 tensor_200200 0=2 BinaryOp 1580 2 1 tensor_200200 tensor_200199 tensor_200201 0=0 BinaryOp 1581 1 1 tensor_200193 tensor_200202 0=7 1=1 2=1.000000e+00 BinaryOp 1582 2 1 tensor_200184 tensor_200202 tensor_200203 0=2 BinaryOp 1583 2 1 tensor_200180 tensor_200192 tensor_200204 0=2 BinaryOp 1584 2 1 tensor_200204 tensor_200203 tensor_200205 0=0 Reshape 1585 1 1 tensor_200205 tensor_200206 0=0 1=1 Gemm 1586 1 1 tensor_200206 tensor_200208 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1587 1 1 tensor_200208 tensor_200209 0=-1 Sigmoid 1588 1 1 tensor_200209 tensor_200210 Reshape 1589 1 1 tensor_200197 tensor_200211 0=0 1=1 Gemm 1590 1 1 tensor_200211 tensor_200213 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1591 1 1 tensor_200213 tensor_200214 0=-1 Split 1592 1 3 tensor_200214 tensor_200215 tensor_200216 tensor_200217 Reshape 1593 1 1 tensor_200201 tensor_200218 0=0 1=1 Gemm 1594 1 1 tensor_200218 tensor_200220 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1595 1 1 tensor_200220 tensor_200221 0=-1 Split 1596 1 2 tensor_200221 tensor_200222 tensor_200223 MemoryData 1597 0 1 blocks.12.att.time_first 0=2048 21=0 BinaryOp 1598 2 1 blocks.12.att.time_first tensor_200215 tensor_200225 0=0 Split 1599 1 2 tensor_200225 tensor_200226 tensor_200227 Split 1600 1 3 state_12_3 tensor_200228 tensor_200229 tensor_200230 BinaryOp 1601 2 1 tensor_200228 tensor_200226 tensor_200231 0=4 Split 1602 1 2 tensor_200231 tensor_200232 tensor_200233 BinaryOp 1603 2 1 tensor_200229 tensor_200232 tensor_200234 0=1 Exp 1604 1 1 tensor_200234 tensor_200235 Split 1605 1 2 tensor_200235 tensor_200236 tensor_200237 BinaryOp 1606 2 1 tensor_200227 tensor_200233 tensor_200238 0=1 Exp 1607 1 1 tensor_200238 tensor_200239 Split 1608 1 2 tensor_200239 tensor_200240 tensor_200241 Split 1609 1 2 state_12_1 tensor_200242 tensor_200243 Split 1610 1 2 state_12_2 tensor_200244 tensor_200245 BinaryOp 1611 2 1 tensor_200237 tensor_200244 tensor_200246 0=2 BinaryOp 1612 2 1 tensor_200246 tensor_200241 tensor_200247 0=0 BinaryOp 1613 2 1 tensor_200240 tensor_200222 tensor_200248 0=2 BinaryOp 1614 2 1 tensor_200236 tensor_200242 tensor_200249 0=2 BinaryOp 1615 2 1 tensor_200249 tensor_200248 tensor_200250 0=0 BinaryOp 1616 2 1 tensor_200250 tensor_200247 tensor_200251 0=3 MemoryData 1617 0 1 blocks.12.att.time_decay 0=2048 21=0 BinaryOp 1618 2 1 blocks.12.att.time_decay tensor_200230 tensor_200253 0=0 Split 1619 1 2 tensor_200253 tensor_200254 tensor_200255 BinaryOp 1620 2 1 tensor_200254 tensor_200216 tensor_200256 0=4 Split 1621 1 3 tensor_200256 tensor_200257 tensor_200258 tensor_200259 BinaryOp 1622 2 1 tensor_200255 tensor_200257 tensor_200260 0=1 Exp 1623 1 1 tensor_200260 tensor_200261 Split 1624 1 2 tensor_200261 tensor_200262 tensor_200263 BinaryOp 1625 2 1 tensor_200217 tensor_200258 tensor_200264 0=1 Exp 1626 1 1 tensor_200264 tensor_200265 Split 1627 1 2 tensor_200265 tensor_200266 tensor_200267 BinaryOp 1628 2 1 tensor_200210 tensor_200251 tensor_200268 0=2 Reshape 1629 1 1 tensor_200268 tensor_200269 0=0 1=1 Gemm 1630 1 1 tensor_200269 tensor_200271 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1631 1 1 tensor_200271 tensor_200272 0=-1 BinaryOp 1632 2 1 tensor_200176 tensor_200272 tensor_200273 0=0 BinaryOp 1633 2 1 tensor_200266 tensor_200223 tensor_200274 0=2 BinaryOp 1634 2 1 tensor_200262 tensor_200243 tensor_200275 0=2 BinaryOp 1635 2 1 tensor_200275 tensor_200274 tensor_200276 0=0 BinaryOp 1636 2 1 tensor_200263 tensor_200245 tensor_200277 0=2 BinaryOp 1637 2 1 tensor_200277 tensor_200267 tensor_200278 0=0 Split 1638 1 1 tensor_200181 output_state_12_0 Split 1639 1 1 tensor_200276 output_state_12_1 Split 1640 1 1 tensor_200278 output_state_12_2 Split 1641 1 1 tensor_200259 output_state_12_3 Split 1642 1 2 tensor_200273 tensor_200283 tensor_200284 LayerNorm 1643 1 1 tensor_200283 tensor_200285 0=2048 1=1.000000e-05 2=1 Split 1644 1 3 tensor_200285 tensor_200286 tensor_200287 tensor_200288 Split 1645 1 2 state_12_4 tensor_200289 tensor_200290 MemoryData 1646 0 1 blocks.12.ffn.time_mix_k 0=2048 21=0 Split 1647 1 2 blocks.12.ffn.time_mix_k tensor_200292 tensor_200293 MemoryData 1648 0 1 blocks.12.ffn.time_mix_r 0=2048 21=0 Split 1649 1 2 blocks.12.ffn.time_mix_r tensor_200295 tensor_200296 BinaryOp 1650 1 1 tensor_200293 tensor_200297 0=7 1=1 2=1.000000e+00 BinaryOp 1651 2 1 tensor_200289 tensor_200297 tensor_200298 0=2 BinaryOp 1652 2 1 tensor_200286 tensor_200292 tensor_200299 0=2 BinaryOp 1653 2 1 tensor_200299 tensor_200298 tensor_200300 0=0 BinaryOp 1654 1 1 tensor_200296 tensor_200301 0=7 1=1 2=1.000000e+00 BinaryOp 1655 2 1 tensor_200290 tensor_200301 tensor_200302 0=2 BinaryOp 1656 2 1 tensor_200287 tensor_200295 tensor_200303 0=2 BinaryOp 1657 2 1 tensor_200303 tensor_200302 tensor_200304 0=0 Reshape 1658 1 1 tensor_200304 tensor_200305 0=0 1=1 Gemm 1659 1 1 tensor_200305 tensor_200307 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1660 1 1 tensor_200307 tensor_200308 0=-1 Sigmoid 1661 1 1 tensor_200308 tensor_200309 Reshape 1662 1 1 tensor_200300 tensor_200310 0=0 1=1 Gemm 1663 1 1 tensor_200310 tensor_200312 4=0 5=1 6=1 7=0 8=8192 9=2048 10=-1 Reshape 1664 1 1 tensor_200312 tensor_200313 0=-1 ReLU 1665 1 1 tensor_200313 tensor_200314 BinaryOp 1666 2 1 tensor_200314 tensor_200314 tensor_200315 0=2 Reshape 1667 1 1 tensor_200315 tensor_200316 0=0 1=1 Gemm 1668 1 1 tensor_200316 tensor_200318 4=0 5=1 6=1 7=0 8=2048 9=8192 10=-1 Reshape 1669 1 1 tensor_200318 tensor_200319 0=-1 BinaryOp 1670 2 1 tensor_200309 tensor_200319 tensor_200320 0=2 BinaryOp 1671 2 1 tensor_200284 tensor_200320 tensor_200321 0=0 Split 1672 1 1 tensor_200288 output_state_12_4 Split 1673 1 2 tensor_200321 tensor_200323 tensor_200324 LayerNorm 1674 1 1 tensor_200323 tensor_200325 0=2048 1=1.000000e-05 2=1 Split 1675 1 4 tensor_200325 tensor_200326 tensor_200327 tensor_200328 tensor_200329 Split 1676 1 3 state_13_0 tensor_200330 tensor_200331 tensor_200332 MemoryData 1677 0 1 blocks.13.att.time_mix_k 0=2048 21=0 Split 1678 1 2 blocks.13.att.time_mix_k tensor_200334 tensor_200335 MemoryData 1679 0 1 blocks.13.att.time_mix_v 0=2048 21=0 Split 1680 1 2 blocks.13.att.time_mix_v tensor_200337 tensor_200338 MemoryData 1681 0 1 blocks.13.att.time_mix_r 0=2048 21=0 Split 1682 1 2 blocks.13.att.time_mix_r tensor_200340 tensor_200341 BinaryOp 1683 1 1 tensor_200335 tensor_200342 0=7 1=1 2=1.000000e+00 BinaryOp 1684 2 1 tensor_200330 tensor_200342 tensor_200343 0=2 BinaryOp 1685 2 1 tensor_200326 tensor_200334 tensor_200344 0=2 BinaryOp 1686 2 1 tensor_200344 tensor_200343 tensor_200345 0=0 BinaryOp 1687 1 1 tensor_200338 tensor_200346 0=7 1=1 2=1.000000e+00 BinaryOp 1688 2 1 tensor_200331 tensor_200346 tensor_200347 0=2 BinaryOp 1689 2 1 tensor_200327 tensor_200337 tensor_200348 0=2 BinaryOp 1690 2 1 tensor_200348 tensor_200347 tensor_200349 0=0 BinaryOp 1691 1 1 tensor_200341 tensor_200350 0=7 1=1 2=1.000000e+00 BinaryOp 1692 2 1 tensor_200332 tensor_200350 tensor_200351 0=2 BinaryOp 1693 2 1 tensor_200328 tensor_200340 tensor_200352 0=2 BinaryOp 1694 2 1 tensor_200352 tensor_200351 tensor_200353 0=0 Reshape 1695 1 1 tensor_200353 tensor_200354 0=0 1=1 Gemm 1696 1 1 tensor_200354 tensor_200356 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1697 1 1 tensor_200356 tensor_200357 0=-1 Sigmoid 1698 1 1 tensor_200357 tensor_200358 Reshape 1699 1 1 tensor_200345 tensor_200359 0=0 1=1 Gemm 1700 1 1 tensor_200359 tensor_200361 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1701 1 1 tensor_200361 tensor_200362 0=-1 Split 1702 1 3 tensor_200362 tensor_200363 tensor_200364 tensor_200365 Reshape 1703 1 1 tensor_200349 tensor_200366 0=0 1=1 Gemm 1704 1 1 tensor_200366 tensor_200368 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1705 1 1 tensor_200368 tensor_200369 0=-1 Split 1706 1 2 tensor_200369 tensor_200370 tensor_200371 MemoryData 1707 0 1 blocks.13.att.time_first 0=2048 21=0 BinaryOp 1708 2 1 blocks.13.att.time_first tensor_200363 tensor_200373 0=0 Split 1709 1 2 tensor_200373 tensor_200374 tensor_200375 Split 1710 1 3 state_13_3 tensor_200376 tensor_200377 tensor_200378 BinaryOp 1711 2 1 tensor_200376 tensor_200374 tensor_200379 0=4 Split 1712 1 2 tensor_200379 tensor_200380 tensor_200381 BinaryOp 1713 2 1 tensor_200377 tensor_200380 tensor_200382 0=1 Exp 1714 1 1 tensor_200382 tensor_200383 Split 1715 1 2 tensor_200383 tensor_200384 tensor_200385 BinaryOp 1716 2 1 tensor_200375 tensor_200381 tensor_200386 0=1 Exp 1717 1 1 tensor_200386 tensor_200387 Split 1718 1 2 tensor_200387 tensor_200388 tensor_200389 Split 1719 1 2 state_13_1 tensor_200390 tensor_200391 Split 1720 1 2 state_13_2 tensor_200392 tensor_200393 BinaryOp 1721 2 1 tensor_200385 tensor_200392 tensor_200394 0=2 BinaryOp 1722 2 1 tensor_200394 tensor_200389 tensor_200395 0=0 BinaryOp 1723 2 1 tensor_200388 tensor_200370 tensor_200396 0=2 BinaryOp 1724 2 1 tensor_200384 tensor_200390 tensor_200397 0=2 BinaryOp 1725 2 1 tensor_200397 tensor_200396 tensor_200398 0=0 BinaryOp 1726 2 1 tensor_200398 tensor_200395 tensor_200399 0=3 MemoryData 1727 0 1 blocks.13.att.time_decay 0=2048 21=0 BinaryOp 1728 2 1 blocks.13.att.time_decay tensor_200378 tensor_200401 0=0 Split 1729 1 2 tensor_200401 tensor_200402 tensor_200403 BinaryOp 1730 2 1 tensor_200402 tensor_200364 tensor_200404 0=4 Split 1731 1 3 tensor_200404 tensor_200405 tensor_200406 tensor_200407 BinaryOp 1732 2 1 tensor_200403 tensor_200405 tensor_200408 0=1 Exp 1733 1 1 tensor_200408 tensor_200409 Split 1734 1 2 tensor_200409 tensor_200410 tensor_200411 BinaryOp 1735 2 1 tensor_200365 tensor_200406 tensor_200412 0=1 Exp 1736 1 1 tensor_200412 tensor_200413 Split 1737 1 2 tensor_200413 tensor_200414 tensor_200415 BinaryOp 1738 2 1 tensor_200358 tensor_200399 tensor_200416 0=2 Reshape 1739 1 1 tensor_200416 tensor_200417 0=0 1=1 Gemm 1740 1 1 tensor_200417 tensor_200419 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1741 1 1 tensor_200419 tensor_200420 0=-1 BinaryOp 1742 2 1 tensor_200324 tensor_200420 tensor_200421 0=0 BinaryOp 1743 2 1 tensor_200414 tensor_200371 tensor_200422 0=2 BinaryOp 1744 2 1 tensor_200410 tensor_200391 tensor_200423 0=2 BinaryOp 1745 2 1 tensor_200423 tensor_200422 tensor_200424 0=0 BinaryOp 1746 2 1 tensor_200411 tensor_200393 tensor_200425 0=2 BinaryOp 1747 2 1 tensor_200425 tensor_200415 tensor_200426 0=0 Split 1748 1 1 tensor_200329 output_state_13_0 Split 1749 1 1 tensor_200424 output_state_13_1 Split 1750 1 1 tensor_200426 output_state_13_2 Split 1751 1 1 tensor_200407 output_state_13_3 Split 1752 1 2 tensor_200421 tensor_200431 tensor_200432 LayerNorm 1753 1 1 tensor_200431 tensor_200433 0=2048 1=1.000000e-05 2=1 Split 1754 1 3 tensor_200433 tensor_200434 tensor_200435 tensor_200436 Split 1755 1 2 state_13_4 tensor_200437 tensor_200438 MemoryData 1756 0 1 blocks.13.ffn.time_mix_k 0=2048 21=0 Split 1757 1 2 blocks.13.ffn.time_mix_k tensor_200440 tensor_200441 MemoryData 1758 0 1 blocks.13.ffn.time_mix_r 0=2048 21=0 Split 1759 1 2 blocks.13.ffn.time_mix_r tensor_200443 tensor_200444 BinaryOp 1760 1 1 tensor_200441 tensor_200445 0=7 1=1 2=1.000000e+00 BinaryOp 1761 2 1 tensor_200437 tensor_200445 tensor_200446 0=2 BinaryOp 1762 2 1 tensor_200434 tensor_200440 tensor_200447 0=2 BinaryOp 1763 2 1 tensor_200447 tensor_200446 tensor_200448 0=0 BinaryOp 1764 1 1 tensor_200444 tensor_200449 0=7 1=1 2=1.000000e+00 BinaryOp 1765 2 1 tensor_200438 tensor_200449 tensor_200450 0=2 BinaryOp 1766 2 1 tensor_200435 tensor_200443 tensor_200451 0=2 BinaryOp 1767 2 1 tensor_200451 tensor_200450 tensor_200452 0=0 Reshape 1768 1 1 tensor_200452 tensor_200453 0=0 1=1 Gemm 1769 1 1 tensor_200453 tensor_200455 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1770 1 1 tensor_200455 tensor_200456 0=-1 Sigmoid 1771 1 1 tensor_200456 tensor_200457 Reshape 1772 1 1 tensor_200448 tensor_200458 0=0 1=1 Gemm 1773 1 1 tensor_200458 tensor_200460 4=0 5=1 6=1 7=0 8=8192 9=2048 10=-1 Reshape 1774 1 1 tensor_200460 tensor_200461 0=-1 ReLU 1775 1 1 tensor_200461 tensor_200462 BinaryOp 1776 2 1 tensor_200462 tensor_200462 tensor_200463 0=2 Reshape 1777 1 1 tensor_200463 tensor_200464 0=0 1=1 Gemm 1778 1 1 tensor_200464 tensor_200466 4=0 5=1 6=1 7=0 8=2048 9=8192 10=-1 Reshape 1779 1 1 tensor_200466 tensor_200467 0=-1 BinaryOp 1780 2 1 tensor_200457 tensor_200467 tensor_200468 0=2 BinaryOp 1781 2 1 tensor_200432 tensor_200468 tensor_200469 0=0 Split 1782 1 1 tensor_200436 output_state_13_4 Split 1783 1 2 tensor_200469 tensor_200471 tensor_200472 LayerNorm 1784 1 1 tensor_200471 tensor_200473 0=2048 1=1.000000e-05 2=1 Split 1785 1 4 tensor_200473 tensor_200474 tensor_200475 tensor_200476 tensor_200477 Split 1786 1 3 state_14_0 tensor_200478 tensor_200479 tensor_200480 MemoryData 1787 0 1 blocks.14.att.time_mix_k 0=2048 21=0 Split 1788 1 2 blocks.14.att.time_mix_k tensor_200482 tensor_200483 MemoryData 1789 0 1 blocks.14.att.time_mix_v 0=2048 21=0 Split 1790 1 2 blocks.14.att.time_mix_v tensor_200485 tensor_200486 MemoryData 1791 0 1 blocks.14.att.time_mix_r 0=2048 21=0 Split 1792 1 2 blocks.14.att.time_mix_r tensor_200488 tensor_200489 BinaryOp 1793 1 1 tensor_200483 tensor_200490 0=7 1=1 2=1.000000e+00 BinaryOp 1794 2 1 tensor_200478 tensor_200490 tensor_200491 0=2 BinaryOp 1795 2 1 tensor_200474 tensor_200482 tensor_200492 0=2 BinaryOp 1796 2 1 tensor_200492 tensor_200491 tensor_200493 0=0 BinaryOp 1797 1 1 tensor_200486 tensor_200494 0=7 1=1 2=1.000000e+00 BinaryOp 1798 2 1 tensor_200479 tensor_200494 tensor_200495 0=2 BinaryOp 1799 2 1 tensor_200475 tensor_200485 tensor_200496 0=2 BinaryOp 1800 2 1 tensor_200496 tensor_200495 tensor_200497 0=0 BinaryOp 1801 1 1 tensor_200489 tensor_200498 0=7 1=1 2=1.000000e+00 BinaryOp 1802 2 1 tensor_200480 tensor_200498 tensor_200499 0=2 BinaryOp 1803 2 1 tensor_200476 tensor_200488 tensor_200500 0=2 BinaryOp 1804 2 1 tensor_200500 tensor_200499 tensor_200501 0=0 Reshape 1805 1 1 tensor_200501 tensor_200502 0=0 1=1 Gemm 1806 1 1 tensor_200502 tensor_200504 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1807 1 1 tensor_200504 tensor_200505 0=-1 Sigmoid 1808 1 1 tensor_200505 tensor_200506 Reshape 1809 1 1 tensor_200493 tensor_200507 0=0 1=1 Gemm 1810 1 1 tensor_200507 tensor_200509 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1811 1 1 tensor_200509 tensor_200510 0=-1 Split 1812 1 3 tensor_200510 tensor_200511 tensor_200512 tensor_200513 Reshape 1813 1 1 tensor_200497 tensor_200514 0=0 1=1 Gemm 1814 1 1 tensor_200514 tensor_200516 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1815 1 1 tensor_200516 tensor_200517 0=-1 Split 1816 1 2 tensor_200517 tensor_200518 tensor_200519 MemoryData 1817 0 1 blocks.14.att.time_first 0=2048 21=0 BinaryOp 1818 2 1 blocks.14.att.time_first tensor_200511 tensor_200521 0=0 Split 1819 1 2 tensor_200521 tensor_200522 tensor_200523 Split 1820 1 3 state_14_3 tensor_200524 tensor_200525 tensor_200526 BinaryOp 1821 2 1 tensor_200524 tensor_200522 tensor_200527 0=4 Split 1822 1 2 tensor_200527 tensor_200528 tensor_200529 BinaryOp 1823 2 1 tensor_200525 tensor_200528 tensor_200530 0=1 Exp 1824 1 1 tensor_200530 tensor_200531 Split 1825 1 2 tensor_200531 tensor_200532 tensor_200533 BinaryOp 1826 2 1 tensor_200523 tensor_200529 tensor_200534 0=1 Exp 1827 1 1 tensor_200534 tensor_200535 Split 1828 1 2 tensor_200535 tensor_200536 tensor_200537 Split 1829 1 2 state_14_1 tensor_200538 tensor_200539 Split 1830 1 2 state_14_2 tensor_200540 tensor_200541 BinaryOp 1831 2 1 tensor_200533 tensor_200540 tensor_200542 0=2 BinaryOp 1832 2 1 tensor_200542 tensor_200537 tensor_200543 0=0 BinaryOp 1833 2 1 tensor_200536 tensor_200518 tensor_200544 0=2 BinaryOp 1834 2 1 tensor_200532 tensor_200538 tensor_200545 0=2 BinaryOp 1835 2 1 tensor_200545 tensor_200544 tensor_200546 0=0 BinaryOp 1836 2 1 tensor_200546 tensor_200543 tensor_200547 0=3 MemoryData 1837 0 1 blocks.14.att.time_decay 0=2048 21=0 BinaryOp 1838 2 1 blocks.14.att.time_decay tensor_200526 tensor_200549 0=0 Split 1839 1 2 tensor_200549 tensor_200550 tensor_200551 BinaryOp 1840 2 1 tensor_200550 tensor_200512 tensor_200552 0=4 Split 1841 1 3 tensor_200552 tensor_200553 tensor_200554 tensor_200555 BinaryOp 1842 2 1 tensor_200551 tensor_200553 tensor_200556 0=1 Exp 1843 1 1 tensor_200556 tensor_200557 Split 1844 1 2 tensor_200557 tensor_200558 tensor_200559 BinaryOp 1845 2 1 tensor_200513 tensor_200554 tensor_200560 0=1 Exp 1846 1 1 tensor_200560 tensor_200561 Split 1847 1 2 tensor_200561 tensor_200562 tensor_200563 BinaryOp 1848 2 1 tensor_200506 tensor_200547 tensor_200564 0=2 Reshape 1849 1 1 tensor_200564 tensor_200565 0=0 1=1 Gemm 1850 1 1 tensor_200565 tensor_200567 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1851 1 1 tensor_200567 tensor_200568 0=-1 BinaryOp 1852 2 1 tensor_200472 tensor_200568 tensor_200569 0=0 BinaryOp 1853 2 1 tensor_200562 tensor_200519 tensor_200570 0=2 BinaryOp 1854 2 1 tensor_200558 tensor_200539 tensor_200571 0=2 BinaryOp 1855 2 1 tensor_200571 tensor_200570 tensor_200572 0=0 BinaryOp 1856 2 1 tensor_200559 tensor_200541 tensor_200573 0=2 BinaryOp 1857 2 1 tensor_200573 tensor_200563 tensor_200574 0=0 Split 1858 1 1 tensor_200477 output_state_14_0 Split 1859 1 1 tensor_200572 output_state_14_1 Split 1860 1 1 tensor_200574 output_state_14_2 Split 1861 1 1 tensor_200555 output_state_14_3 Split 1862 1 2 tensor_200569 tensor_200579 tensor_200580 LayerNorm 1863 1 1 tensor_200579 tensor_200581 0=2048 1=1.000000e-05 2=1 Split 1864 1 3 tensor_200581 tensor_200582 tensor_200583 tensor_200584 Split 1865 1 2 state_14_4 tensor_200585 tensor_200586 MemoryData 1866 0 1 blocks.14.ffn.time_mix_k 0=2048 21=0 Split 1867 1 2 blocks.14.ffn.time_mix_k tensor_200588 tensor_200589 MemoryData 1868 0 1 blocks.14.ffn.time_mix_r 0=2048 21=0 Split 1869 1 2 blocks.14.ffn.time_mix_r tensor_200591 tensor_200592 BinaryOp 1870 1 1 tensor_200589 tensor_200593 0=7 1=1 2=1.000000e+00 BinaryOp 1871 2 1 tensor_200585 tensor_200593 tensor_200594 0=2 BinaryOp 1872 2 1 tensor_200582 tensor_200588 tensor_200595 0=2 BinaryOp 1873 2 1 tensor_200595 tensor_200594 tensor_200596 0=0 BinaryOp 1874 1 1 tensor_200592 tensor_200597 0=7 1=1 2=1.000000e+00 BinaryOp 1875 2 1 tensor_200586 tensor_200597 tensor_200598 0=2 BinaryOp 1876 2 1 tensor_200583 tensor_200591 tensor_200599 0=2 BinaryOp 1877 2 1 tensor_200599 tensor_200598 tensor_200600 0=0 Reshape 1878 1 1 tensor_200600 tensor_200601 0=0 1=1 Gemm 1879 1 1 tensor_200601 tensor_200603 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1880 1 1 tensor_200603 tensor_200604 0=-1 Sigmoid 1881 1 1 tensor_200604 tensor_200605 Reshape 1882 1 1 tensor_200596 tensor_200606 0=0 1=1 Gemm 1883 1 1 tensor_200606 tensor_200608 4=0 5=1 6=1 7=0 8=8192 9=2048 10=-1 Reshape 1884 1 1 tensor_200608 tensor_200609 0=-1 ReLU 1885 1 1 tensor_200609 tensor_200610 BinaryOp 1886 2 1 tensor_200610 tensor_200610 tensor_200611 0=2 Reshape 1887 1 1 tensor_200611 tensor_200612 0=0 1=1 Gemm 1888 1 1 tensor_200612 tensor_200614 4=0 5=1 6=1 7=0 8=2048 9=8192 10=-1 Reshape 1889 1 1 tensor_200614 tensor_200615 0=-1 BinaryOp 1890 2 1 tensor_200605 tensor_200615 tensor_200616 0=2 BinaryOp 1891 2 1 tensor_200580 tensor_200616 tensor_200617 0=0 Split 1892 1 1 tensor_200584 output_state_14_4 Split 1893 1 2 tensor_200617 tensor_200619 tensor_200620 LayerNorm 1894 1 1 tensor_200619 tensor_200621 0=2048 1=1.000000e-05 2=1 Split 1895 1 4 tensor_200621 tensor_200622 tensor_200623 tensor_200624 tensor_200625 Split 1896 1 3 state_15_0 tensor_200626 tensor_200627 tensor_200628 MemoryData 1897 0 1 blocks.15.att.time_mix_k 0=2048 21=0 Split 1898 1 2 blocks.15.att.time_mix_k tensor_200630 tensor_200631 MemoryData 1899 0 1 blocks.15.att.time_mix_v 0=2048 21=0 Split 1900 1 2 blocks.15.att.time_mix_v tensor_200633 tensor_200634 MemoryData 1901 0 1 blocks.15.att.time_mix_r 0=2048 21=0 Split 1902 1 2 blocks.15.att.time_mix_r tensor_200636 tensor_200637 BinaryOp 1903 1 1 tensor_200631 tensor_200638 0=7 1=1 2=1.000000e+00 BinaryOp 1904 2 1 tensor_200626 tensor_200638 tensor_200639 0=2 BinaryOp 1905 2 1 tensor_200622 tensor_200630 tensor_200640 0=2 BinaryOp 1906 2 1 tensor_200640 tensor_200639 tensor_200641 0=0 BinaryOp 1907 1 1 tensor_200634 tensor_200642 0=7 1=1 2=1.000000e+00 BinaryOp 1908 2 1 tensor_200627 tensor_200642 tensor_200643 0=2 BinaryOp 1909 2 1 tensor_200623 tensor_200633 tensor_200644 0=2 BinaryOp 1910 2 1 tensor_200644 tensor_200643 tensor_200645 0=0 BinaryOp 1911 1 1 tensor_200637 tensor_200646 0=7 1=1 2=1.000000e+00 BinaryOp 1912 2 1 tensor_200628 tensor_200646 tensor_200647 0=2 BinaryOp 1913 2 1 tensor_200624 tensor_200636 tensor_200648 0=2 BinaryOp 1914 2 1 tensor_200648 tensor_200647 tensor_200649 0=0 Reshape 1915 1 1 tensor_200649 tensor_200650 0=0 1=1 Gemm 1916 1 1 tensor_200650 tensor_200652 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1917 1 1 tensor_200652 tensor_200653 0=-1 Sigmoid 1918 1 1 tensor_200653 tensor_200654 Reshape 1919 1 1 tensor_200641 tensor_200655 0=0 1=1 Gemm 1920 1 1 tensor_200655 tensor_200657 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1921 1 1 tensor_200657 tensor_200658 0=-1 Split 1922 1 3 tensor_200658 tensor_200659 tensor_200660 tensor_200661 Reshape 1923 1 1 tensor_200645 tensor_200662 0=0 1=1 Gemm 1924 1 1 tensor_200662 tensor_200664 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1925 1 1 tensor_200664 tensor_200665 0=-1 Split 1926 1 2 tensor_200665 tensor_200666 tensor_200667 MemoryData 1927 0 1 blocks.15.att.time_first 0=2048 21=0 BinaryOp 1928 2 1 blocks.15.att.time_first tensor_200659 tensor_200669 0=0 Split 1929 1 2 tensor_200669 tensor_200670 tensor_200671 Split 1930 1 3 state_15_3 tensor_200672 tensor_200673 tensor_200674 BinaryOp 1931 2 1 tensor_200672 tensor_200670 tensor_200675 0=4 Split 1932 1 2 tensor_200675 tensor_200676 tensor_200677 BinaryOp 1933 2 1 tensor_200673 tensor_200676 tensor_200678 0=1 Exp 1934 1 1 tensor_200678 tensor_200679 Split 1935 1 2 tensor_200679 tensor_200680 tensor_200681 BinaryOp 1936 2 1 tensor_200671 tensor_200677 tensor_200682 0=1 Exp 1937 1 1 tensor_200682 tensor_200683 Split 1938 1 2 tensor_200683 tensor_200684 tensor_200685 Split 1939 1 2 state_15_1 tensor_200686 tensor_200687 Split 1940 1 2 state_15_2 tensor_200688 tensor_200689 BinaryOp 1941 2 1 tensor_200681 tensor_200688 tensor_200690 0=2 BinaryOp 1942 2 1 tensor_200690 tensor_200685 tensor_200691 0=0 BinaryOp 1943 2 1 tensor_200684 tensor_200666 tensor_200692 0=2 BinaryOp 1944 2 1 tensor_200680 tensor_200686 tensor_200693 0=2 BinaryOp 1945 2 1 tensor_200693 tensor_200692 tensor_200694 0=0 BinaryOp 1946 2 1 tensor_200694 tensor_200691 tensor_200695 0=3 MemoryData 1947 0 1 blocks.15.att.time_decay 0=2048 21=0 BinaryOp 1948 2 1 blocks.15.att.time_decay tensor_200674 tensor_200697 0=0 Split 1949 1 2 tensor_200697 tensor_200698 tensor_200699 BinaryOp 1950 2 1 tensor_200698 tensor_200660 tensor_200700 0=4 Split 1951 1 3 tensor_200700 tensor_200701 tensor_200702 tensor_200703 BinaryOp 1952 2 1 tensor_200699 tensor_200701 tensor_200704 0=1 Exp 1953 1 1 tensor_200704 tensor_200705 Split 1954 1 2 tensor_200705 tensor_200706 tensor_200707 BinaryOp 1955 2 1 tensor_200661 tensor_200702 tensor_200708 0=1 Exp 1956 1 1 tensor_200708 tensor_200709 Split 1957 1 2 tensor_200709 tensor_200710 tensor_200711 BinaryOp 1958 2 1 tensor_200654 tensor_200695 tensor_200712 0=2 Reshape 1959 1 1 tensor_200712 tensor_200713 0=0 1=1 Gemm 1960 1 1 tensor_200713 tensor_200715 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1961 1 1 tensor_200715 tensor_200716 0=-1 BinaryOp 1962 2 1 tensor_200620 tensor_200716 tensor_200717 0=0 BinaryOp 1963 2 1 tensor_200710 tensor_200667 tensor_200718 0=2 BinaryOp 1964 2 1 tensor_200706 tensor_200687 tensor_200719 0=2 BinaryOp 1965 2 1 tensor_200719 tensor_200718 tensor_200720 0=0 BinaryOp 1966 2 1 tensor_200707 tensor_200689 tensor_200721 0=2 BinaryOp 1967 2 1 tensor_200721 tensor_200711 tensor_200722 0=0 Split 1968 1 1 tensor_200625 output_state_15_0 Split 1969 1 1 tensor_200720 output_state_15_1 Split 1970 1 1 tensor_200722 output_state_15_2 Split 1971 1 1 tensor_200703 output_state_15_3 Split 1972 1 2 tensor_200717 tensor_200727 tensor_200728 LayerNorm 1973 1 1 tensor_200727 tensor_200729 0=2048 1=1.000000e-05 2=1 Split 1974 1 3 tensor_200729 tensor_200730 tensor_200731 tensor_200732 Split 1975 1 2 state_15_4 tensor_200733 tensor_200734 MemoryData 1976 0 1 blocks.15.ffn.time_mix_k 0=2048 21=0 Split 1977 1 2 blocks.15.ffn.time_mix_k tensor_200736 tensor_200737 MemoryData 1978 0 1 blocks.15.ffn.time_mix_r 0=2048 21=0 Split 1979 1 2 blocks.15.ffn.time_mix_r tensor_200739 tensor_200740 BinaryOp 1980 1 1 tensor_200737 tensor_200741 0=7 1=1 2=1.000000e+00 BinaryOp 1981 2 1 tensor_200733 tensor_200741 tensor_200742 0=2 BinaryOp 1982 2 1 tensor_200730 tensor_200736 tensor_200743 0=2 BinaryOp 1983 2 1 tensor_200743 tensor_200742 tensor_200744 0=0 BinaryOp 1984 1 1 tensor_200740 tensor_200745 0=7 1=1 2=1.000000e+00 BinaryOp 1985 2 1 tensor_200734 tensor_200745 tensor_200746 0=2 BinaryOp 1986 2 1 tensor_200731 tensor_200739 tensor_200747 0=2 BinaryOp 1987 2 1 tensor_200747 tensor_200746 tensor_200748 0=0 Reshape 1988 1 1 tensor_200748 tensor_200749 0=0 1=1 Gemm 1989 1 1 tensor_200749 tensor_200751 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 1990 1 1 tensor_200751 tensor_200752 0=-1 Sigmoid 1991 1 1 tensor_200752 tensor_200753 Reshape 1992 1 1 tensor_200744 tensor_200754 0=0 1=1 Gemm 1993 1 1 tensor_200754 tensor_200756 4=0 5=1 6=1 7=0 8=8192 9=2048 10=-1 Reshape 1994 1 1 tensor_200756 tensor_200757 0=-1 ReLU 1995 1 1 tensor_200757 tensor_200758 BinaryOp 1996 2 1 tensor_200758 tensor_200758 tensor_200759 0=2 Reshape 1997 1 1 tensor_200759 tensor_200760 0=0 1=1 Gemm 1998 1 1 tensor_200760 tensor_200762 4=0 5=1 6=1 7=0 8=2048 9=8192 10=-1 Reshape 1999 1 1 tensor_200762 tensor_200763 0=-1 BinaryOp 2000 2 1 tensor_200753 tensor_200763 tensor_200764 0=2 BinaryOp 2001 2 1 tensor_200728 tensor_200764 tensor_200765 0=0 Split 2002 1 1 tensor_200732 output_state_15_4 Split 2003 1 2 tensor_200765 tensor_200767 tensor_200768 LayerNorm 2004 1 1 tensor_200767 tensor_200769 0=2048 1=1.000000e-05 2=1 Split 2005 1 4 tensor_200769 tensor_200770 tensor_200771 tensor_200772 tensor_200773 Split 2006 1 3 state_16_0 tensor_200774 tensor_200775 tensor_200776 MemoryData 2007 0 1 blocks.16.att.time_mix_k 0=2048 21=0 Split 2008 1 2 blocks.16.att.time_mix_k tensor_200778 tensor_200779 MemoryData 2009 0 1 blocks.16.att.time_mix_v 0=2048 21=0 Split 2010 1 2 blocks.16.att.time_mix_v tensor_200781 tensor_200782 MemoryData 2011 0 1 blocks.16.att.time_mix_r 0=2048 21=0 Split 2012 1 2 blocks.16.att.time_mix_r tensor_200784 tensor_200785 BinaryOp 2013 1 1 tensor_200779 tensor_200786 0=7 1=1 2=1.000000e+00 BinaryOp 2014 2 1 tensor_200774 tensor_200786 tensor_200787 0=2 BinaryOp 2015 2 1 tensor_200770 tensor_200778 tensor_200788 0=2 BinaryOp 2016 2 1 tensor_200788 tensor_200787 tensor_200789 0=0 BinaryOp 2017 1 1 tensor_200782 tensor_200790 0=7 1=1 2=1.000000e+00 BinaryOp 2018 2 1 tensor_200775 tensor_200790 tensor_200791 0=2 BinaryOp 2019 2 1 tensor_200771 tensor_200781 tensor_200792 0=2 BinaryOp 2020 2 1 tensor_200792 tensor_200791 tensor_200793 0=0 BinaryOp 2021 1 1 tensor_200785 tensor_200794 0=7 1=1 2=1.000000e+00 BinaryOp 2022 2 1 tensor_200776 tensor_200794 tensor_200795 0=2 BinaryOp 2023 2 1 tensor_200772 tensor_200784 tensor_200796 0=2 BinaryOp 2024 2 1 tensor_200796 tensor_200795 tensor_200797 0=0 Reshape 2025 1 1 tensor_200797 tensor_200798 0=0 1=1 Gemm 2026 1 1 tensor_200798 tensor_200800 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 2027 1 1 tensor_200800 tensor_200801 0=-1 Sigmoid 2028 1 1 tensor_200801 tensor_200802 Reshape 2029 1 1 tensor_200789 tensor_200803 0=0 1=1 Gemm 2030 1 1 tensor_200803 tensor_200805 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 2031 1 1 tensor_200805 tensor_200806 0=-1 Split 2032 1 3 tensor_200806 tensor_200807 tensor_200808 tensor_200809 Reshape 2033 1 1 tensor_200793 tensor_200810 0=0 1=1 Gemm 2034 1 1 tensor_200810 tensor_200812 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 2035 1 1 tensor_200812 tensor_200813 0=-1 Split 2036 1 2 tensor_200813 tensor_200814 tensor_200815 MemoryData 2037 0 1 blocks.16.att.time_first 0=2048 21=0 BinaryOp 2038 2 1 blocks.16.att.time_first tensor_200807 tensor_200817 0=0 Split 2039 1 2 tensor_200817 tensor_200818 tensor_200819 Split 2040 1 3 state_16_3 tensor_200820 tensor_200821 tensor_200822 BinaryOp 2041 2 1 tensor_200820 tensor_200818 tensor_200823 0=4 Split 2042 1 2 tensor_200823 tensor_200824 tensor_200825 BinaryOp 2043 2 1 tensor_200821 tensor_200824 tensor_200826 0=1 Exp 2044 1 1 tensor_200826 tensor_200827 Split 2045 1 2 tensor_200827 tensor_200828 tensor_200829 BinaryOp 2046 2 1 tensor_200819 tensor_200825 tensor_200830 0=1 Exp 2047 1 1 tensor_200830 tensor_200831 Split 2048 1 2 tensor_200831 tensor_200832 tensor_200833 Split 2049 1 2 state_16_1 tensor_200834 tensor_200835 Split 2050 1 2 state_16_2 tensor_200836 tensor_200837 BinaryOp 2051 2 1 tensor_200829 tensor_200836 tensor_200838 0=2 BinaryOp 2052 2 1 tensor_200838 tensor_200833 tensor_200839 0=0 BinaryOp 2053 2 1 tensor_200832 tensor_200814 tensor_200840 0=2 BinaryOp 2054 2 1 tensor_200828 tensor_200834 tensor_200841 0=2 BinaryOp 2055 2 1 tensor_200841 tensor_200840 tensor_200842 0=0 BinaryOp 2056 2 1 tensor_200842 tensor_200839 tensor_200843 0=3 MemoryData 2057 0 1 blocks.16.att.time_decay 0=2048 21=0 BinaryOp 2058 2 1 blocks.16.att.time_decay tensor_200822 tensor_200845 0=0 Split 2059 1 2 tensor_200845 tensor_200846 tensor_200847 BinaryOp 2060 2 1 tensor_200846 tensor_200808 tensor_200848 0=4 Split 2061 1 3 tensor_200848 tensor_200849 tensor_200850 tensor_200851 BinaryOp 2062 2 1 tensor_200847 tensor_200849 tensor_200852 0=1 Exp 2063 1 1 tensor_200852 tensor_200853 Split 2064 1 2 tensor_200853 tensor_200854 tensor_200855 BinaryOp 2065 2 1 tensor_200809 tensor_200850 tensor_200856 0=1 Exp 2066 1 1 tensor_200856 tensor_200857 Split 2067 1 2 tensor_200857 tensor_200858 tensor_200859 BinaryOp 2068 2 1 tensor_200802 tensor_200843 tensor_200860 0=2 Reshape 2069 1 1 tensor_200860 tensor_200861 0=0 1=1 Gemm 2070 1 1 tensor_200861 tensor_200863 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 2071 1 1 tensor_200863 tensor_200864 0=-1 BinaryOp 2072 2 1 tensor_200768 tensor_200864 tensor_200865 0=0 BinaryOp 2073 2 1 tensor_200858 tensor_200815 tensor_200866 0=2 BinaryOp 2074 2 1 tensor_200854 tensor_200835 tensor_200867 0=2 BinaryOp 2075 2 1 tensor_200867 tensor_200866 tensor_200868 0=0 BinaryOp 2076 2 1 tensor_200855 tensor_200837 tensor_200869 0=2 BinaryOp 2077 2 1 tensor_200869 tensor_200859 tensor_200870 0=0 Split 2078 1 1 tensor_200773 output_state_16_0 Split 2079 1 1 tensor_200868 output_state_16_1 Split 2080 1 1 tensor_200870 output_state_16_2 Split 2081 1 1 tensor_200851 output_state_16_3 Split 2082 1 2 tensor_200865 tensor_200875 tensor_200876 LayerNorm 2083 1 1 tensor_200875 tensor_200877 0=2048 1=1.000000e-05 2=1 Split 2084 1 3 tensor_200877 tensor_200878 tensor_200879 tensor_200880 Split 2085 1 2 state_16_4 tensor_200881 tensor_200882 MemoryData 2086 0 1 blocks.16.ffn.time_mix_k 0=2048 21=0 Split 2087 1 2 blocks.16.ffn.time_mix_k tensor_200884 tensor_200885 MemoryData 2088 0 1 blocks.16.ffn.time_mix_r 0=2048 21=0 Split 2089 1 2 blocks.16.ffn.time_mix_r tensor_200887 tensor_200888 BinaryOp 2090 1 1 tensor_200885 tensor_200889 0=7 1=1 2=1.000000e+00 BinaryOp 2091 2 1 tensor_200881 tensor_200889 tensor_200890 0=2 BinaryOp 2092 2 1 tensor_200878 tensor_200884 tensor_200891 0=2 BinaryOp 2093 2 1 tensor_200891 tensor_200890 tensor_200892 0=0 BinaryOp 2094 1 1 tensor_200888 tensor_200893 0=7 1=1 2=1.000000e+00 BinaryOp 2095 2 1 tensor_200882 tensor_200893 tensor_200894 0=2 BinaryOp 2096 2 1 tensor_200879 tensor_200887 tensor_200895 0=2 BinaryOp 2097 2 1 tensor_200895 tensor_200894 tensor_200896 0=0 Reshape 2098 1 1 tensor_200896 tensor_200897 0=0 1=1 Gemm 2099 1 1 tensor_200897 tensor_200899 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 2100 1 1 tensor_200899 tensor_200900 0=-1 Sigmoid 2101 1 1 tensor_200900 tensor_200901 Reshape 2102 1 1 tensor_200892 tensor_200902 0=0 1=1 Gemm 2103 1 1 tensor_200902 tensor_200904 4=0 5=1 6=1 7=0 8=8192 9=2048 10=-1 Reshape 2104 1 1 tensor_200904 tensor_200905 0=-1 ReLU 2105 1 1 tensor_200905 tensor_200906 BinaryOp 2106 2 1 tensor_200906 tensor_200906 tensor_200907 0=2 Reshape 2107 1 1 tensor_200907 tensor_200908 0=0 1=1 Gemm 2108 1 1 tensor_200908 tensor_200910 4=0 5=1 6=1 7=0 8=2048 9=8192 10=-1 Reshape 2109 1 1 tensor_200910 tensor_200911 0=-1 BinaryOp 2110 2 1 tensor_200901 tensor_200911 tensor_200912 0=2 BinaryOp 2111 2 1 tensor_200876 tensor_200912 tensor_200913 0=0 Split 2112 1 1 tensor_200880 output_state_16_4 Split 2113 1 2 tensor_200913 tensor_200915 tensor_200916 LayerNorm 2114 1 1 tensor_200915 tensor_200917 0=2048 1=1.000000e-05 2=1 Split 2115 1 4 tensor_200917 tensor_200918 tensor_200919 tensor_200920 tensor_200921 Split 2116 1 3 state_17_0 tensor_200922 tensor_200923 tensor_200924 MemoryData 2117 0 1 blocks.17.att.time_mix_k 0=2048 21=0 Split 2118 1 2 blocks.17.att.time_mix_k tensor_200926 tensor_200927 MemoryData 2119 0 1 blocks.17.att.time_mix_v 0=2048 21=0 Split 2120 1 2 blocks.17.att.time_mix_v tensor_200929 tensor_200930 MemoryData 2121 0 1 blocks.17.att.time_mix_r 0=2048 21=0 Split 2122 1 2 blocks.17.att.time_mix_r tensor_200932 tensor_200933 BinaryOp 2123 1 1 tensor_200927 tensor_200934 0=7 1=1 2=1.000000e+00 BinaryOp 2124 2 1 tensor_200922 tensor_200934 tensor_200935 0=2 BinaryOp 2125 2 1 tensor_200918 tensor_200926 tensor_200936 0=2 BinaryOp 2126 2 1 tensor_200936 tensor_200935 tensor_200937 0=0 BinaryOp 2127 1 1 tensor_200930 tensor_200938 0=7 1=1 2=1.000000e+00 BinaryOp 2128 2 1 tensor_200923 tensor_200938 tensor_200939 0=2 BinaryOp 2129 2 1 tensor_200919 tensor_200929 tensor_200940 0=2 BinaryOp 2130 2 1 tensor_200940 tensor_200939 tensor_200941 0=0 BinaryOp 2131 1 1 tensor_200933 tensor_200942 0=7 1=1 2=1.000000e+00 BinaryOp 2132 2 1 tensor_200924 tensor_200942 tensor_200943 0=2 BinaryOp 2133 2 1 tensor_200920 tensor_200932 tensor_200944 0=2 BinaryOp 2134 2 1 tensor_200944 tensor_200943 tensor_200945 0=0 Reshape 2135 1 1 tensor_200945 tensor_200946 0=0 1=1 Gemm 2136 1 1 tensor_200946 tensor_200948 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 2137 1 1 tensor_200948 tensor_200949 0=-1 Sigmoid 2138 1 1 tensor_200949 tensor_200950 Reshape 2139 1 1 tensor_200937 tensor_200951 0=0 1=1 Gemm 2140 1 1 tensor_200951 tensor_200953 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 2141 1 1 tensor_200953 tensor_200954 0=-1 Split 2142 1 3 tensor_200954 tensor_200955 tensor_200956 tensor_200957 Reshape 2143 1 1 tensor_200941 tensor_200958 0=0 1=1 Gemm 2144 1 1 tensor_200958 tensor_200960 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 2145 1 1 tensor_200960 tensor_200961 0=-1 Split 2146 1 2 tensor_200961 tensor_200962 tensor_200963 MemoryData 2147 0 1 blocks.17.att.time_first 0=2048 21=0 BinaryOp 2148 2 1 blocks.17.att.time_first tensor_200955 tensor_200965 0=0 Split 2149 1 2 tensor_200965 tensor_200966 tensor_200967 Split 2150 1 3 state_17_3 tensor_200968 tensor_200969 tensor_200970 BinaryOp 2151 2 1 tensor_200968 tensor_200966 tensor_200971 0=4 Split 2152 1 2 tensor_200971 tensor_200972 tensor_200973 BinaryOp 2153 2 1 tensor_200969 tensor_200972 tensor_200974 0=1 Exp 2154 1 1 tensor_200974 tensor_200975 Split 2155 1 2 tensor_200975 tensor_200976 tensor_200977 BinaryOp 2156 2 1 tensor_200967 tensor_200973 tensor_200978 0=1 Exp 2157 1 1 tensor_200978 tensor_200979 Split 2158 1 2 tensor_200979 tensor_200980 tensor_200981 Split 2159 1 2 state_17_1 tensor_200982 tensor_200983 Split 2160 1 2 state_17_2 tensor_200984 tensor_200985 BinaryOp 2161 2 1 tensor_200977 tensor_200984 tensor_200986 0=2 BinaryOp 2162 2 1 tensor_200986 tensor_200981 tensor_200987 0=0 BinaryOp 2163 2 1 tensor_200980 tensor_200962 tensor_200988 0=2 BinaryOp 2164 2 1 tensor_200976 tensor_200982 tensor_200989 0=2 BinaryOp 2165 2 1 tensor_200989 tensor_200988 tensor_200990 0=0 BinaryOp 2166 2 1 tensor_200990 tensor_200987 tensor_200991 0=3 MemoryData 2167 0 1 blocks.17.att.time_decay 0=2048 21=0 BinaryOp 2168 2 1 blocks.17.att.time_decay tensor_200970 tensor_200993 0=0 Split 2169 1 2 tensor_200993 tensor_200994 tensor_200995 BinaryOp 2170 2 1 tensor_200994 tensor_200956 tensor_200996 0=4 Split 2171 1 3 tensor_200996 tensor_200997 tensor_200998 tensor_200999 BinaryOp 2172 2 1 tensor_200995 tensor_200997 tensor_201000 0=1 Exp 2173 1 1 tensor_201000 tensor_201001 Split 2174 1 2 tensor_201001 tensor_201002 tensor_201003 BinaryOp 2175 2 1 tensor_200957 tensor_200998 tensor_201004 0=1 Exp 2176 1 1 tensor_201004 tensor_201005 Split 2177 1 2 tensor_201005 tensor_201006 tensor_201007 BinaryOp 2178 2 1 tensor_200950 tensor_200991 tensor_201008 0=2 Reshape 2179 1 1 tensor_201008 tensor_201009 0=0 1=1 Gemm 2180 1 1 tensor_201009 tensor_201011 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 2181 1 1 tensor_201011 tensor_201012 0=-1 BinaryOp 2182 2 1 tensor_200916 tensor_201012 tensor_201013 0=0 BinaryOp 2183 2 1 tensor_201006 tensor_200963 tensor_201014 0=2 BinaryOp 2184 2 1 tensor_201002 tensor_200983 tensor_201015 0=2 BinaryOp 2185 2 1 tensor_201015 tensor_201014 tensor_201016 0=0 BinaryOp 2186 2 1 tensor_201003 tensor_200985 tensor_201017 0=2 BinaryOp 2187 2 1 tensor_201017 tensor_201007 tensor_201018 0=0 Split 2188 1 1 tensor_200921 output_state_17_0 Split 2189 1 1 tensor_201016 output_state_17_1 Split 2190 1 1 tensor_201018 output_state_17_2 Split 2191 1 1 tensor_200999 output_state_17_3 Split 2192 1 2 tensor_201013 tensor_201023 tensor_201024 LayerNorm 2193 1 1 tensor_201023 tensor_201025 0=2048 1=1.000000e-05 2=1 Split 2194 1 3 tensor_201025 tensor_201026 tensor_201027 tensor_201028 Split 2195 1 2 state_17_4 tensor_201029 tensor_201030 MemoryData 2196 0 1 blocks.17.ffn.time_mix_k 0=2048 21=0 Split 2197 1 2 blocks.17.ffn.time_mix_k tensor_201032 tensor_201033 MemoryData 2198 0 1 blocks.17.ffn.time_mix_r 0=2048 21=0 Split 2199 1 2 blocks.17.ffn.time_mix_r tensor_201035 tensor_201036 BinaryOp 2200 1 1 tensor_201033 tensor_201037 0=7 1=1 2=1.000000e+00 BinaryOp 2201 2 1 tensor_201029 tensor_201037 tensor_201038 0=2 BinaryOp 2202 2 1 tensor_201026 tensor_201032 tensor_201039 0=2 BinaryOp 2203 2 1 tensor_201039 tensor_201038 tensor_201040 0=0 BinaryOp 2204 1 1 tensor_201036 tensor_201041 0=7 1=1 2=1.000000e+00 BinaryOp 2205 2 1 tensor_201030 tensor_201041 tensor_201042 0=2 BinaryOp 2206 2 1 tensor_201027 tensor_201035 tensor_201043 0=2 BinaryOp 2207 2 1 tensor_201043 tensor_201042 tensor_201044 0=0 Reshape 2208 1 1 tensor_201044 tensor_201045 0=0 1=1 Gemm 2209 1 1 tensor_201045 tensor_201047 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 2210 1 1 tensor_201047 tensor_201048 0=-1 Sigmoid 2211 1 1 tensor_201048 tensor_201049 Reshape 2212 1 1 tensor_201040 tensor_201050 0=0 1=1 Gemm 2213 1 1 tensor_201050 tensor_201052 4=0 5=1 6=1 7=0 8=8192 9=2048 10=-1 Reshape 2214 1 1 tensor_201052 tensor_201053 0=-1 ReLU 2215 1 1 tensor_201053 tensor_201054 BinaryOp 2216 2 1 tensor_201054 tensor_201054 tensor_201055 0=2 Reshape 2217 1 1 tensor_201055 tensor_201056 0=0 1=1 Gemm 2218 1 1 tensor_201056 tensor_201058 4=0 5=1 6=1 7=0 8=2048 9=8192 10=-1 Reshape 2219 1 1 tensor_201058 tensor_201059 0=-1 BinaryOp 2220 2 1 tensor_201049 tensor_201059 tensor_201060 0=2 BinaryOp 2221 2 1 tensor_201024 tensor_201060 tensor_201061 0=0 Split 2222 1 1 tensor_201028 output_state_17_4 Split 2223 1 2 tensor_201061 tensor_201063 tensor_201064 LayerNorm 2224 1 1 tensor_201063 tensor_201065 0=2048 1=1.000000e-05 2=1 Split 2225 1 4 tensor_201065 tensor_201066 tensor_201067 tensor_201068 tensor_201069 Split 2226 1 3 state_18_0 tensor_201070 tensor_201071 tensor_201072 MemoryData 2227 0 1 blocks.18.att.time_mix_k 0=2048 21=0 Split 2228 1 2 blocks.18.att.time_mix_k tensor_201074 tensor_201075 MemoryData 2229 0 1 blocks.18.att.time_mix_v 0=2048 21=0 Split 2230 1 2 blocks.18.att.time_mix_v tensor_201077 tensor_201078 MemoryData 2231 0 1 blocks.18.att.time_mix_r 0=2048 21=0 Split 2232 1 2 blocks.18.att.time_mix_r tensor_201080 tensor_201081 BinaryOp 2233 1 1 tensor_201075 tensor_201082 0=7 1=1 2=1.000000e+00 BinaryOp 2234 2 1 tensor_201070 tensor_201082 tensor_201083 0=2 BinaryOp 2235 2 1 tensor_201066 tensor_201074 tensor_201084 0=2 BinaryOp 2236 2 1 tensor_201084 tensor_201083 tensor_201085 0=0 BinaryOp 2237 1 1 tensor_201078 tensor_201086 0=7 1=1 2=1.000000e+00 BinaryOp 2238 2 1 tensor_201071 tensor_201086 tensor_201087 0=2 BinaryOp 2239 2 1 tensor_201067 tensor_201077 tensor_201088 0=2 BinaryOp 2240 2 1 tensor_201088 tensor_201087 tensor_201089 0=0 BinaryOp 2241 1 1 tensor_201081 tensor_201090 0=7 1=1 2=1.000000e+00 BinaryOp 2242 2 1 tensor_201072 tensor_201090 tensor_201091 0=2 BinaryOp 2243 2 1 tensor_201068 tensor_201080 tensor_201092 0=2 BinaryOp 2244 2 1 tensor_201092 tensor_201091 tensor_201093 0=0 Reshape 2245 1 1 tensor_201093 tensor_201094 0=0 1=1 Gemm 2246 1 1 tensor_201094 tensor_201096 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 2247 1 1 tensor_201096 tensor_201097 0=-1 Sigmoid 2248 1 1 tensor_201097 tensor_201098 Reshape 2249 1 1 tensor_201085 tensor_201099 0=0 1=1 Gemm 2250 1 1 tensor_201099 tensor_201101 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 2251 1 1 tensor_201101 tensor_201102 0=-1 Split 2252 1 3 tensor_201102 tensor_201103 tensor_201104 tensor_201105 Reshape 2253 1 1 tensor_201089 tensor_201106 0=0 1=1 Gemm 2254 1 1 tensor_201106 tensor_201108 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 2255 1 1 tensor_201108 tensor_201109 0=-1 Split 2256 1 2 tensor_201109 tensor_201110 tensor_201111 MemoryData 2257 0 1 blocks.18.att.time_first 0=2048 21=0 BinaryOp 2258 2 1 blocks.18.att.time_first tensor_201103 tensor_201113 0=0 Split 2259 1 2 tensor_201113 tensor_201114 tensor_201115 Split 2260 1 3 state_18_3 tensor_201116 tensor_201117 tensor_201118 BinaryOp 2261 2 1 tensor_201116 tensor_201114 tensor_201119 0=4 Split 2262 1 2 tensor_201119 tensor_201120 tensor_201121 BinaryOp 2263 2 1 tensor_201117 tensor_201120 tensor_201122 0=1 Exp 2264 1 1 tensor_201122 tensor_201123 Split 2265 1 2 tensor_201123 tensor_201124 tensor_201125 BinaryOp 2266 2 1 tensor_201115 tensor_201121 tensor_201126 0=1 Exp 2267 1 1 tensor_201126 tensor_201127 Split 2268 1 2 tensor_201127 tensor_201128 tensor_201129 Split 2269 1 2 state_18_1 tensor_201130 tensor_201131 Split 2270 1 2 state_18_2 tensor_201132 tensor_201133 BinaryOp 2271 2 1 tensor_201125 tensor_201132 tensor_201134 0=2 BinaryOp 2272 2 1 tensor_201134 tensor_201129 tensor_201135 0=0 BinaryOp 2273 2 1 tensor_201128 tensor_201110 tensor_201136 0=2 BinaryOp 2274 2 1 tensor_201124 tensor_201130 tensor_201137 0=2 BinaryOp 2275 2 1 tensor_201137 tensor_201136 tensor_201138 0=0 BinaryOp 2276 2 1 tensor_201138 tensor_201135 tensor_201139 0=3 MemoryData 2277 0 1 blocks.18.att.time_decay 0=2048 21=0 BinaryOp 2278 2 1 blocks.18.att.time_decay tensor_201118 tensor_201141 0=0 Split 2279 1 2 tensor_201141 tensor_201142 tensor_201143 BinaryOp 2280 2 1 tensor_201142 tensor_201104 tensor_201144 0=4 Split 2281 1 3 tensor_201144 tensor_201145 tensor_201146 tensor_201147 BinaryOp 2282 2 1 tensor_201143 tensor_201145 tensor_201148 0=1 Exp 2283 1 1 tensor_201148 tensor_201149 Split 2284 1 2 tensor_201149 tensor_201150 tensor_201151 BinaryOp 2285 2 1 tensor_201105 tensor_201146 tensor_201152 0=1 Exp 2286 1 1 tensor_201152 tensor_201153 Split 2287 1 2 tensor_201153 tensor_201154 tensor_201155 BinaryOp 2288 2 1 tensor_201098 tensor_201139 tensor_201156 0=2 Reshape 2289 1 1 tensor_201156 tensor_201157 0=0 1=1 Gemm 2290 1 1 tensor_201157 tensor_201159 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 2291 1 1 tensor_201159 tensor_201160 0=-1 BinaryOp 2292 2 1 tensor_201064 tensor_201160 tensor_201161 0=0 BinaryOp 2293 2 1 tensor_201154 tensor_201111 tensor_201162 0=2 BinaryOp 2294 2 1 tensor_201150 tensor_201131 tensor_201163 0=2 BinaryOp 2295 2 1 tensor_201163 tensor_201162 tensor_201164 0=0 BinaryOp 2296 2 1 tensor_201151 tensor_201133 tensor_201165 0=2 BinaryOp 2297 2 1 tensor_201165 tensor_201155 tensor_201166 0=0 Split 2298 1 1 tensor_201069 output_state_18_0 Split 2299 1 1 tensor_201164 output_state_18_1 Split 2300 1 1 tensor_201166 output_state_18_2 Split 2301 1 1 tensor_201147 output_state_18_3 Split 2302 1 2 tensor_201161 tensor_201171 tensor_201172 LayerNorm 2303 1 1 tensor_201171 tensor_201173 0=2048 1=1.000000e-05 2=1 Split 2304 1 3 tensor_201173 tensor_201174 tensor_201175 tensor_201176 Split 2305 1 2 state_18_4 tensor_201177 tensor_201178 MemoryData 2306 0 1 blocks.18.ffn.time_mix_k 0=2048 21=0 Split 2307 1 2 blocks.18.ffn.time_mix_k tensor_201180 tensor_201181 MemoryData 2308 0 1 blocks.18.ffn.time_mix_r 0=2048 21=0 Split 2309 1 2 blocks.18.ffn.time_mix_r tensor_201183 tensor_201184 BinaryOp 2310 1 1 tensor_201181 tensor_201185 0=7 1=1 2=1.000000e+00 BinaryOp 2311 2 1 tensor_201177 tensor_201185 tensor_201186 0=2 BinaryOp 2312 2 1 tensor_201174 tensor_201180 tensor_201187 0=2 BinaryOp 2313 2 1 tensor_201187 tensor_201186 tensor_201188 0=0 BinaryOp 2314 1 1 tensor_201184 tensor_201189 0=7 1=1 2=1.000000e+00 BinaryOp 2315 2 1 tensor_201178 tensor_201189 tensor_201190 0=2 BinaryOp 2316 2 1 tensor_201175 tensor_201183 tensor_201191 0=2 BinaryOp 2317 2 1 tensor_201191 tensor_201190 tensor_201192 0=0 Reshape 2318 1 1 tensor_201192 tensor_201193 0=0 1=1 Gemm 2319 1 1 tensor_201193 tensor_201195 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 2320 1 1 tensor_201195 tensor_201196 0=-1 Sigmoid 2321 1 1 tensor_201196 tensor_201197 Reshape 2322 1 1 tensor_201188 tensor_201198 0=0 1=1 Gemm 2323 1 1 tensor_201198 tensor_201200 4=0 5=1 6=1 7=0 8=8192 9=2048 10=-1 Reshape 2324 1 1 tensor_201200 tensor_201201 0=-1 ReLU 2325 1 1 tensor_201201 tensor_201202 BinaryOp 2326 2 1 tensor_201202 tensor_201202 tensor_201203 0=2 Reshape 2327 1 1 tensor_201203 tensor_201204 0=0 1=1 Gemm 2328 1 1 tensor_201204 tensor_201206 4=0 5=1 6=1 7=0 8=2048 9=8192 10=-1 Reshape 2329 1 1 tensor_201206 tensor_201207 0=-1 BinaryOp 2330 2 1 tensor_201197 tensor_201207 tensor_201208 0=2 BinaryOp 2331 2 1 tensor_201172 tensor_201208 tensor_201209 0=0 Split 2332 1 1 tensor_201176 output_state_18_4 Split 2333 1 2 tensor_201209 tensor_201211 tensor_201212 LayerNorm 2334 1 1 tensor_201211 tensor_201213 0=2048 1=1.000000e-05 2=1 Split 2335 1 4 tensor_201213 tensor_201214 tensor_201215 tensor_201216 tensor_201217 Split 2336 1 3 state_19_0 tensor_201218 tensor_201219 tensor_201220 MemoryData 2337 0 1 blocks.19.att.time_mix_k 0=2048 21=0 Split 2338 1 2 blocks.19.att.time_mix_k tensor_201222 tensor_201223 MemoryData 2339 0 1 blocks.19.att.time_mix_v 0=2048 21=0 Split 2340 1 2 blocks.19.att.time_mix_v tensor_201225 tensor_201226 MemoryData 2341 0 1 blocks.19.att.time_mix_r 0=2048 21=0 Split 2342 1 2 blocks.19.att.time_mix_r tensor_201228 tensor_201229 BinaryOp 2343 1 1 tensor_201223 tensor_201230 0=7 1=1 2=1.000000e+00 BinaryOp 2344 2 1 tensor_201218 tensor_201230 tensor_201231 0=2 BinaryOp 2345 2 1 tensor_201214 tensor_201222 tensor_201232 0=2 BinaryOp 2346 2 1 tensor_201232 tensor_201231 tensor_201233 0=0 BinaryOp 2347 1 1 tensor_201226 tensor_201234 0=7 1=1 2=1.000000e+00 BinaryOp 2348 2 1 tensor_201219 tensor_201234 tensor_201235 0=2 BinaryOp 2349 2 1 tensor_201215 tensor_201225 tensor_201236 0=2 BinaryOp 2350 2 1 tensor_201236 tensor_201235 tensor_201237 0=0 BinaryOp 2351 1 1 tensor_201229 tensor_201238 0=7 1=1 2=1.000000e+00 BinaryOp 2352 2 1 tensor_201220 tensor_201238 tensor_201239 0=2 BinaryOp 2353 2 1 tensor_201216 tensor_201228 tensor_201240 0=2 BinaryOp 2354 2 1 tensor_201240 tensor_201239 tensor_201241 0=0 Reshape 2355 1 1 tensor_201241 tensor_201242 0=0 1=1 Gemm 2356 1 1 tensor_201242 tensor_201244 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 2357 1 1 tensor_201244 tensor_201245 0=-1 Sigmoid 2358 1 1 tensor_201245 tensor_201246 Reshape 2359 1 1 tensor_201233 tensor_201247 0=0 1=1 Gemm 2360 1 1 tensor_201247 tensor_201249 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 2361 1 1 tensor_201249 tensor_201250 0=-1 Split 2362 1 3 tensor_201250 tensor_201251 tensor_201252 tensor_201253 Reshape 2363 1 1 tensor_201237 tensor_201254 0=0 1=1 Gemm 2364 1 1 tensor_201254 tensor_201256 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 2365 1 1 tensor_201256 tensor_201257 0=-1 Split 2366 1 2 tensor_201257 tensor_201258 tensor_201259 MemoryData 2367 0 1 blocks.19.att.time_first 0=2048 21=0 BinaryOp 2368 2 1 blocks.19.att.time_first tensor_201251 tensor_201261 0=0 Split 2369 1 2 tensor_201261 tensor_201262 tensor_201263 Split 2370 1 3 state_19_3 tensor_201264 tensor_201265 tensor_201266 BinaryOp 2371 2 1 tensor_201264 tensor_201262 tensor_201267 0=4 Split 2372 1 2 tensor_201267 tensor_201268 tensor_201269 BinaryOp 2373 2 1 tensor_201265 tensor_201268 tensor_201270 0=1 Exp 2374 1 1 tensor_201270 tensor_201271 Split 2375 1 2 tensor_201271 tensor_201272 tensor_201273 BinaryOp 2376 2 1 tensor_201263 tensor_201269 tensor_201274 0=1 Exp 2377 1 1 tensor_201274 tensor_201275 Split 2378 1 2 tensor_201275 tensor_201276 tensor_201277 Split 2379 1 2 state_19_1 tensor_201278 tensor_201279 Split 2380 1 2 state_19_2 tensor_201280 tensor_201281 BinaryOp 2381 2 1 tensor_201273 tensor_201280 tensor_201282 0=2 BinaryOp 2382 2 1 tensor_201282 tensor_201277 tensor_201283 0=0 BinaryOp 2383 2 1 tensor_201276 tensor_201258 tensor_201284 0=2 BinaryOp 2384 2 1 tensor_201272 tensor_201278 tensor_201285 0=2 BinaryOp 2385 2 1 tensor_201285 tensor_201284 tensor_201286 0=0 BinaryOp 2386 2 1 tensor_201286 tensor_201283 tensor_201287 0=3 MemoryData 2387 0 1 blocks.19.att.time_decay 0=2048 21=0 BinaryOp 2388 2 1 blocks.19.att.time_decay tensor_201266 tensor_201289 0=0 Split 2389 1 2 tensor_201289 tensor_201290 tensor_201291 BinaryOp 2390 2 1 tensor_201290 tensor_201252 tensor_201292 0=4 Split 2391 1 3 tensor_201292 tensor_201293 tensor_201294 tensor_201295 BinaryOp 2392 2 1 tensor_201291 tensor_201293 tensor_201296 0=1 Exp 2393 1 1 tensor_201296 tensor_201297 Split 2394 1 2 tensor_201297 tensor_201298 tensor_201299 BinaryOp 2395 2 1 tensor_201253 tensor_201294 tensor_201300 0=1 Exp 2396 1 1 tensor_201300 tensor_201301 Split 2397 1 2 tensor_201301 tensor_201302 tensor_201303 BinaryOp 2398 2 1 tensor_201246 tensor_201287 tensor_201304 0=2 Reshape 2399 1 1 tensor_201304 tensor_201305 0=0 1=1 Gemm 2400 1 1 tensor_201305 tensor_201307 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 2401 1 1 tensor_201307 tensor_201308 0=-1 BinaryOp 2402 2 1 tensor_201212 tensor_201308 tensor_201309 0=0 BinaryOp 2403 2 1 tensor_201302 tensor_201259 tensor_201310 0=2 BinaryOp 2404 2 1 tensor_201298 tensor_201279 tensor_201311 0=2 BinaryOp 2405 2 1 tensor_201311 tensor_201310 tensor_201312 0=0 BinaryOp 2406 2 1 tensor_201299 tensor_201281 tensor_201313 0=2 BinaryOp 2407 2 1 tensor_201313 tensor_201303 tensor_201314 0=0 Split 2408 1 1 tensor_201217 output_state_19_0 Split 2409 1 1 tensor_201312 output_state_19_1 Split 2410 1 1 tensor_201314 output_state_19_2 Split 2411 1 1 tensor_201295 output_state_19_3 Split 2412 1 2 tensor_201309 tensor_201319 tensor_201320 LayerNorm 2413 1 1 tensor_201319 tensor_201321 0=2048 1=1.000000e-05 2=1 Split 2414 1 3 tensor_201321 tensor_201322 tensor_201323 tensor_201324 Split 2415 1 2 state_19_4 tensor_201325 tensor_201326 MemoryData 2416 0 1 blocks.19.ffn.time_mix_k 0=2048 21=0 Split 2417 1 2 blocks.19.ffn.time_mix_k tensor_201328 tensor_201329 MemoryData 2418 0 1 blocks.19.ffn.time_mix_r 0=2048 21=0 Split 2419 1 2 blocks.19.ffn.time_mix_r tensor_201331 tensor_201332 BinaryOp 2420 1 1 tensor_201329 tensor_201333 0=7 1=1 2=1.000000e+00 BinaryOp 2421 2 1 tensor_201325 tensor_201333 tensor_201334 0=2 BinaryOp 2422 2 1 tensor_201322 tensor_201328 tensor_201335 0=2 BinaryOp 2423 2 1 tensor_201335 tensor_201334 tensor_201336 0=0 BinaryOp 2424 1 1 tensor_201332 tensor_201337 0=7 1=1 2=1.000000e+00 BinaryOp 2425 2 1 tensor_201326 tensor_201337 tensor_201338 0=2 BinaryOp 2426 2 1 tensor_201323 tensor_201331 tensor_201339 0=2 BinaryOp 2427 2 1 tensor_201339 tensor_201338 tensor_201340 0=0 Reshape 2428 1 1 tensor_201340 tensor_201341 0=0 1=1 Gemm 2429 1 1 tensor_201341 tensor_201343 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 2430 1 1 tensor_201343 tensor_201344 0=-1 Sigmoid 2431 1 1 tensor_201344 tensor_201345 Reshape 2432 1 1 tensor_201336 tensor_201346 0=0 1=1 Gemm 2433 1 1 tensor_201346 tensor_201348 4=0 5=1 6=1 7=0 8=8192 9=2048 10=-1 Reshape 2434 1 1 tensor_201348 tensor_201349 0=-1 ReLU 2435 1 1 tensor_201349 tensor_201350 BinaryOp 2436 2 1 tensor_201350 tensor_201350 tensor_201351 0=2 Reshape 2437 1 1 tensor_201351 tensor_201352 0=0 1=1 Gemm 2438 1 1 tensor_201352 tensor_201354 4=0 5=1 6=1 7=0 8=2048 9=8192 10=-1 Reshape 2439 1 1 tensor_201354 tensor_201355 0=-1 BinaryOp 2440 2 1 tensor_201345 tensor_201355 tensor_201356 0=2 BinaryOp 2441 2 1 tensor_201320 tensor_201356 tensor_201357 0=0 Split 2442 1 1 tensor_201324 output_state_19_4 Split 2443 1 2 tensor_201357 tensor_201359 tensor_201360 LayerNorm 2444 1 1 tensor_201359 tensor_201361 0=2048 1=1.000000e-05 2=1 Split 2445 1 4 tensor_201361 tensor_201362 tensor_201363 tensor_201364 tensor_201365 Split 2446 1 3 state_20_0 tensor_201366 tensor_201367 tensor_201368 MemoryData 2447 0 1 blocks.20.att.time_mix_k 0=2048 21=0 Split 2448 1 2 blocks.20.att.time_mix_k tensor_201370 tensor_201371 MemoryData 2449 0 1 blocks.20.att.time_mix_v 0=2048 21=0 Split 2450 1 2 blocks.20.att.time_mix_v tensor_201373 tensor_201374 MemoryData 2451 0 1 blocks.20.att.time_mix_r 0=2048 21=0 Split 2452 1 2 blocks.20.att.time_mix_r tensor_201376 tensor_201377 BinaryOp 2453 1 1 tensor_201371 tensor_201378 0=7 1=1 2=1.000000e+00 BinaryOp 2454 2 1 tensor_201366 tensor_201378 tensor_201379 0=2 BinaryOp 2455 2 1 tensor_201362 tensor_201370 tensor_201380 0=2 BinaryOp 2456 2 1 tensor_201380 tensor_201379 tensor_201381 0=0 BinaryOp 2457 1 1 tensor_201374 tensor_201382 0=7 1=1 2=1.000000e+00 BinaryOp 2458 2 1 tensor_201367 tensor_201382 tensor_201383 0=2 BinaryOp 2459 2 1 tensor_201363 tensor_201373 tensor_201384 0=2 BinaryOp 2460 2 1 tensor_201384 tensor_201383 tensor_201385 0=0 BinaryOp 2461 1 1 tensor_201377 tensor_201386 0=7 1=1 2=1.000000e+00 BinaryOp 2462 2 1 tensor_201368 tensor_201386 tensor_201387 0=2 BinaryOp 2463 2 1 tensor_201364 tensor_201376 tensor_201388 0=2 BinaryOp 2464 2 1 tensor_201388 tensor_201387 tensor_201389 0=0 Reshape 2465 1 1 tensor_201389 tensor_201390 0=0 1=1 Gemm 2466 1 1 tensor_201390 tensor_201392 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 2467 1 1 tensor_201392 tensor_201393 0=-1 Sigmoid 2468 1 1 tensor_201393 tensor_201394 Reshape 2469 1 1 tensor_201381 tensor_201395 0=0 1=1 Gemm 2470 1 1 tensor_201395 tensor_201397 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 2471 1 1 tensor_201397 tensor_201398 0=-1 Split 2472 1 3 tensor_201398 tensor_201399 tensor_201400 tensor_201401 Reshape 2473 1 1 tensor_201385 tensor_201402 0=0 1=1 Gemm 2474 1 1 tensor_201402 tensor_201404 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 2475 1 1 tensor_201404 tensor_201405 0=-1 Split 2476 1 2 tensor_201405 tensor_201406 tensor_201407 MemoryData 2477 0 1 blocks.20.att.time_first 0=2048 21=0 BinaryOp 2478 2 1 blocks.20.att.time_first tensor_201399 tensor_201409 0=0 Split 2479 1 2 tensor_201409 tensor_201410 tensor_201411 Split 2480 1 3 state_20_3 tensor_201412 tensor_201413 tensor_201414 BinaryOp 2481 2 1 tensor_201412 tensor_201410 tensor_201415 0=4 Split 2482 1 2 tensor_201415 tensor_201416 tensor_201417 BinaryOp 2483 2 1 tensor_201413 tensor_201416 tensor_201418 0=1 Exp 2484 1 1 tensor_201418 tensor_201419 Split 2485 1 2 tensor_201419 tensor_201420 tensor_201421 BinaryOp 2486 2 1 tensor_201411 tensor_201417 tensor_201422 0=1 Exp 2487 1 1 tensor_201422 tensor_201423 Split 2488 1 2 tensor_201423 tensor_201424 tensor_201425 Split 2489 1 2 state_20_1 tensor_201426 tensor_201427 Split 2490 1 2 state_20_2 tensor_201428 tensor_201429 BinaryOp 2491 2 1 tensor_201421 tensor_201428 tensor_201430 0=2 BinaryOp 2492 2 1 tensor_201430 tensor_201425 tensor_201431 0=0 BinaryOp 2493 2 1 tensor_201424 tensor_201406 tensor_201432 0=2 BinaryOp 2494 2 1 tensor_201420 tensor_201426 tensor_201433 0=2 BinaryOp 2495 2 1 tensor_201433 tensor_201432 tensor_201434 0=0 BinaryOp 2496 2 1 tensor_201434 tensor_201431 tensor_201435 0=3 MemoryData 2497 0 1 blocks.20.att.time_decay 0=2048 21=0 BinaryOp 2498 2 1 blocks.20.att.time_decay tensor_201414 tensor_201437 0=0 Split 2499 1 2 tensor_201437 tensor_201438 tensor_201439 BinaryOp 2500 2 1 tensor_201438 tensor_201400 tensor_201440 0=4 Split 2501 1 3 tensor_201440 tensor_201441 tensor_201442 tensor_201443 BinaryOp 2502 2 1 tensor_201439 tensor_201441 tensor_201444 0=1 Exp 2503 1 1 tensor_201444 tensor_201445 Split 2504 1 2 tensor_201445 tensor_201446 tensor_201447 BinaryOp 2505 2 1 tensor_201401 tensor_201442 tensor_201448 0=1 Exp 2506 1 1 tensor_201448 tensor_201449 Split 2507 1 2 tensor_201449 tensor_201450 tensor_201451 BinaryOp 2508 2 1 tensor_201394 tensor_201435 tensor_201452 0=2 Reshape 2509 1 1 tensor_201452 tensor_201453 0=0 1=1 Gemm 2510 1 1 tensor_201453 tensor_201455 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 2511 1 1 tensor_201455 tensor_201456 0=-1 BinaryOp 2512 2 1 tensor_201360 tensor_201456 tensor_201457 0=0 BinaryOp 2513 2 1 tensor_201450 tensor_201407 tensor_201458 0=2 BinaryOp 2514 2 1 tensor_201446 tensor_201427 tensor_201459 0=2 BinaryOp 2515 2 1 tensor_201459 tensor_201458 tensor_201460 0=0 BinaryOp 2516 2 1 tensor_201447 tensor_201429 tensor_201461 0=2 BinaryOp 2517 2 1 tensor_201461 tensor_201451 tensor_201462 0=0 Split 2518 1 1 tensor_201365 output_state_20_0 Split 2519 1 1 tensor_201460 output_state_20_1 Split 2520 1 1 tensor_201462 output_state_20_2 Split 2521 1 1 tensor_201443 output_state_20_3 Split 2522 1 2 tensor_201457 tensor_201467 tensor_201468 LayerNorm 2523 1 1 tensor_201467 tensor_201469 0=2048 1=1.000000e-05 2=1 Split 2524 1 3 tensor_201469 tensor_201470 tensor_201471 tensor_201472 Split 2525 1 2 state_20_4 tensor_201473 tensor_201474 MemoryData 2526 0 1 blocks.20.ffn.time_mix_k 0=2048 21=0 Split 2527 1 2 blocks.20.ffn.time_mix_k tensor_201476 tensor_201477 MemoryData 2528 0 1 blocks.20.ffn.time_mix_r 0=2048 21=0 Split 2529 1 2 blocks.20.ffn.time_mix_r tensor_201479 tensor_201480 BinaryOp 2530 1 1 tensor_201477 tensor_201481 0=7 1=1 2=1.000000e+00 BinaryOp 2531 2 1 tensor_201473 tensor_201481 tensor_201482 0=2 BinaryOp 2532 2 1 tensor_201470 tensor_201476 tensor_201483 0=2 BinaryOp 2533 2 1 tensor_201483 tensor_201482 tensor_201484 0=0 BinaryOp 2534 1 1 tensor_201480 tensor_201485 0=7 1=1 2=1.000000e+00 BinaryOp 2535 2 1 tensor_201474 tensor_201485 tensor_201486 0=2 BinaryOp 2536 2 1 tensor_201471 tensor_201479 tensor_201487 0=2 BinaryOp 2537 2 1 tensor_201487 tensor_201486 tensor_201488 0=0 Reshape 2538 1 1 tensor_201488 tensor_201489 0=0 1=1 Gemm 2539 1 1 tensor_201489 tensor_201491 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 2540 1 1 tensor_201491 tensor_201492 0=-1 Sigmoid 2541 1 1 tensor_201492 tensor_201493 Reshape 2542 1 1 tensor_201484 tensor_201494 0=0 1=1 Gemm 2543 1 1 tensor_201494 tensor_201496 4=0 5=1 6=1 7=0 8=8192 9=2048 10=-1 Reshape 2544 1 1 tensor_201496 tensor_201497 0=-1 ReLU 2545 1 1 tensor_201497 tensor_201498 BinaryOp 2546 2 1 tensor_201498 tensor_201498 tensor_201499 0=2 Reshape 2547 1 1 tensor_201499 tensor_201500 0=0 1=1 Gemm 2548 1 1 tensor_201500 tensor_201502 4=0 5=1 6=1 7=0 8=2048 9=8192 10=-1 Reshape 2549 1 1 tensor_201502 tensor_201503 0=-1 BinaryOp 2550 2 1 tensor_201493 tensor_201503 tensor_201504 0=2 BinaryOp 2551 2 1 tensor_201468 tensor_201504 tensor_201505 0=0 Split 2552 1 1 tensor_201472 output_state_20_4 Split 2553 1 2 tensor_201505 tensor_201507 tensor_201508 LayerNorm 2554 1 1 tensor_201507 tensor_201509 0=2048 1=1.000000e-05 2=1 Split 2555 1 4 tensor_201509 tensor_201510 tensor_201511 tensor_201512 tensor_201513 Split 2556 1 3 state_21_0 tensor_201514 tensor_201515 tensor_201516 MemoryData 2557 0 1 blocks.21.att.time_mix_k 0=2048 21=0 Split 2558 1 2 blocks.21.att.time_mix_k tensor_201518 tensor_201519 MemoryData 2559 0 1 blocks.21.att.time_mix_v 0=2048 21=0 Split 2560 1 2 blocks.21.att.time_mix_v tensor_201521 tensor_201522 MemoryData 2561 0 1 blocks.21.att.time_mix_r 0=2048 21=0 Split 2562 1 2 blocks.21.att.time_mix_r tensor_201524 tensor_201525 BinaryOp 2563 1 1 tensor_201519 tensor_201526 0=7 1=1 2=1.000000e+00 BinaryOp 2564 2 1 tensor_201514 tensor_201526 tensor_201527 0=2 BinaryOp 2565 2 1 tensor_201510 tensor_201518 tensor_201528 0=2 BinaryOp 2566 2 1 tensor_201528 tensor_201527 tensor_201529 0=0 BinaryOp 2567 1 1 tensor_201522 tensor_201530 0=7 1=1 2=1.000000e+00 BinaryOp 2568 2 1 tensor_201515 tensor_201530 tensor_201531 0=2 BinaryOp 2569 2 1 tensor_201511 tensor_201521 tensor_201532 0=2 BinaryOp 2570 2 1 tensor_201532 tensor_201531 tensor_201533 0=0 BinaryOp 2571 1 1 tensor_201525 tensor_201534 0=7 1=1 2=1.000000e+00 BinaryOp 2572 2 1 tensor_201516 tensor_201534 tensor_201535 0=2 BinaryOp 2573 2 1 tensor_201512 tensor_201524 tensor_201536 0=2 BinaryOp 2574 2 1 tensor_201536 tensor_201535 tensor_201537 0=0 Reshape 2575 1 1 tensor_201537 tensor_201538 0=0 1=1 Gemm 2576 1 1 tensor_201538 tensor_201540 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 2577 1 1 tensor_201540 tensor_201541 0=-1 Sigmoid 2578 1 1 tensor_201541 tensor_201542 Reshape 2579 1 1 tensor_201529 tensor_201543 0=0 1=1 Gemm 2580 1 1 tensor_201543 tensor_201545 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 2581 1 1 tensor_201545 tensor_201546 0=-1 Split 2582 1 3 tensor_201546 tensor_201547 tensor_201548 tensor_201549 Reshape 2583 1 1 tensor_201533 tensor_201550 0=0 1=1 Gemm 2584 1 1 tensor_201550 tensor_201552 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 2585 1 1 tensor_201552 tensor_201553 0=-1 Split 2586 1 2 tensor_201553 tensor_201554 tensor_201555 MemoryData 2587 0 1 blocks.21.att.time_first 0=2048 21=0 BinaryOp 2588 2 1 blocks.21.att.time_first tensor_201547 tensor_201557 0=0 Split 2589 1 2 tensor_201557 tensor_201558 tensor_201559 Split 2590 1 3 state_21_3 tensor_201560 tensor_201561 tensor_201562 BinaryOp 2591 2 1 tensor_201560 tensor_201558 tensor_201563 0=4 Split 2592 1 2 tensor_201563 tensor_201564 tensor_201565 BinaryOp 2593 2 1 tensor_201561 tensor_201564 tensor_201566 0=1 Exp 2594 1 1 tensor_201566 tensor_201567 Split 2595 1 2 tensor_201567 tensor_201568 tensor_201569 BinaryOp 2596 2 1 tensor_201559 tensor_201565 tensor_201570 0=1 Exp 2597 1 1 tensor_201570 tensor_201571 Split 2598 1 2 tensor_201571 tensor_201572 tensor_201573 Split 2599 1 2 state_21_1 tensor_201574 tensor_201575 Split 2600 1 2 state_21_2 tensor_201576 tensor_201577 BinaryOp 2601 2 1 tensor_201569 tensor_201576 tensor_201578 0=2 BinaryOp 2602 2 1 tensor_201578 tensor_201573 tensor_201579 0=0 BinaryOp 2603 2 1 tensor_201572 tensor_201554 tensor_201580 0=2 BinaryOp 2604 2 1 tensor_201568 tensor_201574 tensor_201581 0=2 BinaryOp 2605 2 1 tensor_201581 tensor_201580 tensor_201582 0=0 BinaryOp 2606 2 1 tensor_201582 tensor_201579 tensor_201583 0=3 MemoryData 2607 0 1 blocks.21.att.time_decay 0=2048 21=0 BinaryOp 2608 2 1 blocks.21.att.time_decay tensor_201562 tensor_201585 0=0 Split 2609 1 2 tensor_201585 tensor_201586 tensor_201587 BinaryOp 2610 2 1 tensor_201586 tensor_201548 tensor_201588 0=4 Split 2611 1 3 tensor_201588 tensor_201589 tensor_201590 tensor_201591 BinaryOp 2612 2 1 tensor_201587 tensor_201589 tensor_201592 0=1 Exp 2613 1 1 tensor_201592 tensor_201593 Split 2614 1 2 tensor_201593 tensor_201594 tensor_201595 BinaryOp 2615 2 1 tensor_201549 tensor_201590 tensor_201596 0=1 Exp 2616 1 1 tensor_201596 tensor_201597 Split 2617 1 2 tensor_201597 tensor_201598 tensor_201599 BinaryOp 2618 2 1 tensor_201542 tensor_201583 tensor_201600 0=2 Reshape 2619 1 1 tensor_201600 tensor_201601 0=0 1=1 Gemm 2620 1 1 tensor_201601 tensor_201603 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 2621 1 1 tensor_201603 tensor_201604 0=-1 BinaryOp 2622 2 1 tensor_201508 tensor_201604 tensor_201605 0=0 BinaryOp 2623 2 1 tensor_201598 tensor_201555 tensor_201606 0=2 BinaryOp 2624 2 1 tensor_201594 tensor_201575 tensor_201607 0=2 BinaryOp 2625 2 1 tensor_201607 tensor_201606 tensor_201608 0=0 BinaryOp 2626 2 1 tensor_201595 tensor_201577 tensor_201609 0=2 BinaryOp 2627 2 1 tensor_201609 tensor_201599 tensor_201610 0=0 Split 2628 1 1 tensor_201513 output_state_21_0 Split 2629 1 1 tensor_201608 output_state_21_1 Split 2630 1 1 tensor_201610 output_state_21_2 Split 2631 1 1 tensor_201591 output_state_21_3 Split 2632 1 2 tensor_201605 tensor_201615 tensor_201616 LayerNorm 2633 1 1 tensor_201615 tensor_201617 0=2048 1=1.000000e-05 2=1 Split 2634 1 3 tensor_201617 tensor_201618 tensor_201619 tensor_201620 Split 2635 1 2 state_21_4 tensor_201621 tensor_201622 MemoryData 2636 0 1 blocks.21.ffn.time_mix_k 0=2048 21=0 Split 2637 1 2 blocks.21.ffn.time_mix_k tensor_201624 tensor_201625 MemoryData 2638 0 1 blocks.21.ffn.time_mix_r 0=2048 21=0 Split 2639 1 2 blocks.21.ffn.time_mix_r tensor_201627 tensor_201628 BinaryOp 2640 1 1 tensor_201625 tensor_201629 0=7 1=1 2=1.000000e+00 BinaryOp 2641 2 1 tensor_201621 tensor_201629 tensor_201630 0=2 BinaryOp 2642 2 1 tensor_201618 tensor_201624 tensor_201631 0=2 BinaryOp 2643 2 1 tensor_201631 tensor_201630 tensor_201632 0=0 BinaryOp 2644 1 1 tensor_201628 tensor_201633 0=7 1=1 2=1.000000e+00 BinaryOp 2645 2 1 tensor_201622 tensor_201633 tensor_201634 0=2 BinaryOp 2646 2 1 tensor_201619 tensor_201627 tensor_201635 0=2 BinaryOp 2647 2 1 tensor_201635 tensor_201634 tensor_201636 0=0 Reshape 2648 1 1 tensor_201636 tensor_201637 0=0 1=1 Gemm 2649 1 1 tensor_201637 tensor_201639 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 2650 1 1 tensor_201639 tensor_201640 0=-1 Sigmoid 2651 1 1 tensor_201640 tensor_201641 Reshape 2652 1 1 tensor_201632 tensor_201642 0=0 1=1 Gemm 2653 1 1 tensor_201642 tensor_201644 4=0 5=1 6=1 7=0 8=8192 9=2048 10=-1 Reshape 2654 1 1 tensor_201644 tensor_201645 0=-1 ReLU 2655 1 1 tensor_201645 tensor_201646 BinaryOp 2656 2 1 tensor_201646 tensor_201646 tensor_201647 0=2 Reshape 2657 1 1 tensor_201647 tensor_201648 0=0 1=1 Gemm 2658 1 1 tensor_201648 tensor_201650 4=0 5=1 6=1 7=0 8=2048 9=8192 10=-1 Reshape 2659 1 1 tensor_201650 tensor_201651 0=-1 BinaryOp 2660 2 1 tensor_201641 tensor_201651 tensor_201652 0=2 BinaryOp 2661 2 1 tensor_201616 tensor_201652 tensor_201653 0=0 Split 2662 1 1 tensor_201620 output_state_21_4 Split 2663 1 2 tensor_201653 tensor_201655 tensor_201656 LayerNorm 2664 1 1 tensor_201655 tensor_201657 0=2048 1=1.000000e-05 2=1 Split 2665 1 4 tensor_201657 tensor_201658 tensor_201659 tensor_201660 tensor_201661 Split 2666 1 3 state_22_0 tensor_201662 tensor_201663 tensor_201664 MemoryData 2667 0 1 blocks.22.att.time_mix_k 0=2048 21=0 Split 2668 1 2 blocks.22.att.time_mix_k tensor_201666 tensor_201667 MemoryData 2669 0 1 blocks.22.att.time_mix_v 0=2048 21=0 Split 2670 1 2 blocks.22.att.time_mix_v tensor_201669 tensor_201670 MemoryData 2671 0 1 blocks.22.att.time_mix_r 0=2048 21=0 Split 2672 1 2 blocks.22.att.time_mix_r tensor_201672 tensor_201673 BinaryOp 2673 1 1 tensor_201667 tensor_201674 0=7 1=1 2=1.000000e+00 BinaryOp 2674 2 1 tensor_201662 tensor_201674 tensor_201675 0=2 BinaryOp 2675 2 1 tensor_201658 tensor_201666 tensor_201676 0=2 BinaryOp 2676 2 1 tensor_201676 tensor_201675 tensor_201677 0=0 BinaryOp 2677 1 1 tensor_201670 tensor_201678 0=7 1=1 2=1.000000e+00 BinaryOp 2678 2 1 tensor_201663 tensor_201678 tensor_201679 0=2 BinaryOp 2679 2 1 tensor_201659 tensor_201669 tensor_201680 0=2 BinaryOp 2680 2 1 tensor_201680 tensor_201679 tensor_201681 0=0 BinaryOp 2681 1 1 tensor_201673 tensor_201682 0=7 1=1 2=1.000000e+00 BinaryOp 2682 2 1 tensor_201664 tensor_201682 tensor_201683 0=2 BinaryOp 2683 2 1 tensor_201660 tensor_201672 tensor_201684 0=2 BinaryOp 2684 2 1 tensor_201684 tensor_201683 tensor_201685 0=0 Reshape 2685 1 1 tensor_201685 tensor_201686 0=0 1=1 Gemm 2686 1 1 tensor_201686 tensor_201688 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 2687 1 1 tensor_201688 tensor_201689 0=-1 Sigmoid 2688 1 1 tensor_201689 tensor_201690 Reshape 2689 1 1 tensor_201677 tensor_201691 0=0 1=1 Gemm 2690 1 1 tensor_201691 tensor_201693 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 2691 1 1 tensor_201693 tensor_201694 0=-1 Split 2692 1 3 tensor_201694 tensor_201695 tensor_201696 tensor_201697 Reshape 2693 1 1 tensor_201681 tensor_201698 0=0 1=1 Gemm 2694 1 1 tensor_201698 tensor_201700 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 2695 1 1 tensor_201700 tensor_201701 0=-1 Split 2696 1 2 tensor_201701 tensor_201702 tensor_201703 MemoryData 2697 0 1 blocks.22.att.time_first 0=2048 21=0 BinaryOp 2698 2 1 blocks.22.att.time_first tensor_201695 tensor_201705 0=0 Split 2699 1 2 tensor_201705 tensor_201706 tensor_201707 Split 2700 1 3 state_22_3 tensor_201708 tensor_201709 tensor_201710 BinaryOp 2701 2 1 tensor_201708 tensor_201706 tensor_201711 0=4 Split 2702 1 2 tensor_201711 tensor_201712 tensor_201713 BinaryOp 2703 2 1 tensor_201709 tensor_201712 tensor_201714 0=1 Exp 2704 1 1 tensor_201714 tensor_201715 Split 2705 1 2 tensor_201715 tensor_201716 tensor_201717 BinaryOp 2706 2 1 tensor_201707 tensor_201713 tensor_201718 0=1 Exp 2707 1 1 tensor_201718 tensor_201719 Split 2708 1 2 tensor_201719 tensor_201720 tensor_201721 Split 2709 1 2 state_22_1 tensor_201722 tensor_201723 Split 2710 1 2 state_22_2 tensor_201724 tensor_201725 BinaryOp 2711 2 1 tensor_201717 tensor_201724 tensor_201726 0=2 BinaryOp 2712 2 1 tensor_201726 tensor_201721 tensor_201727 0=0 BinaryOp 2713 2 1 tensor_201720 tensor_201702 tensor_201728 0=2 BinaryOp 2714 2 1 tensor_201716 tensor_201722 tensor_201729 0=2 BinaryOp 2715 2 1 tensor_201729 tensor_201728 tensor_201730 0=0 BinaryOp 2716 2 1 tensor_201730 tensor_201727 tensor_201731 0=3 MemoryData 2717 0 1 blocks.22.att.time_decay 0=2048 21=0 BinaryOp 2718 2 1 blocks.22.att.time_decay tensor_201710 tensor_201733 0=0 Split 2719 1 2 tensor_201733 tensor_201734 tensor_201735 BinaryOp 2720 2 1 tensor_201734 tensor_201696 tensor_201736 0=4 Split 2721 1 3 tensor_201736 tensor_201737 tensor_201738 tensor_201739 BinaryOp 2722 2 1 tensor_201735 tensor_201737 tensor_201740 0=1 Exp 2723 1 1 tensor_201740 tensor_201741 Split 2724 1 2 tensor_201741 tensor_201742 tensor_201743 BinaryOp 2725 2 1 tensor_201697 tensor_201738 tensor_201744 0=1 Exp 2726 1 1 tensor_201744 tensor_201745 Split 2727 1 2 tensor_201745 tensor_201746 tensor_201747 BinaryOp 2728 2 1 tensor_201690 tensor_201731 tensor_201748 0=2 Reshape 2729 1 1 tensor_201748 tensor_201749 0=0 1=1 Gemm 2730 1 1 tensor_201749 tensor_201751 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 2731 1 1 tensor_201751 tensor_201752 0=-1 BinaryOp 2732 2 1 tensor_201656 tensor_201752 tensor_201753 0=0 BinaryOp 2733 2 1 tensor_201746 tensor_201703 tensor_201754 0=2 BinaryOp 2734 2 1 tensor_201742 tensor_201723 tensor_201755 0=2 BinaryOp 2735 2 1 tensor_201755 tensor_201754 tensor_201756 0=0 BinaryOp 2736 2 1 tensor_201743 tensor_201725 tensor_201757 0=2 BinaryOp 2737 2 1 tensor_201757 tensor_201747 tensor_201758 0=0 Split 2738 1 1 tensor_201661 output_state_22_0 Split 2739 1 1 tensor_201756 output_state_22_1 Split 2740 1 1 tensor_201758 output_state_22_2 Split 2741 1 1 tensor_201739 output_state_22_3 Split 2742 1 2 tensor_201753 tensor_201763 tensor_201764 LayerNorm 2743 1 1 tensor_201763 tensor_201765 0=2048 1=1.000000e-05 2=1 Split 2744 1 3 tensor_201765 tensor_201766 tensor_201767 tensor_201768 Split 2745 1 2 state_22_4 tensor_201769 tensor_201770 MemoryData 2746 0 1 blocks.22.ffn.time_mix_k 0=2048 21=0 Split 2747 1 2 blocks.22.ffn.time_mix_k tensor_201772 tensor_201773 MemoryData 2748 0 1 blocks.22.ffn.time_mix_r 0=2048 21=0 Split 2749 1 2 blocks.22.ffn.time_mix_r tensor_201775 tensor_201776 BinaryOp 2750 1 1 tensor_201773 tensor_201777 0=7 1=1 2=1.000000e+00 BinaryOp 2751 2 1 tensor_201769 tensor_201777 tensor_201778 0=2 BinaryOp 2752 2 1 tensor_201766 tensor_201772 tensor_201779 0=2 BinaryOp 2753 2 1 tensor_201779 tensor_201778 tensor_201780 0=0 BinaryOp 2754 1 1 tensor_201776 tensor_201781 0=7 1=1 2=1.000000e+00 BinaryOp 2755 2 1 tensor_201770 tensor_201781 tensor_201782 0=2 BinaryOp 2756 2 1 tensor_201767 tensor_201775 tensor_201783 0=2 BinaryOp 2757 2 1 tensor_201783 tensor_201782 tensor_201784 0=0 Reshape 2758 1 1 tensor_201784 tensor_201785 0=0 1=1 Gemm 2759 1 1 tensor_201785 tensor_201787 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 2760 1 1 tensor_201787 tensor_201788 0=-1 Sigmoid 2761 1 1 tensor_201788 tensor_201789 Reshape 2762 1 1 tensor_201780 tensor_201790 0=0 1=1 Gemm 2763 1 1 tensor_201790 tensor_201792 4=0 5=1 6=1 7=0 8=8192 9=2048 10=-1 Reshape 2764 1 1 tensor_201792 tensor_201793 0=-1 ReLU 2765 1 1 tensor_201793 tensor_201794 BinaryOp 2766 2 1 tensor_201794 tensor_201794 tensor_201795 0=2 Reshape 2767 1 1 tensor_201795 tensor_201796 0=0 1=1 Gemm 2768 1 1 tensor_201796 tensor_201798 4=0 5=1 6=1 7=0 8=2048 9=8192 10=-1 Reshape 2769 1 1 tensor_201798 tensor_201799 0=-1 BinaryOp 2770 2 1 tensor_201789 tensor_201799 tensor_201800 0=2 BinaryOp 2771 2 1 tensor_201764 tensor_201800 tensor_201801 0=0 Split 2772 1 1 tensor_201768 output_state_22_4 Split 2773 1 2 tensor_201801 tensor_201803 tensor_201804 LayerNorm 2774 1 1 tensor_201803 tensor_201805 0=2048 1=1.000000e-05 2=1 Split 2775 1 4 tensor_201805 tensor_201806 tensor_201807 tensor_201808 tensor_201809 Split 2776 1 3 state_23_0 tensor_201810 tensor_201811 tensor_201812 MemoryData 2777 0 1 blocks.23.att.time_mix_k 0=2048 21=0 Split 2778 1 2 blocks.23.att.time_mix_k tensor_201814 tensor_201815 MemoryData 2779 0 1 blocks.23.att.time_mix_v 0=2048 21=0 Split 2780 1 2 blocks.23.att.time_mix_v tensor_201817 tensor_201818 MemoryData 2781 0 1 blocks.23.att.time_mix_r 0=2048 21=0 Split 2782 1 2 blocks.23.att.time_mix_r tensor_201820 tensor_201821 BinaryOp 2783 1 1 tensor_201815 tensor_201822 0=7 1=1 2=1.000000e+00 BinaryOp 2784 2 1 tensor_201810 tensor_201822 tensor_201823 0=2 BinaryOp 2785 2 1 tensor_201806 tensor_201814 tensor_201824 0=2 BinaryOp 2786 2 1 tensor_201824 tensor_201823 tensor_201825 0=0 BinaryOp 2787 1 1 tensor_201818 tensor_201826 0=7 1=1 2=1.000000e+00 BinaryOp 2788 2 1 tensor_201811 tensor_201826 tensor_201827 0=2 BinaryOp 2789 2 1 tensor_201807 tensor_201817 tensor_201828 0=2 BinaryOp 2790 2 1 tensor_201828 tensor_201827 tensor_201829 0=0 BinaryOp 2791 1 1 tensor_201821 tensor_201830 0=7 1=1 2=1.000000e+00 BinaryOp 2792 2 1 tensor_201812 tensor_201830 tensor_201831 0=2 BinaryOp 2793 2 1 tensor_201808 tensor_201820 tensor_201832 0=2 BinaryOp 2794 2 1 tensor_201832 tensor_201831 tensor_201833 0=0 Reshape 2795 1 1 tensor_201833 tensor_201834 0=0 1=1 Gemm 2796 1 1 tensor_201834 tensor_201836 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 2797 1 1 tensor_201836 tensor_201837 0=-1 Sigmoid 2798 1 1 tensor_201837 tensor_201838 Reshape 2799 1 1 tensor_201825 tensor_201839 0=0 1=1 Gemm 2800 1 1 tensor_201839 tensor_201841 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 2801 1 1 tensor_201841 tensor_201842 0=-1 Split 2802 1 3 tensor_201842 tensor_201843 tensor_201844 tensor_201845 Reshape 2803 1 1 tensor_201829 tensor_201846 0=0 1=1 Gemm 2804 1 1 tensor_201846 tensor_201848 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 2805 1 1 tensor_201848 tensor_201849 0=-1 Split 2806 1 2 tensor_201849 tensor_201850 tensor_201851 MemoryData 2807 0 1 blocks.23.att.time_first 0=2048 21=0 BinaryOp 2808 2 1 blocks.23.att.time_first tensor_201843 tensor_201853 0=0 Split 2809 1 2 tensor_201853 tensor_201854 tensor_201855 Split 2810 1 3 state_23_3 tensor_201856 tensor_201857 tensor_201858 BinaryOp 2811 2 1 tensor_201856 tensor_201854 tensor_201859 0=4 Split 2812 1 2 tensor_201859 tensor_201860 tensor_201861 BinaryOp 2813 2 1 tensor_201857 tensor_201860 tensor_201862 0=1 Exp 2814 1 1 tensor_201862 tensor_201863 Split 2815 1 2 tensor_201863 tensor_201864 tensor_201865 BinaryOp 2816 2 1 tensor_201855 tensor_201861 tensor_201866 0=1 Exp 2817 1 1 tensor_201866 tensor_201867 Split 2818 1 2 tensor_201867 tensor_201868 tensor_201869 Split 2819 1 2 state_23_1 tensor_201870 tensor_201871 Split 2820 1 2 state_23_2 tensor_201872 tensor_201873 BinaryOp 2821 2 1 tensor_201865 tensor_201872 tensor_201874 0=2 BinaryOp 2822 2 1 tensor_201874 tensor_201869 tensor_201875 0=0 BinaryOp 2823 2 1 tensor_201868 tensor_201850 tensor_201876 0=2 BinaryOp 2824 2 1 tensor_201864 tensor_201870 tensor_201877 0=2 BinaryOp 2825 2 1 tensor_201877 tensor_201876 tensor_201878 0=0 BinaryOp 2826 2 1 tensor_201878 tensor_201875 tensor_201879 0=3 MemoryData 2827 0 1 blocks.23.att.time_decay 0=2048 21=0 BinaryOp 2828 2 1 blocks.23.att.time_decay tensor_201858 tensor_201881 0=0 Split 2829 1 2 tensor_201881 tensor_201882 tensor_201883 BinaryOp 2830 2 1 tensor_201882 tensor_201844 tensor_201884 0=4 Split 2831 1 3 tensor_201884 tensor_201885 tensor_201886 tensor_201887 BinaryOp 2832 2 1 tensor_201883 tensor_201885 tensor_201888 0=1 Exp 2833 1 1 tensor_201888 tensor_201889 Split 2834 1 2 tensor_201889 tensor_201890 tensor_201891 BinaryOp 2835 2 1 tensor_201845 tensor_201886 tensor_201892 0=1 Exp 2836 1 1 tensor_201892 tensor_201893 Split 2837 1 2 tensor_201893 tensor_201894 tensor_201895 BinaryOp 2838 2 1 tensor_201838 tensor_201879 tensor_201896 0=2 Reshape 2839 1 1 tensor_201896 tensor_201897 0=0 1=1 Gemm 2840 1 1 tensor_201897 tensor_201899 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 2841 1 1 tensor_201899 tensor_201900 0=-1 BinaryOp 2842 2 1 tensor_201804 tensor_201900 tensor_201901 0=0 BinaryOp 2843 2 1 tensor_201894 tensor_201851 tensor_201902 0=2 BinaryOp 2844 2 1 tensor_201890 tensor_201871 tensor_201903 0=2 BinaryOp 2845 2 1 tensor_201903 tensor_201902 tensor_201904 0=0 BinaryOp 2846 2 1 tensor_201891 tensor_201873 tensor_201905 0=2 BinaryOp 2847 2 1 tensor_201905 tensor_201895 tensor_201906 0=0 Split 2848 1 1 tensor_201809 output_state_23_0 Split 2849 1 1 tensor_201904 output_state_23_1 Split 2850 1 1 tensor_201906 output_state_23_2 Split 2851 1 1 tensor_201887 output_state_23_3 Split 2852 1 2 tensor_201901 tensor_201911 tensor_201912 LayerNorm 2853 1 1 tensor_201911 tensor_201913 0=2048 1=1.000000e-05 2=1 Split 2854 1 3 tensor_201913 tensor_201914 tensor_201915 tensor_201916 Split 2855 1 2 state_23_4 tensor_201917 tensor_201918 MemoryData 2856 0 1 blocks.23.ffn.time_mix_k 0=2048 21=0 Split 2857 1 2 blocks.23.ffn.time_mix_k tensor_201920 tensor_201921 MemoryData 2858 0 1 blocks.23.ffn.time_mix_r 0=2048 21=0 Split 2859 1 2 blocks.23.ffn.time_mix_r tensor_201923 tensor_201924 BinaryOp 2860 1 1 tensor_201921 tensor_201925 0=7 1=1 2=1.000000e+00 BinaryOp 2861 2 1 tensor_201917 tensor_201925 tensor_201926 0=2 BinaryOp 2862 2 1 tensor_201914 tensor_201920 tensor_201927 0=2 BinaryOp 2863 2 1 tensor_201927 tensor_201926 tensor_201928 0=0 BinaryOp 2864 1 1 tensor_201924 tensor_201929 0=7 1=1 2=1.000000e+00 BinaryOp 2865 2 1 tensor_201918 tensor_201929 tensor_201930 0=2 BinaryOp 2866 2 1 tensor_201915 tensor_201923 tensor_201931 0=2 BinaryOp 2867 2 1 tensor_201931 tensor_201930 tensor_201932 0=0 Reshape 2868 1 1 tensor_201932 tensor_201933 0=0 1=1 Gemm 2869 1 1 tensor_201933 tensor_201935 4=0 5=1 6=1 7=0 8=2048 9=2048 10=-1 Reshape 2870 1 1 tensor_201935 tensor_201936 0=-1 Sigmoid 2871 1 1 tensor_201936 tensor_201937 Reshape 2872 1 1 tensor_201928 tensor_201938 0=0 1=1 Gemm 2873 1 1 tensor_201938 tensor_201940 4=0 5=1 6=1 7=0 8=8192 9=2048 10=-1 Reshape 2874 1 1 tensor_201940 tensor_201941 0=-1 ReLU 2875 1 1 tensor_201941 tensor_201942 BinaryOp 2876 2 1 tensor_201942 tensor_201942 tensor_201943 0=2 Reshape 2877 1 1 tensor_201943 tensor_201944 0=0 1=1 Gemm 2878 1 1 tensor_201944 tensor_201946 4=0 5=1 6=1 7=0 8=2048 9=8192 10=-1 Reshape 2879 1 1 tensor_201946 tensor_201947 0=-1 BinaryOp 2880 2 1 tensor_201937 tensor_201947 tensor_201948 0=2 BinaryOp 2881 2 1 tensor_201912 tensor_201948 tensor_201949 0=0 Split 2882 1 1 tensor_201916 output_state_23_4 LayerNorm 2883 1 1 tensor_201949 tensor_201951 0=2048 1=1.000000e-05 2=1 Reshape 2884 1 1 tensor_201951 tensor_201952 0=0 1=1 Gemm 2885 1 1 tensor_201952 tensor_201954 4=0 5=1 6=1 7=0 8=65536 9=2048 10=-1 Reshape 2886 1 1 tensor_201954 tensor_201955 0=-1 Split 2887 1 1 tensor_201955 output